find('*[!b38fd2b1fe7f4747d6b1c1254ccd055e]') as $element) { if(in_array($element->tag, $keptText)) { $element->outertext = $element->plaintext; } elseif(in_array($element->tag, $removedTags)) { $element->outertext = ''; } else { foreach($element->getAllAttributes() as $attributeName => $attribute) { if(!in_array($attributeName, $keptAttributes)) $element->removeAttribute($attributeName); } } } return $htmlContent; } function backgroundToImg($htmlContent) { $regex = '/background-image[ ]{0,}:[ ]{0,}url\([\'"]{0,}(.*?)[\'"]{0,}\)/'; $htmlContent = str_get_html($htmlContent); foreach($htmlContent->find('*[!b38fd2b1fe7f4747d6b1c1254ccd055e]') as $element) { if(preg_match($regex, $element->style, $matches) > 0) { $element->outertext = ''; } } return $htmlContent; } /** * Convert relative links in HTML into absolute links * @param $content HTML content to fix. Supports HTML objects or string objects * @param $server full URL to the page containing relative links * @return content with fixed URLs, as HTML object or string depending on input type */ function defaultLinkTo($content, $server){ $string_convert = false; if (is_string($content)) { $string_convert = true; $content = str_get_html($content); } foreach($content->find('img') as $image) { $image->src = urljoin($server, $image->src); } foreach($content->find('a') as $anchor) { $anchor->href = urljoin($server, $anchor->href); } if ($string_convert) { $content = $content->outertext; } return $content; } /** * Extract the first part of a string matching the specified start and end delimiters * @param $string input string, e.g. '