array( 'user_agent' => ini_get('user_agent'), 'accept_encoding' => 'gzip' ) ); if(defined('PROXY_URL') && !defined('NOPROXY')){ $contextOptions['http']['proxy'] = PROXY_URL; $contextOptions['http']['request_fulluri'] = true; if(is_null($context)){ $context = stream_context_create($contextOptions); } else { $prevContext = $context; if(!stream_context_set_option($context, $contextOptions)){ $context = $prevContext; } } } if(is_null($maxlen)){ $content = @file_get_contents($url, $use_include_path, $context, $offset); } else { $content = @file_get_contents($url, $use_include_path, $context, $offset, $maxlen); } if($content === false) debugMessage('Cant\'t download ' . $url); // handle compressed data foreach($http_response_header as $header){ if(stristr($header, 'content-encoding')){ switch(true){ case stristr($header, 'gzip'): $content = gzinflate(substr($content, 10, -8)); break; case stristr($header, 'compress'): //TODO case stristr($header, 'deflate'): //TODO case stristr($header, 'brotli'): //TODO returnServerError($header . '=> Not implemented yet'); break; case stristr($header, 'identity'): break; default: returnServerError($header . '=> Unknown compression'); } } } return $content; } function getSimpleHTMLDOM($url , $use_include_path = false , $context = null , $offset = 0 , $maxLen = null , $lowercase = true , $forceTagsClosed = true , $target_charset = DEFAULT_TARGET_CHARSET , $stripRN = true , $defaultBRText = DEFAULT_BR_TEXT , $defaultSpanText = DEFAULT_SPAN_TEXT ){ $content = getContents($url, $use_include_path, $context, $offset, $maxLen); return str_get_html($content , $lowercase , $forceTagsClosed , $target_charset , $stripRN , $defaultBRText , $defaultSpanText); } /** * Maintain locally cached versions of pages to avoid multiple downloads. * @param url url to cache * @param duration duration of the cache file in seconds (default: 24h/86400s) * @return content of the file as string */ function getSimpleHTMLDOMCached($url , $duration = 86400 , $use_include_path = false , $context = null , $offset = 0 , $maxLen = null , $lowercase = true , $forceTagsClosed = true , $target_charset = DEFAULT_TARGET_CHARSET , $stripRN = true , $defaultBRText = DEFAULT_BR_TEXT , $defaultSpanText = DEFAULT_SPAN_TEXT ){ debugMessage('Caching url ' . $url . ', duration ' . $duration); // Initialize cache $cache = Cache::create('FileCache'); $cache->setPath(CACHE_DIR . '/pages'); $cache->purgeCache(86400); // 24 hours (forced) $params = [$url]; $cache->setParameters($params); // Determine if cached file is within duration $time = $cache->getTime(); if($time !== false && (time() - $duration < $time) && (!defined('DEBUG') || DEBUG !== true)){ // Contents within duration $content = $cache->loadData(); } else { // Content not within duration $content = getContents($url, $use_include_path, $context, $offset, $maxLen); if($content !== false){ $cache->saveData($content); } } return str_get_html($content , $lowercase , $forceTagsClosed , $target_charset , $stripRN , $defaultBRText , $defaultSpanText); } ?>