From 0ff3cf0e0b03e113eabac0525489172963677b18 Mon Sep 17 00:00:00 2001 From: ORelio Date: Sun, 20 Mar 2016 15:59:25 +0100 Subject: [PATCH] [FS] Add FuturaSciences RSS expander for all the feeds provided by Futura-Sciences. --- bridges/FuturaSciencesBridge.php | 219 +++++++++++++++++++++++++++++++ 1 file changed, 219 insertions(+) create mode 100644 bridges/FuturaSciencesBridge.php diff --git a/bridges/FuturaSciencesBridge.php b/bridges/FuturaSciencesBridge.php new file mode 100644 index 00000000..222c7cdd --- /dev/null +++ b/bridges/FuturaSciencesBridge.php @@ -0,0 +1,219 @@ +maintainer = 'ORelio'; + $this->name = $this->getName(); + $this->uri = $this->getURI(); + $this->description = 'Returns the newest articles.'; + $this->update = '2016-03-20'; + + $this->parameters[] = + '[ + { + "name" : "Feed", + "type" : "list", + "identifier" : "feed", + "values" : + [ + { "name" : "---- Select ----", "value" : "" }, + + { "name" : "", "value" : "" }, + { "name" : "Les flux multi-magazines", "value" : "" }, + + { "name" : "    Les dernières actualités de Futura-Sciences", "value" : "actualites" }, + { "name" : "    Les dernières définitions de Futura-Sciences", "value" : "definitions" }, + { "name" : "    Les dernières photos de Futura-Sciences", "value" : "photos" }, + { "name" : "    Les dernières questions - réponses de Futura-Sciences", "value" : "questions-reponses" }, + { "name" : "    Les derniers dossiers de Futura-Sciences", "value" : "dossiers" }, + + { "name" : "", "value" : "" }, + { "name" : "Les flux Services", "value" : "" }, + + { "name" : "    Les cartes virtuelles de Futura-Sciences", "value" : "services/cartes-virtuelles" }, + { "name" : "    Les fonds d\'écran de Futura-Sciences", "value" : "services/fonds-ecran" }, + + { "name" : "", "value" : "" }, + { "name" : "Les flux Santé", "value" : "" }, + + { "name" : "    Les dernières actualités de Futura-Santé", "value" : "sante/actualites" }, + { "name" : "    Les dernières définitions de Futura-Santé", "value" : "sante/definitions" }, + { "name" : "    Les dernières questions-réponses de Futura-Santé", "value" : "sante/questions-reponses" }, + { "name" : "    Les derniers dossiers de Futura-Santé", "value" : "sante/dossiers" }, + + { "name" : "", "value" : "" }, + { "name" : "Les flux High-Tech", "value" : "" }, + + { "name" : "    Les dernières actualités de Futura High-Tech", "value" : "high-tech/actualites" }, + { "name" : "    Les dernières astuces de Futura High-Tech", "value" : "high-tech/questions-reponses" }, + { "name" : "    Les dernières définitions de Futura High-Tech", "value" : "high-tech/definitions" }, + { "name" : "    Les derniers dossiers de Futura High-Tech", "value" : "high-tech/dossiers" }, + + { "name" : "", "value" : "" }, + { "name" : "Les flux Espace", "value" : "" }, + + { "name" : "    Les dernières actualités de Futura-Espace", "value" : "espace/actualites" }, + { "name" : "    Les dernières définitions de Futura-Espace", "value" : "espace/definitions" }, + { "name" : "    Les dernières questions-réponses de Futura-Espace", "value" : "espace/questions-reponses" }, + { "name" : "    Les derniers dossiers de Futura-Espace", "value" : "espace/dossiers" }, + + { "name" : "", "value" : "" }, + { "name" : "Les flux Environnement", "value" : "" }, + + { "name" : "    Les dernières actualités de Futura-Environnement", "value" : "environnement/actualites" }, + { "name" : "    Les dernières définitions de Futura-Environnement", "value" : "environnement/definitions" }, + { "name" : "    Les dernières questions - réponses de Futura-Environnement", "value" : "environnement/questions-reponses" }, + { "name" : "    Les derniers dossiers de Futura-Environnement", "value" : "environnement/dossiers" }, + + { "name" : "", "value" : "" }, + { "name" : "Les flux Maison", "value" : "" }, + + { "name" : "    Les dernières actualités de Futura-Maison", "value" : "maison/actualites" }, + { "name" : "    Les dernières astuces de Futura-Maison", "value" : "maison/questions-reponses" }, + { "name" : "    Les dernières définitions de Futura-Maison", "value" : "maison/definitions" }, + { "name" : "    Les derniers dossiers de Futura-Maison", "value" : "maison/dossiers" }, + + { "name" : "", "value" : "" }, + { "name" : "Les flux Nature", "value" : "" }, + + { "name" : "    Les dernières actualités de Futura-Nature", "value" : "nature/actualites" }, + { "name" : "    Les dernières définitions de Futura-Nature", "value" : "nature/definitions" }, + { "name" : "    Les dernières questions-réponses de Futura-Nature", "value" : "nature/questions-reponses" }, + { "name" : "    Les derniers dossiers de Futura-Nature", "value" : "nature/dossiers" }, + + { "name" : "", "value" : "" }, + { "name" : "Les flux Terre", "value" : "" }, + + { "name" : "    Les dernières actualités de Futura-Terre", "value" : "terre/actualites" }, + { "name" : "    Les dernières définitions de Futura-Terre", "value" : "terre/definitions" }, + { "name" : "    Les dernières questions-réponses de Futura-Terre", "value" : "terre/questions-reponses" }, + { "name" : "    Les derniers dossiers de Futura-Terre", "value" : "terre/dossiers" }, + + { "name" : "", "value" : "" }, + { "name" : "Les flux Matière", "value" : "" }, + + { "name" : "    Les dernières actualités de Futura-Matière", "value" : "matiere/actualites" }, + { "name" : "    Les dernières définitions de Futura-Matière", "value" : "matiere/definitions" }, + { "name" : "    Les dernières questions-réponses de Futura-Matière", "value" : "matiere/questions-reponses" }, + { "name" : "    Les derniers dossiers de Futura-Matière", "value" : "matiere/dossiers" }, + + { "name" : "", "value" : "" }, + { "name" : "Les flux Mathématiques", "value" : "" }, + + { "name" : "    Les dernières actualités de Futura-Mathématiques", "value" : "mathematiques/actualites" }, + { "name" : "    Les derniers dossiers de Futura-Mathématiques", "value" : "mathematiques/dossiers" } + ] + } + ]'; + + } + + public function collectData(array $param) { + + function StripCDATA($string) { + $string = str_replace('', '', $string); + return $string; + } + + function StripWithDelimiters($string, $start, $end) { + while (strpos($string, $start) !== false) { + $section_to_remove = substr($string, strpos($string, $start)); + $section_to_remove = substr($section_to_remove, 0, strpos($section_to_remove, $end) + strlen($end)); + $string = str_replace($section_to_remove, '', $string); + } return $string; + } + + function StripRecursiveHTMLSection($string, $tag_name, $tag_start) { + $open_tag = '<'.$tag_name; + $close_tag = ''; + $close_tag_length = strlen($close_tag); + if (strpos($tag_start, $open_tag) === 0) { + while (strpos($string, $tag_start) !== false) { + $max_recursion = 100; + $section_to_remove = null; + $section_start = strpos($string, $tag_start); + $search_offset = $section_start; + do { + $max_recursion--; + $section_end = strpos($string, $close_tag, $search_offset); + $search_offset = $section_end + $close_tag_length; + $section_to_remove = substr($string, $section_start, $section_end - $section_start + $close_tag_length); + $open_tag_count = substr_count($section_to_remove, $open_tag); + $close_tag_count = substr_count($section_to_remove, $close_tag); + } while ($open_tag_count > $close_tag_count && $max_recursion > 0); + $string = str_replace($section_to_remove, '', $string); + } + } + return $string; + } + + if (empty($param['feed'])) + $this->returnError('Please select a feed to display.'.$url, 400); + if ($param['feed'] !== preg_replace('/[^a-zA-Z-\/]+/', '', $param['feed']) || substr_count($param['feed'], '/') > 1 || strlen($param['feed'] > 64)) + $this->returnError('Invalid "feed" parameter.'.$url, 400); + + $url = $this->getURI().'rss/'.$param['feed'].'.xml'; + $html = file_get_html($url) or $this->returnError('Could not request Futura-Sciences: '.$url, 500); + $limit = 0; + + foreach($html->find('item') as $element) { + if ($limit < 10) { + $article_url = str_replace('#xtor=RSS-8', '', StripCDATA($element->find('guid', 0)->plaintext)); + $article = file_get_html($article_url) or $this->returnError('Could not request Futura-Sciences: '.$article_url, 500); + $contents = $article->find('div.content', 0)->innertext; + $author = trim(str_replace(', Futura-Sciences', '', $article->find('span.author', 0)->plaintext)); + if (empty($author)) + $author = StripCDATA($element->find('author', 0)->plaintext); + + foreach (array( + '
'); + $contents = StripWithDelimiters($contents, '