Rss-Bridge/bridges/WeLiveSecurityBridge.php

<?php
class WeLiveSecurityBridge extends BridgeAbstract {

    public function loadMetadatas() {
        $this->maintainer = 'ORelio';
        $this->name = 'We Live Security';
        $this->uri = 'http://www.welivesecurity.com/';
        $this->description = 'Returns the newest articles.';
        $this->update = '2016-08-06';
    }

    public function collectData(array $param) {

        function ExtractFromDelimiters($string, $start, $end) {
            if (strpos($string, $start) !== false) {
                $section_retrieved = substr($string, strpos($string, $start) + strlen($start));
                $section_retrieved = substr($section_retrieved, 0, strpos($section_retrieved, $end));
                return $section_retrieved;
            } return false;
        }

        function StripWithDelimiters($string, $start, $end) {
            while (strpos($string, $start) !== false) {
                $section_to_remove = substr($string, strpos($string, $start));
                $section_to_remove = substr($section_to_remove, 0, strpos($section_to_remove, $end) + strlen($end));
                $string = str_replace($section_to_remove, '', $string);
            } return $string;
        }

        $feed = $this->getURI().'feed/';
        $html = $this->file_get_html($feed) or $this->returnError('Could not request '.$this->getName().': '.$feed, 500);
        $limit = 0;

        foreach ($html->find('item') as $element) {
            if ($limit < 5) {

                $article_image = $element->find('image', 0)->plaintext;
                $article_url = ExtractFromDelimiters($element->innertext, '<link>', '</link>');
                $article_summary = ExtractFromDelimiters($element->innertext, '<description><![CDATA[<p>', '</p>');
                $article_html = file_get_contents($article_url) or $this->returnError('Could not request '.$this->getName().': '.$article_url, 500);
                if (substr($article_html, 0, 2) == "\x1f\x8b") //http://www.gzip.org/zlib/rfc-gzip.html#header-trailer -> GZip ID1
                    $article_html = gzdecode($article_html);   //Response is GZipped even if we didn't accept GZip!? Let's decompress...
                $article_html = str_get_html($article_html);   //Now we have our HTML data. But still, that's an important HTTP violation...
                $article_content = $article_html->find('div.wlistingsingletext', 0)->innertext;
                $article_content = StripWithDelimiters($article_content, '<script', '</script>');
                $article_content = '<p><img src="'.$article_image.'" /></p>'
                    .'<p><b>'.$article_summary.'</b></p>'
                    .trim($article_content);

                $item = new \Item();
                $item->uri = $article_url;
                $item->thumbnailUri = $article_image;
                $item->title = $element->find('title', 0)->plaintext;
                $item->author = $article_html->find('a[rel=author]', 0)->plaintext;
                $item->timestamp = strtotime($element->find('pubDate', 0)->plaintext);
                $item->content = $article_content;
                $this->items[] = $item;
                $limit++;

            }
        }
    }
}
[WeLiveSecurity] New bridge, Security News. 2016-07-19 19:37:33 +02:00			`<?php`
			`class WeLiveSecurityBridge extends BridgeAbstract {`

			`public function loadMetadatas() {`
			`$this->maintainer = 'ORelio';`
bridges: Put name/uri directly in bridge metadata Some bridges used getName() and getURI() to put information into the metadatas. Instead the metadatas should be initialized with data and (not yet done) returned by default via getName() and getURI(). 2016-08-06 17:55:29 +02:00			`$this->name = 'We Live Security';`
			`$this->uri = 'http://www.welivesecurity.com/';`
[WeLiveSecurity] New bridge, Security News. 2016-07-19 19:37:33 +02:00			`$this->description = 'Returns the newest articles.';`
bridges: Remove getCacheDuration if default BridgeAbstract will return 3600 seconds by default, so the function can be removed from any bridge implementing getCacheDuration returning the same value. Documentation updated accordingly. 2016-08-06 16:17:58 +02:00			`$this->update = '2016-08-06';`
[WeLiveSecurity] New bridge, Security News. 2016-07-19 19:37:33 +02:00			`}`

			`public function collectData(array $param) {`

			`function ExtractFromDelimiters($string, $start, $end) {`
			`if (strpos($string, $start) !== false) {`
			`$section_retrieved = substr($string, strpos($string, $start) + strlen($start));`
			`$section_retrieved = substr($section_retrieved, 0, strpos($section_retrieved, $end));`
			`return $section_retrieved;`
			`} return false;`
			`}`

			`function StripWithDelimiters($string, $start, $end) {`
			`while (strpos($string, $start) !== false) {`
			`$section_to_remove = substr($string, strpos($string, $start));`
			`$section_to_remove = substr($section_to_remove, 0, strpos($section_to_remove, $end) + strlen($end));`
			`$string = str_replace($section_to_remove, '', $string);`
			`} return $string;`
			`}`

			`$feed = $this->getURI().'feed/';`
			`$html = $this->file_get_html($feed) or $this->returnError('Could not request '.$this->getName().': '.$feed, 500);`
			`$limit = 0;`

			`foreach ($html->find('item') as $element) {`
			`if ($limit < 5) {`

			`$article_image = $element->find('image', 0)->plaintext;`
			`$article_url = ExtractFromDelimiters($element->innertext, '<link>', '</link>');`
			`$article_summary = ExtractFromDelimiters($element->innertext, '<description><![CDATA[<p>', '</p>');`
			`$article_html = file_get_contents($article_url) or $this->returnError('Could not request '.$this->getName().': '.$article_url, 500);`
			`if (substr($article_html, 0, 2) == "\x1f\x8b") //http://www.gzip.org/zlib/rfc-gzip.html#header-trailer -> GZip ID1`
			`$article_html = gzdecode($article_html); //Response is GZipped even if we didn't accept GZip!? Let's decompress...`
			`$article_html = str_get_html($article_html); //Now we have our HTML data. But still, that's an important HTTP violation...`
			`$article_content = $article_html->find('div.wlistingsingletext', 0)->innertext;`
			`$article_content = StripWithDelimiters($article_content, '<script', '</script>');`
			`$article_content = '<p><img src="'.$article_image.'" /></p>'`
			`.'<p><b>'.$article_summary.'</b></p>'`
			`.trim($article_content);`

			`$item = new \Item();`
			`$item->uri = $article_url;`
			`$item->thumbnailUri = $article_image;`
			`$item->title = $element->find('title', 0)->plaintext;`
			`$item->author = $article_html->find('a[rel=author]', 0)->plaintext;`
			`$item->timestamp = strtotime($element->find('pubDate', 0)->plaintext);`
			`$item->content = $article_content;`
			`$this->items[] = $item;`
			`$limit++;`

			`}`
			`}`
			`}`
			`}`