Rss-Bridge/bridges/ScmbBridge.php
logmanoriginal 052844f5e1 all: Use ->remove() instead of ->outertext = ''
simplehtmldom 1.9 introduced new functions to recursively remove
nodes from the DOM. This allows removing elements without the need
to re-load the document by using $html->load($html->save()), which
is very inefficient.

Find more information about remove() at
https://simplehtmldom.sourceforge.io/docs/1.9/api/simple_html_dom_node/remove/
2019-06-01 21:29:57 +02:00

39 lines
1.2 KiB
PHP

<?php
class ScmbBridge extends BridgeAbstract {
const MAINTAINER = 'Astalaseven';
const NAME = 'Se Coucher Moins Bête Bridge';
const URI = 'http://secouchermoinsbete.fr';
const CACHE_TIMEOUT = 21600; // 6h
const DESCRIPTION = 'Returns the newest anecdotes.';
public function collectData(){
$html = '';
$html = getSimpleHTMLDOM(self::URI)
or returnServerError('Could not request Se Coucher Moins Bete.');
foreach($html->find('article') as $article) {
$item = array();
$item['uri'] = self::URI . $article->find('p.summary a', 0)->href;
$item['title'] = $article->find('header h1 a', 0)->innertext;
// remove text "En savoir plus" from anecdote content
$article->find('span.read-more', 0)->remove();
$content = $article->find('p.summary a', 0)->innertext;
// remove superfluous spaces at the end
$content = substr($content, 0, strlen($content) - 17);
// get publication date
$str_date = $article->find('time', 0)->datetime;
list($date, $time) = explode(' ', $str_date);
list($y, $m, $d) = explode('-', $date);
list($h, $i) = explode(':', $time);
$timestamp = mktime($h, $i, 0, $m, $d, $y);
$item['timestamp'] = $timestamp;
$item['content'] = $content;
$this->items[] = $item;
}
}
}