Rss-Bridge/bridges/PcGamerBridge.php

45 lines
1.4 KiB
PHP
Raw Permalink Normal View History

<?php
class PcGamerBridge extends BridgeAbstract
{
2017-12-24 22:45:56 +01:00
const NAME = 'PC Gamer';
const URI = 'https://www.pcgamer.com/archive/';
2017-12-24 22:45:56 +01:00
const DESCRIPTION = 'PC Gamer Most Read Stories';
const CACHE_TIMEOUT = 3600;
const MAINTAINER = 'IceWreck, mdemoss';
2017-12-24 22:45:56 +01:00
public function collectData()
{
$html = getSimpleHTMLDOMCached($this->getURI(), 300);
$stories = $html->find('ul.basic-list li.day-article');
$i = 0;
// Find induvidual stories in the archive page
2017-12-24 22:45:56 +01:00
foreach ($stories as $element) {
if($i == 15) break;
2017-12-24 22:45:56 +01:00
$item['uri'] = $element->find('a', 0)->href;
// error_log(print_r($item['uri'], TRUE));
2017-12-24 22:45:56 +01:00
$articleHtml = getSimpleHTMLDOMCached($item['uri']);
$item['title'] = $element->find('a', 0)->plaintext;
2017-12-24 22:45:56 +01:00
$item['timestamp'] = strtotime($articleHtml->find('meta[name=pub_date]', 0)->content);
$item['author'] = $articleHtml->find('span.by-author a', 0)->plaintext;
// Get the article content
$articleContents = $articleHtml->find('#article-body', 0);
/*
By default the img src has a link to an error image and then the actual image
is added in by JS. So we replace the error image with the actual full size image
whoose link is in one of the attributes of the img tag
*/
foreach($articleContents->find('img') as $img) {
$imgsrc = $img->getAttribute('data-original-mos');
// error_log($imgsrc);
$img->src = $imgsrc;
}
$item['content'] = $articleContents;
2017-12-24 22:45:56 +01:00
$this->items[] = $item;
$i++;
2017-12-24 22:45:56 +01:00
}
}
}