parent
5c6c79baf4
commit
91e73b00b5
1 changed files with 194 additions and 0 deletions
194
bridges/NationalGeographicBridge.php
Normal file
194
bridges/NationalGeographicBridge.php
Normal file
|
@ -0,0 +1,194 @@
|
|||
<?php
|
||||
class NationalGeographicBridge extends BridgeAbstract {
|
||||
|
||||
const CONTEXT_BY_TOPIC = 'By Topic';
|
||||
const PARAMETER_TOPIC = 'topic';
|
||||
const PARAMETER_FULL_ARTICLE = 'full';
|
||||
const TOPIC_MAGAZINE = 'Magazine';
|
||||
const TOPIC_LATEST_STORIES = 'Latest Stories';
|
||||
|
||||
const NAME = 'National Geographic';
|
||||
const URI = 'https://www.nationalgeographic.com/';
|
||||
const DESCRIPTION = 'Fetches the latest articles from the National Geographic Magazine';
|
||||
const MAINTAINER = 'logmanoriginal';
|
||||
const PARAMETERS = array(
|
||||
self::CONTEXT_BY_TOPIC => array(
|
||||
self::PARAMETER_TOPIC => array(
|
||||
'name' => 'Topic',
|
||||
'type' => 'list',
|
||||
'values' => array(
|
||||
self::TOPIC_MAGAZINE => 'magazine',
|
||||
self::TOPIC_LATEST_STORIES => 'latest-stories'
|
||||
),
|
||||
'title' => 'Select your topic',
|
||||
'defaultValue' => 'Magazine'
|
||||
)
|
||||
),
|
||||
'global' => array(
|
||||
self::PARAMETER_FULL_ARTICLE => array(
|
||||
'name' => 'Full Article',
|
||||
'type' => 'checkbox',
|
||||
'title' => 'Enable to load full articles (takes longer)'
|
||||
)
|
||||
)
|
||||
);
|
||||
|
||||
private $topicName = '';
|
||||
|
||||
public function getURI() {
|
||||
switch ($this->queriedContext) {
|
||||
case self::CONTEXT_BY_TOPIC: {
|
||||
return self::URI . $this->getInput(self::PARAMETER_TOPIC);
|
||||
} break;
|
||||
default: {
|
||||
return parent::getURI();
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
public function collectData() {
|
||||
$this->topicName = $this->getTopicName($this->getInput(self::PARAMETER_TOPIC));
|
||||
|
||||
switch($this->topicName) {
|
||||
case self::TOPIC_MAGAZINE: {
|
||||
return $this->collectMagazine();
|
||||
} break;
|
||||
case self::TOPIC_LATEST_STORIES: {
|
||||
return $this->collectLatestStories();
|
||||
} break;
|
||||
default: {
|
||||
returnServerError('Unknown topic: "' . $this->topicName . '"');
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
public function getName() {
|
||||
switch ($this->queriedContext) {
|
||||
case self::CONTEXT_BY_TOPIC: {
|
||||
return static::NAME . ': ' . $this->topicName;
|
||||
} break;
|
||||
default: {
|
||||
return parent::getName();
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
private function getTopicName($topic) {
|
||||
return array_search($topic, static::PARAMETERS[self::CONTEXT_BY_TOPIC][self::PARAMETER_TOPIC]['values']);
|
||||
}
|
||||
|
||||
private function collectMagazine() {
|
||||
$uri = $this->getURI();
|
||||
|
||||
$html = getSimpleHTMLDOM($uri)
|
||||
or returnServerError('Could not request ' . $uri);
|
||||
|
||||
$script = $html->find('#lead-component script')[0];
|
||||
|
||||
$json = json_decode($script->innertext, true);
|
||||
|
||||
// This is probably going to break in the future, fix it then :)
|
||||
foreach($json['body']['0']['multilayout_promo_beta']['stories'] as $story) {
|
||||
$this->addStory($story);
|
||||
}
|
||||
}
|
||||
|
||||
private function collectLatestStories() {
|
||||
$uri = self::URI . 'latest-stories/_jcr_content/content/hubfeed.promo-hub-feed-all-stories.json';
|
||||
|
||||
$json_raw = getContents($uri)
|
||||
or returnServerError('Could not request ' . $uri);
|
||||
|
||||
foreach(json_decode($json_raw, true) as $story) {
|
||||
$this->addStory($story);
|
||||
}
|
||||
}
|
||||
|
||||
private function addStory($story) {
|
||||
$title = 'Unknown title';
|
||||
$content = '';
|
||||
|
||||
foreach($story['components'] as $component) {
|
||||
switch($component['content_type']) {
|
||||
case 'title': {
|
||||
$title = $component['title']['text'];
|
||||
} break;
|
||||
case 'dek': {
|
||||
$content = $component['dek']['text'];
|
||||
} break;
|
||||
}
|
||||
}
|
||||
|
||||
$item = array();
|
||||
|
||||
$item['uri'] = $story['uri'];
|
||||
$item['title'] = $title;
|
||||
|
||||
// if full article is requested!
|
||||
if ($this->getInput(self::PARAMETER_FULL_ARTICLE))
|
||||
$item['content'] = $this->getFullArticle($item['uri']);
|
||||
else
|
||||
$item['content'] = $content;
|
||||
|
||||
if (isset($story['promo_image'])) {
|
||||
switch($story['promo_image']['content_type']) {
|
||||
case 'image': {
|
||||
$item['enclosures'][] = $story['promo_image']['image']['uri'];
|
||||
} break;
|
||||
}
|
||||
}
|
||||
|
||||
if (isset($story['lead_media'])) {
|
||||
$media = $story['lead_media'];
|
||||
switch($media['content_type']) {
|
||||
case 'image': {
|
||||
// Don't add if promo_image was added
|
||||
if (empty($item['enclosures']))
|
||||
$item['enclosures'][] = $media['image']['uri'];
|
||||
} break;
|
||||
case 'image_gallery': {
|
||||
foreach($media['image_gallery']['images'] as $image) {
|
||||
$item['enclosures'][] = $image['uri'];
|
||||
}
|
||||
} break;
|
||||
}
|
||||
}
|
||||
|
||||
$this->items[] = $item;
|
||||
}
|
||||
|
||||
private function getFullArticle($uri) {
|
||||
$html = getSimpleHTMLDOMCached($uri)
|
||||
or returnServerError('Could not load ' . $uri);
|
||||
|
||||
$html = defaultLinkTo($html, $uri);
|
||||
|
||||
$content = '';
|
||||
|
||||
foreach($html->find('
|
||||
.content > .smartbody.text,
|
||||
.content > .section.image script[type="text/json"],
|
||||
.content > .section.image span[itemprop="caption"],
|
||||
.content > .section.inline script[type="text/json"]
|
||||
') as $element) {
|
||||
if ($element->tag === 'script') {
|
||||
$json = json_decode($element->innertext, true);
|
||||
if (isset($json['src'])) {
|
||||
$content .= '<img src="' . $json['src'] . '" width="100%" alt="' . $json['alt'] . '">';
|
||||
} elseif (isset($json['galleryType']) && isset($json['endpoint'])) {
|
||||
$doc = getContents($json['endpoint'])
|
||||
or returnServerError('Could not load ' . $json['endpoint']);
|
||||
$json = json_decode($doc, true);
|
||||
foreach($json['items'] as $item) {
|
||||
$content .= '<p>' . $item['caption'] . '</p>';
|
||||
$content .= '<img src="' . $item['url'] . '" width="100%" alt="' . $item['caption'] . '">';
|
||||
}
|
||||
}
|
||||
} else {
|
||||
$content .= $element->outertext;
|
||||
}
|
||||
}
|
||||
|
||||
return $content;
|
||||
}
|
||||
}
|
Loading…
Reference in a new issue