[RadioMelodieBridge] Update to support new Website (#1101)
* [RadioMelodieBridge] Update to support new Website
This commit is contained in:
parent
7b8dd93a8e
commit
f9c4a84c25
1 changed files with 71 additions and 17 deletions
|
@ -1,34 +1,88 @@
|
||||||
<?php
|
<?php
|
||||||
class RadioMelodieBridge extends BridgeAbstract {
|
class RadioMelodieBridge extends BridgeAbstract {
|
||||||
const NAME = 'Radio Melodie Actu';
|
const NAME = 'Radio Melodie Actu';
|
||||||
const URI = 'https://www.radiomelodie.com/';
|
const URI = 'https://www.radiomelodie.com';
|
||||||
const DESCRIPTION = 'Retourne les actualités publiées par Radio Melodie';
|
const DESCRIPTION = 'Retourne les actualités publiées par Radio Melodie';
|
||||||
const MAINTAINER = 'sysadminstory';
|
const MAINTAINER = 'sysadminstory';
|
||||||
|
|
||||||
public function getIcon() {
|
public function getIcon() {
|
||||||
return self::URI . 'img/favicon.png';
|
return self::URI . '/img/favicon.png';
|
||||||
}
|
}
|
||||||
|
|
||||||
public function collectData(){
|
public function collectData(){
|
||||||
$html = getSimpleHTMLDOM(self::URI . 'actu')
|
$html = getSimpleHTMLDOM(self::URI . '/actu/')
|
||||||
or returnServerError('Could not request Radio Melodie.');
|
or returnServerError('Could not request Radio Melodie.');
|
||||||
$list = $html->find('div[class=actuitem]');
|
$list = $html->find('div[class=actu_col1]', 0)->children();;
|
||||||
foreach($list as $element) {
|
foreach($list as $element) {
|
||||||
|
if($element->tag == 'a') {
|
||||||
|
$articleURL = self::URI . $element->href;
|
||||||
|
$article = getSimpleHTMLDOM($articleURL);
|
||||||
|
|
||||||
|
// Initialise arrays
|
||||||
$item = array();
|
$item = array();
|
||||||
|
$audio = array();
|
||||||
|
$picture = array();
|
||||||
|
|
||||||
// Get picture URL
|
// Get the Main picture URL
|
||||||
$pictureHTML = $element->find('div[class=picture]');
|
$picture[] = $this->rewriteImage($article->find('img[id=picturearticle]', 0)->src);
|
||||||
preg_match(
|
$audioHTML = $article->find('div[class=sm2-playlist-wrapper]');
|
||||||
'/background-image:url\((.*)\);/',
|
|
||||||
$pictureHTML[0]->getAttribute('style'),
|
|
||||||
$pictures);
|
|
||||||
$pictureURL = $pictures[1];
|
|
||||||
|
|
||||||
$item['enclosures'] = array($pictureURL);
|
// Remove the audio placeholder under the Audio player with an <audio>
|
||||||
$item['uri'] = self::URI . $element->parent()->href;
|
// element and add the audio element to the enclosure
|
||||||
$item['title'] = $element->find('h3', 0)->plaintext;
|
foreach($audioHTML as $audioElement) {
|
||||||
$item['content'] = $element->find('p', 0)->plaintext . '<br/><img src="' . $pictureURL . '"/>';
|
$audioURL = $audioElement->find('a', 0)->href;
|
||||||
|
$audio[] = $audioURL;
|
||||||
|
$audioElement->outertext = '<audio controls src="' . $audioURL . '"></audio>';
|
||||||
|
$article->save();
|
||||||
|
}
|
||||||
|
|
||||||
|
// Rewrite pictures URL
|
||||||
|
$imgs = $article->find('img[src^="https://www.radiomelodie.com/image.php]');
|
||||||
|
foreach($imgs as $img) {
|
||||||
|
$img->src = $this->rewriteImage($img->src);
|
||||||
|
$article->save();
|
||||||
|
}
|
||||||
|
|
||||||
|
// Remove inline audio player HTML
|
||||||
|
$inlinePlayers = $article->find('div[class*=sm2-main-controls]');
|
||||||
|
foreach($inlinePlayers as $inlinePlayer) {
|
||||||
|
$inlinePlayer->outertext = '';
|
||||||
|
$article->save();
|
||||||
|
}
|
||||||
|
|
||||||
|
// Remove Google Ads
|
||||||
|
$ads = $article->find('div[style^=margin:25px 0; position:relative; height:auto;]');
|
||||||
|
foreach($ads as $ad) {
|
||||||
|
$ad->outertext = '';
|
||||||
|
$article->save();
|
||||||
|
}
|
||||||
|
|
||||||
|
$author = $article->find('div[id=author]', 0)->find('span', 0)->plaintext;
|
||||||
|
|
||||||
|
$item['enclosures'] = array_merge($picture, $audio);
|
||||||
|
$item['author'] = $author;
|
||||||
|
$item['uri'] = $articleURL;
|
||||||
|
$item['title'] = $article->find('meta[property=og:title]', 0)->content;
|
||||||
|
$date_category = $article->find('div[class*=date]', 0)->plaintext;
|
||||||
|
$header = $article->find('a[class=fancybox]', 0)->innertext;
|
||||||
|
$textDOM = $article->find('div[class=text_content]', 0);
|
||||||
|
$textDOM->find('div[id=author]', 0)->outertext = '';
|
||||||
|
$article->save();
|
||||||
|
$text = $textDOM->innertext;
|
||||||
|
$item['content'] = '<h1>' . $item['title'] . '</h1>' . $date_category . $header . $text;
|
||||||
$this->items[] = $item;
|
$this->items[] = $item;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Function to rewrite image URL to use the real Image URL and not the resized one (which is very slow)
|
||||||
|
*/
|
||||||
|
private function rewriteImage($url)
|
||||||
|
{
|
||||||
|
$parts = explode('?', $url);
|
||||||
|
parse_str($parts[1], $params);
|
||||||
|
return self::URI . '/' . $params['image'];
|
||||||
|
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in a new issue