Improve LeMondeDiploBridge.php

This commit is contained in:
Damien Calesse 2014-07-22 20:02:40 +02:00
parent 6d284ad5af
commit 1c38a91d41

View file

@ -10,6 +10,7 @@
* @description Returns most recent results from MondeDiplo. * @description Returns most recent results from MondeDiplo.
* @maintainer Pitchoule * @maintainer Pitchoule
*/ */
class MondeDiploBridge extends BridgeAbstract{ class MondeDiploBridge extends BridgeAbstract{
public function collectData(array $param){ public function collectData(array $param){
@ -17,24 +18,36 @@ class MondeDiploBridge extends BridgeAbstract{
$html = file_get_html($link) or $this->returnError('Could not request MondeDiplo. for : ' . $link , 404); $html = file_get_html($link) or $this->returnError('Could not request MondeDiplo. for : ' . $link , 404);
foreach($html->find('div[class=grid_10 alpha omega laune]') as $element) { foreach($html->find('div.laune') as $element) {
$item = new Item(); $item = new Item();
$item->uri = 'http://www.monde-diplomatique.fr'.$element->find('a', 0)->href; $item->uri = 'http://www.monde-diplomatique.fr'.$element->find('a', 0)->href;
$NumArticle = explode("/", $element->find('a', 0)->href);
$item->title = $element->find('h3', 0)->plaintext; $item->title = $element->find('h3', 0)->plaintext;
$item->content = $element->find('div[class=crayon article-intro-'.$NumArticle[4].' intro]', 0)->plaintext; $item->content = $element->find('div.dates_auteurs', 0)->plaintext. '<br>' .strstr($element->find('div', 0)->plaintext, $element->find('div.dates_auteurs', 0)->plaintext, true);
$this->items[] = $item; $this->items[] = $item;
} }
foreach($html->find('div.titraille') as $element) { $liste = $html->find('div.listes', 0); // First list
foreach ($liste->find('li') as $e) {
$item = new Item();
$item->uri = 'http://www.monde-diplomatique.fr' . $e->find('a', 0)->href;
$item->title = $e->find('a', 0)->plaintext;
$item->content = $e->find('div.dates_auteurs', 0)->plaintext;
$this->items[] = $item;
}
foreach($html->find('div.liste ul li') as $element) {
if ($element->getAttribute('class') != 'intrapub') {
$item = new Item(); $item = new Item();
$item->uri = 'http://www.monde-diplomatique.fr'.$element->find('a', 0)->href; $item->uri = 'http://www.monde-diplomatique.fr'.$element->find('a', 0)->href;
$item->title = $element->find('h3', 0)->plaintext; $item->title = $element->find('h3', 0)->plaintext;
$item->content = $element->find('div.dates_auteurs', 0)->plaintext; $item->content = $element->find('div.dates_auteurs', 0)->plaintext . ' <br> ' . $element->find('div.intro', 0)->plaintext;
$this->items[] = $item; $this->items[] = $item;
} }
} }
}
public function getName(){ public function getName(){
return 'Monde Diplomatique'; return 'Monde Diplomatique';
} }