<?php class CollegeDeFranceBridge extends BridgeAbstract { const MAINTAINER = 'pit-fgfjiudghdf'; const NAME = 'CollegeDeFrance'; const URI = 'https://www.college-de-france.fr/'; const CACHE_TIMEOUT = 10800; // 3h const DESCRIPTION = 'Returns the latest audio and video from CollegeDeFrance'; public function collectData(){ $months = array( '01' => 'janv.', '02' => 'févr.', '03' => 'mars', '04' => 'avr.', '05' => 'mai', '06' => 'juin', '07' => 'juil.', '08' => 'août', '09' => 'sept.', '10' => 'oct.', '11' => 'nov.', '12' => 'déc.' ); // The "API" used by the site returns a list of partial HTML in this form /* <li> * <a href="/site/thomas-romer/guestlecturer-2016-04-15-14h30.htm" data-target="after"> * <span class="date"><span class="list-icon list-icon-video"></span> * <span class="list-icon list-icon-audio"></span>15 avr. 2016</span> * <span class="lecturer">Christopher Hays</span> * <span class='title'>Imagery of Divine Suckling in the Hebrew Bible and the Ancient Near East</span> * </a> * </li> */ $html = getSimpleHTMLDOM(self::URI . 'components/search-audiovideo.jsp?fulltext=&siteid=1156951719600&lang=FR&type=all') or returnServerError('Could not request CollegeDeFrance.'); foreach($html->find('a[data-target]') as $element) { $item = array(); $item['title'] = $element->find('.title', 0)->plaintext; // Most relative URLs contains an hour in addition to the date, so let's use it // <a href="/site/yann-lecun/course-2016-04-08-11h00.htm" data-target="after"> // // Sometimes there's an __1, perhaps it signifies an update // "/site/patrick-boucheron/seminar-2016-05-03-18h00__1.htm" // // But unfortunately some don't have any hours info // <a href="/site/institut-physique/ // The-Mysteries-of-Decoherence-Sebastien-Gleyzes-[Video-3-35].htm" data-target="after"> $timezone = new DateTimeZone('Europe/Paris'); // strpos($element->href, '201') will break in 2020 but it'll // probably break prior to then due to site changes anyway $d = DateTime::createFromFormat( '!Y-m-d-H\hi', substr($element->href, strpos($element->href, '201'), 16), $timezone ); if(!$d) { $d = DateTime::createFromFormat( '!d m Y', trim(str_replace( array_values($months), array_keys($months), $element->find('.date', 0)->plaintext )), $timezone ); } $item['timestamp'] = $d->format('U'); $item['content'] = $element->find('.lecturer', 0)->innertext . ' - ' . $element->find('.title', 0)->innertext; $item['uri'] = self::URI . $element->href; $this->items[] = $item; } } }