12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970 |
- <?php
- class CollegeDeFranceBridge extends BridgeAbstract{
- const MAINTAINER = "pit-fgfjiudghdf";
- const NAME = "CollegeDeFrance";
- const URI = "http://www.college-de-france.fr/";
- const CACHE_TIMEOUT = 10800; // 3h
- const DESCRIPTION = "Returns the latest audio and video from CollegeDeFrance";
- public function collectData(){
- $months = array(
- '01' => 'janv.',
- '02' => 'févr.',
- '03' => 'mars',
- '04' => 'avr.',
- '05' => 'mai',
- '06' => 'juin',
- '07' => 'juil.',
- '08' => 'août',
- '09' => 'sept.',
- '10' => 'oct.',
- '11' => 'nov.',
- '12' => 'déc.'
- );
- // The "API" used by the site returns a list of partial HTML in this form
- /* <li>
- * <a href="/site/thomas-romer/guestlecturer-2016-04-15-14h30.htm" data-target="after">
- * <span class="date"><span class="list-icon list-icon-video"></span><span class="list-icon list-icon-audio"></span>15 avr. 2016</span>
- * <span class="lecturer">Christopher Hays</span>
- * <span class='title'>Imagery of Divine Suckling in the Hebrew Bible and the Ancient Near East</span>
- * </a>
- * </li>
- */
- $html = getSimpleHTMLDOM(self::URI.'components/search-audiovideo.jsp?fulltext=&siteid=1156951719600&lang=FR&type=all')
- or returnServerError('Could not request CollegeDeFrance.');
- foreach($html->find('a[data-target]') as $element) {
- $item = array();
- $item['title'] = $element->find('.title', 0)->plaintext;
- // Most relative URLs contains an hour in addition to the date, so let's use it
- // <a href="/site/yann-lecun/course-2016-04-08-11h00.htm" data-target="after">
- //
- // Sometimes there's an __1, perhaps it signifies an update "/site/patrick-boucheron/seminar-2016-05-03-18h00__1.htm"
- //
- // But unfortunately some don't have any hours info
- // <a href="/site/institut-physique/The-Mysteries-of-Decoherence-Sebastien-Gleyzes-[Video-3-35].htm" data-target="after">
- $timezone = new DateTimeZone('Europe/Paris');
- // strpos($element->href, '201') will break in 2020 but it'll probably break prior to then due to site changes anyway
- $d = DateTime::createFromFormat(
- '!Y-m-d-H\hi',
- substr($element->href, strpos($element->href, '201'), 16),
- $timezone
- );
- if(!$d){
- $d=DateTime::createFromFormat(
- '!d m Y',
- trim(str_replace(
- array_values($months),
- array_keys($months),
- $element->find('.date', 0)->plaintext
- )),
- $timezone
- );
- }
- $item['timestamp'] = $d->format('U');
- $item['content'] = $element->find('.lecturer', 0)->innertext . ' - ' . $element->find('.title', 0)->innertext;
- $item['uri'] = self::URI . $element->href;
- $this->items[] = $item;
- }
- }
- }
|