2016-01-19 19:20:21 +01:00
|
|
|
<?php
|
2016-09-10 19:11:09 +02:00
|
|
|
class JapanExpoBridge extends BridgeAbstract {
|
2016-01-19 19:20:21 +01:00
|
|
|
|
2017-02-11 16:16:56 +01:00
|
|
|
const MAINTAINER = 'Ginko';
|
|
|
|
const NAME = 'Japan Expo Actualités';
|
|
|
|
const URI = 'http://www.japan-expo-paris.com/fr/actualites';
|
|
|
|
const CACHE_TIMEOUT = 14400; // 4h
|
|
|
|
const DESCRIPTION = 'Returns most recent entries from Japan Expo actualités.';
|
|
|
|
const PARAMETERS = array( array(
|
|
|
|
'mode' => array(
|
|
|
|
'name' => 'Show full contents',
|
|
|
|
'type' => 'checkbox',
|
|
|
|
)
|
|
|
|
));
|
2016-01-19 19:20:21 +01:00
|
|
|
|
2017-02-11 16:16:56 +01:00
|
|
|
public function collectData(){
|
2016-01-19 19:20:21 +01:00
|
|
|
|
2017-02-11 16:16:56 +01:00
|
|
|
function frenchPubDateToTimestamp($date_to_parse) {
|
|
|
|
return strtotime(
|
|
|
|
strtr(
|
|
|
|
strtolower(str_replace('Publié le ', '', $date_to_parse)),
|
|
|
|
array(
|
|
|
|
'janvier' => 'jan',
|
|
|
|
'février' => 'feb',
|
|
|
|
'mars' => 'march',
|
|
|
|
'avril' => 'apr',
|
|
|
|
'mai' => 'may',
|
|
|
|
'juin' => 'jun',
|
|
|
|
'juillet' => 'jul',
|
|
|
|
'août' => 'aug',
|
|
|
|
'septembre' => 'sep',
|
|
|
|
'octobre' => 'oct',
|
|
|
|
'novembre' => 'nov',
|
|
|
|
'décembre' => 'dec'
|
|
|
|
)
|
|
|
|
)
|
|
|
|
);
|
|
|
|
}
|
2016-06-25 12:12:33 +02:00
|
|
|
|
2017-02-11 16:16:56 +01:00
|
|
|
$convert_article_images = function($matches){
|
|
|
|
if(is_array($matches) && count($matches) > 1){
|
|
|
|
return '<img src="' . $matches[1] . '" />';
|
|
|
|
}
|
|
|
|
};
|
2016-01-19 19:20:21 +01:00
|
|
|
|
2017-02-11 16:16:56 +01:00
|
|
|
$html = getSimpleHTMLDOM(self::URI)
|
|
|
|
or returnServerError('Could not request JapanExpo: ' . self::URI);
|
|
|
|
$fullcontent = $this->getInput('mode');
|
|
|
|
$count = 0;
|
2016-06-25 12:12:33 +02:00
|
|
|
|
2017-02-11 16:16:56 +01:00
|
|
|
foreach($html->find('a._tile2') as $element){
|
2016-06-25 12:12:33 +02:00
|
|
|
|
2017-02-11 16:16:56 +01:00
|
|
|
$url = $element->href;
|
|
|
|
$thumbnail = 'http://s.japan-expo.com/katana/images/JES049/paris.png';
|
|
|
|
preg_match('/url\(([^)]+)\)/', $element->find('img.rspvimgset', 0)->style, $img_search_result);
|
2016-06-25 12:12:33 +02:00
|
|
|
|
2017-02-11 16:16:56 +01:00
|
|
|
if(count($img_search_result) >= 2)
|
|
|
|
$thumbnail = trim($img_search_result[1], "'");
|
2016-08-29 11:52:13 +02:00
|
|
|
|
2017-02-11 16:16:56 +01:00
|
|
|
if($fullcontent){
|
|
|
|
if($count >= 5){
|
|
|
|
break;
|
|
|
|
}
|
2016-06-25 12:12:33 +02:00
|
|
|
|
2017-02-11 16:16:56 +01:00
|
|
|
$article_html = getSimpleHTMLDOMCached('Could not request JapanExpo: ' . $url);
|
|
|
|
$header = $article_html->find('header.pageHeadBox', 0);
|
|
|
|
$timestamp = strtotime($header->find('time', 0)->datetime);
|
|
|
|
$title_html = $header->find('div.section', 0)->next_sibling();
|
|
|
|
$title = $title_html->plaintext;
|
|
|
|
$headings = $title_html->next_sibling()->outertext;
|
|
|
|
$article = $article_html->find('div.content', 0)->innertext;
|
|
|
|
$article = preg_replace_callback(
|
|
|
|
'/<img [^>]+ style="[^\(]+\(\'([^\']+)\'[^>]+>/i',
|
|
|
|
$convert_article_images,
|
|
|
|
$article);
|
|
|
|
|
|
|
|
$content = $headings . $article;
|
|
|
|
} else {
|
|
|
|
$date_text = $element->find('span.date', 0)->plaintext;
|
|
|
|
$timestamp = frenchPubDateToTimestamp($date_text);
|
|
|
|
$title = trim($element->find('span._title', 0)->plaintext);
|
|
|
|
$content = '<img src="'
|
|
|
|
. $thumbnail
|
|
|
|
. '"></img><br />'
|
|
|
|
. $date_text
|
|
|
|
. '<br /><a href="'
|
|
|
|
. $url
|
|
|
|
. '">Lire l\'article</a>';
|
|
|
|
}
|
|
|
|
|
|
|
|
$item = array();
|
|
|
|
$item['uri'] = $url;
|
|
|
|
$item['title'] = $title;
|
|
|
|
$item['timestamp'] = $timestamp;
|
|
|
|
$item['content'] = $content;
|
|
|
|
$this->items[] = $item;
|
|
|
|
$count++;
|
|
|
|
}
|
|
|
|
}
|
2016-01-19 19:20:21 +01:00
|
|
|
}
|