1
0
Fork 0
forked from blallo/rss-bridge
rss-bridge/bridges/WordPressBridge.php
2017-02-15 19:38:32 +01:00

76 lines
2.1 KiB
PHP

<?php
/**
 * Bridge that expands the Atom feed of a WordPress site into full posts.
 *
 * For every feed entry the linked article page is fetched and the first
 * matching content container replaces the (usually truncated) feed content.
 */
class WordPressBridge extends FeedExpander {

	const MAINTAINER = 'aledeg';
	const NAME = 'Wordpress Bridge';
	const URI = 'https://wordpress.org/';
	const CACHE_TIMEOUT = 10800; // 3h
	const DESCRIPTION = 'Returns the newest full posts of a Wordpress powered website';

	const PARAMETERS = array( array(
		'url' => array(
			'name' => 'Blog URL',
			'required' => true
		)
	));

	/**
	 * Strips markup that is useless in a feed reader from an article body.
	 *
	 * @param string $content Raw inner HTML of the article container.
	 * @return string The HTML with script blocks, the "wpa" div and forms removed.
	 */
	private function clearContent($content){
		$patterns = array(
			// Script blocks. The body is matched lazily and across newlines so
			// that scripts containing "<" (comparisons, inline markup) are
			// removed as well.
			'/<script\b[^>]*>.*?<\/script>/is',
			// Everything from the opening "wpa" div up to the end of that line.
			'/<div class="wpa".*/',
			// Forms. Lazy matching keeps the text located between two
			// separate forms instead of swallowing it.
			'/<form\b.*?<\/form>/is',
		);

		foreach($patterns as $pattern){
			$cleaned = preg_replace($pattern, '', $content);

			// preg_replace() returns null on a PCRE failure (e.g. backtrack
			// limit reached); keep the previous text rather than losing it.
			if(!is_null($cleaned)){
				$content = $cleaned;
			}
		}

		return $content;
	}

	/**
	 * Parses one feed entry and replaces its content with the full article.
	 *
	 * The item is returned as produced by the parent parser whenever it has no
	 * URI, the article page cannot be loaded, or no known container is found.
	 *
	 * @param mixed $newItem Feed entry, passed through to the parent parser.
	 * @return array The parsed item, with 'content' replaced when possible.
	 */
	protected function parseItem($newItem){
		$item = parent::parseItem($newItem);

		if(empty($item['uri'])){
			return $item;
		}

		$article_html = getSimpleHTMLDOMCached($item['uri']);

		// NOTE(review): assumes the helper yields a non-object (false/null)
		// when the page cannot be fetched or parsed - confirm against its
		// implementation. Guarding avoids a fatal error on ->find().
		if(!is_object($article_html)){
			return $item;
		}

		// Candidate containers, tried in order; the first match wins.
		$selectors = array(
			'article',         // most common content div
			'.single-content', // another common content div
			'.post-content',   // another common content div
			'.post',           // for old WordPress themes without HTML5
		);

		foreach($selectors as $selector){
			$article = $article_html->find($selector, 0);

			if(!is_null($article)){
				$item['content'] = $this->clearContent($article->innertext);
				break;
			}
		}

		return $item;
	}

	/**
	 * Returns the blog URL supplied by the user, or the parent's URI when the
	 * 'url' input is empty.
	 *
	 * @return string
	 */
	public function getURI(){
		$url = $this->getInput('url');

		if(empty($url)){
			$url = parent::getURI();
		}

		return $url;
	}

	/**
	 * Collects the feed items of the configured blog.
	 *
	 * The pretty-permalink Atom endpoint is tried first; when that raises an
	 * HttpException the query-string form of the endpoint is used instead.
	 */
	public function collectData(){
		$url = $this->getInput('url');

		// Just in case someone finds a way to access local files by playing
		// with the url: require an explicit http:// or https:// scheme. A bare
		// "http" prefix is not enough, since values such as "httpd.conf" or
		// "http/../x" would pass it.
		if($url && !preg_match('#^https?://#i', $url)){
			returnClientError('The url parameter must either refer to http or https protocol.');
		}

		// Drop trailing slashes so the feed path is not appended as "//feed".
		$base = rtrim($this->getURI(), '/');

		try{
			$this->collectExpandableDatas($base . '/feed/atom/');
		}catch (HttpException $e){
			$this->collectExpandableDatas($base . '/?feed=atom');
		}
	}
}