forked from blallo/rss-bridge
f1fb95b257
- returnError, returnServerError, returnClientError, debugMessage are moved to lib/error.php - getContents, getSimpleHTMLDOM, getSimpleHTMLDOMCached are moved to lib/contents.php Signed-off-by: Pierre Mazière <pierre.maziere@gmx.com>
76 lines
2 KiB
PHP
76 lines
2 KiB
PHP
<?php
|
|
/**
 * Bridge that expands the Atom feed of a WordPress site so that each item
 * carries the article body scraped from the post page.
 *
 * The feed is read from "<blog url>/feed/atom/". For every feed item the
 * linked page is loaded, the first matching content container is located and
 * its inner HTML (minus scripts, forms and the "wpa" div) replaces the item
 * content.
 */
class WordPressBridge extends FeedExpander {

    const MAINTAINER = "aledeg";
    const NAME = "Wordpress Bridge";
    const URI = "https://wordpress.org/";
    const DESCRIPTION = "Returns the newest full posts of a Wordpress powered website";

    const PARAMETERS = array( array(
        'url'=>array(
            'name'=>'Blog URL',
            'required'=>true
        )
    ));

    /**
     * Strips unwanted markup from an article body.
     *
     * Removes <script> elements, everything from a `<div class="wpa"` opening
     * tag to the end of that line, and <form> elements.
     *
     * @param string $content Raw inner HTML of the article container.
     * @return string The cleaned HTML. If a pattern fails at the PCRE level the
     *                content is left as it was before that pattern was applied.
     */
    private function clearContent($content) {
        $patterns = array(
            // 's' lets '.' span newlines and the lazy quantifier stops at the
            // first closing tag, so multi-line scripts and scripts containing
            // '<' are removed without swallowing the markup that follows.
            '/<script\b[^>]*>.*?<\/script>/is',
            // Intentionally unchanged: without 's' this only removes the rest
            // of the line on which the "wpa" div starts.
            '/<div class="wpa".*/',
            // Same reasoning as for scripts: handle multi-line forms and keep
            // the content that sits between two separate forms.
            '/<form\b.*?<\/form>/is',
        );

        foreach($patterns as $pattern) {
            $cleaned = preg_replace($pattern, '', $content);
            // preg_replace() returns null on error (e.g. backtrack limit);
            // keep the previous content instead of discarding the article.
            if(!is_null($cleaned)) {
                $content = $cleaned;
            }
        }

        return $content;
    }

    /**
     * Builds a feed item and replaces its content with the full article body
     * when the post page can be loaded and a known content container is found.
     *
     * @param mixed $newItem Feed entry as handed over by the parent class.
     * @return array The item returned by parent::parseItem(), with 'content'
     *               overwritten when an article container was found.
     */
    protected function parseItem($newItem){
        $item = parent::parseItem($newItem);

        // Without a link there is no page to expand.
        if(empty($item['uri'])) {
            return $item;
        }

        $article_html = getSimpleHTMLDOMCached($item['uri']);

        // NOTE(review): the helper is defined outside this file; it is assumed
        // to yield a non-object (false/null) when the page cannot be fetched
        // or parsed. In that case keep the item exactly as the feed provided it.
        if(!is_object($article_html)) {
            return $item;
        }

        // Candidate containers, most specific/common first; the first hit wins.
        $selectors = array(
            'article',         // most common content element
            '.single-content', // another common content div
            '.post-content',   // another common content div
            '.post',           // old WordPress themes without HTML5
        );

        foreach($selectors as $selector) {
            $article = $article_html->find($selector, 0);
            if(!is_null($article)) {
                $item['content'] = $this->clearContent($article->innertext);
                break;
            }
        }

        return $item;
    }

    /**
     * Returns the blog URL given by the user, or the bridge's default URI
     * when no URL was provided.
     *
     * @return string
     */
    public function getURI(){
        $url = $this->getInput('url');

        return empty($url) ? static::URI : $url;
    }

    /**
     * Validates the requested URL and collects the items of the site's Atom feed.
     *
     * Only URLs starting with "http://" or "https://" are accepted. A bare
     * "http" prefix test would also let values such as "httpfoo" or
     * "http/../x" through, which are not http(s) URLs at all.
     */
    public function collectData(){
        $url = $this->getInput('url');

        if($url && preg_match('#^https?://#i', $url) !== 1) {
            // just in case someone finds a way to access local files by playing with the url
            returnClientError('The url parameter must either refer to http or https protocol.');
            // NOTE(review): returnClientError() lives outside this file and
            // presumably aborts the request; return anyway so nothing is
            // fetched if it ever does not.
            return;
        }

        // Drop trailing slashes so the feed path is not joined with "//".
        $this->collectExpandableDatas(rtrim($this->getURI(), '/') . '/feed/atom/');
    }

    /**
     * @return int Cache lifetime in seconds.
     */
    public function getCacheDuration() {
        return 3600*3; // 3 hours
    }
}
|