1
0
Fork 0
forked from blallo/rss-bridge
rss-bridge/bridges/TwitterBridgeCleanExtended.php
Pierre Mazière f05bd15393 TwitterBridge*: fix HTML entities in title
Signed-off-by: Pierre Mazière <pierre.maziere@gmx.com>
2016-07-08 16:11:57 +02:00

90 lines
3.4 KiB
PHP

<?php
//Based on https://github.com/sebsauvage/rss-bridge/blob/master/bridges/TwitterBridgeClean.php by vinzv
class TwitterBridgeCleanExtended extends BridgeAbstract{
private $request;
public function loadMetadatas() {
$this->maintainer = "Max Mehl";
$this->name = "Twitter Bridge Clean Extended";
$this->uri = "http://twitter.com/";
$this->description = "Returns user timelines showing RTs correctly or search results for keywords/hashtags (without using their API).";
$this->update = "2016-01-27";
$this->parameters["By keyword or hashtag"] =
'[
{
"name" : "Keyword or #hashtag",
"identifier" : "q"
}
]';
$this->parameters["By username"] =
'[
{
"name" : "username",
"identifier" : "u"
}
]';
}
public function collectData(array $param){
$html = '';
if (isset($param['q'])) { /* keyword search mode */
$this->request = $param['q'];
$html = $this->file_get_html('https://twitter.com/search?q='.urlencode($this->request).'&f=tweets') or $this->returnError('No results for this query.', 404);
}
elseif (isset($param['u'])) { /* user timeline mode */
$this->request = $param['u'];
$html = $this->file_get_html('http://twitter.com/'.urlencode($this->request)) or $this->returnError('Requested username can\'t be found.', 404);
}
else {
$this->returnError('You must specify a keyword (?q=...) or a Twitter username (?u=...).', 400);
}
foreach($html->find('div.js-stream-tweet') as $tweet) {
$item = new \Item();
$item->username = $tweet->getAttribute('data-screen-name'); // extract username and sanitize
$item->fullname = $tweet->getAttribute('data-name'); // extract fullname (pseudonym)
$item->avatar = $tweet->find('img', 0)->src; // get avatar link
$item->id = $tweet->getAttribute('data-tweet-id'); // get TweetID
$item->uri = 'https://twitter.com'.$tweet->find('a.js-permalink', 0)->getAttribute('href'); // get tweet link
$item->timestamp = $tweet->find('span.js-short-timestamp', 0)->getAttribute('data-time'); // extract tweet timestamp
// processing content links
foreach($tweet->find('a') as $link) {
if($link->hasAttribute('data-expanded-url') ) {
$link->href = $link->getAttribute('data-expanded-url');
}
$link->removeAttribute('data-expanded-url');
$link->removeAttribute('data-query-source');
$link->removeAttribute('rel');
$link->removeAttribute('class');
$link->removeAttribute('target');
$link->removeAttribute('title');
$link->removeAttribute('dir');
}
$item->content = str_replace('pic.twitter.com', 'https://pic.twitter.com', strip_tags($tweet->find('p.js-tweet-text', 0)->innertext)); // extract tweet text
if(isset($param['u'])) {
if($item->username != $param['u']) {
$item->content = '&#9851; @' . $item->username . ': ' . $item->content;
}
}
$item->title = html_entity_decode($item->content,ENT_QUOTES,'UTF-8');
$this->items[] = $item;
}
}
public function getName(){
return (!empty($this->request) ? $this->request : '');
}
public function getURI(){
return 'http://twitter.com';
}
public function getCacheDuration(){
return 300; // 5 minutes
}
}