2013-08-15 12:05:58 +02:00
< ? php
/**
* RssBridgeYoutube
* Returns the newest videos
*
* @ name Youtube Bridge
2014-05-25 23:27:14 +02:00
* @ homepage https :// www . youtube . com /
2014-06-20 17:00:36 +02:00
* @ description Returns the 10 newest videos by username / playlist or search
2014-05-21 19:15:52 +02:00
* @ maintainer mitsukarenai
2014-06-20 17:00:36 +02:00
* @ update 2014 - 06 - 20
2013-08-15 12:05:58 +02:00
* @ use1 ( u = " username " )
2014-05-14 12:39:12 +02:00
* @ use2 ( p = " playlist id " )
* @ use3 ( s = " search keyword " , pa = " page " )
2014-05-14 14:34:06 +02:00
*
* WARNING : to parse big playlists ( over ~ 90 videos ), you need to edit simple_html_dom . php :
* change : define ( 'MAX_FILE_SIZE' , 600000 );
* into : define ( 'MAX_FILE_SIZE' , 900000 ); ( or more )
2013-08-15 12:05:58 +02:00
*/
class YoutubeBridge extends BridgeAbstract {

    /**
     * Label of the current feed. Initialised with the raw request parameter
     * (username, playlist id or search keyword) and replaced by a
     * human-readable label in playlist and search modes. Read by getName().
     */
    private $request;

    /**
     * Scrapes Youtube and appends the resulting items to $this->items.
     *
     * Exactly one mode is selected, checked in this order:
     *  - $param['u']: user timeline (at most 10 items, with publish dates)
     *  - $param['p']: playlist (at most 10 items, with publish dates)
     *  - $param['s']: search, optionally paged through $param['pa']
     *    (no item limit, no publish dates)
     *
     * Failures are reported through $this->returnError(), which is defined
     * outside this file (presumably it aborts the request - confirm against
     * BridgeAbstract).
     *
     * @param array $param Request parameters ('u', 'p', 's', 'pa').
     */
    public function collectData(array $param){
        $limit = 10;

        if (isset($param['u'])) { /* user timeline mode */
            $this->request = $param['u'];
            $html = file_get_html('https://www.youtube.com/user/' . urlencode($this->request) . '/videos') or $this->returnError('Could not request Youtube.', 404);

            $count = 0;
            foreach ($html->find('li.channels-content-item') as $element) {
                if ($count >= $limit) {
                    break; // limit reached: no need to walk the remaining entries
                }
                $item = new \Item();
                $item->id = $this->extractVideoId($element->find('a', 0)->href);
                $item->uri = 'https://www.youtube.com/watch?v=' . $item->id;
                // Thumbnail sources are prefixed with the scheme, as in the original code
                $item->thumbnailUri = 'https:' . $element->find('img', 0)->src;
                $item->title = trim($element->find('h3', 0)->plaintext);
                $item->timestamp = $this->getPublishDate($item->id);
                $item->content = $this->buildContent($item);
                $this->items[] = $item;
                $count++;
            }
        }
        else if (isset($param['p'])) { /* playlist mode */
            $this->request = $param['p'];
            $html = file_get_html('https://www.youtube.com/playlist?list=' . urlencode($this->request)) or $this->returnError('Could not request Youtube.', 404);

            $count = 0;
            foreach ($html->find('tr.pl-video') as $element) {
                if ($count >= $limit) {
                    break;
                }
                $item = new \Item();
                $item->uri = 'https://www.youtube.com' . $element->find('.pl-video-title a', 0)->href;
                // Swap the default thumbnail for the medium-quality variant
                $item->thumbnailUri = 'https:' . str_replace('/default.', '/mqdefault.', $element->find('.pl-video-thumbnail img', 0)->src);
                $item->title = trim($element->find('.pl-video-title a', 0)->plaintext);
                // Links may carry extra query parameters after the video id,
                // so the id is taken from the "v" parameter rather than by
                // stripping the "/watch?v=" prefix.
                $item->id = $this->extractVideoId($element->find('a', 0)->href);
                $item->timestamp = $this->getPublishDate($item->id);
                $item->content = $this->buildContent($item);
                $this->items[] = $item;
                $count++;
            }

            // The label only depends on the page, so it is computed once,
            // outside the loop; it is also set when the playlist has no rows.
            $title = $html->find('title', 0);
            $heading = $html->find('h1', 0);
            if ($title && $heading) {
                $this->request = 'Playlist ' . trim(str_replace(' - YouTube', '', $title->plaintext)) . ', by ' . $heading->plaintext;
            }
        }
        else if (isset($param['s'])) { /* search mode */
            $this->request = $param['s'];
            $page = 1;
            if (isset($param['pa'])) {
                // Keep digits only; a value without any digit yields page 0
                $page = (int) preg_replace('/[^0-9]/', '', $param['pa']);
            }
            $html = file_get_html('https://www.youtube.com/results?search_query=' . urlencode($this->request) . '&page=' . $page . '&filters=video&search_sort=video_date_uploaded') or $this->returnError('Could not request Youtube.', 404);

            foreach ($html->find('li.yt-lockup') as $element) {
                $item = new \Item();
                $link = $element->find('a', 0)->href;
                $image = $element->find('img', 0);
                $item->uri = 'https://www.youtube.com' . $link;
                // Prefer the "data-thumb" attribute and fall back to "src".
                // The comparison against false is kept from the original code
                // (presumably what the DOM parser returns for a missing attribute).
                $thumbnail = $image->getAttribute('data-thumb');
                $item->thumbnailUri = ($thumbnail !== false) ? $thumbnail : (string) $image->src;
                $item->title = trim($element->find('h3', 0)->plaintext);
                $item->id = $this->extractVideoId($link);
                // No timestamp in search mode: getPublishDate() performs one
                // HTTP request per item and this mode has no item limit.
                $item->content = $this->buildContent($item);
                $this->items[] = $item;
            }

            $title = $html->find('title', 0);
            if ($title) {
                $this->request = 'Search: ' . str_replace(' - YouTube', '', $title->plaintext);
            }
        }
        else {
            $this->returnError('You must either specify a Youtube username (?u=...) or a playlist id (?p=...) or search (?s=...)', 400);
        }
    }

    /**
     * Looks up the publication date of a video.
     *
     * Relies on the Youtube GData API (deprecated). This used to be a named
     * function declared inside collectData(), which made a second call to
     * collectData() fail with a function redeclaration error.
     *
     * @param string $id Video id.
     * @return int|false Unix timestamp, or false when the lookup fails.
     */
    private function getPublishDate($id) {
        $response = file_get_contents('https://gdata.youtube.com/feeds/api/videos/' . rawurlencode($id) . '?v=2&alt=json');
        if ($response === false) {
            return false;
        }

        $json = json_decode($response, true);
        if (!isset($json['entry']['published']['$t'])) {
            return false;
        }

        return strtotime($json['entry']['published']['$t']);
    }

    /**
     * Extracts the video id from a watch link.
     *
     * @param string $href Link such as "/watch?v=ID" (extra parameters allowed).
     * @return string Value of the "v" query parameter when present; otherwise
     *                the link with its "/watch?v=" prefix removed.
     */
    private function extractVideoId($href) {
        $query = parse_url($href, PHP_URL_QUERY);
        if (is_string($query)) {
            $arguments = array();
            parse_str($query, $arguments);
            if (isset($arguments['v']) && is_string($arguments['v'])) {
                return $arguments['v'];
            }
        }

        return str_replace('/watch?v=', '', $href);
    }

    /**
     * Builds the HTML body of an item: a linked thumbnail followed by a
     * linked title.
     *
     * @param object $item Item whose uri, thumbnailUri and title are already set.
     * @return string HTML snippet.
     */
    private function buildContent($item) {
        return '<a href="' . $item->uri . '"><img src="' . $item->thumbnailUri . '" /></a><br><a href="' . $item->uri . '">' . $item->title . '</a>';
    }

    /**
     * @return string Feed name: the current request label, when there is one,
     *                followed by the bridge name.
     */
    public function getName(){
        return (!empty($this->request) ? $this->request . ' - ' : '') . 'Youtube Bridge';
    }

    /**
     * @return string Address of the scraped site.
     */
    public function getURI(){
        return 'https://www.youtube.com/';
    }

    /**
     * @return int Cache lifetime in seconds.
     */
    public function getCacheDuration(){
        return 10800; // 3 hours
    }
}