<?php
/**
 * RssBridgeYoutube
 * Returns the newest videos.
 * WARNING: to parse big playlists (over ~90 videos), you need to edit simple_html_dom.php:
 * change: define('MAX_FILE_SIZE', 600000);
 * into:   define('MAX_FILE_SIZE', 900000); (or more)
 */
class YoutubeBridge extends BridgeAbstract {

    /**
     * Declares the bridge metadata and the four query modes it accepts.
     *
     * Each entry of $this->parameters is a string holding a JSON array that
     * describes the input fields of one mode: username (u), channel id (c),
     * playlist id (p), or search keyword (s) with an optional page (pa).
     */
    public function loadMetadatas() {
        $this->name = 'YouTube Bridge';
        $this->homepage = $this->getURI();
        $this->description = 'Returns the 10 newest videos by username/channel/playlist or search';
        $this->maintainer = 'mitsukarenai';
        $this->update = '02/05/2016';

        $this->parameters['By username'] =
        '[
            {
                "type": "text",
                "identifier": "u",
                "name": "username",
                "exampleValue": "test",
                "required": "required"
            }
        ]';

        $this->parameters['By channel id'] =
        '[
            {
                "type": "text",
                "identifier": "c",
                "name": "channel id",
                "exampleValue": "15",
                "required": "required"
            }
        ]';

        $this->parameters['By playlist Id'] =
        '[
            {
                "type": "text",
                "identifier": "p",
                "name": "playlist id",
                "exampleValue": "15"
            }
        ]';

        $this->parameters['Search result'] =
        '[
            {
                "type": "text",
                "identifier": "s",
                "name": "search keyword",
                "exampleValue": "test"
            },
            {
                "type": "number",
                "identifier": "pa",
                "name": "page",
                "exampleValue": "1"
            }
        ]';
    }

    /**
     * Fetches the watch page of a video and extracts author, description and
     * publication time into the by-reference arguments.
     *
     * An output argument is only overwritten when its value was actually found
     * on the page; otherwise the value supplied by the caller is left untouched.
     *
     * @param string $vid    Video id appended to "watch?v=".
     * @param string $author Receives the text between '"author=' and the next '\u0026' of the page source.
     * @param string $desc   Receives the inner HTML of div#watch-description-text.
     * @param int    $time   Receives the Unix timestamp parsed from the datePublished meta tag.
     */
    private function ytBridgeQueryVideoInfo($vid, &$author, &$desc, &$time) {
        $html = $this->file_get_html($this->getURI() . "watch?v=$vid");
        if (!$html) {
            // The watch page could not be loaded: keep the caller's defaults.
            return;
        }

        // The author is embedded in the raw page source, delimited by the
        // literal markers '"author=' and '\u0026' (a JS-escaped ampersand).
        $source = $html->innertext;
        $start = strpos($source, '"author=');
        if ($start !== false) {
            $tail = substr($source, $start + 8);
            $end = strpos($tail, '\u0026');
            if ($end !== false) {
                $author = substr($tail, 0, $end);
            }
        }

        $descNode = $html->find('div#watch-description-text', 0);
        if ($descNode) {
            $desc = $descNode->innertext;
        }

        $dateNode = $html->find('meta[itemprop=datePublished]', 0);
        if ($dateNode) {
            $parsed = strtotime($dateNode->getAttribute('content'));
            if ($parsed !== false) {
                $time = $parsed;
            }
        }
    }

    /**
     * Builds an Item for one video and appends it to $this->items.
     *
     * @param string $vid    Video id; used for the item id, watch URI and thumbnail URI.
     * @param string $title  Item title.
     * @param string $author Item author.
     * @param string $desc   HTML description appended after the linked thumbnail.
     * @param int    $time   Item timestamp.
     */
    private function ytBridgeAddItem($vid, $title, $author, $desc, $time) {
        $item = new \Item();
        $item->id = $vid;
        $item->title = $title;
        $item->author = $author;
        $item->timestamp = $time;
        $item->uri = $this->getURI() . 'watch?v=' . $vid;
        // Thumbnails are addressed on the "img." host instead of "www.".
        $item->thumbnailUri = str_replace('/www.', '/img.', $this->getURI()) . 'vi/' . $vid . '/0.jpg';
        $item->content = '<a href="' . $item->uri . '"><img src="' . $item->thumbnailUri . '" /></a><br />' . $desc;
        $this->items[] = $item;
    }

    /**
     * Turns every <entry> of a parsed XML feed into an item and uses the feed
     * title as the request label.
     *
     * @param object $xml Parsed feed document exposing find().
     */
    private function ytBridgeParseXmlFeed($xml) {
        foreach ($xml->find('entry') as $element) {
            $title = $this->ytBridgeFixTitle($element->find('title', 0)->plaintext);
            $author = $element->find('name', 0)->plaintext;
            $desc = $element->find('media:description', 0)->innertext;
            $vid = str_replace('yt:video:', '', $element->find('id', 0)->plaintext);
            $time = strtotime($element->find('published', 0)->plaintext);
            $this->ytBridgeAddItem($vid, $title, $author, $desc, $time);
        }

        // Keep the previously set request label when the feed has no title.
        $feedTitle = $xml->find('feed > title', 0);
        if ($feedTitle) {
            $this->request = $this->ytBridgeFixTitle($feedTitle->plaintext);
        }
    }

    /**
     * Scrapes an HTML listing page and adds up to 10 videos as items.
     *
     * Entries titled '[Private Video]' are skipped and do not count towards
     * the limit. For every kept entry the watch page is queried for author,
     * description and time.
     *
     * @param object $html             Parsed listing document exposing find().
     * @param string $element_selector Selector matching one listing entry.
     * @param string $title_selector   Selector, relative to an entry, matching its title node.
     */
    private function ytBridgeParseHtmlListing($html, $element_selector, $title_selector) {
        $limit = 10;
        $count = 0;

        foreach ($html->find($element_selector) as $element) {
            if ($count >= $limit) {
                // Nothing more can be added; stop scanning the listing.
                break;
            }

            $link = $element->find('a', 0);
            $titleNode = $element->find($title_selector, 0);
            if (!$link || !$titleNode) {
                // Not a video entry (no link or no title): ignore it.
                continue;
            }

            $vid = str_replace('/watch?v=', '', $link->href);
            // Links may carry extra query parameters after the id (for example
            // "&list=...&index=..."); keep only the id itself.
            $amp = strpos($vid, '&');
            if ($amp !== false) {
                $vid = substr($vid, 0, $amp);
            }

            $title = $this->ytBridgeFixTitle($titleNode->plaintext);
            if ($title !== '[Private Video]') {
                $author = '';
                $desc = '';
                $time = 0;
                $this->ytBridgeQueryVideoInfo($vid, $author, $desc, $time);
                $this->ytBridgeAddItem($vid, $title, $author, $desc, $time);
                $count++;
            }
        }
    }

    /**
     * Trims a scraped title and decodes its HTML entities to UTF-8.
     *
     * @param string $title Raw title text.
     * @return string Decoded title.
     */
    private function ytBridgeFixTitle($title) {
        // Two passes: mb_convert_encoding() handles numeric entities such as
        // &#1234;, html_entity_decode() handles named ones such as &quot;.
        // NOTE(review): the 'HTML-ENTITIES' mbstring encoding is deprecated as
        // of PHP 8.2 - revisit when the minimum PHP version is raised.
        return html_entity_decode(mb_convert_encoding(trim($title), 'UTF-8', 'HTML-ENTITIES'));
    }

    /**
     * Collects items for the mode selected by the request parameters.
     *
     * Modes, in order of precedence: 'u' (username) or 'c' (channel id), which
     * try the XML feed first and fall back to the HTML listing; 'p' (playlist);
     * 's' (search, with optional page 'pa'). Reports an error through
     * returnError() when nothing can be fetched or no mode is given.
     *
     * returnError() is defined outside this file; each call is followed by a
     * return so that a failed fetch is never parsed if it does not halt.
     *
     * @param array $param Request parameters.
     */
    public function collectData(array $param) {
        $url_feed = '';
        $url_listing = '';

        if (isset($param['u'])) { /* User and Channel modes */
            $this->request = $param['u'];
            $url_feed = $this->getURI() . 'feeds/videos.xml?user=' . urlencode($this->request);
            $url_listing = $this->getURI() . 'user/' . urlencode($this->request) . '/videos';
        } else if (isset($param['c'])) {
            $this->request = $param['c'];
            $url_feed = $this->getURI() . 'feeds/videos.xml?channel_id=' . urlencode($this->request);
            $url_listing = $this->getURI() . 'channel/' . urlencode($this->request) . '/videos';
        }

        if (!empty($url_feed) && !empty($url_listing)) {
            if ($xml = $this->file_get_html($url_feed)) {
                $this->ytBridgeParseXmlFeed($xml);
            } else if ($html = $this->file_get_html($url_listing)) {
                $this->ytBridgeParseHtmlListing($html, 'li.channels-content-item', 'h3');
            } else {
                $this->returnError("Could not request YouTube. Tried:\n - $url_feed\n - $url_listing", 500);
            }
        } else if (isset($param['p'])) { /* playlist mode */
            $this->request = $param['p'];
            $url_listing = $this->getURI() . 'playlist?list=' . urlencode($this->request);
            $html = $this->file_get_html($url_listing);
            if (!$html) {
                $this->returnError("Could not request YouTube. Tried:\n - $url_listing", 500);
                return;
            }
            $this->ytBridgeParseHtmlListing($html, 'tr.pl-video', '.pl-video-title a');
            $this->request = 'Playlist: ' . str_replace(' - YouTube', '', $html->find('title', 0)->plaintext);
        } else if (isset($param['s'])) { /* search mode */
            $this->request = $param['s'];
            $page = 1;
            if (isset($param['pa'])) {
                // Keep digits only; an empty or zero result falls back to the first page.
                $page = max(1, (int) preg_replace('/[^0-9]/', '', $param['pa']));
            }
            $url_listing = $this->getURI() . 'results?search_query=' . urlencode($this->request)
                . '&page=' . $page . '&filters=video&search_sort=video_date_uploaded';
            $html = $this->file_get_html($url_listing);
            if (!$html) {
                $this->returnError("Could not request YouTube. Tried:\n - $url_listing", 500);
                return;
            }
            $this->ytBridgeParseHtmlListing($html, 'div.yt-lockup', 'h3');
            $this->request = 'Search: ' . str_replace(' - YouTube', '', $html->find('title', 0)->plaintext);
        } else { /* no valid mode */
            $this->returnError("You must either specify either:\n - YouTube username (?u=...)\n - Channel id (?c=...)\n - Playlist id (?p=...)\n - Search (?s=...)", 400);
        }
    }

    /**
     * Returns the bridge name, prefixed by the request label when one is set.
     *
     * @return string
     */
    public function getName() {
        return (!empty($this->request) ? $this->request . ' - ' : '') . 'YouTube Bridge';
    }

    /**
     * Returns the base URI every request URL is built from.
     *
     * @return string
     */
    public function getURI() {
        return 'https://www.youtube.com/';
    }

    /**
     * Returns the cache lifetime in seconds.
     *
     * @return int
     */
    public function getCacheDuration() {
        return 10800; // 3 hours
    }
}