From 0a35003237ec4a137117f438ab84d0a2a472aa75 Mon Sep 17 00:00:00 2001 From: Albirew Date: Sat, 21 May 2016 18:27:30 +0200 Subject: [PATCH] Added Bridge for Novel Updates contain dirty fix to bypass simpledom bug, see issue #259 for details --- bridges/NovelUpdatesBridge.php | 59 ++++++++++++++++++++++++++++++++++ 1 file changed, 59 insertions(+) create mode 100644 bridges/NovelUpdatesBridge.php diff --git a/bridges/NovelUpdatesBridge.php b/bridges/NovelUpdatesBridge.php new file mode 100644 index 0000000..f48e45d --- /dev/null +++ b/bridges/NovelUpdatesBridge.php @@ -0,0 +1,59 @@ +maintainer = "albirew"; + $this->name = "Novel Updates"; + $this->uri = "http://www.novelupdates.com/"; + $this->description = "Returns releases from Novel Updates"; + $this->update = "2016-05-21"; + $this->parameters[] = + '[ + { + "name" : "Novel URL", + "identifier" : "n" + } + ]'; + } + + public function collectData(array $param){ + if (!isset($param['n'])) + $this->returnError('You must specify the novel URL (/series/...)', 400); + $thread = parse_url($param['n']) or $this->returnError('This URL seems malformed, please check it.', 400); + if($thread['host'] !== 'www.novelupdates.com') + $this->returnError('NovelUpdates URL only.', 400); + if(strpos($thread['path'], 'series/') === FALSE) + $this->returnError('You must specify the novel URL.', 400); + $url = 'http://www.novelupdates.com'.$thread['path'].''; + $fullhtml = file_get_html($url) or $this->returnError("Could not request NovelUpdates, novel not found", 404); + $this->request = $fullhtml->find('h4.seriestitle', 0)->plaintext; + // dirty fix for nasty simpledom bug: https://github.com/sebsauvage/rss-bridge/issues/259 + // forcefully removes tbody + $html = $fullhtml->find('table#myTable', 0)->innertext; + $html = stristr($html, ''); //strip thead + $html = stristr($html, ''); //remove tbody + $html = str_get_html(stristr($html, '', true)); //remove last tbody and get back as an array + foreach($html->find('tr') as $element){ + $item = new \Item(); + $item->uri = $element->find('td', 2)->find('a', 0)->href; + $item->title = $element->find('td', 2)->find('a', 0)->plaintext; + $item->team = $element->find('td', 1)->innertext; + $item->timestamp = strtotime($element->find('td', 0)->plaintext); + $item->content = ''.$this->request.' - '.$item->title.' by '.$item->team.'
'.$fullhtml->find('div.seriesimg', 0)->innertext.''; + $this->items[] = $item; + } + } + public function getName(){ + return (!empty($this->request) ? $this->request.' - ' : '') .'Novel Updates'; + } + public function getURI(){ + return 'http://www.novelupdates.com/'; + } + public function getDescription(){ + return "Novel Updates - Directory of Translated Novels"; + } + public function getCacheDuration(){ + return 21600; // 6 hours + } +}