123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110 |
- <?php
- class UsbekEtRicaBridge extends BridgeAbstract {
- const MAINTAINER = 'logmanoriginal';
- const NAME = 'Usbek & Rica Bridge';
- const URI = 'https://usbeketrica.com';
- const DESCRIPTION = 'Returns latest articles from the front page';
- const PARAMETERS = array(
- array(
- 'limit' => array(
- 'name' => 'Number of articles to return',
- 'type' => 'number',
- 'required' => false,
- 'title' => 'Specifies the maximum number of articles to return',
- 'defaultValue' => -1
- ),
- 'fullarticle' => array(
- 'name' => 'Load full article',
- 'type' => 'checkbox',
- 'required' => false,
- 'title' => 'Activate to load full articles',
- )
- )
- );
- public function collectData(){
- $limit = $this->getInput('limit');
- $fullarticle = $this->getInput('fullarticle');
- $html = getSimpleHTMLDOM($this->getURI());
- $articles = $html->find('div.details');
- foreach($articles as $article) {
- $item = array();
- $title = $article->find('div.card-title', 0);
- if($title) {
- $item['title'] = $title->plaintext;
- } else {
- // Sometimes we get rubbish, ignore.
- continue;
- }
- $author = $article->find('div.author span', 0);
- if($author) {
- $item['author'] = $author->plaintext;
- }
- $uri = $article->find('a.read', 0)->href;
- if(substr($uri, 0, 1) === 'h') { // absolute uri
- $item['uri'] = $uri;
- } else { // relative uri
- $item['uri'] = $this->getURI() . $uri;
- }
- if($fullarticle) {
- $content = $this->loadFullArticle($item['uri']);
- }
- if($fullarticle && !is_null($content)) {
- $item['content'] = $content;
- } else {
- $excerpt = $article->find('div.card-excerpt', 0);
- if($excerpt) {
- $item['content'] = $excerpt->plaintext;
- }
- }
- $image = $article->find('div.card-img img', 0);
- if($image) {
- $item['enclosures'] = array(
- $image->src
- );
- }
- $this->items[] = $item;
- if($limit > 0 && count($this->items) >= $limit) {
- break;
- }
- }
- }
- /**
- * Loads the full article and returns the contents
- * @param $uri The article URI
- * @return The article content
- */
- private function loadFullArticle($uri){
- $html = getSimpleHTMLDOMCached($uri);
- $content = $html->find('section.main', 0);
- if($content) {
- return $this->replaceUriInHtmlElement($content);
- }
- return null;
- }
- /**
- * Replaces all relative URIs with absolute ones
- * @param $element A simplehtmldom element
- * @return The $element->innertext with all URIs replaced
- */
- private function replaceUriInHtmlElement($element){
- return str_replace('href="/', 'href="' . $this->getURI() . '/', $element->innertext);
- }
- }
|