From 2500d0df9329cddfe8c07b49036c42561e784f51 Mon Sep 17 00:00:00 2001
From: logmanoriginal
Date: Sun, 9 Apr 2017 23:26:35 +0200
Subject: [PATCH] [PinterestBridge] Fix implementation after DOM changes
Due to breaking DOM changes this bridge required re-implementation.
With this fix the brige will make use of the JSON data embedded in
the returned HTML. The content returned for all contexts is similar
with only a few differences due to limitations of the JSON.
Feeds returned for a given username and board will by default make
use of the provided RSS feed instead of using the custom filter.
This bahaviour can be changed by setting the optional parameter
'&r=off' (on by default)
Notice: The JSON data for userdata and search results is very
different, so two functions were implemented to account for that.
References #498
---
bridges/PinterestBridge.php | 148 +++++++++++++++++++++++-------------
1 file changed, 95 insertions(+), 53 deletions(-)
diff --git a/bridges/PinterestBridge.php b/bridges/PinterestBridge.php
index 6898979..7597c43 100644
--- a/bridges/PinterestBridge.php
+++ b/bridges/PinterestBridge.php
@@ -1,9 +1,9 @@
array(
'name' => 'board',
'required' => true
+ ),
+ 'r' => array(
+ 'name' => 'Use provided RSS',
+ 'type' => 'checkbox',
+ 'required' => false,
+ 'defaultValue' => 'checked',
+ 'title' => 'Uncheck to return data via custom filters (more data)'
)
),
'From search' => array(
@@ -26,81 +33,116 @@ class PinterestBridge extends BridgeAbstract {
);
public function collectData(){
- $html = getSimpleHTMLDOM($this->getURI());
- if(!$html){
- switch($this->queriedContext){
+ switch($this->queriedContext){
case 'By username and board':
- returnServerError('Username and/or board not found');
+ if($this->getInput('r')){
+ $this->collectExpandableDatas($this->getURI() . '.rss');
+ } else {
+ $html = getSimpleHTMLDOMCached($this->getURI());
+ $this->getUserResults($html);
+ }
+ break;
case 'From search':
- returnServerError('Could not request Pinterest.');
- }
+ default:
+ $html = getSimpleHTMLDOMCached($this->getURI());
+ $this->getSearchResults($html);
}
+ }
- if($this->queriedContext === 'From search'){
- foreach($html->find('div.pinWrapper') as $div){
- $item = array();
+ private function getUserResults($html){
+ $json = json_decode($html->find('#jsInit1', 0)->innertext, true);
+ $results = $json['tree']['children'][0]['children'][0]['children'][0]['options']['props']['data']['board_feed'];
+ $username = $json['resourceDataCache'][0]['data']['owner']['username'];
+ $fullname = $json['resourceDataCache'][0]['data']['owner']['full_name'];
+ $avatar = $json['resourceDataCache'][0]['data']['owner']['image_small_url'];
- $a = $div->find('a.pinImageWrapper', 0);
- $img = $a->find('img', 0);
+ foreach($results as $result){
+ $item = array();
- $item['uri'] = $this->getURI() . $a->getAttribute('href');
- $item['content'] = '';
+ $item['uri'] = $result['link'];
- $avatar = $div->find('div.creditImg', 0)->find('img', 0);
- $avatar = $avatar->getAttribute('data-src');
- $avatar = str_replace("\\", "", $avatar);
+ // Some use regular titles, others provide 'advanced' infos, a few
+ // provide even less info. Thus we attempt multiple options.
+ $item['title'] = trim($result['title']);
- $username = $div->find('div.creditName', 0);
- $board = $div->find('div.creditTitle', 0);
+ if($item['title'] === "")
+ $item['title'] = trim($result['rich_summary']['display_name']);
- $item['username'] = $username->innertext;
- $item['fullname'] = $board->innertext;
- $item['avatar'] = $avatar;
+ if($item['title'] === "")
+ $item['title'] = trim($result['description']);
- $item['content'] .= '
'
+ . '" />'
. $item['username']
- . '
'
- . $item['fullname'];
+ . '
'
+ . $item['fullname']
+ . '
'
+ . $result['description']
+ . '
';
- $item['title'] = $img->getAttribute('alt');
- $this->items[] = $item;
- }
- } elseif($this->queriedContext === 'By username and board'){
- $container = $html->find('SCRIPT[type="application/ld+json"]', 0)
- or returnServerError('Unable to find data container!');
+ $item['enclosures'] = array($result['images']['orig']['url']);
- $json = json_decode($container->innertext, true);
+ $this->items[] = $item;
+ }
+ }
- foreach($json['itemListElement'] as $element){
- $item = array();
+ private function getSearchResults($html){
+ $json = json_decode($html->find('#jsInit1', 0)->innertext, true);
+ $results = $json['resourceDataCache'][0]['data']['results'];
- $item['uri'] = $element['item']['sharedContent']['author']['url'];
- $item['title'] = $element['item']['name'];
- $item['author'] = $element['item']['user']['name'];
- $item['timestamp'] = strtotime($element['item']['datePublished']);
- $item['content'] = <<
-
-
-{$element['item']['text']}
-EOD;
+ foreach($results as $result){
+ $item = array();
- $this->items[] = $item;
- }
+ $item['uri'] = self::URI . $result['board']['url'];
+
+ // Some use regular titles, others provide 'advanced' infos, a few
+ // provide even less info. Thus we attempt multiple options.
+ $item['title'] = trim($result['title']);
+
+ if($item['title'] === "")
+ $item['title'] = trim($result['rich_summary']['display_name']);
+
+ if($item['title'] === "")
+ $item['title'] = trim($result['grid_description']);
+
+ $item['timestamp'] = strtotime($result['created_at']);
+ $item['username'] = $result['pinner']['username'];
+ $item['fullname'] = $result['pinner']['full_name'];
+ $item['avatar'] = $result['pinner']['image_small_url'];
+ $item['author'] = $item['username'] . ' (' . $item['fullname'] . ')';
+ $item['content'] = ''
+ . $item['username']
+ . '
'
+ . $item['fullname']
+ . '
'
+ . $result['description']
+ . '
';
+
+ $item['enclosures'] = array($result['images']['orig']['url']);
+
+ $this->items[] = $item;
}
}
public function getURI(){
switch($this->queriedContext){
case 'By username and board':
- $uri = self::URI . urlencode($this->getInput('u')) . '/' . urlencode($this->getInput('b'));
+ $uri = self::URI . '/' . urlencode($this->getInput('u')) . '/' . urlencode($this->getInput('b'));// . '.rss';
break;
case 'From search':
- $uri = self::URI . 'search/?q=' . urlencode($this->getInput('q'));
+ $uri = self::URI . '/search/?q=' . urlencode($this->getInput('q'));
break;
default: return parent::getURI();
}
@@ -110,7 +152,7 @@ EOD;
public function getName(){
switch($this->queriedContext){
case 'By username and board':
- $specific = $this->getInput('u') . '-' . $this->getInput('b');
+ $specific = $this->getInput('u') . ' - ' . $this->getInput('b');
break;
case 'From search':
$specific = $this->getInput('q');