diff options
Diffstat (limited to 'bridges/GoogleSearchBridge.php')
-rw-r--r-- | bridges/GoogleSearchBridge.php | 64 |
1 files changed, 64 insertions, 0 deletions
diff --git a/bridges/GoogleSearchBridge.php b/bridges/GoogleSearchBridge.php new file mode 100644 index 0000000..2eb5841 --- /dev/null +++ b/bridges/GoogleSearchBridge.php @@ -0,0 +1,64 @@ +<?php +/** +* Returns the 100 most recent links in results in past year, sorting by date (most recent first). +* Example: +* http://www.google.com/search?q=sebsauvage&num=100&complete=0&tbs=qdr:y,sbd:1 +* complete=0&num=100 : get 100 results +* qdr:y : in past year +* sbd:1 : sort by date (will only work if qdr: is specified) +*/ +class GoogleSearchBridge extends BridgeAbstract { + + const MAINTAINER = 'sebsauvage'; + const NAME = 'Google search'; + const URI = 'https://www.google.com/'; + const CACHE_TIMEOUT = 1800; // 30min + const DESCRIPTION = 'Returns most recent results from Google search.'; + + const PARAMETERS = array(array( + 'q' => array( + 'name' => 'keyword', + 'required' => true + ) + )); + + public function collectData(){ + $html = ''; + + $html = getSimpleHTMLDOM(self::URI + . 'search?q=' + . urlencode($this->getInput('q')) + .'&num=100&complete=0&tbs=qdr:y,sbd:1') + or returnServerError('No results for this query.'); + + $emIsRes = $html->find('div[id=ires]', 0); + + if(!is_null($emIsRes)) { + foreach($emIsRes->find('div[class=g]') as $element) { + + $item = array(); + + // Extract direct URL from google href (eg. /url?q=...) + $t = $element->find('a[href]', 0)->href; + $item['uri'] = '' . $t; + parse_str(parse_url($t, PHP_URL_QUERY), $parameters); + if(isset($parameters['q'])) { + $item['uri'] = $parameters['q']; + } + + $item['title'] = $element->find('h3', 0)->plaintext; + $item['content'] = $element->find('span[class=st]', 0)->plaintext; + + $this->items[] = $item; + } + } + } + + public function getName(){ + if(!is_null($this->getInput('q'))) { + return $this->getInput('q') . ' - Google search'; + } + + return parent::getName(); + } +} |