summaryrefslogtreecommitdiff
path: root/bridges/GoogleSearchBridge.php
blob: 2eb5841184ae885f55598b2cc048580332021135 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
<?php
/**
* Returns the 100 most recent links from the search results of the past year, sorted by date (most recent first).
* Example:
* http://www.google.com/search?q=sebsauvage&num=100&complete=0&tbs=qdr:y,sbd:1
*    complete=0&num=100 : get 100 results
*    qdr:y : in past year
*    sbd:1 : sort by date (will only work if qdr: is specified)
*/
class GoogleSearchBridge extends BridgeAbstract {

	const MAINTAINER = 'sebsauvage';
	const NAME = 'Google search';
	const URI = 'https://www.google.com/';
	const CACHE_TIMEOUT = 1800; // 30min
	const DESCRIPTION = 'Returns most recent results from Google search.';

	// Single parameter context: one required input 'q' (labelled "keyword").
	const PARAMETERS = array(array(
		'q' => array(
			'name' => 'keyword',
			'required' => true
		)
	));

	/**
	 * Fetches the Google result page for the 'q' input and appends one item
	 * (keys: uri, title, content) to $this->items for every usable
	 * div[class=g] block found inside div[id=ires].
	 *
	 * Result blocks that have no anchor or no h3 heading are skipped, and a
	 * missing span[class=st] snippet yields an empty 'content', instead of
	 * dereferencing a null node.
	 *
	 * returnServerError() is invoked when getSimpleHTMLDOM() returns a falsy
	 * value.
	 */
	public function collectData(){
		$html = getSimpleHTMLDOM(self::URI
		. 'search?q='
		. urlencode($this->getInput('q'))
		. '&num=100&complete=0&tbs=qdr:y,sbd:1')
			or returnServerError('No results for this query.');

		$emIsRes = $html->find('div[id=ires]', 0);

		// No result container on the page: nothing to collect.
		if(is_null($emIsRes)) {
			return;
		}

		foreach($emIsRes->find('div[class=g]') as $element) {
			$link = $element->find('a[href]', 0);
			$heading = $element->find('h3', 0);

			// find(..., 0) yields null when nothing matches; a block without
			// a link or a title cannot become a meaningful feed item.
			if(is_null($link) || is_null($heading)) {
				continue;
			}

			$item = array();

			// Extract direct URL from google href (eg. /url?q=...)
			$href = '' . $link->href;
			$item['uri'] = $href;

			// parse_url() gives null (no query string) or false (malformed
			// URL); only a real string may be handed to parse_str().
			$query = parse_url($href, PHP_URL_QUERY);
			if(is_string($query)) {
				parse_str($query, $parameters);
				if(isset($parameters['q'])) {
					$item['uri'] = $parameters['q'];
				}
			}

			$item['title'] = $heading->plaintext;

			// The snippet is optional; fall back to an empty description.
			$snippet = $element->find('span[class=st]', 0);
			$item['content'] = is_null($snippet) ? '' : $snippet->plaintext;

			$this->items[] = $item;
		}
	}

	/**
	 * Returns "<keyword> - Google search" when the 'q' input is set,
	 * otherwise defers to the parent implementation.
	 */
	public function getName(){
		if(!is_null($this->getInput('q'))) {
			return $this->getInput('q') . ' - Google search';
		}

		return parent::getName();
	}
}