summaryrefslogtreecommitdiff
path: root/bridges/ReporterreBridge.php
blob: db1104c11ebe65b6674821ddaea6c792813be7f8 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
<?php
class ReporterreBridge extends BridgeAbstract {

		const MAINTAINER = 'nyutag';
		const NAME = 'Reporterre Bridge';
		const URI = 'http://www.reporterre.net/';
		const DESCRIPTION = 'Returns the newest articles.';

		private function extractContent($url){
			$html2 = getSimpleHTMLDOM($url);

			foreach($html2->find('div[style=text-align:justify]') as $e) {
				$text = $e->outertext;
			}

			$html2->clear();
			unset($html2);

			// Replace all relative urls with absolute ones
			$text = preg_replace(
				'/(href|src)(\=[\"\'])(?!http)([^"\']+)/ims',
				"$1$2" . self::URI . "$3",
				$text
			);

			$text = strip_tags($text, '<p><br><a><img>');
			return $text;
		}

	public function collectData(){
		$html = getSimpleHTMLDOM(self::URI . 'spip.php?page=backend')
			or returnServerError('Could not request Reporterre.');
		$limit = 0;

		foreach($html->find('item') as $element) {
			if($limit < 5) {
				$item = array();
				$item['title'] = html_entity_decode($element->find('title', 0)->plaintext);
				$item['timestamp'] = strtotime($element->find('dc:date', 0)->plaintext);
				$item['uri'] = $element->find('guid', 0)->innertext;
				$item['content'] = html_entity_decode($this->extractContent($item['uri']));
				$this->items[] = $item;
				$limit++;
			}
		}
	}
}