aboutsummaryrefslogtreecommitdiff
path: root/bridges/ReporterreBridge.php
blob: 78c60d5f599a019eb99af2f1cd4610d5963c998d (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
<?php

/**
 * See https://reporterre.net/spip.php?page=backend-simple
 */
class ReporterreBridge extends BridgeAbstract
{
    const MAINTAINER = 'nyutag';
    const NAME = 'Reporterre Bridge';
    const URI = 'https://www.reporterre.net/';
    const DESCRIPTION = 'Returns the newest articles. See also their official feed https://reporterre.net/spip.php?page=backend-simple';

    public function collectData()
    {
        //$url = self::URI . 'spip.php?page=backend';
        $url = self::URI . 'spip.php?page=backend-simple';
        $html = getSimpleHTMLDOM($url);
        $limit = 0;

        foreach ($html->find('item') as $element) {
            if ($limit < 5) {
                $item = [];
                $item['title'] = html_entity_decode($element->find('title', 0)->plaintext);
                $item['timestamp'] = strtotime($element->find('dc:date', 0)->plaintext);
                $item['uri'] = $element->find('guid', 0)->innertext;
                //$item['content'] = html_entity_decode($this->extractContent($item['uri']));
                $item['content'] = htmlspecialchars_decode($element->find('description', 0)->plaintext);
                $this->items[] = $item;
                $limit++;
            }
        }
    }

    private function extractContent($url)
    {
        $html2 = getSimpleHTMLDOM($url);
        $html2 = defaultLinkTo($html2, self::URI);

        foreach ($html2->find('div[style=text-align:justify]') as $e) {
            $text = $e->outertext;
        }

        $html2->clear();
        unset($html2);

        $text = strip_tags($text, '<p><br><a><img>');
        return $text;
    }
}