aboutsummaryrefslogtreecommitdiff
path: root/lib/FormatAbstract.php
blob: 7a4c6c92e7ed2912a115a6a8ae5a4b9dc7be7bd5 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
<?php

/**
 * This file is part of RSS-Bridge, a PHP project capable of generating RSS and
 * Atom feeds for websites that don't have one.
 *
 * For the full license information, please view the UNLICENSE file distributed
 * with this source code.
 *
 * @package Core
 * @license https://unlicense.org/ UNLICENSE
 * @link    https://github.com/rss-bridge/rss-bridge
 */

/**
 * An abstract class for format implementations
 *
 * This class implements {@see FormatInterface}
 */
abstract class FormatAbstract implements FormatInterface
{
    /** The default charset (UTF-8), used when no charset has been set explicitly */
    const DEFAULT_CHARSET = 'UTF-8';

    /** MIME type of format output; concrete formats may redefine this constant */
    const MIME_TYPE = 'text/plain';

    /** @var string|null $charset The charset, or null while none has been set */
    protected $charset;

    /** @var array|null $items The items, or null until {@see setItems()} is called */
    protected $items;

    /**
     * @var int $lastModified A timestamp to indicate the last modified time of
     * the output data.
     */
    protected $lastModified;

    /** @var array|null $extraInfos The extra infos, or null until first set or read */
    protected $extraInfos;

    /**
     * {@inheritdoc}
     *
     * The constant is resolved with late static binding, so a subclass that
     * redefines MIME_TYPE is honoured without overriding this method.
     *
     * @return string The MIME type of the format output
     */
    public function getMimeType()
    {
        return static::MIME_TYPE;
    }

    /**
     * {@inheritdoc}
     *
     * @param string $charset {@inheritdoc}
     * @return self The current instance, to allow method chaining
     */
    public function setCharset($charset)
    {
        $this->charset = $charset;

        return $this;
    }

    /**
     * {@inheritdoc}
     *
     * @return string The charset previously set, or DEFAULT_CHARSET (resolved
     * with late static binding) when none has been set
     */
    public function getCharset()
    {
        return $this->charset ?? static::DEFAULT_CHARSET;
    }

    /**
     * Set the last modified time
     *
     * @param int $lastModified The last modified time
     * @return void
     */
    public function setLastModified($lastModified)
    {
        $this->lastModified = $lastModified;
    }

    /**
     * {@inheritdoc}
     *
     * @param array $items {@inheritdoc}
     * @return self The current instance, to allow method chaining
     */
    public function setItems(array $items)
    {
        $this->items = $items;

        return $this;
    }

    /**
     * {@inheritdoc}
     *
     * @return array The items previously stored with {@see setItems()}
     * @throws \LogicException If no items have been set yet
     */
    public function getItems()
    {
        // The property stays null until setItems() runs; refuse to hand out
        // anything that is not an array.
        if (!is_array($this->items)) {
            throw new \LogicException('Feed the ' . get_class($this) . ' with "setItems" method before !');
        }

        return $this->items;
    }

    /**
     * {@inheritdoc}
     *
     * The keys "name", "uri", "icon" and "donationUri" are guaranteed to exist
     * afterwards: any of them that is missing or null is set to an empty
     * string. All other entries are stored unchanged.
     *
     * @param array $extraInfos {@inheritdoc}
     * @return self The current instance, to allow method chaining
     */
    public function setExtraInfos(array $extraInfos = [])
    {
        foreach (['name', 'uri', 'icon', 'donationUri'] as $infoName) {
            // isset() is deliberate: it also treats an explicit null as absent.
            if (!isset($extraInfos[$infoName])) {
                $extraInfos[$infoName] = '';
            }
        }

        $this->extraInfos = $extraInfos;

        return $this;
    }

    /**
     * {@inheritdoc}
     *
     * @return array The extra infos; initialised with the default (empty
     * string) entries on first access if none were set before
     */
    public function getExtraInfos()
    {
        if ($this->extraInfos === null) { // No extra info ?
            $this->setExtraInfos(); // Define with default value
        }

        return $this->extraInfos;
    }

    /**
     * Sanitize HTML while leaving it functional.
     *
     * Keeps HTML as-is (with clickable hyperlinks) while reducing annoying and
     * potentially dangerous things. Every opening "<script", "<iframe" and
     * "<link" sequence gets a zero-width non-joiner entity inserted after the
     * "<", which stops it from being parsed as that tag while leaving it
     * visible. Matching is case-insensitive; a matched tag name is written
     * back in lower case.
     *
     * @param string $html The HTML content
     * @return string The sanitized HTML content
     *
     * @todo This belongs into `html.php`
     * @todo Maybe switch to http://htmlpurifier.org/
     * @todo Maybe switch to http://www.bioinformatics.org/phplabware/internal_utilities/htmLawed/index.php
     */
    protected function sanitizeHtml(string $html): string
    {
        // HTML tag names are case-insensitive, so "<SCRIPT" or "<IFrame" must be
        // neutralised exactly like their lower-case spellings; a case-sensitive
        // replace would let them through untouched.
        // We leave alone object and embed so that videos can play in RSS readers.
        return str_ireplace(
            ['<script', '<iframe', '<link'],
            ['<&zwnj;script', '<&zwnj;iframe', '<&zwnj;link'],
            $html
        );
    }
}