1<?php
2
3/**
4 * SimplePie
5 *
6 * A PHP-Based RSS and Atom Feed Framework.
7 * Takes the hard work out of managing a complete RSS/Atom solution.
8 *
9 * Copyright (c) 2004-2022, Ryan Parman, Sam Sneddon, Ryan McCue, and contributors
10 * All rights reserved.
11 *
12 * Redistribution and use in source and binary forms, with or without modification, are
13 * permitted provided that the following conditions are met:
14 *
15 * 	* Redistributions of source code must retain the above copyright notice, this list of
16 * 	  conditions and the following disclaimer.
17 *
18 * 	* Redistributions in binary form must reproduce the above copyright notice, this list
19 * 	  of conditions and the following disclaimer in the documentation and/or other materials
20 * 	  provided with the distribution.
21 *
22 * 	* Neither the name of the SimplePie Team nor the names of its contributors may be used
23 * 	  to endorse or promote products derived from this software without specific prior
24 * 	  written permission.
25 *
26 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS
27 * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY
28 * AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS
29 * AND CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
30 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
31 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
32 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
33 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
34 * POSSIBILITY OF SUCH DAMAGE.
35 *
36 * @package SimplePie
37 * @copyright 2004-2016 Ryan Parman, Sam Sneddon, Ryan McCue
38 * @author Ryan Parman
39 * @author Sam Sneddon
40 * @author Ryan McCue
41 * @link http://simplepie.org/ SimplePie
42 * @license http://www.opensource.org/licenses/bsd-license.php BSD License
43 */
44
45namespace SimplePie;
46
47use SimplePie\XML\Declaration\Parser as DeclarationParser;
48
49/**
50 * Parses XML into something sane
51 *
52 *
53 * This class can be overloaded with {@see \SimplePie\SimplePie::set_parser_class()}
54 *
55 * @package SimplePie
56 * @subpackage Parsing
57 */
58class Parser implements RegistryAware
59{
60    public $error_code;
61    public $error_string;
62    public $current_line;
63    public $current_column;
64    public $current_byte;
65    public $separator = ' ';
66    public $namespace = [''];
67    public $element = [''];
68    public $xml_base = [''];
69    public $xml_base_explicit = [false];
70    public $xml_lang = [''];
71    public $data = [];
72    public $datas = [[]];
73    public $current_xhtml_construct = -1;
74    public $encoding;
75    protected $registry;
76
77    public function set_registry(\SimplePie\Registry $registry)/* : void */
78    {
79        $this->registry = $registry;
80    }
81
82    public function parse(&$data, $encoding, $url = '')
83    {
84        if (class_exists('DOMXpath') && function_exists('Mf2\parse')) {
85            $doc = new \DOMDocument();
86            @$doc->loadHTML($data);
87            $xpath = new \DOMXpath($doc);
88            // Check for both h-feed and h-entry, as both a feed with no entries
89            // and a list of entries without an h-feed wrapper are both valid.
90            $query = '//*[contains(concat(" ", @class, " "), " h-feed ") or '.
91                'contains(concat(" ", @class, " "), " h-entry ")]';
92            $result = $xpath->query($query);
93            if ($result->length !== 0) {
94                return $this->parse_microformats($data, $url);
95            }
96        }
97
98        // Use UTF-8 if we get passed US-ASCII, as every US-ASCII character is a UTF-8 character
99        if (strtoupper($encoding) === 'US-ASCII') {
100            $this->encoding = 'UTF-8';
101        } else {
102            $this->encoding = $encoding;
103        }
104
105        // Strip BOM:
106        // UTF-32 Big Endian BOM
107        if (substr($data, 0, 4) === "\x00\x00\xFE\xFF") {
108            $data = substr($data, 4);
109        }
110        // UTF-32 Little Endian BOM
111        elseif (substr($data, 0, 4) === "\xFF\xFE\x00\x00") {
112            $data = substr($data, 4);
113        }
114        // UTF-16 Big Endian BOM
115        elseif (substr($data, 0, 2) === "\xFE\xFF") {
116            $data = substr($data, 2);
117        }
118        // UTF-16 Little Endian BOM
119        elseif (substr($data, 0, 2) === "\xFF\xFE") {
120            $data = substr($data, 2);
121        }
122        // UTF-8 BOM
123        elseif (substr($data, 0, 3) === "\xEF\xBB\xBF") {
124            $data = substr($data, 3);
125        }
126
127        if (substr($data, 0, 5) === '<?xml' && strspn(substr($data, 5, 1), "\x09\x0A\x0D\x20") && ($pos = strpos($data, '?>')) !== false) {
128            $declaration = $this->registry->create(DeclarationParser::class, [substr($data, 5, $pos - 5)]);
129            if ($declaration->parse()) {
130                $data = substr($data, $pos + 2);
131                $data = '<?xml version="' . $declaration->version . '" encoding="' . $encoding . '" standalone="' . (($declaration->standalone) ? 'yes' : 'no') . '"?>' ."\n". $this->declare_html_entities() . $data;
132            } else {
133                $this->error_string = 'SimplePie bug! Please report this!';
134                return false;
135            }
136        }
137
138        $return = true;
139
140        static $xml_is_sane = null;
141        if ($xml_is_sane === null) {
142            $parser_check = xml_parser_create();
143            xml_parse_into_struct($parser_check, '<foo>&amp;</foo>', $values);
144            xml_parser_free($parser_check);
145            $xml_is_sane = isset($values[0]['value']);
146        }
147
148        // Create the parser
149        if ($xml_is_sane) {
150            $xml = xml_parser_create_ns($this->encoding, $this->separator);
151            xml_parser_set_option($xml, XML_OPTION_SKIP_WHITE, 1);
152            xml_parser_set_option($xml, XML_OPTION_CASE_FOLDING, 0);
153            xml_set_character_data_handler($xml, [$this, 'cdata']);
154            xml_set_element_handler($xml, [$this, 'tag_open'], [$this, 'tag_close']);
155
156            // Parse!
157            $wrapper = @is_writable(sys_get_temp_dir()) ? 'php://temp' : 'php://memory';
158            if (($stream = fopen($wrapper, 'r+')) &&
159                fwrite($stream, $data) &&
160                rewind($stream)) {
161                //Parse by chunks not to use too much memory
162                do {
163                    $stream_data = fread($stream, 1048576);
164                    if (!xml_parse($xml, $stream_data === false ? '' : $stream_data, feof($stream))) {
165                        $this->error_code = xml_get_error_code($xml);
166                        $this->error_string = xml_error_string($this->error_code);
167                        $return = false;
168                        break;
169                    }
170                } while (!feof($stream));
171                fclose($stream);
172            } else {
173                $return = false;
174            }
175
176            $this->current_line = xml_get_current_line_number($xml);
177            $this->current_column = xml_get_current_column_number($xml);
178            $this->current_byte = xml_get_current_byte_index($xml);
179            xml_parser_free($xml);
180            return $return;
181        }
182
183        libxml_clear_errors();
184        $xml = new \XMLReader();
185        $xml->xml($data);
186        while (@$xml->read()) {
187            switch ($xml->nodeType) {
188                case constant('XMLReader::END_ELEMENT'):
189                    if ($xml->namespaceURI !== '') {
190                        $tagName = $xml->namespaceURI . $this->separator . $xml->localName;
191                    } else {
192                        $tagName = $xml->localName;
193                    }
194                    $this->tag_close(null, $tagName);
195                    break;
196                case constant('XMLReader::ELEMENT'):
197                    $empty = $xml->isEmptyElement;
198                    if ($xml->namespaceURI !== '') {
199                        $tagName = $xml->namespaceURI . $this->separator . $xml->localName;
200                    } else {
201                        $tagName = $xml->localName;
202                    }
203                    $attributes = [];
204                    while ($xml->moveToNextAttribute()) {
205                        if ($xml->namespaceURI !== '') {
206                            $attrName = $xml->namespaceURI . $this->separator . $xml->localName;
207                        } else {
208                            $attrName = $xml->localName;
209                        }
210                        $attributes[$attrName] = $xml->value;
211                    }
212                    $this->tag_open(null, $tagName, $attributes);
213                    if ($empty) {
214                        $this->tag_close(null, $tagName);
215                    }
216                    break;
217                case constant('XMLReader::TEXT'):
218
219                case constant('XMLReader::CDATA'):
220                    $this->cdata(null, $xml->value);
221                    break;
222            }
223        }
224        if ($error = libxml_get_last_error()) {
225            $this->error_code = $error->code;
226            $this->error_string = $error->message;
227            $this->current_line = $error->line;
228            $this->current_column = $error->column;
229            return false;
230        }
231
232        return true;
233    }
234
235    public function get_error_code()
236    {
237        return $this->error_code;
238    }
239
240    public function get_error_string()
241    {
242        return $this->error_string;
243    }
244
245    public function get_current_line()
246    {
247        return $this->current_line;
248    }
249
250    public function get_current_column()
251    {
252        return $this->current_column;
253    }
254
255    public function get_current_byte()
256    {
257        return $this->current_byte;
258    }
259
260    public function get_data()
261    {
262        return $this->data;
263    }
264
265    public function tag_open($parser, $tag, $attributes)
266    {
267        [$this->namespace[], $this->element[]] = $this->split_ns($tag);
268
269        $attribs = [];
270        foreach ($attributes as $name => $value) {
271            [$attrib_namespace, $attribute] = $this->split_ns($name);
272            $attribs[$attrib_namespace][$attribute] = $value;
273        }
274
275        if (isset($attribs[\SimplePie\SimplePie::NAMESPACE_XML]['base'])) {
276            $base = $this->registry->call(Misc::class, 'absolutize_url', [$attribs[\SimplePie\SimplePie::NAMESPACE_XML]['base'], end($this->xml_base)]);
277            if ($base !== false) {
278                $this->xml_base[] = $base;
279                $this->xml_base_explicit[] = true;
280            }
281        } else {
282            $this->xml_base[] = end($this->xml_base);
283            $this->xml_base_explicit[] = end($this->xml_base_explicit);
284        }
285
286        if (isset($attribs[\SimplePie\SimplePie::NAMESPACE_XML]['lang'])) {
287            $this->xml_lang[] = $attribs[\SimplePie\SimplePie::NAMESPACE_XML]['lang'];
288        } else {
289            $this->xml_lang[] = end($this->xml_lang);
290        }
291
292        if ($this->current_xhtml_construct >= 0) {
293            $this->current_xhtml_construct++;
294            if (end($this->namespace) === \SimplePie\SimplePie::NAMESPACE_XHTML) {
295                $this->data['data'] .= '<' . end($this->element);
296                if (isset($attribs[''])) {
297                    foreach ($attribs[''] as $name => $value) {
298                        $this->data['data'] .= ' ' . $name . '="' . htmlspecialchars($value, ENT_COMPAT, $this->encoding) . '"';
299                    }
300                }
301                $this->data['data'] .= '>';
302            }
303        } else {
304            $this->datas[] = &$this->data;
305            $this->data = &$this->data['child'][end($this->namespace)][end($this->element)][];
306            $this->data = ['data' => '', 'attribs' => $attribs, 'xml_base' => end($this->xml_base), 'xml_base_explicit' => end($this->xml_base_explicit), 'xml_lang' => end($this->xml_lang)];
307            if ((end($this->namespace) === \SimplePie\SimplePie::NAMESPACE_ATOM_03 && in_array(end($this->element), ['title', 'tagline', 'copyright', 'info', 'summary', 'content']) && isset($attribs['']['mode']) && $attribs['']['mode'] === 'xml')
308            || (end($this->namespace) === \SimplePie\SimplePie::NAMESPACE_ATOM_10 && in_array(end($this->element), ['rights', 'subtitle', 'summary', 'info', 'title', 'content']) && isset($attribs['']['type']) && $attribs['']['type'] === 'xhtml')
309            || (end($this->namespace) === \SimplePie\SimplePie::NAMESPACE_RSS_20 && in_array(end($this->element), ['title']))
310            || (end($this->namespace) === \SimplePie\SimplePie::NAMESPACE_RSS_090 && in_array(end($this->element), ['title']))
311            || (end($this->namespace) === \SimplePie\SimplePie::NAMESPACE_RSS_10 && in_array(end($this->element), ['title']))) {
312                $this->current_xhtml_construct = 0;
313            }
314        }
315    }
316
317    public function cdata($parser, $cdata)
318    {
319        if ($this->current_xhtml_construct >= 0) {
320            $this->data['data'] .= htmlspecialchars($cdata, ENT_QUOTES, $this->encoding);
321        } else {
322            $this->data['data'] .= $cdata;
323        }
324    }
325
326    public function tag_close($parser, $tag)
327    {
328        if ($this->current_xhtml_construct >= 0) {
329            $this->current_xhtml_construct--;
330            if (end($this->namespace) === \SimplePie\SimplePie::NAMESPACE_XHTML && !in_array(end($this->element), ['area', 'base', 'basefont', 'br', 'col', 'frame', 'hr', 'img', 'input', 'isindex', 'link', 'meta', 'param'])) {
331                $this->data['data'] .= '</' . end($this->element) . '>';
332            }
333        }
334        if ($this->current_xhtml_construct === -1) {
335            $this->data = &$this->datas[count($this->datas) - 1];
336            array_pop($this->datas);
337        }
338
339        array_pop($this->element);
340        array_pop($this->namespace);
341        array_pop($this->xml_base);
342        array_pop($this->xml_base_explicit);
343        array_pop($this->xml_lang);
344    }
345
346    public function split_ns($string)
347    {
348        static $cache = [];
349        if (!isset($cache[$string])) {
350            if ($pos = strpos($string, $this->separator)) {
351                static $separator_length;
352                if (!$separator_length) {
353                    $separator_length = strlen($this->separator);
354                }
355                $namespace = substr($string, 0, $pos);
356                $local_name = substr($string, $pos + $separator_length);
357                if (strtolower($namespace) === \SimplePie\SimplePie::NAMESPACE_ITUNES) {
358                    $namespace = \SimplePie\SimplePie::NAMESPACE_ITUNES;
359                }
360
361                // Normalize the Media RSS namespaces
362                if ($namespace === \SimplePie\SimplePie::NAMESPACE_MEDIARSS_WRONG ||
363                    $namespace === \SimplePie\SimplePie::NAMESPACE_MEDIARSS_WRONG2 ||
364                    $namespace === \SimplePie\SimplePie::NAMESPACE_MEDIARSS_WRONG3 ||
365                    $namespace === \SimplePie\SimplePie::NAMESPACE_MEDIARSS_WRONG4 ||
366                    $namespace === \SimplePie\SimplePie::NAMESPACE_MEDIARSS_WRONG5) {
367                    $namespace = \SimplePie\SimplePie::NAMESPACE_MEDIARSS;
368                }
369                $cache[$string] = [$namespace, $local_name];
370            } else {
371                $cache[$string] = ['', $string];
372            }
373        }
374        return $cache[$string];
375    }
376
377    private function parse_hcard($data, $category = false)
378    {
379        $name = '';
380        $link = '';
381        // Check if h-card is set and pass that information on in the link.
382        if (isset($data['type']) && in_array('h-card', $data['type'])) {
383            if (isset($data['properties']['name'][0])) {
384                $name = $data['properties']['name'][0];
385            }
386            if (isset($data['properties']['url'][0])) {
387                $link = $data['properties']['url'][0];
388                if ($name === '') {
389                    $name = $link;
390                } else {
391                    // can't have commas in categories.
392                    $name = str_replace(',', '', $name);
393                }
394                $person_tag = $category ? '<span class="person-tag"></span>' : '';
395                return '<a class="h-card" href="'.$link.'">'.$person_tag.$name.'</a>';
396            }
397        }
398        return $data['value'] ?? '';
399    }
400
401    private function parse_microformats(&$data, $url)
402    {
403        $feed_title = '';
404        $feed_author = null;
405        $author_cache = [];
406        $items = [];
407        $entries = [];
408        $mf = \Mf2\parse($data, $url);
409        // First look for an h-feed.
410        $h_feed = [];
411        foreach ($mf['items'] as $mf_item) {
412            if (in_array('h-feed', $mf_item['type'])) {
413                $h_feed = $mf_item;
414                break;
415            }
416            // Also look for h-feed or h-entry in the children of each top level item.
417            if (!isset($mf_item['children'][0]['type'])) {
418                continue;
419            }
420            if (in_array('h-feed', $mf_item['children'][0]['type'])) {
421                $h_feed = $mf_item['children'][0];
422                // In this case the parent of the h-feed may be an h-card, so use it as
423                // the feed_author.
424                if (in_array('h-card', $mf_item['type'])) {
425                    $feed_author = $mf_item;
426                }
427                break;
428            } elseif (in_array('h-entry', $mf_item['children'][0]['type'])) {
429                $entries = $mf_item['children'];
430                // In this case the parent of the h-entry list may be an h-card, so use
431                // it as the feed_author.
432                if (in_array('h-card', $mf_item['type'])) {
433                    $feed_author = $mf_item;
434                }
435                break;
436            }
437        }
438        if (isset($h_feed['children'])) {
439            $entries = $h_feed['children'];
440            // Also set the feed title and store author from the h-feed if available.
441            if (isset($mf['items'][0]['properties']['name'][0])) {
442                $feed_title = $mf['items'][0]['properties']['name'][0];
443            }
444            if (isset($mf['items'][0]['properties']['author'][0])) {
445                $feed_author = $mf['items'][0]['properties']['author'][0];
446            }
447        } elseif (count($entries) === 0) {
448            $entries = $mf['items'];
449        }
450        for ($i = 0; $i < count($entries); $i++) {
451            $entry = $entries[$i];
452            if (in_array('h-entry', $entry['type'])) {
453                $item = [];
454                $title = '';
455                $description = '';
456                if (isset($entry['properties']['url'][0])) {
457                    $link = $entry['properties']['url'][0];
458                    if (isset($link['value'])) {
459                        $link = $link['value'];
460                    }
461                    $item['link'] = [['data' => $link]];
462                }
463                if (isset($entry['properties']['uid'][0])) {
464                    $guid = $entry['properties']['uid'][0];
465                    if (isset($guid['value'])) {
466                        $guid = $guid['value'];
467                    }
468                    $item['guid'] = [['data' => $guid]];
469                }
470                if (isset($entry['properties']['name'][0])) {
471                    $title = $entry['properties']['name'][0];
472                    if (isset($title['value'])) {
473                        $title = $title['value'];
474                    }
475                    $item['title'] = [['data' => $title]];
476                }
477                if (isset($entry['properties']['author'][0]) || isset($feed_author)) {
478                    // author is a special case, it can be plain text or an h-card array.
479                    // If it's plain text it can also be a url that should be followed to
480                    // get the actual h-card.
481                    $author = $entry['properties']['author'][0] ?? $feed_author;
482                    if (!is_string($author)) {
483                        $author = $this->parse_hcard($author);
484                    } elseif (strpos($author, 'http') === 0) {
485                        if (isset($author_cache[$author])) {
486                            $author = $author_cache[$author];
487                        } else {
488                            $mf = \Mf2\fetch($author);
489                            foreach ($mf['items'] as $hcard) {
490                                // Only interested in an h-card by itself in this case.
491                                if (!in_array('h-card', $hcard['type'])) {
492                                    continue;
493                                }
494                                // It must have a url property matching what we fetched.
495                                if (!isset($hcard['properties']['url']) ||
496                                        !(in_array($author, $hcard['properties']['url']))) {
497                                    continue;
498                                }
499                                // Save parse_hcard the trouble of finding the correct url.
500                                $hcard['properties']['url'][0] = $author;
501                                // Cache this h-card for the next h-entry to check.
502                                $author_cache[$author] = $this->parse_hcard($hcard);
503                                $author = $author_cache[$author];
504                                break;
505                            }
506                        }
507                    }
508                    $item['author'] = [['data' => $author]];
509                }
510                if (isset($entry['properties']['photo'][0])) {
511                    // If a photo is also in content, don't need to add it again here.
512                    $content = '';
513                    if (isset($entry['properties']['content'][0]['html'])) {
514                        $content = $entry['properties']['content'][0]['html'];
515                    }
516                    $photo_list = [];
517                    for ($j = 0; $j < count($entry['properties']['photo']); $j++) {
518                        $photo = $entry['properties']['photo'][$j];
519                        if (!empty($photo) && strpos($content, $photo) === false) {
520                            $photo_list[] = $photo;
521                        }
522                    }
523                    // When there's more than one photo show the first and use a lightbox.
524                    // Need a permanent, unique name for the image set, but don't have
525                    // anything unique except for the content itself, so use that.
526                    $count = count($photo_list);
527                    if ($count > 1) {
528                        $image_set_id = preg_replace('/[[:^alnum:]]/', '', $photo_list[0]);
529                        $description = '<p>';
530                        for ($j = 0; $j < $count; $j++) {
531                            $hidden = $j === 0 ? '' : 'class="hidden" ';
532                            $description .= '<a href="'.$photo_list[$j].'" '.$hidden.
533                                'data-lightbox="image-set-'.$image_set_id.'">'.
534                                '<img src="'.$photo_list[$j].'"></a>';
535                        }
536                        $description .= '<br><b>'.$count.' photos</b></p>';
537                    } elseif ($count == 1) {
538                        $description = '<p><img src="'.$photo_list[0].'"></p>';
539                    }
540                }
541                if (isset($entry['properties']['content'][0]['html'])) {
542                    // e-content['value'] is the same as p-name when they are on the same
543                    // element. Use this to replace title with a strip_tags version so
544                    // that alt text from images is not included in the title.
545                    if ($entry['properties']['content'][0]['value'] === $title) {
546                        $title = strip_tags($entry['properties']['content'][0]['html']);
547                        $item['title'] = [['data' => $title]];
548                    }
549                    $description .= $entry['properties']['content'][0]['html'];
550                    if (isset($entry['properties']['in-reply-to'][0])) {
551                        $in_reply_to = '';
552                        if (is_string($entry['properties']['in-reply-to'][0])) {
553                            $in_reply_to = $entry['properties']['in-reply-to'][0];
554                        } elseif (isset($entry['properties']['in-reply-to'][0]['value'])) {
555                            $in_reply_to = $entry['properties']['in-reply-to'][0]['value'];
556                        }
557                        if ($in_reply_to !== '') {
558                            $description .= '<p><span class="in-reply-to"></span> '.
559                                '<a href="'.$in_reply_to.'">'.$in_reply_to.'</a><p>';
560                        }
561                    }
562                    $item['description'] = [['data' => $description]];
563                }
564                if (isset($entry['properties']['category'])) {
565                    $category_csv = '';
566                    // Categories can also contain h-cards.
567                    foreach ($entry['properties']['category'] as $category) {
568                        if ($category_csv !== '') {
569                            $category_csv .= ', ';
570                        }
571                        if (is_string($category)) {
572                            // Can't have commas in categories.
573                            $category_csv .= str_replace(',', '', $category);
574                        } else {
575                            $category_csv .= $this->parse_hcard($category, true);
576                        }
577                    }
578                    $item['category'] = [['data' => $category_csv]];
579                }
580                if (isset($entry['properties']['published'][0])) {
581                    $timestamp = strtotime($entry['properties']['published'][0]);
582                    $pub_date = date('F j Y g:ia', $timestamp).' GMT';
583                    $item['pubDate'] = [['data' => $pub_date]];
584                }
585                // The title and description are set to the empty string to represent
586                // a deleted item (which also makes it an invalid rss item).
587                if (isset($entry['properties']['deleted'][0])) {
588                    $item['title'] = [['data' => '']];
589                    $item['description'] = [['data' => '']];
590                }
591                $items[] = ['child' => ['' => $item]];
592            }
593        }
594        // Mimic RSS data format when storing microformats.
595        $link = [['data' => $url]];
596        $image = '';
597        if (!is_string($feed_author) &&
598                isset($feed_author['properties']['photo'][0])) {
599            $image = [['child' => ['' => ['url' =>
600                [['data' => $feed_author['properties']['photo'][0]]]]]]];
601        }
602        // Use the name given for the h-feed, or get the title from the html.
603        if ($feed_title !== '') {
604            $feed_title = [['data' => htmlspecialchars($feed_title)]];
605        } elseif ($position = strpos($data, '<title>')) {
606            $start = $position < 200 ? 0 : $position - 200;
607            $check = substr($data, $start, 400);
608            $matches = [];
609            if (preg_match('/<title>(.+)<\/title>/', $check, $matches)) {
610                $feed_title = [['data' => htmlspecialchars($matches[1])]];
611            }
612        }
613        $channel = ['channel' => [['child' => ['' =>
614            ['link' => $link, 'image' => $image, 'title' => $feed_title,
615                  'item' => $items]]]]];
616        $rss = [['attribs' => ['' => ['version' => '2.0']],
617                           'child' => ['' => $channel]]];
618        $this->data = ['child' => ['' => ['rss' => $rss]]];
619        return true;
620    }
621
622    private function declare_html_entities()
623    {
624        // This is required because the RSS specification says that entity-encoded
625        // html is allowed, but the xml specification says they must be declared.
626        return '<!DOCTYPE html [ <!ENTITY nbsp "&#x00A0;"> <!ENTITY iexcl "&#x00A1;"> <!ENTITY cent "&#x00A2;"> <!ENTITY pound "&#x00A3;"> <!ENTITY curren "&#x00A4;"> <!ENTITY yen "&#x00A5;"> <!ENTITY brvbar "&#x00A6;"> <!ENTITY sect "&#x00A7;"> <!ENTITY uml "&#x00A8;"> <!ENTITY copy "&#x00A9;"> <!ENTITY ordf "&#x00AA;"> <!ENTITY laquo "&#x00AB;"> <!ENTITY not "&#x00AC;"> <!ENTITY shy "&#x00AD;"> <!ENTITY reg "&#x00AE;"> <!ENTITY macr "&#x00AF;"> <!ENTITY deg "&#x00B0;"> <!ENTITY plusmn "&#x00B1;"> <!ENTITY sup2 "&#x00B2;"> <!ENTITY sup3 "&#x00B3;"> <!ENTITY acute "&#x00B4;"> <!ENTITY micro "&#x00B5;"> <!ENTITY para "&#x00B6;"> <!ENTITY middot "&#x00B7;"> <!ENTITY cedil "&#x00B8;"> <!ENTITY sup1 "&#x00B9;"> <!ENTITY ordm "&#x00BA;"> <!ENTITY raquo "&#x00BB;"> <!ENTITY frac14 "&#x00BC;"> <!ENTITY frac12 "&#x00BD;"> <!ENTITY frac34 "&#x00BE;"> <!ENTITY iquest "&#x00BF;"> <!ENTITY Agrave "&#x00C0;"> <!ENTITY Aacute "&#x00C1;"> <!ENTITY Acirc "&#x00C2;"> <!ENTITY Atilde "&#x00C3;"> <!ENTITY Auml "&#x00C4;"> <!ENTITY Aring "&#x00C5;"> <!ENTITY AElig "&#x00C6;"> <!ENTITY Ccedil "&#x00C7;"> <!ENTITY Egrave "&#x00C8;"> <!ENTITY Eacute "&#x00C9;"> <!ENTITY Ecirc "&#x00CA;"> <!ENTITY Euml "&#x00CB;"> <!ENTITY Igrave "&#x00CC;"> <!ENTITY Iacute "&#x00CD;"> <!ENTITY Icirc "&#x00CE;"> <!ENTITY Iuml "&#x00CF;"> <!ENTITY ETH "&#x00D0;"> <!ENTITY Ntilde "&#x00D1;"> <!ENTITY Ograve "&#x00D2;"> <!ENTITY Oacute "&#x00D3;"> <!ENTITY Ocirc "&#x00D4;"> <!ENTITY Otilde "&#x00D5;"> <!ENTITY Ouml "&#x00D6;"> <!ENTITY times "&#x00D7;"> <!ENTITY Oslash "&#x00D8;"> <!ENTITY Ugrave "&#x00D9;"> <!ENTITY Uacute "&#x00DA;"> <!ENTITY Ucirc "&#x00DB;"> <!ENTITY Uuml "&#x00DC;"> <!ENTITY Yacute "&#x00DD;"> <!ENTITY THORN "&#x00DE;"> <!ENTITY szlig "&#x00DF;"> <!ENTITY agrave "&#x00E0;"> <!ENTITY aacute "&#x00E1;"> <!ENTITY acirc "&#x00E2;"> <!ENTITY atilde "&#x00E3;"> <!ENTITY auml "&#x00E4;"> <!ENTITY aring "&#x00E5;"> <!ENTITY aelig "&#x00E6;"> <!ENTITY ccedil "&#x00E7;"> <!ENTITY egrave 
"&#x00E8;"> <!ENTITY eacute "&#x00E9;"> <!ENTITY ecirc "&#x00EA;"> <!ENTITY euml "&#x00EB;"> <!ENTITY igrave "&#x00EC;"> <!ENTITY iacute "&#x00ED;"> <!ENTITY icirc "&#x00EE;"> <!ENTITY iuml "&#x00EF;"> <!ENTITY eth "&#x00F0;"> <!ENTITY ntilde "&#x00F1;"> <!ENTITY ograve "&#x00F2;"> <!ENTITY oacute "&#x00F3;"> <!ENTITY ocirc "&#x00F4;"> <!ENTITY otilde "&#x00F5;"> <!ENTITY ouml "&#x00F6;"> <!ENTITY divide "&#x00F7;"> <!ENTITY oslash "&#x00F8;"> <!ENTITY ugrave "&#x00F9;"> <!ENTITY uacute "&#x00FA;"> <!ENTITY ucirc "&#x00FB;"> <!ENTITY uuml "&#x00FC;"> <!ENTITY yacute "&#x00FD;"> <!ENTITY thorn "&#x00FE;"> <!ENTITY yuml "&#x00FF;"> <!ENTITY OElig "&#x0152;"> <!ENTITY oelig "&#x0153;"> <!ENTITY Scaron "&#x0160;"> <!ENTITY scaron "&#x0161;"> <!ENTITY Yuml "&#x0178;"> <!ENTITY fnof "&#x0192;"> <!ENTITY circ "&#x02C6;"> <!ENTITY tilde "&#x02DC;"> <!ENTITY Alpha "&#x0391;"> <!ENTITY Beta "&#x0392;"> <!ENTITY Gamma "&#x0393;"> <!ENTITY Epsilon "&#x0395;"> <!ENTITY Zeta "&#x0396;"> <!ENTITY Eta "&#x0397;"> <!ENTITY Theta "&#x0398;"> <!ENTITY Iota "&#x0399;"> <!ENTITY Kappa "&#x039A;"> <!ENTITY Lambda "&#x039B;"> <!ENTITY Mu "&#x039C;"> <!ENTITY Nu "&#x039D;"> <!ENTITY Xi "&#x039E;"> <!ENTITY Omicron "&#x039F;"> <!ENTITY Pi "&#x03A0;"> <!ENTITY Rho "&#x03A1;"> <!ENTITY Sigma "&#x03A3;"> <!ENTITY Tau "&#x03A4;"> <!ENTITY Upsilon "&#x03A5;"> <!ENTITY Phi "&#x03A6;"> <!ENTITY Chi "&#x03A7;"> <!ENTITY Psi "&#x03A8;"> <!ENTITY Omega "&#x03A9;"> <!ENTITY alpha "&#x03B1;"> <!ENTITY beta "&#x03B2;"> <!ENTITY gamma "&#x03B3;"> <!ENTITY delta "&#x03B4;"> <!ENTITY epsilon "&#x03B5;"> <!ENTITY zeta "&#x03B6;"> <!ENTITY eta "&#x03B7;"> <!ENTITY theta "&#x03B8;"> <!ENTITY iota "&#x03B9;"> <!ENTITY kappa "&#x03BA;"> <!ENTITY lambda "&#x03BB;"> <!ENTITY mu "&#x03BC;"> <!ENTITY nu "&#x03BD;"> <!ENTITY xi "&#x03BE;"> <!ENTITY omicron "&#x03BF;"> <!ENTITY pi "&#x03C0;"> <!ENTITY rho "&#x03C1;"> <!ENTITY sigmaf "&#x03C2;"> <!ENTITY sigma "&#x03C3;"> <!ENTITY tau "&#x03C4;"> <!ENTITY upsilon 
"&#x03C5;"> <!ENTITY phi "&#x03C6;"> <!ENTITY chi "&#x03C7;"> <!ENTITY psi "&#x03C8;"> <!ENTITY omega "&#x03C9;"> <!ENTITY thetasym "&#x03D1;"> <!ENTITY upsih "&#x03D2;"> <!ENTITY piv "&#x03D6;"> <!ENTITY ensp "&#x2002;"> <!ENTITY emsp "&#x2003;"> <!ENTITY thinsp "&#x2009;"> <!ENTITY zwnj "&#x200C;"> <!ENTITY zwj "&#x200D;"> <!ENTITY lrm "&#x200E;"> <!ENTITY rlm "&#x200F;"> <!ENTITY ndash "&#x2013;"> <!ENTITY mdash "&#x2014;"> <!ENTITY lsquo "&#x2018;"> <!ENTITY rsquo "&#x2019;"> <!ENTITY sbquo "&#x201A;"> <!ENTITY ldquo "&#x201C;"> <!ENTITY rdquo "&#x201D;"> <!ENTITY bdquo "&#x201E;"> <!ENTITY dagger "&#x2020;"> <!ENTITY Dagger "&#x2021;"> <!ENTITY bull "&#x2022;"> <!ENTITY hellip "&#x2026;"> <!ENTITY permil "&#x2030;"> <!ENTITY prime "&#x2032;"> <!ENTITY Prime "&#x2033;"> <!ENTITY lsaquo "&#x2039;"> <!ENTITY rsaquo "&#x203A;"> <!ENTITY oline "&#x203E;"> <!ENTITY frasl "&#x2044;"> <!ENTITY euro "&#x20AC;"> <!ENTITY image "&#x2111;"> <!ENTITY weierp "&#x2118;"> <!ENTITY real "&#x211C;"> <!ENTITY trade "&#x2122;"> <!ENTITY alefsym "&#x2135;"> <!ENTITY larr "&#x2190;"> <!ENTITY uarr "&#x2191;"> <!ENTITY rarr "&#x2192;"> <!ENTITY darr "&#x2193;"> <!ENTITY harr "&#x2194;"> <!ENTITY crarr "&#x21B5;"> <!ENTITY lArr "&#x21D0;"> <!ENTITY uArr "&#x21D1;"> <!ENTITY rArr "&#x21D2;"> <!ENTITY dArr "&#x21D3;"> <!ENTITY hArr "&#x21D4;"> <!ENTITY forall "&#x2200;"> <!ENTITY part "&#x2202;"> <!ENTITY exist "&#x2203;"> <!ENTITY empty "&#x2205;"> <!ENTITY nabla "&#x2207;"> <!ENTITY isin "&#x2208;"> <!ENTITY notin "&#x2209;"> <!ENTITY ni "&#x220B;"> <!ENTITY prod "&#x220F;"> <!ENTITY sum "&#x2211;"> <!ENTITY minus "&#x2212;"> <!ENTITY lowast "&#x2217;"> <!ENTITY radic "&#x221A;"> <!ENTITY prop "&#x221D;"> <!ENTITY infin "&#x221E;"> <!ENTITY ang "&#x2220;"> <!ENTITY and "&#x2227;"> <!ENTITY or "&#x2228;"> <!ENTITY cap "&#x2229;"> <!ENTITY cup "&#x222A;"> <!ENTITY int "&#x222B;"> <!ENTITY there4 "&#x2234;"> <!ENTITY sim "&#x223C;"> <!ENTITY cong "&#x2245;"> <!ENTITY asymp "&#x2248;"> 
<!ENTITY ne "&#x2260;"> <!ENTITY equiv "&#x2261;"> <!ENTITY le "&#x2264;"> <!ENTITY ge "&#x2265;"> <!ENTITY sub "&#x2282;"> <!ENTITY sup "&#x2283;"> <!ENTITY nsub "&#x2284;"> <!ENTITY sube "&#x2286;"> <!ENTITY supe "&#x2287;"> <!ENTITY oplus "&#x2295;"> <!ENTITY otimes "&#x2297;"> <!ENTITY perp "&#x22A5;"> <!ENTITY sdot "&#x22C5;"> <!ENTITY lceil "&#x2308;"> <!ENTITY rceil "&#x2309;"> <!ENTITY lfloor "&#x230A;"> <!ENTITY rfloor "&#x230B;"> <!ENTITY lang "&#x2329;"> <!ENTITY rang "&#x232A;"> <!ENTITY loz "&#x25CA;"> <!ENTITY spades "&#x2660;"> <!ENTITY clubs "&#x2663;"> <!ENTITY hearts "&#x2665;"> <!ENTITY diams "&#x2666;"> ]>';
627    }
628}
629
// Register `SimplePie_Parser` as a second name for the namespaced
// `SimplePie\Parser` class, so both identifiers resolve to the same class.
// NOTE(review): presumably kept for callers still using the underscore-style
// name — confirm before removing.
class_alias(
    \SimplePie\Parser::class, // compile-time constant; evaluates to 'SimplePie\Parser'
    'SimplePie_Parser'
);
631