From 865ecc87963dc3b26e66296616eef2a1cc41ac3f Mon Sep 17 00:00:00 2001 From: Andrew Dolgov Date: Wed, 25 Oct 2023 12:55:09 +0300 Subject: move to psr-4 autoloader --- classes/FeedItem_Atom.php | 224 ++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 224 insertions(+) create mode 100644 classes/FeedItem_Atom.php (limited to 'classes/FeedItem_Atom.php') diff --git a/classes/FeedItem_Atom.php b/classes/FeedItem_Atom.php new file mode 100644 index 000000000..f6c96f959 --- /dev/null +++ b/classes/FeedItem_Atom.php @@ -0,0 +1,224 @@ +elem->getElementsByTagName("id")->item(0); + + if ($id) { + return $id->nodeValue; + } else { + return clean($this->get_link()); + } + } + + /** + * @return int|false a timestamp on success, false otherwise + */ + function get_date() { + $updated = $this->elem->getElementsByTagName("updated")->item(0); + + if ($updated) { + return strtotime($updated->nodeValue ?? ''); + } + + $published = $this->elem->getElementsByTagName("published")->item(0); + + if ($published) { + return strtotime($published->nodeValue ?? ''); + } + + $date = $this->xpath->query("dc:date", $this->elem)->item(0); + + if ($date) { + return strtotime($date->nodeValue ?? ''); + } + + // consistent with strtotime failing to parse + return false; + } + + + function get_link(): string { + $links = $this->elem->getElementsByTagName("link"); + + foreach ($links as $link) { + /** @phpstan-ignore-next-line */ + if ($link->hasAttribute("href") && + (!$link->hasAttribute("rel") + || $link->getAttribute("rel") == "alternate" + || $link->getAttribute("rel") == "standout")) { + $base = $this->xpath->evaluate("string(ancestor-or-self::*[@xml:base][1]/@xml:base)", $link); + + if ($base) + return UrlHelper::rewrite_relative($base, clean(trim($link->getAttribute("href")))); + else + return clean(trim($link->getAttribute("href"))); + } + } + + return ''; + } + + function get_title(): string { + $title = $this->elem->getElementsByTagName("title")->item(0); + return $title ? clean(trim($title->nodeValue)) : ''; + } + + /** + * @param string|null $base optional (returns $content if $base is null) + * @param string $content an HTML string + * + * @return string the rewritten XML or original $content + */ + private function rewrite_content_to_base(?string $base = null, ?string $content = '') { + + if (!empty($base) && !empty($content)) { + + $tmpdoc = new DOMDocument(); + if (@$tmpdoc->loadHTML('' . $content)) { + $tmpxpath = new DOMXPath($tmpdoc); + + $elems = $tmpxpath->query("(//*[@href]|//*[@src])"); + + foreach ($elems as $elem) { + if ($elem->hasAttribute("href")) { + $elem->setAttribute("href", + UrlHelper::rewrite_relative($base, $elem->getAttribute("href"))); + } else if ($elem->hasAttribute("src")) { + $elem->setAttribute("src", + UrlHelper::rewrite_relative($base, $elem->getAttribute("src"))); + } + } + + // Fall back to $content if saveXML somehow fails (i.e. returns false) + $modified_content = $tmpdoc->saveXML(); + return $modified_content !== false ? $modified_content : $content; + } + } + + return $content; + } + + function get_content(): string { + /** @var DOMElement|null */ + $content = $this->elem->getElementsByTagName("content")->item(0); + + if ($content) { + $base = $this->xpath->evaluate("string(ancestor-or-self::*[@xml:base][1]/@xml:base)", $content); + + if ($content->hasAttribute('type')) { + if ($content->getAttribute('type') == 'xhtml') { + for ($i = 0; $i < $content->childNodes->length; $i++) { + $child = $content->childNodes->item($i); + + if ($child->hasChildNodes()) { + return $this->rewrite_content_to_base($base, $this->doc->saveHTML($child)); + } + } + } + } + + return $this->rewrite_content_to_base($base, $this->subtree_or_text($content)); + } + + return ''; + } + + // TODO: duplicate code should be merged with get_content() + function get_description(): string { + /** @var DOMElement|null */ + $content = $this->elem->getElementsByTagName("summary")->item(0); + + if ($content) { + $base = $this->xpath->evaluate("string(ancestor-or-self::*[@xml:base][1]/@xml:base)", $content); + + if ($content->hasAttribute('type')) { + if ($content->getAttribute('type') == 'xhtml') { + for ($i = 0; $i < $content->childNodes->length; $i++) { + $child = $content->childNodes->item($i); + + if ($child->hasChildNodes()) { + return $this->rewrite_content_to_base($base, $this->doc->saveHTML($child)); + } + } + } + } + + return $this->rewrite_content_to_base($base, $this->subtree_or_text($content)); + } + + return ''; + } + + /** + * @return array + */ + function get_categories(): array { + $categories = $this->elem->getElementsByTagName("category"); + $cats = []; + + foreach ($categories as $cat) { + if ($cat->hasAttribute("term")) + array_push($cats, $cat->getAttribute("term")); + } + + $categories = $this->xpath->query("dc:subject", $this->elem); + + foreach ($categories as $cat) { + array_push($cats, $cat->nodeValue); + } + + return $this->normalize_categories($cats); + } + + /** + * @return array + */ + function get_enclosures(): array { + $links = $this->elem->getElementsByTagName("link"); + + $encs = []; + + foreach ($links as $link) { + /** @phpstan-ignore-next-line */ + if ($link->hasAttribute("href") && $link->hasAttribute("rel")) { + $base = $this->xpath->evaluate("string(ancestor-or-self::*[@xml:base][1]/@xml:base)", $link); + + if ($link->getAttribute("rel") == "enclosure") { + $enc = new FeedEnclosure(); + + $enc->type = clean($link->getAttribute("type")); + $enc->length = clean($link->getAttribute("length")); + $enc->link = clean($link->getAttribute("href")); + + if (!empty($base)) { + $enc->link = UrlHelper::rewrite_relative($base, $enc->link); + } + + array_push($encs, $enc); + } + } + } + + array_push($encs, ...parent::get_enclosures()); + + return $encs; + } + + function get_language(): string { + $lang = $this->elem->getAttributeNS(self::NS_XML, "lang"); + + if (!empty($lang)) { + return clean($lang); + } else { + // Fall back to the language declared on the feed, if any. + foreach ($this->doc->childNodes as $child) { + if (method_exists($child, "getAttributeNS")) { + return clean($child->getAttributeNS(self::NS_XML, "lang")); + } + } + } + return ''; + } +} -- cgit v1.2.3