From cc85704f3cc798e9df7813ab9e2de955d7152ada Mon Sep 17 00:00:00 2001 From: Andrew Dolgov Date: Mon, 26 Nov 2012 14:33:18 +0400 Subject: implement experimental article on-import data filters --- classes/filter.php | 14 +++++++++++++ classes/filter/redditimgur.php | 47 ++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 61 insertions(+) create mode 100644 classes/filter.php create mode 100644 classes/filter/redditimgur.php (limited to 'classes') diff --git a/classes/filter.php b/classes/filter.php new file mode 100644 index 000000000..8d6bf6f26 --- /dev/null +++ b/classes/filter.php @@ -0,0 +1,14 @@ +link = $link; + } + + function filter_article($article) { + return $article; + } + +} +?> diff --git a/classes/filter/redditimgur.php b/classes/filter/redditimgur.php new file mode 100644 index 000000000..6b41015e7 --- /dev/null +++ b/classes/filter/redditimgur.php @@ -0,0 +1,47 @@ +loadHTML($article["content"]); + + if ($doc) { + $xpath = new DOMXPath($doc); + $entries = $xpath->query('(//a[@href]|//img[@src])'); + + foreach ($entries as $entry) { + if ($entry->hasAttribute("href")) { + if (preg_match("/i.imgur.com\/.*?.jpg/", $entry->getAttribute("href"))) { + + $img = $doc->createElement('img'); + $img->setAttribute("src", $entry->getAttribute("href")); + + $entry->parentNode->replaceChild($img, $entry); + } + } + + // remove tiny thumbnails + if ($entry->hasAttribute("src")) { + if ($entry->parentNode && $entry->parentNode->parentNode) { + $entry->parentNode->parentNode->removeChild($entry->parentNode); + } + } + } + + $node = $doc->getElementsByTagName('body')->item(0); + + if ($node) { + $article["content"] = $doc->saveXML($node, LIBXML_NOEMPTYTAG); + } + } + } + } + + return $article; + } +} +?> -- cgit v1.2.3