summaryrefslogtreecommitdiff
path: root/test
diff options
context:
space:
mode:
authorAndres Rey <[email protected]>2018-11-25 21:14:25 +0000
committerAndres Rey <[email protected]>2018-11-25 21:14:25 +0000
commit93ca4484e2720a96f67f6b8edf8d17a39ada2e1b (patch)
treee2c951f0262ff45c4406601058b4bb90cd7930d4 /test
parent3046a6ae3e1610e9c2d60e9c4c72d817c286ad4b (diff)
Update test expectations
Diffstat (limited to 'test')
-rw-r--r--test/test-pages/001/expected-metadata.json8
-rw-r--r--test/test-pages/002/expected-metadata.json8
-rw-r--r--test/test-pages/003-metadata-preferred/expected-metadata.json8
-rw-r--r--test/test-pages/004-metadata-space-separated-properties/expected-metadata.json8
-rw-r--r--test/test-pages/aclu/expected-metadata.json9
-rw-r--r--test/test-pages/ars-1/expected-metadata.json9
-rw-r--r--test/test-pages/base-url-base-element-relative/expected-metadata.json6
-rw-r--r--test/test-pages/base-url-base-element/expected-metadata.json6
-rw-r--r--test/test-pages/base-url/expected-metadata.json8
-rw-r--r--test/test-pages/basic-tags-cleaning/expected-metadata.json8
-rw-r--r--test/test-pages/bbc-1/expected-metadata.json9
-rw-r--r--test/test-pages/blogger/expected-metadata.json9
-rw-r--r--test/test-pages/breitbart/expected-metadata.json11
-rw-r--r--test/test-pages/bug-1255978/expected-metadata.json11
-rw-r--r--test/test-pages/buzzfeed-1/expected-metadata.json7
-rw-r--r--test/test-pages/challenges/expected-metadata.json5
-rw-r--r--test/test-pages/clean-links/expected-metadata.json8
-rw-r--r--test/test-pages/cnet-svg-classes/expected-metadata.json7
-rw-r--r--test/test-pages/cnet/expected-metadata.json11
-rw-r--r--test/test-pages/cnn/expected-metadata.json11
-rw-r--r--test/test-pages/comment-inside-script-parsing/expected-metadata.json8
-rw-r--r--test/test-pages/daringfireball-1/expected-metadata.json8
-rw-r--r--test/test-pages/different-sources-for-images/expected-metadata.json8
-rw-r--r--test/test-pages/ehow-1/expected-metadata.json9
-rw-r--r--test/test-pages/ehow-2/expected-metadata.json9
-rw-r--r--test/test-pages/embedded-videos/expected-metadata.json8
-rw-r--r--test/test-pages/engadget/expected-metadata.json7
-rw-r--r--test/test-pages/fortressofsolitude/expected-metadata.json9
-rw-r--r--test/test-pages/gmw/expected-metadata.json10
-rw-r--r--test/test-pages/heise/expected-metadata.json9
-rw-r--r--test/test-pages/herald-sun-1/expected-metadata.json9
-rw-r--r--test/test-pages/hidden-nodes/expected-metadata.json6
-rw-r--r--test/test-pages/hukumusume/expected-metadata.json6
-rw-r--r--test/test-pages/iab-1/expected-metadata.json9
-rw-r--r--test/test-pages/ietf-1/expected-metadata.json6
-rw-r--r--test/test-pages/infobae/expected-metadata.json9
-rw-r--r--test/test-pages/keep-images/expected-metadata.json9
-rw-r--r--test/test-pages/la-nacion/expected-metadata.json7
-rw-r--r--test/test-pages/lemonde-1/expected-metadata.json9
-rw-r--r--test/test-pages/lemonde-2/expected-metadata.json7
-rw-r--r--test/test-pages/liberation-1/expected-metadata.json9
-rw-r--r--test/test-pages/lifehacker-post-comment-load/expected-metadata.json9
-rw-r--r--test/test-pages/lifehacker-working/expected-metadata.json9
-rw-r--r--test/test-pages/links-in-tables/expected-metadata.json9
-rw-r--r--test/test-pages/lwn-1/expected-metadata.json8
-rw-r--r--test/test-pages/medium-1/expected-metadata.json9
-rw-r--r--test/test-pages/medium-2/expected-metadata.json9
-rw-r--r--test/test-pages/medium-3/expected-metadata.json11
-rw-r--r--test/test-pages/missing-paragraphs/expected-metadata.json8
-rw-r--r--test/test-pages/mozilla-1/expected-metadata.json11
-rw-r--r--test/test-pages/mozilla-2/expected-metadata.json11
-rw-r--r--test/test-pages/msn/expected-metadata.json9
-rw-r--r--test/test-pages/nytimes-1/expected-metadata.json11
-rw-r--r--test/test-pages/nytimes-2/expected-metadata.json11
-rw-r--r--test/test-pages/pixnet/expected-metadata.json11
-rw-r--r--test/test-pages/remove-extra-brs/expected-metadata.json8
-rw-r--r--test/test-pages/remove-extra-paragraphs/expected-metadata.json8
-rw-r--r--test/test-pages/remove-script-tags/expected-metadata.json8
-rw-r--r--test/test-pages/reordering-paragraphs/expected-metadata.json8
-rw-r--r--test/test-pages/replace-brs/expected-metadata.json8
-rw-r--r--test/test-pages/replace-font-tags/expected-metadata.json8
-rw-r--r--test/test-pages/rtl-1/expected-metadata.json10
-rw-r--r--test/test-pages/rtl-2/expected-metadata.json10
-rw-r--r--test/test-pages/rtl-3/expected-metadata.json10
-rw-r--r--test/test-pages/rtl-4/expected-metadata.json10
-rw-r--r--test/test-pages/salon-1/expected-metadata.json9
-rw-r--r--test/test-pages/simplyfound-1/expected-metadata.json9
-rw-r--r--test/test-pages/social-buttons/expected-metadata.json8
-rw-r--r--test/test-pages/style-tags-removal/expected-metadata.json8
-rw-r--r--test/test-pages/svg-parsing/expected-metadata.json8
-rw-r--r--test/test-pages/table-style-attributes/expected-metadata.json10
-rw-r--r--test/test-pages/telegraph/expected-metadata.json7
-rw-r--r--test/test-pages/title-and-h1-discrepancy/expected-metadata.json6
-rw-r--r--test/test-pages/tmz-1/expected-metadata.json9
-rw-r--r--test/test-pages/tumblr/expected-metadata.json11
-rw-r--r--test/test-pages/wapo-1/expected-metadata.json9
-rw-r--r--test/test-pages/wapo-2/expected-metadata.json9
-rw-r--r--test/test-pages/webmd-1/expected-metadata.json9
-rw-r--r--test/test-pages/webmd-2/expected-metadata.json9
-rw-r--r--test/test-pages/wikia/expected-metadata.json11
-rw-r--r--test/test-pages/wikipedia/expected-metadata.json10
-rw-r--r--test/test-pages/wordpress/expected-metadata.json11
-rw-r--r--test/test-pages/yahoo-1/expected-metadata.json11
-rw-r--r--test/test-pages/yahoo-2/expected-metadata.json9
-rw-r--r--test/test-pages/yahoo-3/expected-metadata.json9
-rw-r--r--test/test-pages/yahoo-4/expected-metadata.json11
-rw-r--r--test/test-pages/youth/expected-metadata.json10
87 files changed, 410 insertions, 355 deletions
diff --git a/test/test-pages/001/expected-metadata.json b/test/test-pages/001/expected-metadata.json
index c58545d..f11c7b4 100644
--- a/test/test-pages/001/expected-metadata.json
+++ b/test/test-pages/001/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Get your Frontend JavaScript Code Covered | Code",
- "Author": "Nicolas Perriault —",
- "Excerpt": "Nicolas Perriault's homepage."
-}
+ "Title": "Get your Frontend JavaScript Code Covered | Code",
+ "Author": "Nicolas Perriault —",
+ "Excerpt": "Nicolas Perriault's homepage."
+} \ No newline at end of file
diff --git a/test/test-pages/002/expected-metadata.json b/test/test-pages/002/expected-metadata.json
index a351dd4..a9fb9d3 100644
--- a/test/test-pages/002/expected-metadata.json
+++ b/test/test-pages/002/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "This API is so Fetching!",
- "Author": "Nikhil Marathe",
- "Excerpt": "For more than a decade the Web has used XMLHttpRequest (XHR) to achieve asynchronous requests in JavaScript. While very useful, XHR is not a very ..."
-}
+ "Title": "This API is so Fetching!",
+ "Author": "Nikhil Marathe",
+ "Excerpt": "For more than a decade the Web has used XMLHttpRequest (XHR) to achieve asynchronous requests in JavaScript. While very useful, XHR is not a very ..."
+} \ No newline at end of file
diff --git a/test/test-pages/003-metadata-preferred/expected-metadata.json b/test/test-pages/003-metadata-preferred/expected-metadata.json
index a702e4a..b81f0a6 100644
--- a/test/test-pages/003-metadata-preferred/expected-metadata.json
+++ b/test/test-pages/003-metadata-preferred/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Dublin Core property title",
- "Author": "Dublin Core property author",
- "Excerpt": "Dublin Core property description"
-}
+ "Title": "Dublin Core property title",
+ "Author": "Dublin Core property author",
+ "Excerpt": "Dublin Core property description"
+} \ No newline at end of file
diff --git a/test/test-pages/004-metadata-space-separated-properties/expected-metadata.json b/test/test-pages/004-metadata-space-separated-properties/expected-metadata.json
index a41ac6b..5f7fda2 100644
--- a/test/test-pages/004-metadata-space-separated-properties/expected-metadata.json
+++ b/test/test-pages/004-metadata-space-separated-properties/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Preferred title",
- "Author": "Creator Name",
- "Excerpt": "Preferred description"
-}
+ "Title": "Preferred title",
+ "Author": "Creator Name",
+ "Excerpt": "Preferred description"
+} \ No newline at end of file
diff --git a/test/test-pages/aclu/expected-metadata.json b/test/test-pages/aclu/expected-metadata.json
index f954b98..82fefd5 100644
--- a/test/test-pages/aclu/expected-metadata.json
+++ b/test/test-pages/aclu/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Facebook Is Tracking Me Even Though I’m Not on Facebook",
- "Author": "By Daniel Kahn Gillmor, Senior Staff Technologist, ACLU Speech, Privacy, and Technology Project",
- "Excerpt": "I don't use Facebook. I'm not technophobic — I'm a geek. I've been using email since the early 1990s, I have accounts on hundreds of services around the net, and I do software development and internet protocol design both for work and for fun. I believe that a globe-spanning communications network like the internet can be a positive social force, and I publish much of my own work on the open web."
-}
+ "Title": "Facebook Is Tracking Me Even Though I’m Not on Facebook",
+ "Author": "By Daniel Kahn Gillmor, Senior Staff Technologist, ACLU Speech, Privacy, and Technology Project",
+ "Excerpt": "I don't use Facebook. I'm not technophobic — I'm a geek. I've been using email since the early 1990s, I have accounts on hundreds of services around the net, and I do software development and internet protocol design both for work and for fun. I believe that a globe-spanning communications network like the internet can be a positive social force, and I publish much of my own work on the open web.",
+ "Image": "https:\/\/www.aclu.org\/sites\/default\/files\/styles\/metatag_og_image_1200x630\/public\/field_share_image\/web18-facebook-socialshare-1200x628-v02.png?itok=p77cQjOm"
+} \ No newline at end of file
diff --git a/test/test-pages/ars-1/expected-metadata.json b/test/test-pages/ars-1/expected-metadata.json
index 8b3d493..5909f3e 100644
--- a/test/test-pages/ars-1/expected-metadata.json
+++ b/test/test-pages/ars-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Just-released Minecraft exploit makes it easy to crash game servers",
- "Author": "by Dan Goodin - Apr 16, 2015 8:02 pm UTC",
- "Excerpt": "Two-year-old bug exposes thousands of servers to crippling attack."
-}
+ "Title": "Just-released Minecraft exploit makes it easy to crash game servers",
+ "Author": "by Dan Goodin - Apr 16, 2015 8:02 pm UTC",
+ "Excerpt": "Two-year-old bug exposes thousands of servers to crippling attack.",
+ "Image": "http:\/\/cdn.arstechnica.net\/wp-content\/uploads\/2015\/04\/server-crash-640x426.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/base-url-base-element-relative/expected-metadata.json b/test/test-pages/base-url-base-element-relative/expected-metadata.json
index eb78f28..7e3b35a 100644
--- a/test/test-pages/base-url-base-element-relative/expected-metadata.json
+++ b/test/test-pages/base-url-base-element-relative/expected-metadata.json
@@ -1,4 +1,4 @@
{
- "Title": "Base URL with base relative test",
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
-}
+ "Title": "Base URL with base relative test",
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+} \ No newline at end of file
diff --git a/test/test-pages/base-url-base-element/expected-metadata.json b/test/test-pages/base-url-base-element/expected-metadata.json
index 4a22f75..3545f80 100644
--- a/test/test-pages/base-url-base-element/expected-metadata.json
+++ b/test/test-pages/base-url-base-element/expected-metadata.json
@@ -1,4 +1,4 @@
{
- "Title": "Base URL with base test",
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
-}
+ "Title": "Base URL with base test",
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+} \ No newline at end of file
diff --git a/test/test-pages/base-url/expected-metadata.json b/test/test-pages/base-url/expected-metadata.json
index b26e5cf..1c8014d 100644
--- a/test/test-pages/base-url/expected-metadata.json
+++ b/test/test-pages/base-url/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Base URL test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
-}
+ "Title": "Base URL test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+} \ No newline at end of file
diff --git a/test/test-pages/basic-tags-cleaning/expected-metadata.json b/test/test-pages/basic-tags-cleaning/expected-metadata.json
index f3292d5..1382512 100644
--- a/test/test-pages/basic-tags-cleaning/expected-metadata.json
+++ b/test/test-pages/basic-tags-cleaning/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Basic tag cleaning test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
-}
+ "Title": "Basic tag cleaning test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
+} \ No newline at end of file
diff --git a/test/test-pages/bbc-1/expected-metadata.json b/test/test-pages/bbc-1/expected-metadata.json
index 545e317..fb1ad45 100644
--- a/test/test-pages/bbc-1/expected-metadata.json
+++ b/test/test-pages/bbc-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Obama admits US gun laws are his 'biggest frustration' - BBC News",
- "Author": null,
- "Excerpt": "President Barack Obama tells the BBC his failure to pass \"common sense gun safety laws\" is the greatest frustration of his presidency."
-}
+ "Title": "Obama admits US gun laws are his 'biggest frustration' - BBC News",
+ "Author": null,
+ "Excerpt": "President Barack Obama tells the BBC his failure to pass \"common sense gun safety laws\" is the greatest frustration of his presidency.",
+ "Image": "http:\/\/ichef.bbci.co.uk\/news\/1024\/cpsprodpb\/3D8B\/production\/_84455751_84455749.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/blogger/expected-metadata.json b/test/test-pages/blogger/expected-metadata.json
index f912e3b..eef4912 100644
--- a/test/test-pages/blogger/expected-metadata.json
+++ b/test/test-pages/blogger/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Open Verilog flow for Silego GreenPak4 programmable logic devices",
- "Author": null,
- "Excerpt": "I've written a couple of posts in the past few months but they were all for the blog at work so I figured I'm long overdue for one on Silic..."
-}
+ "Title": "Open Verilog flow for Silego GreenPak4 programmable logic devices",
+ "Author": null,
+ "Excerpt": "I've written a couple of posts in the past few months but they were all for the blog at work so I figured I'm long overdue for one on Silic...",
+ "Image": "https:\/\/1.bp.blogspot.com\/-YIPC5jkXkDE\/Vy7YPSqFKWI\/AAAAAAAAAxI\/a7D6Ji2GxoUvcrwUkI4RLZcr2LFQEJCTACLcB\/w1200-h630-p-nu\/block-diagram.png"
+} \ No newline at end of file
diff --git a/test/test-pages/breitbart/expected-metadata.json b/test/test-pages/breitbart/expected-metadata.json
index 8bbbd41..3c7d29e 100644
--- a/test/test-pages/breitbart/expected-metadata.json
+++ b/test/test-pages/breitbart/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "'Neutral' Snopes Fact-Checker David Emery: 'Are There Any Un-Angry Trump Supporters?' - Breitbart",
- "Author": "by Lucas Nolan22 Dec 2016651",
- "Direction": null,
- "Excerpt": "Snopes fact checker and staff writer David Emery posted to Twitter asking if there were “any un-angry Trump supporters?”"
-}
+ "Title": "'Neutral' Snopes Fact-Checker David Emery: 'Are There Any Un-Angry Trump Supporters?' - Breitbart",
+ "Author": "by Lucas Nolan22 Dec 2016651",
+ "Direction": null,
+ "Excerpt": "Snopes fact checker and staff writer David Emery posted to Twitter asking if there were “any un-angry Trump supporters?”",
+ "Image": "http:\/\/fakehost\/test\/480"
+} \ No newline at end of file
diff --git a/test/test-pages/bug-1255978/expected-metadata.json b/test/test-pages/bug-1255978/expected-metadata.json
index db7c652..e85fe42 100644
--- a/test/test-pages/bug-1255978/expected-metadata.json
+++ b/test/test-pages/bug-1255978/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "Seven secrets that hotel owners don't want you to know",
- "Author": "Hazel Sheffield",
- "Direction": null,
- "Excerpt": "Most people go to hotels for the pleasure of sleeping in a giant bed with clean white sheets and waking up to fresh towels in the morning. But those towels and sheets might not be as clean as they look, according to the hotel bosses that responded to an online thread about the things hotel owners don’t want you to know."
-}
+ "Title": "Seven secrets that hotel owners don't want you to know",
+ "Author": "Hazel Sheffield",
+ "Direction": null,
+ "Excerpt": "Most people go to hotels for the pleasure of sleeping in a giant bed with clean white sheets and waking up to fresh towels in the morning. But those towels and sheets might not be as clean as they look, according to the hotel bosses that responded to an online thread about the things hotel owners don’t want you to know.",
+ "Image": "https:\/\/static.independent.co.uk\/s3fs-public\/thumbnails\/image\/2015\/12\/06\/10\/bed-hotel-room.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/buzzfeed-1/expected-metadata.json b/test/test-pages/buzzfeed-1/expected-metadata.json
index 5b04b83..c269f76 100644
--- a/test/test-pages/buzzfeed-1/expected-metadata.json
+++ b/test/test-pages/buzzfeed-1/expected-metadata.json
@@ -1,4 +1,5 @@
{
- "Title": "Student Dies After Diet Pills She Bought Online \"Burned Her Up From Within\"",
- "Excerpt": "An inquest into Eloise Parry's death has been adjourned until July."
-}
+ "Title": "Student Dies After Diet Pills She Bought Online \"Burned Her Up From Within\"",
+ "Excerpt": "An inquest into Eloise Parry's death has been adjourned until July.",
+ "Image": "http:\/\/fakehost\/test\/412"
+} \ No newline at end of file
diff --git a/test/test-pages/challenges/expected-metadata.json b/test/test-pages/challenges/expected-metadata.json
index 3b8b0a4..80e7aee 100644
--- a/test/test-pages/challenges/expected-metadata.json
+++ b/test/test-pages/challenges/expected-metadata.json
@@ -1,3 +1,4 @@
{
- "Title": "Les motivations du tueur de Las Vegas demeurent floues"
-}
+ "Title": "Les motivations du tueur de Las Vegas demeurent floues",
+ "Image": "http:\/\/fakehost\/img\/cha\/placeholders\/placeholder_1000x750.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/clean-links/expected-metadata.json b/test/test-pages/clean-links/expected-metadata.json
index 7993d55..cc7923f 100644
--- a/test/test-pages/clean-links/expected-metadata.json
+++ b/test/test-pages/clean-links/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Bartleby the Scrivener Web Study Text",
- "Author": null,
- "Excerpt": "Ere introducing the scrivener, as he first appeared to me, it is fit \n I make some mention of myself, my employees, my business, my chambers, \n and general surroundings; because some such description is indispensable \n to an adequate understanding of the chief character about to be presented."
-}
+ "Title": "Bartleby the Scrivener Web Study Text",
+ "Author": null,
+ "Excerpt": "Ere introducing the scrivener, as he first appeared to me, it is fit \n I make some mention of myself, my employees, my business, my chambers, \n and general surroundings; because some such description is indispensable \n to an adequate understanding of the chief character about to be presented."
+} \ No newline at end of file
diff --git a/test/test-pages/cnet-svg-classes/expected-metadata.json b/test/test-pages/cnet-svg-classes/expected-metadata.json
index ebebc0f..f6f4d46 100644
--- a/test/test-pages/cnet-svg-classes/expected-metadata.json
+++ b/test/test-pages/cnet-svg-classes/expected-metadata.json
@@ -1,4 +1,5 @@
{
- "Title": "Twitter Lite se estrena en México, Venezuela y otros nueve países",
- "Excerpt": "Twitter Lite llega a 11 países de América Latina, para ayudar a los usuarios con mala señal de sus redes móviles."
-}
+ "Title": "Twitter Lite se estrena en México, Venezuela y otros nueve países",
+ "Excerpt": "Twitter Lite llega a 11 países de América Latina, para ayudar a los usuarios con mala señal de sus redes móviles.",
+ "Image": "https:\/\/cdn1.cnet.com\/img\/JumVcu1ZSLtPP8ui0UWaSlgi5RU=\/670x503\/2017\/12\/01\/b36ce794-e0b8-495c-a198-184923a8f4e9\/twitter-lite.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/cnet/expected-metadata.json b/test/test-pages/cnet/expected-metadata.json
index 744652d..e120194 100644
--- a/test/test-pages/cnet/expected-metadata.json
+++ b/test/test-pages/cnet/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "Zuckerberg offers peek at Facebook's acquisition strategies",
- "Author": "Steven Musil",
- "Direction": null,
- "Excerpt": "Facebook CEO says be a friend and have a shared vision, but scare them when you have to and move fast."
-}
+ "Title": "Zuckerberg offers peek at Facebook's acquisition strategies",
+ "Author": "Steven Musil",
+ "Direction": null,
+ "Excerpt": "Facebook CEO says be a friend and have a shared vision, but scare them when you have to and move fast.",
+ "Image": "https:\/\/cnet3.cbsistatic.com\/img\/1JaRRjqhoGxDVkFxTRRWkZgyK2Q=\/670x503\/2014\/03\/21\/863df5d9-e8b8-4b38-851b-5e3f77f2cf0e\/mark-zuckerberg-facebook-home-10671610x407.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/cnn/expected-metadata.json b/test/test-pages/cnn/expected-metadata.json
index d88d406..978bdf7 100644
--- a/test/test-pages/cnn/expected-metadata.json
+++ b/test/test-pages/cnn/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "The 'birth lottery' and economic mobility",
- "Author": "Ahiza Garcia",
- "Direction": null,
- "Excerpt": "A recently-released report on poverty and inequality found that the U.S. ranks the lowest among countries with welfare states."
-}
+ "Title": "The 'birth lottery' and economic mobility",
+ "Author": "Ahiza Garcia",
+ "Direction": null,
+ "Excerpt": "A recently-released report on poverty and inequality found that the U.S. ranks the lowest among countries with welfare states.",
+ "Image": "http:\/\/i2.cdn.turner.com\/money\/dam\/assets\/141103182938-income-inequality-780x439.png"
+} \ No newline at end of file
diff --git a/test/test-pages/comment-inside-script-parsing/expected-metadata.json b/test/test-pages/comment-inside-script-parsing/expected-metadata.json
index e5ad501..f4e5750 100644
--- a/test/test-pages/comment-inside-script-parsing/expected-metadata.json
+++ b/test/test-pages/comment-inside-script-parsing/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Test script parsing",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
-}
+ "Title": "Test script parsing",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
+} \ No newline at end of file
diff --git a/test/test-pages/daringfireball-1/expected-metadata.json b/test/test-pages/daringfireball-1/expected-metadata.json
index 477261f..b9969de 100644
--- a/test/test-pages/daringfireball-1/expected-metadata.json
+++ b/test/test-pages/daringfireball-1/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Daring Fireball: Colophon",
- "Author": null,
- "Excerpt": "Daring Fireball is written and produced by John Gruber."
-}
+ "Title": "Daring Fireball: Colophon",
+ "Author": null,
+ "Excerpt": "Daring Fireball is written and produced by John Gruber."
+} \ No newline at end of file
diff --git a/test/test-pages/different-sources-for-images/expected-metadata.json b/test/test-pages/different-sources-for-images/expected-metadata.json
index 31f1ff3..7bfc756 100644
--- a/test/test-pages/different-sources-for-images/expected-metadata.json
+++ b/test/test-pages/different-sources-for-images/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Image sources test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
-}
+ "Title": "Image sources test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+} \ No newline at end of file
diff --git a/test/test-pages/ehow-1/expected-metadata.json b/test/test-pages/ehow-1/expected-metadata.json
index 9e2782b..f19b038 100644
--- a/test/test-pages/ehow-1/expected-metadata.json
+++ b/test/test-pages/ehow-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "How to Build a Terrarium | eHow",
- "Author": "Lucy Akins",
- "Excerpt": "Glass cloche terrariums are not only appealing to the eye, but they also preserve a bit of nature in your home and serve as a simple, yet beautiful, piece of art. Closed terrariums are easy to care for, as they retain much of their own moisture and provide a warm environment with a consistent level of humidity. You won’t have to water the..."
-}
+ "Title": "How to Build a Terrarium | eHow",
+ "Author": "Lucy Akins",
+ "Excerpt": "Glass cloche terrariums are not only appealing to the eye, but they also preserve a bit of nature in your home and serve as a simple, yet beautiful, piece of art. Closed terrariums are easy to care for, as they retain much of their own moisture and provide a warm environment with a consistent level of humidity. You won’t have to water the...",
+ "Image": "http:\/\/img-aws.ehowcdn.com\/200x200\/cme\/photography.prod.demandstudios.com\/16149374-814f-40bc-baf3-ca20f149f0ba.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/ehow-2/expected-metadata.json b/test/test-pages/ehow-2/expected-metadata.json
index 2967b61..43eff45 100644
--- a/test/test-pages/ehow-2/expected-metadata.json
+++ b/test/test-pages/ehow-2/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "How to Throw a Graduation Party on a Budget | eHow",
- "Author": "Gina Roberts-Grey",
- "Excerpt": "Graduation parties are a great way to commemorate the years of hard work teens and college co-eds devote to education. They’re also costly for mom and dad.The average cost of a graduation party in 2013 was a whopping $1,200, according to Graduationparty.com; $700 of that was allocated for food. However that budget was based on Midwestern..."
-}
+ "Title": "How to Throw a Graduation Party on a Budget | eHow",
+ "Author": "Gina Roberts-Grey",
+ "Excerpt": "Graduation parties are a great way to commemorate the years of hard work teens and college co-eds devote to education. They’re also costly for mom and dad.The average cost of a graduation party in 2013 was a whopping $1,200, according to Graduationparty.com; $700 of that was allocated for food. However that budget was based on Midwestern...",
+ "Image": "http:\/\/img-aws.ehowcdn.com\/200x200\/cme\/cme_public_images\/www_ehow_com\/cdn-write.demandstudios.com\/upload\/image\/2F\/86\/5547EF62-EAF5-4256-945D-0496F61C862F\/5547EF62-EAF5-4256-945D-0496F61C862F.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/embedded-videos/expected-metadata.json b/test/test-pages/embedded-videos/expected-metadata.json
index 46e3094..e22af78 100644
--- a/test/test-pages/embedded-videos/expected-metadata.json
+++ b/test/test-pages/embedded-videos/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Embedded videos test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
-}
+ "Title": "Embedded videos test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+} \ No newline at end of file
diff --git a/test/test-pages/engadget/expected-metadata.json b/test/test-pages/engadget/expected-metadata.json
index eb1ed25..d00b669 100644
--- a/test/test-pages/engadget/expected-metadata.json
+++ b/test/test-pages/engadget/expected-metadata.json
@@ -1,4 +1,5 @@
{
- "Title": "Xbox One X review: A console that keeps up with gaming PCs",
- "Excerpt": "The Xbox One X is the most powerful gaming console ever, but it's not for everyone yet."
-}
+ "Title": "Xbox One X review: A console that keeps up with gaming PCs",
+ "Excerpt": "The Xbox One X is the most powerful gaming console ever, but it's not for everyone yet.",
+ "Image": "http:\/\/fakehost\/test\/630"
+} \ No newline at end of file
diff --git a/test/test-pages/fortressofsolitude/expected-metadata.json b/test/test-pages/fortressofsolitude/expected-metadata.json
index 2efe2a7..54d1b36 100644
--- a/test/test-pages/fortressofsolitude/expected-metadata.json
+++ b/test/test-pages/fortressofsolitude/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Céline Dion Belches Her Way Onto Deadpool 2's Soundtrack",
- "Author": "Written by Edward Wallace",
- "Excerpt": "Just when you think the marketing behind the film couldn't get any more amazing, they go and release a music video from the Deadpool 2 soundtrack starring Canadian singer Céline Dion."
-}
+ "Title": "Céline Dion Belches Her Way Onto Deadpool 2's Soundtrack",
+ "Author": "Written by Edward Wallace",
+ "Excerpt": "Just when you think the marketing behind the film couldn't get any more amazing, they go and release a music video from the Deadpool 2 soundtrack starring Canadian singer Céline Dion.",
+ "Image": "http:\/\/fakehost\/test\/Céline Dion Belches Her Way Onto Deadpool 2's Soundtrack"
+} \ No newline at end of file
diff --git a/test/test-pages/gmw/expected-metadata.json b/test/test-pages/gmw/expected-metadata.json
index 2997886..cba8ceb 100644
--- a/test/test-pages/gmw/expected-metadata.json
+++ b/test/test-pages/gmw/expected-metadata.json
@@ -1,6 +1,6 @@
{
- "Title": "宇航员在太空中喝酒会怎么样?后果很严重 _探索者 _光明网",
- "Author": "肖春芳",
- "Direction": null,
- "Excerpt": "不幸的是,对于希望能喝上一杯的太空探险者,那些将他们送上太空的政府机构普遍禁止他们染指包括酒在内的含酒精饮料。"
-}
+ "Title": "宇航员在太空中喝酒会怎么样?后果很严重 _探索者 _光明网",
+ "Author": "肖春芳",
+ "Direction": null,
+ "Excerpt": "不幸的是,对于希望能喝上一杯的太空探险者,那些将他们送上太空的政府机构普遍禁止他们染指包括酒在内的含酒精饮料。"
+} \ No newline at end of file
diff --git a/test/test-pages/heise/expected-metadata.json b/test/test-pages/heise/expected-metadata.json
index ae180bf..ffad06a 100644
--- a/test/test-pages/heise/expected-metadata.json
+++ b/test/test-pages/heise/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "1Password für Mac generiert Einmal-Passwörter",
- "Author": "Mac & i",
- "Excerpt": "Das in der iOS-Version bereits enthaltene TOTP-Feature ist nun auch für OS X 10.10 verfügbar. Zudem gibt es neue Zusatzfelder in der Datenbank und weitere Verbesserungen."
-}
+ "Title": "1Password für Mac generiert Einmal-Passwörter",
+ "Author": "Mac & i",
+ "Excerpt": "Das in der iOS-Version bereits enthaltene TOTP-Feature ist nun auch für OS X 10.10 verfügbar. Zudem gibt es neue Zusatzfelder in der Datenbank und weitere Verbesserungen.",
+ "Image": "http:\/\/www.heise.de\/imgs\/18\/1\/4\/6\/2\/3\/5\/1\/Barcode-Scanner-With-Border-f0c62350bd8d9d96.jpeg"
+} \ No newline at end of file
diff --git a/test/test-pages/herald-sun-1/expected-metadata.json b/test/test-pages/herald-sun-1/expected-metadata.json
index b8ad6c2..1f84910 100644
--- a/test/test-pages/herald-sun-1/expected-metadata.json
+++ b/test/test-pages/herald-sun-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Angry media won’t buckle over new surveillance laws",
- "Author": "JOE HILDEBRAND",
- "Excerpt": "A HIGH-powered federal government team has been doing the rounds of media organisations in the past few days in an attempt to allay concerns about the impact of new surveillance legislation on press freedom. It failed."
-}
+ "Title": "Angry media won’t buckle over new surveillance laws",
+ "Author": "JOE HILDEBRAND",
+ "Excerpt": "A HIGH-powered federal government team has been doing the rounds of media organisations in the past few days in an attempt to allay concerns about the impact of new surveillance legislation on press freedom. It failed.",
+ "Image": "http:\/\/api.news.com.au\/content\/1.0\/heraldsun\/images\/1227261885862?format=jpg&group=iphone&size=medium"
+} \ No newline at end of file
diff --git a/test/test-pages/hidden-nodes/expected-metadata.json b/test/test-pages/hidden-nodes/expected-metadata.json
index 37bab58..c243f7a 100644
--- a/test/test-pages/hidden-nodes/expected-metadata.json
+++ b/test/test-pages/hidden-nodes/expected-metadata.json
@@ -1,4 +1,4 @@
{
- "Title": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt",
- "Excerpt": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit amet."
-}
+ "Title": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt",
+ "Excerpt": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit amet."
+} \ No newline at end of file
diff --git a/test/test-pages/hukumusume/expected-metadata.json b/test/test-pages/hukumusume/expected-metadata.json
index 97317fc..f2f7e76 100644
--- a/test/test-pages/hukumusume/expected-metadata.json
+++ b/test/test-pages/hukumusume/expected-metadata.json
@@ -1,4 +1,4 @@
{
- "Title": "欲張りなイヌ <福娘童話集 きょうのイソップ童話>",
- "Excerpt": "福娘童話集 > きょうのイソップ童話 > 1月のイソップ童話 > 欲張りなイヌ"
-}
+ "Title": "欲張りなイヌ <福娘童話集 きょうのイソップ童話>",
+ "Excerpt": "福娘童話集 > きょうのイソップ童話 > 1月のイソップ童話 > 欲張りなイヌ"
+} \ No newline at end of file
diff --git a/test/test-pages/iab-1/expected-metadata.json b/test/test-pages/iab-1/expected-metadata.json
index b1f885e..0ea6fea 100644
--- a/test/test-pages/iab-1/expected-metadata.json
+++ b/test/test-pages/iab-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Getting LEAN with Digital Ad UX | IAB",
- "Author": "By\n\t\t\tScott Cunningham",
- "Excerpt": "We messed up. As technologists, tasked with delivering content and services to users, we lost track of the user experience. Twenty years ago we saw an explosion of websites, built by developers around the world, providing all forms of content. This was the beginning of an age of enlightenment, the intersection of content and technology. … Continued"
-}
+ "Title": "Getting LEAN with Digital Ad UX | IAB",
+ "Author": "By\n\t\t\tScott Cunningham",
+ "Excerpt": "We messed up. As technologists, tasked with delivering content and services to users, we lost track of the user experience. Twenty years ago we saw an explosion of websites, built by developers around the world, providing all forms of content. This was the beginning of an age of enlightenment, the intersection of content and technology. … Continued",
+ "Image": "http:\/\/www.iab.com\/wp-content\/uploads\/2015\/10\/getting-lean-with-digital-ad-ux-300x250.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/ietf-1/expected-metadata.json b/test/test-pages/ietf-1/expected-metadata.json
index f783f67..2babd23 100644
--- a/test/test-pages/ietf-1/expected-metadata.json
+++ b/test/test-pages/ietf-1/expected-metadata.json
@@ -1,4 +1,4 @@
{
- "Title": "remoteStorage",
- "Author": "Jong, Michiel de"
-}
+ "Title": "remoteStorage",
+ "Author": "Jong, Michiel de"
+} \ No newline at end of file
diff --git a/test/test-pages/infobae/expected-metadata.json b/test/test-pages/infobae/expected-metadata.json
index e8b24b1..45a0ac8 100644
--- a/test/test-pages/infobae/expected-metadata.json
+++ b/test/test-pages/infobae/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Una patota de varones atacó a un rugbier gay: \"Te vamos a matar por puto\"",
- "Author": "Por Mauricio Luna 1 de diciembre de 2017",
- "Excerpt": "Jonathan Castellari fue salvajemente golpeado en un local de comidas rápidas, mientras esperaba el desayuno junto a un amigo. Podría perder un ojo"
-}
+ "Title": "Una patota de varones atacó a un rugbier gay: \"Te vamos a matar por puto\"",
+ "Author": "Por Mauricio Luna 1 de diciembre de 2017",
+ "Excerpt": "Jonathan Castellari fue salvajemente golpeado en un local de comidas rápidas, mientras esperaba el desayuno junto a un amigo. Podría perder un ojo",
+ "Image": "https:\/\/www.infobae.com\/new-resizer\/shi8E0F5ldd8a7vtvFaJomRURqU=\/1200x0\/filters:quality(100)\/s3.amazonaws.com\/arc-wordpress-client-uploads\/infobae-wp\/wp-content\/uploads\/2017\/12\/01154429\/Rugbier-golpeado-1920.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/keep-images/expected-metadata.json b/test/test-pages/keep-images/expected-metadata.json
index 6c2c29a..ac3808e 100644
--- a/test/test-pages/keep-images/expected-metadata.json
+++ b/test/test-pages/keep-images/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Inside the Deep Web Drug Lab",
- "Author": "Joseph Cox",
- "Excerpt": "Welcome to DoctorX’s Barcelona lab, where the drugs you bought online are tested for safety and purity. No questions ask…"
-}
+ "Title": "Inside the Deep Web Drug Lab",
+ "Author": "Joseph Cox",
+ "Excerpt": "Welcome to DoctorX’s Barcelona lab, where the drugs you bought online are tested for safety and purity. No questions ask…",
+ "Image": "https:\/\/d262ilb51hltx0.cloudfront.net\/max\/800\/1*sLDnS1UWEFIS33uLMxq3cw.jpeg"
+} \ No newline at end of file
diff --git a/test/test-pages/la-nacion/expected-metadata.json b/test/test-pages/la-nacion/expected-metadata.json
index ddba3d8..2f5b6c5 100644
--- a/test/test-pages/la-nacion/expected-metadata.json
+++ b/test/test-pages/la-nacion/expected-metadata.json
@@ -1,4 +1,5 @@
{
- "Title": "Una solución no violenta para la cuestión mapuche",
- "Excerpt": "Los pueblos indígenas reclaman por derechos que permanecen incumplidos, por eso es más eficiente canalizar la protesta que reprimirla"
-}
+ "Title": "Una solución no violenta para la cuestión mapuche",
+ "Excerpt": "Los pueblos indígenas reclaman por derechos que permanecen incumplidos, por eso es más eficiente canalizar la protesta que reprimirla",
+ "Image": "http:\/\/bucket.glanacion.com\/anexos\/fotos\/77\/2585177.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/lemonde-1/expected-metadata.json b/test/test-pages/lemonde-1/expected-metadata.json
index 3d8792a..e0d0a9c 100644
--- a/test/test-pages/lemonde-1/expected-metadata.json
+++ b/test/test-pages/lemonde-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Le projet de loi sur le renseignement massivement approuvé à l'Assemblée",
- "Author": null,
- "Excerpt": "Largement approuvé par les députés, le texte sera désormais examiné par le Sénat, puis le Conseil constitutionnel."
-}
+ "Title": "Le projet de loi sur le renseignement massivement approuvé à l'Assemblée",
+ "Author": null,
+ "Excerpt": "Largement approuvé par les députés, le texte sera désormais examiné par le Sénat, puis le Conseil constitutionnel.",
+ "Image": "http:\/\/fakehost\/test\/image\/jpeg"
+} \ No newline at end of file
diff --git a/test/test-pages/lemonde-2/expected-metadata.json b/test/test-pages/lemonde-2/expected-metadata.json
index f82607a..2706a54 100644
--- a/test/test-pages/lemonde-2/expected-metadata.json
+++ b/test/test-pages/lemonde-2/expected-metadata.json
@@ -1 +1,6 @@
-{"Title":"La crise europ\u00e9enne est une crise de la dette, pas de l'euro","Author":null,"Excerpt":"Le retour \u00e0 la stabilit\u00e9 co\u00fbtera des milliards d'euros, mais l'Union europ\u00e9enne en vaut la peine, estime un collectif d'industriels."} \ No newline at end of file
+{
+ "Title": "La crise européenne est une crise de la dette, pas de l'euro",
+ "Author": null,
+ "Excerpt": "Le retour à la stabilité coûtera des milliards d'euros, mais l'Union européenne en vaut la peine, estime un collectif d'industriels.",
+ "Image": "http:\/\/s1.lemde.fr\/medias\/web\/1.2.705\/img\/placeholder\/default.png"
+} \ No newline at end of file
diff --git a/test/test-pages/liberation-1/expected-metadata.json b/test/test-pages/liberation-1/expected-metadata.json
index 7040bd8..bce9274 100644
--- a/test/test-pages/liberation-1/expected-metadata.json
+++ b/test/test-pages/liberation-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Un troisième Français mort dans le séisme au Népal",
- "Author": "AFP",
- "Excerpt": "Laurent Fabius a accueilli jeudi matin à Roissy un premier avion spécial ramenant des rescapés."
-}
+ "Title": "Un troisième Français mort dans le séisme au Népal",
+ "Author": "AFP",
+ "Excerpt": "Laurent Fabius a accueilli jeudi matin à Roissy un premier avion spécial ramenant des rescapés.",
+ "Image": "http:\/\/md1.libe.com\/photo\/755923-000_hkg10175905.jpg?modified_at=1430371146&amp;width=750"
+} \ No newline at end of file
diff --git a/test/test-pages/lifehacker-post-comment-load/expected-metadata.json b/test/test-pages/lifehacker-post-comment-load/expected-metadata.json
index 1c7f82b..368bece 100644
--- a/test/test-pages/lifehacker-post-comment-load/expected-metadata.json
+++ b/test/test-pages/lifehacker-post-comment-load/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "How to Program Your Mind to Stop Buying Crap You Don’t Need",
- "Author": "Patrick Allan",
- "Excerpt": "We all buy things from time to time that we don't really need. It's okay to appeal to your wants every once in a while, as long as you're in control. If you struggle with clutter, impulse buys, and buyer's remorse, here's how to put your mind in the right place before you even set foot in a store."
-}
+ "Title": "How to Program Your Mind to Stop Buying Crap You Don’t Need",
+ "Author": "Patrick Allan",
+ "Excerpt": "We all buy things from time to time that we don't really need. It's okay to appeal to your wants every once in a while, as long as you're in control. If you struggle with clutter, impulse buys, and buyer's remorse, here's how to put your mind in the right place before you even set foot in a store.",
+ "Image": "http:\/\/i.kinja-img.com\/gawker-media\/image\/upload\/s--hqqO9fze--\/n1s6c2m6kc07iqdyllj6.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/lifehacker-working/expected-metadata.json b/test/test-pages/lifehacker-working/expected-metadata.json
index 1c7f82b..368bece 100644
--- a/test/test-pages/lifehacker-working/expected-metadata.json
+++ b/test/test-pages/lifehacker-working/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "How to Program Your Mind to Stop Buying Crap You Don’t Need",
- "Author": "Patrick Allan",
- "Excerpt": "We all buy things from time to time that we don't really need. It's okay to appeal to your wants every once in a while, as long as you're in control. If you struggle with clutter, impulse buys, and buyer's remorse, here's how to put your mind in the right place before you even set foot in a store."
-}
+ "Title": "How to Program Your Mind to Stop Buying Crap You Don’t Need",
+ "Author": "Patrick Allan",
+ "Excerpt": "We all buy things from time to time that we don't really need. It's okay to appeal to your wants every once in a while, as long as you're in control. If you struggle with clutter, impulse buys, and buyer's remorse, here's how to put your mind in the right place before you even set foot in a store.",
+ "Image": "http:\/\/i.kinja-img.com\/gawker-media\/image\/upload\/s--hqqO9fze--\/n1s6c2m6kc07iqdyllj6.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/links-in-tables/expected-metadata.json b/test/test-pages/links-in-tables/expected-metadata.json
index 6ff5704..3f72532 100644
--- a/test/test-pages/links-in-tables/expected-metadata.json
+++ b/test/test-pages/links-in-tables/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Saving Data: Reducing the size of App Updates by 65%",
- "Author": null,
- "Excerpt": "Posted by Andrew Hayden, Software Engineer on Google Play Android users are downloading tens of billions of apps and games on Google Pla..."
-}
+ "Title": "Saving Data: Reducing the size of App Updates by 65%",
+ "Author": null,
+ "Excerpt": "Posted by Andrew Hayden, Software Engineer on Google Play Android users are downloading tens of billions of apps and games on Google Pla...",
+ "Image": "https:\/\/2.bp.blogspot.com\/-chCZZinlUTg\/WEcxvJo9gdI\/AAAAAAAADnk\/3ND_BspqN6Y2j5xxkLFW3RyS2Ig0NHZpQCLcB\/w1200-h630-p-k-nu\/ipsum-opsum.gif"
+} \ No newline at end of file
diff --git a/test/test-pages/lwn-1/expected-metadata.json b/test/test-pages/lwn-1/expected-metadata.json
index 7a7ca1c..ac856e4 100644
--- a/test/test-pages/lwn-1/expected-metadata.json
+++ b/test/test-pages/lwn-1/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "LWN.net Weekly Edition for March 26, 2015 [LWN.net]",
- "Author": "By Nathan Willis\n March 25, 2015",
- "Excerpt": "The Arduino has been one of the biggest success stories of the open-hardware movement, but that success does not protect it from internal conflict. In recent months, two of the project's founders have come into conflict about the direction of future efforts—and that conflict has turned into a legal dispute about who owns the rights to the Arduino trademark."
-}
+ "Title": "LWN.net Weekly Edition for March 26, 2015 [LWN.net]",
+ "Author": "By Nathan Willis\n March 25, 2015",
+ "Excerpt": "The Arduino has been one of the biggest success stories of the open-hardware movement, but that success does not protect it from internal conflict. In recent months, two of the project's founders have come into conflict about the direction of future efforts—and that conflict has turned into a legal dispute about who owns the rights to the Arduino trademark."
+} \ No newline at end of file
diff --git a/test/test-pages/medium-1/expected-metadata.json b/test/test-pages/medium-1/expected-metadata.json
index e3e098c..ce4c1a9 100644
--- a/test/test-pages/medium-1/expected-metadata.json
+++ b/test/test-pages/medium-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "The Open Journalism Project: Better Student Journalism",
- "Author": "Pippin Lee",
- "Excerpt": "We pushed out the first version of the Open Journalism site in January. Here’s what we’ve learned about student journali…"
-}
+ "Title": "The Open Journalism Project: Better Student Journalism",
+ "Author": "Pippin Lee",
+ "Excerpt": "We pushed out the first version of the Open Journalism site in January. Here’s what we’ve learned about student journali…",
+ "Image": "https:\/\/d262ilb51hltx0.cloudfront.net\/max\/800\/1*oBWUXtszDsiv_-Qq2bFLTQ.png"
+} \ No newline at end of file
diff --git a/test/test-pages/medium-2/expected-metadata.json b/test/test-pages/medium-2/expected-metadata.json
index 395fb03..1257405 100644
--- a/test/test-pages/medium-2/expected-metadata.json
+++ b/test/test-pages/medium-2/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "On Behalf of “Literally”",
- "Author": "Courtney Kirchoff",
- "Excerpt": "In defense of the word “literally” and why you or someone you know should stop misusing the word, lest they drive us fig…"
-}
+ "Title": "On Behalf of “Literally”",
+ "Author": "Courtney Kirchoff",
+ "Excerpt": "In defense of the word “literally” and why you or someone you know should stop misusing the word, lest they drive us fig…",
+ "Image": "https:\/\/d262ilb51hltx0.cloudfront.net\/max\/1600\/1*eR_J8DurqygbhrwDg-WPnQ.png"
+} \ No newline at end of file
diff --git a/test/test-pages/medium-3/expected-metadata.json b/test/test-pages/medium-3/expected-metadata.json
index b2e66b9..c35c9d7 100644
--- a/test/test-pages/medium-3/expected-metadata.json
+++ b/test/test-pages/medium-3/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "Samantha and The Great Big Lie",
- "Author": "John C. Welch",
- "Direction": null,
- "Excerpt": "How to get shanked doing what people say they want"
-}
+ "Title": "Samantha and The Great Big Lie",
+ "Author": "John C. Welch",
+ "Direction": null,
+ "Excerpt": "How to get shanked doing what people say they want",
+ "Image": "https:\/\/cdn-images-1.medium.com\/max\/1200\/1*kbPh7V97eyRodSOw2-ALDw.png"
+} \ No newline at end of file
diff --git a/test/test-pages/missing-paragraphs/expected-metadata.json b/test/test-pages/missing-paragraphs/expected-metadata.json
index ecd9fbc..a48bc86 100644
--- a/test/test-pages/missing-paragraphs/expected-metadata.json
+++ b/test/test-pages/missing-paragraphs/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy\n eirmod tempor invidunt",
- "Author": "Henri Sivonen",
- "Excerpt": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy\n eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam\n voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet\n clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit\n amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam\n nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat,\n sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum.\n Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor\n sit amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed\n diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat,\n sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum.\n Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor\n sit amet."
-}
+ "Title": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy\n eirmod tempor invidunt",
+ "Author": "Henri Sivonen",
+ "Excerpt": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy\n eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam\n voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet\n clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit\n amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam\n nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat,\n sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum.\n Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor\n sit amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed\n diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat,\n sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum.\n Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor\n sit amet."
+} \ No newline at end of file
diff --git a/test/test-pages/mozilla-1/expected-metadata.json b/test/test-pages/mozilla-1/expected-metadata.json
index 3a93f8f..4ffdf79 100644
--- a/test/test-pages/mozilla-1/expected-metadata.json
+++ b/test/test-pages/mozilla-1/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "Firefox — Customize and make it your own — The most flexible browser on the Web",
- "Author": null,
- "Direction": "ltr",
- "Excerpt": "It’s easier than ever to personalize Firefox and make it work the way\n you do.\n No other browser gives you so much choice and flexibility."
-}
+ "Title": "Firefox — Customize and make it your own — The most flexible browser on the Web",
+ "Author": null,
+ "Direction": "ltr",
+ "Excerpt": "It’s easier than ever to personalize Firefox and make it work the way\n you do.\n No other browser gives you so much choice and flexibility.",
+ "Image": "https:\/\/mozorg.cdn.mozilla.net\/media\/img\/firefox\/template\/page-image.af8027a425de.png"
+} \ No newline at end of file
diff --git a/test/test-pages/mozilla-2/expected-metadata.json b/test/test-pages/mozilla-2/expected-metadata.json
index de229d8..0b84253 100644
--- a/test/test-pages/mozilla-2/expected-metadata.json
+++ b/test/test-pages/mozilla-2/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "Welcome to Firefox Developer Edition",
- "Author": null,
- "Direction": "ltr",
- "Excerpt": "Built for those who build the Web. Introducing the only browser made for developers."
-}
+ "Title": "Welcome to Firefox Developer Edition",
+ "Author": null,
+ "Direction": "ltr",
+ "Excerpt": "Built for those who build the Web. Introducing the only browser made for developers.",
+ "Image": "https:\/\/mozorg.cdn.mozilla.net\/media\/img\/firefox\/developer\/page-image.03bbe7da3199.png"
+} \ No newline at end of file
diff --git a/test/test-pages/msn/expected-metadata.json b/test/test-pages/msn/expected-metadata.json
index 4916e95..7b50117 100644
--- a/test/test-pages/msn/expected-metadata.json
+++ b/test/test-pages/msn/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Nintendo's first iPhone game will launch in December for $10",
- "Author": "Alex Perry\n \n 1 day ago",
- "Excerpt": "Nintendo and Apple shocked the world earlier this year by announcing \"Super Mario Run,\" the legendary gaming company's first foray into mobile gaming.&nbsp;"
-}
+ "Title": "Nintendo's first iPhone game will launch in December for $10",
+ "Author": "Alex Perry\n \n 1 day ago",
+ "Excerpt": "Nintendo and Apple shocked the world earlier this year by announcing \"Super Mario Run,\" the legendary gaming company's first foray into mobile gaming.&nbsp;",
+ "Image": "http:\/\/img-s-msn-com.akamaized.net\/tenant\/amp\/entityid\/AAkk5fh.img"
+} \ No newline at end of file
diff --git a/test/test-pages/nytimes-1/expected-metadata.json b/test/test-pages/nytimes-1/expected-metadata.json
index c8b12aa..098429d 100644
--- a/test/test-pages/nytimes-1/expected-metadata.json
+++ b/test/test-pages/nytimes-1/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "United States to Lift Sudan Sanctions",
- "Author": "Jeffrey Gettleman",
- "Direction": null,
- "Excerpt": "For the first time since the 1990s, the country will be able to trade extensively with the United States."
-}
+ "Title": "United States to Lift Sudan Sanctions",
+ "Author": "Jeffrey Gettleman",
+ "Direction": null,
+ "Excerpt": "For the first time since the 1990s, the country will be able to trade extensively with the United States.",
+ "Image": "https:\/\/static01.nyt.com\/images\/2017\/01\/14\/world\/13SUDAN-1\/13SUDAN-1-facebookJumbo.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/nytimes-2/expected-metadata.json b/test/test-pages/nytimes-2/expected-metadata.json
index d8c62b1..3254c74 100644
--- a/test/test-pages/nytimes-2/expected-metadata.json
+++ b/test/test-pages/nytimes-2/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "Yahoo’s Sale to Verizon Leaves Shareholders With Little Say",
- "Author": "Steven Davidoff Solomon",
- "Direction": null,
- "Excerpt": "The internet giant’s decision to sell its business is plagued with challenges that reveal how unusual deal structures can affect shareholders."
-}
+ "Title": "Yahoo’s Sale to Verizon Leaves Shareholders With Little Say",
+ "Author": "Steven Davidoff Solomon",
+ "Direction": null,
+ "Excerpt": "The internet giant’s decision to sell its business is plagued with challenges that reveal how unusual deal structures can affect shareholders.",
+ "Image": "https:\/\/static01.nyt.com\/images\/2016\/07\/30\/business\/db-dealprof\/db-dealprof-facebookJumbo.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/pixnet/expected-metadata.json b/test/test-pages/pixnet/expected-metadata.json
index 97554c7..ffdd41d 100644
--- a/test/test-pages/pixnet/expected-metadata.json
+++ b/test/test-pages/pixnet/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "新竹尖石_美樹營地賞楓 (2) @ 史蒂文的家_藍天 :: 痞客邦 PIXNET ::",
- "Author": "史蒂文的家_藍天 (stevenhgm)",
- "Direction": null,
- "Excerpt": "一波波接續性低溫寒流報到 已將新竹尖石鄉後山一帶層層山巒披上嫣紅的彩衣 玉峰道路一路上雲氣山嵐滯留山頭 順路下切蜿蜒道路後不久即抵達來到&quot;玉峰國小&quot; &quot;美樹&quot;美"
-}
+ "Title": "新竹尖石_美樹營地賞楓 (2) @ 史蒂文的家_藍天 :: 痞客邦 PIXNET ::",
+ "Author": "史蒂文的家_藍天 (stevenhgm)",
+ "Direction": null,
+ "Excerpt": "一波波接續性低溫寒流報到 已將新竹尖石鄉後山一帶層層山巒披上嫣紅的彩衣 玉峰道路一路上雲氣山嵐滯留山頭 順路下切蜿蜒道路後不久即抵達來到&quot;玉峰國小&quot; &quot;美樹&quot;美",
+ "Image": "http:\/\/pic.pimg.tw\/stevenhgm\/1387895093-631461272.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/remove-extra-brs/expected-metadata.json b/test/test-pages/remove-extra-brs/expected-metadata.json
index 152d972..b378339 100644
--- a/test/test-pages/remove-extra-brs/expected-metadata.json
+++ b/test/test-pages/remove-extra-brs/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Remove trailing brs test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
-}
+ "Title": "Remove trailing brs test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
+} \ No newline at end of file
diff --git a/test/test-pages/remove-extra-paragraphs/expected-metadata.json b/test/test-pages/remove-extra-paragraphs/expected-metadata.json
index 4a21b9b..fc6c06e 100644
--- a/test/test-pages/remove-extra-paragraphs/expected-metadata.json
+++ b/test/test-pages/remove-extra-paragraphs/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Replace font tags test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
-}
+ "Title": "Replace font tags test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
+} \ No newline at end of file
diff --git a/test/test-pages/remove-script-tags/expected-metadata.json b/test/test-pages/remove-script-tags/expected-metadata.json
index 96ec024..c0567d8 100644
--- a/test/test-pages/remove-script-tags/expected-metadata.json
+++ b/test/test-pages/remove-script-tags/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Remove script tags test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
-}
+ "Title": "Remove script tags test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
+} \ No newline at end of file
diff --git a/test/test-pages/reordering-paragraphs/expected-metadata.json b/test/test-pages/reordering-paragraphs/expected-metadata.json
index cae2da5..27f5eaf 100644
--- a/test/test-pages/reordering-paragraphs/expected-metadata.json
+++ b/test/test-pages/reordering-paragraphs/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "",
- "Author": null,
- "Excerpt": "Regarding item# 11111, under sufficiently extreme conditions, quarks may\n become deconfined and exist as free particles. In the course of asymptotic\n freedom, the strong interaction becomes weaker at higher temperatures.\n Eventually, color confinement would be lost and an extremely hot plasma\n of freely moving quarks and gluons would be formed. This theoretical phase\n of matter is called quark-gluon plasma.[81] The exact conditions needed\n to give rise to this state are unknown and have been the subject of a great\n deal of speculation and experimentation."
-}
+ "Title": "",
+ "Author": null,
+ "Excerpt": "Regarding item# 11111, under sufficiently extreme conditions, quarks may\n become deconfined and exist as free particles. In the course of asymptotic\n freedom, the strong interaction becomes weaker at higher temperatures.\n Eventually, color confinement would be lost and an extremely hot plasma\n of freely moving quarks and gluons would be formed. This theoretical phase\n of matter is called quark-gluon plasma.[81] The exact conditions needed\n to give rise to this state are unknown and have been the subject of a great\n deal of speculation and experimentation."
+} \ No newline at end of file
diff --git a/test/test-pages/replace-brs/expected-metadata.json b/test/test-pages/replace-brs/expected-metadata.json
index c73456d..4a3ab99 100644
--- a/test/test-pages/replace-brs/expected-metadata.json
+++ b/test/test-pages/replace-brs/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Replace brs test",
- "Author": null,
- "Excerpt": "Lorem ipsumdolor sit"
-}
+ "Title": "Replace brs test",
+ "Author": null,
+ "Excerpt": "Lorem ipsumdolor sit"
+} \ No newline at end of file
diff --git a/test/test-pages/replace-font-tags/expected-metadata.json b/test/test-pages/replace-font-tags/expected-metadata.json
index c669818..1fc0cd4 100644
--- a/test/test-pages/replace-font-tags/expected-metadata.json
+++ b/test/test-pages/replace-font-tags/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Replace font tags test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
-}
+ "Title": "Replace font tags test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+} \ No newline at end of file
diff --git a/test/test-pages/rtl-1/expected-metadata.json b/test/test-pages/rtl-1/expected-metadata.json
index 3c14748..d26d69a 100644
--- a/test/test-pages/rtl-1/expected-metadata.json
+++ b/test/test-pages/rtl-1/expected-metadata.json
@@ -1,6 +1,6 @@
{
- "Title": "RTL Test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet.",
- "Direction": "rtl"
-}
+ "Title": "RTL Test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet.",
+ "Direction": "rtl"
+} \ No newline at end of file
diff --git a/test/test-pages/rtl-2/expected-metadata.json b/test/test-pages/rtl-2/expected-metadata.json
index 3c14748..d26d69a 100644
--- a/test/test-pages/rtl-2/expected-metadata.json
+++ b/test/test-pages/rtl-2/expected-metadata.json
@@ -1,6 +1,6 @@
{
- "Title": "RTL Test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet.",
- "Direction": "rtl"
-}
+ "Title": "RTL Test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet.",
+ "Direction": "rtl"
+} \ No newline at end of file
diff --git a/test/test-pages/rtl-3/expected-metadata.json b/test/test-pages/rtl-3/expected-metadata.json
index 3c14748..d26d69a 100644
--- a/test/test-pages/rtl-3/expected-metadata.json
+++ b/test/test-pages/rtl-3/expected-metadata.json
@@ -1,6 +1,6 @@
{
- "Title": "RTL Test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet.",
- "Direction": "rtl"
-}
+ "Title": "RTL Test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet.",
+ "Direction": "rtl"
+} \ No newline at end of file
diff --git a/test/test-pages/rtl-4/expected-metadata.json b/test/test-pages/rtl-4/expected-metadata.json
index ee2b37a..a9690b7 100644
--- a/test/test-pages/rtl-4/expected-metadata.json
+++ b/test/test-pages/rtl-4/expected-metadata.json
@@ -1,6 +1,6 @@
{
- "Title": "RTL Test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet.",
- "Direction": null
-}
+ "Title": "RTL Test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet.",
+ "Direction": null
+} \ No newline at end of file
diff --git a/test/test-pages/salon-1/expected-metadata.json b/test/test-pages/salon-1/expected-metadata.json
index 71fc109..cd47b7f 100644
--- a/test/test-pages/salon-1/expected-metadata.json
+++ b/test/test-pages/salon-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "The sharing economy is a lie: Uber, Ayn Rand and the truth about tech and libertarians",
- "Author": "Joanna Rothkopf",
- "Excerpt": "Disruptive companies talk a good game about sharing. Uber's really just an under-regulated company making riches"
-}
+ "Title": "The sharing economy is a lie: Uber, Ayn Rand and the truth about tech and libertarians",
+ "Author": "Joanna Rothkopf",
+ "Excerpt": "Disruptive companies talk a good game about sharing. Uber's really just an under-regulated company making riches",
+ "Image": "http:\/\/media.salon.com\/2014\/12\/uber_rand_paul.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/simplyfound-1/expected-metadata.json b/test/test-pages/simplyfound-1/expected-metadata.json
index 3772bbd..9c8fb6b 100644
--- a/test/test-pages/simplyfound-1/expected-metadata.json
+++ b/test/test-pages/simplyfound-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Raspberry Pi 3 - The credit card sized PC that cost only $35 - All-time bestselling computer in UK",
- "Author": null,
- "Excerpt": "The Raspberry Pi Foundation started by a handful of volunteers in 2012 when they released the original Raspberry Pi 256MB Model B without knowing what to expect. In a short four-year period they have grown to over sixty full-time employees and ha..."
-}
+ "Title": "Raspberry Pi 3 - The credit card sized PC that cost only $35 - All-time bestselling computer in UK",
+ "Author": null,
+ "Excerpt": "The Raspberry Pi Foundation started by a handful of volunteers in 2012 when they released the original Raspberry Pi 256MB Model B without knowing what to expect. In a short four-year period they have grown to over sixty full-time employees and ha...",
+ "Image": "https:\/\/d34hb2g9mvfppu.cloudfront.net\/m\/images\/cache\/images\/2016\/02\/29\/apcnews2012raspberry_pi_logo_mainimage8_jpg8_322_27630a8388eb_lg.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/social-buttons/expected-metadata.json b/test/test-pages/social-buttons/expected-metadata.json
index 50d7ac6..545b72f 100644
--- a/test/test-pages/social-buttons/expected-metadata.json
+++ b/test/test-pages/social-buttons/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Share buttons removal test",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
-}
+ "Title": "Share buttons removal test",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+} \ No newline at end of file
diff --git a/test/test-pages/style-tags-removal/expected-metadata.json b/test/test-pages/style-tags-removal/expected-metadata.json
index e30a764..44f6efe 100644
--- a/test/test-pages/style-tags-removal/expected-metadata.json
+++ b/test/test-pages/style-tags-removal/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "Style tags removal",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
-}
+ "Title": "Style tags removal",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+} \ No newline at end of file
diff --git a/test/test-pages/svg-parsing/expected-metadata.json b/test/test-pages/svg-parsing/expected-metadata.json
index 2192d3b..be5e333 100644
--- a/test/test-pages/svg-parsing/expected-metadata.json
+++ b/test/test-pages/svg-parsing/expected-metadata.json
@@ -1,5 +1,5 @@
{
- "Title": "SVG parsing",
- "Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\ntempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\nquis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\nconsequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\ncillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\nproident, sunt in culpa qui officia deserunt mollit anim id est laborum."
-}
+ "Title": "SVG parsing",
+ "Author": null,
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\ntempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\nquis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\nconsequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\ncillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\nproident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+} \ No newline at end of file
diff --git a/test/test-pages/table-style-attributes/expected-metadata.json b/test/test-pages/table-style-attributes/expected-metadata.json
index 3866f09..f677d3e 100644
--- a/test/test-pages/table-style-attributes/expected-metadata.json
+++ b/test/test-pages/table-style-attributes/expected-metadata.json
@@ -1,6 +1,6 @@
{
- "Title": "linux video",
- "Author": null,
- "Direction": null,
- "Excerpt": "linux usability\n ...or, why do I bother. © 2002, 2003\n Jamie Zawinski"
-}
+ "Title": "linux video",
+ "Author": null,
+ "Direction": null,
+ "Excerpt": "linux usability\n ...or, why do I bother. © 2002, 2003\n Jamie Zawinski"
+} \ No newline at end of file
diff --git a/test/test-pages/telegraph/expected-metadata.json b/test/test-pages/telegraph/expected-metadata.json
index 196d045..94a330d 100644
--- a/test/test-pages/telegraph/expected-metadata.json
+++ b/test/test-pages/telegraph/expected-metadata.json
@@ -1,4 +1,5 @@
{
- "Title": "Zimbabwe coup: Robert Mugabe and wife Grace 'insisting he finishes his term', as priest steps in to mediate",
- "Excerpt": "Zimbabwe President Robert Mugabe, his wife Grace and two key figures from her G40 political faction are under house arrest at Mugabe's &quot;Blue House&quot; compound in Harare and are insisting the 93 year-old finishes his presidential term, a source said."
-}
+ "Title": "Zimbabwe coup: Robert Mugabe and wife Grace 'insisting he finishes his term', as priest steps in to mediate",
+ "Excerpt": "Zimbabwe President Robert Mugabe, his wife Grace and two key figures from her G40 political faction are under house arrest at Mugabe's &quot;Blue House&quot; compound in Harare and are insisting the 93 year-old finishes his presidential term, a source said.",
+ "Image": "http:\/\/www.telegraph.co.uk\/content\/dam\/news\/2017\/11\/16\/TELEMMGLPICT000146889449-xlarge_trans_NvBQzQNjv4BqySoB6nTCgtc7U4LQ_FPO4hKi2sT3vi7ux2-RDZwC4QA.jpeg"
+} \ No newline at end of file
diff --git a/test/test-pages/title-and-h1-discrepancy/expected-metadata.json b/test/test-pages/title-and-h1-discrepancy/expected-metadata.json
index 2840904..5d2f573 100644
--- a/test/test-pages/title-and-h1-discrepancy/expected-metadata.json
+++ b/test/test-pages/title-and-h1-discrepancy/expected-metadata.json
@@ -1,4 +1,4 @@
{
- "Title": "This is a long title with a colon: Hello there",
- "Excerpt": "Lorem\n ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
-}
+ "Title": "This is a long title with a colon: Hello there",
+ "Excerpt": "Lorem\n ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+} \ No newline at end of file
diff --git a/test/test-pages/tmz-1/expected-metadata.json b/test/test-pages/tmz-1/expected-metadata.json
index 994d596..684127f 100644
--- a/test/test-pages/tmz-1/expected-metadata.json
+++ b/test/test-pages/tmz-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Lupita Nyong'o's $150K Pearl Oscar Dress -- STOLEN!!!",
- "Author": null,
- "Excerpt": "Lupita Nyong'o's now-famous Oscar dress -- adorned in pearls -- was stolen right out of her hotel room ... TMZ has learned. Law enforcement sources tell…"
-}
+ "Title": "Lupita Nyong'o's $150K Pearl Oscar Dress -- STOLEN!!!",
+ "Author": null,
+ "Excerpt": "Lupita Nyong'o's now-famous Oscar dress -- adorned in pearls -- was stolen right out of her hotel room ... TMZ has learned. Law enforcement sources tell…",
+ "Image": "http:\/\/ll-media.tmz.com\/2015\/02\/26\/0225-lupita-nyongo-getty-01-1200x630.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/tumblr/expected-metadata.json b/test/test-pages/tumblr/expected-metadata.json
index 4589af0..d0ecb00 100644
--- a/test/test-pages/tumblr/expected-metadata.json
+++ b/test/test-pages/tumblr/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "Minecraft 1.8 - The Bountiful Update",
- "Author": null,
- "Direction": null,
- "Excerpt": "+ Added Granite, Andesite, and Diorite stone blocks, with smooth versions\n+ Added Slime Block\n+ Added Iron Trapdoor\n+ Added Prismarine and Sea Lantern blocks\n+ Added the Ocean Monument\n+ Added Red..."
-}
+ "Title": "Minecraft 1.8 - The Bountiful Update",
+ "Author": null,
+ "Direction": null,
+ "Excerpt": "+ Added Granite, Andesite, and Diorite stone blocks, with smooth versions\n+ Added Slime Block\n+ Added Iron Trapdoor\n+ Added Prismarine and Sea Lantern blocks\n+ Added the Ocean Monument\n+ Added Red...",
+ "Image": "http:\/\/assets.tumblr.com\/images\/og\/fb_landscape_share.png"
+} \ No newline at end of file
diff --git a/test/test-pages/wapo-1/expected-metadata.json b/test/test-pages/wapo-1/expected-metadata.json
index ac80bbb..401a73a 100644
--- a/test/test-pages/wapo-1/expected-metadata.json
+++ b/test/test-pages/wapo-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Attack stokes instability fears in North Africa",
- "Author": "By Erin Cunningham",
- "Excerpt": "The assault on Tunisia’s most renowned museum, in which gunmen killed at least 19 people, could heighten tensions in a nation that has become deeply divided between pro- and anti-Islamist factions."
-}
+ "Title": "Attack stokes instability fears in North Africa",
+ "Author": "By Erin Cunningham",
+ "Excerpt": "The assault on Tunisia’s most renowned museum, in which gunmen killed at least 19 people, could heighten tensions in a nation that has become deeply divided between pro- and anti-Islamist factions.",
+ "Image": "http:\/\/img.washingtonpost.com\/rw\/2010-2019\/WashingtonPost\/2015\/03\/18\/Foreign\/Images\/Nic6429927.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/wapo-2/expected-metadata.json b/test/test-pages/wapo-2/expected-metadata.json
index bee9dd4..7a9493e 100644
--- a/test/test-pages/wapo-2/expected-metadata.json
+++ b/test/test-pages/wapo-2/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Where do strained U.S.-Israeli relations go after Netanyahu’s victory?",
- "Author": "By Steven Mufson",
- "Excerpt": "Few foreign leaders have so brazenly stood up to President Obama and the relationship could face its next test this month."
-}
+ "Title": "Where do strained U.S.-Israeli relations go after Netanyahu’s victory?",
+ "Author": "By Steven Mufson",
+ "Excerpt": "Few foreign leaders have so brazenly stood up to President Obama and the relationship could face its next test this month.",
+ "Image": "http:\/\/img.washingtonpost.com\/rw\/2010-2019\/WashingtonPost\/2015\/03\/18\/National-Economy\/Images\/Nic6429750-1138.jpg"
+} \ No newline at end of file
diff --git a/test/test-pages/webmd-1/expected-metadata.json b/test/test-pages/webmd-1/expected-metadata.json
index 315ee82..76d3dbc 100644
--- a/test/test-pages/webmd-1/expected-metadata.json
+++ b/test/test-pages/webmd-1/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Babies Who Eat Peanuts Early May Avoid Allergy",
- "Author": "By Brenda Goodman, MA\n WebMD Health News",
- "Excerpt": "Life-threatening peanut allergies have mysteriously been on the rise in the past decade, with little hope for a cure. But a groundbreaking new study may offer a way to stem that rise, while another may offer some hope for those who are already allergic."
-}
+ "Title": "Babies Who Eat Peanuts Early May Avoid Allergy",
+ "Author": "By Brenda Goodman, MA\n WebMD Health News",
+ "Excerpt": "Life-threatening peanut allergies have mysteriously been on the rise in the past decade, with little hope for a cure. But a groundbreaking new study may offer a way to stem that rise, while another may offer some hope for those who are already allergic.",
+ "Image": "http:\/\/img.webmd.com\/dtmcms\/live\/webmd\/consumer_assets\/site_images\/miscellaneous\/webmd_FB_logo_bluebkgrd.jpg?v=1"
+} \ No newline at end of file
diff --git a/test/test-pages/webmd-2/expected-metadata.json b/test/test-pages/webmd-2/expected-metadata.json
index 3bbb5fd..dc0d878 100644
--- a/test/test-pages/webmd-2/expected-metadata.json
+++ b/test/test-pages/webmd-2/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Superbugs: What They Are and How You Get Them",
- "Author": "By Kelli Miller\n WebMD Health News",
- "Excerpt": "Drug-resistant bacteria, dubbed"
-}
+ "Title": "Superbugs: What They Are and How You Get Them",
+ "Author": "By Kelli Miller\n WebMD Health News",
+ "Excerpt": "Drug-resistant bacteria, dubbed",
+ "Image": "http:\/\/img.webmd.com\/dtmcms\/live\/webmd\/consumer_assets\/site_images\/miscellaneous\/webmd_FB_logo_bluebkgrd.jpg?v=1"
+} \ No newline at end of file
diff --git a/test/test-pages/wikia/expected-metadata.json b/test/test-pages/wikia/expected-metadata.json
index 3ad3235..4769623 100644
--- a/test/test-pages/wikia/expected-metadata.json
+++ b/test/test-pages/wikia/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "'Star Wars' Original Cuts Might Get Released for 40th Anniversary",
- "Author": "James Akinaka",
- "Direction": null,
- "Excerpt": "As a 40th birthday present to the Star Wars Saga and its fans, Lucasfilm could re-release the original versions of the original trilogy films."
-}
+ "Title": "'Star Wars' Original Cuts Might Get Released for 40th Anniversary",
+ "Author": "James Akinaka",
+ "Direction": null,
+ "Excerpt": "As a 40th birthday present to the Star Wars Saga and its fans, Lucasfilm could re-release the original versions of the original trilogy films.",
+ "Image": "http:\/\/fakehost\/test\/720"
+} \ No newline at end of file
diff --git a/test/test-pages/wikipedia/expected-metadata.json b/test/test-pages/wikipedia/expected-metadata.json
index 52b13ff..8f22810 100644
--- a/test/test-pages/wikipedia/expected-metadata.json
+++ b/test/test-pages/wikipedia/expected-metadata.json
@@ -1,6 +1,6 @@
{
- "Title": "Mozilla - Wikipedia",
- "Author": null,
- "Direction": "ltr",
- "Excerpt": "Mozilla is a free-software community, created in 1998 by members of Netscape. The Mozilla community uses, develops, spreads and supports Mozilla products, thereby promoting exclusively free software and open standards, with only minor exceptions.[1] The community is supported institutionally by the Mozilla Foundation and its tax-paying subsidiary, the Mozilla Corporation.[2]"
-}
+ "Title": "Mozilla - Wikipedia",
+ "Author": null,
+ "Direction": "ltr",
+ "Excerpt": "Mozilla is a free-software community, created in 1998 by members of Netscape. The Mozilla community uses, develops, spreads and supports Mozilla products, thereby promoting exclusively free software and open standards, with only minor exceptions.[1] The community is supported institutionally by the Mozilla Foundation and its tax-paying subsidiary, the Mozilla Corporation.[2]"
+} \ No newline at end of file
diff --git a/test/test-pages/wordpress/expected-metadata.json b/test/test-pages/wordpress/expected-metadata.json
index c9d6abd..a9dcbfa 100644
--- a/test/test-pages/wordpress/expected-metadata.json
+++ b/test/test-pages/wordpress/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "Stack Overflow Jobs Data Shows ReactJS Skills in High Demand, WordPress Market Oversaturated with Developers",
- "Author": null,
- "Direction": null,
- "Excerpt": "Stack Overflow published its analysis of 2017 hiring trends based on the targeting options employers selected when posting to Stack Overflow Jobs. The report, which compares data from 200 companies…"
-}
+ "Title": "Stack Overflow Jobs Data Shows ReactJS Skills in High Demand, WordPress Market Oversaturated with Developers",
+ "Author": null,
+ "Direction": null,
+ "Excerpt": "Stack Overflow published its analysis of 2017 hiring trends based on the targeting options employers selected when posting to Stack Overflow Jobs. The report, which compares data from 200 companies…",
+ "Image": "http:\/\/fakehost\/test\/470"
+} \ No newline at end of file
diff --git a/test/test-pages/yahoo-1/expected-metadata.json b/test/test-pages/yahoo-1/expected-metadata.json
index e4bcca1..2d7eb9b 100644
--- a/test/test-pages/yahoo-1/expected-metadata.json
+++ b/test/test-pages/yahoo-1/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "These are the 8 coolest PlayStation VR games",
- "Author": "Ben Silverman",
- "Direction": null,
- "Excerpt": "To help you decide what’s what, I’ve put together this list of the 8 PSVR games worth considering. Beloved cult hit “Rez” gets the VR treatment to help launch the PSVR, and the results are terrific. Chaos, for sure, and also “Thumper.” Called a “violent rhythm game” by its creators, “Thumper” is, well"
-}
+ "Title": "These are the 8 coolest PlayStation VR games",
+ "Author": "Ben Silverman",
+ "Direction": null,
+ "Excerpt": "To help you decide what’s what, I’ve put together this list of the 8 PSVR games worth considering. Beloved cult hit “Rez” gets the VR treatment to help launch the PSVR, and the results are terrific. Chaos, for sure, and also “Thumper.” Called a “violent rhythm game” by its creators, “Thumper” is, well",
+ "Image": "http:\/\/l3.yimg.com\/uu\/api\/res\/1.2\/4eRCPf9lJt_3q29.outekQ--\/aD02Njk7dz03NDQ7c209MTthcHBpZD15dGFjaHlvbg--\/http:\/\/media.zenfs.com\/en\/homerun\/feed_manager_auto_publish_494\/4406ef57dcb40376c513903b03bef048"
+} \ No newline at end of file
diff --git a/test/test-pages/yahoo-2/expected-metadata.json b/test/test-pages/yahoo-2/expected-metadata.json
index fe406c3..98e35c4 100644
--- a/test/test-pages/yahoo-2/expected-metadata.json
+++ b/test/test-pages/yahoo-2/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Yahoo News - Latest News & Headlines",
- "Author": "NATALIYA VASILYEVA",
- "Excerpt": "The latest news and headlines from Yahoo! News. Get breaking news stories and in-depth coverage with videos and photos."
-}
+ "Title": "Yahoo News - Latest News & Headlines",
+ "Author": "NATALIYA VASILYEVA",
+ "Excerpt": "The latest news and headlines from Yahoo! News. Get breaking news stories and in-depth coverage with videos and photos.",
+ "Image": "https:\/\/s.yimg.com\/os\/mit\/media\/m\/social\/images\/social_default_logo-1481777.png"
+} \ No newline at end of file
diff --git a/test/test-pages/yahoo-3/expected-metadata.json b/test/test-pages/yahoo-3/expected-metadata.json
index 1ffa6e7..adce0d3 100644
--- a/test/test-pages/yahoo-3/expected-metadata.json
+++ b/test/test-pages/yahoo-3/expected-metadata.json
@@ -1,5 +1,6 @@
{
- "Title": "Veteran Wraps Baby in American Flag, Photo Sparks Controversy",
- "Excerpt": "A photographer and Navy veteran is fighting back after a photo she posted to Facebook started an online backlash. Vanessa Hicks said she had no idea her photo would be considered controversial. The photo, from a military family’s newborn photo shoot, showed a newborn infant wrapped in an American flag held by his father, who was in his military uniform. Hicks, a Navy veteran herself and the wife of an active-duty Navy member, said her intention was to honor the flag as well as her clients, who wanted to incorporate their military service in the photo shoot.",
- "Author": "By GILLIAN MOHNEY\n March 11, 2015 3:46 PM"
-}
+ "Title": "Veteran Wraps Baby in American Flag, Photo Sparks Controversy",
+ "Excerpt": "A photographer and Navy veteran is fighting back after a photo she posted to Facebook started an online backlash. Vanessa Hicks said she had no idea her photo would be considered controversial. The photo, from a military family’s newborn photo shoot, showed a newborn infant wrapped in an American flag held by his father, who was in his military uniform. Hicks, a Navy veteran herself and the wife of an active-duty Navy member, said her intention was to honor the flag as well as her clients, who wanted to incorporate their military service in the photo shoot.",
+ "Author": "By GILLIAN MOHNEY\n March 11, 2015 3:46 PM",
+ "Image": "https:\/\/s.yimg.com\/bt\/api\/res\/1.2\/qZaM9MLUOrxLg4IfXt_Niw--\/YXBwaWQ9eW5ld3NfbGVnbztxPTc1O3c9NjAw\/http:\/\/media.zenfs.com\/en-US\/video\/video.abcnewsplus.com\/559ecdbafdb839129816b5c79a996975.cf.png"
+} \ No newline at end of file
diff --git a/test/test-pages/yahoo-4/expected-metadata.json b/test/test-pages/yahoo-4/expected-metadata.json
index 8048fe7..82557ef 100644
--- a/test/test-pages/yahoo-4/expected-metadata.json
+++ b/test/test-pages/yahoo-4/expected-metadata.json
@@ -1,6 +1,7 @@
{
- "Title": "トレンドマイクロ、公衆無線LANを安全に使うためのアプリ「フリーWi-Fiプロテクション」(CNET Japan) - Yahoo!ニュース",
- "Author": null,
- "Direction": null,
- "Excerpt": "トレンドマイクロは3月9日、Wi-Fi利用時の通信を暗号化し保護するスマホ・タブレット - Yahoo!ニュース(CNET Japan)"
-}
+ "Title": "トレンドマイクロ、公衆無線LANを安全に使うためのアプリ「フリーWi-Fiプロテクション」(CNET Japan) - Yahoo!ニュース",
+ "Author": null,
+ "Direction": null,
+ "Excerpt": "トレンドマイクロは3月9日、Wi-Fi利用時の通信を暗号化し保護するスマホ・タブレット - Yahoo!ニュース(CNET Japan)",
+ "Image": "http:\/\/fakehost\/test\/600"
+} \ No newline at end of file
diff --git a/test/test-pages/youth/expected-metadata.json b/test/test-pages/youth/expected-metadata.json
index cf1afac..666b15d 100644
--- a/test/test-pages/youth/expected-metadata.json
+++ b/test/test-pages/youth/expected-metadata.json
@@ -1,6 +1,6 @@
{
- "Title": "海外留学生看两会:出国前后关注点大不同_教育频道_中国青年网",
- "Author": "青网校园崔宁宁",
- "Direction": null,
- "Excerpt": "图为马素湘在澳大利亚悉尼游玩时的近影。出国前后关注点大不同出国前:政治科目会出啥考题?出国后:国家未来将如何发展?在采访中,我们了解到不少学子在出国前就每年守在电脑前观看两会直播。但是,随着年龄和阅历的增长,学子对两会的关注点在出国前后发生了很大的变化。在法国里昂国立应用科学院留学的卢宇表示,他还是个中学生时,就开始关注两会了。“我高中毕业后就出国留学了。"
-}
+ "Title": "海外留学生看两会:出国前后关注点大不同_教育频道_中国青年网",
+ "Author": "青网校园崔宁宁",
+ "Direction": null,
+ "Excerpt": "图为马素湘在澳大利亚悉尼游玩时的近影。出国前后关注点大不同出国前:政治科目会出啥考题?出国后:国家未来将如何发展?在采访中,我们了解到不少学子在出国前就每年守在电脑前观看两会直播。但是,随着年龄和阅历的增长,学子对两会的关注点在出国前后发生了很大的变化。在法国里昂国立应用科学院留学的卢宇表示,他还是个中学生时,就开始关注两会了。“我高中毕业后就出国留学了。"
+} \ No newline at end of file