summaryrefslogtreecommitdiff
path: root/test
diff options
context:
space:
mode:
authorAndres Rey <[email protected]>2018-11-26 22:40:10 +0000
committerAndres Rey <[email protected]>2018-11-26 22:40:10 +0000
commit2fa332ff8d44dec300904538bfa3a196e051dcfd (patch)
tree30cf3f5560ac14dd6e30ebb8e2f8fbcd704b1acf /test
parent4dfbc5db03d429741454b076f35c2513a1a525ab (diff)
Add all missing metadata bits
Diffstat (limited to 'test')
-rw-r--r--test/test-pages/001/expected-metadata.json4
-rw-r--r--test/test-pages/002/expected-metadata.json4
-rw-r--r--test/test-pages/003-metadata-preferred/expected-metadata.json4
-rw-r--r--test/test-pages/004-metadata-space-separated-properties/expected-metadata.json4
-rw-r--r--test/test-pages/aclu/expected-metadata.json3
-rw-r--r--test/test-pages/ars-1/expected-metadata.json3
-rw-r--r--test/test-pages/base-url-base-element-relative/expected-metadata.json5
-rw-r--r--test/test-pages/base-url-base-element/expected-metadata.json5
-rw-r--r--test/test-pages/base-url/expected-metadata.json4
-rw-r--r--test/test-pages/basic-tags-cleaning/expected-metadata.json4
-rw-r--r--test/test-pages/bbc-1/expected-metadata.json3
-rw-r--r--test/test-pages/blogger/expected-metadata.json3
-rw-r--r--test/test-pages/buzzfeed-1/expected-metadata.json4
-rw-r--r--test/test-pages/challenges/expected-metadata.json5
-rw-r--r--test/test-pages/clean-links/expected-metadata.json4
-rw-r--r--test/test-pages/cnet-svg-classes/expected-metadata.json4
-rw-r--r--test/test-pages/comment-inside-script-parsing/expected-metadata.json4
-rw-r--r--test/test-pages/daringfireball-1/expected-metadata.json4
-rw-r--r--test/test-pages/different-sources-for-images/expected-metadata.json4
-rw-r--r--test/test-pages/ehow-1/expected-metadata.json3
-rw-r--r--test/test-pages/ehow-2/expected-metadata.json3
-rw-r--r--test/test-pages/embedded-videos/expected-metadata.json4
-rw-r--r--test/test-pages/engadget/expected-metadata.json4
-rw-r--r--test/test-pages/fortressofsolitude/expected-metadata.json3
-rw-r--r--test/test-pages/gmw/expected-metadata.json3
-rw-r--r--test/test-pages/heise/expected-metadata.json3
-rw-r--r--test/test-pages/herald-sun-1/expected-metadata.json3
-rw-r--r--test/test-pages/hidden-nodes/expected-metadata.json5
-rw-r--r--test/test-pages/hukumusume/expected-metadata.json5
-rw-r--r--test/test-pages/iab-1/expected-metadata.json3
-rw-r--r--test/test-pages/ietf-1/expected-metadata.json5
-rw-r--r--test/test-pages/infobae/expected-metadata.json3
-rw-r--r--test/test-pages/keep-images/expected-metadata.json3
-rw-r--r--test/test-pages/la-nacion/expected-metadata.json4
-rw-r--r--test/test-pages/lemonde-1/expected-metadata.json3
-rw-r--r--test/test-pages/lemonde-2/expected-metadata.json3
-rw-r--r--test/test-pages/liberation-1/expected-metadata.json3
-rw-r--r--test/test-pages/lifehacker-post-comment-load/expected-metadata.json3
-rw-r--r--test/test-pages/lifehacker-working/expected-metadata.json3
-rw-r--r--test/test-pages/links-in-tables/expected-metadata.json3
-rw-r--r--test/test-pages/lwn-1/expected-metadata.json4
-rw-r--r--test/test-pages/medium-1/expected-metadata.json3
-rw-r--r--test/test-pages/medium-2/expected-metadata.json3
-rw-r--r--test/test-pages/missing-paragraphs/expected-metadata.json4
-rw-r--r--test/test-pages/msn/expected-metadata.json3
-rw-r--r--test/test-pages/remove-extra-brs/expected-metadata.json4
-rw-r--r--test/test-pages/remove-extra-paragraphs/expected-metadata.json4
-rw-r--r--test/test-pages/remove-script-tags/expected-metadata.json4
-rw-r--r--test/test-pages/reordering-paragraphs/expected-metadata.json6
-rw-r--r--test/test-pages/replace-brs/expected-metadata.json4
-rw-r--r--test/test-pages/replace-font-tags/expected-metadata.json4
-rw-r--r--test/test-pages/rtl-1/expected-metadata.json3
-rw-r--r--test/test-pages/rtl-2/expected-metadata.json3
-rw-r--r--test/test-pages/rtl-3/expected-metadata.json3
-rw-r--r--test/test-pages/rtl-4/expected-metadata.json3
-rw-r--r--test/test-pages/salon-1/expected-metadata.json3
-rw-r--r--test/test-pages/simplyfound-1/expected-metadata.json3
-rw-r--r--test/test-pages/social-buttons/expected-metadata.json4
-rw-r--r--test/test-pages/style-tags-removal/expected-metadata.json4
-rw-r--r--test/test-pages/svg-parsing/expected-metadata.json4
-rw-r--r--test/test-pages/table-style-attributes/expected-metadata.json3
-rw-r--r--test/test-pages/telegraph/expected-metadata.json4
-rw-r--r--test/test-pages/title-and-h1-discrepancy/expected-metadata.json5
-rw-r--r--test/test-pages/tmz-1/expected-metadata.json3
-rw-r--r--test/test-pages/wapo-1/expected-metadata.json3
-rw-r--r--test/test-pages/wapo-2/expected-metadata.json3
-rw-r--r--test/test-pages/webmd-1/expected-metadata.json3
-rw-r--r--test/test-pages/webmd-2/expected-metadata.json3
-rw-r--r--test/test-pages/wikipedia/expected-metadata.json3
-rw-r--r--test/test-pages/yahoo-2/expected-metadata.json3
-rw-r--r--test/test-pages/yahoo-3/expected-metadata.json3
-rw-r--r--test/test-pages/youth/expected-metadata.json3
72 files changed, 186 insertions, 73 deletions
diff --git a/test/test-pages/001/expected-metadata.json b/test/test-pages/001/expected-metadata.json
index f11c7b4..7913001 100644
--- a/test/test-pages/001/expected-metadata.json
+++ b/test/test-pages/001/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Get your Frontend JavaScript Code Covered | Code",
"Author": "Nicolas Perriault —",
- "Excerpt": "Nicolas Perriault's homepage."
+ "Excerpt": "Nicolas Perriault's homepage.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/002/expected-metadata.json b/test/test-pages/002/expected-metadata.json
index a9fb9d3..6777d36 100644
--- a/test/test-pages/002/expected-metadata.json
+++ b/test/test-pages/002/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "This API is so Fetching!",
"Author": "Nikhil Marathe",
- "Excerpt": "For more than a decade the Web has used XMLHttpRequest (XHR) to achieve asynchronous requests in JavaScript. While very useful, XHR is not a very ..."
+ "Excerpt": "For more than a decade the Web has used XMLHttpRequest (XHR) to achieve asynchronous requests in JavaScript. While very useful, XHR is not a very ...",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/003-metadata-preferred/expected-metadata.json b/test/test-pages/003-metadata-preferred/expected-metadata.json
index b81f0a6..557881c 100644
--- a/test/test-pages/003-metadata-preferred/expected-metadata.json
+++ b/test/test-pages/003-metadata-preferred/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Dublin Core property title",
"Author": "Dublin Core property author",
- "Excerpt": "Dublin Core property description"
+ "Excerpt": "Dublin Core property description",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/004-metadata-space-separated-properties/expected-metadata.json b/test/test-pages/004-metadata-space-separated-properties/expected-metadata.json
index 5f7fda2..4007b7b 100644
--- a/test/test-pages/004-metadata-space-separated-properties/expected-metadata.json
+++ b/test/test-pages/004-metadata-space-separated-properties/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Preferred title",
"Author": "Creator Name",
- "Excerpt": "Preferred description"
+ "Excerpt": "Preferred description",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/aclu/expected-metadata.json b/test/test-pages/aclu/expected-metadata.json
index 82fefd5..87432d3 100644
--- a/test/test-pages/aclu/expected-metadata.json
+++ b/test/test-pages/aclu/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Facebook Is Tracking Me Even Though I’m Not on Facebook",
"Author": "By Daniel Kahn Gillmor, Senior Staff Technologist, ACLU Speech, Privacy, and Technology Project",
"Excerpt": "I don't use Facebook. I'm not technophobic — I'm a geek. I've been using email since the early 1990s, I have accounts on hundreds of services around the net, and I do software development and internet protocol design both for work and for fun. I believe that a globe-spanning communications network like the internet can be a positive social force, and I publish much of my own work on the open web.",
- "Image": "https:\/\/www.aclu.org\/sites\/default\/files\/styles\/metatag_og_image_1200x630\/public\/field_share_image\/web18-facebook-socialshare-1200x628-v02.png?itok=p77cQjOm"
+ "Image": "https:\/\/www.aclu.org\/sites\/default\/files\/styles\/metatag_og_image_1200x630\/public\/field_share_image\/web18-facebook-socialshare-1200x628-v02.png?itok=p77cQjOm",
+ "Direction": "ltr"
} \ No newline at end of file
diff --git a/test/test-pages/ars-1/expected-metadata.json b/test/test-pages/ars-1/expected-metadata.json
index 5909f3e..7b57849 100644
--- a/test/test-pages/ars-1/expected-metadata.json
+++ b/test/test-pages/ars-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Just-released Minecraft exploit makes it easy to crash game servers",
"Author": "by Dan Goodin - Apr 16, 2015 8:02 pm UTC",
"Excerpt": "Two-year-old bug exposes thousands of servers to crippling attack.",
- "Image": "http:\/\/cdn.arstechnica.net\/wp-content\/uploads\/2015\/04\/server-crash-640x426.jpg"
+ "Image": "http:\/\/cdn.arstechnica.net\/wp-content\/uploads\/2015\/04\/server-crash-640x426.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/base-url-base-element-relative/expected-metadata.json b/test/test-pages/base-url-base-element-relative/expected-metadata.json
index 7e3b35a..1a489a7 100644
--- a/test/test-pages/base-url-base-element-relative/expected-metadata.json
+++ b/test/test-pages/base-url-base-element-relative/expected-metadata.json
@@ -1,4 +1,7 @@
{
"Title": "Base URL with base relative test",
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum.",
+ "Author": null,
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/base-url-base-element/expected-metadata.json b/test/test-pages/base-url-base-element/expected-metadata.json
index 3545f80..1eb382f 100644
--- a/test/test-pages/base-url-base-element/expected-metadata.json
+++ b/test/test-pages/base-url-base-element/expected-metadata.json
@@ -1,4 +1,7 @@
{
"Title": "Base URL with base test",
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum.",
+ "Author": null,
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/base-url/expected-metadata.json b/test/test-pages/base-url/expected-metadata.json
index 1c8014d..f73949e 100644
--- a/test/test-pages/base-url/expected-metadata.json
+++ b/test/test-pages/base-url/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Base URL test",
"Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/basic-tags-cleaning/expected-metadata.json b/test/test-pages/basic-tags-cleaning/expected-metadata.json
index 1382512..bcce076 100644
--- a/test/test-pages/basic-tags-cleaning/expected-metadata.json
+++ b/test/test-pages/basic-tags-cleaning/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Basic tag cleaning test",
"Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/bbc-1/expected-metadata.json b/test/test-pages/bbc-1/expected-metadata.json
index fb1ad45..82698bd 100644
--- a/test/test-pages/bbc-1/expected-metadata.json
+++ b/test/test-pages/bbc-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Obama admits US gun laws are his 'biggest frustration' - BBC News",
"Author": null,
"Excerpt": "President Barack Obama tells the BBC his failure to pass \"common sense gun safety laws\" is the greatest frustration of his presidency.",
- "Image": "http:\/\/ichef.bbci.co.uk\/news\/1024\/cpsprodpb\/3D8B\/production\/_84455751_84455749.jpg"
+ "Image": "http:\/\/ichef.bbci.co.uk\/news\/1024\/cpsprodpb\/3D8B\/production\/_84455751_84455749.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/blogger/expected-metadata.json b/test/test-pages/blogger/expected-metadata.json
index eef4912..1de8a0c 100644
--- a/test/test-pages/blogger/expected-metadata.json
+++ b/test/test-pages/blogger/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Open Verilog flow for Silego GreenPak4 programmable logic devices",
"Author": null,
"Excerpt": "I've written a couple of posts in the past few months but they were all for the blog at work so I figured I'm long overdue for one on Silic...",
- "Image": "https:\/\/1.bp.blogspot.com\/-YIPC5jkXkDE\/Vy7YPSqFKWI\/AAAAAAAAAxI\/a7D6Ji2GxoUvcrwUkI4RLZcr2LFQEJCTACLcB\/w1200-h630-p-nu\/block-diagram.png"
+ "Image": "https:\/\/1.bp.blogspot.com\/-YIPC5jkXkDE\/Vy7YPSqFKWI\/AAAAAAAAAxI\/a7D6Ji2GxoUvcrwUkI4RLZcr2LFQEJCTACLcB\/w1200-h630-p-nu\/block-diagram.png",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/buzzfeed-1/expected-metadata.json b/test/test-pages/buzzfeed-1/expected-metadata.json
index c269f76..1966ef9 100644
--- a/test/test-pages/buzzfeed-1/expected-metadata.json
+++ b/test/test-pages/buzzfeed-1/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Student Dies After Diet Pills She Bought Online \"Burned Her Up From Within\"",
"Excerpt": "An inquest into Eloise Parry's death has been adjourned until July.",
- "Image": "http:\/\/fakehost\/test\/412"
+ "Image": "http:\/\/fakehost\/test\/412",
+ "Author": null,
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/challenges/expected-metadata.json b/test/test-pages/challenges/expected-metadata.json
index 80e7aee..e5e7f10 100644
--- a/test/test-pages/challenges/expected-metadata.json
+++ b/test/test-pages/challenges/expected-metadata.json
@@ -1,4 +1,7 @@
{
"Title": "Les motivations du tueur de Las Vegas demeurent floues",
- "Image": "http:\/\/fakehost\/img\/cha\/placeholders\/placeholder_1000x750.jpg"
+ "Image": "http:\/\/fakehost\/img\/cha\/placeholders\/placeholder_1000x750.jpg",
+ "Author": null,
+ "Direction": null,
+ "Excerpt": "par Alexandria Sage et Lisa Girion"
} \ No newline at end of file
diff --git a/test/test-pages/clean-links/expected-metadata.json b/test/test-pages/clean-links/expected-metadata.json
index cc7923f..9fd9722 100644
--- a/test/test-pages/clean-links/expected-metadata.json
+++ b/test/test-pages/clean-links/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Bartleby the Scrivener Web Study Text",
"Author": null,
- "Excerpt": "Ere introducing the scrivener, as he first appeared to me, it is fit \n I make some mention of myself, my employees, my business, my chambers, \n and general surroundings; because some such description is indispensable \n to an adequate understanding of the chief character about to be presented."
+ "Excerpt": "Ere introducing the scrivener, as he first appeared to me, it is fit \n I make some mention of myself, my employees, my business, my chambers, \n and general surroundings; because some such description is indispensable \n to an adequate understanding of the chief character about to be presented.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/cnet-svg-classes/expected-metadata.json b/test/test-pages/cnet-svg-classes/expected-metadata.json
index f6f4d46..a6ca13d 100644
--- a/test/test-pages/cnet-svg-classes/expected-metadata.json
+++ b/test/test-pages/cnet-svg-classes/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Twitter Lite se estrena en México, Venezuela y otros nueve países",
"Excerpt": "Twitter Lite llega a 11 países de América Latina, para ayudar a los usuarios con mala señal de sus redes móviles.",
- "Image": "https:\/\/cdn1.cnet.com\/img\/JumVcu1ZSLtPP8ui0UWaSlgi5RU=\/670x503\/2017\/12\/01\/b36ce794-e0b8-495c-a198-184923a8f4e9\/twitter-lite.jpg"
+ "Image": "https:\/\/cdn1.cnet.com\/img\/JumVcu1ZSLtPP8ui0UWaSlgi5RU=\/670x503\/2017\/12\/01\/b36ce794-e0b8-495c-a198-184923a8f4e9\/twitter-lite.jpg",
+ "Author": null,
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/comment-inside-script-parsing/expected-metadata.json b/test/test-pages/comment-inside-script-parsing/expected-metadata.json
index f4e5750..65dd54e 100644
--- a/test/test-pages/comment-inside-script-parsing/expected-metadata.json
+++ b/test/test-pages/comment-inside-script-parsing/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Test script parsing",
"Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/daringfireball-1/expected-metadata.json b/test/test-pages/daringfireball-1/expected-metadata.json
index b9969de..e7c3e77 100644
--- a/test/test-pages/daringfireball-1/expected-metadata.json
+++ b/test/test-pages/daringfireball-1/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Daring Fireball: Colophon",
"Author": null,
- "Excerpt": "Daring Fireball is written and produced by John Gruber."
+ "Excerpt": "Daring Fireball is written and produced by John Gruber.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/different-sources-for-images/expected-metadata.json b/test/test-pages/different-sources-for-images/expected-metadata.json
index 7bfc756..e90c53b 100644
--- a/test/test-pages/different-sources-for-images/expected-metadata.json
+++ b/test/test-pages/different-sources-for-images/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Image sources test",
"Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/ehow-1/expected-metadata.json b/test/test-pages/ehow-1/expected-metadata.json
index f19b038..faac669 100644
--- a/test/test-pages/ehow-1/expected-metadata.json
+++ b/test/test-pages/ehow-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "How to Build a Terrarium | eHow",
"Author": "Lucy Akins",
"Excerpt": "Glass cloche terrariums are not only appealing to the eye, but they also preserve a bit of nature in your home and serve as a simple, yet beautiful, piece of art. Closed terrariums are easy to care for, as they retain much of their own moisture and provide a warm environment with a consistent level of humidity. You won’t have to water the...",
- "Image": "http:\/\/img-aws.ehowcdn.com\/200x200\/cme\/photography.prod.demandstudios.com\/16149374-814f-40bc-baf3-ca20f149f0ba.jpg"
+ "Image": "http:\/\/img-aws.ehowcdn.com\/200x200\/cme\/photography.prod.demandstudios.com\/16149374-814f-40bc-baf3-ca20f149f0ba.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/ehow-2/expected-metadata.json b/test/test-pages/ehow-2/expected-metadata.json
index 43eff45..e563673 100644
--- a/test/test-pages/ehow-2/expected-metadata.json
+++ b/test/test-pages/ehow-2/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "How to Throw a Graduation Party on a Budget | eHow",
"Author": "Gina Roberts-Grey",
"Excerpt": "Graduation parties are a great way to commemorate the years of hard work teens and college co-eds devote to education. They’re also costly for mom and dad.The average cost of a graduation party in 2013 was a whopping $1,200, according to Graduationparty.com; $700 of that was allocated for food. However that budget was based on Midwestern...",
- "Image": "http:\/\/img-aws.ehowcdn.com\/200x200\/cme\/cme_public_images\/www_ehow_com\/cdn-write.demandstudios.com\/upload\/image\/2F\/86\/5547EF62-EAF5-4256-945D-0496F61C862F\/5547EF62-EAF5-4256-945D-0496F61C862F.jpg"
+ "Image": "http:\/\/img-aws.ehowcdn.com\/200x200\/cme\/cme_public_images\/www_ehow_com\/cdn-write.demandstudios.com\/upload\/image\/2F\/86\/5547EF62-EAF5-4256-945D-0496F61C862F\/5547EF62-EAF5-4256-945D-0496F61C862F.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/embedded-videos/expected-metadata.json b/test/test-pages/embedded-videos/expected-metadata.json
index e22af78..8473f13 100644
--- a/test/test-pages/embedded-videos/expected-metadata.json
+++ b/test/test-pages/embedded-videos/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Embedded videos test",
"Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/engadget/expected-metadata.json b/test/test-pages/engadget/expected-metadata.json
index d00b669..0eb0040 100644
--- a/test/test-pages/engadget/expected-metadata.json
+++ b/test/test-pages/engadget/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Xbox One X review: A console that keeps up with gaming PCs",
"Excerpt": "The Xbox One X is the most powerful gaming console ever, but it's not for everyone yet.",
- "Image": "http:\/\/fakehost\/test\/630"
+ "Image": "http:\/\/fakehost\/test\/630",
+ "Author": null,
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/fortressofsolitude/expected-metadata.json b/test/test-pages/fortressofsolitude/expected-metadata.json
index 54d1b36..17c133e 100644
--- a/test/test-pages/fortressofsolitude/expected-metadata.json
+++ b/test/test-pages/fortressofsolitude/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Céline Dion Belches Her Way Onto Deadpool 2's Soundtrack",
"Author": "Written by Edward Wallace",
"Excerpt": "Just when you think the marketing behind the film couldn't get any more amazing, they go and release a music video from the Deadpool 2 soundtrack starring Canadian singer Céline Dion.",
- "Image": "http:\/\/fakehost\/test\/Céline Dion Belches Her Way Onto Deadpool 2's Soundtrack"
+ "Image": "http:\/\/fakehost\/test\/Céline Dion Belches Her Way Onto Deadpool 2's Soundtrack",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/gmw/expected-metadata.json b/test/test-pages/gmw/expected-metadata.json
index cba8ceb..eb5f7f8 100644
--- a/test/test-pages/gmw/expected-metadata.json
+++ b/test/test-pages/gmw/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "宇航员在太空中喝酒会怎么样?后果很严重 _探索者 _光明网",
"Author": "肖春芳",
"Direction": null,
- "Excerpt": "不幸的是,对于希望能喝上一杯的太空探险者,那些将他们送上太空的政府机构普遍禁止他们染指包括酒在内的含酒精饮料。"
+ "Excerpt": "不幸的是,对于希望能喝上一杯的太空探险者,那些将他们送上太空的政府机构普遍禁止他们染指包括酒在内的含酒精饮料。",
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/heise/expected-metadata.json b/test/test-pages/heise/expected-metadata.json
index ffad06a..9044ea1 100644
--- a/test/test-pages/heise/expected-metadata.json
+++ b/test/test-pages/heise/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "1Password für Mac generiert Einmal-Passwörter",
"Author": "Mac & i",
"Excerpt": "Das in der iOS-Version bereits enthaltene TOTP-Feature ist nun auch für OS X 10.10 verfügbar. Zudem gibt es neue Zusatzfelder in der Datenbank und weitere Verbesserungen.",
- "Image": "http:\/\/www.heise.de\/imgs\/18\/1\/4\/6\/2\/3\/5\/1\/Barcode-Scanner-With-Border-f0c62350bd8d9d96.jpeg"
+ "Image": "http:\/\/www.heise.de\/imgs\/18\/1\/4\/6\/2\/3\/5\/1\/Barcode-Scanner-With-Border-f0c62350bd8d9d96.jpeg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/herald-sun-1/expected-metadata.json b/test/test-pages/herald-sun-1/expected-metadata.json
index 1f84910..47ae6e9 100644
--- a/test/test-pages/herald-sun-1/expected-metadata.json
+++ b/test/test-pages/herald-sun-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Angry media won’t buckle over new surveillance laws",
"Author": "JOE HILDEBRAND",
"Excerpt": "A HIGH-powered federal government team has been doing the rounds of media organisations in the past few days in an attempt to allay concerns about the impact of new surveillance legislation on press freedom. It failed.",
- "Image": "http:\/\/api.news.com.au\/content\/1.0\/heraldsun\/images\/1227261885862?format=jpg&group=iphone&size=medium"
+ "Image": "http:\/\/api.news.com.au\/content\/1.0\/heraldsun\/images\/1227261885862?format=jpg&group=iphone&size=medium",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/hidden-nodes/expected-metadata.json b/test/test-pages/hidden-nodes/expected-metadata.json
index c243f7a..0642498 100644
--- a/test/test-pages/hidden-nodes/expected-metadata.json
+++ b/test/test-pages/hidden-nodes/expected-metadata.json
@@ -1,4 +1,7 @@
{
"Title": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt",
- "Excerpt": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit amet."
+ "Excerpt": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit amet.",
+ "Author": null,
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/hukumusume/expected-metadata.json b/test/test-pages/hukumusume/expected-metadata.json
index f2f7e76..58f4852 100644
--- a/test/test-pages/hukumusume/expected-metadata.json
+++ b/test/test-pages/hukumusume/expected-metadata.json
@@ -1,4 +1,7 @@
{
"Title": "欲張りなイヌ <福娘童話集 きょうのイソップ童話>",
- "Excerpt": "福娘童話集 > きょうのイソップ童話 > 1月のイソップ童話 > 欲張りなイヌ"
+ "Excerpt": "福娘童話集 > きょうのイソップ童話 > 1月のイソップ童話 > 欲張りなイヌ",
+ "Author": null,
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/iab-1/expected-metadata.json b/test/test-pages/iab-1/expected-metadata.json
index 0ea6fea..e804946 100644
--- a/test/test-pages/iab-1/expected-metadata.json
+++ b/test/test-pages/iab-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Getting LEAN with Digital Ad UX | IAB",
"Author": "By\n\t\t\tScott Cunningham",
"Excerpt": "We messed up. As technologists, tasked with delivering content and services to users, we lost track of the user experience. Twenty years ago we saw an explosion of websites, built by developers around the world, providing all forms of content. This was the beginning of an age of enlightenment, the intersection of content and technology. … Continued",
- "Image": "http:\/\/www.iab.com\/wp-content\/uploads\/2015\/10\/getting-lean-with-digital-ad-ux-300x250.jpg"
+ "Image": "http:\/\/www.iab.com\/wp-content\/uploads\/2015\/10\/getting-lean-with-digital-ad-ux-300x250.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/ietf-1/expected-metadata.json b/test/test-pages/ietf-1/expected-metadata.json
index 2babd23..95a5463 100644
--- a/test/test-pages/ietf-1/expected-metadata.json
+++ b/test/test-pages/ietf-1/expected-metadata.json
@@ -1,4 +1,7 @@
{
"Title": "remoteStorage",
- "Author": "Jong, Michiel de"
+ "Author": "Jong, Michiel de",
+ "Direction": null,
+ "Excerpt": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/infobae/expected-metadata.json b/test/test-pages/infobae/expected-metadata.json
index 45a0ac8..fb51b49 100644
--- a/test/test-pages/infobae/expected-metadata.json
+++ b/test/test-pages/infobae/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Una patota de varones atacó a un rugbier gay: \"Te vamos a matar por puto\"",
"Author": "Por Mauricio Luna 1 de diciembre de 2017",
"Excerpt": "Jonathan Castellari fue salvajemente golpeado en un local de comidas rápidas, mientras esperaba el desayuno junto a un amigo. Podría perder un ojo",
- "Image": "https:\/\/www.infobae.com\/new-resizer\/shi8E0F5ldd8a7vtvFaJomRURqU=\/1200x0\/filters:quality(100)\/s3.amazonaws.com\/arc-wordpress-client-uploads\/infobae-wp\/wp-content\/uploads\/2017\/12\/01154429\/Rugbier-golpeado-1920.jpg"
+ "Image": "https:\/\/www.infobae.com\/new-resizer\/shi8E0F5ldd8a7vtvFaJomRURqU=\/1200x0\/filters:quality(100)\/s3.amazonaws.com\/arc-wordpress-client-uploads\/infobae-wp\/wp-content\/uploads\/2017\/12\/01154429\/Rugbier-golpeado-1920.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/keep-images/expected-metadata.json b/test/test-pages/keep-images/expected-metadata.json
index ac3808e..04f0cf0 100644
--- a/test/test-pages/keep-images/expected-metadata.json
+++ b/test/test-pages/keep-images/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Inside the Deep Web Drug Lab",
"Author": "Joseph Cox",
"Excerpt": "Welcome to DoctorX’s Barcelona lab, where the drugs you bought online are tested for safety and purity. No questions ask…",
- "Image": "https:\/\/d262ilb51hltx0.cloudfront.net\/max\/800\/1*sLDnS1UWEFIS33uLMxq3cw.jpeg"
+ "Image": "https:\/\/d262ilb51hltx0.cloudfront.net\/max\/800\/1*sLDnS1UWEFIS33uLMxq3cw.jpeg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/la-nacion/expected-metadata.json b/test/test-pages/la-nacion/expected-metadata.json
index 2f5b6c5..1fc7b51 100644
--- a/test/test-pages/la-nacion/expected-metadata.json
+++ b/test/test-pages/la-nacion/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Una solución no violenta para la cuestión mapuche",
"Excerpt": "Los pueblos indígenas reclaman por derechos que permanecen incumplidos, por eso es más eficiente canalizar la protesta que reprimirla",
- "Image": "http:\/\/bucket.glanacion.com\/anexos\/fotos\/77\/2585177.jpg"
+ "Image": "http:\/\/bucket.glanacion.com\/anexos\/fotos\/77\/2585177.jpg",
+ "Author": null,
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/lemonde-1/expected-metadata.json b/test/test-pages/lemonde-1/expected-metadata.json
index e0d0a9c..23160f4 100644
--- a/test/test-pages/lemonde-1/expected-metadata.json
+++ b/test/test-pages/lemonde-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Le projet de loi sur le renseignement massivement approuvé à l'Assemblée",
"Author": null,
"Excerpt": "Largement approuvé par les députés, le texte sera désormais examiné par le Sénat, puis le Conseil constitutionnel.",
- "Image": "http:\/\/fakehost\/test\/image\/jpeg"
+ "Image": "http:\/\/fakehost\/test\/image\/jpeg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/lemonde-2/expected-metadata.json b/test/test-pages/lemonde-2/expected-metadata.json
index 2706a54..a2ce5b6 100644
--- a/test/test-pages/lemonde-2/expected-metadata.json
+++ b/test/test-pages/lemonde-2/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "La crise européenne est une crise de la dette, pas de l'euro",
"Author": null,
"Excerpt": "Le retour à la stabilité coûtera des milliards d'euros, mais l'Union européenne en vaut la peine, estime un collectif d'industriels.",
- "Image": "http:\/\/s1.lemde.fr\/medias\/web\/1.2.705\/img\/placeholder\/default.png"
+ "Image": "http:\/\/s1.lemde.fr\/medias\/web\/1.2.705\/img\/placeholder\/default.png",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/liberation-1/expected-metadata.json b/test/test-pages/liberation-1/expected-metadata.json
index bce9274..e1577f4 100644
--- a/test/test-pages/liberation-1/expected-metadata.json
+++ b/test/test-pages/liberation-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Un troisième Français mort dans le séisme au Népal",
"Author": "AFP",
"Excerpt": "Laurent Fabius a accueilli jeudi matin à Roissy un premier avion spécial ramenant des rescapés.",
- "Image": "http:\/\/md1.libe.com\/photo\/755923-000_hkg10175905.jpg?modified_at=1430371146&amp;width=750"
+ "Image": "http:\/\/md1.libe.com\/photo\/755923-000_hkg10175905.jpg?modified_at=1430371146&amp;width=750",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/lifehacker-post-comment-load/expected-metadata.json b/test/test-pages/lifehacker-post-comment-load/expected-metadata.json
index 368bece..c660b5e 100644
--- a/test/test-pages/lifehacker-post-comment-load/expected-metadata.json
+++ b/test/test-pages/lifehacker-post-comment-load/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "How to Program Your Mind to Stop Buying Crap You Don’t Need",
"Author": "Patrick Allan",
"Excerpt": "We all buy things from time to time that we don't really need. It's okay to appeal to your wants every once in a while, as long as you're in control. If you struggle with clutter, impulse buys, and buyer's remorse, here's how to put your mind in the right place before you even set foot in a store.",
- "Image": "http:\/\/i.kinja-img.com\/gawker-media\/image\/upload\/s--hqqO9fze--\/n1s6c2m6kc07iqdyllj6.jpg"
+ "Image": "http:\/\/i.kinja-img.com\/gawker-media\/image\/upload\/s--hqqO9fze--\/n1s6c2m6kc07iqdyllj6.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/lifehacker-working/expected-metadata.json b/test/test-pages/lifehacker-working/expected-metadata.json
index 368bece..c660b5e 100644
--- a/test/test-pages/lifehacker-working/expected-metadata.json
+++ b/test/test-pages/lifehacker-working/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "How to Program Your Mind to Stop Buying Crap You Don’t Need",
"Author": "Patrick Allan",
"Excerpt": "We all buy things from time to time that we don't really need. It's okay to appeal to your wants every once in a while, as long as you're in control. If you struggle with clutter, impulse buys, and buyer's remorse, here's how to put your mind in the right place before you even set foot in a store.",
- "Image": "http:\/\/i.kinja-img.com\/gawker-media\/image\/upload\/s--hqqO9fze--\/n1s6c2m6kc07iqdyllj6.jpg"
+ "Image": "http:\/\/i.kinja-img.com\/gawker-media\/image\/upload\/s--hqqO9fze--\/n1s6c2m6kc07iqdyllj6.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/links-in-tables/expected-metadata.json b/test/test-pages/links-in-tables/expected-metadata.json
index 3f72532..f833e26 100644
--- a/test/test-pages/links-in-tables/expected-metadata.json
+++ b/test/test-pages/links-in-tables/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Saving Data: Reducing the size of App Updates by 65%",
"Author": null,
"Excerpt": "Posted by Andrew Hayden, Software Engineer on Google Play Android users are downloading tens of billions of apps and games on Google Pla...",
- "Image": "https:\/\/2.bp.blogspot.com\/-chCZZinlUTg\/WEcxvJo9gdI\/AAAAAAAADnk\/3ND_BspqN6Y2j5xxkLFW3RyS2Ig0NHZpQCLcB\/w1200-h630-p-k-nu\/ipsum-opsum.gif"
+ "Image": "https:\/\/2.bp.blogspot.com\/-chCZZinlUTg\/WEcxvJo9gdI\/AAAAAAAADnk\/3ND_BspqN6Y2j5xxkLFW3RyS2Ig0NHZpQCLcB\/w1200-h630-p-k-nu\/ipsum-opsum.gif",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/lwn-1/expected-metadata.json b/test/test-pages/lwn-1/expected-metadata.json
index ac856e4..15778b2 100644
--- a/test/test-pages/lwn-1/expected-metadata.json
+++ b/test/test-pages/lwn-1/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "LWN.net Weekly Edition for March 26, 2015 [LWN.net]",
"Author": "By Nathan Willis\n March 25, 2015",
- "Excerpt": "The Arduino has been one of the biggest success stories of the open-hardware movement, but that success does not protect it from internal conflict. In recent months, two of the project's founders have come into conflict about the direction of future efforts—and that conflict has turned into a legal dispute about who owns the rights to the Arduino trademark."
+ "Excerpt": "The Arduino has been one of the biggest success stories of the open-hardware movement, but that success does not protect it from internal conflict. In recent months, two of the project's founders have come into conflict about the direction of future efforts—and that conflict has turned into a legal dispute about who owns the rights to the Arduino trademark.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/medium-1/expected-metadata.json b/test/test-pages/medium-1/expected-metadata.json
index ce4c1a9..85803a7 100644
--- a/test/test-pages/medium-1/expected-metadata.json
+++ b/test/test-pages/medium-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "The Open Journalism Project: Better Student Journalism",
"Author": "Pippin Lee",
"Excerpt": "We pushed out the first version of the Open Journalism site in January. Here’s what we’ve learned about student journali…",
- "Image": "https:\/\/d262ilb51hltx0.cloudfront.net\/max\/800\/1*oBWUXtszDsiv_-Qq2bFLTQ.png"
+ "Image": "https:\/\/d262ilb51hltx0.cloudfront.net\/max\/800\/1*oBWUXtszDsiv_-Qq2bFLTQ.png",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/medium-2/expected-metadata.json b/test/test-pages/medium-2/expected-metadata.json
index 1257405..1e7aa99 100644
--- a/test/test-pages/medium-2/expected-metadata.json
+++ b/test/test-pages/medium-2/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "On Behalf of “Literally”",
"Author": "Courtney Kirchoff",
"Excerpt": "In defense of the word “literally” and why you or someone you know should stop misusing the word, lest they drive us fig…",
- "Image": "https:\/\/d262ilb51hltx0.cloudfront.net\/max\/1600\/1*eR_J8DurqygbhrwDg-WPnQ.png"
+ "Image": "https:\/\/d262ilb51hltx0.cloudfront.net\/max\/1600\/1*eR_J8DurqygbhrwDg-WPnQ.png",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/missing-paragraphs/expected-metadata.json b/test/test-pages/missing-paragraphs/expected-metadata.json
index a48bc86..7014daa 100644
--- a/test/test-pages/missing-paragraphs/expected-metadata.json
+++ b/test/test-pages/missing-paragraphs/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy\n eirmod tempor invidunt",
"Author": "Henri Sivonen",
- "Excerpt": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy\n eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam\n voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet\n clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit\n amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam\n nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat,\n sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum.\n Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor\n sit amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed\n diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat,\n sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum.\n Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor\n sit amet."
+ "Excerpt": "Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam nonumy\n eirmod tempor invidunt ut labore et dolore magna aliquyam erat, sed diam\n voluptua. At vero eos et accusam et justo duo dolores et ea rebum. Stet\n clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor sit\n amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed diam\n nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat,\n sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum.\n Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor\n sit amet. Lorem ipsum dolor sit amet, consetetur sadipscing elitr, sed\n diam nonumy eirmod tempor invidunt ut labore et dolore magna aliquyam erat,\n sed diam voluptua. At vero eos et accusam et justo duo dolores et ea rebum.\n Stet clita kasd gubergren, no sea takimata sanctus est Lorem ipsum dolor\n sit amet.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/msn/expected-metadata.json b/test/test-pages/msn/expected-metadata.json
index 7b50117..5eade78 100644
--- a/test/test-pages/msn/expected-metadata.json
+++ b/test/test-pages/msn/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Nintendo's first iPhone game will launch in December for $10",
"Author": "Alex Perry\n \n 1 day ago",
"Excerpt": "Nintendo and Apple shocked the world earlier this year by announcing \"Super Mario Run,\" the legendary gaming company's first foray into mobile gaming.&nbsp;",
- "Image": "http:\/\/img-s-msn-com.akamaized.net\/tenant\/amp\/entityid\/AAkk5fh.img"
+ "Image": "http:\/\/img-s-msn-com.akamaized.net\/tenant\/amp\/entityid\/AAkk5fh.img",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/remove-extra-brs/expected-metadata.json b/test/test-pages/remove-extra-brs/expected-metadata.json
index b378339..a6286b4 100644
--- a/test/test-pages/remove-extra-brs/expected-metadata.json
+++ b/test/test-pages/remove-extra-brs/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Remove trailing brs test",
"Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/remove-extra-paragraphs/expected-metadata.json b/test/test-pages/remove-extra-paragraphs/expected-metadata.json
index fc6c06e..fe63d26 100644
--- a/test/test-pages/remove-extra-paragraphs/expected-metadata.json
+++ b/test/test-pages/remove-extra-paragraphs/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Replace font tags test",
"Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/remove-script-tags/expected-metadata.json b/test/test-pages/remove-script-tags/expected-metadata.json
index c0567d8..7e430dd 100644
--- a/test/test-pages/remove-script-tags/expected-metadata.json
+++ b/test/test-pages/remove-script-tags/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Remove script tags test",
"Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/reordering-paragraphs/expected-metadata.json b/test/test-pages/reordering-paragraphs/expected-metadata.json
index 27f5eaf..c9764b9 100644
--- a/test/test-pages/reordering-paragraphs/expected-metadata.json
+++ b/test/test-pages/reordering-paragraphs/expected-metadata.json
@@ -1,5 +1,7 @@
{
- "Title": "",
+ "Title": null,
"Author": null,
- "Excerpt": "Regarding item# 11111, under sufficiently extreme conditions, quarks may\n become deconfined and exist as free particles. In the course of asymptotic\n freedom, the strong interaction becomes weaker at higher temperatures.\n Eventually, color confinement would be lost and an extremely hot plasma\n of freely moving quarks and gluons would be formed. This theoretical phase\n of matter is called quark-gluon plasma.[81] The exact conditions needed\n to give rise to this state are unknown and have been the subject of a great\n deal of speculation and experimentation."
+ "Excerpt": "Regarding item# 11111, under sufficiently extreme conditions, quarks may\n become deconfined and exist as free particles. In the course of asymptotic\n freedom, the strong interaction becomes weaker at higher temperatures.\n Eventually, color confinement would be lost and an extremely hot plasma\n of freely moving quarks and gluons would be formed. This theoretical phase\n of matter is called quark-gluon plasma.[81] The exact conditions needed\n to give rise to this state are unknown and have been the subject of a great\n deal of speculation and experimentation.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/replace-brs/expected-metadata.json b/test/test-pages/replace-brs/expected-metadata.json
index 4a3ab99..e9adc90 100644
--- a/test/test-pages/replace-brs/expected-metadata.json
+++ b/test/test-pages/replace-brs/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Replace brs test",
"Author": null,
- "Excerpt": "Lorem ipsumdolor sit"
+ "Excerpt": "Lorem ipsumdolor sit",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/replace-font-tags/expected-metadata.json b/test/test-pages/replace-font-tags/expected-metadata.json
index 1fc0cd4..31289ff 100644
--- a/test/test-pages/replace-font-tags/expected-metadata.json
+++ b/test/test-pages/replace-font-tags/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Replace font tags test",
"Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/rtl-1/expected-metadata.json b/test/test-pages/rtl-1/expected-metadata.json
index d26d69a..afead27 100644
--- a/test/test-pages/rtl-1/expected-metadata.json
+++ b/test/test-pages/rtl-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "RTL Test",
"Author": null,
"Excerpt": "Lorem ipsum dolor sit amet.",
- "Direction": "rtl"
+ "Direction": "rtl",
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/rtl-2/expected-metadata.json b/test/test-pages/rtl-2/expected-metadata.json
index d26d69a..afead27 100644
--- a/test/test-pages/rtl-2/expected-metadata.json
+++ b/test/test-pages/rtl-2/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "RTL Test",
"Author": null,
"Excerpt": "Lorem ipsum dolor sit amet.",
- "Direction": "rtl"
+ "Direction": "rtl",
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/rtl-3/expected-metadata.json b/test/test-pages/rtl-3/expected-metadata.json
index d26d69a..afead27 100644
--- a/test/test-pages/rtl-3/expected-metadata.json
+++ b/test/test-pages/rtl-3/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "RTL Test",
"Author": null,
"Excerpt": "Lorem ipsum dolor sit amet.",
- "Direction": "rtl"
+ "Direction": "rtl",
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/rtl-4/expected-metadata.json b/test/test-pages/rtl-4/expected-metadata.json
index a9690b7..c102518 100644
--- a/test/test-pages/rtl-4/expected-metadata.json
+++ b/test/test-pages/rtl-4/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "RTL Test",
"Author": null,
"Excerpt": "Lorem ipsum dolor sit amet.",
- "Direction": null
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/salon-1/expected-metadata.json b/test/test-pages/salon-1/expected-metadata.json
index cd47b7f..502d35f 100644
--- a/test/test-pages/salon-1/expected-metadata.json
+++ b/test/test-pages/salon-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "The sharing economy is a lie: Uber, Ayn Rand and the truth about tech and libertarians",
"Author": "Joanna Rothkopf",
"Excerpt": "Disruptive companies talk a good game about sharing. Uber's really just an under-regulated company making riches",
- "Image": "http:\/\/media.salon.com\/2014\/12\/uber_rand_paul.jpg"
+ "Image": "http:\/\/media.salon.com\/2014\/12\/uber_rand_paul.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/simplyfound-1/expected-metadata.json b/test/test-pages/simplyfound-1/expected-metadata.json
index 9c8fb6b..17aa266 100644
--- a/test/test-pages/simplyfound-1/expected-metadata.json
+++ b/test/test-pages/simplyfound-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Raspberry Pi 3 - The credit card sized PC that cost only $35 - All-time bestselling computer in UK",
"Author": null,
"Excerpt": "The Raspberry Pi Foundation started by a handful of volunteers in 2012 when they released the original Raspberry Pi 256MB Model B without knowing what to expect. In a short four-year period they have grown to over sixty full-time employees and ha...",
- "Image": "https:\/\/d34hb2g9mvfppu.cloudfront.net\/m\/images\/cache\/images\/2016\/02\/29\/apcnews2012raspberry_pi_logo_mainimage8_jpg8_322_27630a8388eb_lg.jpg"
+ "Image": "https:\/\/d34hb2g9mvfppu.cloudfront.net\/m\/images\/cache\/images\/2016\/02\/29\/apcnews2012raspberry_pi_logo_mainimage8_jpg8_322_27630a8388eb_lg.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/social-buttons/expected-metadata.json b/test/test-pages/social-buttons/expected-metadata.json
index 545b72f..d7c828f 100644
--- a/test/test-pages/social-buttons/expected-metadata.json
+++ b/test/test-pages/social-buttons/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Share buttons removal test",
"Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/style-tags-removal/expected-metadata.json b/test/test-pages/style-tags-removal/expected-metadata.json
index 44f6efe..dc267d4 100644
--- a/test/test-pages/style-tags-removal/expected-metadata.json
+++ b/test/test-pages/style-tags-removal/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Style tags removal",
"Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/svg-parsing/expected-metadata.json b/test/test-pages/svg-parsing/expected-metadata.json
index be5e333..e983b2f 100644
--- a/test/test-pages/svg-parsing/expected-metadata.json
+++ b/test/test-pages/svg-parsing/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "SVG parsing",
"Author": null,
- "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\ntempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\nquis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\nconsequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\ncillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\nproident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+ "Excerpt": "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\ntempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\nquis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\nconsequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\ncillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\nproident, sunt in culpa qui officia deserunt mollit anim id est laborum.",
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/table-style-attributes/expected-metadata.json b/test/test-pages/table-style-attributes/expected-metadata.json
index f677d3e..08157c1 100644
--- a/test/test-pages/table-style-attributes/expected-metadata.json
+++ b/test/test-pages/table-style-attributes/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "linux video",
"Author": null,
"Direction": null,
- "Excerpt": "linux usability\n ...or, why do I bother. © 2002, 2003\n Jamie Zawinski"
+ "Excerpt": "linux usability\n ...or, why do I bother. © 2002, 2003\n Jamie Zawinski",
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/telegraph/expected-metadata.json b/test/test-pages/telegraph/expected-metadata.json
index 94a330d..8de1040 100644
--- a/test/test-pages/telegraph/expected-metadata.json
+++ b/test/test-pages/telegraph/expected-metadata.json
@@ -1,5 +1,7 @@
{
"Title": "Zimbabwe coup: Robert Mugabe and wife Grace 'insisting he finishes his term', as priest steps in to mediate",
"Excerpt": "Zimbabwe President Robert Mugabe, his wife Grace and two key figures from her G40 political faction are under house arrest at Mugabe's &quot;Blue House&quot; compound in Harare and are insisting the 93 year-old finishes his presidential term, a source said.",
- "Image": "http:\/\/www.telegraph.co.uk\/content\/dam\/news\/2017\/11\/16\/TELEMMGLPICT000146889449-xlarge_trans_NvBQzQNjv4BqySoB6nTCgtc7U4LQ_FPO4hKi2sT3vi7ux2-RDZwC4QA.jpeg"
+ "Image": "http:\/\/www.telegraph.co.uk\/content\/dam\/news\/2017\/11\/16\/TELEMMGLPICT000146889449-xlarge_trans_NvBQzQNjv4BqySoB6nTCgtc7U4LQ_FPO4hKi2sT3vi7ux2-RDZwC4QA.jpeg",
+ "Author": "Our Foreign Staff \n \n\n16 November 2017 • 2:15pm",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/title-and-h1-discrepancy/expected-metadata.json b/test/test-pages/title-and-h1-discrepancy/expected-metadata.json
index 5d2f573..fb02536 100644
--- a/test/test-pages/title-and-h1-discrepancy/expected-metadata.json
+++ b/test/test-pages/title-and-h1-discrepancy/expected-metadata.json
@@ -1,4 +1,7 @@
{
"Title": "This is a long title with a colon: Hello there",
- "Excerpt": "Lorem\n ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum."
+ "Excerpt": "Lorem\n ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod\n incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam,\n quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo\n consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse\n cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non\n proident, sunt in culpa qui officia deserunt mollit anim id est laborum.",
+ "Author": null,
+ "Direction": null,
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/tmz-1/expected-metadata.json b/test/test-pages/tmz-1/expected-metadata.json
index 684127f..364beed 100644
--- a/test/test-pages/tmz-1/expected-metadata.json
+++ b/test/test-pages/tmz-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Lupita Nyong'o's $150K Pearl Oscar Dress -- STOLEN!!!",
"Author": null,
"Excerpt": "Lupita Nyong'o's now-famous Oscar dress -- adorned in pearls -- was stolen right out of her hotel room ... TMZ has learned. Law enforcement sources tell…",
- "Image": "http:\/\/ll-media.tmz.com\/2015\/02\/26\/0225-lupita-nyongo-getty-01-1200x630.jpg"
+ "Image": "http:\/\/ll-media.tmz.com\/2015\/02\/26\/0225-lupita-nyongo-getty-01-1200x630.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/wapo-1/expected-metadata.json b/test/test-pages/wapo-1/expected-metadata.json
index 401a73a..5a89ef0 100644
--- a/test/test-pages/wapo-1/expected-metadata.json
+++ b/test/test-pages/wapo-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Attack stokes instability fears in North Africa",
"Author": "By Erin Cunningham",
"Excerpt": "The assault on Tunisia’s most renowned museum, in which gunmen killed at least 19 people, could heighten tensions in a nation that has become deeply divided between pro- and anti-Islamist factions.",
- "Image": "http:\/\/img.washingtonpost.com\/rw\/2010-2019\/WashingtonPost\/2015\/03\/18\/Foreign\/Images\/Nic6429927.jpg"
+ "Image": "http:\/\/img.washingtonpost.com\/rw\/2010-2019\/WashingtonPost\/2015\/03\/18\/Foreign\/Images\/Nic6429927.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/wapo-2/expected-metadata.json b/test/test-pages/wapo-2/expected-metadata.json
index 7a9493e..3bd32ec 100644
--- a/test/test-pages/wapo-2/expected-metadata.json
+++ b/test/test-pages/wapo-2/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Where do strained U.S.-Israeli relations go after Netanyahu’s victory?",
"Author": "By Steven Mufson",
"Excerpt": "Few foreign leaders have so brazenly stood up to President Obama and the relationship could face its next test this month.",
- "Image": "http:\/\/img.washingtonpost.com\/rw\/2010-2019\/WashingtonPost\/2015\/03\/18\/National-Economy\/Images\/Nic6429750-1138.jpg"
+ "Image": "http:\/\/img.washingtonpost.com\/rw\/2010-2019\/WashingtonPost\/2015\/03\/18\/National-Economy\/Images\/Nic6429750-1138.jpg",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/webmd-1/expected-metadata.json b/test/test-pages/webmd-1/expected-metadata.json
index 76d3dbc..3afd752 100644
--- a/test/test-pages/webmd-1/expected-metadata.json
+++ b/test/test-pages/webmd-1/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Babies Who Eat Peanuts Early May Avoid Allergy",
"Author": "By Brenda Goodman, MA\n WebMD Health News",
"Excerpt": "Life-threatening peanut allergies have mysteriously been on the rise in the past decade, with little hope for a cure. But a groundbreaking new study may offer a way to stem that rise, while another may offer some hope for those who are already allergic.",
- "Image": "http:\/\/img.webmd.com\/dtmcms\/live\/webmd\/consumer_assets\/site_images\/miscellaneous\/webmd_FB_logo_bluebkgrd.jpg?v=1"
+ "Image": "http:\/\/img.webmd.com\/dtmcms\/live\/webmd\/consumer_assets\/site_images\/miscellaneous\/webmd_FB_logo_bluebkgrd.jpg?v=1",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/webmd-2/expected-metadata.json b/test/test-pages/webmd-2/expected-metadata.json
index dc0d878..b037ba1 100644
--- a/test/test-pages/webmd-2/expected-metadata.json
+++ b/test/test-pages/webmd-2/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Superbugs: What They Are and How You Get Them",
"Author": "By Kelli Miller\n WebMD Health News",
"Excerpt": "Drug-resistant bacteria, dubbed",
- "Image": "http:\/\/img.webmd.com\/dtmcms\/live\/webmd\/consumer_assets\/site_images\/miscellaneous\/webmd_FB_logo_bluebkgrd.jpg?v=1"
+ "Image": "http:\/\/img.webmd.com\/dtmcms\/live\/webmd\/consumer_assets\/site_images\/miscellaneous\/webmd_FB_logo_bluebkgrd.jpg?v=1",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/wikipedia/expected-metadata.json b/test/test-pages/wikipedia/expected-metadata.json
index 8f22810..8ee82cf 100644
--- a/test/test-pages/wikipedia/expected-metadata.json
+++ b/test/test-pages/wikipedia/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Mozilla - Wikipedia",
"Author": null,
"Direction": "ltr",
- "Excerpt": "Mozilla is a free-software community, created in 1998 by members of Netscape. The Mozilla community uses, develops, spreads and supports Mozilla products, thereby promoting exclusively free software and open standards, with only minor exceptions.[1] The community is supported institutionally by the Mozilla Foundation and its tax-paying subsidiary, the Mozilla Corporation.[2]"
+ "Excerpt": "Mozilla is a free-software community, created in 1998 by members of Netscape. The Mozilla community uses, develops, spreads and supports Mozilla products, thereby promoting exclusively free software and open standards, with only minor exceptions.[1] The community is supported institutionally by the Mozilla Foundation and its tax-paying subsidiary, the Mozilla Corporation.[2]",
+ "Image": null
} \ No newline at end of file
diff --git a/test/test-pages/yahoo-2/expected-metadata.json b/test/test-pages/yahoo-2/expected-metadata.json
index 98e35c4..e593271 100644
--- a/test/test-pages/yahoo-2/expected-metadata.json
+++ b/test/test-pages/yahoo-2/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Yahoo News - Latest News & Headlines",
"Author": "NATALIYA VASILYEVA",
"Excerpt": "The latest news and headlines from Yahoo! News. Get breaking news stories and in-depth coverage with videos and photos.",
- "Image": "https:\/\/s.yimg.com\/os\/mit\/media\/m\/social\/images\/social_default_logo-1481777.png"
+ "Image": "https:\/\/s.yimg.com\/os\/mit\/media\/m\/social\/images\/social_default_logo-1481777.png",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/yahoo-3/expected-metadata.json b/test/test-pages/yahoo-3/expected-metadata.json
index adce0d3..a3ad573 100644
--- a/test/test-pages/yahoo-3/expected-metadata.json
+++ b/test/test-pages/yahoo-3/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "Veteran Wraps Baby in American Flag, Photo Sparks Controversy",
"Excerpt": "A photographer and Navy veteran is fighting back after a photo she posted to Facebook started an online backlash. Vanessa Hicks said she had no idea her photo would be considered controversial. The photo, from a military family’s newborn photo shoot, showed a newborn infant wrapped in an American flag held by his father, who was in his military uniform. Hicks, a Navy veteran herself and the wife of an active-duty Navy member, said her intention was to honor the flag as well as her clients, who wanted to incorporate their military service in the photo shoot.",
"Author": "By GILLIAN MOHNEY\n March 11, 2015 3:46 PM",
- "Image": "https:\/\/s.yimg.com\/bt\/api\/res\/1.2\/qZaM9MLUOrxLg4IfXt_Niw--\/YXBwaWQ9eW5ld3NfbGVnbztxPTc1O3c9NjAw\/http:\/\/media.zenfs.com\/en-US\/video\/video.abcnewsplus.com\/559ecdbafdb839129816b5c79a996975.cf.png"
+ "Image": "https:\/\/s.yimg.com\/bt\/api\/res\/1.2\/qZaM9MLUOrxLg4IfXt_Niw--\/YXBwaWQ9eW5ld3NfbGVnbztxPTc1O3c9NjAw\/http:\/\/media.zenfs.com\/en-US\/video\/video.abcnewsplus.com\/559ecdbafdb839129816b5c79a996975.cf.png",
+ "Direction": null
} \ No newline at end of file
diff --git a/test/test-pages/youth/expected-metadata.json b/test/test-pages/youth/expected-metadata.json
index 666b15d..4608fd7 100644
--- a/test/test-pages/youth/expected-metadata.json
+++ b/test/test-pages/youth/expected-metadata.json
@@ -2,5 +2,6 @@
"Title": "海外留学生看两会:出国前后关注点大不同_教育频道_中国青年网",
"Author": "青网校园崔宁宁",
"Direction": null,
- "Excerpt": "图为马素湘在澳大利亚悉尼游玩时的近影。出国前后关注点大不同出国前:政治科目会出啥考题?出国后:国家未来将如何发展?在采访中,我们了解到不少学子在出国前就每年守在电脑前观看两会直播。但是,随着年龄和阅历的增长,学子对两会的关注点在出国前后发生了很大的变化。在法国里昂国立应用科学院留学的卢宇表示,他还是个中学生时,就开始关注两会了。“我高中毕业后就出国留学了。"
+ "Excerpt": "图为马素湘在澳大利亚悉尼游玩时的近影。出国前后关注点大不同出国前:政治科目会出啥考题?出国后:国家未来将如何发展?在采访中,我们了解到不少学子在出国前就每年守在电脑前观看两会直播。但是,随着年龄和阅历的增长,学子对两会的关注点在出国前后发生了很大的变化。在法国里昂国立应用科学院留学的卢宇表示,他还是个中学生时,就开始关注两会了。“我高中毕业后就出国留学了。",
+ "Image": null
} \ No newline at end of file