aboutsummaryrefslogtreecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/washingtonpost.com.txt
diff options
context:
space:
mode:
authorNicolas Lœuillet <nicolas@loeuillet.org>2014-07-13 10:15:40 +0200
committerNicolas Lœuillet <nicolas@loeuillet.org>2014-07-13 10:15:40 +0200
commit4e067ceabd705201a16b4c92cf4b23f3b990326c (patch)
tree939f3a8e5ff3ab9ee414a57a895d3e78e1d46ce3 /inc/3rdparty/site_config/standard/washingtonpost.com.txt
parent58dbe103889148def78b0fc8744d3f94c56a1561 (diff)
downloadwallabag-4e067ceabd705201a16b4c92cf4b23f3b990326c.tar.gz
wallabag-4e067ceabd705201a16b4c92cf4b23f3b990326c.tar.zst
wallabag-4e067ceabd705201a16b4c92cf4b23f3b990326c.zip
updated specific configuration for parsing
Diffstat (limited to 'inc/3rdparty/site_config/standard/washingtonpost.com.txt')
-rwxr-xr-x[-rw-r--r--]inc/3rdparty/site_config/standard/washingtonpost.com.txt51
1 files changed, 31 insertions, 20 deletions
diff --git a/inc/3rdparty/site_config/standard/washingtonpost.com.txt b/inc/3rdparty/site_config/standard/washingtonpost.com.txt
index 2931ca5f..0aa9f1d8 100644..100755
--- a/inc/3rdparty/site_config/standard/washingtonpost.com.txt
+++ b/inc/3rdparty/site_config/standard/washingtonpost.com.txt
@@ -1,21 +1,32 @@
1body: //div[@class="article_body"] 1# Seems to be redirecting to articles.washingtonpost.com for many users
2author://meta[@name='DC.creator']/@content 2
3title://meta[@name='title']/@content 3body: //div[contains(@class, "article_body")]
4date://div[contains(@class,'byline')]//span[contains(@class,'published')]/@title 4# print view
5date://meta[@name="DC.date.issued"]/@content 5body: //div[@id='print_facet']//div[@id='body']
6strip://div[@class="relative primary-slot padding-top img-border gallery-container photo-wrapper"] 6
7strip://div[@id="wp-column six end"] 7author://meta[@name='DC.creator']/@content
8strip://div[contains(@class,'hidden')] 8title://meta[@name='title']/@content
9strip://div[@id='article-side-rail'] 9date://div[contains(@class,'byline')]//span[contains(@class,'published')]/@title
10strip://div[@class="module component todays-paper-module curved"] 10date://meta[@name="DC.date.issued"]/@content
11strip://div[@class="module component live-qa curved img-border"] 11strip://div[@class="relative primary-slot padding-top img-border gallery-container photo-wrapper"]
12strip://div[@class="module component newsletter-signup curved"] 12strip://div[@id="wp-column six end"]
13strip://div[@class="module featured-stories component curved img-border"] 13strip://div[contains(@class,'hidden')]
14 14strip://div[@id='article-side-rail']
15strip_id_or_class: carousel 15strip://div[@class="module component todays-paper-module curved"]
16strip_id_or_class: toolbar 16strip://div[@class="module component live-qa curved img-border"]
17strip_id_or_class: module 17strip://div[@class="module component newsletter-signup curved"]
18 18strip://div[@class="module featured-stories component curved img-border"]
19test_url: http://www.washingtonpost.com/world/europe/in-europe-new-fears-of-german-might/2011/10/19/gIQA3baZ7L_story.html?hpid=z1 19
20test_url: http://www.washingtonpost.com/national/health-science/radical-theory-of-first-americans-places-stone-age-europeans-in-delmarva-20000-years-ago/2012/02/28/gIQA4mriiR_story.html 20strip_id_or_class: carousel
21strip_id_or_class: toolbar
22strip_id_or_class: module
23
24# Change gJQAwdJG4U_story.html to gJQAwdJG4U_print.html
25single_page_link: concat(substring-before(//link[@rel="canonical"]/@href, "_story.html"), "_print.html")
26
27# [OLD] Change gJQAwdJG4U_story.html to gJQAwdJG4U_story_print.html
28#single_page_link: concat(substring-before(//link[@rel="canonical"]/@href, "_story.html"), "_story_print.html")
29
30test_url: http://www.washingtonpost.com/world/europe/in-europe-new-fears-of-german-might/2011/10/19/gIQA3baZ7L_story.html?hpid=z1
31test_url: http://www.washingtonpost.com/national/health-science/radical-theory-of-first-americans-places-stone-age-europeans-in-delmarva-20000-years-ago/2012/02/28/gIQA4mriiR_story.html
21test_url: http://www.washingtonpost.com/lifestyle/magazine/the-sorry-fate-of-a-tech-pioneer-halsey-minor-and-historic-virginia-estate-carters-grove/2012/05/30/gJQAwdJG4U_story.html \ No newline at end of file 32test_url: http://www.washingtonpost.com/lifestyle/magazine/the-sorry-fate-of-a-tech-pioneer-halsey-minor-and-historic-virginia-estate-carters-grove/2012/05/30/gJQAwdJG4U_story.html \ No newline at end of file