]> git.immae.eu Git - github/wallabag/wallabag.git/blob - inc/3rdparty/site_config/standard/washingtonpost.com.txt
update config from @fivefilters
[github/wallabag/wallabag.git] / inc / 3rdparty / site_config / standard / washingtonpost.com.txt
# Site-specific extraction rules for washingtonpost.com, written as one
# "directive: XPath-or-value" pair per line. Several directives appear more
# than once; their relative order is kept as-is because it may be significant
# (presumably alternatives are tried in order - confirm against the format docs).
1 # Seems to be redirecting to articles.washingtonpost.com for many users
2
# Article body candidates: any div whose class attribute contains
# "article_body", or the div#body nested inside div#print_facet.
3 body: //div[contains(@class, "article_body")]
4 # print view
5 body: //div[@id='print_facet']//div[@id='body']
6
# Author candidates: the DC.creator meta tag's content, a span whose class is
# exactly "pb-byline", or a rel="author" link under h3[property=dc.creator].
7 author://meta[@name='DC.creator']/@content
8 author://span[@class="pb-byline"]
9 author://h3[@property='dc.creator']//a[@rel='author']
# Title is read from the content attribute of <meta name="title">.
10 title://meta[@name='title']/@content
# Date candidates: the title attribute of a "published" span inside a "byline"
# div, the DC.date.issued meta tag, a "pb-timestamp" span, or the
# eomportal-lastUpdate meta tag.
11 date://div[contains(@class,'byline')]//span[contains(@class,'published')]/@title
12 date://meta[@name="DC.date.issued"]/@content
13 date://span[contains(@class,"pb-timestamp")]
14 date://meta[@name="eomportal-lastUpdate"]/@content
15
# Strip rules. Those using @class="..." compare the full attribute string, so
# they only match when the class list is exactly as written (same order, same
# spacing). The contains(@class,'hidden') rule is a substring match on the
# class attribute.
16 strip://div[@class="relative primary-slot padding-top img-border gallery-container photo-wrapper"]
# NOTE(review): the next rule tests @id, but "wp-column six end" contains
# spaces and reads like a class list - confirm whether @class was intended.
17 strip://div[@id="wp-column six end"]
18 strip://div[contains(@class,'hidden')]
19 strip://div[@id='article-side-rail']
20 strip://div[@class="module component todays-paper-module curved"]
21 strip://div[@class="module component live-qa curved img-border"]
22 strip://div[@class="module component newsletter-signup curved"]
23 strip://div[@class="module featured-stories component curved img-border"]
24
# Strip by id/class token rather than by XPath.
# NOTE(review): if strip_id_or_class matches substrings, "module" may already
# cover the four "module ..." class rules above - confirm before pruning either.
25 strip_id_or_class: carousel
26 strip_id_or_class: toolbar
27 strip_id_or_class: module
28
# Builds the print-view URL from the canonical link: takes the href text that
# precedes "_story.html" and appends "_print.html". XPath substring-before()
# yields an empty string when the marker is absent, so without a guard the
# result would be just "_print.html".
29 # Change gJQAwdJG4U_story.html to gJQAwdJG4U_print.html
30 single_page_link: concat(substring-before(//link[@rel="canonical"]/@href, "_story.html"), "_print.html")
# Condition: the page has a canonical link whose href contains "_story.html".
# Presumably this gates the single_page_link directly above, so keep the two
# lines adjacent and in this order - confirm against the format docs.
31 if_page_contains: //link[@rel="canonical" and contains(@href, '_story.html')]
32
# Previous variant of the rewrite, left commented out (suffix "_story_print.html").
33 # [OLD] Change gJQAwdJG4U_story.html to gJQAwdJG4U_story_print.html
34 #single_page_link: concat(substring-before(//link[@rel="canonical"]/@href, "_story.html"), "_story_print.html")
35
# Sample article URLs for exercising the rules. Each path ends in
# "_story.html"; the first also carries a "?hpid=z1" query string.
36 test_url: http://www.washingtonpost.com/world/europe/in-europe-new-fears-of-german-might/2011/10/19/gIQA3baZ7L_story.html?hpid=z1
37 test_url: http://www.washingtonpost.com/national/health-science/radical-theory-of-first-americans-places-stone-age-europeans-in-delmarva-20000-years-ago/2012/02/28/gIQA4mriiR_story.html
38 test_url: http://www.washingtonpost.com/lifestyle/magazine/the-sorry-fate-of-a-tech-pioneer-halsey-minor-and-historic-virginia-estate-carters-grove/2012/05/30/gJQAwdJG4U_story.html