X-Git-Url: https://git.immae.eu/?a=blobdiff_plain;f=inc%2F3rdparty%2Fsite_config%2Fstandard%2Ftheatlantic.com.txt;h=36864197bd88d0c57c39b89b325d11c3a6485123;hb=3bb6a8ed2ab40b17d3f3b9925664c8da38ea2570;hp=3fc5611b2c9964666b671da5cd293fb56f8600a4;hpb=7efe6a03d5431efe9e217c6129cfd93e6acb94d2;p=github%2Fwallabag%2Fwallabag.git diff --git a/inc/3rdparty/site_config/standard/theatlantic.com.txt b/inc/3rdparty/site_config/standard/theatlantic.com.txt index 3fc5611b..36864197 100755 --- a/inc/3rdparty/site_config/standard/theatlantic.com.txt +++ b/inc/3rdparty/site_config/standard/theatlantic.com.txt @@ -1,5 +1,6 @@ title: //div[contains(@class, 'articleHead')]//h1 +body: //div[@itemprop='articleBody'] body: //div[@class='articleText'] body: //div[@class='articleContent'] body: //div[@id='article'] @@ -13,10 +14,14 @@ strip: //p[contains(., 'This article available online at:')] strip: //p[contains(., 'This article available online at:')]/following::* strip: //div[@class='earthbox'] -single_page_link: //article//a[contains(@class, 'print')] +single_page_link: //div[contains(@class, 'article-tools')]//a[contains(@class, 'print')] native_ad_clue: //meta[@property="og:url" and contains(@content, '/sponsored/')] +#multi-page article +test_url: http://www.theatlantic.com/magazine/archive/2014/12/the-real-roots-of-midlife-crisis/382235/ +test_contains: The curve tends to evince itself + test_url: http://www.theatlantic.com/technology/archive/2011/04/want-to-see-how-crazy-a-bot-run-market-can-be/237773/ test_url: http://www.theatlantic.com/magazine/archive/2007/11/the-autumn-of-the-multitaskers/6342/ -test_url: http://www.theatlantic.com/entertainment/archive/2012/04/30-rock-live-a-funny-reminder-of-why-sitcoms-arent-shot-live-anymore/256447/ \ No newline at end of file +test_url: http://www.theatlantic.com/entertainment/archive/2012/04/30-rock-live-a-funny-reminder-of-why-sitcoms-arent-shot-live-anymore/256447/