diff options
Diffstat (limited to 'inc/3rdparty/site_config/standard/theatlantic.com.txt')
-rwxr-xr-x | inc/3rdparty/site_config/standard/theatlantic.com.txt | 22 |
1 files changed, 0 insertions, 22 deletions
diff --git a/inc/3rdparty/site_config/standard/theatlantic.com.txt b/inc/3rdparty/site_config/standard/theatlantic.com.txt deleted file mode 100755 index 3fc5611b..00000000 --- a/inc/3rdparty/site_config/standard/theatlantic.com.txt +++ /dev/null | |||
@@ -1,22 +0,0 @@ | |||
1 | title: //div[contains(@class, 'articleHead')]//h1 | ||
2 | |||
3 | body: //div[@class='articleText'] | ||
4 | body: //div[@class='articleContent'] | ||
5 | body: //div[@id='article'] | ||
6 | date: //*[contains(@class, 'date')] | ||
7 | author: //div[@id='profile']//*[@class='authors']//a[1] | ||
8 | author: //*[@class='author']/span | ||
9 | prune: no | ||
10 | |||
11 | strip: //div[@class='moreOnBoxWithImages'] | ||
12 | strip: //p[contains(., 'This article available online at:')] | ||
13 | strip: //p[contains(., 'This article available online at:')]/following::* | ||
14 | strip: //div[@class='earthbox'] | ||
15 | |||
16 | single_page_link: //article//a[contains(@class, 'print')] | ||
17 | |||
18 | native_ad_clue: //meta[@property="og:url" and contains(@content, '/sponsored/')] | ||
19 | |||
20 | test_url: http://www.theatlantic.com/technology/archive/2011/04/want-to-see-how-crazy-a-bot-run-market-can-be/237773/ | ||
21 | test_url: http://www.theatlantic.com/magazine/archive/2007/11/the-autumn-of-the-multitaskers/6342/ | ||
22 | test_url: http://www.theatlantic.com/entertainment/archive/2012/04/30-rock-live-a-funny-reminder-of-why-sitcoms-arent-shot-live-anymore/256447/ \ No newline at end of file | ||