diff options
author | Nicolas Lœuillet <nicolas.loeuillet@gmail.com> | 2013-12-06 10:13:03 +0100 |
---|---|---|
committer | Nicolas Lœuillet <nicolas.loeuillet@gmail.com> | 2013-12-06 10:13:03 +0100 |
commit | ac4d114214d820b20e18518a2dbc809337e39043 (patch) | |
tree | 27886128ef949b7f8dd174b0646b5a4d99883b44 /inc/3rdparty/site_config/standard/abcnews.go.com.txt | |
parent | d5501950e2470d52f6bf5954d2179010cdee0475 (diff) | |
download | wallabag-ac4d114214d820b20e18518a2dbc809337e39043.tar.gz wallabag-ac4d114214d820b20e18518a2dbc809337e39043.tar.zst wallabag-ac4d114214d820b20e18518a2dbc809337e39043.zip |
[add] new specific configuration files
Diffstat (limited to 'inc/3rdparty/site_config/standard/abcnews.go.com.txt')
-rw-r--r-- | inc/3rdparty/site_config/standard/abcnews.go.com.txt | 27 |
1 files changed, 27 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/abcnews.go.com.txt b/inc/3rdparty/site_config/standard/abcnews.go.com.txt new file mode 100644 index 00000000..c515d3e4 --- /dev/null +++ b/inc/3rdparty/site_config/standard/abcnews.go.com.txt | |||
@@ -0,0 +1,27 @@ | |||
1 | title: //h1[@class='headline'] | ||
2 | body: //div[@id='storyText'] | ||
3 | # for video entries | ||
4 | body: //img[@id='ff-img'] | //div[@id='meta']//div[contains(@class, 'overview')] | ||
5 | author: //div[@class='byline'] | ||
6 | date: //div[@class='date'] | ||
7 | strip: //*[@id='date_partner'] | ||
8 | |||
9 | strip: //div[@class='breadcrumb'] | ||
10 | strip: //div[contains(@class,'show_tools')] | ||
11 | strip: //div[@id='sponsoredByAd'] | ||
12 | strip: //div[contains(@class,'rel_container')] | ||
13 | strip: //p[a[starts-with(@href, 'http://www.twitter.com')]] | ||
14 | strip: //p[a[starts-with(@href, 'http://www.facebook.com')]] | ||
15 | strip: //p[contains(., 'Click here to return to')] | ||
16 | #strip_id_or_class: media | ||
17 | strip_id_or_class: mediaplayer | ||
18 | |||
19 | replace_string(<link rel="image_src" href="http): <img id="ff-img" src="http | ||
20 | |||
21 | prune: no | ||
22 | |||
23 | single_page_link: concat(//li[@class='pager']//a/@href, '&singlePage=true') | ||
24 | |||
25 | test_url: http://abcnews.go.com/Politics/newt-gingrich-rocky-rollout-presidential-campaign-recover/story?id=13632744 | ||
26 | # multi-page | ||
27 | test_url: http://abcnews.go.com/Blotter/family-freed-american-hostage-somalia-seals-obama/story?id=15439544 \ No newline at end of file | ||