git.immae.eu Git - github/wallabag/wallabag.git/blob - inc/3rdparty/site_config/standard/bbc.com.txt
update config from @fivefilters
[github/wallabag/wallabag.git] / inc / 3rdparty / site_config / standard / bbc.com.txt
1 body: //div[@class="story-body"]
2 # for video entries
3 body: //div[contains(@class, "videoInStory") or @id="meta-information"]
4 title: //h1[@class="story-header"]
5 date: //span[@class="story-date"]/span[@class='date']
6 # for the sport site
7 date: //meta[@name='DCTERMS.created']/@content
8 author: //div[@id='headline']//span[@class='byline-name']
9
10 # recipes, e.g. http://www.bbc.co.uk/food/recipes/mymincepies_71055
11 body: //div[contains(@class, 'hrecipe')]//div[@id='subcolumn-1']
12
13 #strip: //div[@class="story-feature narrow"]
14 #strip: //div[@class="story-feature wide"]
15 #strip: //div[@class="story-feature dslideshow-enclosure"]
16 strip: //div[contains(@class, "story-feature") and not(contains(@class, 'full-width'))]
17 strip: //span[@class="story-date"]
18 #strip: //div[@class="caption body-narrow-width"]
19 strip: //div[@class="warning"]//p
20 strip: //div[@id='page-bookmark-links-head']
21 strip: //object
22 strip: //div[contains(@class, "bbccom_advert_placeholder")]
23 strip: //div[contains(@class, "embedded-hyper")]
24 strip: //div[contains(@class, 'market-data')]
25 strip: //a[contains(@class, 'hidden')]
26 strip: //div[contains(@class, 'hypertabs')]
27 strip: //div[contains(@class, 'related')]
28 strip: //form[@id='comment-form']
29 strip: //div[contains(@class, 'comment-introduction')]
30 strip: //div[contains(@class, 'share-tools')]
31 strip: //div[@id='also-related-links']
32
33 strip_id_or_class: share-help
34 strip_id_or_class: comments_module
35
36 find_string: http://ichef.bbci.co.uk/news/200/
37 replace_string: http://ichef.bbci.co.uk/news/624/
38
39 find_string: http://ichef.bbci.co.uk/news/304/
40 replace_string: http://ichef.bbci.co.uk/news/624/
41
42 replace_string(<noscript>): <div>
43 replace_string(</noscript>): </div>
44
45 native_ad_clue: //meta[@property="og:url" and contains(@content, '/sponsored/')]
46
47 tidy: no
48 prune: no
49
50 dissolve: //h2
51
52 test_url: http://www.bbc.com/sport/0/football/28918021
53 test_contains: Cameroonian footballer Albert Ebosse has died
54
55 test_url: http://www.bbc.com/sport/0/football/23224017
56
57 test_url: http://www.bbc.com/news/business-15060862
58 test_contains: Europe's leaders are meeting again to try
59
60
61 # news feed
62 test_url: http://feeds.bbci.co.uk/news/rss.xml
63 # sports feed
64 test_url: http://feeds.bbci.co.uk/sport/0/football/rss.xml?edition=int
65 # video entry
66 test_url: http://www.bbc.com/news/world-asia-22056933