aboutsummaryrefslogtreecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/theverge.com.txt
blob: 1e1ce58f0405caecd78a30c25810cbd065681ff9 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
# Content-extraction rules for theverge.com.
# Each non-comment line is "directive: value"; values of author/date/body/strip
# are XPath expressions evaluated against the fetched page.

# Author: the link with class "author" directly inside the byline paragraph.
author: //p[contains(@class, "byline")]/a[contains(@class, "author")]

# Date: the datetime attribute of the <time pubdate> element in the publish-date span.
date: //span[contains(@class, "publish-date")]/time[@pubdate]/@datetime

# Body: prefer the entry-content div.
body: //div[contains(@class, 'entry-content')]
# Second body expression, targeting the whole <article> element; added for
# Vergecast pages, e.g. http://www.theverge.com/2013/8/22/4648566/the-vergecast-090-august-22th-2013-video
body: //article
# NOTE(review): pruning is turned off for this site; presumably because it
# removed wanted content from the matched body - confirm before changing.
prune: no
#tidy: no

# Remove page furniture that can end up inside the selected body
# (relevant mainly when the broad //article expression is the one that matched).
strip: //article/header
strip: //*[@id='sticky-menu']
strip: //aside
strip: //nav
# Images carrying the 'vox-lazy-load' class (presumably lazy-load placeholders - confirm).
strip: //img[contains(@class, 'vox-lazy-load')]
# Work around bad parsing: drop any div inside a story-image container whose
# text contains 'function(' (i.e. script source that ended up as visible text).
strip: //div[contains(@class, 'story-image')]//div[contains(., 'function(')]

# Remove elements whose id or class attribute contains any of these strings.
strip_id_or_class: gallery
strip_id_or_class: article-meta
strip_id_or_class: story-navigation
strip_id_or_class: slegend
strip_id_or_class: related-product-meta
strip_id_or_class: comments
strip_id_or_class: ui-jump-list
strip_id_or_class: pullquote
strip_id_or_class: m-ad
strip_id_or_class: social-sharing
strip_id_or_class: m-video-entry__excerpt
strip_id_or_class: hidden

# Raw-HTML substitution: turn <noscript> wrappers into plain <div>s.
replace_string(<noscript>): <div>
replace_string(</noscript>): </div>

# Raw-HTML substitution: turn every <script ...>...</script> into a hidden <div>.
# Only the opening "<script" is replaced, so the tag's original attributes follow
# the inserted style attribute. Each find_string pairs with the replace_string
# directly after it; keep the pairs adjacent and in this order.
find_string: <script
replace_string: <div style="display:none" 
find_string: </script>
replace_string: </div>

# Remove all <q> elements.
strip: //q

# Remove links with the 'entry-section-title' class.
strip: //a[contains(@class, 'entry-section-title')]

# Sample URLs for checking these rules (four article pages and the front-page feed).
test_url: http://www.theverge.com/2012/2/29/2821763/lytro-review
test_url: http://www.theverge.com/2011/11/3/2534861/nokia-lumia-800-review
test_url: http://www.theverge.com/2013/2/24/4026114/barnes-noble-shifting-focus-away-from-nook-hardware
test_url: http://www.theverge.com/2014/6/19/5824072/top-shelf-living-the-dream
test_url: http://www.theverge.com/rss/frontpage