diff options
author | tcitworld <thomas.citharet@gmail.com> | 2014-01-04 12:30:31 -0800 |
---|---|---|
committer | tcitworld <thomas.citharet@gmail.com> | 2014-01-04 12:30:31 -0800 |
commit | 7f667839764621b5aa01c9db8ce5dde2a29ef18f (patch) | |
tree | 93d8241ee81c87e18494325ae02f0589a8e328a2 /inc/3rdparty/site_config/standard/npr.org.txt | |
parent | a84f77d6ba15a64ff00453f5d5190c021ce460ed (diff) | |
parent | 2abcccb37180c17318f5226f5d4bc28f30b621ea (diff) | |
download | wallabag-7f667839764621b5aa01c9db8ce5dde2a29ef18f.tar.gz wallabag-7f667839764621b5aa01c9db8ce5dde2a29ef18f.tar.zst wallabag-7f667839764621b5aa01c9db8ce5dde2a29ef18f.zip |
Merge pull request #1 from inthepoche/dev
Dev
Diffstat (limited to 'inc/3rdparty/site_config/standard/npr.org.txt')
-rw-r--r-- | inc/3rdparty/site_config/standard/npr.org.txt | 32 |
1 file changed, 32 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/npr.org.txt b/inc/3rdparty/site_config/standard/npr.org.txt
new file mode 100644
index 00000000..afab0eb3
--- /dev/null
+++ b/inc/3rdparty/site_config/standard/npr.org.txt
@@ -0,0 +1,32 @@ | |||
1 | title: //div[contains(@class, 'storytitle')]//h1 | ||
2 | author: //p[@class="byline"]/span | ||
3 | body: //div[@id='storyspan02']//*[@class='duration' or @class='download' or contains(@class, 'photo')] | //div[@id='storytext'] | //div[@class='transcript'] | ||
4 | date: //meta[@name="date"]/@content | ||
5 | |||
6 | strip: //div[@class='enlarge_measure'] | ||
7 | strip: //div[@class='enlarge_html'] | ||
8 | strip: //a[@class='enlargeicon'] | ||
9 | strip: //div[contains(@class, 'bookedition')] | ||
10 | strip: //div[@class='textsize'] | ||
11 | strip: //ul[@class='genres'] | ||
12 | strip: //span[@class='bull'] | ||
13 | strip_id_or_class: secondary | ||
14 | strip_id_or_class: con1col | ||
15 | strip: //h3[@class='conheader'] | ||
16 | |||
17 | replace_string(<a name="more"> </a>): <!-- no more --> | ||
18 | replace_string(<div class="transcript">): <div class="transcript"><h2>Transcript</h2> | ||
19 | |||
20 | prune: no | ||
21 | strip://div[@class="ecommercepop"] | ||
22 | strip://span[@class="bull"] | ||
23 | strip://span[@class="purchaseLink"] | ||
24 | strip://div[@class="enlarge_html"] | ||
25 | strip://div[@class="enlarge_measure"] | ||
26 | strip://div[@class="container con1col small"] | ||
27 | strip://a[contains(@class, "enlargebtn")] | ||
28 | strip://div[contains(@class, "bucketwrap internallink")] | ||
29 | |||
30 | test_url: http://www.npr.org/blogs/thetwo-way/2011/07/12/137799301/sports-loses-its-escapist-gleam-in-a-summer-of-court-dates | ||
31 | test_url: http://www.npr.org/2012/07/04/156190948/feeling-under-siege-catholic-leadership-shifts-right | ||
32 | test_url: http://www.npr.org/2012/12/13/166480907/the-years-best-sci-fi-crosses-galaxies-and-genres | ||
\ No newline at end of file