about | summary | refs | log | tree | commit | diff | homepage
path: root/inc/3rdparty/site_config/standard/npr.org.txt
diff options
context:
space:
mode:
Diffstat (limited to 'inc/3rdparty/site_config/standard/npr.org.txt')
-rwxr-xr-x [-rw-r--r--] inc/3rdparty/site_config/standard/npr.org.txt 66
1 file changed, 34 insertions, 32 deletions
diff --git a/inc/3rdparty/site_config/standard/npr.org.txt b/inc/3rdparty/site_config/standard/npr.org.txt
index afab0eb3..acd73e48 100644..100755
--- a/inc/3rdparty/site_config/standard/npr.org.txt
+++ b/inc/3rdparty/site_config/standard/npr.org.txt
@@ -1,32 +1,34 @@
1title: //div[contains(@class, 'storytitle')]//h1 1title: //div[contains(@class, 'storytitle')]//h1
2author: //p[@class="byline"]/span 2author: //p[@class="byline"]/span
3body: //div[@id='storyspan02']//*[@class='duration' or @class='download' or contains(@class, 'photo')] | //div[@id='storytext'] | //div[@class='transcript'] 3body: //div[@id='primaryaudio']//*[@class='duration' or @class='download' or contains(@class, 'photo')] | //div[@id='storytext' or @id='supplementarycontent' or contains(@class, 'transcript')]
4date: //meta[@name="date"]/@content 4date: //meta[@name="date"]/@content
5 5
6strip: //div[@class='enlarge_measure'] 6strip_id_or_class: enlarge_measure
7strip: //div[@class='enlarge_html'] 7strip_id_or_class: enlarge_html
8strip: //a[@class='enlargeicon'] 8strip: //a[contains(@class, 'enlargeicon')]
9strip: //div[contains(@class, 'bookedition')] 9strip: //div[contains(@class, 'bookedition')]
10strip: //div[@class='textsize'] 10strip: //div[@class='textsize']
11strip: //ul[@class='genres'] 11strip: //ul[@class='genres']
12strip: //span[@class='bull'] 12strip: //span[@class='bull']
13strip_id_or_class: secondary 13strip_id_or_class: secondary
14strip_id_or_class: con1col 14strip_id_or_class: con1col
15strip: //h3[@class='conheader'] 15strip: //h3[@class='conheader']
16 16
17replace_string(<a name="more">&nbsp;</a>): <!-- no more --> 17replace_string(<a name="more">&nbsp;</a>): <!-- no more -->
18replace_string(<div class="transcript">): <div class="transcript"><h2>Transcript</h2> 18replace_string(<div class="transcript">): <div class="transcript"><h2>Transcript</h2>
19 19replace_string(<div class="transcript storytext">): <div class="transcript storytext"><h2>Transcript</h2>
20prune: no 20
21strip://div[@class="ecommercepop"] 21prune: no
22strip://span[@class="bull"] 22strip://div[@class="ecommercepop"]
23strip://span[@class="purchaseLink"] 23strip://span[@class="bull"]
24strip://div[@class="enlarge_html"] 24strip://span[@class="purchaseLink"]
25strip://div[@class="enlarge_measure"] 25strip://div[@class="enlarge_html"]
26strip://div[@class="container con1col small"] 26strip://div[@class="enlarge_measure"]
27strip://a[contains(@class, "enlargebtn")] 27strip://div[@class="container con1col small"]
28strip://div[contains(@class, "bucketwrap internallink")] 28strip://a[contains(@class, "enlargebtn")]
29 29strip://div[contains(@class, "bucketwrap internallink")]
30test_url: http://www.npr.org/blogs/thetwo-way/2011/07/12/137799301/sports-loses-its-escapist-gleam-in-a-summer-of-court-dates 30
31test_url: http://www.npr.org/2012/07/04/156190948/feeling-under-siege-catholic-leadership-shifts-right 31test_url: http://www.npr.org/blogs/thetwo-way/2011/07/12/137799301/sports-loses-its-escapist-gleam-in-a-summer-of-court-dates
32test_url: http://www.npr.org/2012/12/13/166480907/the-years-best-sci-fi-crosses-galaxies-and-genres \ No newline at end of file 32test_url: http://www.npr.org/2012/07/04/156190948/feeling-under-siege-catholic-leadership-shifts-right
33test_url: http://www.npr.org/2012/12/13/166480907/the-years-best-sci-fi-crosses-galaxies-and-genres
34test_url: http://www.npr.org/templates/story/story.php?storyId=229103221 \ No newline at end of file