about summary refs log tree commit diff homepage
path: root/inc/3rdparty/site_config/standard/politico.com.txt
diff options
context:
space:
mode:
Diffstat (limited to 'inc/3rdparty/site_config/standard/politico.com.txt')
-rwxr-xr-x inc/3rdparty/site_config/standard/politico.com.txt 26
1 files changed, 11 insertions, 15 deletions
diff --git a/inc/3rdparty/site_config/standard/politico.com.txt b/inc/3rdparty/site_config/standard/politico.com.txt
index c5302d1b..d8f5e575 100755
--- a/inc/3rdparty/site_config/standard/politico.com.txt
+++ b/inc/3rdparty/site_config/standard/politico.com.txt
@@ -1,17 +1,13 @@
1title://div[contains(@class, "article")]/h1 1title://div[contains(@class, "article")]/h1
2body://div[contains(@class,"story-text")] 2body://div[contains(@class,"story-text")]
3 3
4# Why doesn't this work? next_page_link://ul[contains(@class,"pagination")]/li/a[@rel="next"] 4# Why doesn't this work? next_page_link://ul[contains(@class,"pagination")]/li/a[@rel="next"]
5 5
6next_page_link://ul[contains(@class,"pagination")]/li[contains(@class, "current")]/following-sibling::node()/a 6next_page_link://ul[contains(@class,"pagination")]/li[contains(@class, "current")]/following-sibling::node()/a
7next_page_link://div[contains(@class,"pagination")]/ol/li[contains(@class, "current")]/following-sibling::node()/a 7date://meta[@name="publish_date"]/@content
8date://meta[@name="publish_date"]/@content 8
9 9strip://div[contains(@class, "breadcrumbs")]
10strip://div[contains(@class, "breadcrumbs")] 10strip://a[contains(@class, "hidden")]
11strip://a[contains(@class, "hidden")] 11strip://div[contains(@class, "story-embed")]
12strip://div[contains(@class, "story-embed")]
13strip://div[contains(@class, "story-text")]//p/a[contains(text(), "Also on POLITICO:")]/.. 12strip://div[contains(@class, "story-text")]//p/a[contains(text(), "Also on POLITICO:")]/..
14strip://div[contains(@class, "story-interrupt")]
15strip://footer[contains(@class, "author-bio")]
16
17test_url: http://www.politico.com/news/stories/0712/78105.html \ No newline at end of file 13test_url: http://www.politico.com/news/stories/0712/78105.html \ No newline at end of file