about | summary | refs | log | tree | commit | diff | homepage
path: root/inc/3rdparty/site_config/standard/politico.com.txt
diff options
context:
space:
mode:
Diffstat (limited to 'inc/3rdparty/site_config/standard/politico.com.txt')
-rw-r--r-- inc/3rdparty/site_config/standard/politico.com.txt | 13
1 files changed, 13 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/politico.com.txt b/inc/3rdparty/site_config/standard/politico.com.txt
new file mode 100644
index 00000000..121fd5b9
--- /dev/null
+++ b/inc/3rdparty/site_config/standard/politico.com.txt
@@ -0,0 +1,13 @@
1title://div[contains(@class, "article")]/h1
2body://div[contains(@class,"story-text")]
3
4# Why doesn't this work? next_page_link://ul[contains(@class,"pagination")]/li/a[@rel="next"]
5
6next_page_link://ul[contains(@class,"pagination")]/li[contains(@class, "current")]/following-sibling::node()/a
7date://meta[@name="publish_date"]/@content
8
9strip://div[contains(@class, "breadcrumbs")]
10strip://a[contains(@class, "hidden")]
11strip://div[contains(@class, "story-embed")]
12strip://div[contains(@class, "story-text")]//p/a[contains(text(), "Also on POLITICO:")]/..
13test_url: http://www.politico.com/news/stories/0712/78105.html
\ No newline at end of file