diff options
Diffstat (limited to 'inc/3rdparty/site_config/standard/politico.com.txt')
-rw-r--r-- | inc/3rdparty/site_config/standard/politico.com.txt | 13 |
1 file changed, 13 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/politico.com.txt b/inc/3rdparty/site_config/standard/politico.com.txt
new file mode 100644
index 00000000..121fd5b9
--- /dev/null
+++ b/inc/3rdparty/site_config/standard/politico.com.txt | |||
@@ -0,0 +1,13 @@ | |||
1 | title://div[contains(@class, "article")]/h1 | ||
2 | body://div[contains(@class,"story-text")] | ||
3 | |||
4 | # FIXME: this simpler rule does not match (reason unknown), so the sibling-based rule below is used instead: next_page_link://ul[contains(@class,"pagination")]/li/a[@rel="next"] | ||
5 | |||
6 | next_page_link://ul[contains(@class,"pagination")]/li[contains(@class, "current")]/following-sibling::node()/a | ||
7 | date://meta[@name="publish_date"]/@content | ||
8 | |||
9 | strip://div[contains(@class, "breadcrumbs")] | ||
10 | strip://a[contains(@class, "hidden")] | ||
11 | strip://div[contains(@class, "story-embed")] | ||
12 | strip://div[contains(@class, "story-text")]//p/a[contains(text(), "Also on POLITICO:")]/.. | ||
13 | test_url: http://www.politico.com/news/stories/0712/78105.html | ||
\ No newline at end of file