From ac4d114214d820b20e18518a2dbc809337e39043 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Nicolas=20L=C5=93uillet?=
Date: Fri, 6 Dec 2013 10:13:03 +0100
Subject: [add] new specific configuration files

---
 inc/3rdparty/site_config/standard/slashfilm.com.txt | 15 +++++++++++++++
 1 file changed, 15 insertions(+)
 create mode 100644 inc/3rdparty/site_config/standard/slashfilm.com.txt

(limited to 'inc/3rdparty/site_config/standard/slashfilm.com.txt')

diff --git a/inc/3rdparty/site_config/standard/slashfilm.com.txt b/inc/3rdparty/site_config/standard/slashfilm.com.txt
new file mode 100644
index 00000000..78d38ecf
--- /dev/null
+++ b/inc/3rdparty/site_config/standard/slashfilm.com.txt
@@ -0,0 +1,15 @@
+title: substring-before(//title,'| /Film')
+date: substring-before(substring-after(//p[@class='post-info'],'Posted on '),'by')
+strip: //div[@class='pm-left']
+strip: //div[@class='pm-right']
+strip: //h2/span
+next_page_link: //h2/strong/a
+strip: //h2/strong/a
+strip: //p[contains(text(),'we have to split this post over')]
+strip: //p[@class='post-info']
+strip: //h1/a
+strip: //img[contains(@src,'siteimages/authors')]
+strip: //div[@id='header']
+strip: //div[@class='topad-right']
+strip: //strong[contains(text(),'Cool Posts From Around the Web:')]
+test_url: http://www.slashfilm.com/superhero-bits-206/
\ No newline at end of file
-- 
cgit v1.2.3