From 4e067ceabd705201a16b4c92cf4b23f3b990326c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Nicolas=20L=C5=93uillet?= Date: Sun, 13 Jul 2014 10:15:40 +0200 Subject: updated specific configuration for parsing --- inc/3rdparty/site_config/standard/zdnet.com.txt | 18 +++++++++--------- 1 file changed, 9 insertions(+), 9 deletions(-) mode change 100644 => 100755 inc/3rdparty/site_config/standard/zdnet.com.txt (limited to 'inc/3rdparty/site_config/standard/zdnet.com.txt') diff --git a/inc/3rdparty/site_config/standard/zdnet.com.txt b/inc/3rdparty/site_config/standard/zdnet.com.txt old mode 100644 new mode 100755 index b244b229..939fb0e3 --- a/inc/3rdparty/site_config/standard/zdnet.com.txt +++ b/inc/3rdparty/site_config/standard/zdnet.com.txt @@ -1,10 +1,10 @@ -title: //h1[@class="h s-1"] -author: substring-before(substring-after(//p[@class="meta s-10"], 'By'), '|') -author: substring-after(//div[@class="bio"]//h3, 'About ') -date: substring-after(//p[@class="meta s-10"], '|') -date: substring-after(//p[@class="meta"], '|') -body: //div[@class="content-1 entry space-1 clear"] -body: //div[@class="storyBody"] - -test_url: http://www.zdnet.com/blog/microsoft/the-bing-back-end-more-on-cosmos-tiger-and-scope/10920 +title: //h1[@class="h s-1"] +author: substring-before(substring-after(//p[@class="meta s-10"], 'By'), '|') +author: substring-after(//div[@class="bio"]//h3, 'About ') +date: substring-after(//p[@class="meta s-10"], '|') +date: substring-after(//p[@class="meta"], '|') +body: //div[@class="content-1 entry space-1 clear"] +body: //div[@class="storyBody"] + +test_url: http://www.zdnet.com/blog/microsoft/the-bing-back-end-more-on-cosmos-tiger-and-scope/10920 test_url: http://www.zdnet.com/researchers-find-web-tracking-up-privacy-down-7000000358/ \ No newline at end of file -- cgit v1.2.3