From 4e067ceabd705201a16b4c92cf4b23f3b990326c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Nicolas=20L=C5=93uillet?= Date: Sun, 13 Jul 2014 10:15:40 +0200 Subject: updated specific configuration for parsing --- .../site_config/standard/sueddeutsche.de.txt | 34 +++++++++++----------- 1 file changed, 17 insertions(+), 17 deletions(-) mode change 100644 => 100755 inc/3rdparty/site_config/standard/sueddeutsche.de.txt (limited to 'inc/3rdparty/site_config/standard/sueddeutsche.de.txt') diff --git a/inc/3rdparty/site_config/standard/sueddeutsche.de.txt b/inc/3rdparty/site_config/standard/sueddeutsche.de.txt old mode 100644 new mode 100755 index 4aa9410c..74b8d451 --- a/inc/3rdparty/site_config/standard/sueddeutsche.de.txt +++ b/inc/3rdparty/site_config/standard/sueddeutsche.de.txt @@ -1,18 +1,18 @@ -# 2012-12-04: complete rewrite after Süddeutsche.de relaunch - carlo@... - -single_page_link: //a[ contains( @href, "/2.220/" ) ] - -body: //article[@id="sitecontent"]/section[@class="body"] -author: //address[@class="author"] -date: //div[@class="header"]//h1//span[@class="updated"] -wrap_in(small): //div[@class="footer"] -wrap_in(i): //figcaption/h3 -dissolve: //figcaption//h3 -dissolve: //figure/div[@class="body"] -dissolve: //figure/a - -strip: //figure[ not( contains(@class, "zoomimage" ) ) ] -strip: //div[@data-onlineonly="true"] -strip: //address[@class="author"] - +# 2012-12-04: complete rewrite after Süddeutsche.de relaunch - carlo@... + +single_page_link: //a[ contains( @href, "/2.220/" ) ] + +body: //article[@id="sitecontent"]/section[@class="body"] +author: //address[@class="author"] +date: //div[@class="header"]//h1//span[@class="updated"] +wrap_in(small): //div[@class="footer"] +wrap_in(i): //figcaption/h3 +dissolve: //figcaption//h3 +dissolve: //figure/div[@class="body"] +dissolve: //figure/a + +strip: //figure[ not( contains(@class, "zoomimage" ) ) ] +strip: //div[@data-onlineonly="true"] +strip: //address[@class="author"] + test_url: http://www.sueddeutsche.de/muenchen/mietshaus-am-gaertnerplatz-alles-muss-raus-1.1556693 \ No newline at end of file -- cgit v1.2.3