From 4e067ceabd705201a16b4c92cf4b23f3b990326c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Nicolas=20L=C5=93uillet?= Date: Sun, 13 Jul 2014 10:15:40 +0200 Subject: updated specific configuration for parsing --- .../site_config/standard/gotomanager.com.txt | 38 +++++++++++----------- 1 file changed, 19 insertions(+), 19 deletions(-) mode change 100644 => 100755 inc/3rdparty/site_config/standard/gotomanager.com.txt (limited to 'inc/3rdparty/site_config/standard/gotomanager.com.txt') diff --git a/inc/3rdparty/site_config/standard/gotomanager.com.txt b/inc/3rdparty/site_config/standard/gotomanager.com.txt old mode 100644 new mode 100755 index 7fb0ee03..f8af7324 --- a/inc/3rdparty/site_config/standard/gotomanager.com.txt +++ b/inc/3rdparty/site_config/standard/gotomanager.com.txt @@ -1,21 +1,21 @@ -title: //span[@id="showTitle"] -author: //span[@id="showAuthor"] -date: //span[@id="showRefDate"] - -strip: //span[@class="black_bold"] -strip: //div[@id="sectionName"] -strip: //div[@id="storyHeader"] - -body: //div[@id="newsBodyText"] - -strip_image_src: "http://www.gotomanager.com/img/mgrm/space.gif" -strip_image_src: "http://www.gotomanager.com/images/separator.gif" -strip_image_src: "http://www.gotomanager.com/images/spaces.gif" - -convert_double_br_tags: yes -tidy: yes - -strip: //div[@id="smallLeadImage"] -strip: //div[@id="truehitsSurvey"] +title: //span[@id="showTitle"] +author: //span[@id="showAuthor"] +date: //span[@id="showRefDate"] + +strip: //span[@class="black_bold"] +strip: //div[@id="sectionName"] +strip: //div[@id="storyHeader"] + +body: //div[@id="newsBodyText"] + +strip_image_src: "http://www.gotomanager.com/img/mgrm/space.gif" +strip_image_src: "http://www.gotomanager.com/images/separator.gif" +strip_image_src: "http://www.gotomanager.com/images/spaces.gif" + +convert_double_br_tags: yes +tidy: yes + +strip: //div[@id="smallLeadImage"] +strip: //div[@id="truehitsSurvey"] strip: //table[@id="relatedInfoTable"] test_url: http://www.gotomanager.com/news/details.aspx?id=86759 \ No newline at end of file -- cgit v1.2.3