From 4e067ceabd705201a16b4c92cf4b23f3b990326c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Nicolas=20L=C5=93uillet?= Date: Sun, 13 Jul 2014 10:15:40 +0200 Subject: updated specific configuration for parsing --- inc/3rdparty/site_config/standard/philly.com.txt | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) mode change 100644 => 100755 inc/3rdparty/site_config/standard/philly.com.txt (limited to 'inc/3rdparty/site_config/standard/philly.com.txt') diff --git a/inc/3rdparty/site_config/standard/philly.com.txt b/inc/3rdparty/site_config/standard/philly.com.txt old mode 100644 new mode 100755 index 41318f63..accbd60b --- a/inc/3rdparty/site_config/standard/philly.com.txt +++ b/inc/3rdparty/site_config/standard/philly.com.txt @@ -1,10 +1,10 @@ -title: //h1[@class='entry-title'] -author: //p[@class='byline']/span -body: //@id='body-content' -date: //div[@class='article_timestamp']/span - -strip: //@class=b-group -strip: //*[contains(@style, 'none')] -strip: //a[contains(@href, 'comments')] +title: //h1[@class='entry-title'] +author: //p[@class='byline']/span +body: //@id='body-content' +date: //div[@class='article_timestamp']/span + +strip: //@class=b-group +strip: //*[contains(@style, 'none')] +strip: //a[contains(@href, 'comments')] strip: //*[contains(@class, 'comment')] test_url: http://www.philly.com/philly/sports/eagles/20120127_Ohio_State_s_Posey_didn_t_waste_time_lost_to_suspension.html \ No newline at end of file -- cgit v1.2.3