From 4e067ceabd705201a16b4c92cf4b23f3b990326c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Nicolas=20L=C5=93uillet?= Date: Sun, 13 Jul 2014 10:15:40 +0200 Subject: updated specific configuration for parsing --- .../site_config/standard/archiveofourown.org.txt | 38 ++++++++++++---------- 1 file changed, 21 insertions(+), 17 deletions(-) mode change 100644 => 100755 inc/3rdparty/site_config/standard/archiveofourown.org.txt (limited to 'inc/3rdparty/site_config/standard/archiveofourown.org.txt') diff --git a/inc/3rdparty/site_config/standard/archiveofourown.org.txt b/inc/3rdparty/site_config/standard/archiveofourown.org.txt old mode 100644 new mode 100755 index 50ff632d..579de517 --- a/inc/3rdparty/site_config/standard/archiveofourown.org.txt +++ b/inc/3rdparty/site_config/standard/archiveofourown.org.txt @@ -1,18 +1,22 @@ -# Description: Fix XPaths to include ALL chapters on 'view_full_work' pages. -# Include: work meta, summary, chapter information, and notes which Instapaper strips out on default. -# Exclude: header, footer, navigation, comments. -# Notes: User is a newbie with XPaths. - -title: //h2[@class='title'] -author: //h3[@class='byline'] -author: //a[@class='login author'] - -strip_id_or_class:header -strip_id_or_class:navigation -strip_id_or_class:feedback -strip_id_or_class:kudos -strip_id_or_class:add_comment_placeholder -strip_id_or_class:add_comment -strip_id_or_class:globalize +# Description: Fix XPaths to include ALL chapters on 'view_full_work' pages. +# Include: work meta, summary, chapter information, and notes which Instapaper strips out on default. +# Exclude: header, footer, navigation, comments. +# Notes: User is a newbie with XPaths. + +title: //h2[@class='title'] +author: //h3[@class='byline'] +author: //a[@class='login author'] + +strip_id_or_class:header +strip_id_or_class:navigation +strip_id_or_class:feedback +strip_id_or_class:kudos +strip_id_or_class:add_comment_placeholder +strip_id_or_class:add_comment +strip_id_or_class:globalize strip_id_or_class:footer -test_url: http://archiveofourown.org/works/229402?view_full_work=true \ No newline at end of file + +single_page_link: //div[@id='main']//a[contains(@href, 'view_adult=true')] + +test_url: http://archiveofourown.org/works/229402?view_full_work=true +test_url: http://archiveofourown.org/works/750111/chapters/1399929 \ No newline at end of file -- cgit v1.2.3