From 4e067ceabd705201a16b4c92cf4b23f3b990326c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Nicolas=20L=C5=93uillet?= Date: Sun, 13 Jul 2014 10:15:40 +0200 Subject: updated specific configuration for parsing --- .../site_config/standard/chronicle.com.txt | 30 +++++++++++----------- 1 file changed, 15 insertions(+), 15 deletions(-) mode change 100644 => 100755 inc/3rdparty/site_config/standard/chronicle.com.txt (limited to 'inc/3rdparty/site_config/standard/chronicle.com.txt') diff --git a/inc/3rdparty/site_config/standard/chronicle.com.txt b/inc/3rdparty/site_config/standard/chronicle.com.txt old mode 100644 new mode 100755 index 0c6c11ed..e86d3eca --- a/inc/3rdparty/site_config/standard/chronicle.com.txt +++ b/inc/3rdparty/site_config/standard/chronicle.com.txt @@ -1,17 +1,17 @@ -title: //h1[contains(@class, "entry-title")] -author: //p[contains(@class, "byline")] - -# blog articles (chronicle.com/blogs/*) -body: //div[contains(@class, "abstract")] -date: //p[contains(@class, "time")] - -# all (?) other articles -body: //div[@id="article-body"] -date: //p[contains(@class, "dateline")] - -# remove sidebars containing images (I assume this is desired for Instapaper) -strip: //div[@id="related"] -strip: //div[contains(@class, "image")] - +title: //h1[contains(@class, "entry-title")] +author: //p[contains(@class, "byline")] + +# blog articles (chronicle.com/blogs/*) +body: //div[contains(@class, "abstract")] +date: //p[contains(@class, "time")] + +# all (?) other articles +body: //div[@id="article-body"] +date: //p[contains(@class, "dateline")] + +# remove sidebars containing images (I assume this is desired for Instapaper) +strip: //div[@id="related"] +strip: //div[contains(@class, "image")] + # note that if you're not a Chronicle subscriber (personally or institutionally), you'll only see the first couple of paragraphs of the article, and Instapaper will display that with some crap above and below. thank goodness for that bookmarklet test_url: http://chronicle.com/article/In-a-Land-of-Second-Chances/128375/ \ No newline at end of file -- cgit v1.2.3