diff options
-rwxr-xr-x | inc/3rdparty/site_config/standard/chronicle.com.txt | 15 |
1 files changed, 4 insertions, 11 deletions
diff --git a/inc/3rdparty/site_config/standard/chronicle.com.txt b/inc/3rdparty/site_config/standard/chronicle.com.txt index e86d3eca..227a03c7 100755 --- a/inc/3rdparty/site_config/standard/chronicle.com.txt +++ b/inc/3rdparty/site_config/standard/chronicle.com.txt | |||
@@ -1,17 +1,10 @@ | |||
1 | title: //h1[contains(@class, "entry-title")] | 1 | title: //h1[contains(@class, "entry-title")] |
2 | author: //p[contains(@class, "byline")] | 2 | author: //p[contains(@class, "byline")] |
3 | 3 | ||
4 | # blog articles (chronicle.com/blogs/*) | ||
5 | body: //div[contains(@class, "abstract")] | ||
6 | date: //p[contains(@class, "time")] | ||
7 | |||
8 | # all (?) other articles | 4 | # all (?) other articles |
9 | body: //div[@id="article-body"] | 5 | body: //div[@class="content-item__story"] |
10 | date: //p[contains(@class, "dateline")] | 6 | date: //p[contains(@class, "dateline")] |
11 | 7 | ||
12 | # remove sidebars containing images (I assume this is desired for Instapaper) | 8 | # note that if you're not a Chronicle subscriber (personally or institutionally), you'll only see the first couple of paragraphs of the article, and Instapaper will display that with some crap above and below. thank goodness for that bookmarklet |
13 | strip: //div[@id="related"] | 9 | test_url: http://chronicle.com/article/In-a-Land-of-Second-Chances/128375/ |
14 | strip: //div[contains(@class, "image")] | 10 | test_url: http://chronicle.com/blogs/wiredcampus/university-run-boot-camps-offer-students-marketable-skills-but-not-course-credit/57494 |
15 | |||
16 | # note that if you're not a Chronicle subscriber (personally or institutionally), you'll only see the first couple of paragraphs of the article, and Instapaper will display that with some crap above and below. thank goodness for that bookmarklet | ||
17 | test_url: http://chronicle.com/article/In-a-Land-of-Second-Chances/128375/ \ No newline at end of file | ||