blob: 0c6c11ed64d763a64b31a5f807a4bd0f64d44030 (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
|
title: //h1[contains(@class, "entry-title")]
author: //p[contains(@class, "byline")]
# blog articles (chronicle.com/blogs/*)
body: //div[contains(@class, "abstract")]
date: //p[contains(@class, "time")]
# all other articles (presumably; not verified for every article type)
body: //div[@id="article-body"]
date: //p[contains(@class, "dateline")]
# remove sidebars containing images (assumed to be the desired behavior for Instapaper)
strip: //div[@id="related"]
strip: //div[contains(@class, "image")]
# Note: if you are not a Chronicle subscriber (personally or institutionally), you will only see the first couple of paragraphs of the article,
# and Instapaper will display that excerpt with extraneous content above and below it. The bookmarklet is the workaround in that case.
test_url: http://chronicle.com/article/In-a-Land-of-Second-Chances/128375/
|