]>
Commit | Line | Data |
---|---|---|
4e067cea NL |
1 | #basics |
2 | author: (//div[contains(@class,'author')])[1] | |
3 | date: substring-before(//a[@class='issue'], '—') | |
4 | #body://div[@class = 'entry'] | |
5 | # Interim rule: select the entry, standfirst and lead_image divs directly until move_into support is ready | |
6 | body: //div[@class = 'entry' or @class='standfirst' or @class='lead_image'] | |
7 | ||
8 | # Move the header image (lead_image) and tagline (standfirst) into the entry body | |
9 | move_into(//div[@class='entry']/div)://div[@class = 'lead_image'] | |
10 | move_into(//div[@class='entry']/div)://div[@class = 'standfirst'] | |
11 | ||
12 | ||
13 | # Move the author info from the sidebar into the 'Follow Prospect on Twitter' paragraph at the end of the text | |
14 | move_into(//p[strong[string(.) = 'Follow Prospect on Twitter']])://div[@id='sidebar_content']/p/em | |
15 | ||
16 | prune: no | |
17 | ||
18 | # Strip social/share links, login status, subscribe block, post info/utilities and comments | |
19 | strip_id_or_class:login-status | |
20 | strip_id_or_class:shareinpost | |
21 | strip_id_or_class:content_subscribe | |
22 | strip_id_or_class:postinfo | |
23 | strip_id_or_class:postutils | |
24 | strip_id_or_class:comments | |
25 | strip://strong[string(.) = 'Follow Prospect on Twitter'] | |
ac4d1142 | 26 | test_url: http://www.prospectmagazine.co.uk/2011/07/postmodernism-is-dead-va-exhibition-age-of-authenticism/ |