]>
Commit | Line | Data |
---|---|---|
ac4d1142 NL |
1 | #basics\r |
2 | author: (//div[contains(@class,'author')])[1]\r | |
3 | date: substring-before(//a[@class='issue'], '—')\r | |
4 | #body://div[@class = 'entry']\r | |
5 | # interim body selector: picks up entry, standfirst and lead_image directly until move_into support is ready\r | |
6 | body: //div[@class = 'entry' or @class='standfirst' or @class='lead_image']\r | |
7 | \r | |
8 | # moves header image (lead_image) and tagline (standfirst) into the entry body\r | |
9 | move_into(//div[@class='entry']/div)://div[@class = 'lead_image']\r | |
10 | move_into(//div[@class='entry']/div)://div[@class = 'standfirst']\r | |
11 | \r | |
12 | \r | |
13 | # moves author info to end of text\r | |
14 | move_into(//p[strong[string(.) = 'Follow Prospect on Twitter']])://div[@id='sidebar_content']/p/em\r | |
15 | \r | |
16 | prune: no\r | |
17 | \r | |
18 | # strips social links and other non-article blocks (login status, subscribe box, post info/utils, comments)\r | |
19 | strip_id_or_class:login-status\r | |
20 | strip_id_or_class:shareinpost\r | |
21 | strip_id_or_class:content_subscribe\r | |
22 | strip_id_or_class:postinfo\r | |
23 | strip_id_or_class:postutils\r | |
24 | strip_id_or_class:comments\r | |
25 | strip://strong[string(.) = 'Follow Prospect on Twitter']\r | |
26 | test_url: http://www.prospectmagazine.co.uk/2011/07/postmodernism-is-dead-va-exhibition-age-of-authenticism/ |