]>
Commit | Line | Data |
---|---|---|
4e067cea NL |
1 | # TIDY |
2 | #tidy: no | |
3 | # PRUNE | |
4 | #prune: no | |
5 | ||
6 | # SINGLE PAGE | |
7 | single_page_link: //div[@class='showlinks']/a | |
8 | ||
9 | # TITLE | |
10 | title: //h1[@class="title"] | |
11 | ||
12 | # AUTHOR | |
13 | author: //div[contains(@class,"field-field-article-display-authors")]/div/div/a/text() | |
14 | ||
15 | # DATE | |
16 | date: //div[contains(@class,"field-field-article-issue")]/div/div/a/text() \| //span[@class="date-display-single"] | |
17 | ||
18 | # BODY | |
19 | body: //div[contains(@class,"content-resize")] | |
20 | ||
21 | # Remove clutter | |
22 | strip: //div[@class="article-sidebar"] | |
23 | strip: //div[@class="showlinks"] | |
24 | strip: //div[contains(@class,"premium-box")] | |
25 | strip: //div[contains(@class,"premium-box")] | |
26 | strip: //table[contains(@border,"2")] | |
27 | ||
28 | # Fix picture captions | |
29 | wrap_in(small): //p/img/following-sibling::em | |
30 | wrap_in(small): //p[img]/text() | |
31 | ||
32 | # Fix sub-headlines | |
33 | wrap_in(h3): //div[contains(@class,"field-field-article-subtitle")]/div/div/text() | |
34 | test_url: http://www.foreignaffairs.com/articles/138810/pierre-n-leval/the-long-arm-of-international-law |