]>
Commit | Line | Data |
---|---|---|
4e067cea NL | 1 | title: //div[@class='articleLeft']/h3 |
2 | ||
3 | author: substring-after(//span[@class='articleAuthor']/a,'By ') | |
4 | ||
5 | date: substring-before(//span[@class='articleDateTime'],'in ') | |
6 | ||
7 | body: //div[@class='articleLeft'] | |
8 | strip: //div[@class='articleMoreNews'] | |
9 | strip: //div[@class='articleLeft']/h3 | |
10 | strip: //div[@class='articleLeft']/p[@class='articleInfo clearfix'] | |
11 | ||
12 | # Remove duplicate title from text | |
13 | strip: //div[@id='site']/div[5][@class='holder']/div[1][@class='hBlock']/div[1][@class='sglCol article']/h3 | |
ac4d1142 | 14 | test_url: http://www.stalbansreview.co.uk/news/9581446.New_roundabout_in_King_Harry_Lane/r/?ref=rss |