# Article extraction rules; the test_url at the bottom points at stalbansreview.co.uk.
# Each rule has the form "directive: XPath expression".
# Headline: the <h3> directly inside the div whose class is 'articleLeft'.
1 title: //div[@class='articleLeft']/h3
# Byline: text of the link inside span.articleAuthor, keeping only what follows the first 'By '.
3 author: substring-after(//span[@class='articleAuthor']/a,'By ')
# Date: text of span.articleDateTime, keeping only what precedes the first 'in '.
5 date: substring-before(//span[@class='articleDateTime'],'in ')
# Body: the whole 'articleLeft' div (the same container the title is read from).
7 body: //div[@class='articleLeft']
# Strip rule: targets div(s) with class 'articleMoreNews'.
8 strip: //div[@class='articleMoreNews']
# Strip rule: targets the same <h3> that the title rule selects, so the headline is not repeated in the body.
9 strip: //div[@class='articleLeft']/h3
# Strip rule: targets <p> children of 'articleLeft' whose class attribute is exactly 'articleInfo clearfix'.
10 strip: //div[@class='articleLeft']/p[@class='articleInfo clearfix']
12 # Remove duplicate title from text
# NOTE(review): this path is absolute and position-dependent (div[5], div[1], div[1]); it presumably stops
# matching if the page layout shifts - confirm it still selects the intended <h3>.
13 strip: //div[@id='site']/div[5][@class='holder']/div[1][@class='hBlock']/div[1][@class='sglCol article']/h3
# Sample article URL for checking the rules above.
14 test_url: http://www.stalbansreview.co.uk/news/9581446.New_roundabout_in_King_Harry_Lane/r/?ref=rss