# Extraction rules for article pages on ritholtz.com/blog.
# Each directive is "name: XPath 1.0 expression" evaluated against the page DOM.

# Headline: the <h2> inside the <div class="post"> container.
1 title: //div[@class='post']/h2
# Byline: both author and date are cut out of the same <small> element inside
# <div class="alignright">. The author is the text after the first "By " and
# before the first "-" that follows it.
2 author: substring-before(substring-after(//div[@class='alignright']/small, 'By '),'-')
# Date: everything after the first "-" in that same <small> text.
# NOTE(review): the result may begin with whitespace if the page puts a space
# after the dash; presumably the consumer trims it before parsing -- confirm.
3 date: substring-after(//div[@class='alignright']/small, '-')
# Elements matching this expression (<div class="alignleft">) are presumably
# removed from the extracted content, per the site-config "strip" directive.
4 strip: //div[@class='alignleft']
# Sample article URL; presumably used to check that the rules above still match.
5 test_url: http://www.ritholtz.com/blog/2012/09/situational-awareness/