# Extraction rules: each key maps to an XPath 1.0 expression evaluated against the page.

# Title: the <b> whose class contains 'title', inside the header's <h1>.
1 title: //header/h1/b[contains(@class, 'title')]
# Author: text of the article header's <div> that follows the literal 'By '.
2 author: substring-after(//article/header/div, 'By ')
# Date: the <span> whose class contains 'date', inside the header's <h1>.
3 date: //header/h1/span[contains(@class, 'date')]
# Body: the <article> directly under the <div id="main"> container.
# (The closing quote after 'main' was missing, leaving the XPath string literal unterminated.)
4 body: //div[@id='main']/article
# Sample page for checking the rules above.
6 test_url: http://chrisltd.com/blog/2012/03/fix-widows-indesign/