# Content-extraction rules for smithsonianmag.com article pages.
# Each rule is "directive: XPath expression"; the XPath is evaluated against the article HTML.

# Title: the <h1> whose id is 'articleTitle'.
2 title://h1[@id = 'articleTitle']
# Author: text of the first <li> in the 'byLine' list, with everything up to and including 'By ' removed.
3 author:substring-after(//ul[@id = 'byLine']/li[1],'By ')
# Date: from the last <li> of the 'byLine' list, the text between its first and second commas.
4 date:substring-before(substring-after(//ul[@id = 'byLine']/li[last()],','),',')
# Body: the <div> whose id is 'article-body'.
5 body://div[@id = 'article-body']
# Single-page link, first candidate: the <a> inside li.article-singlepage directly under a <td>.
8 single_page_link://td/li[@class = 'article-singlepage']/a
# Single-page link, second candidate: the <a> whose id is 'continue-btn'.
# NOTE(review): presumably the two patterns target different page layouts - confirm.
11 single_page_link: //a[@id='continue-btn']
# Image captions (span.articleImageCaptionwide): presumably wrapped in an <i> element - confirm against the parser.
14 wrap_in(i)://span[@class='articleImageCaptionwide']
# Presumably moves each <p> directly under div#articleImage into the caption span - confirm against the parser.
# NOTE(review): there is a space between 'move_into' and '('; verify the parser accepts it,
# and that it supports wrap_in / move_into at all.
15 move_into (//span[@class='articleImageCaptionwide'])://div[@id = 'articleImage']/p
# Elements matched by the strip rules are presumably removed from the extracted content:
# the pagination wrapper, the category breadcrumb list, and the "view more photos" block.
19 strip://p[@id = 'articlePaginationWrapper']
20 strip://ul[contains(@class, 'cat-breadcrumb')]
21 strip://div [@class= 'viewMorePhotos']
# Sample article URL, presumably used to test these rules.
23 test_url: http://www.smithsonianmag.com/history-archaeology/The-Goddess-Goes-Home.html