blob: 70d3d4373e02e3773ffcb4bcdb55443d1e860cf2 (
plain) (
tree)
|
|
# Content-extraction rules for The Register articles (see the test URLs at the bottom).

# Candidate link to a single-page version of the article: any <link> element
# whose href contains 'm.theregister'.
single_page_link: //link[contains(@href, 'm.theregister')]
# Condition for the single_page_link rule directly above: the page must contain
# a div with id 'nextpage'.
# NOTE(review): this condition appears to attach to the immediately preceding
# directive, so keep these two lines adjacent and in this order - confirm against
# the site-config parser before reordering.
if_page_contains: //div[@id='nextpage']

# Remove every div whose class attribute is exactly 'wptl btm' from the extracted content.
strip: //div[@class='wptl btm']

# Article content: the h2 found inside a div whose class contains 'article_head',
# together with the div whose id is 'body'.
body: //div[contains(@class,'article_head')]//h2 | //div[@id='body']

# Test case: multi-page article
test_url: http://www.theregister.co.uk/2015/07/06/geeks_guide_spaceguard_center/
# Test case: single-page article
test_url: http://www.theregister.co.uk/2015/07/06/us_japan_massive_robots_in_the_ring/
|