1 2 3 4 5 6 7 8
# Site extraction rules for aljazeera.com article pages.
# One directive per line, in `key: value` form; values are XPath expressions
# unless noted otherwise.

# Article headline element.
title: //span[@id='DetailedTitle']

# Container holding the article text.
body: //td[@id='tdTextContent']

# Remove elements whose id or class matches this string (plain string, not XPath).
strip_id_or_class: Skyscrapper_Body

# Publication date element.
date: //span[@id='ctl00_cphBody_lblDate']

# Author name: text of the link(s) inside the author info box.
author: //div[@id="dvAuthorInfo"]//a/text()

# Remove tables that wrap an embedded <object>.
# NOTE(review): this path requires an explicit <tbody> in the page markup;
# confirm the served HTML contains one, otherwise the rule matches nothing.
strip: //table[ tbody/tr/td/object ]

# Disable automatic pruning of the extracted body.
prune: no

# Sample article used to check these rules.
test_url: http://www.aljazeera.com/indepth/opinion/2012/01/2012114121925380575.html