# Site-specific extraction rules for domusweb.it article pages (sample page: see test_url at the end).
# One rule per line in the form "directive: value"; most values are XPath 1.0 expressions.
1 # TODO: clean up the extra junk at the end of articles
3 # general text formatting
# NOTE(review): presumably makes the parser treat consecutive <br> tags as paragraph breaks -- confirm against the parser documentation.
5 convert_double_br_tags:yes
7 # where to find the basic metadata
# Author: <a> elements whose class attribute is exactly 'articleauthor'.
8 author://a[@class='articleauthor']
# Date: <a> elements whose href begins with the '/en/search/published/' path.
9 date://a[starts-with(@href,'/en/search/published/')]
# Title: the text of the first <h2 class="title"> up to (not including) the first em dash.
# NOTE(review): substring-before() returns an empty string when the heading contains no em dash -- confirm every article title has one.
10 title:substring-before(//h2[@class='title'],'—')
# Body: the <div id="maincontainer"> element.
11 body://div[@id='maincontainer']
# Targets <div>s whose id starts with 'commentableblock'.
# NOTE(review): 'dissolve' presumably removes the wrapper element while keeping its children -- confirm.
13 dissolve://div[starts-with(@id,'commentableblock')]
# Remove <div>s whose class contains 'domusnetwork' or 'relative_wrapper'.
16 strip://div[contains(@class,'domusnetwork')]
17 strip://div[contains(@class,'relative_wrapper')]
# Image captions: remove <img> children with 'arrow' in their class from 'captionsubimage' <div>s.
19 strip://div[contains(@class,'captionsubimage')]/img[contains(@class,'arrow')]
# NOTE(review): presumably wraps each <span> child of a 'captionsubimage' <div> in an <em> element -- confirm.
20 wrap_in(em): //div[contains(@class,'captionsubimage')]/span
# Sample article URL for checking these rules.
21 test_url: http://www.domusweb.it/en/design/in-praise-of-lost-time/