aboutsummaryrefslogtreecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/domusweb.it.txt
blob: 81683f02330f21109688290fb7557d8ae590c09c (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
# Site config for domusweb.it. The date selector and the test URL below both
# target the English ("/en/") section of the site.
#
# TODO: clean up the extra junk at the end of articles

# general text formatting
prune: no
convert_double_br_tags:yes

# where to find the basic metadata
author://a[@class='articleauthor']
date://a[starts-with(@href,'/en/search/published/')]
# Keep only the part of the <h2 class="title"> heading that precedes the em
# dash. The separator must be a literal U+2014 character saved as UTF-8: a
# mis-encoded (mojibake) separator never occurs in the page, which makes
# substring-before() return an empty string and therefore an empty title.
title:substring-before(//h2[@class='title'],'—')
body://div[@id='maincontainer']

# NOTE(review): presumably unwraps the comment-able blocks while keeping their
# contents in the body - confirm against the parser's "dissolve" handling.
dissolve://div[starts-with(@id,'commentableblock')]

# remove non-article elements from the body
strip://div[contains(@class,'domusnetwork')]
strip://div[contains(@class,'relative_wrapper')]

# image captions: drop the arrow image, then wrap the caption text in <em>
strip://div[contains(@class,'captionsubimage')]/img[contains(@class,'arrow')]
wrap_in(em): //div[contains(@class,'captionsubimage')]/span
test_url: http://www.domusweb.it/en/design/in-praise-of-lost-time/