aboutsummaryrefslogtreecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/welt.de.txt
diff options
context:
space:
mode:
author Nicolas Lœuillet <nicolas.loeuillet@gmail.com> 2013-12-06 10:13:03 +0100
committer Nicolas Lœuillet <nicolas.loeuillet@gmail.com> 2013-12-06 10:13:03 +0100
commitac4d114214d820b20e18518a2dbc809337e39043 (patch)
tree27886128ef949b7f8dd174b0646b5a4d99883b44 /inc/3rdparty/site_config/standard/welt.de.txt
parentd5501950e2470d52f6bf5954d2179010cdee0475 (diff)
downloadwallabag-ac4d114214d820b20e18518a2dbc809337e39043.tar.gz
wallabag-ac4d114214d820b20e18518a2dbc809337e39043.tar.zst
wallabag-ac4d114214d820b20e18518a2dbc809337e39043.zip
[add] new specific configuration files
Diffstat (limited to 'inc/3rdparty/site_config/standard/welt.de.txt')
-rw-r--r--inc/3rdparty/site_config/standard/welt.de.txt22
1 files changed, 22 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/welt.de.txt b/inc/3rdparty/site_config/standard/welt.de.txt
new file mode 100644
index 00000000..6e4f828f
--- /dev/null
+++ b/inc/3rdparty/site_config/standard/welt.de.txt
@@ -0,0 +1,22 @@
1# set body
2tidy: no
3body: //div[contains(@class, 'articleContent')]
4
5# remove clutter
6strip: //div[@class='advertising']
7strip: //div[@class='themenalarm']
8strip: //div[contains(@class, 'inTextTeaser')]
9
10# remove captions
11strip: //span[@class='copyRight']
12
13# remove photo galleries and extras
14strip: //div[contains(@class, 'textGallery')]
15strip: //div[contains(@class, 'videoGallery')]
16strip: //div[contains(@class, 'imageGallery')]
17strip: //div[contains(@class, 'openContent')]
18
19# remove comments
20strip: //div[@id = 'writeComment']
21
22test_url: http://www.welt.de/vermischtes/weltgeschehen/article11050589/27-Bergleute-in-neuseelaendischer-Mine-vermisst.html
\ No newline at end of file