aboutsummaryrefslogtreecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/welt.de.txt
diff options
context:
space:
mode:
author Nicolas Lœuillet <nicolas@loeuillet.org> 2014-07-13 10:15:40 +0200
committer Nicolas Lœuillet <nicolas@loeuillet.org> 2014-07-13 10:15:40 +0200
commit4e067ceabd705201a16b4c92cf4b23f3b990326c (patch)
tree939f3a8e5ff3ab9ee414a57a895d3e78e1d46ce3 /inc/3rdparty/site_config/standard/welt.de.txt
parent58dbe103889148def78b0fc8744d3f94c56a1561 (diff)
downloadwallabag-4e067ceabd705201a16b4c92cf4b23f3b990326c.tar.gz
wallabag-4e067ceabd705201a16b4c92cf4b23f3b990326c.tar.zst
wallabag-4e067ceabd705201a16b4c92cf4b23f3b990326c.zip
updated specific configuration for parsing
Diffstat (limited to 'inc/3rdparty/site_config/standard/welt.de.txt')
-rwxr-xr-x[-rw-r--r--]inc/3rdparty/site_config/standard/welt.de.txt42
1 files changed, 21 insertions, 21 deletions
diff --git a/inc/3rdparty/site_config/standard/welt.de.txt b/inc/3rdparty/site_config/standard/welt.de.txt
index 6e4f828f..42e65e97 100644..100755
--- a/inc/3rdparty/site_config/standard/welt.de.txt
+++ b/inc/3rdparty/site_config/standard/welt.de.txt
@@ -1,22 +1,22 @@
1# set body 1# set body
2tidy: no 2tidy: no
3body: //div[contains(@class, 'articleContent')] 3body: //div[contains(@class, 'articleContent')]
4 4
5# remove clutter 5# remove clutter
6strip: //div[@class='advertising'] 6strip: //div[@class='advertising']
7strip: //div[@class='themenalarm'] 7strip: //div[@class='themenalarm']
8strip: //div[contains(@class, 'inTextTeaser')] 8strip: //div[contains(@class, 'inTextTeaser')]
9 9
10# remove captions 10# remove captions
11strip: //span[@class='copyRight'] 11strip: //span[@class='copyRight']
12 12
13# remove photo galleries and extras 13# remove photo galleries and extras
14strip: //div[contains(@class, 'textGallery')] 14strip: //div[contains(@class, 'textGallery')]
15strip: //div[contains(@class, 'videoGallery')] 15strip: //div[contains(@class, 'videoGallery')]
16strip: //div[contains(@class, 'imageGallery')] 16strip: //div[contains(@class, 'imageGallery')]
17strip: //div[contains(@class, 'openContent')] 17strip: //div[contains(@class, 'openContent')]
18 18
19# remove comments 19# remove comments
20strip: //div[@id = 'writeComment'] 20strip: //div[@id = 'writeComment']
21 21
22test_url: http://www.welt.de/vermischtes/weltgeschehen/article11050589/27-Bergleute-in-neuseelaendischer-Mine-vermisst.html \ No newline at end of file 22test_url: http://www.welt.de/vermischtes/weltgeschehen/article11050589/27-Bergleute-in-neuseelaendischer-Mine-vermisst.html \ No newline at end of file