aboutsummaryrefslogtreecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/handelsblatt.com.txt
diff options
context:
space:
mode:
authorNicolas Lœuillet <nicolas@loeuillet.org>2014-07-13 10:15:40 +0200
committerNicolas Lœuillet <nicolas@loeuillet.org>2014-07-13 10:15:40 +0200
commit4e067ceabd705201a16b4c92cf4b23f3b990326c (patch)
tree939f3a8e5ff3ab9ee414a57a895d3e78e1d46ce3 /inc/3rdparty/site_config/standard/handelsblatt.com.txt
parent58dbe103889148def78b0fc8744d3f94c56a1561 (diff)
downloadwallabag-4e067ceabd705201a16b4c92cf4b23f3b990326c.tar.gz
wallabag-4e067ceabd705201a16b4c92cf4b23f3b990326c.tar.zst
wallabag-4e067ceabd705201a16b4c92cf4b23f3b990326c.zip
updated specific configuration for parsing
Diffstat (limited to 'inc/3rdparty/site_config/standard/handelsblatt.com.txt')
-rwxr-xr-xinc/3rdparty/site_config/standard/handelsblatt.com.txt31
1 files changed, 31 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/handelsblatt.com.txt b/inc/3rdparty/site_config/standard/handelsblatt.com.txt
new file mode 100755
index 00000000..7d067aa6
--- /dev/null
+++ b/inc/3rdparty/site_config/standard/handelsblatt.com.txt
@@ -0,0 +1,31 @@
1# Single Page
2single_page_link: //li[contains(@class,"hcf-print")]/a
3
4# Title hcf-headline
5title: //span[@class='hcf-headline']
6
7# Authors
8author: //div[@class="hcf-author"]/a/text()
9author: substring-after(//div[@class='hcf-author'], 'von ')
10
11# Date
12date: //div[@class='hcf-article-date']
13
14# Body
15body: //div[@class='article']
16
17# General removals
18strip: //div[contains(@class,"hcf-smartbox")]
19strip: //div[contains(@class,"hcf-stopper")]
20strip: //div[contains(@class,"hcf-img-controls")]
21strip: //span[@class='hcf-location-mark']
22strip: //span[@class='hcf-copyright']
23strip: //div[@class='hcf-copyright']
24strip: //div[@class='hcf-origin']
25
26
27
28
29# Fix picture captions
30wrap_in(small): //div[@class="hcf-caption"]
31test_url: http://www.handelsblatt.com/meinung/gastbeitraege/gastkommentar-zum-emissionshandel-kurskorrekturen-fuehren-zum-kentern/8044326.html \ No newline at end of file