diff options
author | Nicolas Lœuillet <nicolas@loeuillet.org> | 2014-07-13 10:15:40 +0200 |
---|---|---|
committer | Nicolas Lœuillet <nicolas@loeuillet.org> | 2014-07-13 10:15:40 +0200 |
commit | 4e067ceabd705201a16b4c92cf4b23f3b990326c (patch) | |
tree | 939f3a8e5ff3ab9ee414a57a895d3e78e1d46ce3 /inc/3rdparty/site_config/standard/bt.no.txt | |
parent | 58dbe103889148def78b0fc8744d3f94c56a1561 (diff) | |
download | wallabag-4e067ceabd705201a16b4c92cf4b23f3b990326c.tar.gz wallabag-4e067ceabd705201a16b4c92cf4b23f3b990326c.tar.zst wallabag-4e067ceabd705201a16b4c92cf4b23f3b990326c.zip |
updated specific configuration for parsing
Diffstat (limited to 'inc/3rdparty/site_config/standard/bt.no.txt')
-rwxr-xr-x | inc/3rdparty/site_config/standard/bt.no.txt | 12 |
1 files changed, 12 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/bt.no.txt b/inc/3rdparty/site_config/standard/bt.no.txt new file mode 100755 index 00000000..200c2e4e --- /dev/null +++ b/inc/3rdparty/site_config/standard/bt.no.txt | |||
@@ -0,0 +1,12 @@ | |||
1 | title: //h1[contains(@class,'articleTitle')] | ||
2 | author: //span[@itemprop='name'] | ||
3 | date: //time[@class='published'] | ||
4 | body: //div[contains(@class,'bodyText')] | ||
5 | |||
6 | strip_id_or_class: 'pull1' | ||
7 | strip_id_or_class: 'relationArticle' | ||
8 | strip: //span[@class='quote'] | ||
9 | |||
10 | # strip h2 if at end of article (typically a request for comments) | ||
11 | strip: //div[contains(@class,'bodyText')]/node()[last()-1]/self::h2 | ||
12 | test_url: http://www.bt.no/meninger/debatt/Typisk-norsk-a-vare-god-nok-2884108.html \ No newline at end of file | ||