From: Nicolas Lœuillet Date: Sat, 1 Aug 2015 19:20:43 +0000 (+0200) Subject: update config from @fivefilters X-Git-Tag: 1.9.1^2^2 X-Git-Url: https://git.immae.eu/?a=commitdiff_plain;h=refs%2Fpull%2F1266%2Fhead;p=github%2Fwallabag%2Fwallabag.git update config from @fivefilters --- diff --git a/inc/3rdparty/site_config/standard/20min.ch.txt b/inc/3rdparty/site_config/standard/20min.ch.txt new file mode 100755 index 00000000..cd8e3fc0 --- /dev/null +++ b/inc/3rdparty/site_config/standard/20min.ch.txt @@ -0,0 +1,24 @@ +# Author: cirnod@gmail.com + +tidy: no +prune: no + +title: //h1 +date: /html/body/div[3]/div[1]/div[6]/div/div[1]/div[2]/div[1]/div/p +body: //div[@class='published clearfix'] | //div[@class='story_titles']/h3 | //div[@class='story_text'] + +# General Cleanup +strip_id_or_class: info_panel +strip_id_or_class: info_poll +strip_id_or_class: teaser +strip_id_or_class: panelbox +strip_id_or_class: polls +strip_id_or_class: warning +strip_id_or_class: vplaceholder + +# visual removal only -> complete removal doesn't work +replace_string(Print): + +# Try yourself +test_url: http://www.20min.ch/wissen/news/story/31588952 +test_url: http://www.20min.ch/digital/dossier/apple/story/So-einfach-laesst-sich-das-iPhone-6-Plus-verbiegen-24651169 diff --git a/inc/3rdparty/site_config/standard/24.ae.txt b/inc/3rdparty/site_config/standard/24.ae.txt new file mode 100755 index 00000000..6e515076 --- /dev/null +++ b/inc/3rdparty/site_config/standard/24.ae.txt @@ -0,0 +1,8 @@ +title: //div[@id='DivTitle'] +body: //div[@id='divImages' or @id='Divkhabarcontent'] +author: //div[@id='DivAuthor'] + +prune: no + +test_url: http://24.ae/article.aspx?ArticleId=123304 +test_url: http://24.ae/rss.aspx?pageId=30 diff --git a/inc/3rdparty/site_config/standard/9gag.com.txt b/inc/3rdparty/site_config/standard/9gag.com.txt new file mode 100755 index 00000000..4ebb62ad --- /dev/null +++ b/inc/3rdparty/site_config/standard/9gag.com.txt @@ -0,0 +1,6 @@ +# Generated by FiveFilters.org's web-based selection tool +# Place this file inside your site_config/custom/ folder +# Source: http://siteconfig.fivefilters.org/grab.php?url=http%3A%2F%2F9gag.com%2Fgag%2FaDwQnO7 + +body: //div[contains(concat(' ',normalize-space(@class),' '),' badge-post-container ')] +test_url: http://9gag.com/gag/aDwQnO7 diff --git a/inc/3rdparty/site_config/standard/ad.nl.txt b/inc/3rdparty/site_config/standard/ad.nl.txt new file mode 100755 index 00000000..422faa57 --- /dev/null +++ b/inc/3rdparty/site_config/standard/ad.nl.txt @@ -0,0 +1,7 @@ +#bypass cookie check +single_page_link: //a[contains(@href, '/acceptCookieCheck.do?url=')] + +test_url: http://www.ad.nl/ad/nl/10444/Offside/article/detail/4043834/2015/05/31/Dani-Alves-voetbalt-met-drol-op-zijn-hoofd.dhtml +test_contains: De nieuwe coupe van Alves + +test_url: http://www.ad.nl/digitaal/rss.xml \ No newline at end of file diff --git a/inc/3rdparty/site_config/standard/albayan.ae.txt b/inc/3rdparty/site_config/standard/albayan.ae.txt index f6c093d2..d52700b3 100755 --- a/inc/3rdparty/site_config/standard/albayan.ae.txt +++ b/inc/3rdparty/site_config/standard/albayan.ae.txt @@ -1,5 +1,7 @@ body: //div[@id='main-column']//div[@class='content'] +strip_id_or_class: social-buttons + prune: no test_url: http://www.albayan.ae/across-the-uae/education/2013-08-29-1.1949645 diff --git a/inc/3rdparty/site_config/standard/androidpolice.com.txt b/inc/3rdparty/site_config/standard/androidpolice.com.txt index 8f9b1a21..660f29d9 100755 --- a/inc/3rdparty/site_config/standard/androidpolice.com.txt +++ b/inc/3rdparty/site_config/standard/androidpolice.com.txt @@ -1,5 +1,6 @@ body: //div[@class='post_content'] date: //div[@class='date_day'] | div[@class='date_month'] +strip_id_or_class: author-box +author: //h2[@class='author-box-heading']/a test_url: http://www.androidpolice.com/2014/03/30/music-boss-for-pebble-can-now-control-playback-and-volume-on-chromecast-content-from-your-smartwatch/ - diff --git a/inc/3rdparty/site_config/standard/artofmanliness.com.txt b/inc/3rdparty/site_config/standard/artofmanliness.com.txt new file mode 100755 index 00000000..b29ea0db --- /dev/null +++ b/inc/3rdparty/site_config/standard/artofmanliness.com.txt @@ -0,0 +1,6 @@ +parser: html5php +date: //article/p[contains(@class, 'single-date')] +author: //article/p[contains(@class, 'byline')] + +test_url: http://www.artofmanliness.com/2013/01/31/relationship-red-flags/ +test_contains: It seems that once we get close to a person \ No newline at end of file diff --git a/inc/3rdparty/site_config/standard/au.businessinsider.com.txt b/inc/3rdparty/site_config/standard/au.businessinsider.com.txt new file mode 100755 index 00000000..46bcddf2 --- /dev/null +++ b/inc/3rdparty/site_config/standard/au.businessinsider.com.txt @@ -0,0 +1,12 @@ +title://div[@class="sl-layout-post"]/h1 +body: //div[@id='content_post'] +strip: //div[contains(@class, "post-sidebar")] +strip: //div[@id='related-links'] +strip: //img[@class='size_xlarge'] +author://div[@class="byline"]/a +date://div[@class="byline"]/span[@class="date"] +prune: no +tidy: no + + +test_url: http://www.businessinsider.com/microsoft-just-put-one-of-its-hardcore-technical-geniuses-on-xbox-2012-1 diff --git a/inc/3rdparty/site_config/standard/au.news.yahoo.com.txt b/inc/3rdparty/site_config/standard/au.news.yahoo.com.txt new file mode 100755 index 00000000..8e84cbbb --- /dev/null +++ b/inc/3rdparty/site_config/standard/au.news.yahoo.com.txt @@ -0,0 +1,4 @@ +strip: //a[contains(text(), "RELATED:")] +author: //div[@class="info"]//span[@class="association printer-source"] +author: //div[@class="info"]//span[@class="stamp printer-date"] + diff --git a/inc/3rdparty/site_config/standard/bbc.co.uk.txt b/inc/3rdparty/site_config/standard/bbc.co.uk.txt index bad77654..7bef73ad 100755 --- a/inc/3rdparty/site_config/standard/bbc.co.uk.txt +++ b/inc/3rdparty/site_config/standard/bbc.co.uk.txt @@ -30,6 +30,12 @@ strip: //div[contains(@class, 'comment-introduction')] strip: //div[contains(@class, 'share-tools')] strip: //div[@id='also-related-links'] +find_string: http://ichef.bbci.co.uk/news/200/ +replace_string: http://ichef.bbci.co.uk/news/624/ + +find_string: http://ichef.bbci.co.uk/news/304/ +replace_string: http://ichef.bbci.co.uk/news/624/ + strip_id_or_class: share-help strip_id_or_class: comments_module diff --git a/inc/3rdparty/site_config/standard/bbc.com.txt b/inc/3rdparty/site_config/standard/bbc.com.txt index c04a683e..200dba63 100755 --- a/inc/3rdparty/site_config/standard/bbc.com.txt +++ b/inc/3rdparty/site_config/standard/bbc.com.txt @@ -33,6 +33,12 @@ strip: //div[@id='also-related-links'] strip_id_or_class: share-help strip_id_or_class: comments_module +find_string: http://ichef.bbci.co.uk/news/200/ +replace_string: http://ichef.bbci.co.uk/news/624/ + +find_string: http://ichef.bbci.co.uk/news/304/ +replace_string: http://ichef.bbci.co.uk/news/624/ + replace_string(