From 62fec3cd16e6cbbbdb4eb344fba169b45045e34a Mon Sep 17 00:00:00 2001 From: juanjobe Date: Sat, 3 Oct 2015 14:39:22 +0200 Subject: Add support to timeshighereducation.com --- inc/3rdparty/site_config/standard/timeshighereducation.com.txt | 3 +++ 1 file changed, 3 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/timeshighereducation.com.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/timeshighereducation.com.txt b/inc/3rdparty/site_config/standard/timeshighereducation.com.txt new file mode 100644 index 00000000..ba52788d --- /dev/null +++ b/inc/3rdparty/site_config/standard/timeshighereducation.com.txt @@ -0,0 +1,3 @@ +body: //div[@class="col-md-12 radix-layouts-contentheader panel-panel"] +strip: //div[@class="htmlContent subscribe_box"] +test_url: https://www.timeshighereducation.com/blog/jeremy-corbyn-serious-about-free-higher-education -- cgit v1.2.3 From 5ae298b11fc54b58761bb383647382c4c792891c Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Sat, 3 Oct 2015 16:46:34 +0200 Subject: Add wired.de site config --- inc/3rdparty/site_config/standard/wired.de.txt | 8 ++++++++ 1 file changed, 8 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/wired.de.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/wired.de.txt b/inc/3rdparty/site_config/standard/wired.de.txt new file mode 100644 index 00000000..da88362f --- /dev/null +++ b/inc/3rdparty/site_config/standard/wired.de.txt @@ -0,0 +1,8 @@ +title: //meta[@name='Title']/@content +author: //meta[@name='Author']/@content +date: //meta[@name='DisplayDate']/@content +body: //div[@class='article-content'] +strip: //div[@class='article-sidebar'] + +test_url: https://www.wired.de/collection/latest/der-vw-skandal-zeigt-ohne-vertrauen-ist-software-nicht-mehr-als-bose-magie + -- cgit v1.2.3 From baa3184f422cdde85e0cd6ad152d5857bcbbb9e9 Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Sat, 
3 Oct 2015 17:05:12 +0200 Subject: Add Gara to wallabag --- inc/3rdparty/site_config/standard/naiz.eus.txt | 3 +++ 1 file changed, 3 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/naiz.eus.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/naiz.eus.txt b/inc/3rdparty/site_config/standard/naiz.eus.txt new file mode 100644 index 00000000..7914ccb3 --- /dev/null +++ b/inc/3rdparty/site_config/standard/naiz.eus.txt @@ -0,0 +1,3 @@ +body: //div[@class='widget full_article'] + +test_url: http://www.naiz.eus/eu/actualidad/noticia/20151002/adegi-afirma-que-los-jovenes-viven-una-vida-muy-comoda-y-no-tienen-hambre-para-emprender# -- cgit v1.2.3 From 2aab9e5ca98de361e1f2ecf582be56d77cc1aa76 Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Sat, 3 Oct 2015 17:16:17 +0200 Subject: Add esglobal.org --- inc/3rdparty/site_config/standard/esglobal.org.txt | 3 +++ 1 file changed, 3 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/esglobal.org.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/esglobal.org.txt b/inc/3rdparty/site_config/standard/esglobal.org.txt new file mode 100644 index 00000000..6408f441 --- /dev/null +++ b/inc/3rdparty/site_config/standard/esglobal.org.txt @@ -0,0 +1,3 @@ +body: //div[@class='blog-content'] + +test_url: http://www.esglobal.org/el-caos-en-el-este-los-socios-de-la-ue-necesitan-que-se-les-preste-atencion/ -- cgit v1.2.3 From bd5cfe87d41451544112d1b7bb57c3df06e80cd9 Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Sat, 3 Oct 2015 19:37:40 +0200 Subject: Add Deia.com --- inc/3rdparty/site_config/standard/deia.com.txt | 4 ++++ 1 file changed, 4 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/deia.com.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/deia.com.txt b/inc/3rdparty/site_config/standard/deia.com.txt new file mode 100644 index 
00000000..d2f78239 --- /dev/null +++ b/inc/3rdparty/site_config/standard/deia.com.txt @@ -0,0 +1,4 @@ +body: //div[@class='widget full_article'] +strip: //div[@class='Herramientas'] + +test_url: http://www.deia.com/2015/10/03/politica/euskadi/el-envilecimiento-de-la-politica-y-de-los-medios-de-comunicacion -- cgit v1.2.3 From d60ae41af9ca186feadff66190ecd701ebd21a93 Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Sat, 3 Oct 2015 20:24:43 +0200 Subject: Add bez.es --- inc/3rdparty/site_config/standard/bez.es.txt | 5 +++++ 1 file changed, 5 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/bez.es.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/bez.es.txt b/inc/3rdparty/site_config/standard/bez.es.txt new file mode 100644 index 00000000..cab7c6f7 --- /dev/null +++ b/inc/3rdparty/site_config/standard/bez.es.txt @@ -0,0 +1,5 @@ +body: //div[@class='text_art'] +strip: //div[@class='cab_datos_opinion'] +strip: //div[@class='sumario2_left'] + +test_url: http://www.bez.es/382758623/otros-fracasos-empresas.html -- cgit v1.2.3 From 84d62811e2d308a6142058c4b6bf1b149194821e Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Sun, 4 Oct 2015 21:33:15 +0200 Subject: Add diagonalperiodico.net --- inc/3rdparty/site_config/standard/diagonalperiodico.net.txt | 4 ++++ 1 file changed, 4 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/diagonalperiodico.net.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/diagonalperiodico.net.txt b/inc/3rdparty/site_config/standard/diagonalperiodico.net.txt new file mode 100644 index 00000000..f0681bac --- /dev/null +++ b/inc/3rdparty/site_config/standard/diagonalperiodico.net.txt @@ -0,0 +1,4 @@ +body: //div[@class='field__items'] +title: //div[@class='art_titulo'] + +test_url: https://www.diagonalperiodico.net/global/27947-cuanto-mas-tiempo-nos-aferremos-este-sistema-peor-y-menores-seran-nuestras-opciones -- 
cgit v1.2.3 From 465d18cc64160e2ce50ef8235ccb491d63acde98 Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Mon, 5 Oct 2015 22:17:26 +0200 Subject: Add aclu.org --- inc/3rdparty/site_config/standard/aclu.org.txt | 5 +++++ 1 file changed, 5 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/aclu.org.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/aclu.org.txt b/inc/3rdparty/site_config/standard/aclu.org.txt new file mode 100644 index 00000000..74236e2d --- /dev/null +++ b/inc/3rdparty/site_config/standard/aclu.org.txt @@ -0,0 +1,5 @@ +body: //div[@class='panel-panel panel-main-3 content-column'] +title: //div[@class='panel-pane pane-node-title'] +date: //div[@class='updated-date'] + +test_url: https://www.aclu.org/blog/free-future/chinas-nightmarish-citizen-scores-are-warning-americans -- cgit v1.2.3 From 13cbfe313eec63c16d3148803e7994a86ad18574 Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Tue, 6 Oct 2015 18:45:26 +0200 Subject: Add pieria.co.uk --- inc/3rdparty/site_config/standard/pieria.co.uk.txt | 3 +++ 1 file changed, 3 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/pieria.co.uk.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/pieria.co.uk.txt b/inc/3rdparty/site_config/standard/pieria.co.uk.txt new file mode 100644 index 00000000..31f2c84a --- /dev/null +++ b/inc/3rdparty/site_config/standard/pieria.co.uk.txt @@ -0,0 +1,3 @@ +body: //div[@id='article'] + +test_url: http://www.pieria.co.uk/articles/need_a_fiscal_rule_george__try_get_the_economy_growing -- cgit v1.2.3 From 2152c8707947c1873658c77e4bf7bf9bb31b29c4 Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Tue, 6 Oct 2015 18:45:43 +0200 Subject: Add thenews.coop --- inc/3rdparty/site_config/standard/thenews.coop.txt | 3 +++ 1 file changed, 3 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/thenews.coop.txt (limited to 
'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/thenews.coop.txt b/inc/3rdparty/site_config/standard/thenews.coop.txt new file mode 100644 index 00000000..7d593805 --- /dev/null +++ b/inc/3rdparty/site_config/standard/thenews.coop.txt @@ -0,0 +1,3 @@ +body: //div[@class='entry-content'] + +test_url: http://www.thenews.coop/98221/news/co-operatives/jeremy-corbyn-needs-co-op-movement/ -- cgit v1.2.3 From 692d1aae300fc43de6a9b08964f66fbd3e12536d Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Tue, 6 Oct 2015 18:45:57 +0200 Subject: Add rasgolatente.es --- inc/3rdparty/site_config/standard/rasgolatente.es.txt | 8 ++++++++ 1 file changed, 8 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/rasgolatente.es.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/rasgolatente.es.txt b/inc/3rdparty/site_config/standard/rasgolatente.es.txt new file mode 100644 index 00000000..84b75f4a --- /dev/null +++ b/inc/3rdparty/site_config/standard/rasgolatente.es.txt @@ -0,0 +1,8 @@ +nte.es.txt + +title: //div[@class='entry-title'] +author: //div[@class='entry-author'] +date: //div[@class='entry-time'] +body: //div[@class='entry-content'] + +test_url: http://rasgolatente.es/estupidez-psicologia-estupidos/ -- cgit v1.2.3 From 787209722804e3b4dc28acf39634115f3093c4cf Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Tue, 6 Oct 2015 18:53:38 +0200 Subject: Add rasgolatente.es --- inc/3rdparty/site_config/standard/rasgolatente.es.txt | 2 -- 1 file changed, 2 deletions(-) (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/rasgolatente.es.txt b/inc/3rdparty/site_config/standard/rasgolatente.es.txt index 84b75f4a..fcdbbd97 100644 --- a/inc/3rdparty/site_config/standard/rasgolatente.es.txt +++ b/inc/3rdparty/site_config/standard/rasgolatente.es.txt @@ -1,5 +1,3 @@ -nte.es.txt - title: //div[@class='entry-title'] author: 
//div[@class='entry-author'] date: //div[@class='entry-time'] -- cgit v1.2.3 From 5f3e7cb44b351103bfeed8688af51b61ffd12832 Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Wed, 14 Oct 2015 20:51:05 +0200 Subject: Corrections to chronicle.com --- inc/3rdparty/site_config/standard/chronicle.com.txt | 15 ++++----------- 1 file changed, 4 insertions(+), 11 deletions(-) (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/chronicle.com.txt b/inc/3rdparty/site_config/standard/chronicle.com.txt index e86d3eca..227a03c7 100755 --- a/inc/3rdparty/site_config/standard/chronicle.com.txt +++ b/inc/3rdparty/site_config/standard/chronicle.com.txt @@ -1,17 +1,10 @@ title: //h1[contains(@class, "entry-title")] author: //p[contains(@class, "byline")] -# blog articles (chronicle.com/blogs/*) -body: //div[contains(@class, "abstract")] -date: //p[contains(@class, "time")] - # all (?) other articles -body: //div[@id="article-body"] +body: //div[@class="content-item__story"] date: //p[contains(@class, "dateline")] -# remove sidebars containing images (I assume this is desired for Instapaper) -strip: //div[@id="related"] -strip: //div[contains(@class, "image")] - -# note that if you're not a Chronicle subscriber (personally or institutionally), you'll only see the first couple of paragraphs of the article, and Instapaper will display that with some crap above and below. 
thank goodness for that bookmarklet -test_url: http://chronicle.com/article/In-a-Land-of-Second-Chances/128375/ \ No newline at end of file +# note that if you're not a Chronicle subscriber (personally or institutionally), you'll only see the first couple of paragraphs of the article, and Instapaper will display that with some crap above and below. thank goodness for that bookmarklet +test_url: http://chronicle.com/article/In-a-Land-of-Second-Chances/128375/ +test_url: http://chronicle.com/blogs/wiredcampus/university-run-boot-camps-offer-students-marketable-skills-but-not-course-credit/57494 -- cgit v1.2.3 From 0d2d2e76aed97e32d13edf17b86839d20e1ede3c Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Wed, 14 Oct 2015 23:24:36 +0200 Subject: Correction to naiz.eus --- inc/3rdparty/site_config/standard/naiz.eus.txt | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/naiz.eus.txt b/inc/3rdparty/site_config/standard/naiz.eus.txt index 7914ccb3..9e48333a 100644 --- a/inc/3rdparty/site_config/standard/naiz.eus.txt +++ b/inc/3rdparty/site_config/standard/naiz.eus.txt @@ -1,3 +1,4 @@ -body: //div[@class='widget full_article'] +body: //div[contains(@class,'widget full_article')] test_url: http://www.naiz.eus/eu/actualidad/noticia/20151002/adegi-afirma-que-los-jovenes-viven-una-vida-muy-comoda-y-no-tienen-hambre-para-emprender# +test_url: http://www.naiz.eus/eu/actualidad/noticia/20151012/podemos-euskadi-critica-que-otegi-y-sus-companeros-quieran-pasar-por-grandes-pacifistas -- cgit v1.2.3 From 4715490858114b7870533e3f988db74fea9fdd81 Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Mon, 7 Dec 2015 14:53:53 +0100 Subject: Add lawfareblog.com --- inc/3rdparty/site_config/standard/lawfareblog.com.txt | 4 ++++ 1 file changed, 4 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/lawfareblog.com.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/lawfareblog.com.txt 
b/inc/3rdparty/site_config/standard/lawfareblog.com.txt new file mode 100644 index 00000000..49d858a7 --- /dev/null +++ b/inc/3rdparty/site_config/standard/lawfareblog.com.txt @@ -0,0 +1,4 @@ +body: //div[@class='field-items'] +title: //div[@class='title'] + +test_url: https://lawfareblog.com/limits-panopticon -- cgit v1.2.3 From d536b6d9b7d52cfeec45dae5cbfb9857218cc85d Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Mon, 7 Dec 2015 14:54:15 +0100 Subject: Add letraslibres.com --- inc/3rdparty/site_config/standard/letraslibres.com.txt | 3 +++ 1 file changed, 3 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/letraslibres.com.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/letraslibres.com.txt b/inc/3rdparty/site_config/standard/letraslibres.com.txt new file mode 100644 index 00000000..cf271bca --- /dev/null +++ b/inc/3rdparty/site_config/standard/letraslibres.com.txt @@ -0,0 +1,3 @@ +single_page_link: concat(link[@rel="canonical"], "?page=full") + +test_url: http://www.letraslibres.com/revista/dossier/quien-manda-en-europa -- cgit v1.2.3 From 086bf93f2b886592d13c9d9105ddcfd179797ee0 Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Wed, 9 Dec 2015 18:09:34 +0100 Subject: Modified blog.cloudflare.com --- inc/3rdparty/site_config/standard/blog.cloudflare.com.txt | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/blog.cloudflare.com.txt b/inc/3rdparty/site_config/standard/blog.cloudflare.com.txt index db80a35f..2f9a5a2f 100755 --- a/inc/3rdparty/site_config/standard/blog.cloudflare.com.txt +++ b/inc/3rdparty/site_config/standard/blog.cloudflare.com.txt @@ -1,9 +1,10 @@ # Instapaper gets this back to front and only gets the blog title instead of the article title. 
-title: substring-before(//title, '-') +title: //div[@class='title'] author: //a[ contains(@href, '/people') ] -body: //div[ @class='post' ] +body: //div[ @class='post-content' ] # Date is impossible to retrieve since they use those stupid "fuzzy" dates, inserted through javascript, at posterous. -test_url: http://blog.cloudflare.com/understanding-analytics-when-is-a-page-view-n \ No newline at end of file +test_url: http://blog.cloudflare.com/understanding-analytics-when-is-a-page-view-n +test_url: https://blog.cloudflare.com/sha-1-deprecation-no-browser-left-behind -- cgit v1.2.3 From 04b64c9d49fe4cfcfeb63ea84c724c6a66d306d9 Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Mon, 21 Dec 2015 22:38:19 +0100 Subject: Add popehat.com --- inc/3rdparty/site_config/standard/popehat.com.txt | 6 ++++++ 1 file changed, 6 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/popehat.com.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/popehat.com.txt b/inc/3rdparty/site_config/standard/popehat.com.txt new file mode 100644 index 00000000..45b76ae1 --- /dev/null +++ b/inc/3rdparty/site_config/standard/popehat.com.txt @@ -0,0 +1,6 @@ +title: //div[@class='entry-title'] +author: //div[@class='entry-author'] +date: //div[@class='entry-time'] +body: //div[@class='entry-content'] + +test_url: https://popehat.com/2015/12/16/eric-posner-the-first-amendments-nemesis/ -- cgit v1.2.3 From 23aed1cd4c03c90ddf6c5dfe00c23eb906c3cba8 Mon Sep 17 00:00:00 2001 From: Juanjo Benages Date: Sun, 17 Jan 2016 18:49:17 +0100 Subject: Add caffereggio.net --- inc/3rdparty/site_config/standard/caffereggio.net.txt | 3 +++ 1 file changed, 3 insertions(+) create mode 100644 inc/3rdparty/site_config/standard/caffereggio.net.txt (limited to 'inc/3rdparty/site_config/standard') diff --git a/inc/3rdparty/site_config/standard/caffereggio.net.txt b/inc/3rdparty/site_config/standard/caffereggio.net.txt new file mode 100644 index 00000000..08e1f05a 
--- /dev/null +++ b/inc/3rdparty/site_config/standard/caffereggio.net.txt @@ -0,0 +1,3 @@ +body: //div[@class="pf-content"] + +test_url: http://www.caffereggio.net/2016/01/16/115327/ -- cgit v1.2.3