From 83020b993c9dc18093cbe213ef40afa03f33c124 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Nicolas=20L=C5=93uillet?= Date: Fri, 25 Oct 2013 15:50:16 +0200 Subject: parse dilbert.com --- inc/3rdparty/site_config/custom/dilbert.com.txt | 4 ++++ 1 file changed, 4 insertions(+) create mode 100644 inc/3rdparty/site_config/custom/dilbert.com.txt (limited to 'inc/3rdparty/site_config/custom') diff --git a/inc/3rdparty/site_config/custom/dilbert.com.txt b/inc/3rdparty/site_config/custom/dilbert.com.txt new file mode 100644 index 00000000..6c8d95a2 --- /dev/null +++ b/inc/3rdparty/site_config/custom/dilbert.com.txt @@ -0,0 +1,4 @@ +title: //div[contains(@class, 'SB_Title')]//a +body: //div[contains(@class, 'STR_Content')] + +test_url: http://dilbert.com/strips/comic/2013-10-22 \ No newline at end of file -- cgit v1.2.3 From e070b9b511aea783d9709acd014e759aaaf5f7e1 Mon Sep 17 00:00:00 2001 From: Jason Ghent Date: Sat, 30 Nov 2013 12:08:17 -0500 Subject: Added stackoverflow parsing. --- inc/3rdparty/site_config/custom/stackoverflow.com.txt | 4 ++++ 1 file changed, 4 insertions(+) create mode 100755 inc/3rdparty/site_config/custom/stackoverflow.com.txt (limited to 'inc/3rdparty/site_config/custom') diff --git a/inc/3rdparty/site_config/custom/stackoverflow.com.txt b/inc/3rdparty/site_config/custom/stackoverflow.com.txt new file mode 100755 index 00000000..d2eb984d --- /dev/null +++ b/inc/3rdparty/site_config/custom/stackoverflow.com.txt @@ -0,0 +1,4 @@ +title: //title +body: //div[@id='question']//div[contains(@class,'post-text')] | //div[@id='answers-header']//h2 | //div[contains(@class,'accepted-answer')]//div[contains(@class,'post-text')] + +test_url: http://stackoverflow.com/questions/20302422/calling-a-function-from-a-javascript-object -- cgit v1.2.3 From 2ab37d6205d3e4f7bfacf702de6755a924931751 Mon Sep 17 00:00:00 2001 From: Jason Ghent Date: Sat, 30 Nov 2013 13:00:24 -0500 Subject: Addition of stackexchange parser. --- inc/3rdparty/site_config/custom/stackexchange.com.txt | 4 ++++ 1 file changed, 4 insertions(+) create mode 100755 inc/3rdparty/site_config/custom/stackexchange.com.txt (limited to 'inc/3rdparty/site_config/custom') diff --git a/inc/3rdparty/site_config/custom/stackexchange.com.txt b/inc/3rdparty/site_config/custom/stackexchange.com.txt new file mode 100755 index 00000000..c9d44b1d --- /dev/null +++ b/inc/3rdparty/site_config/custom/stackexchange.com.txt @@ -0,0 +1,4 @@ +title: //title +body: //div[@id='question']//div[contains(@class,'post-text')] | //div[@id='answers-header']//h2 | //div[contains(@class,'accepted-answer')]//div[contains(@class,'post-text')] + +test_url: http://cstheory.stackexchange.com/questions/14811/what-is-the-enlightenment-im-supposed-to-attain-after-studying-finite-automata/14818#14818 -- cgit v1.2.3 From 4a84d94e91b2868145e222d235c1209ac9fe7f0b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Nicolas=20L=C5=93uillet?= Date: Fri, 3 Jan 2014 10:21:18 +0100 Subject: [add] config file for interviewmagazine.com --- inc/3rdparty/site_config/custom/interviewmagazine.com.txt | 4 ++++ 1 file changed, 4 insertions(+) create mode 100644 inc/3rdparty/site_config/custom/interviewmagazine.com.txt (limited to 'inc/3rdparty/site_config/custom') diff --git a/inc/3rdparty/site_config/custom/interviewmagazine.com.txt b/inc/3rdparty/site_config/custom/interviewmagazine.com.txt new file mode 100644 index 00000000..a9d4f8ca --- /dev/null +++ b/inc/3rdparty/site_config/custom/interviewmagazine.com.txt @@ -0,0 +1,4 @@ +title: //title +body: //div[contains(@class, 'block')] + +test_url: http://www.interviewmagazine.com/film/spike-jonze \ No newline at end of file -- cgit v1.2.3 From cb4fba5a333ac18b40665502e3de74249106cad4 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Nicolas=20L=C5=93uillet?= Date: Fri, 3 Jan 2014 10:22:12 +0100 Subject: [del] remove inthepoche.com config file, website has changed --- inc/3rdparty/site_config/custom/inthepoche.com.txt | 7 ------- 1 file changed, 7 deletions(-) delete mode 100644 inc/3rdparty/site_config/custom/inthepoche.com.txt (limited to 'inc/3rdparty/site_config/custom') diff --git a/inc/3rdparty/site_config/custom/inthepoche.com.txt b/inc/3rdparty/site_config/custom/inthepoche.com.txt deleted file mode 100644 index ede74b97..00000000 --- a/inc/3rdparty/site_config/custom/inthepoche.com.txt +++ /dev/null @@ -1,7 +0,0 @@ -title: //title -body: //div[@class='post-content'] - -prune: no -tidy: no - -test_url: http://www.inthepoche.com/?post/poche-hosting \ No newline at end of file -- cgit v1.2.3