From 90a1a78b1e2f4d40e1d9b8e6f46aca129a9d7bcf Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Nicolas=20L=C5=93uillet?=
Date: Mon, 27 Oct 2014 06:46:13 +0100
Subject: updated site_config

---
 inc/3rdparty/site_config/standard/bit-tech.net.txt | 19 +++++++++++++++++++
 1 file changed, 19 insertions(+)
 create mode 100755 inc/3rdparty/site_config/standard/bit-tech.net.txt

(limited to 'inc/3rdparty/site_config/standard/bit-tech.net.txt')

diff --git a/inc/3rdparty/site_config/standard/bit-tech.net.txt b/inc/3rdparty/site_config/standard/bit-tech.net.txt
new file mode 100755
index 00000000..c6f5b204
--- /dev/null
+++ b/inc/3rdparty/site_config/standard/bit-tech.net.txt
@@ -0,0 +1,19 @@
+body: //div[@id='column_1']
+next_page_link: //div[@class='next']/a[not(contains(@href, '/comments') or contains(@href, '/news/'))]
+prune: no
+
+author: substring-after(//p[@class='byline'], 'by ')
+date: substring-before(substring-after(//p[@class='byline'], 'on '), ' by')
+
+strip: //h1
+strip_id_or_class: socialLinks
+strip_id_or_class: byline
+strip_id_or_class: pageSelector
+strip_id_or_class: articleTabs
+strip_id_or_class: pageNav
+strip_id_or_class: share
+strip_id_or_class: commentsContainer
+strip_id_or_class: below_article_related
+
+test_url: http://www.bit-tech.net/hardware/storage/2014/08/13/ocz-arc-100-240gb-review/1
+test_url: http://www.bit-tech.net/news/bits/2014/08/15/google-trojan/1
-- 
cgit v1.2.3