about summary refs log tree commit diff homepage
path: root/inc/3rdparty/site_config/standard/slate.com.txt
diff options
context:
space:
mode:
Diffstat (limited to 'inc/3rdparty/site_config/standard/slate.com.txt')
-rw-r--r-- inc/3rdparty/site_config/standard/slate.com.txt 19
1 files changed, 19 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/slate.com.txt b/inc/3rdparty/site_config/standard/slate.com.txt
new file mode 100644
index 00000000..e92f6a06
--- /dev/null
+++ b/inc/3rdparty/site_config/standard/slate.com.txt
@@ -0,0 +1,19 @@
1title: //h1[@class="sl-art-head-dek"]
2body: //article//div[@class='sl-art-body']/div[contains(@class, 'body')]
3strip: //div[@class="department_kicker"]
4strip: //div[@id="insider_ad_wrapper" or @id="insider_ad_inner"]
5strip: //div[@id="bottom_sponsored_links"]
6strip: //div[@class="sl-art-ad-midflex"]
7#strip: //dl
8#strip: //p[em/a[contains(@href, 'facebook.com')]]
9prune: no
10
11author: //div[@id='author_bio']//a[contains(@href, '/author/')]
12author: //a[contains(@href, '/authors.')]
13
14date: substring-before(substring-after(//span[@class='sl-art-byline'], 'Posted '), ', at ')
15
16single_page_link: //a[@class='sl-art-sinpage']
17
18test_url: http://www.slate.com/id/2274583/pagenum/all/
19test_url: http://www.slate.com/id/2293116/
\ No newline at end of file