aboutsummaryrefslogtreecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/blogs.scientificamerican.com.txt
diff options
context:
space:
mode:
Diffstat (limited to 'inc/3rdparty/site_config/standard/blogs.scientificamerican.com.txt')
-rw-r--r--inc/3rdparty/site_config/standard/blogs.scientificamerican.com.txt16
1 files changed, 16 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/blogs.scientificamerican.com.txt b/inc/3rdparty/site_config/standard/blogs.scientificamerican.com.txt
new file mode 100644
index 00000000..a7d15081
--- /dev/null
+++ b/inc/3rdparty/site_config/standard/blogs.scientificamerican.com.txt
@@ -0,0 +1,16 @@
1# meta data
2title://h1[@class = 'postTitle']
3author:substring-before(substring-after(//span[@class = 'byline'],'By '),'|')
4date://span[@class = 'datestamp']
5
6#body content
7body://div[@id = 'singleBlogPost']
8
9#reclaim author info
10move_into(//div[@id = 'singleBlogPost'])://div[@id = 'aboutAuthorDiv']
11strip://p[@class = 'moreLink mobileHide']
12
13# clean up the comments section; it may contain unclosed <div> elements
14strip://div[@id = 'comments2']
15strip://h3[a[@href = '#add-comment']]
16test_url: http://blogs.scientificamerican.com/a-blog-around-the-clock/2012/07/10/science-blogs-definition-and-a-history/
\ No newline at end of file