# Extraction rules for article pages on www.chinamining.org (see test_url below).
# Presumably a Full-Text RSS style site config: one `directive: XPath` per line -- confirm
# against the consuming parser.
# NOTE(review): the integer in front of each directive looks like line-number residue from
# a copy/paste; verify that the parser tolerates it, or strip it.

# Title: the first <span> child of the element whose id is 'Content'.
1 title: //*[@id='Content']/span[1]
# Author: from the second <span>, keep the text before the first ')' and then what follows
# the first '(' in that prefix, i.e. the contents of the first parenthesised group.
2 author: substring-after(substring-before(//*[@id='Content']/span[2], ')'), '(')
# Date: from the same second <span>, keep the text after the first 'Updated: ' and before
# the next 'Counter'.
3 date: substring-before(substring-after(//*[@id='Content']/span[2], 'Updated: '), 'Counter')
# The two spans used above for title/author/date sit inside the body container, so they are
# listed under `strip` -- presumably to remove them from the extracted body; confirm.
5 strip: //*[@id='Content']/span[1]
6 strip: //*[@id='Content']/span[2]
# Body: the whole element with id 'Content'.
8 body: //*[@id='Content']
# Sample article URL for exercising these rules.
10 test_url: http://www.chinamining.org/News/2011-07-22/1311319069d48087.html