blob: e09f6692a8d4af23741c972d6514390465e87280 (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
|
# Site config for lifeweek.com.cn article pages.
# This filter is tested on:
# http://www.lifeweek.com.cn/2012/1211/39439.shtml
# http://www.lifeweek.com.cn/2013/0308/40213.shtml

# --- Metadata ---------------------------------------------------------------
# Title: the <h1> text up to (not including) the first '('.
# The plain //h1 pattern below is presumably the fallback for headlines that
# contain no '(' (substring-before yields an empty string in that case).
title: substring-before(//h1, '(')
title: //h1

# Date and author both come from the <li> items of the 'authorbox' list.
# The date pattern selects the list's <li> elements; the author pattern takes
# the text after the '作者:' label in the first <li> that has a preceding
# sibling <li>.
date: //ul[@class='authorbox']/li
author: substring-after(//ul[@class='authorbox']/li/following-sibling::li, '作者:')

# --- Pagination -------------------------------------------------------------
# The 'pagedown' anchor inside the page-turn list is the next-page link.
next_page_link: //div[@class='pageturn_list']/a[@class='pagedown']

# --- Article body -----------------------------------------------------------
# NOTE(review): the class value ends with a trailing space; an exact-match
# @class comparison depends on it, so it is kept verbatim. Confirm against the
# live markup before changing it.
body: //div[@class='original ']

# --- Elements removed from the extracted content ----------------------------
# Headline and author/date list (matched by the metadata patterns above).
strip: //h1
strip: //ul[@class='authorbox']

# Other elements removed by class or inline style, including the page-turn
# list used by next_page_link above.
strip: //span[@class='app_p']
strip: //div[@style='text-align:right;']
strip: //div[@class='pageturn_list']
strip: //div[@class='lifespeaks']
strip: //div[@class='vright fr']
strip: //div[@class='copyrt mg20']
strip: //div[@class='keyabout mg20']
strip: //ul[@class='readabout mg20']

# --- Self-test --------------------------------------------------------------
test_url: http://www.lifeweek.com.cn/2013/0308/40213.shtml
|