aboutsummaryrefslogtreecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/sportsillustrated.cnn.com.txt
blob: afc5879f1df280ee1aeb41c7759ce580b2badc82 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
# main sportsillustrated.com articles
#
# Article content: the div with id "cnnStoryContent".
body: //div[@id="cnnStoryContent"]
# Headline: any <h1> nested inside the div with id "cnnStoryHeadline".
title: //div[@id="cnnStoryHeadline"]//h1
# Byline: any <strong> nested inside the div with id "cnnSubBanner".
author: //div[@id="cnnSubBanner"]//strong
# Date: text of the "cnnTimeStamp" div that follows its leading label.
# Two expressions are listed, one per label ("Updated: " / "Posted: ").
# XPath substring-after() returns an empty string when the label is absent;
# presumably the extractor then falls back to the next date rule -- confirm.
date: substring-after(//div[@id="cnnTimeStamp"], "Updated: ")
date: substring-after(//div[@id="cnnTimeStamp"], "Posted: ")

# Remove the font-size buttons.
strip: //div[@id="cnnSCFontButtons"]

# Remove miscellaneous filler (videos, etc.).
# Both rules compare the full class attribute, so an element carrying
# additional classes is not matched by them.
strip: //div[@class="cnnDivideContent"]
strip: //*[@class="cnnTMbox"]

# SI Vault articles
# -------------
# These selectors use a different set of class names (siv_*) from the
# id-based selectors used for the main article layout.
# Article content: divs whose class attribute is exactly "siv_artPara".
body: //div[@class="siv_artPara"]
# Headline: any <h1> nested inside the "siv_artHeader" div.
title: //div[@class="siv_artHeader"]//h1
# Byline: div whose class attribute is exactly "byline".
author: //div[@class="byline"]
# Date: div whose class attribute is exactly "date"; no label is trimmed here.
date: //div[@class="date"]

# Multi-page articles: the link inside the "cnnStoryContinue" div points to
# the next page.
# NOTE(review): the cnn-prefixed id suggests this applies to the main article
# layout rather than to SI Vault pages -- confirm.
next_page_link: //div[@id='cnnStoryContinue']/a
# Remove elements whose id or class matches this string.
# NOTE(review): the value is all lowercase while the other cnn* identifiers in
# this file are camelCase; if matching is case-sensitive this rule may never
# match -- verify against a live page.
strip_id_or_class: cnnstorypagination

# Sample article URL for testing this config.
test_url: http://sportsillustrated.cnn.com/2012/writers/peter_king/02/27/combine/index.html