aboutsummaryrefslogtreecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/thedaily.com.txt
blob: 24ebbbacbc8055c181fd5a12487f83db1d578276 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
# Site extraction rules for thedaily.com article pages.
# NOTE(review): directive semantics are defined by the consuming parser, which
# is not visible in this file; the notes below describe the expressions
# themselves and mark anything parser-dependent as an assumption.

# Keep all body text (pruning is switched off for this site).
prune: no

# Title, body, and metadata selectors.
# Title: the <h1> directly inside the div whose class is exactly 'story_header'.
title: //div[@class='story_header']/h1
# Body: the div with id 'content'.
body: //div[@id='content']
# Three byline expressions, most specific first: the text after "by ", the text
# after "By ", and finally the whole byline span. XPath substring-after()
# yields an empty string when the marker is absent.
# NOTE(review): presumably the first expression with a non-empty result wins,
# so the order of these lines matters - confirm against the parser.
author: substring-after(//span[@class='byline'], "by ")
author: substring-after(//span[@class='byline'], "By ")
author: //span[@class='byline']
date: //span[@class='date']

# Formatting.
convert_double_br_tags: yes
# Targets each <li> under the <ul> directly inside the div with class 'slides_full'.
# NOTE(review): 'dissolve' presumably unwraps the matched element while keeping
# its children - confirm that the parser in use supports this directive.
dissolve: //div[@class='slides_full']/ul/li

# Cleanup: elements listed for removal from the extracted content.
strip: //a[@id='story_note']
# Matches every <br> in the document.
# NOTE(review): together with convert_double_br_tags above, this presumably
# drops the single line breaks left after paired ones are converted - confirm.
strip: //br
strip: //div[@class='intro']
strip: //div[@class='share-block']
strip: //div[@class='sidebar-social']
strip: //div[@class='top-stories']
strip: //div[@class='prevnext']
# Sample article URL for checking these rules.
test_url: http://www.thedaily.com/page/2012/01/09/010912-news-college-costs-1-5/