aboutsummaryrefslogtreecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/newyorker.com.txt
blob: 5624aa8c779f47f8f2992a7401599be2d5b67087 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
title: //h1[@id='articlehed'] | //h2[@id="articleintro"]
body: //div[@id='articletext']

strip: //ul[@id="bc"] | //div[@id="yrail"] | //div[@class="entry-keywords"] | //div[@class="entry-categories"] | //div[@class="socialUtils"] | //div[@id="footer"]

date: //h4[@id='articleauthor']/span[@class='dd dds']
date: //div[@id="pagebody"]/div[@class='hentry entry']/div[@class='published']

single_page_link: //div[@class='paginationViewSinglePage']/a
test_url: http://www.newyorker.com/online/blogs/culture/2012/06/mug-shot-web-sites.html