aboutsummaryrefslogblamecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/dr.dk.txt
blob: 7e46b0d66b7985cae084cebc7d79604046b341f0 (plain) (tree)
1
2
3
4
5
6
7
8
9








                                                                                                                             
title: //meta[@property='og:title']/@content
author: //div[@class='articleFunctions']//a
date: //meta[@name='pubdate']/@content

# Can you strip elements from the body only? It is required here (`//div[@class='articleContent']/p` breaks for some reason)
body: //div[@class='articleContent']

tidy: no
test_url: http://www.dr.dk/Nyheder/Udland/2011/10/24/150115.htm