aboutsummaryrefslogblamecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/brookings.edu.txt
blob: 17a476056d6b6c9bf6547e66f5c506ba691a9cf9 (plain) (tree)
1
2
3
4
5
6
7
8
9
10
11










                                                                                   

                                                                                     
# Content-extraction rules for brookings.edu article pages.
# Each directive's value is an XPath expression evaluated against the page,
# except for convert_double_br_tags (a yes/no flag) and test_url (a URL).

# Headline: the <h1> inside the div whose id is 'contentheader'.
title: //div[@id='contentheader']/h1
# Author: child elements of <span class="author"> inside <p class="attribution">.
author: //p[@class='attribution']/span[@class='author']/*
# TODO: on articles with several authors this expression only yields the first
# one; work out an XPath (or additional author: lines) that captures them all.

# Publication date: the content attribute of <meta name="date"> in <head>.
date: /html/head/meta[@name="date"]/@content
# Article body container.
body: //div[@class='main-content']

# Elements matched by the strip: expressions below are presumably removed
# from the extracted body (byline, image gallery, callout boxes and the
# "add your view" block) -- confirm against the site-config documentation.
strip: //p[@class='byline']
strip: //div[@class='img-gallery']
strip: //div[@class='callout']
strip: //div[@class='add-your-view']
# NOTE(review): presumably makes the extractor treat consecutive <br> tags as
# paragraph breaks -- confirm against the site-config documentation.
convert_double_br_tags: yes
# Sample article URL for checking that the rules above still match.
test_url: http://www.brookings.edu/opinions/2011/1018_cyberattack_libya_goldsmith.aspx