aboutsummaryrefslogblamecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/uni-watch.com.txt
blob: cbe87d197c4f63084611d20b42e44843daabddb6 (plain) (tree)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
















                                                                                                      
# Site config for uni-watch.com article pages.

# The byline div is expected to read "By <author>, on <date>"; the two
# expressions below cut the author and the date out of that one string.
author: substring-before(substring-after(//div[@class='post-byline'], 'By '), ', on')
date: substring-after(//div[@class='post-byline'], ', on')

# Disabled: this rule was producing a "no text [48]" error (cause not yet
# identified). With no title rule here, the title is not taken from this config.
#title: //div[@class='post-headline']

# Match the body container by class *token* rather than by exact attribute
# value. An exact test (@class='post-bodycopy') selects nothing when the div
# carries any additional class, which would explain the earlier observation
# that the body rule did not isolate just the body copy.
# NOTE(review): confirm against the live markup that the div has extra classes.
body: //div[contains(concat(' ', normalize-space(@class), ' '), ' post-bodycopy ')]

# Safety net: strip everything else we don't want in the extracted content.
# These can probably all be removed once the body rule above is confirmed to
# select only the body copy.
strip_id_or_class: reply
strip_id_or_class: left
strip_id_or_class: post-headline
strip_id_or_class: post-byline
strip_id_or_class: footer

test_url: http://www.uni-watch.com/2011/10/18/the-curious-case-of-steve-debergs-microphone-and-speaker/