aboutsummaryrefslogblamecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/menshealth.com.txt
blob: e7e1e2697a53b6e186d629dc7b793556851e8243 (plain) (tree)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16















                                                                                                             
# TODO: find a way to strip the <span> elements that hold "related content" without also removing <span> elements that carry important article content

# Extraction rules for menshealth.com article pages.
# Directive names are kept lowercase: the site-config parser matches them
# case-sensitively, so a capitalised "Author:" line would be skipped.

# NOTE(review): the bracketed value "[yes]" is unusual — confirm the parser accepts it.
convert_double_br_tags: [yes]
#body: //div[@id='leftside']

# Headline: an <h1>, with <h2> as the alternative pattern.
title: //h1
title: //h2

# Byline: the text of the <h4> that follows either "By " or "By: ".
author: substring-after(//h4, 'By ')
author: substring-after(//h4, 'By: ')

# Blanket <span> removal is disabled (left commented out).
#Strip: //span

# Remove elements whose id or class matches these names.
strip_id_or_class: morefromcat
strip_id_or_class: mostpopular
strip_id_or_class: articlepagination
strip_id_or_class: toolbar

# Article content container.
body: //div[@id='zmodcontent']

# Link to the single-page (printer.php) version inside the "onepage" list item.
single_page_link: //li[@class='onepage'] //a[contains (@href, 'printer.php')]

test_url: http://www.menshealth.com/mhlists/pursuit_of_happiness/index.php