# Site extraction rules for time.com article pages (see test_url below).
# One directive per line: `key: value`. Values for title/author/date/body/strip
# are XPath expressions evaluated against the article page.

# --- Metadata -----------------------------------------------------------
# Headline: an <h1> whose class attribute contains 'article-title'.
title: //h1[contains(@class, 'article-title')]
# Byline: a <span> with a class containing 'byline', anywhere inside <article>.
author: //article//span[contains(@class, 'byline')]
# Publication date: the datetime attribute of a <time> element carrying @pubdate.
date: //time[@pubdate]/@datetime

# --- Content ------------------------------------------------------------
# Article text container: a <section> whose class contains 'article-body'.
body: //section[contains(@class, 'article-body')]

# --- Extractor options --------------------------------------------------
# Both automatic passes are switched off for this site.
# NOTE(review): per the Full-Text RSS docs, `prune` is the post-extraction
# clean-up of the body and `tidy` is the HTML Tidy pre-processing step;
# confirm against the extractor version in use.
prune: no
tidy: no

# --- Elements removed from the extracted content ------------------------
# Image/figure captions.
strip: //figcaption
# Paragraphs that contain the text 'MORE:' and have a direct <a> child
# (inline cross-promotion links to other articles).
strip: //p[contains(., 'MORE:') and ./a]
# Any <aside> element.
strip: //aside

# --- Sample page for verifying the rules above --------------------------
test_url: http://time.com/14478/emotions-may-not-be-so-universal-after-all/