blob: 29199242c2378bc9e0516089be5b9fb7d61ad146 (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
|
# Extraction rules for computerbase.de news pages (see test_url at the bottom).
# Each rule has the form `directive: XPath`; lines starting with `#` are comments.

# Title: taken from the <h1> element(s) of the page.
title://h1
# Author: the link(s) directly inside the <div> with id "news-meta".
author://div[@id="news-meta"]/a
# Body: the first <div> child of the element with id "main".
body://*[@id="main"]/div[1]
# Strip the second and third <div> children of "main".
# NOTE(review): presumably non-article blocks (e.g. comments/related links) - confirm against the live page.
strip://*[@id="main"]/div[2]
strip://*[@id="main"]/div[3]
# Strip any <footer> located under the element with id "page".
strip://*[@id="page"]//footer
# date: no rule is defined; the original author did not manage to get the date parsed.
# Images have to be stripped because the page presents them through an overlay.
strip://img
# Figures and their captions are stripped because they are not displayed in Instapaper.
strip://figure | //figcaption
# Sample article URL used to test these rules.
test_url: http://www.computerbase.de/news/2012-06/verbraucherzentrale-mahnt-blizzard-fuer-diablo-3-ab/
|