]>
Commit | Line | Data |
---|---|---|
ac4d1142 NL |
1 | title://h1[1]\r |
2 | \r | |
3 | author: substring-after(//em, 'Von ')\r | |
4 | author:string('tagesschau.de')\r | |
5 | \r | |
6 | date:substring-after(//div[@class='standDatum'], 'Stand: ')\r | |
7 | \r | |
8 | body://div[contains(@class, 'article')] | //div[contains(@class, 'centerCol')]\r | |
9 | \r | |
10 | strip://h1[1]\r | |
11 | strip: //div[contains(@class, 'directLinks')]\r | |
12 | strip: //div[contains(@class, 'zitatBox')]\r | |
13 | strip: //div[contains(@class, 'teaserBox metaBlock')]\r | |
14 | strip: //*[contains(@class, 'inv')]\r | |
15 | strip: //span[@class='imgSubline']\r | |
16 | strip: //*[contains(@class, 'topline')][1]\r | |
17 | strip: //div[@id='rightCol'][1]\r | |
18 | strip: //div[@id="footer"][1]\r | |
19 | strip: //div[@class="fPlayer"] \r | |
20 | strip: //div[@id='seitenanfang']\r | |
21 | strip: //div[@class='standDatum']\r | |
22 | strip: //em | |
23 | test_url: http://www.tagesschau.de/ausland/wahlkampffrankreich102.html |