diff options
Diffstat (limited to 'inc/3rdparty/site_config/standard/wmnf.org.txt')
-rwxr-xr-x[-rw-r--r--] | inc/3rdparty/site_config/standard/wmnf.org.txt | 22 |
1 files changed, 11 insertions, 11 deletions
diff --git a/inc/3rdparty/site_config/standard/wmnf.org.txt b/inc/3rdparty/site_config/standard/wmnf.org.txt index ffb6b2d1..1d403a91 100644..100755 --- a/inc/3rdparty/site_config/standard/wmnf.org.txt +++ b/inc/3rdparty/site_config/standard/wmnf.org.txt | |||
@@ -1,13 +1,13 @@ | |||
1 | title: //div[@class="bodyText"]/h1/text() | 1 | title: //div[@class="bodyText"]/h1/text() |
2 | body: //div[@class="bodyText"] | 2 | body: //div[@class="bodyText"] |
3 | 3 | ||
4 | # author and date are separated by only a newline | 4 | # author and date are separated by only a newline |
5 | # can't figure out how to tokenize that yet | 5 | # can't figure out how to tokenize that yet |
6 | author: //div[@class="bodyText"]/span[@class="info"]/text() | 6 | author: //div[@class="bodyText"]/span[@class="info"]/text() |
7 | date: //div[@class="bodyText"]/span[@class="info"]/text() | 7 | date: //div[@class="bodyText"]/span[@class="info"]/text() |
8 | 8 | ||
9 | # strip metadata from body text | 9 | # strip metadata from body text |
10 | strip: //div[@class="bodyText"]/h1/text() | 10 | strip: //div[@class="bodyText"]/h1/text() |
11 | strip: //div[@class="bodyText"]/span[@class="info"] | 11 | strip: //div[@class="bodyText"]/span[@class="info"] |
12 | strip: //div[@class="bodyText"]/span[@class="info"] | 12 | strip: //div[@class="bodyText"]/span[@class="info"] |
13 | test_url: http://www.wmnf.org/news_stories/light-rail-advocates-join-forces-to-combat-opposition-in-pinellas \ No newline at end of file | 13 | test_url: http://www.wmnf.org/news_stories/light-rail-advocates-join-forces-to-combat-opposition-in-pinellas \ No newline at end of file |