diff options
author | tcit <tcit@tcit.fr> | 2014-09-27 17:54:13 +0200 |
---|---|---|
committer | tcit <tcit@tcit.fr> | 2014-09-27 17:54:13 +0200 |
commit | 04a7674bdd20f2f24b32de69c086ecffdf20ceb4 (patch) | |
tree | bcc26634c68a8689ad511513c316058647e90789 /inc/3rdparty/site_config/standard/.about.com.txt | |
parent | 657245dcbdbca323621952d2b6f9e991dd94fa03 (diff) | |
parent | a15108e65b12ceaf50821783bcaa1ee3fee10d13 (diff) | |
download | wallabag-04a7674bdd20f2f24b32de69c086ecffdf20ceb4.tar.gz wallabag-04a7674bdd20f2f24b32de69c086ecffdf20ceb4.tar.zst wallabag-04a7674bdd20f2f24b32de69c086ecffdf20ceb4.zip |
merge refactor and dev
Diffstat (limited to 'inc/3rdparty/site_config/standard/.about.com.txt')
-rw-r--r-- | inc/3rdparty/site_config/standard/.about.com.txt | 14 |
1 files changed, 14 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/.about.com.txt b/inc/3rdparty/site_config/standard/.about.com.txt new file mode 100644 index 00000000..e1ebaee3 --- /dev/null +++ b/inc/3rdparty/site_config/standard/.about.com.txt | |||
@@ -0,0 +1,14 @@ | |||
1 | body: //div[@id='articlebody'] | ||
2 | title: //h1 | ||
3 | author: //p[@id='by']//a | ||
4 | |||
5 | next_page_link: //span[@class='next']/a | ||
6 | # Pagination link to the next page; not the same as the inline 'Next: ' links stripped below! | |
7 | |||
8 | prune: yes | ||
9 | tidy: no | ||
10 | |||
11 | # Annoying 'next' links plainly inside the article body | ||
12 | strip: //*[text()[contains(.,'Next: ')]] | ||
13 | |||
14 | test_url: http://psychology.about.com/od/theoriesofpersonality/ss/defensemech.htm | ||