aboutsummaryrefslogtreecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/neh.gov.txt
diff options
context:
space:
mode:
authorNicolas Lœuillet <nicolas.loeuillet@gmail.com>2013-12-06 10:13:03 +0100
committerNicolas Lœuillet <nicolas.loeuillet@gmail.com>2013-12-06 10:13:03 +0100
commitac4d114214d820b20e18518a2dbc809337e39043 (patch)
tree27886128ef949b7f8dd174b0646b5a4d99883b44 /inc/3rdparty/site_config/standard/neh.gov.txt
parentd5501950e2470d52f6bf5954d2179010cdee0475 (diff)
downloadwallabag-ac4d114214d820b20e18518a2dbc809337e39043.tar.gz
wallabag-ac4d114214d820b20e18518a2dbc809337e39043.tar.zst
wallabag-ac4d114214d820b20e18518a2dbc809337e39043.zip
[add] new specific configuration files
Diffstat (limited to 'inc/3rdparty/site_config/standard/neh.gov.txt')
-rw-r--r--inc/3rdparty/site_config/standard/neh.gov.txt17
1 files changed, 17 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/neh.gov.txt b/inc/3rdparty/site_config/standard/neh.gov.txt
new file mode 100644
index 00000000..45136a2b
--- /dev/null
+++ b/inc/3rdparty/site_config/standard/neh.gov.txt
@@ -0,0 +1,17 @@
1#host configuration should be http://www.neh.gov/news/humanities/
2
3
4#meta data
5title:substring-after(substring-after(//title,':'),':')
6author:substring-after(//h2[@class = 'subHead'],'By')
7date:substring-before(substring-after(//title,':'),':')
8
9#img and caption handling
10wrap_in(small)://div[@id = 'mainContent']/table/descendant::p/descendant::text()
11wrap_in(fieldset)://div[@id = 'mainContent']/table
12
13# clean up
14strip: //table[@class = 'marginpaddingTop']
15strip: //h2[@class = 'subHead']
16
17test_url: http://www.neh.gov/news/humanities/2011-11/IslamicScholar.html
\ No newline at end of file