aboutsummaryrefslogtreecommitdiffhomepage
path: root/inc/3rdparty/site_config/standard/bostonglobe.com.txt
diff options
context:
space:
mode:
authorNicolas Lœuillet <nicolas.loeuillet@gmail.com>2013-12-06 10:13:03 +0100
committerNicolas Lœuillet <nicolas.loeuillet@gmail.com>2013-12-06 10:13:03 +0100
commitac4d114214d820b20e18518a2dbc809337e39043 (patch)
tree27886128ef949b7f8dd174b0646b5a4d99883b44 /inc/3rdparty/site_config/standard/bostonglobe.com.txt
parentd5501950e2470d52f6bf5954d2179010cdee0475 (diff)
downloadwallabag-ac4d114214d820b20e18518a2dbc809337e39043.tar.gz
wallabag-ac4d114214d820b20e18518a2dbc809337e39043.tar.zst
wallabag-ac4d114214d820b20e18518a2dbc809337e39043.zip
[add] new specific configuration files
Diffstat (limited to 'inc/3rdparty/site_config/standard/bostonglobe.com.txt')
-rw-r--r--inc/3rdparty/site_config/standard/bostonglobe.com.txt16
1 files changed, 16 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/bostonglobe.com.txt b/inc/3rdparty/site_config/standard/bostonglobe.com.txt
new file mode 100644
index 00000000..d3e6f43f
--- /dev/null
+++ b/inc/3rdparty/site_config/standard/bostonglobe.com.txt
@@ -0,0 +1,16 @@
1# NOTE: If testing this configuration yields bad results, including junk text like "Try BostonGlobe.com today" and "THIS STORY APPEARED IN", please replace the Test URL with a current-day headline link from bostonglobe.com.
2
3title: //div[@class="header"]/h1
4author: substring-after(//div[@class="byline"]/h2[@class="author"],"By ")
5date: //div[@class="byline"]/p[last()]
6body: //div[@class="article-body"]
7
8strip_id_or_class: aside
9strip_id_or_class: promo
10strip_id_or_class: skip-nav
11strip_id_or_class: article-more
12strip_id_or_class: article-bar
13
14# This removes image captions. If the parser starts saving images from bostonglobe.com (currently, it does not), then this directive should be removed.
15strip_id_or_class: figure
16test_url: http://bostonglobe.com/news/nation/2012/03/17/illinois-primary-could-pivotal/PsDzFZqvhEYyXbOcF9FOkO/story.html
\ No newline at end of file