diff options
author | Nicolas Lœuillet <nicolas.loeuillet@gmail.com> | 2013-12-23 02:28:56 -0800 |
---|---|---|
committer | Nicolas Lœuillet <nicolas.loeuillet@gmail.com> | 2013-12-23 02:28:56 -0800 |
commit | 60fc4f4b1ab37fbfe9021f3fa1395d66a4424ed2 (patch) | |
tree | 515c4b9c8286ae363f77722c91acb878151dc386 /inc/3rdparty/site_config/standard/searchengineland.com.txt | |
parent | cbfd5a1019f47fadefd8490dae9f039ae894298d (diff) | |
parent | da5fc42f615eeb45a702604970f94967507fb432 (diff) | |
download | wallabag-60fc4f4b1ab37fbfe9021f3fa1395d66a4424ed2.tar.gz wallabag-60fc4f4b1ab37fbfe9021f3fa1395d66a4424ed2.tar.zst wallabag-60fc4f4b1ab37fbfe9021f3fa1395d66a4424ed2.zip |
Merge pull request #363 from inthepoche/dev1.3.0
poche 1.3.0
Diffstat (limited to 'inc/3rdparty/site_config/standard/searchengineland.com.txt')
-rw-r--r-- | inc/3rdparty/site_config/standard/searchengineland.com.txt | 20 |
1 files changed, 20 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/searchengineland.com.txt b/inc/3rdparty/site_config/standard/searchengineland.com.txt new file mode 100644 index 00000000..f176d7c7 --- /dev/null +++ b/inc/3rdparty/site_config/standard/searchengineland.com.txt | |||
@@ -0,0 +1,20 @@ | |||
1 | body: //div[@class="storyBox"] | ||
2 | title: //div[@class="storyBox"]/h1 | ||
3 | author: //a[@rel="author"] | ||
4 | date: substring-before(//span[@class="dateline"], 'by') | ||
5 | |||
6 | #Removes related content but cleans up article text | ||
7 | strip: //h1 | ||
8 | strip: //p[@class="homeStory tdmSideInfo"] | ||
9 | strip: //div[@id="bylineShare"] | ||
10 | strip: //script | ||
11 | strip: //hr | ||
12 | |||
13 | strip_id_or_class: homeStory | ||
14 | strip_id_or_class: authorpic | ||
15 | strip_id_or_class: insideComments | ||
16 | strip_id_or_class: authorbio | ||
17 | strip_id_or_class: gpt-ad-sel-cube | ||
18 | strip_id_or_class: smxTextAd | ||
19 | |||
20 | test_url: http://searchengineland.com/googles-jaw-dropping-sponsored-post-campaign-for-chrome-106348 \ No newline at end of file | ||