about | summary | refs | log | tree | commit | diff | homepage
path: root/inc/3rdparty/site_config/standard/searchengineland.com.txt
diff options
context:
space:
mode:
Diffstat (limited to 'inc/3rdparty/site_config/standard/searchengineland.com.txt')
-rw-r--r-- inc/3rdparty/site_config/standard/searchengineland.com.txt 20
1 files changed, 20 insertions, 0 deletions
diff --git a/inc/3rdparty/site_config/standard/searchengineland.com.txt b/inc/3rdparty/site_config/standard/searchengineland.com.txt
new file mode 100644
index 00000000..f176d7c7
--- /dev/null
+++ b/inc/3rdparty/site_config/standard/searchengineland.com.txt
@@ -0,0 +1,20 @@
1body: //div[@class="storyBox"]
2title: //div[@class="storyBox"]/h1
3author: //a[@rel="author"]
4date: substring-before(//span[@class="dateline"], 'by')
5
6# Removes related content and cleans up the article text
7strip: //h1
8strip: //p[@class="homeStory tdmSideInfo"]
9strip: //div[@id="bylineShare"]
10strip: //script
11strip: //hr
12
13strip_id_or_class: homeStory
14strip_id_or_class: authorpic
15strip_id_or_class: insideComments
16strip_id_or_class: authorbio
17strip_id_or_class: gpt-ad-sel-cube
18strip_id_or_class: smxTextAd
19
20test_url: http://searchengineland.com/googles-jaw-dropping-sponsored-post-campaign-for-chrome-106348
\ No newline at end of file