diff options
Diffstat (limited to 'inc/3rdparty/site_config/standard/searchengineland.com.txt')
-rwxr-xr-x[-rw-r--r--] | inc/3rdparty/site_config/standard/searchengineland.com.txt | 36 |
1 files changed, 18 insertions, 18 deletions
diff --git a/inc/3rdparty/site_config/standard/searchengineland.com.txt b/inc/3rdparty/site_config/standard/searchengineland.com.txt index f176d7c7..fb6a1074 100644..100755 --- a/inc/3rdparty/site_config/standard/searchengineland.com.txt +++ b/inc/3rdparty/site_config/standard/searchengineland.com.txt | |||
@@ -1,20 +1,20 @@ | |||
1 | body: //div[@class="storyBox"] | 1 | body: //div[@class="storyBox"] |
2 | title: //div[@class="storyBox"]/h1 | 2 | title: //div[@class="storyBox"]/h1 |
3 | author: //a[@rel="author"] | 3 | author: //a[@rel="author"] |
4 | date: substring-before(//span[@class="dateline"], 'by') | 4 | date: substring-before(//span[@class="dateline"], 'by') |
5 | 5 | ||
6 | #Removes related content but cleans up article text | 6 | #Removes related content but cleans up article text |
7 | strip: //h1 | 7 | strip: //h1 |
8 | strip: //p[@class="homeStory tdmSideInfo"] | 8 | strip: //p[@class="homeStory tdmSideInfo"] |
9 | strip: //div[@id="bylineShare"] | 9 | strip: //div[@id="bylineShare"] |
10 | strip: //script | 10 | strip: //script |
11 | strip: //hr | 11 | strip: //hr |
12 | 12 | ||
13 | strip_id_or_class: homeStory | 13 | strip_id_or_class: homeStory |
14 | strip_id_or_class: authorpic | 14 | strip_id_or_class: authorpic |
15 | strip_id_or_class: insideComments | 15 | strip_id_or_class: insideComments |
16 | strip_id_or_class: authorbio | 16 | strip_id_or_class: authorbio |
17 | strip_id_or_class: gpt-ad-sel-cube | 17 | strip_id_or_class: gpt-ad-sel-cube |
18 | strip_id_or_class: smxTextAd | 18 | strip_id_or_class: smxTextAd |
19 | 19 | ||
20 | test_url: http://searchengineland.com/googles-jaw-dropping-sponsored-post-campaign-for-chrome-106348 \ No newline at end of file | 20 | test_url: http://searchengineland.com/googles-jaw-dropping-sponsored-post-campaign-for-chrome-106348 \ No newline at end of file |