1
0
mirror of https://github.com/moparisthebest/wallabag synced 2024-12-04 14:52:25 -05:00
wallabag/inc/3rdparty/site_config/standard/searchengineland.com.txt

20 lines
622 B
Plaintext
Raw Normal View History

2013-12-06 04:13:03 -05:00
# Site config for searchengineland.com: XPath rules for extracting an article
# and the elements to strip from it.

# Article container: the div whose class attribute is exactly "storyBox".
body: //div[@class="storyBox"]
# Headline: an h1 that is a direct child of that same container.
title: //div[@class="storyBox"]/h1
# Author: any link marked rel="author".
author: //a[@rel="author"]
# Keeps only the dateline text that precedes the first 'by'
# (presumably the dateline reads "<date> by <author>" - confirm on the test_url page).
date: substring-before(//span[@class="dateline"], 'by')
# Strip rules below: they also remove related content, but clean up the article text.
# Every h1 is removed (presumably so the headline, already captured by title:,
# is not repeated inside the body - confirm).
strip: //h1
# Matches only when the class attribute is exactly "homeStory tdmSideInfo".
strip: //p[@class="homeStory tdmSideInfo"]
strip: //div[@id="bylineShare"]
strip: //script
strip: //hr
# NOTE(review): if strip_id_or_class matches on a substring of the id/class value,
# this entry also covers the "homeStory tdmSideInfo" paragraph rule above -
# confirm against the parser before removing either one.
strip_id_or_class: homeStory
strip_id_or_class: authorpic
strip_id_or_class: insideComments
strip_id_or_class: authorbio
strip_id_or_class: gpt-ad-sel-cube
strip_id_or_class: smxTextAd
# Sample article URL for checking this config.
test_url: http://searchengineland.com/googles-jaw-dropping-sponsored-post-campaign-for-chrome-106348