1
0
mirror of https://github.com/moparisthebest/wallabag synced 2024-11-17 14:45:06 -05:00
wallabag/inc/3rdparty/site_config/standard/chronicle.com.txt
2013-12-06 10:13:03 +01:00

17 lines
785 B
Plaintext

title: //h1[contains(@class, "entry-title")]
author: //p[contains(@class, "byline")]
# blog articles (chronicle.com/blogs/*)
body: //div[contains(@class, "abstract")]
date: //p[contains(@class, "time")]
# all (?) other articles
body: //div[@id="article-body"]
date: //p[contains(@class, "dateline")]
# remove sidebars containing images (I assume this is desired for Instapaper)
strip: //div[@id="related"]
strip: //div[contains(@class, "image")]
# note that if you're not a Chronicle subscriber (personally or institutionally), you'll only see the first couple of paragraphs of the article, and Instapaper will display that with some crap above and below. thank goodness for that bookmarklet
test_url: http://chronicle.com/article/In-a-Land-of-Second-Chances/128375/