1
0
mirror of https://github.com/moparisthebest/wallabag synced 2024-08-13 16:54:00 -04:00
wallabag/inc/3rdparty/site_config/standard/reddit.com.txt
2014-07-13 10:15:40 +02:00

20 lines
751 B
Plaintext
Executable File

# Extracts the text of a Reddit self post; comments and other page chrome are ignored.
title: //p[@class="title"]/a/text()
author: //p[@class="tagline"]/a
# NOTE: this date pattern is reported not to work; the cause has not been identified.
date: //p[@class="tagline"]//@datetime
body: //div[@class="expando"]//div[@class="usertext-body"]
strip_id_or_class: tagline
strip_id_or_class: unvotable-message
strip_id_or_class: buttons
# Follow the posted link when it is an absolute URL (http:// or https://).
# Self posts use a relative URL, so they are not followed and are extracted from this page.
single_page_link: //p[@class="title"]/a[contains(@href, 'http://') or contains(@href, 'https://')]
test_url: http://www.reddit.com/r/truegaming/comments/wfe7r/i_wrote_about_the_problems_i_honestly_feel_that/
test_url: http://www.reddit.com/r/worldnews/comments/1as37r/twelve_north_korean_soldiers_attempting_to_defect/