1
0
mirror of https://github.com/moparisthebest/wallabag synced 2024-12-21 06:48:56 -05:00
wallabag/vendor/full-text-rss/site_config/standard/menshealth.com.txt
2013-12-10 16:19:15 +01:00

16 lines
607 B
Plaintext

# Site config for menshealth.com article pages.
# TODO: find a way to remove the "related content" <span> elements without
# also removing important article content (see the disabled strip rule below).

# NOTE(review): the value is written with literal brackets ("[yes]") - confirm
# that the parser recognises this directive and this value form.
convert_double_br_tags: [yes]

# Earlier body selector, kept disabled for reference.
#body: //div[@id='leftside']

# Title candidates, in the order listed: <h1>, then <h2>.
title: //h1
title: //h2

# The byline is taken from an <h4> that starts with "By " or "By: "; only the
# text after that prefix is kept.
# Directive names are matched case-sensitively, so this must be lowercase
# "author" ("Author" is not recognised and the rule would be skipped).
author: substring-after(//h4, 'By ')
author: substring-after(//h4, 'By: ')

# Disabled: stripping every <span> also removes wanted content (see TODO above).
#strip: //span

# Remove page furniture identified by id/class name.
strip_id_or_class: morefromcat
strip_id_or_class: mostpopular
strip_id_or_class: articlepagination
strip_id_or_class: toolbar

# Article body container currently in use.
body: //div[@id='zmodcontent']

# Multi-page articles: follow the "one page" list item's printer.php link.
single_page_link: //li[@class='onepage'] //a[contains (@href, 'printer.php')]

# Sample article for checking this config.
test_url: http://www.menshealth.com/mhlists/pursuit_of_happiness/index.php