2014-10-27 01:46:13 -04:00
|
|
|
# Author: zinnober
|
|
|
|
# Template is intended to work with both the desktop (www.heise.de) and the mobile (m.heise.de) version of the site
|
2014-07-13 04:15:40 -04:00
|
|
|
|
2014-10-27 01:46:13 -04:00
|
|
|
prune: no
|
|
|
|
|
|
|
|
title: //article/h1 | //h1
|
2014-07-13 04:15:40 -04:00
|
|
|
date: //p[@class='news_datum']
|
2014-10-27 01:46:13 -04:00
|
|
|
author: //h4[@class='author']
|
|
|
|
|
|
|
|
body: //article | //div[@class='meldung_wrapper']
|
|
|
|
|
|
|
|
# General cleanup
|
|
|
|
strip: //time
|
|
|
|
strip: //h4[@class='author']
|
|
|
|
strip: //p[@class='news_datum']
|
|
|
|
strip: //p[@class='artikel_datum']
|
|
|
|
strip: //a[contains(@href, 'mailto')]
|
|
|
|
strip_id_or_class: comments
|
|
|
|
strip_id_or_class: ISI_IGNORE
|
|
|
|
strip_id_or_class: clear
|
|
|
|
|
|
|
|
strip_id_or_class: linkurl_grossbild
|
|
|
|
strip_id_or_class: image-num
|
|
|
|
strip_id_or_class: heisebox_right
|
|
|
|
strip_id_or_class: dossier
|
|
|
|
|
|
|
|
# Strip Ads
|
|
|
|
# NOTE(review): "ad_" is a very short token. If strip_id_or_class matches by
# substring, it would also hit names such as "head_..." or "thread_..." —
# confirm against the current site markup.
strip_id_or_class: ad_
|
|
|
|
|
|
|
|
# Markup normalization: promote h5 headings to h2 and rewrite heise-specific wrappers to generic tags
|
|
|
|
replace_string(<h5>): <h2>
|
|
|
|
replace_string(</h5>): </h2>
|
|
|
|
# Only the opening tag is rewritten: the search string stops before '>', so
# anything that follows the class attribute is kept. No rule in this file
# rewrites the matching </span>.
replace_string(<span class="bild_rechts"): <p
|
|
|
|
# Only the opening <div class="heisebox"> is replaced; no rule in this file
# rewrites the matching </div>.
replace_string(<div class="heisebox">): <blockquote>
|
|
|
|
|
|
|
|
|
|
|
|
# Two alternative locators for the next-page link: one selects by class,
# the other by title attribute.
# NOTE(review): presumably one applies to the desktop markup and the other to
# the mobile markup — confirm.
next_page_link: //a[@class='next']
|
|
|
|
next_page_link: //a[@title='vor']
|
2014-07-13 04:15:40 -04:00
|
|
|
|
2014-10-27 01:46:13 -04:00
|
|
|
# Test URLs: the same article on the desktop host (www.heise.de) and on the
# mobile host (m.heise.de), followed by one newsticker item.
test_url: http://www.heise.de/open/artikel/Die-Neuerungen-von-Linux-3-15-2196231.html
|
|
|
|
test_url: http://m.heise.de/open/artikel/Die-Neuerungen-von-Linux-3-15-2196231.html
|
|
|
|
test_url: http://www.heise.de/newsticker/meldung/Ueberwachungstechnik-Die-globale-Handy-Standortueberwachung-2301494.html
|