mirror of
https://github.com/kovidgoyal/calibre.git
synced 2025-07-09 03:04:10 -04:00
Update Kliene Zeitung
This commit is contained in:
parent
51a6d79039
commit
ecc428c98b
@ -1,5 +1,8 @@
|
|||||||
|
#!/usr/bin/env python2
|
||||||
|
# vim:fileencoding=utf-8
|
||||||
|
from __future__ import unicode_literals, division, absolute_import, print_function
|
||||||
|
|
||||||
from calibre.web.feeds.news import BasicNewsRecipe
|
from calibre.web.feeds.news import BasicNewsRecipe
|
||||||
import re
|
|
||||||
|
|
||||||
class KleineZeitungRecipe(BasicNewsRecipe):
|
class KleineZeitungRecipe(BasicNewsRecipe):
|
||||||
__license__ = 'GPL v3'
|
__license__ = 'GPL v3'
|
||||||
@ -20,34 +23,48 @@ class KleineZeitungRecipe(BasicNewsRecipe):
|
|||||||
no_stylesheets = True
|
no_stylesheets = True
|
||||||
remove_javascript = True
|
remove_javascript = True
|
||||||
|
|
||||||
# Feeds from http://www.kleinezeitung.at/allgemein/multimedia/102434/wichtige-news-immer-sofort-ueber-rss-feed-abrufen.story
|
masthead_url = 'https://cdn-kl.niceshops.com/images/logos/logo_kleine_invoice.jpg'
|
||||||
feeds = []
|
|
||||||
feeds.append((u'Chronik', u'http://www.kleinezeitung.at/klon/rss/nachrichten'))
|
|
||||||
feeds.append((u'Wirtschaft', u'http://www.kleinezeitung.at/klon/rss/wirtschaft'))
|
|
||||||
feeds.append((u'Leute', u'http://www.kleinezeitung.at/klon/rss/leute'))
|
|
||||||
feeds.append((u'Sport', u'http://www.kleinezeitung.at/klon/rss/sport'))
|
|
||||||
feeds.append((u'Nachrichten aus der Steiermark', u'http://www.kleinezeitung.at/klon/rss/steiermark'))
|
|
||||||
feeds.append((u'Nachrichten aus Kaernten', u'http://www.kleinezeitung.at/klon/rss/kaernten'))
|
|
||||||
feeds.append((u'Multimedia-News', u'http://www.kleinezeitung.at/klon/rss/multimedia'))
|
|
||||||
feeds.append((u'Kino, Events & Tickets', u'http://www.kleinezeitung.at/klon/rss/events'))
|
|
||||||
|
|
||||||
keep_only_tags = []
|
feeds = [
|
||||||
keep_only_tags.append(dict(name = 'div', attrs = {'class': 'article_body'}))
|
('Nachrichten', 'http://www.kleinezeitung.at/rss/nachrichten'),
|
||||||
|
('Politik', 'http://www.kleinezeitung.at/rss/politik'),
|
||||||
|
('Wirtschaft', 'http://www.kleinezeitung.at/rss/wirtschaft'),
|
||||||
|
('Österreich und die Welt', 'http://www.kleinezeitung.at/rss/chronik'),
|
||||||
|
('Leben', 'http://www.kleinezeitung.at/rss/leben'),
|
||||||
|
('Sport', 'http://www.kleinezeitung.at/rss/sport'),
|
||||||
|
# ('Ennstal', 'http://www.kleinezeitung.at/rss/rss_ennstal'),
|
||||||
|
# ('Graz & Umgebung', 'http://www.kleinezeitung.at/rss/rss_graz'),
|
||||||
|
# ('Leoben', 'http://www.kleinezeitung.at/rss/rss_leoben'),
|
||||||
|
# ('Murtal', 'http://www.kleinezeitung.at/rss/rss_murtal'),
|
||||||
|
# ('Mürztal', 'http://www.kleinezeitung.at/rss/rss_muerztal'),
|
||||||
|
# ('Oststeier', 'http://www.kleinezeitung.at/rss/rss_oststeier'),
|
||||||
|
# ('Süd & Südwest', 'http://www.kleinezeitung.at/rss/rss_suedsuedwest'),
|
||||||
|
# ('Südost & Süd', 'http://www.kleinezeitung.at/rss/rss_sueostsued'),
|
||||||
|
# ('Weiz', 'http://www.kleinezeitung.at/rss/rss_weiz'),
|
||||||
|
# ('Weststeier', 'http://www.kleinezeitung.at/rss/rss_weststeier'),
|
||||||
|
# ('Feldkirchen', 'http://www.kleinezeitung.at/rss/rss_feldkirchen'),
|
||||||
|
# ('Klagenfurt', 'http://www.kleinezeitung.at/rss/rss_klagenfurt'),
|
||||||
|
# ('Lavanttal', 'http://www.kleinezeitung.at/rss/rss_lavanttal'),
|
||||||
|
# ('Oberkärnten', 'http://www.kleinezeitung.at/rss/rss_oberkaernten'),
|
||||||
|
# ('Osttirol', 'http://www.kleinezeitung.at/rss/rss_osttirol'),
|
||||||
|
# ('St. Veit', 'http://www.kleinezeitung.at/rss/rss_stveit'),
|
||||||
|
# ('Villach', 'http://www.kleinezeitung.at/rss/rss_villach'),
|
||||||
|
# ('Völkermarkt', 'http://www.kleinezeitung.at/rss/rss_voelkermarkt')
|
||||||
|
]
|
||||||
|
|
||||||
remove_tags = []
|
remove_tags_before = dict(attrs={'class':'hline'})
|
||||||
remove_tags.append(dict(name = 'a', attrs = {'id': 'comment_count'}))
|
remove_tags_after = [dict(name='div', attrs={'class':'articletext'})]
|
||||||
remove_tags.append(dict(name = 'div', attrs = {'class': re.compile('adv[0-9]+')}))
|
remove_tags = [dict(name='hr')]
|
||||||
remove_tags.append(dict(name = 'div', attrs = {'class': 'art_info'}))
|
|
||||||
remove_tags.append(dict(name = 'div', attrs = {'id': re.compile('grafikoverlay_.*')}))
|
|
||||||
remove_tags.append(dict(name = 'a', attrs = {'class': 'zoom'}))
|
|
||||||
|
|
||||||
extra_css = '''
|
extra_css = '''
|
||||||
body {font-family:verdana,arial,helvetica,geneva,sans-serif ;}
|
|
||||||
h1 {text-align: left;}
|
h1 {text-align: left;}
|
||||||
span {margin-left: 0.1em; margin-right: 0.1em;}
|
|
||||||
span.update {font-size: x-small; color: #666666}
|
|
||||||
span.update strong {font-weight: normal;}
|
|
||||||
p.intro {font-size: large;}
|
|
||||||
div.art_foto_big, div.art_foto {font-size: xx-small; color: #696969; margin-bottom: 0.5em;}
|
|
||||||
div.art_foto_big span.src {float: right;}
|
|
||||||
'''
|
'''
|
||||||
|
|
||||||
|
def print_version(self, url):
|
||||||
|
main, sep, id = url.rpartition('/')
|
||||||
|
return main + '/print.do'
|
||||||
|
|
||||||
|
def preprocess_html(self, soup):
|
||||||
|
if soup.find('div', {'class':'articletext'}) is None:
|
||||||
|
self.abort_article()
|
||||||
|
return soup
|
||||||
|
Loading…
x
Reference in New Issue
Block a user