From fbabeb1f594bc832311f109f8a30443a0f2cb72b Mon Sep 17 00:00:00 2001 From: Kovid Goyal Date: Mon, 9 Jan 2017 19:43:27 +0530 Subject: [PATCH] Update Telepolis --- recipes/telepolis.recipe | 48 +++++++++------------------------------- 1 file changed, 11 insertions(+), 37 deletions(-) diff --git a/recipes/telepolis.recipe b/recipes/telepolis.recipe index 8511ca0430..ec27cafcc3 100644 --- a/recipes/telepolis.recipe +++ b/recipes/telepolis.recipe @@ -1,46 +1,20 @@ -# -*- coding: utf-8 -*- - +#!/usr/bin/env python2 +# vim:fileencoding=utf-8 +from __future__ import unicode_literals, division, absolute_import, print_function from calibre.web.feeds.news import BasicNewsRecipe -class TelepolisNews(BasicNewsRecipe): - title = u'Telepolis' - __author__ = 'syntaxis' - publisher = 'Heise Zeitschriften Verlag GmbH & Co KG' - description = 'News from Telepolis' - category = 'news' +class Telepolis(BasicNewsRecipe): + title = 'Telepolis' oldest_article = 7 max_articles_per_feed = 100 - recursion = 0 - no_stylesheets = True - encoding = "utf-8" + auto_cleanup = True + recursions = 10 language = 'de' - remove_empty_feeds = True - - keep_only_tags = [dict(name='div', attrs={'class': 'head'}), dict( - name='div', attrs={'class': 'leftbox'}), dict(name='td', attrs={'class': 'strict'})] - remove_tags = [dict(name='td', attrs={'class': 'blogbottom'}), - dict(name='div', attrs={'class': 'forum'}), dict(name='div', attrs={ - 'class': 'social'}), dict(name='div', attrs={'class': 'blog-letter p-news'}), - dict(name='div', attrs={'class': 'blog-sub'}), - dict(name='div', attrs={'class': 'version-div'}), - dict(name='div', attrs={'id': 'breadcrumb'}), dict(attrs={'class': 'tp-url'}), - dict(attrs={'class': 'blog-name entry_'})] - - remove_tags_after = [dict(name='span', attrs={'class': ['breadcrumb']})] - - feeds = [(u'News', u'http://www.heise.de/tp/news-atom.xml')] - - html2lrf_options = [ - '--comment', description, '--category', category, '--publisher', publisher + feeds = [ + ('Telepolis', 'https://www.heise.de/tp/news-atom.xml'), ] - html2epub_options = 'publisher="' + publisher + \ - '"\ncomments="' + description + '"\ntags="' + category + '"' - - def preprocess_html(self, soup): - mtag = '' - soup.head.insert(0, mtag) - return soup + def is_link_wanted(self, url, tag): + return tag['class'] == 'seite_weiter'