From d06dc22ac1985a8cb4c8be48bd13b409182f4771 Mon Sep 17 00:00:00 2001 From: Kovid Goyal Date: Thu, 24 Mar 2011 08:48:30 -0600 Subject: [PATCH] ... --- recipes/h1.recipe | 18 ++++++++++++------ 1 file changed, 12 insertions(+), 6 deletions(-) diff --git a/recipes/h1.recipe b/recipes/h1.recipe index 28d7077137..8c3691981e 100644 --- a/recipes/h1.recipe +++ b/recipes/h1.recipe @@ -16,11 +16,18 @@ class hu168ora(BasicNewsRecipe): encoding = 'utf8' publisher = u'Telegráf Kiadó' category = u'news, hírek, 168' - extra_css = 'body{ font-family: Verdana,Helvetica,Arial,sans-serif } .lead{font-weight: bold} h2{text-align: center; text-transform: uppercase} ' + extra_css = 'body{ font-family: Verdana,Helvetica,Arial,sans-serif }' preprocess_regexps = [(re.compile(r'', re.DOTALL), lambda m: '')] - remove_tags_before = dict(id='cikk_fejlec') - remove_tags_after = dict(id='szoveg') - remove_tags = [dict(id='box_toolbar')] + keep_only_tags = [ + dict(id='cikk_fejlec') + ,dict(id='cikk_torzs') + ] +# remove_tags_before = dict(id='cikk_fejlec') +# remove_tags_after = dict(id='szoveg') + remove_tags = [ + dict(id='box_toolbar') + ,dict(id='text') + ] remove_javascript = True remove_empty_feeds = True @@ -36,10 +43,9 @@ class hu168ora(BasicNewsRecipe): ,(u'Sport', u'http://www.168ora.hu/static/rss/cikkek_sport.xml') ,(u'Vélemény', u'http://www.168ora.hu/static/rss/cikkek_velemeny.xml') ,(u'Dolce Vita', u'http://www.168ora.hu/static/rss/cikkek_dolcevita.xml') - ,(u'Rádió', u'http://www.168ora.hu/static/rss/radio.xml') +# ,(u'Rádió', u'http://www.168ora.hu/static/rss/radio.xml') ] def print_version(self, url): url += '?print=1' return url -