Fix Tagesspiegel

This commit is contained in:
Kovid Goyal 2012-01-03 08:04:27 +05:30
parent e1498bfa3e
commit cd9412db51

View File

@@ -33,17 +33,7 @@ class TagesspiegelRSS(BasicNewsRecipe):
no_javascript = True no_javascript = True
remove_empty_feeds = True remove_empty_feeds = True
encoding = 'utf-8' encoding = 'utf-8'
auto_cleanup = True
keep_only_tags = dict(name='div', attrs={'class':["hcf-article"]})
remove_tags = [
dict(name='link'), dict(name='iframe'),dict(name='style'),dict(name='meta'),dict(name='button'),
dict(name='div', attrs={'class':["hcf-jump-to-comments","hcf-clear","hcf-magnify hcf-media-control",
"hcf-socials-widgets hcf-socials-top","hcf-socials-widgets hcf-socials-bottom"] }),
dict(name='span', attrs={'class':["hcf-mainsearch",] }),
dict(name='ul', attrs={'class':["hcf-tools"]}),
dict(name='ul', attrs={'class': re.compile('hcf-services')})
]
def parse_index(self): def parse_index(self):
soup = self.index_to_soup('http://www.tagesspiegel.de/zeitung/') soup = self.index_to_soup('http://www.tagesspiegel.de/zeitung/')