diff --git a/resources/recipes/times_online.recipe b/resources/recipes/times_online.recipe index 7a9e944301..a57749c79d 100644 --- a/resources/recipes/times_online.recipe +++ b/resources/recipes/times_online.recipe @@ -5,6 +5,7 @@ __copyright__ = '2008-2009, Darko Miletic ' ''' timesonline.co.uk ''' +import re from calibre.web.feeds.news import BasicNewsRecipe from calibre.ebooks.BeautifulSoup import Tag @@ -26,6 +27,8 @@ class Timesonline(BasicNewsRecipe): recursions = 9 match_regexps = [r'http://www.timesonline.co.uk/.*page=[2-9]'] + preprocess_regexps = [(re.compile(r'', re.DOTALL), lambda m: '')] + keep_only_tags = [ dict(name='div', attrs= {'id':['region-column1and2-layout2']}), {'class' : ['subheading']},