diff --git a/recipes/atlantic.recipe b/recipes/atlantic.recipe index 55e02b2ad1..1fca16827c 100644 --- a/recipes/atlantic.recipe +++ b/recipes/atlantic.recipe @@ -18,13 +18,14 @@ class TheAtlantic(BasicNewsRecipe): INDEX = 'http://www.theatlantic.com/magazine/toc/0/' language = 'en' - remove_tags_before = dict(name='div', id='articleHead') - remove_tags_after = dict(id='copyright') - remove_tags = [dict(id=['header', 'printAds', 'pageControls'])] + keep_only_tags = [{'attrs':{'class':['article', 'articleHead', 'articleText']}}] + remove_tags = [dict(attrs={'class':'footer'})] no_stylesheets = True - preprocess_regexps = [(re.compile(r'', re.DOTALL), lambda m: '')] - + preprocess_regexps = [ + (re.compile(r'', re.DOTALL), lambda m: ''), + (re.compile(r'.*