Remove various bad tags from Economist downloads.

2025-07-09 03:04:10 -04:00 · 2009-12-05 09:51:38 -07:00 · 2009-12-05 09:51:38 -07:00 · 4f13ef6aaa
commit 4f13ef6aaa
parent f58c59ca0a
2 changed files with 4 additions and 2 deletions
--- a/resources/recipes/economist.recipe
+++ b/resources/recipes/economist.recipe
@@ -22,7 +22,8 @@ class Economist(BasicNewsRecipe):

    oldest_article = 7.0
    cover_url = 'http://www.economist.com/images/covers/currentcovereu_large.jpg'
-    remove_tags = [dict(name=['script', 'noscript', 'title'])]
+    remove_tags = [dict(name=['script', 'noscript', 'title', 'iframe', 'cf_floatingcontent']),
+            dict(attrs={'class':['dblClkTrk']})]
    remove_tags_before = dict(name=lambda tag: tag.name=='title' and tag.parent.name=='body')
    needs_subscription = True

--- a/resources/recipes/economist_free.recipe
+++ b/resources/recipes/economist_free.recipe
@@ -16,7 +16,8 @@ class Economist(BasicNewsRecipe):

    oldest_article = 6.5
    cover_url = 'http://www.economist.com/images/covers/currentcovereu_large.jpg'
-    remove_tags = [dict(name=['script', 'noscript', 'title'])]
+    remove_tags = [dict(name=['script', 'noscript', 'title', 'iframe', 'cf_floatingcontent']),
+            dict(attrs={'class':['dblClkTrk']})]
    remove_tags_before = dict(name=lambda tag: tag.name=='title' and tag.parent.name=='body')

    def parse_index(self):