Recipe: make Hindu better resemble print edition

* Remove redundant date and timestamps cluttering every article * Place intro immediately beneath the heading, as in print edition |- duplicate intro is now removed using CSS * Visual styling
2025-07-09 03:04:10 -04:00 · 2021-06-15 17:24:59 +05:30 · 2021-06-15 17:24:59 +05:30 · b0d4c388d6
commit b0d4c388d6
parent adf810cae6
1 changed files with 13 additions and 5 deletions
--- a/recipes/hindu.recipe
+++ b/recipes/hindu.recipe
@ -23,12 +23,14 @@ class TheHindu(BasicNewsRecipe):
    no_stylesheets = True
    remove_attributes = ['style']
    extra_css = '.lead-img-cont { text-align: center; } ' \
-                '.lead-img-caption { font-size: small; font-style: italic; }'
+                '.lead-img-caption { font-size: small; font-style: italic; } ' \
+                '.mobile-author-cont { font-size: small; text-transform: uppercase; } ' \
+                '.intro ~ .intro, .update-time, .ksl-time-stamp * { display: none; } '

    ignore_duplicate_articles = {'title', 'url'}
    keep_only_tags = [
        dict(name='h1', attrs={'class': ['title', 'special-article-heading']}),
-        classes('author-nm lead-img-cont mobile-author-cont photo-collage intro'),
+        classes('lead-img-cont mobile-author-cont photo-collage intro'),
        dict(id=lambda x: x and x.startswith('content-body-')),
    ]

@ -50,9 +52,15 @@ class TheHindu(BasicNewsRecipe):
                source.extract()
        except Exception:
            pass
-        # Remove duplicate intro
-        for h in soup.findAll('h2', attrs={'class': 'intro'})[1:]:
-            h.extract()
+        # Place intro beneath the title, skip duplicates
+        try:
+            soup.h1.insert_after(soup.find('h2', attrs={'class': 'intro'}))
+        except Exception:
+            pass
+        # Remove ',' from location tag
+        ts = soup.find('span', attrs={'class': 'ksl-time-stamp'})
+        if ts and ts.string:
+            ts.string = ts.string.split(',')[0]
        return soup

    def populate_article_metadata(self, article, soup, first):