Merge branch 'master' of https://github.com/unkn0w7n/calibre

2025-07-09 03:04:10 -04:00 · 2024-01-01 14:47:46 +05:30 · 2024-01-01 14:47:46 +05:30 · 3032655349
commit 3032655349
parent 375e63f597 a170eafd20
3 changed files with 12 additions and 9 deletions
--- a/recipes/economist.recipe
+++ b/recipes/economist.recipe
@@ -205,6 +205,10 @@ class Economist(BasicNewsRecipe):
    def preprocess_raw_html(self, raw, url):
        # open('/t/raw.html', 'wb').write(raw.encode('utf-8'))
        root = parse(raw)
+        if '/interactive/' in url:
+            return '<html><body><article><h1>' + root.xpath('//h1')[0].text + '</h1><em>' \
+                        + 'This article is supposed to be read in a browser' \
+                            + '</em></article></body></html>'
        script = root.xpath('//script[@id="__NEXT_DATA__"]')
        if script:
            try:
@@ -293,9 +297,6 @@ class Economist(BasicNewsRecipe):
                sub = safe_dict(part, "subheadline") or ''
                if sub and section != sub:
                    desc = sub + ' :: ' + desc
-                if '/interactive/' in url:
-                    self.log('Skipping interactive article:', title, url)
-                    continue
                feeds_dict[section].append({"title": title, "url": url, "description": desc})
                self.log(' ', title, url, '\n   ', desc)
            return [(section, articles) for section, articles in feeds_dict.items()]
--- a/recipes/economist_free.recipe
+++ b/recipes/economist_free.recipe
@@ -205,6 +205,10 @@ class Economist(BasicNewsRecipe):
    def preprocess_raw_html(self, raw, url):
        # open('/t/raw.html', 'wb').write(raw.encode('utf-8'))
        root = parse(raw)
+        if '/interactive/' in url:
+            return '<html><body><article><h1>' + root.xpath('//h1')[0].text + '</h1><em>' \
+                        + 'This article is supposed to be read in a browser' \
+                            + '</em></article></body></html>'
        script = root.xpath('//script[@id="__NEXT_DATA__"]')
        if script:
            try:
@@ -293,9 +297,6 @@ class Economist(BasicNewsRecipe):
                sub = safe_dict(part, "subheadline") or ''
                if sub and section != sub:
                    desc = sub + ' :: ' + desc
-                if '/interactive/' in url:
-                    self.log('Skipping interactive article:', title, url)
-                    continue
                feeds_dict[section].append({"title": title, "url": url, "description": desc})
                self.log(' ', title, url, '\n   ', desc)
            return [(section, articles) for section, articles in feeds_dict.items()]
--- a/recipes/economist_world_ahead.recipe
+++ b/recipes/economist_world_ahead.recipe
@@ -201,6 +201,10 @@ class Economist(BasicNewsRecipe):
    def preprocess_raw_html(self, raw, url):
        # open('/t/raw.html', 'wb').write(raw.encode('utf-8'))
        root = parse(raw)
+        if '/interactive/' in url:
+            return '<html><body><article><h1>' + root.xpath('//h1')[0].text + '</h1><em>' \
+                        + 'This article is supposed to be read in a browser' \
+                            + '</em></article></body></html>'
        script = root.xpath('//script[@id="__NEXT_DATA__"]')
        if script:
            try:
@@ -281,9 +285,6 @@ class Economist(BasicNewsRecipe):
                    sub = safe_dict(part, "subheadline") or ''
                    if sub:
                        desc = sub + ' :: ' + desc
-                    if '/interactive/' in url:
-                        self.log('\tSkipping interactive article:', title, url)
-                        continue
                    self.log('\t', title, '\n\t', desc, '\n\t\t', url)
                    articles.append({'title': title, 'description':desc, 'url': url})
                if articles: