From 9d519d7dc8ff6ab54a0fe54795d49b78ec349dd3 Mon Sep 17 00:00:00 2001 From: unkn0w7n <51942695+unkn0w7n@users.noreply.github.com> Date: Mon, 29 Apr 2024 10:10:35 +0530 Subject: [PATCH] *** --- recipes/economist.recipe | 9 ++++++++- recipes/economist_free.recipe | 9 ++++++++- 2 files changed, 16 insertions(+), 2 deletions(-) diff --git a/recipes/economist.recipe b/recipes/economist.recipe index 15b5e08588..6285119441 100644 --- a/recipes/economist.recipe +++ b/recipes/economist.recipe @@ -263,7 +263,8 @@ class Economist(BasicNewsRecipe): dt = datetime.fromisoformat(data['datePublished'][:-1]) + timedelta(seconds=time.timezone) dt = dt.strftime('%b %d, %Y') self.timefmt = ' [' + dt + ']' - self.cover_url = data['image']['cover'][0]['url']['canonical'] + self.cover_url = data['image']['cover'][0]['url']['canonical'].replace('economist.com/', + 'economist.com/cdn-cgi/image/width=960,quality=80,format=auto/') self.log('Got cover:', self.cover_url) feeds_dict = defaultdict(list) @@ -290,6 +291,12 @@ class Economist(BasicNewsRecipe): def populate_article_metadata(self, article, soup, first): article.url = soup.find('h1')['title'] + def preprocess_html(self, soup): + for img in soup.findAll('img', src=True): + img['src'] = img['src'].replace('economist.com/', + 'economist.com/cdn-cgi/image/width=600,quality=80,format=auto/') + return soup + else: # Load articles from individual article pages {{{ def parse_index(self): # return self.economist_test_article() diff --git a/recipes/economist_free.recipe b/recipes/economist_free.recipe index 15b5e08588..6285119441 100644 --- a/recipes/economist_free.recipe +++ b/recipes/economist_free.recipe @@ -263,7 +263,8 @@ class Economist(BasicNewsRecipe): dt = datetime.fromisoformat(data['datePublished'][:-1]) + timedelta(seconds=time.timezone) dt = dt.strftime('%b %d, %Y') self.timefmt = ' [' + dt + ']' - self.cover_url = data['image']['cover'][0]['url']['canonical'] + self.cover_url = data['image']['cover'][0]['url']['canonical'].replace('economist.com/', + 'economist.com/cdn-cgi/image/width=960,quality=80,format=auto/') self.log('Got cover:', self.cover_url) feeds_dict = defaultdict(list) @@ -290,6 +291,12 @@ class Economist(BasicNewsRecipe): def populate_article_metadata(self, article, soup, first): article.url = soup.find('h1')['title'] + def preprocess_html(self, soup): + for img in soup.findAll('img', src=True): + img['src'] = img['src'].replace('economist.com/', + 'economist.com/cdn-cgi/image/width=600,quality=80,format=auto/') + return soup + else: # Load articles from individual article pages {{{ def parse_index(self): # return self.economist_test_article()