From 1239a405bc3d50ee1ba1c57c09b45cc8b2edcfba Mon Sep 17 00:00:00 2001 From: unkn0w7n <51942695+unkn0w7n@users.noreply.github.com> Date: Thu, 30 May 2024 17:55:39 +0530 Subject: [PATCH 1/2] Update livemint --- recipes/economist_espresso.recipe | 4 +--- recipes/livemint.recipe | 2 +- 2 files changed, 2 insertions(+), 4 deletions(-) diff --git a/recipes/economist_espresso.recipe b/recipes/economist_espresso.recipe index 8d82379d6e..63b60ed9ca 100644 --- a/recipes/economist_espresso.recipe +++ b/recipes/economist_espresso.recipe @@ -169,8 +169,6 @@ class Espresso(BasicNewsRecipe): return ans def parse_index(self): - # return self.economist_test_article() - # url = 'https://www.economist.com/weeklyedition/archive' query = { 'query': 'query EspressoQuery($ref:String!){espresso:canonical(ref:$ref){...EspressoFragment __typename}}fragment EspressoFragment on Content{id type hasPart(size:1 sort:"datePublished:desc"){parts{id type rubric:description hasPart(sort:"publication.context.position:asc,datePublished:desc"){parts{...ArticleFragment __typename}__typename}__typename}__typename}__typename}fragment ArticleFragment on Content{ad{grapeshot{channels{name __typename}__typename}__typename}articleSection{internal{id title:headline __typename}__typename}audio{main{id duration(format:"seconds")source:channel{id __typename}url{canonical __typename}__typename}__typename}byline dateline dateModified datePublished dateRevised flyTitle:subheadline id image{...ImageInlineFragment ...ImageMainFragment ...ImagePromoFragment __typename}print{title:headline flyTitle:subheadline rubric:description section{id title:headline __typename}__typename}publication{id tegID title:headline flyTitle:subheadline datePublished regionsAllowed url{canonical __typename}__typename}rubric:description source:channel{id __typename}tegID text(format:"json")title:headline type url{canonical __typename}topic contentIdentity{forceAppWebview mediaType articleType __typename}__typename}fragment ImageInlineFragment on Media{inline{url{canonical __typename}width height __typename}__typename}fragment ImageMainFragment on Media{main{url{canonical __typename}width height __typename}__typename}fragment ImagePromoFragment on Media{promo{url{canonical __typename}id width height __typename}__typename}', # noqa 'operationName': 'EspressoQuery', @@ -196,7 +194,7 @@ class Espresso(BasicNewsRecipe): pt.close() url = 'file:///' + pt.name ans.append({"title": title, "url": url}) - return [('The world in brief', ans)] + return [('Espresso', ans)] def populate_article_metadata(self, article, soup, first): article.url = soup.find('h1')['title'] diff --git a/recipes/livemint.recipe b/recipes/livemint.recipe index 53e5cb4a46..c6cb471def 100644 --- a/recipes/livemint.recipe +++ b/recipes/livemint.recipe @@ -94,7 +94,7 @@ class LiveMint(BasicNewsRecipe): ''' keep_only_tags = [ - dict(name='article', attrs={'id':lambda x: x and x.startswith(('article_', 'box_'))}), + dict(name='article', attrs={'id':lambda x: x and x.startswith(('article_', 'box_', 'storyPage_storyBox__'))}), classes('contentSec') ] remove_tags = [ From 09ee23dd1ce8be3e532b7c688486d87a9409d15d Mon Sep 17 00:00:00 2001 From: unkn0w7n <51942695+unkn0w7n@users.noreply.github.com> Date: Thu, 30 May 2024 17:58:40 +0530 Subject: [PATCH 2/2] ... --- recipes/livemint.recipe | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/recipes/livemint.recipe b/recipes/livemint.recipe index c6cb471def..8eb4586b06 100644 --- a/recipes/livemint.recipe +++ b/recipes/livemint.recipe @@ -94,7 +94,8 @@ class LiveMint(BasicNewsRecipe): ''' keep_only_tags = [ - dict(name='article', attrs={'id':lambda x: x and x.startswith(('article_', 'box_', 'storyPage_storyBox__'))}), + dict(name='article', attrs={'id':lambda x: x and x.startswith(('article_', 'box_'))}), + dict(attrs={'class':lambda x: x and x.startswith('storyPage_storyBox__')}), classes('contentSec') ] remove_tags = [