natgeo cover

2025-08-11 09:13:57 -04:00 · 2024-01-02 19:21:11 +05:30 · 2024-01-02 19:21:11 +05:30 · 68aaed8872
commit 68aaed8872
parent 3032655349
2 changed files with 9 additions and 4 deletions
--- a/recipes/natgeo.recipe
+++ b/recipes/natgeo.recipe
@@ -137,8 +137,12 @@ class NatGeo(BasicNewsRecipe):
    '''

    def get_cover_url(self):
-        soup = self.index_to_soup('https://www.nationalgeographic.com/magazine/')
-        png = re.findall('https://i\.natgeofe\.com\S+?national-geographic-\S+?\.jpg', soup.decode('utf-8'))
+        # soup = self.index_to_soup('https://www.nationalgeographic.com/magazine/')
+        # png = re.findall('https://i\.natgeofe\.com\S+?national-geographic-\S+?\.jpg', soup.decode('utf-8'))
+        from datetime import date
+        url = 'https://www.nationalgeographic.com/magazine/issue/' + (date.today().strftime('%B-%Y')).lower()
+        soup = self.index_to_soup(url)
+        png = soup.find('meta', attrs={'property':'og:image'})['content'].split('?')
        return png[0] + '?w=1000&h=1000'

    def parse_index(self):
--- a/recipes/natgeomag.recipe
+++ b/recipes/natgeomag.recipe
@@ -143,8 +143,9 @@ class NatGeo(BasicNewsRecipe):
        self.log('Downloading ', url)
        self.timefmt = ' [' + edition + ']'
        soup = self.index_to_soup(url)
-        png = re.findall('https://i\.natgeofe\.com\S+?national-geographic-\S+?\.jpg', soup.decode('utf-8'))
-        self.cover_url = png[0] + '?w=1000&h=1000'
+        # png = re.findall('https://i\.natgeofe\.com\S+?national-geographic-\S+?\.jpg', soup.decode('utf-8'))
+        # self.cover_url = png[0] + '?w=1000&h=1000'
+        self.cover_url = soup.find('meta', attrs={'property':'og:image'})['content'].split('?')[0] + '?w=1000'

        name = soup.find(attrs={'class':lambda x: x and 'Header__Description' in x.split()})
        self.title = 'National Geographic ' + self.tag_to_string(name)