natgeo cover

This commit is contained in:
unkn0w7n 2024-01-02 19:21:11 +05:30
parent 3032655349
commit 68aaed8872
2 changed files with 9 additions and 4 deletions

View File

@@ -137,8 +137,12 @@ class NatGeo(BasicNewsRecipe):
'''
def get_cover_url(self):
soup = self.index_to_soup('https://www.nationalgeographic.com/magazine/')
png = re.findall('https://i\.natgeofe\.com\S+?national-geographic-\S+?\.jpg', soup.decode('utf-8'))
# soup = self.index_to_soup('https://www.nationalgeographic.com/magazine/')
# png = re.findall('https://i\.natgeofe\.com\S+?national-geographic-\S+?\.jpg', soup.decode('utf-8'))
from datetime import date
url = 'https://www.nationalgeographic.com/magazine/issue/' + (date.today().strftime('%B-%Y')).lower()
soup = self.index_to_soup(url)
png = soup.find('meta', attrs={'property':'og:image'})['content'].split('?')
return png[0] + '?w=1000&h=1000'
def parse_index(self):

View File

@@ -143,8 +143,9 @@ class NatGeo(BasicNewsRecipe):
self.log('Downloading ', url)
self.timefmt = ' [' + edition + ']'
soup = self.index_to_soup(url)
png = re.findall('https://i\.natgeofe\.com\S+?national-geographic-\S+?\.jpg', soup.decode('utf-8'))
self.cover_url = png[0] + '?w=1000&h=1000'
# png = re.findall('https://i\.natgeofe\.com\S+?national-geographic-\S+?\.jpg', soup.decode('utf-8'))
# self.cover_url = png[0] + '?w=1000&h=1000'
self.cover_url = soup.find('meta', attrs={'property':'og:image'})['content'].split('?')[0] + '?w=1000'
name = soup.find(attrs={'class':lambda x: x and 'Header__Description' in x.split()})
self.title = 'National Geographic ' + self.tag_to_string(name)