Update Popular Science

This commit is contained in:
Kovid Goyal 2021-12-30 20:54:15 +05:30
parent 1daad1bda9
commit 75afcfbd1c
No known key found for this signature in database
GPG Key ID: 06BC317B515ACE7C

View File

@@ -23,18 +23,18 @@ class AdvancedUserRecipe1282101454(BasicNewsRecipe):
ignore_duplicate_articles = {'url'} ignore_duplicate_articles = {'url'}
no_stylesheets = True no_stylesheets = True
keep_only_tags = [ keep_only_tags = [
classes('content-body article-header featured-img'), classes('Article-header Article-excerpt Article-author Article-thumbnail Article-bodyText'),
] ]
def parse_section_index(self, slug): def parse_section_index(self, slug):
soup = self.index_to_soup('https://www.popsci.com/{}/'.format(slug)) soup = self.index_to_soup('https://www.popsci.com/{}/'.format(slug))
main = soup.find(**classes('main-module')) main = soup.find(**classes('main-content'))
for div in main.findAll(**classes('main-item')): for div in main.findAll(**classes('Post')):
a = div.find('a', href=True, **classes('linkable')) a = div.find('a', href=True, **classes('Post-link'))
url = a['href'] url = a['href']
title = self.tag_to_string(a.find(**classes('title'))) title = self.tag_to_string(div.find(**classes('Post-title')))
desc = '' desc = ''
dek = a.find(**classes('dek')) dek = div.find(**classes('Post-excerpt'))
if dek is not None: if dek is not None:
desc = self.tag_to_string(dek) desc = self.tag_to_string(dek)
self.log(' ', title, url) self.log(' ', title, url)