Update The New Yorker

This commit is contained in:
Kovid Goyal 2022-05-13 08:18:48 +05:30
parent 5d222cfd74
commit f8554fec19
No known key found for this signature in database
GPG Key ID: 06BC317B515ACE7C

View File

@ -2,18 +2,11 @@
# vim:fileencoding=utf-8 # vim:fileencoding=utf-8
# License: GPLv3 Copyright: 2016, Kovid Goyal <kovid at kovidgoyal.net> # License: GPLv3 Copyright: 2016, Kovid Goyal <kovid at kovidgoyal.net>
from __future__ import absolute_import, division, print_function, unicode_literals from __future__ import absolute_import, division, print_function, unicode_literals
from collections import OrderedDict from collections import OrderedDict
from calibre import browser from calibre import browser
from calibre.ebooks.BeautifulSoup import Tag from calibre.ebooks.BeautifulSoup import Tag
from calibre.web.feeds.news import BasicNewsRecipe from calibre.web.feeds.news import BasicNewsRecipe, classes, prefixed_classes
def classes(classes):
    """Build a tag-matching spec that selects elements by CSS class.

    ``classes`` is a string of class names separated by single spaces.
    The returned dict has one key, ``attrs``, mapping ``'class'`` to a
    predicate over an element's class attribute value.

    The predicate returns the (possibly empty) frozenset of class names
    shared between the element and ``classes``; a falsy attribute value
    (``None`` or ``''``) is returned unchanged.
    """
    wanted = frozenset(classes.split(' '))

    def has_wanted_class(x):
        # Short-circuit on a missing/empty class attribute so that
        # ``x.split()`` is never called on None.
        return x and frozenset(x.split()).intersection(wanted)

    return dict(attrs={'class': has_wanted_class})
def absurl(x): def absurl(x):
@ -47,6 +40,10 @@ class NewYorker(BasicNewsRecipe):
''' '''
keep_only_tags = [ keep_only_tags = [
prefixed_classes(
'SplitScreenContentHeaderHed- SplitScreenContentHeaderDek- SplitScreenContentHeaderByline-'
' SplitScreenContentHeaderLeadWrapper-'
),
classes( classes(
'split-screen-content-header__dek split-screen-content-header__hed' 'split-screen-content-header__dek split-screen-content-header__hed'
' content-header__dek content-header__hed content-header__publish-date content-header__lede-block' ' content-header__dek content-header__hed content-header__publish-date content-header__lede-block'
@ -59,6 +56,7 @@ class NewYorker(BasicNewsRecipe):
classes( classes(
'social-icons' 'social-icons'
), ),
prefixed_classes('ConsentBannerWrapper-'),
dict(childtypes='iframe'), dict(childtypes='iframe'),
] ]
remove_attributes = ['style'] remove_attributes = ['style']