This commit is contained in:
Kovid Goyal 2025-03-27 22:46:03 +05:30
commit 2ced906a0b
No known key found for this signature in database
GPG Key ID: 06BC317B515ACE7C

View File

@ -28,14 +28,14 @@ class AssociatedPress(BasicNewsRecipe):
classes('StoryPage-lede-content Page-lead Page-byline-info RichTextStoryBody'), classes('StoryPage-lede-content Page-lead Page-byline-info RichTextStoryBody'),
] ]
remove_tags = [ remove_tags = [
classes('displayNone Advertisement HTMLModuleEnhancement videoSlide'), classes('displayNone Advertisement HTMLModuleEnhancement AudioEnhancement'),
dict( dict(
name=[ name=[
'source', 'source',
'button', 'button',
'svg', 'svg',
'template', 'template',
'bsp-jw-player', 'video',
'astro-island', 'astro-island',
'iframe', 'iframe',
'document', 'document',
@ -64,7 +64,10 @@ class AssociatedPress(BasicNewsRecipe):
return [('Articles', feeds)] return [('Articles', feeds)]
def preprocess_html(self, soup): def preprocess_html(self, soup):
for st in soup.findAll(**classes('CarouselSlide-infoDescription')): for v in soup.findAll('bsp-jw-player', attrs={'poster': True}):
v.name = 'img'
v.attrs = {'src': v.get('poster', '')}
for st in soup.findAll(**classes('CarouselSlide-infoDescription Figure-caption')):
if p := st.find('p'): if p := st.find('p'):
p.name = 'span' p.name = 'span'
for h in soup.findAll(['h2', 'h3']): for h in soup.findAll(['h2', 'h3']):