From 51b819f6387286d921d56eecebd0c17b644b24c0 Mon Sep 17 00:00:00 2001 From: Kovid Goyal Date: Sat, 15 Oct 2011 06:15:28 +0530 Subject: [PATCH] Fix 874643 --- recipes/icons/la_republica.png | Bin 0 -> 868 bytes recipes/la_republica.recipe | 56 ++++++++++++++++++--------------- 2 files changed, 30 insertions(+), 26 deletions(-) create mode 100644 recipes/icons/la_republica.png diff --git a/recipes/icons/la_republica.png b/recipes/icons/la_republica.png new file mode 100644 index 0000000000000000000000000000000000000000..e24405b6d4511c7b54d9e4b61b7bd922926527b5 GIT binary patch literal 868 zcmV-q1DpJbP)0009kNklY@O^)~-M(b8VzKDDZnavi z*Xy}l?j<^t31l*vm#p-FX0sUtL8VgB)br;Rn^D1RHiIczt=9Q`*3pwpAe+tVEbttl zQ79DF>$S3mWCHDWTUk4U%jE)7L{X&nIF&~6hQcsB91gr*#4ExS>Fablk&jHLQ-zl$ zr~{=^iR6IY@Av!oZ+JQUgn0_Sy4h@yrpW!o5Cn0z+a)FMQ{?C8XRTIao`NrdEx(@_ z0s_jFXfm0QlCW^U-xn#jkw(EBS)UXhkH;eAmg+#G(I6$^NTQ5niGZl$&gXMp*b)JR zHBu8PEUIhvS_!^;gBS5??Ge!L+rEXMkioL3`HW<_Tt-QH_!0SWI2@8|@w-Z`8+`)s z=Y{PN;Kw>q#e7Esq@%{LM_{+xk&+lVd9{`Z;PsQq5uKlCT((4juT6Z<8^aO-vd2XJ zk(LV^1khlTa~XyQsdD245WD2-$4IF#au^|ikj1{^N!s%~CVbTfV#iP`Ap%BWc#bG_ z-XrB!qSxykk4NR*JLwWY&KV2_nunxm5gI7z6xamh#!UW0U~jSEAKhEEa037$ks5 z$mjEDT zS7qc=-jR|CU@J(^zVGv2JwOuj4@n*KJNdYCvlz)C;amuFx955M!ViGkVBeiiC;pfJ zZXyOkf4N*f|9T?90-C1=h{*d(Uy%`6K*IK^gwzO$NFV_J<8Ro% u0x|F~-NOi?TAMi5{eTZ&-yFXL(#AhWQgd%jDdNEZ0000', re.DOTALL|re.IGNORECASE), lambda match: ''), + (re.compile(r'.*?', re.DOTALL|re.IGNORECASE), lambda match: '<head><title>'), + (re.compile(r'.*?', re.DOTALL|re.IGNORECASE), lambda match: '') + ] + def get_article_url(self, article): link = article.get('id', article.get('guid', None)) if link is None: return article return link - - keep_only_tags = [dict(name='div', attrs={'class':'articolo'}), - dict(name='div', attrs={'class':'body-text'}), -# dict(name='div', attrs={'class':'page-content'}), + + keep_only_tags = [ + dict(attrs={'class':'articolo'}), + dict(attrs={'class':'body-text'}), dict(name='p', attrs={'class':'disclaimer clearfix'}), - dict(name='div', attrs={'id':'contA'}) + dict(attrs={'id':'contA'}) ] remove_tags = [ - dict(name=['object','link']), + dict(name=['object','link','meta']), dict(name='span',attrs={'class':'linkindice'}), dict(name='div', attrs={'class':'bottom-mobile'}), dict(name='div', attrs={'id':['rssdiv','blocco']}),