From 48cbe5fb5f43a1634b47b25b24c338fba5059a28 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tomasz=20D=C5=82ugosz?= Date: Thu, 4 Apr 2013 22:39:27 +0200 Subject: [PATCH 1/2] icon for newsweek_polska --- recipes/icons/newsweek_polska.png | Bin 0 -> 905 bytes 1 file changed, 0 insertions(+), 0 deletions(-) create mode 100644 recipes/icons/newsweek_polska.png diff --git a/recipes/icons/newsweek_polska.png b/recipes/icons/newsweek_polska.png new file mode 100644 index 0000000000000000000000000000000000000000..83e84b89e2e989e12e1d813f7c845ef56e713636 GIT binary patch literal 905 zcmeAS@N?(olHy`uVBq!ia0vp^0wB!61SBU+%rFB|jKx9jP7LeL$-D$|I14-?iy0WW zg+Z8+Vb&Z8pdfpRr>`sf9d03UZ4Os0iFgJEW@%3s#}ExsMgivce;6OL0hN;gK$epP z5E^8DzJVaAmv@;2_<^SI)t12p;f5kKAcO??`MX=-Tr>t24L}v#agpqH)@Vv0TNUK&345a-?a%R1FltV#CivM}J?uf>kwk4M5QkCDo*9 z09x{O(Q>SMus8{#?qg}qzYiZV^&o;3Xevbd+u{{K22l0;)Lg!rGPJ;@eQG^E+2F8l S-;*yO*Lb@6xvX Date: Sun, 7 Apr 2013 23:14:08 +0200 Subject: [PATCH 2/2] fixes for fronda --- recipes/fronda.recipe | 21 ++++++++++++--------- 1 file changed, 12 insertions(+), 9 deletions(-) diff --git a/recipes/fronda.recipe b/recipes/fronda.recipe index 6ed5d052a3..5ae78ae848 100644 --- a/recipes/fronda.recipe +++ b/recipes/fronda.recipe @@ -23,6 +23,7 @@ class Fronda(BasicNewsRecipe): extra_css = ''' h1 {font-size:150%} .body {text-align:left;} + div#featured-image {font-style:italic; font-size:70%} ''' earliest_date = date.today() - timedelta(days=oldest_article) @@ -55,7 +56,10 @@ class Fronda(BasicNewsRecipe): articles = {} for url, genName in genres: - soup = self.index_to_soup('http://www.fronda.pl/c/'+ url) + try: + soup = self.index_to_soup('http://www.fronda.pl/c/'+ url) + except: + continue articles[genName] = [] for item in soup.findAll('li'): article_h = item.find('h2') @@ -77,16 +81,15 @@ class Fronda(BasicNewsRecipe): ] remove_tags = [ - dict(name='div', attrs={'class':['related-articles', - 'button right', - 'pagination']}), + dict(name='div', attrs={'class':['related-articles','button right','pagination','related-articles content']}), dict(name='h3', attrs={'class':'block-header article comments'}), - dict(name='ul', attrs={'class':'comment-list'}), - dict(name='ul', attrs={'class':'category'}), - dict(name='ul', attrs={'class':'tag-list'}), + dict(name='ul', attrs={'class':['comment-list','category','tag-list']}), dict(name='p', attrs={'id':'comments-disclaimer'}), dict(name='div', attrs={'style':'text-align: left; margin-bottom: 15px;'}), dict(name='div', attrs={'style':'text-align: left; margin-top: 15px; margin-bottom: 30px;'}), - dict(name='div', attrs={'class':'related-articles content'}), - dict(name='div', attrs={'id':'comment-form'}) + dict(name='div', attrs={'id':'comment-form'}), + dict(name='span', attrs={'class':'separator'}) ] + + preprocess_regexps = [ + (re.compile(r'komentarzy: .*?', re.IGNORECASE | re.DOTALL | re.M ), lambda match: '')]