From 0f78497dc5e02d6335b6c41d4c773d37577390b9 Mon Sep 17 00:00:00 2001 From: Kovid Goyal Date: Sat, 22 Jul 2017 23:13:40 +0530 Subject: [PATCH] =?UTF-8?q?Fix=20#1705822=20[Impossible=20de=20r=C3=A9cup?= =?UTF-8?q?=C3=A9rer=20des=20actualit=C3=A9s=20Mediapart](https://bugs.lau?= =?UTF-8?q?nchpad.net/calibre/+bug/1705822)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- recipes/mediapart.recipe | 7 ++----- 1 file changed, 2 insertions(+), 5 deletions(-) diff --git a/recipes/mediapart.recipe b/recipes/mediapart.recipe index 7f6a0214b3..5c8023c21e 100644 --- a/recipes/mediapart.recipe +++ b/recipes/mediapart.recipe @@ -9,7 +9,6 @@ Mediapart ''' import re -from calibre.ebooks.BeautifulSoup import BeautifulSoup from calibre.web.feeds.news import BasicNewsRecipe from calibre.web.feeds import feeds_from_index from datetime import date, timedelta @@ -54,7 +53,7 @@ class Mediapart(BasicNewsRecipe): soup = self.index_to_soup( 'https://www.mediapart.fr/journal/fil-dactualites') - page = soup.find('section', {'class': 'global-wrapper'}) + page = soup.find('main', {'class': 'global-wrapper'}) fils = page.find('ul', {'class': 'post-list universe-journal'}) for article in fils.findAll('li'): @@ -129,8 +128,7 @@ class Mediapart(BasicNewsRecipe): 'août', 'septembre', 'octobre', 'novembre', 'décembre'].index(date_arr[1])) def print_version(self, url): - raw = self.browser.open(url).read() - soup = BeautifulSoup(raw.decode('utf8', 'replace')) + soup = self.index_to_soup(url) # Filter old articles # article_date = self.parse_french_date(self.tag_to_string(soup.find('span', 'article-date'))) @@ -139,7 +137,6 @@ class Mediapart(BasicNewsRecipe): tools = soup.find('li', {'class': 'print'}) link = tools.find('a', {'href': re.compile(r'\/print\/.*')}) - print(link['href']) # if link is None: # print 'Error: print link not found' # return None