From 1cf37c8400d16e7159b259108660eaed509f683a Mon Sep 17 00:00:00 2001
From: bobbysteel
Date: Sun, 27 Aug 2017 14:38:09 +0100
Subject: [PATCH] Fix Financial Times UK categories

Group the index page's articles by section instead of returning one flat
"Articles" feed: every div marked data-trackable="list" becomes a feed
titled from its <h2>, holding that block's main-link anchors.
---
Review notes (this area is ignored when the patch is applied):
* Line breaks and indentation were reconstructed from a copy of this patch
  that had been collapsed onto a single line. The 4-space recipe
  indentation and the truly-empty blank lines are assumed; confirm them
  against recipes/financial_times_uk.recipe before applying.
* The added lines differ from the original submission: unused initialisers
  were dropped, a missing <h2> is guarded, and sections without links are
  skipped. The post-image hash on the "index" line is therefore stale;
  regenerate the patch with git format-patch after applying.

 recipes/financial_times_uk.recipe | 30 +++++++++++++++++++++++-------
 1 file changed, 23 insertions(+), 7 deletions(-)

diff --git a/recipes/financial_times_uk.recipe b/recipes/financial_times_uk.recipe
index b3cae18735..f2378a3f78 100644
--- a/recipes/financial_times_uk.recipe
+++ b/recipes/financial_times_uk.recipe
@@ -86,12 +86,28 @@ class FinancialTimes(BasicNewsRecipe):
     def parse_index(self):
-        articles = []
+        '''
+        Build one feed per section block found on the index page.
+
+        Returns a list of (section title, articles) tuples; each article is a
+        dict with 'title', 'url', 'description' and 'date' keys.
+        '''
         soup = self.index_to_soup(self.INDEX)
-
-        for article in soup.findAll('a', href=True, attrs={'data-trackable':'main-link'}):
-            url = self.PREFIX + article['href']
-            title = self.tag_to_string(article)
-            articles.append({'title': title, 'url': url, 'description': '', 'date': ''})
-        return [("Articles", articles)]
+        feeds = []
+        for section in soup.findAll('div', attrs={'data-trackable': 'list'}):
+            # The section name is read from the block's <h2>; a block without
+            # one keeps the previous catch-all feed name.
+            heading = section.find('h2')
+            section_title = self.tag_to_string(heading) if heading is not None else 'Articles'
+            self.log('in section: ', section_title)
+            articles = []
+            for link in section.findAll('a', href=True, attrs={'data-trackable': 'main-link'}):
+                url = self.PREFIX + link['href']
+                title = self.tag_to_string(link)
+                articles.append({'title': title, 'url': url, 'description': '', 'date': ''})
+                self.log('title: ', title, ' url: ', url)
+            # Blocks with no article links would only add empty sections.
+            if articles:
+                feeds.append((section_title, articles))
+        return feeds
 
     def preprocess_html(self, soup):
         for img in soup.findAll('img', srcset=True):