Add a no-subscription-needed version of the recipe for The New York Review of Books

2026-03-06 08:53:40 -05:00 · 2009-03-12 16:27:09 -07:00 · 2009-03-12 16:27:09 -07:00 · ec95fab482
commit ec95fab482
parent 4d5c538f89
2 changed files with 45 additions and 0 deletions
--- a/src/calibre/web/feeds/recipes/__init__.py
+++ b/src/calibre/web/feeds/recipes/__init__.py
@@ -34,6 +34,7 @@ recipe_modules = ['recipe_' + r for r in (
           'al_jazeera', 'winsupersite', 'borba', 'courrierinternational',
           'lamujerdemivida', 'soldiers', 'theonion', 'news_times',
           'el_universal', 'mediapart', 'wikinews_en', 'ecogeek', 'daily_mail',
+           'new_york_review_of_books_no_sub',
          )]

 import re, imp, inspect, time, os
--- a/src/calibre/web/feeds/recipes/recipe_new_york_review_of_books_no_sub.py
+++ b/src/calibre/web/feeds/recipes/recipe_new_york_review_of_books_no_sub.py
@@ -0,0 +1,44 @@
+#!/usr/bin/env  python
+__license__   = 'GPL v3'
+__copyright__ = '2008, Kovid Goyal kovid@kovidgoyal.net'
+__docformat__ = 'restructuredtext en'
+
+'''
+nybooks.com
+'''
+
+from calibre.web.feeds.news import BasicNewsRecipe
+from lxml import html
+from calibre.constants import preferred_encoding
+
+class NewYorkReviewOfBooks(BasicNewsRecipe):
+    '''Recipe for the current issue of nybooks.com, fetched without logging in.'''
+    title = u'New York Review of Books (no subscription)'
+    description = u'Book reviews'
+    language = _('English')
+    __author__ = 'Kovid Goyal'
+    remove_tags_before = {'id':'container'}
+    remove_tags = [{'class':['noprint', 'ad', 'footer']}, {'id':'right-content'}]
+
+    def parse_index(self):
+        '''Scrape the current-issue page and return [('Current Issue', articles)];
+        each article is a dict with 'title', 'date', 'url' and 'description'.'''
+        root = html.fromstring(self.browser.open('http://www.nybooks.com/current-issue').read())
+        date = root.xpath('//h4[@class = "date"]')[0]
+        self.timefmt = ' ['+date.text.encode(preferred_encoding)+']'
+        articles = []
+        for tag in date.itersiblings():
+            if tag.tag == 'h4': break  # the next heading ends the listing
+            if tag.tag != 'p': continue
+            if tag.get('class') == 'indented':
+                # Blurb for the preceding article; ignore it if there is none.
+                if articles:
+                    articles[-1]['description'] += html.tostring(tag)
+                continue
+            links = tag.xpath('descendant::a[@href]')
+            if not links: continue  # a paragraph without a link is not an article
+            articles.append({'title': u''.join(tag.xpath('descendant::text()')),
+                             'date': '', 'description': '',
+                             'url': 'http://www.nybooks.com'+links[0].get('href')})
+        return [('Current Issue', articles)]
+