diff --git a/src/libprs500/ebooks/lrf/web/convert_from.py b/src/libprs500/ebooks/lrf/web/convert_from.py index 3e3c484bd3..b69f4ca244 100644 --- a/src/libprs500/ebooks/lrf/web/convert_from.py +++ b/src/libprs500/ebooks/lrf/web/convert_from.py @@ -28,8 +28,9 @@ from libprs500.ebooks.lrf.web.profiles.nytimes import NYTimes from libprs500.ebooks.lrf.web.profiles.bbc import BBC from libprs500.ebooks.lrf.web.profiles.newsweek import Newsweek from libprs500.ebooks.lrf.web.profiles.economist import Economist +from libprs500.ebooks.lrf.web.profiles.newyorkreview import NewYorkReviewOfBooks -builtin_profiles = [NYTimes, BBC, Newsweek, Economist] +builtin_profiles = [NYTimes, BBC, Newsweek, Economist, NewYorkReviewOfBooks] available_profiles = [i.__module__.rpartition('.')[2] for i in builtin_profiles] def option_parser(): diff --git a/src/libprs500/ebooks/lrf/web/profiles/newyorkreview.py b/src/libprs500/ebooks/lrf/web/profiles/newyorkreview.py new file mode 100644 index 0000000000..81f056984a --- /dev/null +++ b/src/libprs500/ebooks/lrf/web/profiles/newyorkreview.py @@ -0,0 +1,23 @@ +from libprs500.ebooks.lrf.web.profiles import DefaultProfile + +import re + +class NewYorkReviewOfBooks(DefaultProfile): + + title = 'New York Review of Books' + max_recursions = 2 + max_articles_per_feed = 50 + html_description = True + no_stylesheets = True + + def get_feeds(self): + return [ ('Current Issue', 'http://feeds.feedburner.com/nybooks') ] + + preprocess_regexps = [(re.compile(i[0], re.IGNORECASE | re.DOTALL), i[1]) for i in [ + (r')|(
)|(
)|(

)|())', lambda match: '

'), + (r'(()|(
)|(

©)|(