diff --git a/src/libprs500/ebooks/lrf/web/__init__.py b/src/libprs500/ebooks/lrf/web/__init__.py index 99a5f55a54..5c6c9dbdaa 100644 --- a/src/libprs500/ebooks/lrf/web/__init__.py +++ b/src/libprs500/ebooks/lrf/web/__init__.py @@ -31,10 +31,11 @@ from libprs500.ebooks.lrf.web.profiles.jpost import JerusalemPost from libprs500.ebooks.lrf.web.profiles.reuters import Reuters from libprs500.ebooks.lrf.web.profiles.atlantic import Atlantic from libprs500.ebooks.lrf.web.profiles.ap import AssociatedPress +from libprs500.ebooks.lrf.web.profiles.newyorker import NewYorker builtin_profiles = [Atlantic, AssociatedPress, Barrons, BBC, ChristianScienceMonitor, CNN, Dilbert, Economist, FazNet, - JerusalemPost, Newsweek, NewYorkReviewOfBooks, NYTimes, + JerusalemPost, Newsweek, NewYorker, NewYorkReviewOfBooks, NYTimes, Portfolio, Reuters, SpiegelOnline, WallStreetJournal, ZeitNachrichten, ] diff --git a/src/libprs500/ebooks/lrf/web/profiles/newyorker.py b/src/libprs500/ebooks/lrf/web/profiles/newyorker.py new file mode 100644 index 0000000000..b9502010ba --- /dev/null +++ b/src/libprs500/ebooks/lrf/web/profiles/newyorker.py @@ -0,0 +1,56 @@ +''' + Profile to download The New Yorker +''' + +import re + +from libprs500.ebooks.lrf.web.profiles import DefaultProfile + +class NewYorker(DefaultProfile): + + title = 'The New Yorker' + max_recursions = 2 + timefmt = ' [%d %b %Y]' + max_articles_per_feed = 20 + html_description = True + no_stylesheets = True + oldest_article = 14 + + + ## Getting the print version + def print_version(self, url): + return url + '?printable=true' + + + preprocess_regexps = [ + (re.compile(r'