diff --git a/src/libprs500/ebooks/lrf/web/__init__.py b/src/libprs500/ebooks/lrf/web/__init__.py index 2452d7b4d1..4eb0432c18 100644 --- a/src/libprs500/ebooks/lrf/web/__init__.py +++ b/src/libprs500/ebooks/lrf/web/__init__.py @@ -25,10 +25,15 @@ from libprs500.ebooks.lrf.web.profiles.wsj import WallStreetJournal from libprs500.ebooks.lrf.web.profiles.barrons import Barrons from libprs500.ebooks.lrf.web.profiles.portfolio import Portfolio from libprs500.ebooks.lrf.web.profiles.dilbert import Dilbert -from libprs500.ebooks.lrf.web.profiles.cnn import CNN +from libprs500.ebooks.lrf.web.profiles.cnn import CNN +from libprs500.ebooks.lrf.web.profiles.chr_mon import ChristianScienceMonitor +from libprs500.ebooks.lrf.web.profiles.jpost import JerusalemPost +from libprs500.ebooks.lrf.web.profiles.reuters import Reuters +from libprs500.ebooks.lrf.web.profiles.atlantic import Atlantic -builtin_profiles = [Barrons, BBC, CNN, Dilbert, Economist, FazNet, Newsweek, NewYorkReviewOfBooks, NYTimes, \ - Portfolio, SpiegelOnline, WallStreetJournal, ZeitNachrichten, \ +builtin_profiles = [Atlantic, Barrons, BBC, ChristianScienceMonitor, CNN, Dilbert, Economist, FazNet, + JerusalemPost, Newsweek, NewYorkReviewOfBooks, NYTimes, + Portfolio, Reuters, SpiegelOnline, WallStreetJournal, ZeitNachrichten, ] available_profiles = [i.__module__.rpartition('.')[2] for i in builtin_profiles] \ No newline at end of file diff --git a/src/libprs500/ebooks/lrf/web/profiles/atlantic.py b/src/libprs500/ebooks/lrf/web/profiles/atlantic.py new file mode 100644 index 0000000000..6bd3944db6 --- /dev/null +++ b/src/libprs500/ebooks/lrf/web/profiles/atlantic.py @@ -0,0 +1,59 @@ +## Copyright (C) 2008 Kovid Goyal kovid@kovidgoyal.net +## This program is free software; you can redistribute it and/or modify +## it under the terms of the GNU General Public License as published by +## the Free Software Foundation; either version 2 of the License, or +## (at your option) any later version. +## +## This program is distributed in the hope that it will be useful, +## but WITHOUT ANY WARRANTY; without even the implied warranty of +## MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +## GNU General Public License for more details. +## +## You should have received a copy of the GNU General Public License along +## with this program; if not, write to the Free Software Foundation, Inc., +## 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. +import re +from libprs500.ebooks.lrf.web.profiles import DefaultProfile +from libprs500.ebooks.BeautifulSoup import BeautifulSoup + +class Atlantic(DefaultProfile): + + title = 'The Atlantic' + max_recursions = 2 + INDEX = 'http://www.theatlantic.com/doc/current' + + preprocess_regexps = [ + (re.compile(r'