diff --git a/src/libprs500/ebooks/lrf/web/profiles/chr_mon.py b/src/libprs500/ebooks/lrf/web/profiles/chr_mon.py index 0fc068af42..42dbfc1dc7 100644 --- a/src/libprs500/ebooks/lrf/web/profiles/chr_mon.py +++ b/src/libprs500/ebooks/lrf/web/profiles/chr_mon.py @@ -1,38 +1,46 @@ -import re + +import re, time from libprs500.ebooks.lrf.web.profiles import DefaultProfile +from libprs500.ebooks.BeautifulSoup import BeautifulSoup class ChristianScienceMonitor(DefaultProfile): title = 'Christian Science Monitor' max_recursions = 2 max_articles_per_feed = 20 - use_pubdate = False - html_description = True - html2lrf_options = ['--ignore-tables', '--base-font-size=8.0', '--wordspace=2.0',] + no_stylesheets = True + + preprocess_regexps = [ (re.compile(i[0], re.IGNORECASE | re.DOTALL), i[1]) for i in -[ - (r'
.*?' , lambda match : ''), - (r'.*?', lambda match : ''), - (r'.*?', lambda match : ''), - (r'', lambda match : ''), - (r'.*?