diff --git a/resources/recipes/usatoday.recipe b/resources/recipes/usatoday.recipe index 1a314f652e..368437a709 100644 --- a/resources/recipes/usatoday.recipe +++ b/resources/recipes/usatoday.recipe @@ -7,62 +7,430 @@ usatoday.com ''' from calibre.web.feeds.news import BasicNewsRecipe +from calibre.ebooks.BeautifulSoup import BeautifulSoup, BeautifulStoneSoup, NavigableString, Tag import re class USAToday(BasicNewsRecipe): title = 'USA Today' - timefmt = ' [%d %b %Y]' - __author__ = 'Kovid Goyal and Sujata Raman' + __author__ = 'GRiker' + oldest_article = 1 + timefmt = '' max_articles_per_feed = 20 language = 'en' - - no_stylesheets = True - extra_css = ''' - .inside-head{font-family:Arial,Helvetica,sans-serif; font-size:large; font-weight:bold } - .inside-head2{font-family:Arial,Helvetica,sans-serif; font-size:large; font-weight:bold } - .inside-head3{font-family:Arial,Helvetica,sans-serif; font-size:large; font-weight:bold } - h3{font-family:Arial,Helvetica,sans-serif; font-size:large; font-weight:bold; } - h4{font-family:Arial,Helvetica,sans-serif; font-size:x-small; font-weight:bold; } - .side-by-side{font-family:Arial,Helvetica,sans-serif; font-size:x-small;} - #byLineTag{font-family:Arial,Helvetica,sans-serif; font-size:xx-small;} - .inside-copy{font-family:Arial,Helvetica,sans-serif; font-size:x-small;text-align:left;} - .caption{font-family:Arial,Helvetica,sans-serif; font-size:x-small;} - li{font-family:Arial,Helvetica,sans-serif; font-size:x-small;text-align:left ;} - .vatext{font-family:Arial,Helvetica,sans-serif; font-size:x-small;text-align:left ;} - .vaTextBold{font-family:Arial,Helvetica,sans-serif; font-size:x-small;font-weight:bold; color:#666666;} - ''' - remove_tags = [ - {'class':['tagListLabel','piped-taglist-string','socialcontainer','social-wrapper',]}, - {'id':['topSocialButtons']}, - ] - + extra_css = '.headline {text-align: left;}\n \ + .byline {font-family: monospace; \ + text-align: left; \ + margin-bottom: 1em;}\n \ + .image {text-align: center;}\n \ + .caption {text-align: center; \ + font-size: smaller; \ + font-style: italic}\n \ + .credit {text-align: right; \ + margin-bottom: 0em; \ + font-size: smaller;}\n \ + .articleBody {text-align: left;}\n ' conversion_options = { 'linearize_tables' : True } - - preprocess_regexps = [ - (re.compile(r'