Fix missing first paragraph in USA Today download

This commit is contained in:
Kovid Goyal 2009-08-27 22:02:18 -06:00
parent b34bdd60cd
commit c8d70c591f
2 changed files with 10 additions and 8 deletions

View File

@@ -108,7 +108,7 @@ sudo python -c "import urllib2; exec urllib2.urlopen('http://status.calibre-eboo
<pre class="wiki"> <pre class="wiki">
wget -O- http://calibre.kovidgoyal.net/downloads/${app}-${version}.tar.gz | tar xvz wget -O- http://calibre.kovidgoyal.net/downloads/${app}-${version}.tar.gz | tar xvz
cd calibre* cd calibre*
python setup.py build &amp;&amp; sudo python setup.py install python setup.py build_ext &amp;&amp; python setup.py build &amp;&amp; sudo python setup.py install
sudo calibre_postinstall sudo calibre_postinstall
</pre> </pre>
Note that if your distribution does not have a Note that if your distribution does not have a

View File

@@ -13,28 +13,30 @@ class USAToday(BasicNewsRecipe):
title = 'USA Today' title = 'USA Today'
timefmt = ' [%d %b %Y]' timefmt = ' [%d %b %Y]'
__author__ = 'Kovid Goyal and Sujata Raman'
max_articles_per_feed = 20 max_articles_per_feed = 20
language = _('English') language = _('English')
__author__ = _('Kovid Goyal and Sujata Raman')
no_stylesheets = True no_stylesheets = True
extra_css = ''' extra_css = '''
.inside-head{font-family:Arial,Helvetica,sans-serif; font-size:large; font-weight:bold } .inside-head{font-family:Arial,Helvetica,sans-serif; font-size:large; font-weight:bold }
.inside-head2{font-family:Arial,Helvetica,sans-serif; font-size:large; font-weight:bold } .inside-head2{font-family:Arial,Helvetica,sans-serif; font-size:large; font-weight:bold }
.inside-head3{font-family:Arial,Helvetica,sans-serif; font-size:large; font-weight:bold } .inside-head3{font-family:Arial,Helvetica,sans-serif; font-size:large; font-weight:bold }
h3{font-family:Arial,Helvetica,sans-serif; font-size:large; font-weight:bold } h3{font-family:Arial,Helvetica,sans-serif; font-size:large; font-weight:bold; }
h4{font-family:Arial,Helvetica,sans-serif; font-size:x-small; font-weight:bold } h4{font-family:Arial,Helvetica,sans-serif; font-size:x-small; font-weight:bold; }
.side-by-side{font-family:Arial,Helvetica,sans-serif; font-size:x-small;} .side-by-side{font-family:Arial,Helvetica,sans-serif; font-size:x-small;}
#byLineTag{font-family:Arial,Helvetica,sans-serif; font-size:xx-small;} #byLineTag{font-family:Arial,Helvetica,sans-serif; font-size:xx-small;}
.inside-copy{font-family:Arial,Helvetica,sans-serif; font-size:x-small;text-align:left} .inside-copy{font-family:Arial,Helvetica,sans-serif; font-size:x-small;text-align:left;}
.caption{font-family:Arial,Helvetica,sans-serif; font-size:x-small;} .caption{font-family:Arial,Helvetica,sans-serif; font-size:x-small;}
li{font-family:Arial,Helvetica,sans-serif; font-size:x-small;text-align:left ;}
.vatext{font-family:Arial,Helvetica,sans-serif; font-size:x-small;text-align:left ;}
.vaTextBold{font-family:Arial,Helvetica,sans-serif; font-size:x-small;font-weight:bold; color:#666666;}
''' '''
remove_tags = [ remove_tags = [
dict(name='div', attrs={'class':'inside-copy'}), {'class':['tagListLabel','piped-taglist-string',]}
{'class':['tagListLabel','piped-taglist-string',]}
] ]
html2lrf_options = ['--ignore-tables'] conversion_options = { 'linearize_tables' : True }
preprocess_regexps = [ preprocess_regexps = [
(re.compile(r'<BODY.*?<!--Article Goes Here-->', re.IGNORECASE | re.DOTALL), lambda match : '<BODY>'), (re.compile(r'<BODY.*?<!--Article Goes Here-->', re.IGNORECASE | re.DOTALL), lambda match : '<BODY>'),