Fix Gawker

This commit is contained in:
Kovid Goyal 2011-02-25 13:15:12 -07:00
parent 40006a5b4b
commit e6c49c4a9f

View File

@@ -16,14 +16,10 @@ class Gawker(BasicNewsRecipe):
max_articles_per_feed = 100 max_articles_per_feed = 100
no_stylesheets = True no_stylesheets = True
encoding = 'utf-8' encoding = 'utf-8'
use_embedded_content = False use_embedded_content = True
language = 'en' language = 'en'
masthead_url = 'http://cache.gawkerassets.com/assets/gawker.com/img/logo.png' masthead_url = 'http://cache.gawkerassets.com/assets/gawker.com/img/logo.png'
extra_css = '''
body{font-family: "Lucida Grande",Helvetica,Arial,sans-serif}
img{margin-bottom: 1em}
h1{font-family :Arial,Helvetica,sans-serif; font-size:large}
'''
conversion_options = { conversion_options = {
'comment' : description 'comment' : description
, 'tags' : category , 'tags' : category
@@ -31,13 +27,11 @@ class Gawker(BasicNewsRecipe):
, 'language' : language , 'language' : language
} }
remove_attributes = ['width','height'] remove_tags = [
keep_only_tags = [dict(attrs={'class':'content permalink'})] {'class': 'feedflare'},
remove_tags_before = dict(name='h1') ]
remove_tags = [dict(attrs={'class':'contactinfo'})]
remove_tags_after = dict(attrs={'class':'contactinfo'})
feeds = [(u'Articles', u'http://feeds.gawker.com/gawker/full')] feeds = [(u'Articles', u'http://feeds.gawker.com/gawker/vip?format=xml')]
def preprocess_html(self, soup): def preprocess_html(self, soup):
return self.adeify_images(soup) return self.adeify_images(soup)