mirror of
https://github.com/kovidgoyal/calibre.git
synced 2025-07-09 03:04:10 -04:00
no new content since 2014
This commit is contained in:
parent
ce4a738581
commit
99299512f6
Binary file not shown.
Before Width: | Height: | Size: 502 B |
@ -1,37 +0,0 @@
|
|||||||
from calibre.web.feeds.news import BasicNewsRecipe
|
|
||||||
from calibre.ebooks.BeautifulSoup import Comment
|
|
||||||
|
|
||||||
class OCLab(BasicNewsRecipe):
|
|
||||||
title = u'OCLab.pl'
|
|
||||||
oldest_article = 7
|
|
||||||
max_articles_per_feed = 100
|
|
||||||
__author__ = 'fenuks'
|
|
||||||
description = u'Portal OCLab.pl jest miejscem przyjaznym pasjonatom sprzętu komputerowego, w szczególności overclockerom, które będzie służyć im za aktualną bazę wiedzy o podkręcaniu komputera, źródło aktualnych informacji z rynku oraz opinii na temat sprzętu komputerowego.'
|
|
||||||
category = 'IT'
|
|
||||||
language = 'pl'
|
|
||||||
cover_url= 'http://www.idealforum.ru/attachment.php?attachmentid=7963&d=1316008118'
|
|
||||||
no_stylesheets = True
|
|
||||||
keep_only_tags=[dict(id='main')]
|
|
||||||
remove_tags_after= dict(attrs={'class':'single-postmetadata'})
|
|
||||||
remove_tags=[dict(attrs={'class':['single-postmetadata', 'pagebar', 'shr-bookmarks shr-bookmarks-expand shr-bookmarks-center shr-bookmarks-bg-enjoy']})]
|
|
||||||
feeds = [(u'Wpisy', u'http://oclab.pl/feed/')]
|
|
||||||
|
|
||||||
|
|
||||||
def append_page(self, soup, appendtag):
|
|
||||||
tag=soup.find(attrs={'class':'contentjumpddl'})
|
|
||||||
if tag:
|
|
||||||
nexturl=tag.findAll('option')
|
|
||||||
for nextpage in nexturl[1:-1]:
|
|
||||||
soup2 = self.index_to_soup(nextpage['value'])
|
|
||||||
pagetext = soup2.find(attrs={'class':'single-entry'})
|
|
||||||
pos = len(appendtag.contents)
|
|
||||||
appendtag.insert(pos, pagetext)
|
|
||||||
for r in appendtag.findAll(attrs={'class':'post-nav-bottom-list'}):
|
|
||||||
r.extract()
|
|
||||||
comments = appendtag.findAll(text=lambda text:isinstance(text, Comment))
|
|
||||||
for comment in comments:
|
|
||||||
comment.extract()
|
|
||||||
|
|
||||||
def preprocess_html(self, soup):
|
|
||||||
self.append_page(soup, soup.body)
|
|
||||||
return soup
|
|
Loading…
x
Reference in New Issue
Block a user