mirror of
https://github.com/kovidgoyal/calibre.git
synced 2025-07-09 03:04:10 -04:00
remove non-working recipes
This commit is contained in:
parent
1a3d3600b1
commit
c8b372bb2c
@@ -1,48 +0,0 @@
|
||||
# -*- coding: utf-8 -*-
|
||||
import re
|
||||
from calibre.web.feeds.recipes import BasicNewsRecipe
|
||||
|
||||
|
||||
class hu168ora(BasicNewsRecipe):
    """Calibre news recipe for the Hungarian weekly "168 ora".

    Articles come from the per-section RSS feeds listed in ``feeds``; each
    article URL is rewritten by ``print_version`` before it is fetched.
    """

    # --- Publication metadata -------------------------------------------
    title = u'168 óra'
    description = u'A 168 óra friss hírei'
    publisher = u'Telegráf Kiadó'
    category = u'news, hírek, 168'
    language = 'hu'
    __author__ = u'István Papp'
    timefmt = ' [%Y. %b. %d., %a.]'

    # --- Download settings ----------------------------------------------
    oldest_article = 7
    max_articles_per_feed = 100
    remove_empty_feeds = True
    use_embedded_content = False
    encoding = 'utf8'

    # --- Page clean-up ---------------------------------------------------
    no_stylesheets = True
    remove_javascript = True
    extra_css = 'body{ font-family: Verdana,Helvetica,Arial,sans-serif }'
    # Drop HTML comments; DOTALL lets the pattern span multi-line comments.
    preprocess_regexps = [
        (re.compile(r'<!--.*?-->', re.DOTALL), lambda match: ''),
    ]
    # Only the article header and body containers are kept ...
    keep_only_tags = [
        {'id': 'cikk_fejlec'},
        {'id': 'cikk_torzs'},
    ]
    # ... and these elements are removed.
    remove_tags = [
        {'id': 'box_toolbar'},
        {'id': 'text'},
    ]

    # --- Sections (title, RSS address) ------------------------------------
    feeds = [
        (u'Itthon', u'http://www.168ora.hu/static/rss/cikkek_itthon.xml'),
        (u'Glóbusz', u'http://www.168ora.hu/static/rss/cikkek_globusz.xml'),
        (u'Punch', u'http://www.168ora.hu/static/rss/cikkek_punch.xml'),
        (u'Arte', u'http://www.168ora.hu/static/rss/cikkek_arte.xml'),
        (u'Buxa', u'http://www.168ora.hu/static/rss/cikkek_buxa.xml'),
        (u'Sebesség', u'http://www.168ora.hu/static/rss/cikkek_sebesseg.xml'),
        (u'Tudás', u'http://www.168ora.hu/static/rss/cikkek_tudas.xml'),
        (u'Sport', u'http://www.168ora.hu/static/rss/cikkek_sport.xml'),
        (u'Vélemény', u'http://www.168ora.hu/static/rss/cikkek_velemeny.xml'),
        (u'Dolce Vita', u'http://www.168ora.hu/static/rss/cikkek_dolcevita.xml'),
        # The radio feed was left disabled by the recipe author:
        # (u'Rádió', u'http://www.168ora.hu/static/rss/radio.xml')
    ]

    def print_version(self, url):
        """Return ``url`` with the ``?print=1`` suffix appended."""
        return url + '?print=1'
|
@@ -1,21 +0,0 @@
|
||||
#!/usr/bin/env python2
|
||||
# vim:fileencoding=UTF-8:ts=4:sw=4:sta:et:sts=4:ai
|
||||
from __future__ import with_statement
|
||||
|
||||
__license__ = 'GPL v3'
|
||||
__copyright__ = '2009, Kovid Goyal <kovid@kovidgoyal.net>'
|
||||
__docformat__ = 'restructuredtext en'
|
||||
|
||||
from calibre.web.feeds.news import BasicNewsRecipe
|
||||
|
||||
|
||||
class ATV(BasicNewsRecipe):
    """Calibre news recipe for the Hungarian broadcaster ATV (atv.hu).

    Purely declarative: two RSS feeds, no custom clean-up or hooks.
    """

    __author__ = 'Ezmegaz'

    title = u'ATV'
    language = 'hu'

    # Download limits.
    oldest_article = 5
    max_articles_per_feed = 50

    # (section title, RSS address) pairs.
    feeds = [
        (u'H\xedrek', u'http://atv.hu/rss/1'),
        (u'Cikkek', u'http://atv.hu/rss/2'),
    ]
|
@@ -1,46 +0,0 @@
|
||||
# -*- coding: utf-8 -*-
|
||||
|
||||
from calibre.web.feeds.news import BasicNewsRecipe
|
||||
|
||||
|
||||
class Haber7TS(BasicNewsRecipe):
    """Calibre news recipe for the Haber 7 "TUMSPOR" sports section.

    Articles come from the per-sport feeds listed in ``feeds``. After
    download, every ``<a>`` element that wraps a single text node is
    replaced by that text (see ``preprocess_html``).
    """

    title = u'H7 TÜMSPOR'
    __author__ = u'thomass'
    description = ' Haber 7 TÜMSPOR sitesinden tüm branşlarda spor haberleri '
    oldest_article = 2
    max_articles_per_feed = 100
    no_stylesheets = True
    encoding = 'ISO 8859-9'
    publisher = 'thomass'
    category = 'güncel, haber, türkçe,spor,futbol'
    language = 'tr'
    publication_type = 'newspaper'

    # Built from the attributes above, so it must stay below them.
    conversion_options = {
        'tags': category,
        'language': language,
        'publisher': publisher,
        'linearize_tables': True,
    }
    extra_css = ' #newsheadcon h1{font-weight: bold; font-size: 18px;color:#0000FF} '

    keep_only_tags = [
        dict(name='div', attrs={'class': ['intNews', 'leftmidmerge']}),
    ]
    remove_tags = [
        dict(name='div', attrs={'id': ['blocktitle', 'banner46860body']}),
        # 'shr' was listed twice in the original; one entry is enough.
        dict(name='div', attrs={'class': [
            'Breadcrumb', 'shr', 'mobile/home.jpg', 'etiket', 'yorumYazNew',
            'y-list', 'banner', 'lftBannerShowcase', 'comments', 'interNews',
            'lftBanner', 'midblock', 'rightblock', 'comnum', 'commentcon',
        ]}),
        dict(name='a', attrs={'class': ['saveto', 'sendto', 'comlink', 'newsshare']}),
        dict(name='iframe', attrs={'name': ['frm111', 'frm107']}),
        dict(name='ul', attrs={'class': ['nocPagi', 'leftmidmerge']}),
    ]

    # BasicNewsRecipe reads ``cover_url``; ``cover_img_url`` is not one of
    # its attributes, so on its own the cover was never used. The old name
    # is kept in case anything else reads it.
    cover_img_url = 'http://image.tumspor.com/v2/images/tasarim/images/logo.jpg'
    cover_url = cover_img_url
    masthead_url = 'http://image.tumspor.com/v2/images/tasarim/images/logo.jpg'
    remove_empty_feeds = True

    feeds = [
        (u'Futbol', u'http://open.dapper.net/services/h7tsfutbol'),
        (u'Basketbol', u'http://open.dapper.net/services/h7tsbasket'),
        (u'Tenis', u'http://open.dapper.net/services/h7tstenis'),
        (u'NBA', u'http://open.dapper.net/services/h7tsnba'),
        (u'Diğer Sporlar', u'http://open.dapper.net/services/h7tsdiger'),
        (u'Yazarlar & Magazin',
         u'http://open.dapper.net/services/h7tsyazarmagazin'),
    ]

    def preprocess_html(self, soup):
        """Replace text-only links with their plain text and return ``soup``.

        Anchors whose ``.string`` is ``None`` are left untouched.
        """
        for link in soup.findAll('a'):
            text = link.string
            if text is not None:
                link.replaceWith(text)
        return soup
|
@@ -1,55 +0,0 @@
|
||||
# -*- coding: utf-8 -*-
|
||||
|
||||
from calibre.web.feeds.news import BasicNewsRecipe
|
||||
|
||||
|
||||
class Haber7(BasicNewsRecipe):
    """Calibre news recipe for the Turkish news site Haber 7.

    Articles come from the per-section feeds listed in ``feeds``. After
    download, every ``<a>`` element that wraps a single text node is
    replaced by that text (see ``preprocess_html``).
    """

    title = u'Haber 7'
    __author__ = u'thomass'
    description = ' Haber 7 sitesinden haberler '
    oldest_article = 2
    max_articles_per_feed = 100
    no_stylesheets = True
    encoding = 'ISO 8859-9'
    publisher = 'thomass'
    category = 'güncel, haber, türkçe'
    language = 'tr'
    publication_type = 'newspaper'

    # Built from the attributes above, so it must stay below them.
    conversion_options = {
        'tags': category,
        'language': language,
        'publisher': publisher,
        'linearize_tables': True,
    }
    extra_css = 'body{ font-size: 12px}h2{font-weight: bold; font-size: 18px;color:#0000FF} #newsheadcon h1{font-weight: bold; font-size: 18px;color:#0000FF}'

    keep_only_tags = [
        dict(name='div', attrs={'class': ['intNews', 'leftmidmerge']}),
    ]
    remove_tags = [
        dict(name='div', attrs={'id': ['blocktitle', 'banner46860body']}),
        # 'shr' was listed twice in the original; one entry is enough.
        dict(name='div', attrs={'class': [
            'Breadcrumb', 'shr', 'mobile/home.jpg', 'etiket', 'yorumYazNew',
            'y-list', 'banner', 'lftBannerShowcase', 'comments', 'interNews',
            'lftBanner', 'midblock', 'rightblock', 'comnum', 'commentcon',
        ]}),
        dict(name='a', attrs={'class': ['saveto', 'sendto', 'comlink', 'newsshare']}),
        dict(name='iframe', attrs={'name': ['frm111', 'frm107']}),
        dict(name='ul', attrs={'class': ['nocPagi', 'leftmidmerge']}),
    ]

    # BasicNewsRecipe reads ``cover_url``; ``cover_img_url`` is not one of
    # its attributes, so on its own the cover was never used. The old name
    # is kept in case anything else reads it.
    cover_img_url = 'http://dl.dropbox.com/u/39726752/haber7.JPG'
    cover_url = cover_img_url
    masthead_url = 'http://dl.dropbox.com/u/39726752/haber7.JPG'
    remove_empty_feeds = True

    feeds = [
        (u'Siyaset', u'http://open.dapper.net/services/h7siyaset'),
        (u'Güncel', u'http://open.dapper.net/services/h7guncel'),
        (u'Yaşam', u'http://open.dapper.net/services/h7yasam'),
        (u'Ekonomi', u'http://open.dapper.net/services/h7ekonomi'),
        (u'3. Sayfa', u'http://open.dapper.net/services/h73sayfa'),
        (u'Dünya', u'http://open.dapper.net/services/h7dunya'),
        (u'Medya', u'http://open.dapper.net/services/h7medya'),

        (u'Yazarlar', u'http://open.dapper.net/services/h7yazarlar'),
        (u'Bilim', u'http://open.dapper.net/services/h7bilim'),
        (u'Eğitim', u'http://open.dapper.net/services/h7egitim'),
        (u'Spor', u'http://open.dapper.net/services/h7sporv3'),
    ]

    def preprocess_html(self, soup):
        """Replace text-only links with their plain text and return ``soup``.

        Anchors whose ``.string`` is ``None`` are left untouched.
        """
        for link in soup.findAll('a'):
            text = link.string
            if text is not None:
                link.replaceWith(text)
        return soup
|
@@ -1,39 +0,0 @@
|
||||
from calibre.web.feeds.news import BasicNewsRecipe
|
||||
|
||||
|
||||
class AdvancedUserRecipe1302341394(BasicNewsRecipe):
    """Calibre news recipe for the Dutch local news site Hallo Assen.

    Purely declarative: metadata, tag filters and a list of RSS feeds.
    """

    # --- Metadata ---------------------------------------------------------
    __author__ = 'Reijndert'
    title = u'Hallo Assen'
    category = u'Nieuws'
    language = 'nl'
    country = 'NL'
    version = 1
    timefmt = ' %Y-%m-%d (%a)'
    cover_url = 'http://www.halloassen.nl/multimedia/halloassen/archive/00002/HalloAssen_2518a.gif'

    # --- Download limits ----------------------------------------------------
    oldest_article = 180
    max_articles_per_feed = 100

    # --- Page clean-up ------------------------------------------------------
    no_stylesheets = True
    keep_only_tags = [
        {'name': 'div', 'attrs': {'class': 'photoFrame'}},
        {'name': 'div', 'attrs': {'class': 'textContent'}},
    ]
    remove_tags = [
        {'name': 'div', 'attrs': {'id': 'articleLinks'}},
        {'name': 'div', 'attrs': {'class': 'categories clearfix'}},
        {'name': 'div', 'attrs': {'id': 'rating'}},
        {'name': 'div', 'attrs': {'id': 'comments'}},
    ]
    extra_css = (
        '\n'
        'body {font-family: verdana, arial, helvetica, geneva, sans-serif;}\n'
    )

    # --- Sections (title, RSS address) ---------------------------------------
    feeds = [
        (u'Ons Nieuws', u'http://feeds.feedburner.com/halloassen/onsnieuws'),
        (u'Politie', u'http://www.halloassen.nl/rss/?c=37'),
        (u'Rechtbank', u'http://www.halloassen.nl/rss/?c=39'),
        (u'Justitie', u'http://www.halloassen.nl/rss/?c=36'),

        (u'Evenementen', u'http://www.halloassen.nl/rss/?c=34'),
        (u'Cultuur', u'http://www.halloassen.nl/rss/?c=32'),
        (u'Politiek', u'http://www.halloassen.nl/rss/?c=38'),
        (u'Economie', u'http://www.halloassen.nl/rss/?c=33'),
    ]
|
@@ -1,47 +0,0 @@
|
||||
from __future__ import with_statement
|
||||
__license__ = 'GPL 3'
|
||||
__copyright__ = '2009, Kovid Goyal <kovid@kovidgoyal.net>'
|
||||
__docformat__ = 'restructuredtext en'
|
||||
|
||||
from calibre.web.feeds.news import BasicNewsRecipe
|
||||
|
||||
|
||||
class ChicagoTribune(BasicNewsRecipe):
    """Calibre news recipe for The Hartford Courant.

    The class is named ``ChicagoTribune`` although every attribute below
    describes The Hartford Courant; the name is left unchanged here.
    """

    # --- Metadata ---------------------------------------------------------
    __author__ = 'Being and Sujata Raman'
    title = 'The Hartford Courant'
    description = 'Politics, local and business news from Hartford'
    language = 'en'

    # --- Fetching / clean-up ----------------------------------------------
    auto_cleanup = True
    no_stylesheets = True
    remove_javascript = True
    use_embedded_content = False

    # --- Sections (title, RSS address) ------------------------------------
    feeds = [
        # News
        ('Breaking News', 'http://feeds.feedburner.com/courant-breaking-news/'),
        ('Nation/World News', 'http://feeds.feedburner.com/courant-nation-world/'),
        ('Connecticut News', 'http://feeds.feedburner.com/courant-connecticut-news/'),
        ('Hartford News', 'http://feeds.feedburner.com/courant-hartford/'),
        ('West Hartford News', 'http://feeds.feedburner.com/courant-west-hartford/'),
        ('Bristol', 'http://feeds.feedburner.com/courant-bristol/'),
        ('Politics', 'http://feeds.feedburner.com/courant-politics/'),
        # Opinion
        ('Opinion', 'http://feeds.feedburner.com/courant-opinion/'),
        ('Editorials', 'http://feeds.feedburner.com/courant-editorials/'),
        ('Letters', 'http://feeds.feedburner.com/courant-letters/'),
        ('Bob Englehart', 'http://feeds2.feedburner.com/BobEnglehartEnglehartsView'),
        # Business, sports and features
        ('Business', 'http://feeds.feedburner.com/courant-business/'),
        ('Sports', 'http://feeds.feedburner.com/courant-sports/'),
        ('Features', 'http://feeds.feedburner.com/courant-features/'),
        ('Consumer', 'http://feeds.feedburner.com/courant-consumer/'),
        ('Shopping', 'http://feeds.feedburner.com/courant-shopping/'),
        # NOTE(review): the next two labels look swapped relative to their
        # feed slugs (entertainment vs. stage) -- confirm before changing.
        ('Arts & Theater', 'http://feeds.feedburner.com/courant-entertainment/'),
        ('Entertainment', 'http://feeds.feedburner.com/courant-stage/'),
        ('Music', 'http://feeds.feedburner.com/courant-music/'),
        ('TV', 'http://feeds.feedburner.com/courant-tv/'),
        ('Movies', 'http://feeds.feedburner.com/courant-movies/'),
        ('Outdoors', 'http://feeds.feedburner.com/courant-outdoors/'),
        # Columnists
        ('Peter Marteka', 'http://feeds.feedburner.com/courant-marteka-column/'),
        ('Jim Shea', 'http://feeds.feedburner.com/courant-jim-shea-column/'),
        ('Tom Condon', 'http://feeds.feedburner.com/courant-tom-condon-column/'),
        ('Colin McEnroe', 'http://feeds.feedburner.com/courant-colin-mcenroe-column/'),
    ]
|
Binary file not shown.
Before Width: | Height: | Size: 580 B |
Binary file not shown.
Before Width: | Height: | Size: 508 B |
Loading…
x
Reference in New Issue
Block a user