mirror of
https://github.com/kovidgoyal/calibre.git
synced 2025-06-23 15:30:45 -04:00
86 lines
3.8 KiB
Python
86 lines
3.8 KiB
Python
#!/usr/bin/env python
|
|
__license__ = 'GPL v3'
|
|
__copyright__ = '2011, Adrian Gunawan <agunawan at adrnalin.com>'
|
|
__author__ = 'Adrian Gunawan'
|
|
__version__ = 'v1.0'
|
|
__date__ = '02 February 2011'
|
|
|
|
'''
|
|
http://www.kompas.com/
|
|
'''
|
|
|
|
import re
|
|
from calibre.web.feeds.news import BasicNewsRecipe
|
|
|
|
|
|
class Kompas(BasicNewsRecipe):
|
|
title = u'Kompas'
|
|
masthead_url = 'http://stat.k.kidsklik.com/data/2k10/kompascom2011/images/logo_kompas.png'
|
|
cover_url = 'http://stat.k.kidsklik.com/data/2k10/kompascom2011/images/logo_kompas.png'
|
|
|
|
__author__ = u'Adrian Gunawan'
|
|
description = u'Indonesian News from Kompas Online Edition'
|
|
category = 'local news, international, business, Indonesia'
|
|
language = 'id'
|
|
oldest_article = 5
|
|
max_articles_per_feed = 100
|
|
|
|
no_stylesheets = True
|
|
use_embedded_content = False
|
|
no_javascript = True
|
|
remove_empty_feeds = True
|
|
|
|
timefmt = ' [%A, %d %B, %Y]'
|
|
encoding = 'utf-8'
|
|
|
|
keep_only_tags = [dict(name='div', attrs={'class': 'content_kiri_detail'})]
|
|
|
|
extra_css = '''
|
|
h1{font-family:Georgia,"Times New Roman",Times,serif; font-weight:bold; font-size:large;}
|
|
.cT-storyDetails{font-family:Arial,Helvetica,sans-serif; color:#666666;font-size:x-small;}
|
|
.articleBody{font-family:Arial,Helvetica,sans-serif; color:black;font-size:small;}
|
|
.cT-imageLandscape{font-family:Arial,Helvetica,sans-serif; color:#333333 ;font-size:x-small;}
|
|
.source{font-family:Arial,Helvetica,sans-serif; color:#333333 ;font-size:xx-small;}
|
|
#content{font-family:Arial,Helvetica,sans-serif;font-size:x-small;}
|
|
.pageprint{font-family:Arial,Helvetica,sans-serif;font-size:small;}
|
|
#bylineDetails{font-family:Arial,Helvetica,sans-serif; color:#666666;font-size:x-small;}
|
|
.featurePic-wide{font-family:Arial,Helvetica,sans-serif;font-size:x-small;}
|
|
#idfeaturepic{font-family:Arial,Helvetica,sans-serif;font-size:x-small;}
|
|
h3{font-family:Georgia,"Times New Roman",Times,serif; font-size:small;}
|
|
h2{font-family:Georgia,"Times New Roman",Times,serif; font-size:small;}
|
|
h4{font-family:Georgia,"Times New Roman",Times,serif; font-size:small;}
|
|
h5{font-family:Georgia,"Times New Roman",Times,serif; font-size:small;}
|
|
body{font-family:Arial,Helvetica,sans-serif; font-size:x-small;}
|
|
'''
|
|
|
|
remove_tags = [
|
|
dict(name='div', attrs={'class': [
|
|
'c_biru_kompas2011', 'c_abu01_kompas2011', 'c_abu_01_kompas2011', 'right', 'clearit']}),
|
|
dict(name='div', attrs={
|
|
'id': ['comment_list', 'comment_paging', 'share']}),
|
|
dict(name='form'),
|
|
dict(name='ul'),
|
|
]
|
|
|
|
preprocess_regexps = [
|
|
(re.compile(r'<!--TERKAIT -->.*<!--TERKAIT END -->',
|
|
re.DOTALL | re.IGNORECASE), lambda match: ''),
|
|
(re.compile(r'<strong>Sent Using.*</body>',
|
|
re.DOTALL | re.IGNORECASE), lambda match: ''),
|
|
(re.compile(r'<strong>Kirim Komentar Anda</strong>',
|
|
re.DOTALL | re.IGNORECASE), lambda match: ''),
|
|
(re.compile(r'<a[^>]*>Kembali ke Index Topik Pilihan</a>',
|
|
re.DOTALL | re.IGNORECASE), lambda match: ''),
|
|
]
|
|
|
|
feeds = [
|
|
(u'Nasional', u'http://www.kompas.com/getrss/nasional'),
|
|
(u'Regional', u'http://www.kompas.com/getrss/regional'),
|
|
(u'Internasional', u'http://www.kompas.com/getrss/internasional'),
|
|
(u'Megapolitan', u'http://www.kompas.com/getrss/megapolitan'),
|
|
(u'Bisnis Keuangan',
|
|
u'http://www.kompas.com/getrss/bisniskeuangan'),
|
|
(u'Kesehatan', u'http://www.kompas.com/getrss/kesehatan'),
|
|
(u'Olahraga', u'http://www.kompas.com/getrss/olahraga'),
|
|
]
|