mirror of
				https://github.com/kovidgoyal/calibre.git
				synced 2025-10-24 23:38:55 -04:00 
			
		
		
		
	
		
			
				
	
	
		
			70 lines
		
	
	
		
			2.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			70 lines
		
	
	
		
			2.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| #!/usr/bin/env python
 | |
| 
 | |
| __license__ = 'GPL v3'
 | |
| __copyright__ = '2009, Darko Miletic <darko.miletic at gmail.com>'
 | |
| 
 | |
| '''
 | |
| www.vecernji.hr
 | |
| '''
 | |
| 
 | |
| import re
 | |
| 
 | |
| from calibre.ebooks.BeautifulSoup import Tag
 | |
| from calibre.web.feeds.recipes import BasicNewsRecipe
 | |
| 
 | |
| 
 | |
| def new_tag(soup, name, attrs=()):
 | |
|     impl = getattr(soup, 'new_tag', None)
 | |
|     if impl is not None:
 | |
|         return impl(name, attrs=dict(attrs))
 | |
|     return Tag(soup, name, attrs=attrs or None)
 | |
| 
 | |
| 
 | |
| class VecernjiList(BasicNewsRecipe):
 | |
|     title = 'Vecernji List'
 | |
|     __author__ = 'Darko Miletic'
 | |
|     description = 'Vecernji.hr je vodeci hrvatski news portal. Cilj je biti prvi u objavljivanju svih vijesti iz Hrvatske, svijeta, sporta, gospodarstva, showbiza i jos mnogo vise. Uz cjelodnevni rad, novinari objavljuju preko 300 raznih vijesti svakoga dana. Vecernji.hr prati sve vaznije dogadaje specijalnim izvjestajima, video specijalima i foto galerijama.'  # noqa: E501
 | |
|     publisher = 'Vecernji.hr'
 | |
|     category = 'news, politics, Croatia'
 | |
|     oldest_article = 2
 | |
|     max_articles_per_feed = 100
 | |
|     delay = 1
 | |
|     no_stylesheets = True
 | |
|     encoding = 'utf-8'
 | |
|     use_embedded_content = False
 | |
|     language = 'hr'
 | |
| 
 | |
|     lang = 'hr-HR'
 | |
|     direction = 'ltr'
 | |
| 
 | |
|     extra_css = '@font-face {font-family: "serif1";src:url(res:///opt/sony/ebook/FONT/tt0011m_.ttf)} body{font-family: serif1, serif} .article_description{font-family: serif1, serif}'  # noqa: E501
 | |
| 
 | |
|     conversion_options = {
 | |
|         'comment': description, 'tags': category, 'publisher': publisher, 'language': lang, 'pretty_print': True
 | |
|     }
 | |
| 
 | |
|     preprocess_regexps = [(re.compile(u'\u0110'), lambda match: u'\u00D0')]  # noqa: RUF039
 | |
| 
 | |
|     remove_tags = [
 | |
|         dict(name=['object', 'link', 'embed']), dict(
 | |
|             name='table', attrs={'class': 'enumbox'})
 | |
|     ]
 | |
| 
 | |
|     feeds = [(u'Vijesti', u'http://www.vecernji.hr/rss/')]
 | |
| 
 | |
|     def preprocess_html(self, soup):
 | |
|         soup.html['lang'] = self.lang
 | |
|         soup.html['dir'] = self.direction
 | |
| 
 | |
|         mlang = new_tag(soup, 'meta', [
 | |
|                     ('http-equiv', 'Content-Language'), ('content', self.lang)])
 | |
|         mcharset = new_tag(soup, 'meta', [
 | |
|                        ('http-equiv', 'Content-Type'), ('content', 'text/html; charset=UTF-8')])
 | |
|         soup.head.insert(0, mlang)
 | |
|         soup.head.insert(1, mcharset)
 | |
|         return self.adeify_images(soup)
 | |
| 
 | |
|     def print_version(self, url):
 | |
|         artid = url.rpartition('-')[2]
 | |
|         return 'http://www.vecernji.hr/index.php?cmd=show_clanak&action=print_popup&clanak_id=' + artid
 |