mirror of
				https://github.com/kovidgoyal/calibre.git
				synced 2025-10-25 07:48:55 -04:00 
			
		
		
		
	
		
			
				
	
	
		
			54 lines
		
	
	
		
			1.7 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
			
		
		
	
	
			54 lines
		
	
	
		
			1.7 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
| # -*- coding: utf-8 -*-
 | |
| #!/usr/bin/env  python
 | |
| 
 | |
| __license__   = 'GPL v3'
 | |
| __copyright__ = u'2011, Silviu Cotoar\u0103'
 | |
| '''
 | |
| divahair.ro
 | |
| '''
 | |
| 
 | |
| from calibre.web.feeds.news import BasicNewsRecipe
 | |
| 
 | |
class DivaHair(BasicNewsRecipe):
    # Calibre news recipe for divahair.ro (content language code: 'ro').

    # --- Publication metadata -------------------------------------------
    title = u'Diva Hair'
    __author__ = u'Silviu Cotoar\u0103'
    publisher = u'Diva Hair'
    description = u'Coafuri, frizuri, tunsori ..'
    category = u'Ziare,Stiri,Coafuri,Femei'
    language = 'ro'
    cover_url = 'http://www.divahair.ro/imgs/logo.jpg'

    # --- Download behaviour ---------------------------------------------
    encoding = 'utf-8'
    oldest_article = 5
    max_articles_per_feed = 100
    use_embedded_content = False
    no_stylesheets = True
    remove_javascript = True

    # Single feed: (section title, feed URL).
    feeds = [
        (u'\u0218tiri', u'http://www.divahair.ro/feed'),
    ]

    # The metadata above is forwarded to the conversion step, so this
    # mapping must be defined after the attributes it reads.
    conversion_options = {
        'comments': description,
        'tags': category,
        'language': language,
        'publisher': publisher,
    }

    # --- Page clean-up rules --------------------------------------------
    # Tag selectors for the elements holding the article; both a <td> and
    # a <div> carrying the 'spatiuart' class are listed.
    keep_only_tags = [
        dict(name='td', attrs={'class': 'spatiuart'}),
        dict(name='div', attrs={'class': 'spatiuart'}),
    ]

    # Tag selectors for elements stripped from the kept content.
    remove_tags = [
        dict(name='div', attrs={'class': 'categorie'}),
        dict(name='div', attrs={'class': 'gri gri2 detaliiart'}),
        dict(name='div', attrs={'class': 'articol_box_bottom'}),
    ]

    # Selector marking the bottom article box; it is also listed in
    # remove_tags above.
    remove_tags_after = [
        dict(name='div', attrs={'class': 'articol_box_bottom'}),
    ]

    def preprocess_html(self, soup):
        """Return ``soup`` after passing it through ``adeify_images``.

        ``adeify_images`` is not defined in this class (presumably inherited
        from ``BasicNewsRecipe``); its result is returned unchanged.
        """
        adjusted_soup = self.adeify_images(soup)
        return adjusted_soup
 |