home *** CD-ROM | disk | FTP | other *** search
/ Chip 2011 November / CHIP_2011_11.iso / Programy / Narzedzia / Calibre / calibre-0.8.18.msi / file_280 / cotidianul.recipe < prev    next >
Text File  |  2011-09-09  |  3KB  |  70 lines

  1. # -*- coding: utf-8 -*-
  2. #!/usr/bin/env  python
  3.  
  4. __license__   = 'GPL v3'
  5. __copyright__ = u'2011, Silviu Cotoar\u0103'
  6. '''
  7. cotidianul.ro
  8. '''
  9.  
  10. from calibre.web.feeds.news import BasicNewsRecipe
  11.  
  12. class Cotidianul(BasicNewsRecipe):
  13.     title                 = u'Cotidianul'
  14.     __author__            = u'Silviu Cotoar\u0103'
  15.     description           = u''
  16.     publisher             = u'Cotidianul'
  17.     oldest_article        = 25
  18.     language              = 'ro'
  19.     max_articles_per_feed = 100
  20.     no_stylesheets        = True
  21.     use_embedded_content  = False
  22.     category              = 'Ziare,Stiri'
  23.     encoding              = 'utf-8'
  24.     cover_url             = 'http://www.cotidianul.ro/images/cotidianul.png'
  25.  
  26.     conversion_options = {
  27.                              'comments'   : description
  28.                             ,'tags'       : category
  29.                             ,'language'   : language
  30.                             ,'publisher'  : publisher
  31.                          }
  32.  
  33.     extra_css = '''
  34.                     h1{font-family:Arial,Helvetica,sans-serif; font-weight:bold;font-size:large;}
  35.                     h2{font-family:Arial,Helvetica,sans-serif; font-weight:normal;font-size:small;}
  36.                     .byline {font-family:Arial,Helvetica,sans-serif; font-size:xx-small;}
  37.                     .date {font-family:Arial,Helvetica,sans-serif; font-size:xx-small;}
  38.                     p{font-family:Arial,Helvetica,sans-serif;font-size:small;}
  39.                     .copyright {font-family:Arial,Helvetica,sans-serif;font-size:xx-small;text-align:center}
  40.                     .story{font-family:Arial,Helvetica,sans-serif;font-size:small;}
  41.                     .entry-asset asset hentry{font-family:Arial,Helvetica,sans-serif;font-size:small;}
  42.                     .pagebody{font-family:Arial,Helvetica,sans-serif;font-size:small;}
  43.                     .maincontentcontainer{font-family:Arial,Helvetica,sans-serif;font-size:small;}
  44.                     .story-body{font-family:Arial,Helvetica,sans-serif;font-size:small;}
  45.                     body{font-family:Helvetica,Arial,sans-serif;font-size:small;}
  46.                 '''
  47.  
  48.     keep_only_tags = [
  49.                           dict(name='div', attrs={'class':'titlu'})
  50.                         , dict(name='div', attrs={'class':'gallery clearfix'})
  51.                         , dict(name='div', attrs={'align':'justify'})
  52.                      ]
  53.  
  54.     remove_tags = [
  55.                           dict(name='div', attrs={'class':['space']})
  56.                         , dict(name='div', attrs={'id':['title_desc']})
  57.                   ]
  58.  
  59.     remove_tags_after = [
  60.                               dict(name='div', attrs={'class':['space']})
  61.                             , dict(name='span', attrs={'class':['date']})
  62.                         ]
  63.  
  64.     feeds          = [
  65.                         (u'Feeds', u'http://www.cotidianul.ro/rssfeed/ToateStirile.xml')
  66.                      ]
  67.  
  68.     def preprocess_html(self, soup):
  69.         return self.adeify_images(soup)
  70.