home *** CD-ROM | disk | FTP | other *** search
/ Chip 2011 November / CHIP_2011_11.iso / Programy / Narzedzia / Calibre / calibre-0.8.18.msi / file_280 / descopera.recipe < prev    next >
Text File  |  2011-09-09  |  2KB  |  58 lines

  1. # -*- coding: utf-8 -*-
  2. #!/usr/bin/env  python
  3.  
  4. __license__   = 'GPL v3'
  5. __copyright__ = u'2011, Silviu Cotoar\u0103'
  6. '''
  7. descopera.ro
  8. '''
  9.  
  10. from calibre.web.feeds.news import BasicNewsRecipe
  11.  
  12. class Descopera(BasicNewsRecipe):
  13.     title                       = u'Descoper\u0103'
  14.     __author__          = u'Silviu Cotoar\u0103'
  15.     description             = 'E lumea ta'
  16.     publisher                   = 'Descopera'
  17.     oldest_article              = 5
  18.     language                    = 'ro'
  19.     max_articles_per_feed = 100
  20.     no_stylesheets          = True
  21.     use_embedded_content  = False
  22.     category                  = 'Ziare,Reviste,Descopera'
  23.     encoding                = 'utf-8'
  24.     cover_url     = 'http://www.descopera.ro/images/header_images/logo.gif'
  25.  
  26.     conversion_options = {
  27.                              'comments'  : description
  28.                             ,'tags'           : category
  29.                             ,'language'    : language
  30.                 ,'publisher'   : publisher
  31.                          }
  32.  
  33.  
  34.     keep_only_tags = [
  35.         dict(name='h1', attrs={'style':'font-family: Arial,Helvetica,sans-serif; font-size: 18px; color: rgb(51, 51, 51); font-weight: bold; margin: 10px 0pt; clear: both; float: left;width: 610px;'})
  36.         ,dict(name='div', attrs={'style':'margin-right: 15px; margin-bottom: 15px; float: left;'})
  37.         , dict(name='p', attrs={'id':'itemDescription'})
  38.         ,dict(name='div', attrs={'id':'itemBody'})
  39.                  ]
  40.  
  41.     remove_tags = [
  42.              dict(name='div', attrs={'class':['tools']})
  43.            , dict(name='div', attrs={'class':['share']})
  44.            , dict(name='div', attrs={'class':['category']})
  45.            , dict(name='div', attrs={'id':['comments']})
  46.                           ]
  47.  
  48.     remove_tags_after = [
  49.                dict(name='div', attrs={'id':'comments'})
  50.            ]
  51.  
  52.     feeds          = [
  53.         (u'Feeds', u'http://www.descopera.ro/rss')
  54.                      ]
  55.  
  56.     def preprocess_html(self, soup):
  57.         return self.adeify_images(soup)
  58.