home *** CD-ROM | disk | FTP | other *** search
/ Chip 2011 November / CHIP_2011_11.iso / Programy / Narzedzia / Calibre / calibre-0.8.18.msi / file_280 / ntv_tr.recipe < prev    next >
Text File  |  2011-09-09  |  2KB  |  46 lines

  1. from calibre.web.feeds.news import BasicNewsRecipe
  2.  
  3. class NTVMSNBC(BasicNewsRecipe):
  4.     title          = u'NTV'
  5.     __author__            = 'A Erdogan'
  6.     description           = 'News from Turkey'
  7.     publisher             = 'NTV'
  8.     category              = 'news, politics, Turkey'
  9.     oldest_article        = 7
  10.     max_articles_per_feed = 100
  11.     no_stylesheets        = True
  12.     use_embedded_content  = False
  13.     masthead_url          = 'http://www.ntvmsnbc.com/images/MSNBC/msnbc_ban.gif'
  14.     language              = 'tr'
  15.  
  16.  
  17.     remove_tags_before = dict(name='h1')
  18.     remove_tags_after = dict(attrs={'id':'haberDetayYazi'})
  19.     extra_css             ='''
  20.                         body{font-family:Arial,Helvetica,sans-serif; font-size:small; align:left;  color:#000000}
  21.                         h1{font-size:large; color:#000000}
  22.          h2{font-size:small; color:#000000}
  23.         p{font-size:small; color:#000000}
  24.                      '''
  25.  
  26.     conversion_options = {
  27.                           'comment'   : description
  28.                         , 'tags'      : category
  29.                         , 'publisher' : publisher
  30.                         , 'language'  : language
  31.                         }
  32.  
  33.     remove_tags = [dict(name=['embed','il','ul','iframe','object','link','base']), dict(name='div', attrs={'style':['padding: 0pt 10px 10px;']}), dict(name='div', attrs={'style':['padding: 0pt 10px 10px;']}),  dict(name='div', attrs={'class':['textSmallGrey w320']}), dict(name='div', attrs={'style':['font-family:Arial; font-size:16px;font-weight:bold; font-color:#003366; margin-bottom:20px; margin-top:20px; border-bottom:solid 1px;border-color: #CCC; padding-bottom:2px;']})]
  34.     remove_tags_before = dict(name='h1')
  35.     remove_tags_after = dict(name='div', attrs={'style':['font-family:Arial; font-size:16px;font-weight:bold; font-color:#003366; margin-bottom:20px; margin-top:20px; border-bottom:solid 1px;border-color: #CCC; padding-bottom:2px;']})
  36.  
  37.     feeds          = [(u'NTV', u'http://www.ntvmsnbc.com/id/3032091/device/rss/rss.xml')]
  38.  
  39.     def print_version(self, url):
  40.         articleid = url.rpartition('/id/')[2]
  41.         return 'http://www.ntvmsnbc.com/id/' + articleid + '/print/1/displaymode/1098/'
  42.  
  43.     def preprocess_html(self, soup):
  44.         return self.adeify_images(soup)
  45.  
  46.