home *** CD-ROM | disk | FTP | other *** search
/ Chip 2011 November / CHIP_2011_11.iso / Programy / Narzedzia / Calibre / calibre-0.8.18.msi / file_280 / orlando_sentinel.recipe < prev    next >
Text File  |  2011-09-09  |  2KB  |  39 lines

  1. from calibre.web.feeds.news import BasicNewsRecipe
  2.  
  3. class AdvancedUserRecipe1279258912(BasicNewsRecipe):
  4.     title          = u'Orlando Sentinel'
  5.     oldest_article = 3
  6.     max_articles_per_feed = 100
  7.  
  8.     feeds          = [
  9.     (u'News', u'http://feeds.feedburner.com/orlandosentinel/news'),
  10.     (u'Opinion', u'http://feeds.feedburner.com/orlandosentinel/news/opinion'),
  11.     (u'Business', u'http://feeds.feedburner.com/orlandosentinel/business'),
  12.     (u'Technology', u'http://feeds.feedburner.com/orlandosentinel/technology'),
  13.     (u'Space and Science', u'http://feeds.feedburner.com/orlandosentinel/news/space'),
  14.     (u'Entertainment', u'http://feeds.feedburner.com/orlandosentinel/entertainment'),
  15.     (u'Life and Family', u'http://feeds.feedburner.com/orlandosentinel/features/lifestyle'),
  16.     ]
  17.     __author__ = 'rty'
  18.     pubisher  = 'OrlandoSentinel.com'
  19.     description           = 'Orlando, Florida, Newspaper'
  20.     category              = 'News, Orlando, Florida'
  21.  
  22.  
  23.     remove_javascript = True
  24.     use_embedded_content   = False
  25.     no_stylesheets = True
  26.     language = 'en'
  27.     encoding               = 'utf-8'
  28.     conversion_options = {'linearize_tables':True}
  29.     masthead_url = 'http://www.orlandosentinel.com/media/graphic/2009-07/46844851.gif'
  30.     keep_only_tags = [
  31.                               dict(name='div', attrs={'class':'story'})
  32.                                ]
  33.     remove_tags = [
  34.                   dict(name='div', attrs={'class':['articlerail','tools','comment-group','clearfix']}),
  35.                          ]
  36.     remove_tags_after = [
  37.                   dict(name='p', attrs={'class':'copyright'}),
  38.                          ]
  39.