home *** CD-ROM | disk | FTP | other *** search
/ Chip 2011 November / CHIP_2011_11.iso / Programy / Narzedzia / Calibre / calibre-0.8.18.msi / file_280 / anchorage_daily.recipe < prev    next >
Encoding:
Text File  |  2011-09-09  |  1.6 KB  |  41 lines

  1. from calibre.web.feeds.news import BasicNewsRecipe
  2.  
  3. class AdvancedUserRecipe1278347258(BasicNewsRecipe):
  4.     title          = u'Anchorage Daily News'
  5.     __author__ = 'rty'
  6.     oldest_article = 7
  7.     max_articles_per_feed = 100
  8.  
  9.     feeds          = [(u'Alaska News', u'http://www.adn.com/news/alaska/index.xml'),
  10.     (u'Business', u'http://www.adn.com/money/index.xml'),
  11.     (u'Sports', u'http://www.adn.com/sports/index.xml'),
  12.     (u'Politics', u'http://www.adn.com/politics/index.xml'),
  13.     (u'Lifestyles', u'http://www.adn.com/life/index.xml'),
  14.     (u'Iditarod', u'http://www.adn.com/iditarod/index.xml')
  15.     ]
  16.     description           = ''''Alaska's Newspaper'''
  17.     publisher             = 'http://www.adn.com'
  18.     category              = 'news, Alaska, Anchorage'
  19.     language = 'en'
  20.     extra_css = '''
  21.                 p{font-weight: normal;text-align: justify}
  22.                '''
  23.     remove_javascript = True
  24.     use_embedded_content   = False
  25.     no_stylesheets = True
  26.     language = 'en'
  27.     encoding               = 'latin-1'
  28.     conversion_options = {'linearize_tables':True}
  29.     masthead_url = 'http://media.adn.com/includes/assets/images/adn_logo.2.gif'
  30.  
  31.     keep_only_tags = [
  32.                               dict(name='div', attrs={'class':'left_col story_mainbar'}),
  33.                                ]
  34.     remove_tags = [
  35.                               dict(name='div', attrs={'class':'story_tools'}),
  36.                               dict(name='p', attrs={'class':'ad_label'}),
  37.                                ]
  38.     remove_tags_after = [
  39.                               dict(name='div', attrs={'class':'advertisement'}),
  40.                                ]
  41.