home *** CD-ROM | disk | FTP | other *** search
/ Chip 2011 November / CHIP_2011_11.iso / Programy / Narzedzia / Calibre / calibre-0.8.18.msi / file_280 / european_voice.recipe < prev    next >
Text File  |  2011-09-09  |  3KB  |  52 lines

  1.  
  2. from calibre.web.feeds.news import BasicNewsRecipe
  3.  
  4. class EuropeanVoice(BasicNewsRecipe):
  5.     title          = u'European Voice'
  6.     __author__     = 'malfi'
  7.     oldest_article = 14
  8.     max_articles_per_feed = 100
  9.     no_stylesheets = True
  10.     cover_url = 'http://www.europeanvoice.com/Css/images/logo.gif'
  11.     language = 'en'
  12.     keep_only_tags    = [dict(name='div', attrs={'id':'articleLeftColumn'})]
  13.     remove_tags    = [dict(name='div', attrs={'id':'BreadCrump'})]
  14.     feeds          = [
  15.                         (u'Whole site ',u'http://www.europeanvoice.com/Rss/2.xml'),
  16.                           (u'News and analysis',u'http://www.europeanvoice.com/Rss/6.xml'),
  17.                           (u'Comment',u'http://www.europeanvoice.com/Rss/7.xml'),
  18.                           (u'Special reports',u'http://www.europeanvoice.com/Rss/5.xml'),
  19.                           (u'People',u'http://www.europeanvoice.com/Rss/8.xml'),
  20.                           (u'Career',u'http://www.europeanvoice.com/Rss/11.xml'),
  21.                           (u'Policies',u'http://www.europeanvoice.com/Rss/4.xml'),
  22.                           (u'EVents',u'http://www.europeanvoice.com/Rss/10.xml'),
  23.                           (u'Policies - Economics',u'http://www.europeanvoice.com/Rss/31.xml'),
  24.                           (u'Policies - Business',u'http://www.europeanvoice.com/Rss/19.xml'),
  25.                           (u'Policies - Trade',u'http://www.europeanvoice.com/Rss/25.xml'),
  26.                           (u'Policies - Information society',u'http://www.europeanvoice.com/Rss/20.xml'),
  27.                           (u'Policies - Energy',u'http://www.europeanvoice.com/Rss/15.xml'),
  28.                           (u'Policies - Transport',u'http://www.europeanvoice.com/Rss/18.xml'),
  29.                           (u'Policies - Climate change',u'http://www.europeanvoice.com/Rss/16.xml'),
  30.                           (u'Policies - Environment',u'http://www.europeanvoice.com/Rss/17.xml'),
  31.                           (u'Policies - Farming & food',u'http://www.europeanvoice.com/Rss/23.xml'),
  32.                           (u'Policies - Health & society',u'http://www.europeanvoice.com/Rss/24.xml'),
  33.                           (u'Policies - Justice',u'http://www.europeanvoice.com/Rss/29.xml'),
  34.                           (u'Policies - Foreign affairs',u'http://www.europeanvoice.com/Rss/27.xml')
  35.                      ]
  36.     extra_css = '''
  37.         h1{font-family:Arial,Helvetica,sans-serif; font-weight:bold;font-size:large;}
  38.         h2{font-family:Arial,Helvetica,sans-serif; font-weight:normal;font-size:small;}
  39.         p{font-family:Arial,Helvetica,sans-serif;font-size:small;}
  40.         body{font-family:Helvetica,Arial,sans-serif;font-size:small;}
  41.         '''
  42.  
  43.     def print_version(self, url):
  44.           return url + '?bPrint=1'
  45.  
  46.     def preprocess_html(self, soup):
  47.            denied = soup.findAll(True,text='Subscribers')
  48.            if denied:
  49.                 raise Exception('Article skipped, because content can only be seen with subscription')
  50.            return soup
  51.  
  52.