home *** CD-ROM | disk | FTP | other *** search
/ Chip 2011 November / CHIP_2011_11.iso / Programy / Narzedzia / Calibre / calibre-0.8.18.msi / file_280 / idg_now.recipe < prev    next >
Text File  |  2011-09-09  |  2KB  |  44 lines

  1. from calibre.web.feeds.news import BasicNewsRecipe
  2.  
  3. class IDGNow(BasicNewsRecipe):
  4.     title                  = 'IDG Now!'
  5.     __author__             = 'Diniz Bortolotto'
  6.     description            = 'Posts do IDG Now!'
  7.     oldest_article         = 7
  8.     max_articles_per_feed  = 20
  9.     encoding               = 'utf8'
  10.     publisher              = 'Now!Digital Business Ltda.'
  11.     category               = 'technology, telecom, IT, Brazil'
  12.     language               = 'pt_BR'
  13.     publication_type       = 'technology portal'
  14.     use_embedded_content   = False
  15.     extra_css              = '.headline {font-size: x-large;} \n .fact { padding-top: 10pt  }'
  16.  
  17.     def get_article_url(self, article):
  18.        link = article.get('link', None)
  19.        if link is None:
  20.            return article
  21.        if link.split('/')[-1]=="story01.htm":
  22.            link=link.split('/')[-2]
  23.            a=['0B','0C','0D','0E','0F','0G','0I','0N'  ,'0L0S','0A','0J3A']
  24.            b=['.' ,'/' ,'?' ,'-' ,'=' ,'&' ,'_','.com','www.','0',':']
  25.            for i in range(0,len(a)):
  26.               link=link.replace(a[i],b[i])
  27.            link=link.split('&')[-3]
  28.            link=link.split('=')[1]
  29.            link=link + "/IDGNoticiaPrint_view"
  30.        return link
  31.  
  32.     feeds                  = [
  33.                               (u'Ultimas noticias', u'http://rss.idgnow.com.br/c/32184/f/499640/index.rss'),
  34.                               (u'Computa\xe7\xe3o Corporativa', u'http://rss.idgnow.com.br/c/32184/f/499643/index.rss'),
  35.                               (u'Carreira', u'http://rss.idgnow.com.br/c/32184/f/499644/index.rss'),
  36.                               (u'Computa\xe7\xe3o Pessoal', u'http://rss.idgnow.com.br/c/32184/f/499645/index.rss'),
  37.                               (u'Internet', u'http://rss.idgnow.com.br/c/32184/f/499646/index.rss'),
  38.                               (u'Mercado', u'http://rss.idgnow.com.br/c/32184/f/419982/index.rss'),
  39.                               (u'Seguran\xe7a', u'http://rss.idgnow.com.br/c/32184/f/499647/index.rss'),
  40.                               (u'Telecom e Redes', u'http://rss.idgnow.com.br/c/32184/f/499648/index.rss')
  41.                              ]
  42.  
  43.     reverse_article_order  = True
  44.