home *** CD-ROM | disk | FTP | other *** search
/ Chip 2011 November / CHIP_2011_11.iso / Programy / Narzedzia / Calibre / calibre-0.8.18.msi / file_280 / film_web.recipe < prev    next >
Text File  |  2011-09-09  |  3KB  |  41 lines

  1. from calibre.web.feeds.news import BasicNewsRecipe
  2.  
  3. class Filmweb_pl(BasicNewsRecipe):
  4.     title          = u'FilmWeb'
  5.     __author__        = 'fenuks'
  6.     description   = 'FilmWeb - biggest polish movie site'
  7.     cover_url      = 'http://userlogos.org/files/logos/crudus/filmweb.png'
  8.     category       = 'movies'
  9.     language       = 'pl'
  10.     oldest_article = 8
  11.     max_articles_per_feed = 100
  12.     no_stylesheets= True
  13.     extra_css      = '.hdrBig {font-size:22px;}'
  14.     remove_tags= [dict(name='div', attrs={'class':['recommendOthers']}), dict(name='ul', attrs={'class':'fontSizeSet'})]
  15.     keep_only_tags= [dict(name='h1', attrs={'class':'hdrBig'}), dict(name='div', attrs={'class':['newsInfo', 'reviewContent fontSizeCont description']})]
  16.     feeds          = [(u'Wszystkie newsy', u'http://www.filmweb.pl/feed/news/latest'),
  17.                          (u'News / Filmy w produkcji', 'http://www.filmweb.pl/feed/news/category/filminproduction'),
  18.                          (u'News / Festiwale, nagrody i przegl─àdy', u'http://www.filmweb.pl/feed/news/category/festival'),
  19.                          (u'News / Seriale', u'http://www.filmweb.pl/feed/news/category/serials'),
  20.                          (u'News / Box office', u'http://www.filmweb.pl/feed/news/category/boxoffice'),
  21.                          (u'News / Multimedia', u'http://www.filmweb.pl/feed/news/category/multimedia'),
  22.                          (u'News / Dystrybucja dvd / blu-ray', u'http://www.filmweb.pl/feed/news/category/video'),
  23.                          (u'News / Dystrybucja kinowa', u'http://www.filmweb.pl/feed/news/category/cinema'),
  24.                          (u'News / off', u'http://www.filmweb.pl/feed/news/category/off'),
  25.                          (u'News / Gry wideo', u'http://www.filmweb.pl/feed/news/category/game'),
  26.                          (u'News / Organizacje bran┼╝owe', u'http://www.filmweb.pl/feed/news/category/organizations'),
  27.                          (u'News / Internet', u'http://www.filmweb.pl/feed/news/category/internet'),
  28.                          (u'News / R├│┼╝ne', u'http://www.filmweb.pl/feed/news/category/other'),
  29.                          (u'News / Kino polskie', u'http://www.filmweb.pl/feed/news/category/polish.cinema'),
  30.                          (u'News / Telewizja', u'http://www.filmweb.pl/feed/news/category/tv'),
  31.                          (u'Recenzje redakcji', u'http://www.filmweb.pl/feed/reviews/latest'),
  32.                          (u'Recenzje u┼╝ytkownik├│w', u'http://www.filmweb.pl/feed/user-reviews/latest')]
  33.  
  34.     def skip_ad_pages(self, soup):   
  35.         skip_tag = soup.find('a', attrs={'class':'welcomeScreenButton'})
  36.         if skip_tag is not None:
  37.             self.log.warn('skip_tag')
  38.             self.log.warn(skip_tag)
  39.             return self.index_to_soup(skip_tag['href'], raw=True)
  40.         
  41.