home *** CD-ROM | disk | FTP | other *** search
/ Chip 2011 November / CHIP_2011_11.iso / Programy / Narzedzia / Calibre / calibre-0.8.18.msi / file_280 / jakarta_post.recipe < prev    next >
Text File  |  2011-09-09  |  3KB  |  68 lines

  1. #!/usr/bin/env  python
  2. __license__   = 'GPL v3'
  3. __copyright__ = '2011, Adrian Gunawan <agunawan at adrnalin.com>'
  4. __author__    = 'Adrian Gunawan'
  5. __version__   = 'v1.0'
  6. __date__      = '02 February 2011'
  7.  
  8. '''
  9. http://www.thejakartapost.com/
  10. '''
  11.  
  12. from calibre.web.feeds.news import BasicNewsRecipe
  13.  
  14. class JakartaPost(BasicNewsRecipe):
  15.     title          = u'Jakarta Post'
  16.     masthead_url   = 'http://www.thejakartapost.com/images/jakartapost_logo.jpg'
  17.     cover_url      = 'http://www.thejakartapost.com/images/jakartapost_logo.jpg'
  18.  
  19.     __author__     = u'Adrian Gunawan'
  20.     description    = u'Indonesian Newspaper in English from Jakarta Post Online Edition'
  21.     category       = 'breaking news, national, business, international, Indonesia'
  22.     language       = 'en_ID'
  23.     oldest_article = 2
  24.     max_articles_per_feed = 100
  25.  
  26.     no_stylesheets        = True
  27.     use_embedded_content  = False
  28.     no_javascript         = True
  29.     remove_empty_feeds    = True
  30.  
  31.     timefmt               = ' [%A, %d %B, %Y]'
  32.     encoding              = 'utf-8'
  33.  
  34.     keep_only_tags = [dict(name='div', attrs ={'id':'news-main'})]
  35.  
  36.     extra_css = '''
  37.                   h1{font-family:Georgia,"Times New Roman",Times,serif; font-weight:bold; font-size:large;}
  38.                   .cT-storyDetails{font-family:Arial,Helvetica,sans-serif; color:#666666;font-size:x-small;}
  39.                   .articleBody{font-family:Arial,Helvetica,sans-serif; color:black;font-size:small;}
  40.                   .cT-imageLandscape{font-family:Arial,Helvetica,sans-serif; color:#333333 ;font-size:x-small;}
  41.                   .source{font-family:Arial,Helvetica,sans-serif; color:#333333 ;font-size:xx-small;}
  42.                   #content{font-family:Arial,Helvetica,sans-serif;font-size:x-small;}
  43.                   .pageprint{font-family:Arial,Helvetica,sans-serif;font-size:small;}
  44.                   #bylineDetails{font-family:Arial,Helvetica,sans-serif; color:#666666;font-size:x-small;}
  45.                   .featurePic-wide{font-family:Arial,Helvetica,sans-serif;font-size:x-small;}
  46.                   #idfeaturepic{font-family:Arial,Helvetica,sans-serif;font-size:x-small;}
  47.                   h3{font-family:Georgia,"Times New Roman",Times,serif; font-size:small;}
  48.                   h2{font-family:Georgia,"Times New Roman",Times,serif; font-size:small;}
  49.                   h4{font-family:Georgia,"Times New Roman",Times,serif; font-size:small;}
  50.                   h5{font-family:Georgia,"Times New Roman",Times,serif; font-size:small;}
  51.                   body{font-family:Arial,Helvetica,sans-serif; font-size:x-small;}
  52.                 '''
  53.  
  54.     remove_tags     = [
  55.                         dict(name='div', attrs ={'class':['text-size']}),
  56.                        ]
  57.  
  58.     feeds          = [
  59.  
  60.                       (u'Breaking News', u'http://www.thejakartapost.com/breaking/feed'),
  61.                       (u'National', u'http://www.thejakartapost.com/channel/national/feed'),
  62.                       (u'Archipelago', u'http://www.thejakartapost.com/channel/archipelago/feed'),
  63.                       (u'Business', u'http://www.thejakartapost.com/channel/business/feed'),
  64.                       (u'Jakarta', u'http://www.thejakartapost.com/channel/jakarta/feed'),
  65.                       (u'World', u'http://www.thejakartapost.com/channel/world/feed'),
  66.                       (u'Sports', u'http://www.thejakartapost.com/channel/sports/feed'),
  67.                       ]
  68.