home *** CD-ROM | disk | FTP | other *** search
Wrap
# -*- coding: utf-8 -*-
from calibre.web.feeds.news import BasicNewsRecipe


class TodaysZaman_en(BasicNewsRecipe):
    """Calibre recipe that downloads the magazine named in ``title``.

    Articles are taken from the single RSS feed listed in ``feeds``.
    All behaviour is configured through the class attributes below; no
    ``BasicNewsRecipe`` methods are overridden.

    NOTE(review): the class name does not match the publication in
    ``title``; it looks inherited from a Today's Zaman recipe. It is kept
    unchanged so that anything referring to the recipe by class name
    keeps working.
    """

    title = u'Sızıntı Dergisi'
    __author__ = u'thomass'
    # NOTE(review): this text describes an English-language daily, while
    # ``category``/``publication_type`` below describe a Turkish magazine.
    # Presumably copied from another recipe -- confirm and replace.
    description = 'a Turkey based daily for national and international news in the fields of business, diplomacy, politics, culture, arts, sports and economics, in addition to commentaries, specials and features'

    # Feed limits.
    oldest_article = 30
    max_articles_per_feed = 80

    no_stylesheets = True
    # delay = 1
    # use_embedded_content = False
    encoding = 'utf-8'

    # Metadata.
    # publisher = ' '
    category = 'dergi, ilim, kültür, bilim,Türkçe'
    language = 'tr'
    publication_type = 'magazine'

    # extra_css = ' body{ font-family: Verdana,Helvetica,Arial,sans-serif } .introduction{font-weight: bold} .story-feature{display: block; padding: 0; border: 1px solid; width: 40%; font-size: small} .story-feature h2{text-align: center; text-transform: uppercase} '
    # keep_only_tags = [dict(name='h1', attrs={'class':['georgia_30']})]
    # remove_attributes = ['aria-describedby']
    # remove_tags = [dict(name='div', attrs={'id':['renk10']}) ]

    cover_img_url = 'http://www.sizinti.com.tr/images/sizintiprint.jpg'
    # BasicNewsRecipe looks up the cover via ``cover_url``; the
    # ``cover_img_url`` name above is not read by the base class, so the
    # cover was never applied. The old name is kept for compatibility.
    cover_url = cover_img_url
    masthead_url = 'http://www.sizinti.com.tr/images/sizintiprint.jpg'

    # Strip everything that precedes the element with id="content-right".
    remove_tags_before = dict(id='content-right')

    # remove_empty_feeds= True
    # remove_attributes = ['width','height']

    feeds = [
        (u'Sızıntı', u'http://www.sizinti.com.tr/rss'),
    ]

    # def preprocess_html(self, soup):
    #     return self.adeify_images(soup)

    # def print_version(self, url):  # there is a problem caused by table format
    #     return url.replace('http://www.todayszaman.com/newsDetail_getNewsById.action?load=detay&', 'http://www.todayszaman.com/newsDetail_openPrintPage.action?')