home
***
CD-ROM
|
disk
|
FTP
|
other
***
search
/
Chip 2011 November
/
CHIP_2011_11.iso
/
Programy
/
Narzedzia
/
Calibre
/
calibre-0.8.18.msi
/
file_280
/
samanyolu_haber.recipe
< prev
next >
Wrap
Text File
|
2011-09-09
|
4KB
|
64 lines
# -*- coding: utf-8 -*-
from calibre.web.feeds.news import BasicNewsRecipe
class SHaber (BasicNewsRecipe):
    """Calibre news recipe for the Turkish news site Samanyolu Haber.

    Articles are pulled from the RSS feeds listed in ``feeds``; only the
    headline, summary, image and body containers named in
    ``keep_only_tags`` are kept from each article page.
    """

    # --- Metadata -----------------------------------------------------
    title = u'Samanyolu Haber'
    __author__ = u'thomass'
    # Turkish text is written as real UTF-8 characters, matching the
    # file's utf-8 coding declaration (previously stored as mojibake).
    description = ' Samanyolu Haber Sitesinden günlük haberler '
    publisher = 'thomass'
    category = 'güncel, haber, türkçe'
    language = 'tr'
    publication_type = 'newspaper'

    # --- Fetch limits and parsing options -----------------------------
    oldest_article = 2
    max_articles_per_feed = 100
    no_stylesheets = True
    # delay = 1
    # use_embedded_content = False
    encoding = 'utf-8'
    remove_empty_feeds = True
    # remove_attributes = ['width', 'height']

    # Reuses the metadata values defined above.
    conversion_options = {
        'tags': category,
        'language': language,
        'publisher': publisher,
        'linearize_tables': True,
    }

    # --- Styling ------------------------------------------------------
    # Adjacent literals are concatenated by the parser, so this is a
    # single CSS string.
    extra_css = (
        ' .Haber-Baslik-Yazisi {font-weight: bold; font-size: 9px}'
        ' .Haber-Ozet-Yazisi{ font-family:sans-serif;font-weight: normal;font-size: 11px }'
        ' #Haber{ font-family:sans-serif;font-weight: normal;font-size: 9px }'
        '.KirmiziText{ font-weight: normal;font-size: 5px }'
    )

    # --- Content selection --------------------------------------------
    # Keep the <div> elements matching these classes / ids.
    keep_only_tags = [
        dict(name='div',
             attrs={'class': ['Haber-Baslik-Yazisi', 'Haber-Ozet-Yazisi']}),
        dict(name='div',
             attrs={'id': ['ctl00_ContentPlaceHolder1_imagenew', 'Haber']}),
    ]

    # --- Images -------------------------------------------------------
    # NOTE(review): calibre documents `cover_url` as the cover attribute;
    # nothing in this class reads `cover_img_url` -- confirm whether it
    # has any effect or should be renamed.
    cover_img_url = 'http://static.samanyoluhaber.com/Images/resources/images/samanyoluhaber-yazi-logo.png'
    masthead_url = 'http://static.samanyoluhaber.com/Images/resources/images/samanyoluhaber-yazi-logo.png'

    # --- Feeds: (section title, RSS URL) ------------------------------
    feeds = [
        (u'Son Dakika', u'http://podcast.samanyoluhaber.com/sondakika.rss'),
        (u'Gündem', u'http://podcast.samanyoluhaber.com/gundem.rss'),
        (u'Politika ', u'http://podcast.samanyoluhaber.com/politika.rss'),
        (u'Ekonomi', u'http://podcast.samanyoluhaber.com/ekonomi.rss'),
        (u'Dünya', u'http://podcast.samanyoluhaber.com/dunya.rss'),
        (u'Spor ', u'http://podcast.samanyoluhaber.com/spor.rss'),
        (u'Sağlık', u'http://podcast.samanyoluhaber.com/saglik.rss'),
        (u'Kültür', u'http://podcast.samanyoluhaber.com/kultur.rss'),
        # Disabled in the original recipe:
        # (u'Teknoloji ', u'http://podcast.samanyoluhaber.com/teknoloji.rss'),
        (u'Eğitim', u'http://podcast.samanyoluhaber.com/egitim.rss'),
        (u'Ramazan', u'http://podcast.samanyoluhaber.com/ramazan.rss'),
        (u'Yazarlar ', u'http://podcast.samanyoluhaber.com/yazarlar.rss'),
    ]

    def preprocess_html(self, soup):
        """Replace text-only links with their plain text.

        Every ``<a>`` element whose ``.string`` is not ``None`` is swapped
        for that string; anchors where ``.string`` is ``None`` are left
        untouched.

        :param soup: parsed article document exposing ``findAll``.
        :return: the same ``soup`` object, modified in place.
        """
        for alink in soup.findAll('a'):
            link_text = alink.string
            if link_text is not None:
                alink.replaceWith(link_text)
        return soup