home
***
CD-ROM
|
disk
|
FTP
|
other
***
search
/
Chip 2011 November
/
CHIP_2011_11.iso
/
Programy
/
Narzedzia
/
Calibre
/
calibre-0.8.18.msi
/
file_280
/
sme.recipe
< prev
next >
Wrap
Text File
|
2011-09-09
|
3KB
|
70 lines
from calibre.web.feeds.news import BasicNewsRecipe
import re
class SmeRecipe(BasicNewsRecipe):
__license__ = 'GPL v3'
__author__ = 'kwetal'
language = 'sk'
version = 1
title = u'SME'
publisher = u''
category = u'News, Newspaper'
description = u'News from Slovakia'
oldest_article = 1
max_articles_per_feed = 100
use_embedded_content = False
remove_empty_feeds = True
no_stylesheets = True
remove_javascript = True
# Feeds from: http://rss.sme.sk/
feeds = []
feeds.append((u'Tituln\u00E1 strana', u'http://rss.sme.sk/rss/rss.asp?id=frontpage'))
feeds.append((u'Naj\u010D\u00EDtanej\u0161ie za 4 hodiny', u'http://rss.sme.sk/rss/rss.asp?id=smenajcit4'))
feeds.append((u'Naj\u010D\u00EDtanej\u0161ie za 24 hod\u00EDn', u'http://rss.sme.sk/rss/rss.asp?id=smenajcit24'))
feeds.append((u'Z domova', u'http://rss.sme.sk/rss/rss.asp?sek=smeonline&rub=online_zdom'))
feeds.append((u'Zahrani\u010Die', u'http://rss.sme.sk/rss/rss.asp?sek=smeonline&rub=online_zahr'))
feeds.append((u'Z domova + zahrani\u010Die', u'http://rss.sme.sk/rss/rss.asp?sek=smeonline'))
feeds.append((u'Ekonomika', u'http://rss.sme.sk/rss/rss.asp?sek=ekon'))
feeds.append((u'Kult\u00FAra', u'http://rss.sme.sk/rss/rss.asp?sek=kult'))
feeds.append((u'Koment\u00E1re', u'http://rss.sme.sk/rss/rss.asp?sek=koment'))
feeds.append((u'Volby', u'http://rss.sme.sk/rss/rss.asp?sek=eVolby'))
#feeds.append((u'Press foto', u'http://rss.sme.sk/rss/rss.asp?sek=smeonline&rub=online_foto'))
feeds.append((u'\u0160port', u'http://rss.sme.sk/rss/rss.asp?sek=sport'))
feeds.append((u'Futbal', u'http://rss.sme.sk/rss/rss.asp?sek=futbal'))
feeds.append((u'Hokej', u'http://rss.sme.sk/rss/rss.asp?sek=hokej'))
feeds.append((u'Po\u010D\u00EDta\u010De', u'http://rss.sme.sk/rss/rss.asp?sek=pocit'))
feeds.append((u'Mobil', u'http://rss.sme.sk/rss/rss.asp?sek=mobil'))
feeds.append((u'Veda', u'http://rss.sme.sk/rss/rss.asp?sek=veda'))
feeds.append((u'Natankuj', u'http://rss.sme.sk/rss/rss.asp?sek=natankuj'))
feeds.append((u'Auto', u'http://rss.sme.sk/rss/rss.asp?sek=auto'))
feeds.append((u'Dom\u00E1cnos\u0165', u'http://rss.sme.sk/rss/rss.asp?sek=domac'))
feeds.append((u'\u017Dena', u'http://rss.sme.sk/rss/rss.asp?sek=zena'))
feeds.append((u'Z\u00E1bava', u'http://rss.sme.sk/rss/rss.asp?sek=zabava'))
feeds.append((u'Hry', u'http://rss.sme.sk/rss/rss.asp?sek=hry'))
#feeds.append((u'', u''))
keep_only_tags = []
keep_only_tags.append(dict(name = 'div', attrs = {'id': 'contenth'}))
keep_only_tags.append(dict(name = 'div', attrs = {'class': 'articlec col'}))
remove_tags = []
remove_tags.append(dict(name = 'div', attrs = {'id': re.compile('smeplayer.*')}))
remove_tags_after = [dict(name = 'p', attrs = {'class': 'autor_line'})]
extra_css = '''
@font-face {font-family: "serif1";src:url(res:///opt/sony/ebook/FONT/tt0011m_.ttf)}
@font-face {font-family: "sans1";src:url(res:///opt/sony/ebook/FONT/LiberationSans.ttf)}
body {font-family: sans1, serif1;}
'''
def print_version(self, url):
parts = url.split('/')
id = parts[4]
return u'http://korzar.sme.sk/clanok_tlac.asp?cl=' + str(id)