#!/usr/bin/env python __license__ = 'GPL v3' ''' OSNews.pl ''' from calibre.web.feeds.news import BasicNewsRecipe import re class OSNewsRecipe(BasicNewsRecipe): __author__ = u'Mori & Tomasz D\u0142ugosz' language = 'pl' title = u'OSnews.pl' publisher = u'OSnews.pl' description = u'OSnews.pl jest spo\u0142eczno\u015bciowym serwisem informacyjnym po\u015bwi\u0119conym oprogramowaniu, systemom operacyjnym i \u015bwiatowi IT' no_stylesheets = True remove_javascript = True encoding = 'utf-8' use_embedded_content = False; remove_empty_feeds = True oldest_article = 7 max_articles_per_feed = 100 cover_url='http://osnews.pl/wp-content/themes/osnews/img/logo.png' extra_css = ''' .news-heading {font-size:150%} .newsinformations li {display:inline;} blockquote {border:2px solid #000; padding:5px;} ''' feeds = [ (u'Niusy', u'http://feeds.feedburner.com/OSnewspl'), (u'Wylęgarnia', u'http://feeds.feedburner.com/osnewspl_nowe') ] keep_only_tags = [ dict(name = 'div', attrs = {'id' : 'content'}) ] remove_tags = [ dict(name = 'div', attrs = {'class' : ['newstags', 'tw_button', 'post_prev']}), dict(name = 'div', attrs = {'id' : 'newspage_upinfo'}), ] remove_tags_after = dict(name = 'div', attrs = {'class' : 'post_prev'}) preprocess_regexps = [(re.compile(u'Komentarze: \(?[0-9]+\)? ?'), lambda match: '')]