Logo Search packages:      
Sourcecode: calibre version File versions  Download package

recipe_corriere_della_sera_it.py

#!/usr/bin/env  python

__license__   = 'GPL v3'
__copyright__ = '2009, Darko Miletic <darko.miletic at gmail.com>'
'''
www.corriere.it
'''

from calibre.web.feeds.news import BasicNewsRecipe
class Corriere_it(BasicNewsRecipe):
    """Calibre news recipe for Corriere della Sera (www.corriere.it).

    The class is purely declarative: it only assigns class attributes
    (metadata, clean-up rules and the RSS feed list) and defines no
    methods of its own.
    """

    # --- Publication metadata -------------------------------------------
    title = 'Corriere della Sera'
    __author__ = 'Darko Miletic'
    description = 'News from Milan and Italy'
    publisher = 'Corriere della Sera'
    category = 'news, politics, Italy'
    language = 'it'

    # --- Download / clean-up settings -----------------------------------
    oldest_article = 7  # in days, per the calibre recipe API
    max_articles_per_feed = 100
    no_stylesheets = True
    use_embedded_content = False
    encoding = 'cp1252'
    remove_javascript = True

    # --- Conversion options ---------------------------------------------
    # Command-line style option list that reuses the metadata above.
    html2lrf_options = [
        '--comment', description,
        '--category', category,
        '--publisher', publisher,
        '--ignore-tables',
    ]

    # The same metadata rendered as newline-separated key=value text.
    html2epub_options = '\n'.join((
        'publisher="' + publisher + '"',
        'comments="' + description + '"',
        'tags="' + category + '"',
        'linearize_tables=True',
    ))

    # --- HTML filtering rules -------------------------------------------
    # Tag matchers for <div> elements carrying either of these class
    # values; per the calibre recipe API only matching tags (and their
    # children) are kept.
    keep_only_tags = [
        {
            'name': 'div',
            'attrs': {'class': ['news-dettaglio article', 'article']},
        },
    ]

    # Tag matchers for elements to strip from the downloaded page.
    remove_tags = [
        {'name': ['base', 'object', 'link', 'embed', 'img']},
        {'name': 'div', 'attrs': {'class': 'news-goback'}},
        {'name': 'ul', 'attrs': {'class': 'toolbar'}},
    ]

    # Per the calibre recipe API, everything following the first tag that
    # matches this specification is removed.
    remove_tags_after = {'name': 'p', 'attrs': {'class': 'footnotes'}}

    # --- RSS feeds: (section title, feed URL) pairs ---------------------
    feeds = [
        (u'Ultimora', u'http://www.corriere.it/rss/ultimora.xml'),
        (u'Cronache', u'http://www.corriere.it/rss/cronache.xml'),
        (u'Economia', u'http://www.corriere.it/rss/economia.xml'),
        (u'Editoriali', u'http://www.corriere.it/rss/editoriali.xml'),
        (u'Esteri', u'http://www.corriere.it/rss/esteri.xml'),
        (u'Politica', u'http://www.corriere.it/rss/politica.xml'),
        (u'Salute', u'http://www.corriere.it/rss/salute.xml'),
        (u'Scienze', u'http://www.corriere.it/rss/scienze.xml'),
        (u'Spettacolo', u'http://www.corriere.it/rss/spettacoli.xml'),
        (u'Sport', u'http://www.corriere.it/rss/sport.xml'),
    ]


Generated by  Doxygen 1.6.0   Back to index