home *** CD-ROM | disk | FTP | other *** search
- __license__ = 'GPL v3'
- __copyright__ = '2010, Dean Cording'
- '''
- abc.net.au/news
- '''
- import re
- from calibre.web.feeds.recipes import BasicNewsRecipe
-
- class ABCNews(BasicNewsRecipe):
- title = 'ABC News'
- __author__ = 'Dean Cording'
- description = 'News from Australia'
- masthead_url = 'http://www.abc.net.au/news/assets/v5/images/common/logo-news.png'
- cover_url = 'http://www.abc.net.au/news/assets/v5/images/common/logo-news.png'
-
- oldest_article = 2
- max_articles_per_feed = 100
- no_stylesheets = False
- #delay = 1
- use_embedded_content = False
- encoding = 'utf8'
- publisher = 'ABC News'
- category = 'News, Australia, World'
- language = 'en_AU'
- publication_type = 'newsportal'
- preprocess_regexps = [(re.compile(r'<!--.*?-->', re.DOTALL), lambda m: '')]
- conversion_options = {
- 'comments' : description
- ,'tags' : category
- ,'language' : language
- ,'publisher' : publisher
- ,'linearize_tables': False
- }
-
- keep_only_tags = dict(id='article')
-
- remove_tags = [dict(attrs={'class':['related', 'tags']}),
- dict(id='statepromo')
- ]
-
- remove_attributes = ['width','height']
-
- feeds = [
- ('Top Stories', 'http://www.abc.net.au/news/syndicate/topstoriesrss.xml'),
- ('Canberra', 'http://www.abc.net.au/news/indexes/idx-act/rss.xml'),
- ('Sydney', 'http://www.abc.net.au/news/indexes/sydney/rss.xml'),
- ('Melbourne', 'http://www.abc.net.au/news/indexes/melbourne/rss.xml'),
- ('Brisbane', 'http://www.abc.net.au/news/indexes/brisbane/rss.xml'),
- ('Perth', 'http://www.abc.net.au/news/indexes/perth/rss.xml'),
- ('Australia', 'http://www.abc.net.au/news/indexes/idx-australia/rss.xml'),
- ('World', 'http://www.abc.net.au/news/indexes/world/rss.xml'),
- ('Business', 'http://www.abc.net.au/news/indexes/business/rss.xml'),
- ('Science and Technology', 'http://www.abc.net.au/news/tag/science-and-technology/rss.xml'),
- ]
-