Skip to content
This repository

HTTPS clone URL

Subversion checkout URL

You can clone with HTTPS or Subversion.

Download ZIP
tree: 735747ab20
Fetching contributors…

Cannot retrieve contributors at this time

file 44 lines (37 sloc) 2.142 kb
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44
from calibre.web.feeds.news import BasicNewsRecipe

class BangkokPostRecipe(BasicNewsRecipe):
    """Calibre news recipe for the Bangkok Post.

    The recipe is purely declarative: it lists the RSS feeds to fetch and
    the tag filters calibre applies to each downloaded article page.
    """

    # Recipe bookkeeping.
    __license__ = 'GPL v3'
    __author__ = 'kwetal'
    language = 'en_TH'
    version = 1

    # Publication metadata.
    title = u'Bangkok Post'
    publisher = u'Post Publishing PCL'
    category = u'News'
    description = u"The world's window to Thailand"

    # Download limits (see the calibre BasicNewsRecipe API for exact units).
    oldest_article = 1
    max_articles_per_feed = 50

    # Fetch the linked article pages rather than relying on feed content,
    # and drop the site's own CSS and scripts.
    no_stylesheets = True
    remove_javascript = True
    use_embedded_content = False

    # (section title, feed URL) pairs.
    # Feeds from: http://www.bangkokpost.com/rss/
    feeds = [
        (u'Breaking News', u'http://www.bangkokpost.com/rss/data/breakingnews.xml'),
        (u'Top Stories', u'http://www.bangkokpost.com/rss/data/topstories.xml'),
        (u'News', u'http://www.bangkokpost.com/rss/data/news.xml'),
        (u'Business', u'http://www.bangkokpost.com/rss/data/business.xml'),
        (u'Opinion', u'http://www.bangkokpost.com/rss/data/opinion.xml'),
        (u'Travel', u'http://www.bangkokpost.com/rss/data/travel.xml'),
        (u'Leisure', u'http://www.bangkokpost.com/rss/data/leisure.xml'),
        (u'Entertainment', u'http://www.bangkokpost.com/rss/data/entertainment.xml'),
        (u'Auto', u'http://www.bangkokpost.com/rss/data/auto.xml'),
        (u'Life', u'http://www.bangkokpost.com/rss/data/life.xml'),
        # NOTE(review): 'tect.xml' looks like a typo for 'tech.xml' -- confirm
        # against the site's RSS index before changing the URL.
        (u'Tech', u'http://www.bangkokpost.com/rss/data/tect.xml'),
    ]

    # Only the article body container is kept.
    keep_only_tags = [
        dict(name='div', attrs={'class': 'entry'}),
    ]

    # Elements stripped from the kept content.
    remove_tags = [
        dict(name='div', attrs={'class': 'article-features'}),
        dict(name='div', attrs={'class': 'socialBookmark'}),
        dict(name='div', attrs={'id': 'main-sns'}),
        # The site embeds its YouTube videos in iframes; if you want those,
        # you will have to parse the articles by hand. Setting self.recursion
        # to 1 might resolve this, but it makes calibre download a lot of PDF
        # files, which causes a very, very long download time.
        dict(name='iframe'),
    ]
Something went wrong with that request. Please try again.