weboob-devel/modules/dailymotion/browser.py

# -*- coding: utf-8 -*-

# Copyright(C) 2011  Romain Bignon
#
# This file is part of weboob.
#
# weboob is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# weboob is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with weboob. If not, see <http://www.gnu.org/licenses/>.

from urllib import quote_plus

from weboob.tools.browser import Browser
from weboob.tools.browser.decorators import id2url

from .pages import IndexPage, VideoPage, KidsVideoPage
from .video import DailymotionVideo


# Names exported by ``from <this module> import *``.
__all__ = ['DailymotionBrowser']


class DailymotionBrowser(Browser):
    """
    Browser for the Dailymotion website.

    Declares which page class handles which Dailymotion URL and offers
    helpers to fetch a single video, search videos and list the videos
    of the home page.
    """
    DOMAIN = 'www.dailymotion.com'
    ENCODING = None
    # URL regexp -> page class handling the matching pages.
    # NOTE(review): presumably consumed by the base Browser to build
    # ``self.page`` after each ``location()`` call -- confirm in Browser.
    PAGES = {r'http://[w\.]*dailymotion\.com/1': IndexPage,
             r'http://[w\.]*dailymotion\.com/[a-z\-]{2,5}/1': IndexPage,
             r'http://[w\.]*dailymotion\.com/[a-z\-]{2,5}/(\w+/)?search/.*': IndexPage,
             r'http://[w\.]*dailymotion\.com/video/(?P<id>.+)': VideoPage,
             r'http://kids\.dailymotion\.com/(?P<from>[^\/#]+)#(.*&)?video=(?P<id>.+)': KidsVideoPage,
             }

    @id2url(DailymotionVideo.id2url)
    def get_video(self, url, video=None):
        """
        Load a video page and return the video it describes.

        :param url: URL of the video page (embed ``/swf/`` URLs are accepted).
                    NOTE(review): the ``id2url`` decorator presumably also
                    lets callers pass a bare video id -- confirm.
        :param video: forwarded untouched to the page's ``get_video()``.
        :return: whatever the loaded page's ``get_video()`` returns.
        """
        # clear cookies.
        # this is required in some weird cases, namely *interactive* videoob usage
        # to avoid getting 403 errors when getting the video URL after a search.
        #
        # better control of this issue would be nice (especially if we support user login)
        self._ua_handlers['_cookies'].cookiejar.clear()

        # translate embed URLs
        url = url.replace('dailymotion.com/swf/', 'dailymotion.com/video/')
        self.location(url)
        return self.page.get_video(video)

    def home(self):
        """Go to the first page of the site index (``/1``)."""
        self.location('/1')

    def search_videos(self, pattern, sortby):
        """
        Search videos matching a pattern.

        :param pattern: search terms; every ``/`` is removed before the
                        pattern is inserted into the search URL.
        :param sortby: sort criterion inserted as a path component of the
                       search URL, or None to omit it.
        :return: the result of ``iter_videos()`` on the loaded index page.
        """
        # Slashes are dropped (not quoted) before the pattern goes into the URL.
        pattern = pattern.replace('/', '')
        # Only text needs encoding. On Python 2, calling .encode() on a byte
        # string first decodes it as ASCII, which raises UnicodeDecodeError
        # for any non-ASCII byte; byte strings are therefore passed through
        # as they are (assumed to be already UTF-8 encoded -- TODO confirm
        # with callers).
        if not isinstance(pattern, bytes):
            pattern = pattern.encode('utf-8')
        query = quote_plus(pattern)

        if sortby is None:
            url = '/en/search/%s/1' % query
        else:
            url = '/en/%s/search/%s/1' % (sortby, query)
        self.location(url)

        assert self.is_on_page(IndexPage)
        return self.page.iter_videos()

    def latest_videos(self):
        """
        List the videos shown on the home page.

        :return: the result of ``iter_videos()`` on the loaded index page.
        """
        self.home()

        assert self.is_on_page(IndexPage)
        return self.page.iter_videos()