weboob-devel/modules/dailymotion/browser.py
2014-09-26 10:18:12 +02:00

74 lines
2.6 KiB
Python

# -*- coding: utf-8 -*-
# Copyright(C) 2011 Romain Bignon
#
# This file is part of weboob.
#
# weboob is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# weboob is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with weboob. If not, see <http://www.gnu.org/licenses/>.
from urllib import quote_plus
from weboob.tools.browser import Browser
from weboob.tools.browser.decorators import id2url
from .pages import IndexPage, VideoPage, KidsVideoPage
from .video import DailymotionVideo
# Public names exported by a star-import of this module.
__all__ = ['DailymotionBrowser']
class DailymotionBrowser(Browser):
    """Browser for dailymotion.com listings, searches and video pages."""

    DOMAIN = 'www.dailymotion.com'
    ENCODING = None

    # URL regexp -> page class. Presumably consumed by the Browser base class
    # to pick the page object for the current location (confirm in Browser).
    PAGES = {
        r'http://[w\.]*dailymotion\.com/1': IndexPage,
        r'http://[w\.]*dailymotion\.com/[a-z\-]{2,5}/1': IndexPage,
        r'http://[w\.]*dailymotion\.com/[a-z\-]{2,5}/(\w+/)?search/.*': IndexPage,
        r'http://[w\.]*dailymotion\.com/video/(?P<id>.+)': VideoPage,
        r'http://kids\.dailymotion\.com/(?P<from>[^\/#]+)#(.*&)?video=(?P<id>.+)': KidsVideoPage,
    }

    @id2url(DailymotionVideo.id2url)
    def get_video(self, url, video=None):
        """Open the page at *url* and return what its ``get_video`` yields.

        :param url: address of the video page; embed (``/swf/``) addresses
                    are rewritten to their ``/video/`` form before loading.
        :param video: forwarded unchanged to the page's ``get_video``.
        """
        # Start from an empty cookie jar. Needed in some odd cases, notably
        # *interactive* videoob sessions, where fetching the video URL right
        # after a search otherwise ends in a 403 error.
        #
        # A finer-grained handling would be welcome, especially if user
        # login is ever supported.
        cookie_handler = self._ua_handlers['_cookies']
        cookie_handler.cookiejar.clear()

        # Embed URLs point at the flash player; switch to the regular page.
        video_url = url.replace('dailymotion.com/swf/', 'dailymotion.com/video/')
        self.location(video_url)
        return self.page.get_video(video)

    def home(self):
        """Go to the first page of the site index (``/1``)."""
        self.location('/1')

    def search_videos(self, pattern, sortby):
        """Run a search for *pattern* and return the result page's videos.

        :param pattern: search text; every ``/`` is removed and the rest is
                        UTF-8 encoded and URL-quoted before use.
        :param sortby: path segment selecting the sort order, or ``None``
                       to use the plain search URL.
        :return: the value of ``iter_videos()`` on the resulting page.
        """
        query = quote_plus(pattern.replace('/', '').encode('utf-8'))

        if sortby is not None:
            target = '/en/%s/search/%s/1' % (sortby, query)
        else:
            target = '/en/search/%s/1' % query

        self.location(target)
        assert self.is_on_page(IndexPage)
        return self.page.iter_videos()

    def latest_videos(self):
        """Load the home index and return the videos it lists."""
        self.home()
        assert self.is_on_page(IndexPage)
        return self.page.iter_videos()