# -*- coding: utf-8 -*-

# Copyright(C) 2011 Romain Bignon
#
# This file is part of weboob.
#
# weboob is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# weboob is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with weboob. If not, see <http://www.gnu.org/licenses/>.


from urllib import quote_plus

from weboob.deprecated.browser import Browser
from weboob.deprecated.browser.decorators import id2url

from .pages import IndexPage, VideoPage, KidsVideoPage
from .video import DailymotionVideo


__all__ = ['DailymotionBrowser']


class DailymotionBrowser(Browser):
    """Browser for dailymotion.com: maps site URLs to page classes and
    exposes video lookup, search and "latest videos" listing."""

    DOMAIN = 'www.dailymotion.com'
    ENCODING = None

    # URL pattern -> page class handling the matching location.
    #
    # NOTE(review): the named groups below had lost their ``<name>`` part
    # (``(?P.+)`` is rejected by ``re`` as an unknown extension).  The names
    # ``id`` and ``user`` were restored here; confirm them against the page
    # classes in ``.pages`` that read these groups.
    PAGES = {r'http://[w\.]*dailymotion\.com/1': IndexPage,
             r'http://[w\.]*dailymotion\.com/[a-z\-]{2,5}/1': IndexPage,
             r'http://[w\.]*dailymotion\.com/[a-z\-]{2,5}/(\w+/)?search/.*': IndexPage,
             r'http://[w\.]*dailymotion\.com/video/(?P<id>.+)': VideoPage,
             r'http://kids\.dailymotion\.com/(?P<user>[^\/#]+)#(.*&)?video=(?P<id>.+)': KidsVideoPage,
            }

    @id2url(DailymotionVideo.id2url)
    def get_video(self, url, video=None):
        """Open the page at *url* and return what its ``get_video`` yields.

        :param url: location of the video page.  Presumably the ``id2url``
            decorator also lets callers pass a bare video id -- verify
            against ``weboob.deprecated.browser.decorators``.
        :param video: optional object forwarded unchanged to the page's
            ``get_video``.
        :returns: the result of ``self.page.get_video(video)``.
        """
        # clear cookies.
        # this is required in some weird cases, namely *interactive* videoob
        # usage to avoid getting 403 errors when getting the video URL after
        # a search.
        #
        # better control of this issue would be nice (especially if we
        # support user login)
        self._ua_handlers['_cookies'].cookiejar.clear()

        # translate embed URLs
        url = url.replace('dailymotion.com/swf/', 'dailymotion.com/video/')

        self.location(url)
        return self.page.get_video(video)

    def home(self):
        """Navigate to the ``/1`` location (first page of the index)."""
        self.location('/1')

    def search_videos(self, pattern, sortby):
        """Search for videos matching *pattern* and iterate over the results.

        :param pattern: search terms; any ``/`` is removed, then the text is
            UTF-8 encoded and URL-quoted before being put in the path.
        :param sortby: path segment inserted before ``search`` in the URL,
            or ``None`` to use the URL without that segment.
        :returns: the result of ``self.page.iter_videos()``.
        :raises AssertionError: if the browser did not land on an
            ``IndexPage``.
        """
        # '/' would be taken as a path separator in the search URL.
        pattern = pattern.replace('/', '').encode('utf-8')
        if sortby is None:
            url = '/en/search/%s/1' % quote_plus(pattern)
        else:
            url = '/en/%s/search/%s/1' % (sortby, quote_plus(pattern))
        self.location(url)

        assert self.is_on_page(IndexPage)
        return self.page.iter_videos()

    def latest_videos(self):
        """Go to the home page and iterate over the videos listed there.

        :returns: the result of ``self.page.iter_videos()``.
        :raises AssertionError: if the browser did not land on an
            ``IndexPage``.
        """
        self.home()

        assert self.is_on_page(IndexPage)
        return self.page.iter_videos()