weboob-devel/modules/francetelevisions/browser.py

75 lines
2.7 KiB
Python

# -*- coding: utf-8 -*-
# Copyright(C) 2011-2012 Romain Bignon, Laurent Bachelier
#
# This file is part of weboob.
#
# weboob is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# weboob is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with weboob. If not, see <http://www.gnu.org/licenses/>.
from weboob.browser import PagesBrowser, URL
from .pages import IndexPage, VideoPage, Programs, VideoListPage, LatestPage
# Names exported by ``from <this module> import *``.
__all__ = ['PluzzBrowser']
class PluzzBrowser(PagesBrowser):
    """Browser for pluzz.francetv.fr and the francetelevisions web services.

    Each ``URL`` attribute below binds a URL pattern to the page class that
    handles it. The program list needed by :meth:`search_videos` is fetched
    lazily and kept in ``PROGRAMS``.
    """

    ENCODING = 'utf-8'
    BASEURL = 'http://pluzz.francetv.fr'

    # Program list cache; None until search_videos() fills it.
    PROGRAMS = None

    latest = URL('http://pluzz.webservices.francetelevisions.fr/pluzz/liste/type/replay', LatestPage)
    programs_page = URL('http://pluzz.webservices.francetelevisions.fr/pluzz/programme', Programs)
    index_page = URL(r'recherche\?recherche=(?P<pattern>.*)', IndexPage)
    video_page = URL(r'http://webservices.francetelevisions.fr/tools/getInfosOeuvre/v2/\?idDiffusion=(?P<id>.*)&catalogue=Pluzz', VideoPage)
    videos_list_page = URL('(?P<program>videos/.*)', VideoListPage)

    def get_video_from_url(self, url):
        """Return the fully loaded video found on the video list page *url*.

        *url* is passed as the ``program`` group of ``videos_list_page``, so
        it is presumably expected to look like ``videos/...`` -- verify
        against callers.

        :returns: the result of :meth:`get_video` for the video reported by
                  the page's ``get_last_video()``, or ``None`` when that call
                  returns nothing.
        """
        video = self.videos_list_page.go(program=url).get_last_video()
        if not video:
            return None
        return self.get_video(video.id, video)

    def search_videos(self, pattern):
        """Return the videos matching *pattern*.

        Programs whose ``_title`` contains *pattern* (compared after
        upper-casing both sides) are visited one by one. For each of them
        that yields a video from ``get_last_video()``, that video and
        everything from the page's ``iter_videos()`` are collected.

        When nothing was collected, the search falls back to ``index_page``.

        :returns: a list of collected videos, or, in the fallback case,
                  whatever ``iter_videos()`` of the index page returns.
        """
        if not self.PROGRAMS:
            # Assigning through self stores the cache on this instance.
            # An empty list is falsy, so an empty result is fetched again
            # on the next call.
            self.PROGRAMS = self.get_program_list()

        # Loop-invariant: upper-case the needle once, not once per program.
        needle = pattern.upper()

        videos = []
        for program in self.PROGRAMS:
            if needle not in program._title.upper():
                continue
            video = self.videos_list_page.go(program=program.id).get_last_video()
            if video:
                videos.append(video)
                # self.page is presumably the page loaded by the go() call
                # above -- it is deliberately read after get_last_video().
                videos.extend(self.page.iter_videos())

        if videos:
            return videos
        return self.index_page.go(pattern=pattern).iter_videos()

    def get_program_list(self):
        """Return the programs listed by ``programs_page`` as a list."""
        return list(self.programs_page.go().iter_programs())

    @video_page.id2url
    def get_video(self, url, video=None):
        """Load the video page at *url* and return the populated video.

        The method is wrapped by ``video_page.id2url``; presumably this lets
        callers pass a bare video id instead of a full URL -- confirm against
        the ``URL`` implementation.

        :param url: location handed to ``self.location()``.
        :param video: optional existing object passed to the page as ``obj``.
        :returns: the video returned by the page's ``get_video()``, with its
                  ``url`` replaced as described below.
        """
        self.location(url)
        video = self.page.get_video(obj=video)
        # The URL reported by the page is itself fetched line by line; every
        # line overwrites video.url, so the last line read is the one kept.
        # If the response has no lines, video.url is left unchanged.
        for line in self.read_url(video.url):
            video.url = u'%s' % line
        return video

    def read_url(self, url):
        """Open *url* with ``stream=True`` and return its ``iter_lines()``."""
        return self.open(url, stream=True).iter_lines()

    def latest_videos(self):
        """Return ``iter_videos()`` of the ``latest`` page."""
        return self.latest.go().iter_videos()