From c9614152f66a61b1bcc3f917bc63c495a6b9e83a Mon Sep 17 00:00:00 2001
From: Roger Philibert
Date: Wed, 13 Jul 2011 02:22:00 +0200
Subject: [PATCH] add basic support for Izneo

---
Note: the file contents below were edited after this patch was generated;
the blob ids on the "index" lines were not regenerated.

 weboob/backends/izneo/__init__.py |  22 +++++
 weboob/backends/izneo/backend.py  | 128 ++++++++++++++++++++++++++++++
 weboob/capabilities/gallery.py    |   5 +-
 3 files changed, 154 insertions(+), 1 deletion(-)
 create mode 100644 weboob/backends/izneo/__init__.py
 create mode 100644 weboob/backends/izneo/backend.py

diff --git a/weboob/backends/izneo/__init__.py b/weboob/backends/izneo/__init__.py
new file mode 100644
index 00000000..fcb468a8
--- /dev/null
+++ b/weboob/backends/izneo/__init__.py
@@ -0,0 +1,22 @@
+# -*- coding: utf-8 -*-
+
+# Copyright(C) 2010-2011 Roger Philibert
+#
+# This file is part of weboob.
+#
+# weboob is free software: you can redistribute it and/or modify
+# it under the terms of the GNU Affero General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# (at your option) any later version.
+#
+# weboob is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+# GNU Affero General Public License for more details.
+#
+# You should have received a copy of the GNU Affero General Public License
+# along with weboob. If not, see <http://www.gnu.org/licenses/>.
+
+from .backend import IzneoBackend
+
+__all__ = ['IzneoBackend']
diff --git a/weboob/backends/izneo/backend.py b/weboob/backends/izneo/backend.py
new file mode 100644
index 00000000..da87b0ee
--- /dev/null
+++ b/weboob/backends/izneo/backend.py
@@ -0,0 +1,128 @@
+# -*- coding: utf-8 -*-
+
+# Copyright(C) 2010-2011 Roger Philibert
+#
+# This file is part of weboob.
+#
+# weboob is free software: you can redistribute it and/or modify
+# it under the terms of the GNU Affero General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# (at your option) any later version.
+#
+# weboob is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+# GNU Affero General Public License for more details.
+#
+# You should have received a copy of the GNU Affero General Public License
+# along with weboob. If not, see <http://www.gnu.org/licenses/>.
+
+from __future__ import with_statement
+
+try:
+    import simplejson as json
+except ImportError:
+    import json
+
+import re
+
+from weboob.capabilities.gallery import ICapGallery, BaseGallery, BaseImage
+from weboob.tools.backend import BaseBackend
+from weboob.tools.browser import BaseBrowser, BasePage
+
+__all__ = ['IzneoBackend']
+
+class ReaderV2(BasePage):
+    """Page matched by the readv2 URL pattern in IzneoBrowser.PAGES."""
+
+    def get_ean(self):
+        """Return the ``rel`` attribute of the ``div`` whose id is ``viewer``."""
+        return self.document.xpath("//div[@id='viewer']/attribute::rel")[0]
+
+    def iter_gallery_images(self, gallery):
+        """Yield a BaseImage for each entry of the player's JPEG list.
+
+        This is a generator: the list is only requested from the site once
+        iteration starts.
+        """
+        ean = self.get_ean()
+        pages = json.load(self.browser.openurl(
+            'http://www.izneo.com/playerv2/ajax.php?ean=%s&action=get_list_jpg'
+            % ean))
+
+        width = 1200 # maximum width
+        for page in pages:
+            yield BaseImage(page['page'],
+                    gallery=gallery,
+                    url=("http://www.izneo.com/playerv2/%s/%s/%s/%d/%s" %
+                        (page['expires'], page['token'], ean, width, page['page'])))
+
+class IzneoBrowser(BaseBrowser):
+    """Browser that maps Izneo readv2 URLs to the ReaderV2 page."""
+
+    # The dots around 'izneo' are escaped so they match a literal '.' only.
+    PAGES = { r'http://.+\.izneo\.\w+/readv2-.+': ReaderV2 }
+
+    def iter_gallery_images(self, gallery):
+        """Open ``gallery.url`` and return the reader page's image generator."""
+        self.location(gallery.url)
+        assert self.is_on_page(ReaderV2)
+        return self.page.iter_gallery_images(gallery)
+
+    def fill_image(self, image, fields):
+        """Load ``image.data`` when 'data' is one of the requested fields."""
+        if 'data' in fields:
+            # Passes the gallery URL under the 'Referer' key of the request.
+            image.data = self.readurl(self.request_class(
+                image.url, None, {'Referer': image.gallery.url}))
+
+
+class IzneoBackend(BaseBackend, ICapGallery):
+    """Gallery backend for Izneo."""
+
+    NAME = 'izneo'
+    MAINTAINER = 'Roger Philibert'
+    EMAIL = 'roger.philibert@gmail.com'
+    VERSION = '0.9'
+    DESCRIPTION = 'Izneo'
+    LICENSE = 'AGPLv3+'
+    BROWSER = IzneoBrowser
+
+    def iter_gallery_images(self, gallery):
+        """Return the images of ``gallery`` as a list of BaseImage objects."""
+        with self.browser:
+            # The browser hands back a lazy generator; consume it here so the
+            # page-list request is made inside the ``with`` block, not after it.
+            return list(self.browser.iter_gallery_images(gallery))
+
+    def get_gallery(self, _id):
+        """Build a BaseGallery from an id or reader URL.
+
+        Accepts ``<digits>-<digits>``, optionally prefixed by ``readv2-`` and
+        by anything ending in ``izneo.com/``, with an optional trailing slash.
+        Returns None when ``_id`` does not match.
+        """
+        match = re.match(r'(?:(?:.+izneo\.com/)?readv2-)?(\d+-\d+)/?$', _id)
+        if match is None:
+            return None
+
+        _id = match.group(1)
+
+        gallery = BaseGallery(_id, url=('http://www.izneo.com/readv2-%s' % _id))
+        # NOTE(review): nothing below uses the browser; confirm whether
+        # entering it here is still needed.
+        with self.browser:
+            return gallery
+
+    def fill_gallery(self, gallery, fields):
+        """Use the gallery id as its title; ``fields`` is not consulted."""
+        gallery.title = gallery.id
+
+    def fill_image(self, image, fields):
+        """Delegate to the browser's fill_image inside ``with self.browser``."""
+        with self.browser:
+            self.browser.fill_image(image, fields)
+
+    OBJECTS = {
+            BaseGallery: fill_gallery,
+            BaseImage: fill_image }
diff --git a/weboob/capabilities/gallery.py b/weboob/capabilities/gallery.py
index a01bfee4..a546f238 100644
--- a/weboob/capabilities/gallery.py
+++ b/weboob/capabilities/gallery.py
@@ -56,7 +56,9 @@ class BaseGallery(CapBaseObject):
         raise NotImplementedError()
 
 class BaseImage(CapBaseObject):
-    def __init__(self, _id, index=None, thumbnail=NotLoaded, url=NotLoaded, ext=NotLoaded):
+    def __init__(self, _id, index=None, thumbnail=NotLoaded, url=NotLoaded,
+            ext=NotLoaded, gallery=None):
+
         CapBaseObject.__init__(self, unicode(_id))
 
         self.add_field('index', int, index) # usually page number
@@ -64,6 +66,7 @@ class BaseImage(CapBaseObject):
         self.add_field('url', basestring, url)
         self.add_field('ext', basestring, ext)
         self.add_field('data', str)
+        self.add_field('gallery', BaseGallery, gallery)
 
     def __str__(self):
         return self.url