# -*- coding: utf-8 -*- # Copyright(C) 2010-2011 Romain Bignon # # This file is part of weboob. # # weboob is free software: you can redistribute it and/or modify # it under the terms of the GNU Affero General Public License as published by # the Free Software Foundation, either version 3 of the License, or # (at your option) any later version. # # weboob is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU Affero General Public License for more details. # # You should have received a copy of the GNU Affero General Public License # along with weboob. If not, see . import re import datetime from .base import PornPage from ..video import YoupornVideo __all__ = ['IndexPage'] class IndexPage(PornPage): def iter_videos(self): for li in self.document.getroot().xpath('//ul/li[@class="videoBox"]'): a = li.find('a') if a is None or a.find('img') is None: continue thumbnail_url = a.find('img').attrib['src'] h1 = li.find('h1') a = h1.find('a') if a is None: continue url = a.attrib['href'] _id = url[len('/watch/'):] _id = _id[:_id.find('/')] title = a.text.strip() hours = minutes = seconds = 0 div = li.cssselect('h2[class=duration]') if len(div) > 0: pack = [int(s) for s in div[0].text.strip().split(':')] if len(pack) == 3: hours, minutes, seconds = pack elif len(pack) == 2: minutes, seconds = pack rating = 0 rating_max = 0 div = li.cssselect('div.stars') if div: m = re.match('.*star-(\d).*', div[0].attrib.get('class', '')) if m: rating = int(m.group(1)) rating_max = 5 yield YoupornVideo(int(_id), title=title, rating=rating, rating_max=rating_max, duration=datetime.timedelta(hours=hours, minutes=minutes, seconds=seconds), thumbnail_url=thumbnail_url, )