weboob-devel/modules/btmon/pages.py
Romain Bignon d61e15cf84 rename things related to browsers
weboob.tools.browser -> weboob.deprecated.browser
weboob.tools.parsers -> weboob.deprecated.browser.parsers
weboob.tools.mech -> weboob.deprecated.mech
weboob.browser2 -> weboob.browser
weboob.core.exceptions -> weboob.exceptions

Also, the new tree for browser2 is:

weboob.browser: import weboob.browser.browsers.* and weboob.browser.url.*
weboob.browser.browsers: all browsers (including PagesBrowser and LoginBrowser)
weboob.browser.url: the URL class
weboob.browser.profiles: all Profile classes
weboob.browser.sessions: WeboobSession and FuturesSession
weboob.browser.cookies: that's a cookies thing
weboob.browser.pages: all Page and derivated classes, and Form class
weboob.browser.exceptions: specific browser exceptions
weboob.browser.elements: AbstractElement classes, and 'method' decorator
weboob.browser.filters.*: all filters
2014-10-07 00:30:07 +02:00

112 lines
4.5 KiB
Python

# -*- coding: utf-8 -*-
# Copyright(C) 2013 Julien Veyssier
#
# This file is part of weboob.
#
# weboob is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# weboob is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with weboob. If not, see <http://www.gnu.org/licenses/>.
import string
from weboob.capabilities.torrent import Torrent
from weboob.capabilities.base import NotAvailable, NotLoaded
from weboob.deprecated.browser import Page
from weboob.tools.misc import get_bytes_size
class TorrentsPage(Page):
def iter_torrents(self):
for div in self.parser.select(self.document.getroot(),'div.list_tor'):
name = NotAvailable
size = NotAvailable
seeders = NotAvailable
leechers = NotAvailable
right_div = self.parser.select(div,'div.list_tor_right',1)
try:
seeders = int(self.parser.select(right_div,'b.green',1).text)
except ValueError:
seeders = 0
try:
leechers = int(self.parser.select(right_div,'b.red',1).text)
except ValueError:
leechers = 0
sizep = self.parser.select(right_div,'p')[0]
sizespan = self.parser.select(sizep,'span')[0]
nsize = float(sizespan.text_content().split(':')[1].split()[0])
usize = sizespan.text_content().split()[-1].upper()
size = get_bytes_size(nsize,usize)
a = self.parser.select(div,'a.list_tor_title',1)
href = a.attrib.get('href','')
name = unicode(a.text_content())
id = unicode(href.strip('/').split('.html')[0])
torrent = Torrent(id,name)
torrent.url = NotLoaded
torrent.filename = id
torrent.magnet = NotLoaded
torrent.size = size
torrent.seeders = seeders
torrent.leechers = leechers
torrent.description = NotLoaded
torrent.files = NotLoaded
yield torrent
class TorrentPage(Page):
def get_torrent(self):
seed = 0
leech = 0
description = NotAvailable
url = NotAvailable
magnet = NotAvailable
title = NotAvailable
id = unicode(self.browser.geturl().split('.html')[0].split('/')[-1])
div = self.parser.select(self.document.getroot(),'div#middle_content',1)
title = u'%s'%self.parser.select(self.document.getroot(),'div#middle_content > h1',1).text
slblock_values = self.parser.select(div,'div.sl_block b')
if len(slblock_values) >= 2:
seed = slblock_values[0].text
leech = slblock_values[1].text
href_t = self.parser.select(div,'a.down',1).attrib.get('href','')
url = u'http://%s%s'%(self.browser.DOMAIN,href_t)
magnet = unicode(self.parser.select(div,'a.magnet',1).attrib.get('href',''))
divtabs = self.parser.select(div,'div#tabs',1)
files_div = self.parser.select(divtabs,'div.body > div.doubleblock > div.leftblock')
files = []
if len(files_div) > 0:
size_text = self.parser.select(files_div,'h5',1).text
for b in self.parser.select(files_div,'b'):
div = b.getparent()
files.append(div.text_content())
else:
size_text = self.parser.select(divtabs,'h5',1).text_content()
size_text = size_text.split('(')[1].split(')')[0].strip()
size = float(size_text.split(',')[1].strip(string.letters))
u = size_text.split(',')[1].strip().translate(None,string.digits).strip('.').strip().upper()
div_desc = self.parser.select(divtabs,'div#descriptionContent')
if len(div_desc) > 0:
description = unicode(div_desc[0].text_content())
torrent = Torrent(id, title)
torrent.url = url
torrent.filename = id
torrent.magnet = magnet
torrent.size = get_bytes_size(size, u)
torrent.seeders = int(seed)
torrent.leechers = int(leech)
torrent.description = description
torrent.files = files
return torrent