isohunt 50%

2010-11-27 22:32:34 +01:00 · 2010-11-27 22:32:34 +01:00 · a40cf0ef44
commit a40cf0ef44
parent 11123a1176
6 changed files with 253 additions and 0 deletions
--- a/weboob/backends/isohunt/pages/torrents.py
+++ b/weboob/backends/isohunt/pages/torrents.py
@@ -0,0 +1,117 @@
+# -*- coding: utf-8 -*-
+
+# Copyright(C) 2010  Julien Veyssier
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation, version 3 of the License.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
+
+
+
+from weboob.tools.browser import BasePage
+from weboob.capabilities.torrent import Torrent
+
+
+__all__ = ['TorrentsPage']
+
+
+class TorrentsPage(BasePage):
+    def unit(self, n, u):
+        m = {'KB': 1024,
+             'MB': 1024*1024,
+             'GB': 1024*1024*1024,
+             'TB': 1024*1024*1024*1024,
+            }
+        return float(n*m[u])
+
+    def iter_torrents(self):
+
+
+
+        for tr in self.document.getiterator('tr'):
+            if tr.attrib.get('class','') == 'hlRow':
+                atitle = tr.getchildren()[2].getchildren()[1]
+                title = atitle.text
+                if not title:
+                    title = ''
+                for bold in atitle.getchildren():
+                    if bold.text:
+                        title += bold.text
+                    if bold.tail:
+                        title += bold.tail
+                idt = tr.getchildren()[2].getchildren()[0].attrib.get('href','')
+                idt = idt.split('/')[2]
+                size = tr.getchildren()[3].text
+                u = size[-2:]
+                size = float(size[:-3])
+                seed = tr.getchildren()[4].text
+                leech = tr.getchildren()[5].text
+                url = 'https://isohunt.com/download/%s/mon_joli_torrent.torrent' % idt
+
+                torrent = Torrent(idt,
+                                  title,
+                                  url=url,
+                                  size=self.unit(size,u),
+                                  seeders=int(seed),
+                                  leechers=int(leech))
+                yield torrent
+
+class TorrentPage(BasePage):
+    def unit(self, n, u):
+        m = {'KB': 1024,
+             'MB': 1024*1024,
+             'GB': 1024*1024*1024,
+             'TB': 1024*1024*1024*1024,
+            }
+        return float(n*m[u])
+
+    def get_torrent(self, id):
+        url = 'https://isohunt.com/download/%s/mon_joli_torrent.torrent' % id
+        for a in self.document.getiterator('a'):
+            if 'Search more torrents of' in a.attrib.get('title',''):
+                title = a.tail
+        #--------------------------TODO
+
+        description = "No description"
+        for div in self.document.getiterator('div'):
+            if div.attrib.get('id','') == 'desc':
+                description = div.text.strip()
+        for td in self.document.getiterator('td'):
+            if td.attrib.get('class','') == 'hreview-aggregate':
+                seed = int(td.getchildren()[2].getchildren()[0].getchildren()[0].text)
+                leech = int(td.getchildren()[2].getchildren()[1].getchildren()[0].text)
+                url = td.getchildren()[3].getchildren()[0].attrib.get('href')
+                title = td.getchildren()[1].getchildren()[0].getchildren()[0].text
+
+        size = 0
+        for span in self.document.getiterator('span'):
+            if span.attrib.get('class','') == "folder" or span.attrib.get('class','') == "folderopen":
+                size = span.getchildren()[1].tail
+                u = size.split(' ')[-1].split(')')[0]
+                size = float(size.split(': ')[1].split(' ')[0].replace(',','.'))
+
+        files = []
+        for td in self.document.getiterator('td'):
+            if td.attrib.get('class','') == 'torFileName':
+                files.append(td.text)
+
+
+        torrent = Torrent(id, title)
+        torrent = Torrent(id, title)
+        torrent.url = url
+        torrent.size = self.unit(size,u)
+        torrent.seeders = int(seed)
+        torrent.leechers = int(leech)
+        torrent.description = description
+        torrent.files = files
+                    
+        return torrent