LCL: update to fit web site changes

Update login process Secure login by adding a random value in the URL as in the original web site Deal with both Pro and Particulier versions Signed-off-by: Pierre Mazière <pierre.maziere@gmail.com>
2012-01-24 23:19:52 +01:00 · 2012-01-24 23:19:52 +01:00 · 8a70c77b80
commit 8a70c77b80
parent 2310e8506f
2 changed files with 89 additions and 77 deletions
--- a/modules/lcl/browser.py
+++ b/modules/lcl/browser.py
@ -20,7 +20,7 @@
 from weboob.tools.browser import BaseBrowser, BrowserIncorrectPassword
-from .pages import LoginPage, LoginResultPage, FramePage, AccountsPage, AccountHistoryPage
+from .pages import SkipPage, LoginPage, AccountsPage, AccountHistoryPage
 __all__ = ['LCLBrowser']
@ -33,11 +33,11 @@ class LCLBrowser(BaseBrowser):
    ENCODING = 'utf-8'
    USER_AGENT = BaseBrowser.USER_AGENTS['wget']
    PAGES = {
-        'https://particuliers.secure.lcl.fr/everest/UWBI/UWBIAccueil\?DEST=PAGEIDENT': LoginPage,
+        'https://particuliers.secure.lcl.fr/outil/UAUT/Authentication/authenticate': LoginPage,
-        'https://particuliers.secure.lcl.fr/everest/UWBI/UWBIAccueil\?DEST=IDENTIFICATION': LoginResultPage,
+        'https://particuliers.secure.lcl.fr/outil/UWSP/Synthese': AccountsPage,
        'https://particuliers.secure.lcl.fr/outil/UWSP/Synthese/accesSynthese': AccountsPage,
        'https://particuliers.secure.lcl.fr/outil/UWB2/Accueil\?DEST=INIT': FramePage,
        'https://particuliers.secure.lcl.fr/outil/UWLM/ListeMouvements.*/accesListeMouvements.*': AccountHistoryPage,
        'https://particuliers.secure.lcl.fr/outil/UAUT/Contrat/selectionnerContrat.*': SkipPage,
        'https://particuliers.secure.lcl.fr/index.html': SkipPage
        }
    def __init__(self, agency, *args, **kwargs):
@ -55,17 +55,17 @@ class LCLBrowser(BaseBrowser):
        assert self.agency.isdigit()
        if not self.is_on_page(LoginPage):
-            self.location('%s://%s/everest/UWBI/UWBIAccueil?DEST=PAGEIDENT' \
+            self.location('%s://%s/outil/UAUT/Authentication/authenticate' \
                          % (self.PROTOCOL, self.DOMAIN),
                          no_login=True)
        if not self.page.login(self.agency, self.username, self.password) or \
           not self.is_logged() or \
-           (self.is_on_page(LoginResultPage) and self.page.is_error()) :
+           (self.is_on_page(LoginPage) and self.page.is_error()) :
            raise BrowserIncorrectPassword()
-
+        self.location('%s://%s/outil/UWSP/Synthese' \
-        self.location('%s://%s/outil/UWSP/Synthese/accesSynthese' \
+                      % (self.PROTOCOL, self.DOMAIN),
-                      % (self.PROTOCOL, self.DOMAIN))
+                      no_login=True)
    def get_accounts_list(self):
        if not self.is_on_page(AccountsPage):
--- a/modules/lcl/pages.py
+++ b/modules/lcl/pages.py
@ -25,6 +25,8 @@ from weboob.tools.browser import BasePage, BrowserUnavailable
 from weboob.tools.captcha.virtkeyboard import MappedVirtKeyboard, VirtKeyboardError
 from logging import error
 import tempfile
 import math
 import random
 class LCLVirtKeyboard(MappedVirtKeyboard):
    symbols={'0':'9da2724133f2221482013151735f033c',
@ -39,14 +41,16 @@ class LCLVirtKeyboard(MappedVirtKeyboard):
             '9':'cc60e5894a9d8e12ee0c2c104c1d5490'
            }
-    url="/UWBI/UWBIAccueil?DEST=GENERATION_CLAVIER"
+    url="/outil/UAUT/Clavier/creationClavier?random="
    color=(255,255,255,255)
    def __init__(self,basepage):
        img=basepage.document.find("//img[@id='idImageClavier']")
        random.seed()
        self.url+="%li"%math.floor(long(random.random()*1000000000000000000000))
        MappedVirtKeyboard.__init__(self,basepage.browser.openurl(self.url),
-                                    basepage.document,img,self.color)
+                                    basepage.document,img,self.color,"id")
        if basepage.browser.responses_dirname is None:
            basepage.browser.responses_dirname = \
                    tempfile.mkdtemp(prefix='weboob_session_')
@ -54,7 +58,7 @@ class LCLVirtKeyboard(MappedVirtKeyboard):
    def get_symbol_code(self,md5sum):
        code=MappedVirtKeyboard.get_symbol_code(self,md5sum)
-        return code[-5:-3]
+        return code[-2:]
    def get_string_code(self,string):
        code=''
@ -62,6 +66,8 @@ class LCLVirtKeyboard(MappedVirtKeyboard):
            code+=self.get_symbol_code(self.symbols[c])
        return code
 class SkipPage(BasePage):
    pass
 class LoginPage(BasePage):
    def myXOR(self,value,seed):
@ -81,22 +87,23 @@ class LoginPage(BasePage):
        seed=-1
        str="var aleatoire = "
-        for script in self.document.findall("/head/script"):
+        for script in self.document.findall("//script"):
            if(script.text is None or len(script.text)==0):
                continue
            offset=script.text.find(str)
            if offset!=-1:
-                seed=int(script.text[offset+len(str):offset+len(str)+1])
+                seed=int(script.text[offset+len(str)+1:offset+len(str)+2])
                break
        if seed==-1:
            error("Variable 'aleatoire' not found")
            return False
-        self.browser.select_form(nr=0)
+        self.browser.select_form(
            predicate=lambda x: x.attrs.get('id','')=='formAuthenticate')
        self.browser.form.set_all_readonly(False)
-        self.browser['agenceId'] = base64.b64encode(self.myXOR(agency,seed))
+        self.browser['agenceId'] = agency
-        self.browser['compteId'] = base64.b64encode(self.myXOR(login,seed))
+        self.browser['compteId'] = login
-        self.browser['postClavier'] = base64.b64encode(self.myXOR(password,seed))
+        self.browser['postClavierXor'] = base64.b64encode(self.myXOR(password,seed))
        try:
            self.browser.submit()
        except BrowserUnavailable:
@ -104,7 +111,6 @@ class LoginPage(BasePage):
            return False
        return True
 class LoginResultPage(BasePage):
    def is_error(self):
        for text in self.document.find('body').itertext():
            text=text.strip()
@ -112,75 +118,81 @@ class LoginResultPage(BasePage):
            needle='Les données saisies sont incorrectes'
            if text.startswith(needle.decode('utf-8')):
                return True
        return False
 class FramePage(BasePage):
    pass
 class AccountsPage(BasePage):
    def get_list(self):
        l = []
-        for div in self.document.getiterator('div'):
+        for a in self.document.getiterator('a'):
-            if div.attrib.get('class')=="unCompte-CA" or\
+            link=a.attrib.get('href')
-            div.attrib.get('class')=="unCompte-CC" or\
+            if link is not None and link.startswith("/outil/UWLM/ListeMouvements"):
            div.attrib.get('class')=="unCompte-CD" or\
            div.attrib.get('class')=="unCompte-CE":
                #CA=> ? maybe Assurance-vie
                #CC=> Compte Courant
                #CD=> Compte Dépôt
                #CE=> Compte d'Epargne
                account = Account()
-                account.type=div.attrib.get('class')[-2:]
+                account.link_id=link
-                account.id = div.attrib.get('id').replace('-','')
+                parameters=link.split("?").pop().split("&")
-                for td in div.getiterator('td'):
+                for parameter in parameters:
-                    if td.find("div") is not None and td.find("div").attrib.get('class') == 'libelleCompte':
+                    list=parameter.split("=")
-                        account.label = td.find("div").text
+                    value=list.pop()
-                    elif td.find('a') is not None and td.find('a').attrib.get('class') is None:
+                    name=list.pop()
-                        balance = td.find('a').text.replace(u"\u00A0",'').replace('.','').replace('+','').replace(',','.')
+                    if name=="agence":
-                        account.balance = float(balance)
+                        account.id=value
-                        account.link_id = td.find('a').attrib.get('href')
+                    elif name=="compte":
-
+                        account.id+=value
                    elif name=="nature":
                        account.type=value
                account.label=a.getparent().getprevious().text.strip()
                balance=a.text.replace(u"\u00A0",'').replace(' ','').replace('.','').replace('+','').replace(',','.')
                account.balance=float(balance)
                l.append(account)
        return l
 class AccountHistoryPage(BasePage):
-    def get_specific_operations(self,tableHeaderPrefixes,debitColumns,creditColumns):
+    def get_operations(self,account):
        operations = []
-        for td in self.document.iter('td'):
+        tables=self.document.findall("//table[@class='tagTab pyjama']")
-            text=td.findtext("b")
+        table=None
-            if text is None:
+        for i in range(len(tables)):
            # Look for the relevant table in the Pro version
            header=tables[i].getprevious()
            while str(header.tag)=="<built-in function Comment>":
                header=header.getprevious()
            header=header.find("div")
            if header is not None:
                header=header.find("span")
            if header is not None and \
               header.text.strip().startswith("Opérations effectuées".decode('utf-8')):
                table=tables[i]
                break;
            # Look for the relevant table in the Particulier version
            header=tables[i].find("thead").find("tr").find("th[@class='titleTab titleTableft']")
            if header is not None and\
               header.text.strip().startswith("Solde au"):
                table=tables[i]
                break;
        for tr in table.iter('tr'):
            # skip headers and empty rows
            if len(tr.findall("th"))!=0 or\
               len(tr.findall("td"))==0:
                continue
            for i in range(len(tableHeaderPrefixes)):
                if text.startswith(tableHeaderPrefixes[i].decode('utf-8')):
                    tbody=td.getparent().getparent()
                    for tr in tbody.iter('tr'):
                        tr_class=tr.attrib.get('class')
                        if tr_class == 'tbl1' or tr_class=='tbl2':
                            tds=tr.findall('td')
                            d=date(*reversed([int(x) for x in tds[0].text.split('/')]))
                            label=u''+tds[1].find('a').text.strip()
                            if tds[debitColumns[i]].text.strip() != u"":
                                amount = - float(tds[debitColumns[i]].text.strip().replace('.','').replace(',','.').replace(u"\u00A0",'').replace(' ',''))
                            else:
                                amount= float(tds[creditColumns[i]].text.strip().replace('.','').replace(',','.').replace(u"\u00A0",'').replace(' ',''))
            operation=Operation(len(operations))
-                            operation.date=d
+            mntColumn=0
-                            operation.label=label
+            for td in tr.iter('td'):
                value=td.attrib.get('id')
                if value is None:
                    value=td.attrib.get('class');
                if value.startswith("date"):
                    operation.date=date(*reversed([int(x) for x in td.text.split('/')]))
                elif value.startswith("lib") or value.startswith("opLib"):
                    # misclosed A tag requires to grab text from td
                    operation.label=u''.join([txt.strip() for txt in td.itertext()])
                elif value.startswith("solde") or value.startswith("mnt"):
                    mntColumn+=1
                    if td.text.strip() != "":
                        amount = float(td.text.strip().replace('.','').replace(',','.').replace(u"\u00A0",'').replace(' ',''))
                        if value.startswith("soldeDeb") or mntColumn==1:
                            amount=-amount
                        operation.amount=amount
            operations.append(operation)
        return operations
    def get_operations(self,account):
        if account.type=="CA":
            return [] # Not supported: page example required
        elif account.type=="CC":
            return self.get_specific_operations(['Opérations effectuées'],[3],[4])
        elif account.type=="CD":
            return self.get_specific_operations(['Solde au'],[2],[3])
        elif account.type=="CE":
            return self.get_specific_operations(['Solde au'],[2],[3])