LCL: update to fit web site changes

Update the login process. Secure the login by adding a random value to the URL, as the original web site does. Deal with both the Pro and Particulier versions. Signed-off-by: Pierre Mazière <pierre.maziere@gmail.com>
2012-01-24 23:19:52 +01:00 · 2012-01-24 23:19:52 +01:00 · 8a70c77b80
commit 8a70c77b80
parent 2310e8506f
2 changed files with 89 additions and 77 deletions
--- a/modules/lcl/browser.py
+++ b/modules/lcl/browser.py
@ -20,7 +20,7 @@

 from weboob.tools.browser import BaseBrowser, BrowserIncorrectPassword

-from .pages import LoginPage, LoginResultPage, FramePage, AccountsPage, AccountHistoryPage
+from .pages import SkipPage, LoginPage, AccountsPage, AccountHistoryPage


 __all__ = ['LCLBrowser']
@ -33,11 +33,11 @@ class LCLBrowser(BaseBrowser):
    ENCODING = 'utf-8'
    USER_AGENT = BaseBrowser.USER_AGENTS['wget']
    PAGES = {
-        'https://particuliers.secure.lcl.fr/everest/UWBI/UWBIAccueil\?DEST=PAGEIDENT': LoginPage,
-        'https://particuliers.secure.lcl.fr/everest/UWBI/UWBIAccueil\?DEST=IDENTIFICATION': LoginResultPage,
-        'https://particuliers.secure.lcl.fr/outil/UWSP/Synthese/accesSynthese': AccountsPage,
-        'https://particuliers.secure.lcl.fr/outil/UWB2/Accueil\?DEST=INIT': FramePage,
+        'https://particuliers.secure.lcl.fr/outil/UAUT/Authentication/authenticate': LoginPage,
+        'https://particuliers.secure.lcl.fr/outil/UWSP/Synthese': AccountsPage,
        'https://particuliers.secure.lcl.fr/outil/UWLM/ListeMouvements.*/accesListeMouvements.*': AccountHistoryPage,
+        'https://particuliers.secure.lcl.fr/outil/UAUT/Contrat/selectionnerContrat.*': SkipPage,
+        'https://particuliers.secure.lcl.fr/index.html': SkipPage
        }

    def __init__(self, agency, *args, **kwargs):
@ -55,17 +55,17 @@ class LCLBrowser(BaseBrowser):
        assert self.agency.isdigit()

        if not self.is_on_page(LoginPage):
-            self.location('%s://%s/everest/UWBI/UWBIAccueil?DEST=PAGEIDENT' \
+            self.location('%s://%s/outil/UAUT/Authentication/authenticate' \
                          % (self.PROTOCOL, self.DOMAIN),
                          no_login=True)

        if not self.page.login(self.agency, self.username, self.password) or \
           not self.is_logged() or \
-           (self.is_on_page(LoginResultPage) and self.page.is_error()) :
+           (self.is_on_page(LoginPage) and self.page.is_error()) :
            raise BrowserIncorrectPassword()
-
-        self.location('%s://%s/outil/UWSP/Synthese/accesSynthese' \
-                      % (self.PROTOCOL, self.DOMAIN))
+        self.location('%s://%s/outil/UWSP/Synthese' \
+                      % (self.PROTOCOL, self.DOMAIN),
+                      no_login=True)

    def get_accounts_list(self):
        if not self.is_on_page(AccountsPage):
--- a/modules/lcl/pages.py
+++ b/modules/lcl/pages.py
@ -25,6 +25,8 @@ from weboob.tools.browser import BasePage, BrowserUnavailable
 from weboob.tools.captcha.virtkeyboard import MappedVirtKeyboard, VirtKeyboardError
 from logging import error
 import tempfile
+import math
+import random

 class LCLVirtKeyboard(MappedVirtKeyboard):
    symbols={'0':'9da2724133f2221482013151735f033c',
@ -39,14 +41,16 @@ class LCLVirtKeyboard(MappedVirtKeyboard):
             '9':'cc60e5894a9d8e12ee0c2c104c1d5490'
            }

-    url="/UWBI/UWBIAccueil?DEST=GENERATION_CLAVIER"
+    url="/outil/UAUT/Clavier/creationClavier?random="

    color=(255,255,255,255)

    def __init__(self,basepage):
        img=basepage.document.find("//img[@id='idImageClavier']")
+        random.seed()
+        self.url+="%li"%math.floor(long(random.random()*1000000000000000000000))
        MappedVirtKeyboard.__init__(self,basepage.browser.openurl(self.url),
-                                    basepage.document,img,self.color)
+                                    basepage.document,img,self.color,"id")
        if basepage.browser.responses_dirname is None:
            basepage.browser.responses_dirname = \
                    tempfile.mkdtemp(prefix='weboob_session_')
@ -54,7 +58,7 @@ class LCLVirtKeyboard(MappedVirtKeyboard):

    def get_symbol_code(self,md5sum):
        code=MappedVirtKeyboard.get_symbol_code(self,md5sum)
-        return code[-5:-3]
+        return code[-2:]

    def get_string_code(self,string):
        code=''
@ -62,6 +66,8 @@ class LCLVirtKeyboard(MappedVirtKeyboard):
            code+=self.get_symbol_code(self.symbols[c])
        return code

+class SkipPage(BasePage):
+    pass

 class LoginPage(BasePage):
    def myXOR(self,value,seed):
@ -81,22 +87,23 @@ class LoginPage(BasePage):

        seed=-1
        str="var aleatoire = "
-        for script in self.document.findall("/head/script"):
+        for script in self.document.findall("//script"):
            if(script.text is None or len(script.text)==0):
                continue
            offset=script.text.find(str)
            if offset!=-1:
-                seed=int(script.text[offset+len(str):offset+len(str)+1])
+                seed=int(script.text[offset+len(str)+1:offset+len(str)+2])
                break
        if seed==-1:
            error("Variable 'aleatoire' not found")
            return False

-        self.browser.select_form(nr=0)
+        self.browser.select_form(
+            predicate=lambda x: x.attrs.get('id','')=='formAuthenticate')
        self.browser.form.set_all_readonly(False)
-        self.browser['agenceId'] = base64.b64encode(self.myXOR(agency,seed))
-        self.browser['compteId'] = base64.b64encode(self.myXOR(login,seed))
-        self.browser['postClavier'] = base64.b64encode(self.myXOR(password,seed))
+        self.browser['agenceId'] = agency
+        self.browser['compteId'] = login
+        self.browser['postClavierXor'] = base64.b64encode(self.myXOR(password,seed))
        try:
            self.browser.submit()
        except BrowserUnavailable:
@ -104,7 +111,6 @@ class LoginPage(BasePage):
            return False
        return True

-class LoginResultPage(BasePage):
    def is_error(self):
        for text in self.document.find('body').itertext():
            text=text.strip()
@ -112,75 +118,81 @@ class LoginResultPage(BasePage):
            needle='Les données saisies sont incorrectes'
            if text.startswith(needle.decode('utf-8')):
                return True
-
        return False

-class FramePage(BasePage):
-    pass
-
-
 class AccountsPage(BasePage):
    def get_list(self):
        l = []
-        for div in self.document.getiterator('div'):
-            if div.attrib.get('class')=="unCompte-CA" or\
-            div.attrib.get('class')=="unCompte-CC" or\
-            div.attrib.get('class')=="unCompte-CD" or\
-            div.attrib.get('class')=="unCompte-CE":
-                #CA=> ? maybe Assurance-vie
-                #CC=> Compte Courant
-                #CD=> Compte Dépôt
-                #CE=> Compte d'Epargne
+        for a in self.document.getiterator('a'):
+            link=a.attrib.get('href')
+            if link is not None and link.startswith("/outil/UWLM/ListeMouvements"):
                account = Account()
-                account.type=div.attrib.get('class')[-2:]
-                account.id = div.attrib.get('id').replace('-','')
-                for td in div.getiterator('td'):
-                    if td.find("div") is not None and td.find("div").attrib.get('class') == 'libelleCompte':
-                        account.label = td.find("div").text
-                    elif td.find('a') is not None and td.find('a').attrib.get('class') is None:
-                        balance = td.find('a').text.replace(u"\u00A0",'').replace('.','').replace('+','').replace(',','.')
-                        account.balance = float(balance)
-                        account.link_id = td.find('a').attrib.get('href')
-
+                account.link_id=link
+                parameters=link.split("?").pop().split("&")
+                for parameter in parameters:
+                    list=parameter.split("=")
+                    value=list.pop()
+                    name=list.pop()
+                    if name=="agence":
+                        account.id=value
+                    elif name=="compte":
+                        account.id+=value
+                    elif name=="nature":
+                        account.type=value
+                account.label=a.getparent().getprevious().text.strip()
+                balance=a.text.replace(u"\u00A0",'').replace(' ','').replace('.','').replace('+','').replace(',','.')
+                account.balance=float(balance)
                l.append(account)
-
        return l

 class AccountHistoryPage(BasePage):
-    def get_specific_operations(self,tableHeaderPrefixes,debitColumns,creditColumns):
+    def get_operations(self,account):
        operations = []
-        for td in self.document.iter('td'):
-            text=td.findtext("b")
-            if text is None:
+        tables=self.document.findall("//table[@class='tagTab pyjama']")
+        table=None
+        for i in range(len(tables)):
+            # Look for the relevant table in the Pro version
+            header=tables[i].getprevious()
+            while str(header.tag)=="<built-in function Comment>":
+                header=header.getprevious()
+            header=header.find("div")
+            if header is not None:
+                header=header.find("span")
+            if header is not None and \
+               header.text.strip().startswith("Opérations effectuées".decode('utf-8')):
+                table=tables[i]
+                break;
+            # Look for the relevant table in the Particulier version
+            header=tables[i].find("thead").find("tr").find("th[@class='titleTab titleTableft']")
+            if header is not None and\
+               header.text.strip().startswith("Solde au"):
+                table=tables[i]
+                break;
+
+        for tr in table.iter('tr'):
+            # skip headers and empty rows
+            if len(tr.findall("th"))!=0 or\
+               len(tr.findall("td"))==0:
                continue
-            for i in range(len(tableHeaderPrefixes)):
-                if text.startswith(tableHeaderPrefixes[i].decode('utf-8')):
-                    tbody=td.getparent().getparent()
-                    for tr in tbody.iter('tr'):
-                        tr_class=tr.attrib.get('class')
-                        if tr_class == 'tbl1' or tr_class=='tbl2':
-                            tds=tr.findall('td')
-                            d=date(*reversed([int(x) for x in tds[0].text.split('/')]))
-                            label=u''+tds[1].find('a').text.strip()
-                            if tds[debitColumns[i]].text.strip() != u"":
-                                amount = - float(tds[debitColumns[i]].text.strip().replace('.','').replace(',','.').replace(u"\u00A0",'').replace(' ',''))
-                            else:
-                                amount= float(tds[creditColumns[i]].text.strip().replace('.','').replace(',','.').replace(u"\u00A0",'').replace(' ',''))
-                            operation=Operation(len(operations))
-                            operation.date=d
-                            operation.label=label
-                            operation.amount=amount
-                            operations.append(operation)
+            operation=Operation(len(operations))
+            mntColumn=0
+            for td in tr.iter('td'):
+                value=td.attrib.get('id')
+                if value is None:
+                    value=td.attrib.get('class');
+                if value.startswith("date"):
+                    operation.date=date(*reversed([int(x) for x in td.text.split('/')]))
+                elif value.startswith("lib") or value.startswith("opLib"):
+                    # misclosed A tag requires to grab text from td
+                    operation.label=u''.join([txt.strip() for txt in td.itertext()])
+                elif value.startswith("solde") or value.startswith("mnt"):
+                    mntColumn+=1
+                    if td.text.strip() != "":
+                        amount = float(td.text.strip().replace('.','').replace(',','.').replace(u"\u00A0",'').replace(' ',''))
+                        if value.startswith("soldeDeb") or mntColumn==1:
+                            amount=-amount
+                        operation.amount=amount
+            operations.append(operation)
        return operations

-    def get_operations(self,account):
-        if account.type=="CA":
-            return [] # Not supported: page example required
-        elif account.type=="CC":
-            return self.get_specific_operations(['Opérations effectuées'],[3],[4])
-        elif account.type=="CD":
-            return self.get_specific_operations(['Solde au'],[2],[3])
-        elif account.type=="CE":
-            return self.get_specific_operations(['Solde au'],[2],[3])
-