Rename the weboob.tools.parser module to weboob.tools.parsers (one submodule per parser), and add get_parsers() with preference_order
This commit is contained in:
parent
54cc3b0a4a
commit
8638024756
13 changed files with 104 additions and 70 deletions
|
|
@ -22,7 +22,7 @@ import time
|
|||
from logging import warning
|
||||
|
||||
from weboob.tools.browser import BaseBrowser
|
||||
from weboob.tools.parser import Html5libParser
|
||||
from weboob.tools.parsers.html5libparser import Html5libParser
|
||||
|
||||
from weboob.backends.aum.exceptions import AdopteWait
|
||||
|
||||
|
|
|
|||
|
|
@ -21,7 +21,7 @@ Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
|
|||
from cStringIO import StringIO
|
||||
|
||||
from weboob.tools.browser import BaseBrowser, BrowserIncorrectPassword
|
||||
from weboob.tools.parser import ElementTidyParser
|
||||
from weboob.tools.parsers.elementtidyparser import ElementTidyParser
|
||||
from weboob.backends.bnporc import pages
|
||||
|
||||
# Parser
|
||||
|
|
|
|||
|
|
@ -26,15 +26,15 @@ from .pages.index import IndexPage, LoginPage
|
|||
from .pages.news import ContentPage
|
||||
from .tools import id2url, id2threadid, id2contenttype
|
||||
|
||||
from weboob.tools.parser import StandardParser
|
||||
from weboob.tools.parsers.htmlparser import HTMLParser
|
||||
|
||||
# Parser
|
||||
class DLFParser(StandardParser):
|
||||
class DLFParser(HTMLParser):
|
||||
def parse(self, data, encoding):
|
||||
s = data.read()
|
||||
s = s.replace('<<', '<')
|
||||
data = StringIO(s)
|
||||
return StandardParser.parse(self, data, encoding)
|
||||
return HTMLParser.parse(self, data, encoding)
|
||||
|
||||
# Browser
|
||||
class DLFP(BaseBrowser):
|
||||
|
|
|
|||
|
|
@ -22,15 +22,10 @@ from logging import error
|
|||
import re
|
||||
|
||||
from weboob.tools.browser import BaseBrowser
|
||||
from weboob.tools.parser import LxmlHtmlParser
|
||||
|
||||
class YoujizzBrowser(BaseBrowser):
|
||||
video_file_regex = re.compile(r'"(http://media[^ ,]+\.flv)"')
|
||||
|
||||
def __init__(self, *args, **kwargs):
|
||||
kwargs['parser'] = LxmlHtmlParser()
|
||||
Browser.__init__(self, *args, **kwargs)
|
||||
|
||||
def iter_page_urls(self, mozaic_url):
|
||||
raise NotImplementedError()
|
||||
|
||||
|
|
|
|||
|
|
@ -21,7 +21,7 @@ Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
|
|||
import re
|
||||
|
||||
from weboob.tools.browser import BaseBrowser
|
||||
from weboob.tools.parser import LxmlHtmlParser
|
||||
from weboob.tools.parsers.lxmlhtmlparser import LxmlHtmlParser
|
||||
|
||||
from .pages import VideoPage
|
||||
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue