New backend: mediawiki.
Features working: - get_content() - push_content() - get_content_preview() TODO: - log_content() - check for encoding problems
This commit is contained in:
parent
cbe44de033
commit
179d6ec75e
3 changed files with 239 additions and 0 deletions
21
weboob/backends/mediawiki/__init__.py
Normal file
21
weboob/backends/mediawiki/__init__.py
Normal file
|
|
@ -0,0 +1,21 @@
|
|||
# -*- coding: utf-8 -*-
|
||||
|
||||
# Copyright(C) 2011 Clément Schreiner
|
||||
#
|
||||
# This program is free software; you can redistribute it and/or modify
|
||||
# it under the terms of the GNU General Public License as published by
|
||||
# the Free Software Foundation, version 3 of the License.
|
||||
#
|
||||
# This program is distributed in the hope that it will be useful,
|
||||
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
# GNU General Public License for more details.
|
||||
#
|
||||
# You should have received a copy of the GNU General Public License
|
||||
# along with this program; if not, write to the Free Software
|
||||
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
|
||||
|
||||
|
||||
from .backend import MediawikiBackend
|
||||
|
||||
__all__ = ['MediawikiBackend']
|
||||
64
weboob/backends/mediawiki/backend.py
Normal file
64
weboob/backends/mediawiki/backend.py
Normal file
|
|
@ -0,0 +1,64 @@
|
|||
# -*- coding: utf-8 -*-
|
||||
|
||||
# Copyright(C) 2011 Clément Schreiner
|
||||
#
|
||||
# This program is free software; you can redistribute it and/or modify
|
||||
# it under the terms of the GNU General Public License as published by
|
||||
# the Free Software Foundation, version 3 of the License.
|
||||
#
|
||||
# This program is distributed in the hope that it will be useful,
|
||||
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
# GNU General Public License for more details.
|
||||
#
|
||||
# You should have received a copy of the GNU General Public License
|
||||
# along with this program; if not, write to the Free Software
|
||||
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
|
||||
|
||||
from weboob.tools.backend import BaseBackend
|
||||
from weboob.capabilities.content import ICapContent, Content
|
||||
from weboob.tools.value import ValuesDict, Value
|
||||
|
||||
|
||||
from .browser import MediawikiBrowser
|
||||
|
||||
|
||||
__all__ = ['MediawikiBackend']
|
||||
|
||||
class MediawikiBackend(BaseBackend, ICapContent):
|
||||
NAME = 'mediawiki'
|
||||
MAINTAINER = 'Clément Schreiner'
|
||||
EMAIL = '0.6'
|
||||
LICENSE = 'GPLv3'
|
||||
DESCRIPTION = 'Mediawiki wiki software application'
|
||||
CONFIG = ValuesDict(Value('url', label='URL of the Mediawiki website'),
|
||||
Value('apiurl', label='URL of the Mediawiki website\'s API'),
|
||||
Value('username', label='Login'),
|
||||
Value('password', label='Password', masked=True))
|
||||
|
||||
BROWSER = MediawikiBrowser
|
||||
def create_default_browser(self):
|
||||
return self.create_browser(self.config['url'], self.config['apiurl'], self.config['username'], self.config['password'])
|
||||
|
||||
def get_content(self, _id):
|
||||
_id = _id.replace(' ', '_').encode('utf-8')
|
||||
content = Content(_id)
|
||||
page = _id
|
||||
with self.browser:
|
||||
data = self.browser.get_wiki_source(page)
|
||||
|
||||
content.content = data
|
||||
return content
|
||||
|
||||
def log_content(self, id):
|
||||
raise NotImplementedError()
|
||||
|
||||
|
||||
def push_content(self, content, message=None, minor=False):
|
||||
self.browser.set_wiki_source(content, message, minor)
|
||||
|
||||
def get_content_preview(self, content):
|
||||
return self.browser.get_wiki_preview(content)
|
||||
|
||||
|
||||
|
||||
154
weboob/backends/mediawiki/browser.py
Normal file
154
weboob/backends/mediawiki/browser.py
Normal file
|
|
@ -0,0 +1,154 @@
|
|||
# -*- coding: utf-8 -*-
|
||||
|
||||
# Copyright(C) 2011 Clément Schreiner
|
||||
#
|
||||
# This program is free software; you can redistribute it and/or modify
|
||||
# it under the terms of the GNU General Public License as published by
|
||||
# the Free Software Foundation, version 3 of the License.
|
||||
#
|
||||
# This program is distributed in the hope that it will be useful,
|
||||
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
# GNU General Public License for more details.
|
||||
#
|
||||
# You should have received a copy of the GNU General Public License
|
||||
# along with this program; if not, write to the Free Software
|
||||
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
|
||||
|
||||
from urlparse import urlsplit
|
||||
import urllib
|
||||
import lxml.html
|
||||
|
||||
from weboob.tools.browser import BaseBrowser
|
||||
|
||||
try:
|
||||
import simplejson
|
||||
except ImportError:
|
||||
# Python 2.6+ has a module similar to simplejson
|
||||
import json as simplejson
|
||||
|
||||
__all__ = ['MediawikiBrowser']
|
||||
|
||||
|
||||
# Browser
|
||||
class MediawikiBrowser(BaseBrowser):
|
||||
ENCODING = 'utf-8'
|
||||
|
||||
def __init__(self, url, apiurl, *args, **kwargs):
|
||||
url_parsed = urlsplit(url)
|
||||
self.PROTOCOL = url_parsed.scheme
|
||||
self.DOMAIN = url_parsed.netloc
|
||||
self.BASEPATH = url_parsed.path
|
||||
if self.BASEPATH.endswith('/'):
|
||||
self.BASEPATH = self.BASEPATH[:-1]
|
||||
|
||||
prefix = '%s://%s%s' % (self.PROTOCOL, self.DOMAIN, self.BASEPATH)
|
||||
self.apiurl = apiurl
|
||||
|
||||
BaseBrowser.__init__(self, *args, **kwargs)
|
||||
|
||||
def get_wiki_source(self, page):
|
||||
assert isinstance(self.apiurl, basestring)
|
||||
|
||||
data = {'action': 'query',
|
||||
'prop': 'revisions|info',
|
||||
'titles': page,
|
||||
'rvprop': 'content|timestamp',
|
||||
'rvlimit': '1',
|
||||
'intoken': 'edit',
|
||||
}
|
||||
|
||||
|
||||
|
||||
result = self.API_get(data)
|
||||
pageid = result['query']['pages'].keys()[0]
|
||||
if pageid == "-1":
|
||||
return None
|
||||
return result['query']['pages'][str(pageid)]['revisions'][0]['*']
|
||||
|
||||
def get_token(self, page, _type):
|
||||
if not self.is_logged():
|
||||
self.login()
|
||||
|
||||
data = {'action': 'query',
|
||||
'prop': 'info',
|
||||
'titles': page.encode,
|
||||
'intoken': _type,
|
||||
}
|
||||
result = self.API_get(data)
|
||||
pageid = result['query']['pages'].keys()[0]
|
||||
if pageid == "-1":
|
||||
return None
|
||||
return result['query']['pages'][str(pageid)][_type+'token']
|
||||
|
||||
|
||||
def set_wiki_source(self, content, message=None, minor=False):
|
||||
if not self.is_logged():
|
||||
self.login()
|
||||
|
||||
page = content.id
|
||||
token = self.get_token(page, 'edit')
|
||||
|
||||
data = {'action': 'edit',
|
||||
'title': page,
|
||||
'token': token,
|
||||
'text': content.content.encode('utf-8'),
|
||||
'summary': message,
|
||||
}
|
||||
if minor:
|
||||
data['minor'] = 'true'
|
||||
|
||||
result = self.API_post(data)
|
||||
print result
|
||||
|
||||
def get_wiki_preview(self, content, message=None):
|
||||
data = {'action': 'parse',
|
||||
'title': content.id,
|
||||
'text': content.content.encode('utf-8'),
|
||||
'summary': message,
|
||||
}
|
||||
result = self.API_post(data)
|
||||
return result['parse']['text']['*']
|
||||
|
||||
|
||||
|
||||
def is_logged(self):
|
||||
data = {'action': 'query',
|
||||
'meta': 'userinfo',
|
||||
}
|
||||
result = self.API_get(data)
|
||||
return result['query']['userinfo']['id'] != 0
|
||||
|
||||
def login(self):
|
||||
assert isinstance(self.username, basestring)
|
||||
assert isinstance(self.password, basestring)
|
||||
assert isinstance(self.apiurl, basestring)
|
||||
|
||||
data = {'action': 'login',
|
||||
'lgname': self.username,
|
||||
'lgpassword': self.password,
|
||||
}
|
||||
result = self.API_post(data)
|
||||
if result['login']['result'] == 'WrongPass':
|
||||
raise BrowserIncorrectPassword
|
||||
|
||||
if result['login']['result'] == 'NeedToken':
|
||||
data['lgtoken'] = result['login']['token']
|
||||
result2 = self.API_post(data)
|
||||
|
||||
def home(self):
|
||||
'''We don't need to change location, we're using the JSON API here.'''
|
||||
pass
|
||||
|
||||
def API_get(self, data):
|
||||
'''Submit a GET request to the website
|
||||
The JSON data is parsed and returned as a dictionary'''
|
||||
data['format'] = 'json'
|
||||
return simplejson.load(self.openurl(self.buildurl(self.apiurl, **data)), 'utf-8')
|
||||
|
||||
def API_post(self, data):
|
||||
'''Submit a POST request to the website
|
||||
The JSON data is parsed and returned as a dictionary'''
|
||||
|
||||
data['format'] = 'json'
|
||||
return simplejson.load(self.openurl(self.apiurl, urllib.urlencode(data)), 'utf-8')
|
||||
Loading…
Add table
Add a link
Reference in a new issue