1 # python-simplemediawiki - Extremely low-level wrapper to the MediaWiki API
2 # Copyright (C) 2010 Red Hat, Inc.
4 # This library is free software; you can redistribute it and/or modify it under
5 # the terms of the GNU Lesser General Public License as published by the Free
6 # Software Foundation; either version 2.1 of the License, or (at your option)
9 # This library is distributed in the hope that it will be useful, but WITHOUT
10 # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
11 # FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more
14 # You should have received a copy of the GNU General Public License along with
15 # this program. If not, see <http://www.gnu.org/licenses/>.
18 simplemediawiki is an extremely low-level wrapper to the MediaWiki API. It
19 automatically handles cookies and gzip compression so that you can make basic
20 calls to the API in the easiest way possible. It also provides a few functions
21 to make day-to-day API access easier.
23 To use this module, instantiate a MediaWiki object, passing it the URL of
24 api.php for the wiki you want to work with. Calls go through MediaWiki.call().
25 A generic login wrapper as well as functions to determine limits and get a list
26 of namespaces are provided for your convenience.
28 >>> from simplemediawiki import MediaWiki
29 >>> wiki = MediaWiki('http://en.wikipedia.org/w/api.php')
30 >>> wiki.call({'action': 'query', 'prop': 'revisions', 'titles': 'Main Page'})
31 {u'query': {u'pages': {...}}}
36 from iso8601 import iso8601
38 from StringIO import StringIO
45 Class to represent a MediaWiki installation with an enabled API.
47 api_url: URL to api.php (usually similar to http://example.com/w/api.php)
51 _psuedo_namespaces = None
def __init__(self, api_url, cookie_file=None):
    """
    Prepare the cookie jar and the URL opener used for every API request.

    api_url: URL to api.php (usually similar to http://example.com/w/api.php)
    cookie_file: optional path to a Mozilla-format cookie file. When it is
                 omitted, cookies are only kept in memory.
    """
    self._api_url = api_url
    if not cookie_file:
        jar = cookielib.CookieJar()
    else:
        jar = cookielib.MozillaCookieJar(cookie_file)
        # NOTE(review): the load/save fallback below was restored from the
        # lines missing between the two jar assignments -- confirm against
        # the canonical file.
        try:
            jar.load()
        except IOError:
            # The file could not be read: write the (empty) jar out so the
            # file exists, then load it.
            jar.save()
            jar.load()
    self._cj = jar
    cookie_handler = urllib2.HTTPCookieProcessor(jar)
    self._opener = urllib2.build_opener(cookie_handler)
def call(self, params):
    """
    Make a call to the wiki. Returns a dictionary that represents the JSON
    returned by the API.

    params: dictionary of API parameters. 'format' is always forced to
            'json'. The dictionary passed in is left untouched.
    """
    # Work on a copy so the caller's dictionary does not silently gain a
    # 'format' key.
    query = dict(params)
    query['format'] = 'json'
    # Supplying a request body makes urllib2 send this as a POST.
    request = urllib2.Request(self._api_url, urllib.urlencode(query))
    request.add_header('Accept-encoding', 'gzip')
    response = self._opener.open(request)
    try:
        # File-backed jars are written out after each request.
        if isinstance(self._cj, cookielib.MozillaCookieJar):
            self._cj.save()
        payload = response.read()
        if response.headers.get('Content-Encoding') == 'gzip':
            payload = gzip.GzipFile(fileobj=StringIO(payload)).read()
    finally:
        # Release the connection even if saving cookies or reading fails.
        response.close()
    return json.loads(payload)
def login(self, user, passwd, token=None):
    """
    Convenience function for logging into the wiki. It should never be
    necessary to provide a token argument; it is part of the login process
    since MediaWiki 1.15.3 (see MediaWiki bug 23076).

    Returns True when the API reports 'Success' and False otherwise.
    """
    request = {'action': 'login', 'lgname': user, 'lgpassword': passwd}
    if token:
        request['lgtoken'] = token
    reply = self.call(request)['login']
    outcome = reply['result']
    if outcome == 'Success':
        return True
    if outcome == 'NeedToken' and not token:
        # The wiki handed back a token; retry once with it. A second
        # 'NeedToken' falls through to False because token is now set.
        return self.login(user, passwd, reply['token'])
    return False
def limits(self, low, high):
    """
    Convenience function for determining appropriate limits in the API. If
    the logged in user has the "apihighlimits" right, it will return the
    high argument; otherwise it will return the low argument.

    The rights lookup is made on the first call only; the answer is cached
    in self._high_limits and reused afterwards.
    """
    if self._high_limits is None:
        result = self.call({'action': 'query',
                            'meta': 'userinfo',
                            'uiprop': 'rights'})
        rights = result['query']['userinfo']['rights']
        self._high_limits = 'apihighlimits' in rights
    if self._high_limits:
        return high
    return low
def namespaces(self, psuedo=True):
    """
    Fetches a list of namespaces for this wiki.

    psuedo: when true (the default), the entries held in
            self._psuedo_namespaces are included in the result.

    Returns a new dictionary mapping integer namespace IDs to namespace
    names. The wiki is queried on the first call only; later calls are
    answered from the cached dictionaries.
    """
    if self._namespaces is None:
        result = self.call({'action': 'query',
                            'meta': 'siteinfo',
                            'siprop': 'namespaces'})
        regular = {}
        special = {}
        # NOTE(review): the split on the sign of the ID was restored from
        # lines missing in this view -- confirm against the canonical file.
        for nsid, info in result['query']['namespaces'].items():
            number = int(nsid)
            if number >= 0:
                regular[number] = info['*']
            else:
                special[number] = info['*']
        # Publish the caches only after the whole reply parsed, so a
        # malformed reply cannot leave a half-filled cache behind.
        self._namespaces = regular
        self._psuedo_namespaces = special
    # Always hand back a copy so callers cannot alter the cache.
    retval = dict(self._namespaces)
    if psuedo:
        retval.update(self._psuedo_namespaces)
    return retval
def parse_date(date):
    """
    Converts dates provided by the MediaWiki API into datetime.datetime
    objects.

    date: timestamp string as returned by the API
    """
    # Parsing is delegated entirely to the iso8601 module imported by this file.
    parsed = iso8601.parse_date(date)
    return parsed
# Module metadata: maintainer contact and release version string.
__author__ = 'Ian Weller <ian@ianweller.org>'
__version__ = '1.0.1'