X-Git-Url: https://projects.mako.cc/source/wikipedia-api-cdsw/blobdiff_plain/4f9f564e2fac44ff1330a1d4d5bb4c7424791306..f17f0a3f63dd03d70cdc693da0bda53a1e85671b:/wikipedia-raw2.py diff --git a/wikipedia-raw2.py b/wikipedia-raw2.py index c7eca1b..a8efd34 100644 --- a/wikipedia-raw2.py +++ b/wikipedia-raw2.py @@ -1,6 +1,5 @@ import time -import simplejson as json -from urllib2 import urlopen +import requests url_base = 'https://en.wikipedia.org/w/api.php?action=query&prop=revisions&titles=%s&rvlimit=100&rvprop=timestamp|user&format=json' @@ -8,15 +7,14 @@ pages = ["Benjamin_Mako_Hill", "Python", "Data_science"] for page_title in pages: - wp_call = urlopen(url_base % page_title) - response = json.loads(wp_call.read()) + wp_call = requests.get(url_base % page_title) + response = wp_call.json() for page_id in response["query"]["pages"].keys(): page_title = response["query"]["pages"][page_id]["title"] revisions = response["query"]["pages"][page_id]["revisions"] for rev in revisions: - print page_title + "\t" + rev["user"] + "\t" + rev["timestamp"] - + print(page_title + "\t" + rev["user"] + "\t" + rev["timestamp"]) time.sleep(3)