67 lines
1.5 KiB
Python
67 lines
1.5 KiB
Python
import requests
|
|
import json
|
|
|
|
# Wikidata API endpoint (api.php); api_get() sends its GET requests to this URL.
wd_api_url = "https://www.wikidata.org/w/api.php"
|
|
|
|
|
|
def api_get(params, *, timeout=30):
    """Send a GET request to the API endpoint stored in ``wd_api_url``.

    ``format=json`` and ``formatversion=2`` are sent by default; entries in
    *params* that use the same keys take precedence over these defaults.

    Args:
        params: Mapping of query-string parameters for this call.
        timeout: Value passed to ``requests.get`` as ``timeout`` (seconds).
            Without a timeout ``requests`` waits indefinitely on a server
            that stops responding, so a finite default is used. Pass
            ``None`` to wait without limit.

    Returns:
        The ``requests.Response`` returned by ``requests.get``. The body is
        not parsed and the HTTP status is not checked here.

    Raises:
        requests.exceptions.Timeout: If the server does not respond within
            *timeout*.
    """
    base_params = {
        "format": "json",
        "formatversion": 2,
    }
    return requests.get(
        wd_api_url,
        params={**base_params, **params},
        timeout=timeout,
    )
|
|
|
|
|
|
def get_revision_timestamp(revid):
    """Return the timestamp the API reports for revision *revid*.

    Args:
        revid: Revision ID. It is sent as the ``revids`` parameter and
            converted with ``int()`` for comparison with the response.

    Returns:
        The ``timestamp`` field of the first revision of the first page in
        the query response, exactly as returned by the API.

    Raises:
        AssertionError: If the revision in the response is not *revid*.
        KeyError, IndexError: If the response does not contain the expected
            ``query`` / ``pages`` / ``revisions`` structure.
    """
    params = {
        "action": "query",
        "prop": "revisions",
        "revids": revid,
        "rvprop": "ids|timestamp",
    }
    reply = api_get(params)
    rev = reply.json()["query"]["pages"][0]["revisions"][0]

    # Raised explicitly instead of using an ``assert`` statement so the check
    # still runs under ``python -O``; the exception type is unchanged.
    if rev["revid"] != int(revid):
        raise AssertionError(
            "requested revision {!r} but the API returned {!r}".format(
                revid, rev["revid"]
            )
        )
    return rev["timestamp"]
|
|
|
|
|
|
def get_recent_changes(**kwargs):
    """Query the ``recentchanges`` list for namespace 0, oldest first.

    Keyword arguments are merged into the request parameters and may add to
    or override the defaults below. Arguments whose value is falsy (``None``,
    ``""``, ``0``, ...) are ignored, so the corresponding default is kept.

    Returns:
        Whatever ``api_get`` returns for the assembled parameters (the
        response is not parsed here).
    """
    rcprop = "|".join(
        (
            "title",
            "ids",
            "comment",
            "parsedcomment",
            "timestamp",
            "redirect",
            "loginfo",
        )
    )

    query = dict(
        action="query",
        list="recentchanges",
        rcnamespace=0,
        rclimit="max",
        rcdir="newer",
        rcprop=rcprop,
    )
    # Only truthy overrides are applied; falsy ones leave the defaults alone.
    query.update((key, value) for key, value in kwargs.items() if value)

    return api_get(query)
|
|
|
|
|
|
def get_entity(qid):
    """Fetch a single entity via ``wbgetentities`` and return its record.

    Args:
        qid: Entity ID, sent as the ``ids`` parameter and used as the key
            into the response's ``entities`` mapping.

    Returns:
        The value stored under *qid* in the response's ``entities`` mapping.

    Raises:
        KeyError: If the response has no ``entities`` key (the full response
            is printed as indented JSON first) or has no entry for *qid*.
    """
    response = api_get({"action": "wbgetentities", "ids": qid})
    payload = response.json()

    # Dump the unexpected payload for diagnosis; the lookup below then fails.
    if "entities" not in payload:
        print(json.dumps(payload, indent=2))

    entities = payload["entities"]
    return entities[qid]
|
|
|
|
|
|
def get_entities(ids):
    """Yield ``(id, entity)`` pairs for the given entity IDs.

    The IDs are joined with ``|`` and requested in a single ``wbgetentities``
    call. This is a generator, so the request is not sent until iteration
    starts.

    Args:
        ids: Iterable of entity ID strings.

    Yields:
        Each ``(key, value)`` pair of the response's ``entities`` mapping.
    """
    joined_ids = "|".join(ids)
    response = api_get({"action": "wbgetentities", "ids": joined_ids})
    yield from response.json()["entities"].items()
|