dab-mechanic/dab_mechanic/mediawiki_api.py

46 lines
1.2 KiB
Python
Raw Normal View History

2022-08-17 14:38:30 +01:00
"""Interface with the mediawiki API."""
from typing import Any
from . import wikidata_oauth
2022-08-17 14:38:30 +01:00
wiki_hostname = "en.wikipedia.org"
wiki_api_php = f"https://{wiki_hostname}/w/api.php"
user_agent = "dab-mechanic/0.1"
def parse_page(enwiki: str) -> dict[str, Any]:
"""Call mediawiki parse API for given article."""
params: dict[str, str | int] = {
"action": "parse",
"format": "json",
"formatversion": 2,
"disableeditsection": 1,
"page": enwiki,
"prop": "text|links|headhtml",
"disabletoc": 1,
}
parse: dict[str, Any] = call(params)["parse"]
2022-08-17 14:38:30 +01:00
return parse
def call(params: dict[str, str | int]) -> dict[str, Any]:
2022-08-17 14:38:30 +01:00
"""Make GET request to mediawiki API."""
data: dict[str, Any] = wikidata_oauth.api_post_request(params)
return data.json()
2022-08-17 14:38:30 +01:00
def get_content(title: str) -> str:
"""Get article text."""
params: dict[str, str | int] = {
"action": "query",
"format": "json",
"formatversion": 2,
"prop": "revisions|info",
"rvprop": "content|timestamp",
"titles": title,
}
data = call(params)
2022-08-17 14:38:30 +01:00
rev: str = data["query"]["pages"][0]["revisions"][0]["content"]
return rev