49 lines
1.2 KiB
Python
49 lines
1.2 KiB
Python
|
"""Interface with the mediawiki API."""
|
||
|
|
||
|
from typing import Any
|
||
|
|
||
|
import requests
|
||
|
|
||
|
wiki_hostname = "en.wikipedia.org"
|
||
|
wiki_api_php = f"https://{wiki_hostname}/w/api.php"
|
||
|
user_agent = "dab-mechanic/0.1"
|
||
|
|
||
|
|
||
|
def parse_page(enwiki: str) -> dict[str, Any]:
|
||
|
"""Call mediawiki parse API for given article."""
|
||
|
params: dict[str, str | int] = {
|
||
|
"action": "parse",
|
||
|
"format": "json",
|
||
|
"formatversion": 2,
|
||
|
"disableeditsection": 1,
|
||
|
"page": enwiki,
|
||
|
"prop": "text|links|headhtml",
|
||
|
"disabletoc": 1,
|
||
|
}
|
||
|
|
||
|
parse: dict[str, Any] = get(params)["parse"]
|
||
|
return parse
|
||
|
|
||
|
|
||
|
def get(params: dict[str, str | int]) -> dict[str, Any]:
|
||
|
"""Make GET request to mediawiki API."""
|
||
|
data: dict[str, Any] = requests.get(
|
||
|
wiki_api_php, headers={"User-Agent": user_agent}, params=params
|
||
|
).json()
|
||
|
return data
|
||
|
|
||
|
|
||
|
def get_content(title: str) -> str:
|
||
|
"""Get article text."""
|
||
|
params: dict[str, str | int] = {
|
||
|
"action": "query",
|
||
|
"format": "json",
|
||
|
"formatversion": 2,
|
||
|
"prop": "revisions|info",
|
||
|
"rvprop": "content|timestamp",
|
||
|
"titles": title,
|
||
|
}
|
||
|
data = get(params)
|
||
|
rev: str = data["query"]["pages"][0]["revisions"][0]["content"]
|
||
|
return rev
|