ferrocarrilcentral/check.py

180 lines
5 KiB
Python
Executable file

#!/usr/bin/python3
import configparser
import json
import logging
import smtplib
import sys
from datetime import date
from email.mime.text import MIMEText
from pathlib import Path
import lxml.html
import requests
# Spanish months with corresponding numbers (1-12)
spanish_months = {
"enero": 1,
"febrero": 2,
"marzo": 3,
"abril": 4,
"mayo": 5,
"junio": 6,
"julio": 7,
"agosto": 8,
"septiembre": 9,
"octubre": 10,
"noviembre": 11,
"diciembre": 12,
}
# Paths
CONFIG_DIR = Path.home() / ".config" / "ferrocarril"
CONFIG_FILE = CONFIG_DIR / "config"
DATA_DIR = Path.home() / "lib" / "data"
DATA_FILE = DATA_DIR / "ferrocarril_dates.json"
URL = "https://ferrocarrilcentral.com.pe/appfcca/"
# Configure logging
logger = logging.getLogger("FerrocarrilMonitor")
logger.setLevel(logging.INFO)
# Handler for stdout
handler = logging.StreamHandler(sys.stdout)
formatter = logging.Formatter("%(levelname)s: %(message)s")
handler.setFormatter(formatter)
# Only log INFO when in TTY, always log ERROR
if sys.stdout.isatty():
logger.addHandler(handler)
else:
handler.setLevel(logging.ERROR)
logger.addHandler(handler)
def parse_dates(html_content: str) -> list[date]:
doc = lxml.html.fromstring(html_content)
dates = []
for tour in doc.xpath('//div[contains(@class, "tourdate")]'):
try:
day = int(tour.xpath('.//div[contains(@class, "day")]')[0].text.strip())
yeardate = tour.xpath('.//div[contains(@class, "yeardate")]')[0]
month_str = (
yeardate.xpath('.//div[contains(@class, "month")]')[0]
.text.strip()
.lower()
)
year = int(
yeardate.xpath('.//div[contains(@class, "year")]')[0].text.strip()
)
month = spanish_months.get(month_str)
if month is None:
raise ValueError(f"Unknown month: {month_str}")
dates.append(date(year, month, day))
except (IndexError, ValueError) as e:
logger.error(f"Error parsing date: {e}")
continue
return dates
def load_previous_dates() -> set[str]:
"""Load previously seen dates from file, return as set of ISO strings."""
if DATA_FILE.exists():
with open(DATA_FILE, "r") as f:
return set(json.load(f))
return set()
def save_dates(dates: list[date]) -> None:
"""Save current dates to file as ISO strings."""
DATA_DIR.mkdir(parents=True, exist_ok=True)
with open(DATA_FILE, "w") as f:
json.dump([d.isoformat() for d in dates], f)
def load_config() -> configparser.ConfigParser:
"""Load email configuration from INI file."""
if not CONFIG_FILE.exists():
raise FileNotFoundError(
f"Config file not found at {CONFIG_FILE}. Please create it with SMTP details."
)
config = configparser.ConfigParser()
config.read(CONFIG_FILE)
if "mail" not in config:
raise ValueError(f"Config file {CONFIG_FILE} must have an [mail] section")
return config
def send_email(new_dates: list[date], config: configparser.ConfigParser) -> None:
"""Send email with new dates."""
email_config = config["mail"]
subject = "New Ferrocarril Central Dates Available!"
body = (
"New dates found:\n"
+ "\n".join(d.strftime("%d %B %Y") for d in new_dates)
+ f"\n\n{URL}"
)
msg = MIMEText(body)
msg["Subject"] = subject
msg["From"] = email_config["from_address"]
msg["To"] = email_config["to_address"]
try:
with smtplib.SMTP(email_config["smtp_host"]) as server:
server.send_message(msg)
logger.info("Email sent successfully")
except Exception as e:
logger.error(f"Failed to send email: {e}")
raise # Re-raise to prevent saving dates if email fails
def main() -> None:
# Ensure directories exist
CONFIG_DIR.mkdir(parents=True, exist_ok=True)
DATA_DIR.mkdir(parents=True, exist_ok=True)
# Fetch webpage
try:
response = requests.get(URL, timeout=10)
response.raise_for_status()
html_content = response.text
except requests.RequestException as e:
logger.error(f"Failed to fetch webpage: {e}")
return
# Parse current dates
current_dates = set(parse_dates(html_content))
if not current_dates:
logger.info("No dates found on webpage")
return
# Load previous dates
previous_dates = load_previous_dates()
# Check for new dates
new_dates = [d for d in current_dates if d.isoformat() not in previous_dates]
if new_dates:
logger.info(f"New dates found: {new_dates}")
try:
config = load_config()
send_email(new_dates, config)
save_dates(
list(current_dates)
) # Update stored dates only if email succeeds
except FileNotFoundError as e:
logger.error(str(e))
except Exception as e:
logger.error(f"Error in processing: {e}")
else:
logger.info("No new dates found")
if __name__ == "__main__":
main()