Generate Eurostar timetable URLs from station IDs
This commit is contained in:
parent
f75c1e2db3
commit
945d028c13
3 changed files with 40 additions and 24 deletions
2
app.py
2
app.py
|
|
@ -115,7 +115,7 @@ def results(slug, travel_date):
|
||||||
next_date = (dt + timedelta(days=1)).isoformat()
|
next_date = (dt + timedelta(days=1)).isoformat()
|
||||||
travel_date_display = dt.strftime('%A %-d %B %Y')
|
travel_date_display = dt.strftime('%A %-d %B %Y')
|
||||||
|
|
||||||
eurostar_url = eurostar_scraper.ROUTE_URLS[destination] + f"?date={travel_date}"
|
eurostar_url = eurostar_scraper.timetable_url(destination) + f"?date={travel_date}"
|
||||||
rtt_url = RTT_PADDINGTON_URL.format(date=travel_date)
|
rtt_url = RTT_PADDINGTON_URL.format(date=travel_date)
|
||||||
|
|
||||||
return render_template(
|
return render_template(
|
||||||
|
|
|
||||||
|
|
@ -22,30 +22,32 @@ DEFAULT_UA = (
|
||||||
"(KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36"
|
"(KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36"
|
||||||
)
|
)
|
||||||
|
|
||||||
ROUTE_URLS = {
|
ORIGIN_STATION_ID = '7015400'
|
||||||
'Paris Gare du Nord': (
|
ORIGIN_STATION_SLUG = 'london-st-pancras-intl'
|
||||||
'https://www.eurostar.com/uk-en/travel-info/timetable/'
|
TIMETABLE_BASE_URL = 'https://www.eurostar.com/uk-en/travel-info/timetable'
|
||||||
'7015400/8727100/london-st-pancras-intl/paris-gare-du-nord'
|
|
||||||
),
|
DESTINATION_STATION_IDS = {
|
||||||
'Brussels Midi': (
|
'Paris Gare du Nord': '8727100',
|
||||||
'https://www.eurostar.com/uk-en/travel-info/timetable/'
|
'Brussels Midi': '8814001',
|
||||||
'7015400/8814001/london-st-pancras-intl/brussels-midi'
|
'Lille Europe': '8722326',
|
||||||
),
|
'Amsterdam Centraal': '8400058',
|
||||||
'Lille Europe': (
|
'Rotterdam Centraal': '8400530',
|
||||||
'https://www.eurostar.com/uk-en/travel-info/timetable/'
|
|
||||||
'7015400/8722326/london-st-pancras-intl/lille-europe'
|
|
||||||
),
|
|
||||||
'Amsterdam Centraal': (
|
|
||||||
'https://www.eurostar.com/uk-en/travel-info/timetable/'
|
|
||||||
'7015400/8400058/london-st-pancras-intl/amsterdam-centraal'
|
|
||||||
),
|
|
||||||
'Rotterdam Centraal': (
|
|
||||||
'https://www.eurostar.com/uk-en/travel-info/timetable/'
|
|
||||||
'7015400/8400530/london-st-pancras-intl/rotterdam-centraal'
|
|
||||||
),
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
def _slugify_station_name(name: str) -> str:
|
||||||
|
return re.sub(r'[^a-z0-9]+', '-', name.lower()).strip('-')
|
||||||
|
|
||||||
|
|
||||||
|
def timetable_url(destination: str) -> str:
    """Build the Eurostar timetable page URL for a destination station.

    The URL has the form
    ``<TIMETABLE_BASE_URL>/<origin id>/<destination id>/<origin slug>/<destination slug>``
    where the origin values come from ``ORIGIN_STATION_ID`` and
    ``ORIGIN_STATION_SLUG`` and the destination slug is derived from the
    destination's display name.

    Args:
        destination: Station display name; must be a key of
            ``DESTINATION_STATION_IDS``.

    Returns:
        The timetable URL, without any query string.

    Raises:
        KeyError: If ``destination`` has no entry in
            ``DESTINATION_STATION_IDS``.
    """
    # The ID lookup is listed before the slug so that an unknown destination
    # raises KeyError before any slugifying is attempted.
    segments = (
        TIMETABLE_BASE_URL,
        ORIGIN_STATION_ID,
        DESTINATION_STATION_IDS[destination],
        ORIGIN_STATION_SLUG,
        _slugify_station_name(destination),
    )
    return '/'.join(segments)
|
||||||
|
|
||||||
|
|
||||||
def _hhmm(dt_str: str | None) -> str | None:
|
def _hhmm(dt_str: str | None) -> str | None:
|
||||||
"""'2026-03-30 09:34:00' → '09:34'"""
|
"""'2026-03-30 09:34:00' → '09:34'"""
|
||||||
if not dt_str:
|
if not dt_str:
|
||||||
|
|
@ -78,7 +80,7 @@ def _parse(html: str, destination: str) -> list[dict]:
|
||||||
|
|
||||||
def fetch(destination: str, travel_date: str,
|
def fetch(destination: str, travel_date: str,
|
||||||
user_agent: str = DEFAULT_UA) -> list[dict]:
|
user_agent: str = DEFAULT_UA) -> list[dict]:
|
||||||
url = ROUTE_URLS[destination]
|
url = timetable_url(destination)
|
||||||
headers = {
|
headers = {
|
||||||
'User-Agent': user_agent,
|
'User-Agent': user_agent,
|
||||||
'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
|
'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
|
||||||
|
|
|
||||||
|
|
@ -1,6 +1,6 @@
|
||||||
import json
|
import json
|
||||||
import pytest
|
import pytest
|
||||||
from scraper.eurostar import _hhmm, _parse
|
from scraper.eurostar import _hhmm, _parse, timetable_url
|
||||||
|
|
||||||
|
|
||||||
# ---------------------------------------------------------------------------
|
# ---------------------------------------------------------------------------
|
||||||
|
|
@ -80,3 +80,17 @@ def test_parse_no_next_data_returns_empty():
|
||||||
def test_parse_empty_departures():
|
def test_parse_empty_departures():
|
||||||
html = _make_next_data([])
|
html = _make_next_data([])
|
||||||
assert _parse(html, 'Paris Gare du Nord') == []
|
assert _parse(html, 'Paris Gare du Nord') == []
|
||||||
|
|
||||||
|
|
||||||
|
def test_timetable_url_uses_station_id_table():
    """The Paris URL carries the station ID 8727100 and the derived slug."""
    expected_url = (
        'https://www.eurostar.com/uk-en/travel-info/timetable/'
        '7015400/8727100/london-st-pancras-intl/paris-gare-du-nord'
    )
    assert timetable_url('Paris Gare du Nord') == expected_url
|
||||||
|
|
||||||
|
|
||||||
|
def test_timetable_url_slugifies_destination_name():
    """The destination display name appears lowercased and hyphenated."""
    expected_url = (
        'https://www.eurostar.com/uk-en/travel-info/timetable/'
        '7015400/8400530/london-st-pancras-intl/rotterdam-centraal'
    )
    assert timetable_url('Rotterdam Centraal') == expected_url
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue