refactor: centralize timeout constants in scrapers/timeouts.py

Problem: each scraper defined its own HTTP timeout constant under an
inconsistent name (`TIMEOUT_S`, `TIMEOUT_SECONDS`) and value (15s vs
30s), and browser timeouts were scattered across the code as magic
numbers (60000, 15000, 5000, 500).

Solution: introduce `scrapers/timeouts.py` with named constants for
HTTP requests, browser session/navigation/element/turnstile/settle
timeouts, and submission polling. All six scrapers now import from
the shared module.
Author: Barrett Ruth
Date:   2026-03-05 01:35:40 -05:00
Parent: f4055b071b
Commit: 2cdde85d36
7 changed files with 58 additions and 37 deletions

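Only one of the seven changed files (the Kattis scraper) is reproduced
in the diff below. For orientation, the new module might look roughly
like the sketch that follows; only `HTTP_TIMEOUT` appears in the diff,
so every other name and value here is an assumption inferred from the
commit message and the magic numbers it cites.

# scrapers/timeouts.py -- hypothetical sketch, not the committed file.

# HTTP requests (seconds, passed straight to httpx).
HTTP_TIMEOUT = 15.0  # assumed unified value; the old scrapers used 15s or 30s

# Browser automation (milliseconds, the usual unit for browser drivers).
BROWSER_SESSION_TIMEOUT_MS = 60_000  # hypothetical name
BROWSER_NAV_TIMEOUT_MS = 15_000      # hypothetical name
BROWSER_ELEMENT_TIMEOUT_MS = 5_000   # hypothetical name
BROWSER_SETTLE_TIMEOUT_MS = 500      # hypothetical name
TURNSTILE_TIMEOUT_MS = 30_000        # hypothetical name and value

# Submission polling (hypothetical names and values).
SUBMISSION_POLL_INTERVAL_S = 1.0
SUBMISSION_POLL_TIMEOUT_S = 60.0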

@@ -10,6 +10,7 @@ from datetime import datetime
 import httpx
 
 from .base import BaseScraper
+from .timeouts import HTTP_TIMEOUT
 from .models import (
     ContestListResult,
     ContestSummary,
@@ -23,7 +24,6 @@ BASE_URL = "https://open.kattis.com"
 HEADERS = {
     "User-Agent": "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36"
 }
-TIMEOUT_S = 15.0
 CONNECTIONS = 8
 
 TIME_RE = re.compile(
@@ -37,13 +37,13 @@ MEM_RE = re.compile(
 )
 
 
 async def _fetch_text(client: httpx.AsyncClient, url: str) -> str:
-    r = await client.get(url, headers=HEADERS, timeout=TIMEOUT_S)
+    r = await client.get(url, headers=HEADERS, timeout=HTTP_TIMEOUT)
     r.raise_for_status()
     return r.text
 
 
 async def _fetch_bytes(client: httpx.AsyncClient, url: str) -> bytes:
-    r = await client.get(url, headers=HEADERS, timeout=TIMEOUT_S)
+    r = await client.get(url, headers=HEADERS, timeout=HTTP_TIMEOUT)
     r.raise_for_status()
     return r.content
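
The browser-side constants don't appear in this file. Assuming the
browser scrapers drive a Playwright-style API, where `goto()` and
`wait_for_selector()` accept a millisecond `timeout` keyword, the
hypothetical constants sketched above would be consumed roughly like
this:

# Hypothetical usage sketch -- the automation library and the constant
# names are assumptions, not part of this commit.
from playwright.async_api import async_playwright

from scrapers.timeouts import (
    BROWSER_ELEMENT_TIMEOUT_MS,  # hypothetical name
    BROWSER_NAV_TIMEOUT_MS,      # hypothetical name
)


async def fetch_rendered(url: str) -> str:
    async with async_playwright() as p:
        browser = await p.chromium.launch()
        page = await browser.new_page()
        # Named constants replace the former magic numbers.
        await page.goto(url, timeout=BROWSER_NAV_TIMEOUT_MS)
        await page.wait_for_selector("main", timeout=BROWSER_ELEMENT_TIMEOUT_MS)
        html = await page.content()
        await browser.close()
        return html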