From 8c74f0a0bc645e25844b6245bd1b2c9db9a0f3a7 Mon Sep 17 00:00:00 2001
From: Andras Schmelczer
Date: Sun, 25 Jan 2026 21:08:01 +0000
Subject: [PATCH] Cache data sources

---
 download_arcgis_data.py   | 4 ++++
 download_land_registry.py | 4 ++++
 generate_tfl_client.py    | 6 +++---
 3 files changed, 11 insertions(+), 3 deletions(-)

diff --git a/download_arcgis_data.py b/download_arcgis_data.py
index 1e2d249..8cccc56 100644
--- a/download_arcgis_data.py
+++ b/download_arcgis_data.py
@@ -101,6 +101,10 @@ def convert_to_parquet(data_path: Path, parquet_path: Path) -> None:
 
 
 def main() -> None:
+    if PARQUET_PATH.exists():
+        print(f"Parquet already exists at {PARQUET_PATH}, skipping")
+        return
+
     if not DOWNLOAD_PATH.exists():
         download_with_progress(URL, DOWNLOAD_PATH)
     else:
diff --git a/download_land_registry.py b/download_land_registry.py
index c421bab..6172eae 100644
--- a/download_land_registry.py
+++ b/download_land_registry.py
@@ -95,6 +95,10 @@ def convert_to_parquet(csv_path: Path, parquet_path: Path) -> None:
 
 
 def main() -> None:
+    if PARQUET_PATH.exists():
+        print(f"Parquet already exists at {PARQUET_PATH}, skipping")
+        return
+
     if not CSV_PATH.exists():
         download_with_progress(URL, CSV_PATH)
     else:
diff --git a/generate_tfl_client.py b/generate_tfl_client.py
index c6eb9ad..d52e073 100644
--- a/generate_tfl_client.py
+++ b/generate_tfl_client.py
@@ -20,10 +20,10 @@ def main() -> None:
     if not OPENAPI_SPEC.exists():
         raise FileNotFoundError(f"OpenAPI spec not found: {OPENAPI_SPEC}")
 
-    # Remove existing client if present
+    # Skip if client already exists
     if OUTPUT_PATH.exists():
-        print(f"Removing existing client at {OUTPUT_PATH}")
-        shutil.rmtree(OUTPUT_PATH)
+        print(f"TfL client already exists at {OUTPUT_PATH}, skipping")
+        return
 
     # Generate the client
     print(f"Generating client from {OPENAPI_SPEC}")