Cache data sources

This commit is contained in:
Andras Schmelczer 2026-01-25 21:08:01 +00:00
parent 77c9a40dbf
commit 8c74f0a0bc
3 changed files with 11 additions and 3 deletions

View file

@@ -95,6 +95,10 @@ def convert_to_parquet(csv_path: Path, parquet_path: Path) -> None:
def main() -> None:
if PARQUET_PATH.exists():
print(f"Parquet already exists at {PARQUET_PATH}, skipping")
return
if not CSV_PATH.exists():
download_with_progress(URL, CSV_PATH)
else: