Stop doing manual caching

This commit is contained in:
Andras Schmelczer 2026-01-31 10:18:31 +00:00
parent 5c39f31283
commit 0cea9b873c
6 changed files with 82 additions and 191 deletions

View file

@@ -4,31 +4,29 @@ DATA_DIR = Path("./data_sources")
# Local file locations, both resolved relative to DATA_DIR.
GB_PBF_FILE = DATA_DIR.joinpath("great-britain-latest.osm.pbf")
OUTPUT_FILE = DATA_DIR.joinpath("uk_pois.parquet")

# NOTE(review): the consumers of these two tunables are not visible here —
# presumably a processing batch size and a minimum frequency threshold; confirm.
# The spelling "OCCURENCE" is kept as-is because other modules may import it.
BATCH_SIZE = 50_000
MIN_OCCURENCE_COUNT = 20

# Geofabrik download URL for the Great Britain OSM extract.
GEOFABRIK_GB_URL = "https://download.geofabrik.de/europe/great-britain-latest.osm.pbf"

# UK bounding box (west, south, east, north) — used for way centroid filtering
UK_BBOX_WEST, UK_BBOX_SOUTH, UK_BBOX_EAST, UK_BBOX_NORTH = -7.57, 49.96, 1.68, 58.64
# OSM tag keys that indicate a POI. Any element with one of these keys is kept,
# regardless of the specific value. When multiple keys match, their values are
# concatenated with " / ".
#
# Each key must appear exactly once: a repeated key adds nothing to the match
# set and risks the same value being concatenated more than once.
POI_TAG_KEYS: list[str] = [
    "amenity",
    "shop",
    "leisure",
    "tourism",
    "railway",
    "aeroway",
    "highway",
    "public_transport",
    "station",
    "building",
    "military",
    "craft",
    "emergency",
    "healthcare",
    "office",
]