Add geosure data

This commit is contained in:
Andras Schmelczer 2026-02-07 13:22:57 +00:00
parent c715475351
commit c91561d7fe
4 changed files with 216 additions and 1 deletions

View file

@ -13,7 +13,7 @@ vars:
WIDE_OUTPUT: "{{.DATA_DIR}}/wide.parquet"
EPC: "{{.DATA_DIR}}/certificates.csv"
JOURNEY_TIMES_BANK: "{{.DATA_DIR}}/journey_times_bank.parquet"
JOURNEY_TIMES_FITZROVIA: "{{.DATA_DIR}}/journey_times_fitzrovia_checkpoint.parquet"
JOURNEY_TIMES_FITZROVIA: "{{.DATA_DIR}}/journey_times_fitzrovia.parquet"
ETHNICITY_OUTPUT: "{{.DATA_DIR}}/ethnicity_by_la.parquet"
CRIME_DIR: "{{.DATA_DIR}}/crime"
CRIME_OUTPUT: "{{.DATA_DIR}}/crime_by_lsoa.parquet"
@ -23,6 +23,8 @@ vars:
BROADBAND_OUTPUT: "{{.DATA_DIR}}/broadband.parquet"
SCHOOL_PROXIMITY_OUTPUT: "{{.DATA_DIR}}/school_proximity.parquet"
POSTCODES_OUTPUT: "{{.DATA_DIR}}/postcodes"
GEOSURE_OUTPUT: "{{.DATA_DIR}}/geosure"
GEOSURE_PARQUET: "{{.DATA_DIR}}/geosure.parquet"
tasks:
download:tiles:
@ -141,6 +143,13 @@ tasks:
cmds:
- uv run python -m pipeline.download.postcodes --output {{.POSTCODES_OUTPUT}}
# Fetches the OS GeoSure dataset into the GEOSURE_OUTPUT directory.
download:geosure:
  desc: Download OS GeoSure ground stability data (5km hex grid)
  # Up-to-date check: succeeds once the output directory exists.
  status:
    - test -d {{.GEOSURE_OUTPUT}}
  cmds:
    # Folded scalar: the lines below are joined with single spaces into one command.
    - >-
      uv run python -m pipeline.download.geosure
      --output {{.GEOSURE_OUTPUT}}
download:noise:
desc: Download Defra noise data (road, rail, airport) sampled at postcode centroids
deps:
@ -197,6 +206,16 @@ tasks:
cmds:
- uv run python -m pipeline.transform.school_proximity --ofsted {{.OFSTED_OUTPUT}} --arcgis {{.ARCGIS_OUTPUT}} --output {{.SCHOOL_PROXIMITY_OUTPUT}}
# Joins the downloaded GeoSure data with the ArcGIS download and writes GEOSURE_PARQUET.
transform:geosure:
  desc: Spatial-join GeoSure ground stability data to postcode centroids
  # Both download tasks are declared as dependencies of this transform.
  deps:
    - download:geosure
    - download:arcgis
  # Up-to-date check: succeeds once the parquet output file exists.
  status:
    - test -f {{.GEOSURE_PARQUET}}
  cmds:
    # Folded scalar: the lines below are joined with single spaces into one command.
    - >-
      uv run python -m pipeline.transform.transform_geosure
      --geosure {{.GEOSURE_OUTPUT}}
      --arcgis {{.ARCGIS_OUTPUT}}
      --output {{.GEOSURE_PARQUET}}
download:journey-times:
desc: "Fetch TfL journey times: task download:journey-times"
deps:
@ -218,6 +237,7 @@ tasks:
# - transform:crime
# - transform:poi-proximity
# - transform:school-proximity
# - transform:geosure
# - prompt:journey-times
status:
- test -f {{.WIDE_OUTPUT}}
@ -235,4 +255,5 @@ tasks:
--noise {{.NOISE_OUTPUT}}
--school-proximity {{.SCHOOL_PROXIMITY_OUTPUT}}
--broadband {{.BROADBAND_OUTPUT}}
--geosure {{.GEOSURE_PARQUET}}
--output {{.WIDE_OUTPUT}}