11# Versioned directories (used with config.get_dir_path())
22versions :
33 osm_data : " 20260416"
4- model_output : " 20260315 "
4+ model_output : " 20260416_by_leisure "
55 snapshot_osm : " 20260416"
6- snapshot_overture : " 20260416 "
6+ snapshot_overture : " 20260417 "
77 snapshot_foursquare : " 20260416"
88 aws : " 20260416"
9- conflation : " 20260416 "
9+ conflation : " 20260417 "
1010
1111# Settings for downloading data
1212download :
@@ -48,29 +48,53 @@ download:
4848 chunk_size : 100_000
4949 max_area_nodes : 1_000
5050 verbose : true
51- filter_keys : ['shop', 'healthcare', 'leisure', 'amenity']
51+ filter_keys : ['shop', 'healthcare', 'leisure', 'amenity', 'tourism', 'office', 'craft', 'historic' ]
5252 extract_keys : [
5353 ' addr:city' ,'addr:country','addr:housename','addr:housenumber','addr:postcode',
5454 ' addr:state' ,'addr:street','addr:unit','amenity','atm','bar','bicycle',
5555 ' bicycle_parking' ,'brand','brand:wikidata','building','check_date',
56- ' check_date:opening_hours' ,'cuisine','description','education','email',
56+ ' check_date:opening_hours' ,'craft',' cuisine','description','education','email',
5757 ' emergency' ,'fountain','geometry','healthcare','healthcare:speciality','historic',
58- ' image' ,'landuse','leisure','name','nursery','official_name','old_name',
58+ ' image' ,'landuse','leisure','name','nursery','office',' official_name','old_name',
5959 ' opening_date' ,'opening_hours','osm_id','osm_type','phone','playground','preschool',
60- ' recycling_type' ,'self_service','service','shelter','shop','short_name',
60+ ' recycling_type' ,'religion',' self_service','service','shelter','shop','short_name',
6161 ' social_facility' ,'social_facility:for','source','sport','tourism','type','url',
6262 ' website' ,'wikidata','wikipedia'
6363 ]
6464 overture :
6565 release_date : null # null = auto-detect latest
6666 s3_bucket : " overturemaps-us-west-2"
6767 s3_region : " us-west-2"
68- taxonomy_l0_categories :
69- - food_and_drink
70- - shopping
71- - arts_and_entertainment
72- - sports_and_recreation
73- - health_care
68+ # (L0, L1) allowlist. L1 = null means "all of this L0".
69+ # Entries intentionally exclude office/B2B-style L1s (corporate offices,
70+ # media services, etc.), transit/parking/airports (covered elsewhere), and
71+ # private lodging (Airbnb-style — duplicates residential addresses).
72+ taxonomy_allowlist :
73+ - [food_and_drink, null]
74+ - [shopping, null]
75+ - [arts_and_entertainment, null]
76+ - [sports_and_recreation, null]
77+ - [health_care, null]
78+ - [lodging, null]
79+ - [cultural_and_historic, null]
80+ - [education, null]
81+ - [lifestyle_services, personal_or_beauty_service]
82+ - [lifestyle_services, wellness_service]
83+ - [lifestyle_services, animal_or_pet_service]
84+ - [lifestyle_services, beauty_service]
85+ - [lifestyle_services, food_service]
86+ - [services_and_business, financial_service]
87+ - [services_and_business, legal_service]
88+ - [services_and_business, professional_service]
89+ - [services_and_business, real_estate_service]
90+ - [services_and_business, home_service]
91+ - [community_and_government, social_or_community_service]
92+ - [community_and_government, government_office]
93+ - [community_and_government, civic_organization]
94+ - [community_and_government, public_facility]
95+ - [community_and_government, public_safety_service]
96+ - [travel_and_transportation, fueling_station]
97+ - [travel_and_transportation, vehicle_service]
7498 foursquare :
7599 release_date : null # null = auto-detect latest
76100 catalog_uri : " https://catalog.h3-hub.foursquare.com/iceberg"
@@ -95,14 +119,14 @@ osm_data:
95119 - last_obs_timestamp
96120 - last_tag_timestamp
97121 apply_model :
98- model_stub : ' 20260315 '
122+ model_stub : ' 20260416 '
99123
100124# Settings for exploratory/models/pytorch_simple.py
101125osm_turnover_model :
102- model_type : constant
126+ model_type : random_by_type
103127 tag_key : name
104128 var_prior : [-1.0, 5.0]
105- group_key : null
129+ group_key : leisure_last_value
106130 group_values : null
107131 min_value_count : 5
108132 n_draws : 250
0 commit comments