@@ -3,26 +3,25 @@ variable_mappings: variable_mappings.csv
33variable_definitions : variables.csv
44sublocations : station_subloc.csv
55ncro_inventory : ncro_inventory_full.csv
6-
76daily_data_manifest : daily_data_manifest.csv
87daily_dropbox_spec : daily_dropbox.yaml
9-
108file_deletion_list : non_15_min_files_checked.txt
119compare_excepts_formatted : compare_excepts_formatted.txt
1210des_rationalize_time_spec : des_rationalize_cfg.yaml
13-
1411repo_base : " //cnrastore-bdo/Modeling_Data/repo"
15-
16- default_repo : screened
17-
1812spot_check_spec : spot_check_spec.yaml
1913
20- # registry files available to repos
14+ # Repository info
15+ default_repo : screened
2116
2217
18+ # Aliases for registry files that repos can reference in their "registry" entry.
19+ # These files will be looked for in the dbase_config directory and are expected to be csv files.
20+ # The registry files provide supplementary metadata that can be used for provider resolution,
21+ # geographical and other purposes.
2322registries :
2423 continuous : station_dbase.csv
25- processed : processed_series .csv
24+ processed_synthetic : processed_registry .csv
2625 structures : structures_registry.csv
2726 daily : station_dbase.csv
2827
@@ -31,15 +30,10 @@ repos:
3130 formatted :
3231 root : " //cnrastore-bdo/Modeling_Data/repo/continuous/formatted"
3332
34- # Registry providing supplementary metadata (e.g., agency, location)
35- registry : continuous
36-
37- # Primary identifier for a site (station, structure, etc.). This will be a key for the registry
38- # and is always part of filename templates, usually in the second slot
39- # Examples: structure_id or station_id
40- site_key : station_id
41-
42- # Depending on settings for the repo, multiple sources (e.g., ncro, cdec) may supply the same series
33+ # Registry providing supplementary metadata (e.g., agency, location) for stations
34+ registry : continuous # this is an alias set up above for station_dbase.csv.
35+
36+ # Depending on settings for the repo, multiple sources (e.g., ncro, cdec) may supply the same time series.
4337 # For instance, Bacon Island conductance is observed by NCRO but distributed both by NCRO (QA/QC'd data on Water Data Library)
4438 # and on CDEC (realtime, not QA/QC). This field, in this case {source}, appears in the filename template
4539 # (typically first slot) and drives globbing and merge order.
8882 screened :
8983 root : " //cnrastore-bdo/Modeling_Data/repo/continuous/screened"
9084 registry : continuous
91- site_key : station_id
9285 # Screened data is assumed to be grouped according to the original agency/program that manages the station,
9386 # so whereas in formatted you might have both "ncro" and "cdec" sources for a station, here they will be unified under ncro.
9487 provider_key : agency
@@ -102,8 +95,8 @@ repos:
10295
10396 processed :
10497 root : " //cnrastore-bdo/Modeling_Data/repo/continuous/processed"
105- registry : processed
106- site_key : station_id
98+ registry : [continuous, processed_synthetic]
99+
107100 provider_key : processor
108101 provider_resolution_mode : assume_unique # This may have to be adjusted for cases like SF harmonic tides where there is a noaa and dwr version
109102 filename_templates :
@@ -113,23 +106,21 @@ repos:
113106 - " {processor}_{station_id@subloc}_{param}_{year}.csv"
114107 - " {processor}_{station_id@subloc}_{param}.csv"
115108 file_key : [processor, station_id, subloc, param, modifier, shard]
116- data_key : [station_id , subloc, param, modifier]
109+ data_key : [processor , subloc, param, modifier]
117110
118111 structures_formatted :
119112 root : " //cnrastore-bdo/Modeling_Data/repo/structures/formatted"
120113 registry : structures
121- site_key : structure_id
122114 provider_key : processor
123115 provider_resolution_mode : assume_unique
124116 filename_templates :
125- - " {processor}_{structure_id @subloc}_{param@modifier}.csv"
126- - " {processor}_{structure_id @subloc}_{param@modifier}_{year}.csv"
117+ - " {processor}_{station_id @subloc}_{param@modifier}.csv"
118+ - " {processor}_{station_id @subloc}_{param@modifier}_{year}.csv"
127119
128120
129121 daily_formatted :
130122 root : " //cnrastore-bdo/Modeling_Data/repo/daily/formatted"
131123 registry : continuous # aliases the station data base that provides supplementary metadata like geolocation and agency
132- site_key : station_id # registry and template use this term for the site's identifier (was "key")
133124 provider_key : source # provider is the agency mainly involved in delivering the data.
134125 # Generic for "source" (datamart), "agency" (collecting agency) and
135126# # "processor" (group synthesizing, manipulating or filling data)
0 commit comments