You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
Copy file name to clipboardExpand all lines: examples/dropbox/dropbox_spec_ccf_downele.yaml
+10-10Lines changed: 10 additions & 10 deletions
Original file line number
Diff line number
Diff line change
@@ -7,10 +7,10 @@ target_tz_label: PST
7
7
8
8
9
9
data:
10
-
- name: ccf_ele
10
+
- name: ccf_elev
11
11
skip: False
12
12
collect:
13
-
file_pattern: "CC_Water_Levels_2024*.csv"
13
+
file_pattern: "CC_Water_Levels_2025*.csv"
14
14
wildcard: time_overlap # time_sharded | time_overlap | data | none.
15
15
# If time_sharded, indicates non-overlapping timestamps that uses year chunking.
16
16
# If time_overlap, indicates wildcards are ordered by date, e.g. 20250531 (lexicographic order must equal chronological order)
@@ -20,14 +20,14 @@ data:
20
20
recursive_search: False
21
21
reader: read_ts # Names, pointers to code etc. To be fleshed out
22
22
reader_args:
23
-
names: ["datetime", "up_ele","down_ele"]
23
+
names: ["datetime", "up_elev","down_elev"]
24
24
na_values: ["(null)", "null", "NULL", ""]
25
25
hint: "resort"
26
26
force_regular: False
27
27
merge_method: "ts_splice"  # We will not call read_ts on the wildcard, but rather glob, read, and create a list of dfs
28
28
merge_args:
29
29
transition: prefer_first
30
-
selector: down_ele# Usually a column name. When read_last_resort_csv is used, use null.
30
+
selector: down_elev  # Usually a column name. When read_last_resort_csv is used, use null.
31
31
transforms:
32
32
- name: dst_tz # SCADA is delivered local time. Often this is not needed from better data sources
33
33
args:
@@ -42,13 +42,12 @@ data:
42
42
heartbeat_freq: 60min
43
43
metadata:
44
44
station_id: clc
45
-
structure_id: ccfb
46
-
agency_id: ccfb
45
+
agency_id: clc
47
46
processor: dms
48
47
agency: dwr
49
48
source: dwr
50
49
freq: None # None for irregular, "infer" for infer.
51
-
param: elevation
50
+
param: elev
52
51
unit: ft
53
52
subloc: down
54
53
time_zone: ${target_tz}
@@ -58,16 +57,17 @@ data:
58
57
# seems like this prevails, but we should prevent conflicts.
59
58
60
59
output:
60
+
# repo_data_dir: ${modeling_data}/repo/continuous/proprietary/formatted # This is a practice directory so you don't go overwriting a real repo while developing the recipe
61
+
# When omitted the target location is the repo_root as configured in dstore_config.yaml
61
62
repo_name: proprietary_formatted # This is a pointer to an entry in dstore_config.yaml
62
63
staging: # This is where the read and transformed time series will be staged.
63
64
# It will be used to update the repo, but that uses update_repo and may not mean a full replacement
repo_data_dir: ${modeling_data}/repo/continuous/proprietary/formatted # This is a practice directory so you don't go overwriting a real repo while developing the recipe
70
-
# When omitted the target location is the repo_root as configured in dstore_config.yaml
70
+
71
71
prefer: staged # This is an argument to the update process:
72
72
# - staged means "prefer the new stuff we staged"
73
73
# - repo means "prefer the stuff in the repo, just top off with any new time stamps"
Copy file name to clipboardExpand all lines: examples/dropbox/dropbox_spec_ccf_upele.yaml
+10-10Lines changed: 10 additions & 10 deletions
Original file line number
Diff line number
Diff line change
@@ -7,10 +7,10 @@ target_tz_label: PST
7
7
8
8
9
9
data:
10
-
- name: ccf_ele
10
+
- name: ccf_elev
11
11
skip: False
12
12
collect:
13
-
file_pattern: "CC_Water_Levels_2024*.csv"
13
+
file_pattern: "CC_Water_Levels_2025*.csv"
14
14
wildcard: time_overlap # time_sharded | time_overlap | data | none.
15
15
# If time_sharded, indicates non-overlapping timestamps that uses year chunking.
16
16
# If time_overlap, indicates wildcards are ordered by date, e.g. 20250531 (lexicographic order must equal chronological order)
@@ -20,14 +20,14 @@ data:
20
20
recursive_search: False
21
21
reader: read_ts # Names, pointers to code etc. To be fleshed out
22
22
reader_args:
23
-
names: ["datetime", "up_ele", "down_ele"]
23
+
names: ["datetime", "up_elev", "down_elev"]
24
24
na_values: ["(null)", "null", "NULL", ""]
25
25
hint: "resort"
26
26
force_regular: False
27
27
merge_method: "ts_splice"  # We will not call read_ts on the wildcard, but rather glob, read, and create a list of dfs
28
28
merge_args:
29
29
transition: prefer_first
30
-
selector: up_ele# Usually a column name. When read_last_resort_csv is used, use null.
30
+
selector: up_elev  # Usually a column name. When read_last_resort_csv is used, use null.
31
31
transforms:
32
32
- name: dst_tz # SCADA is delivered local time. Often this is not needed from better data sources
33
33
args:
@@ -42,13 +42,12 @@ data:
42
42
heartbeat_freq: 60min
43
43
metadata:
44
44
station_id: clc
45
-
structure_id: ccfb
46
-
agency_id: ccfb
45
+
agency_id: clc
47
46
processor: dms
48
47
agency: dwr
49
48
source: dwr
50
49
freq: None # None for irregular, "infer" for infer.
51
-
param: elevation
50
+
param: elev
52
51
unit: ft
53
52
subloc: up
54
53
time_zone: ${target_tz}
@@ -59,15 +58,16 @@ data:
59
58
60
59
output:
61
60
repo_name: proprietary_formatted # This is a pointer to an entry in dstore_config.yaml
61
+
# repo_data_dir: ${modeling_data}/repo/continuous/proprietary/formatted # This is a practice directory so you don't go overwriting a real repo while developing the recipe
62
+
# When omitted the target location is the repo_root as configured in dstore_config.yaml
62
63
staging: # This is where the read and transformed time series will be staged.
63
64
# It will be used to update the repo, but that uses update_repo and may not mean a full replacement
repo_data_dir: ${modeling_data}/repo/continuous/proprietary/formatted # This is a practice directory so you don't go overwriting a real repo while developing the recipe
70
-
# When omitted the target location is the repo_root as configured in dstore_config.yaml
70
+
71
71
prefer: staged # This is an argument to the update process:
72
72
# - staged means "prefer the new stuff we staged"
73
73
# - repo means "prefer the stuff in the repo, just top off with any new time stamps"
0 commit comments