Skip to content

Commit 16004aa

Browse files
committed
docs: align project documentation and benchmarks with new pipeline architecture
1 parent 840f973 commit 16004aa

9 files changed

Lines changed: 212 additions & 159 deletions

File tree

.vscode/settings.json

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,5 +5,6 @@
55
"python.testing.unittestEnabled": false,
66
"python.testing.pytestEnabled": true,
77
"python-envs.defaultEnvManager": "ms-python.python:conda",
8-
"python-envs.defaultPackageManager": "ms-python.python:conda"
8+
"python-envs.defaultPackageManager": "ms-python.python:conda",
9+
"python.terminal.activateEnvironment": false
910
}

README.md

Lines changed: 53 additions & 39 deletions
Large diffs are not rendered by default.
Lines changed: 130 additions & 110 deletions
Original file line numberDiff line numberDiff line change
@@ -1,111 +1,131 @@
11
view,timestamp,logger,memory,unit
2-
DEFAULT,2026-04-20T14:59:18.784422Z,METRIC_MEM:,429,MB
3-
DEFAULT,2026-04-20T14:59:19.784315Z,METRIC_MEM:,467.35,MB
4-
DEFAULT,2026-04-20T14:59:20.784602Z,METRIC_MEM:,525.09,MB
5-
DEFAULT,2026-04-20T14:59:21.784888Z,METRIC_MEM:,530.13,MB
6-
DEFAULT,2026-04-20T14:59:22.785227Z,METRIC_MEM:,533.62,MB
7-
DEFAULT,2026-04-20T14:59:23.785545Z,METRIC_MEM:,534.02,MB
8-
DEFAULT,2026-04-20T14:59:24.785893Z,METRIC_MEM:,534.46,MB
9-
DEFAULT,2026-04-20T14:59:25.786286Z,METRIC_MEM:,533.57,MB
10-
DEFAULT,2026-04-20T14:59:26.786608Z,METRIC_MEM:,533.07,MB
11-
DEFAULT,2026-04-20T14:59:27.786989Z,METRIC_MEM:,533.24,MB
12-
DEFAULT,2026-04-20T14:59:28.787246Z,METRIC_MEM:,534.23,MB
13-
DEFAULT,2026-04-20T14:59:29.787577Z,METRIC_MEM:,534.72,MB
14-
DEFAULT,2026-04-20T14:59:30.787938Z,METRIC_MEM:,534.72,MB
15-
DEFAULT,2026-04-20T14:59:31.788315Z,METRIC_MEM:,534.96,MB
16-
DEFAULT,2026-04-20T14:59:32.788644Z,METRIC_MEM:,536.2,MB
17-
DEFAULT,2026-04-20T14:59:33.788993Z,METRIC_MEM:,538.16,MB
18-
DEFAULT,2026-04-20T14:59:34.789341Z,METRIC_MEM:,538.66,MB
19-
DEFAULT,2026-04-20T14:59:35.789670Z,METRIC_MEM:,538.66,MB
20-
DEFAULT,2026-04-20T14:59:36.789550Z,METRIC_MEM:,539.64,MB
21-
DEFAULT,2026-04-20T14:59:37.789398Z,METRIC_MEM:,539.64,MB
22-
DEFAULT,2026-04-20T14:59:38.789317Z,METRIC_MEM:,541.61,MB
23-
DEFAULT,2026-04-20T14:59:39.789179Z,METRIC_MEM:,541.61,MB
24-
DEFAULT,2026-04-20T14:59:40.789326Z,METRIC_MEM:,546.59,MB
25-
DEFAULT,2026-04-20T14:59:41.789650Z,METRIC_MEM:,546.59,MB
26-
DEFAULT,2026-04-20T14:59:42.790023Z,METRIC_MEM:,546.59,MB
27-
DEFAULT,2026-04-20T14:59:43.790569Z,METRIC_MEM:,720.57,MB
28-
DEFAULT,2026-04-20T14:59:44.790956Z,METRIC_MEM:,950.8,MB
29-
DEFAULT,2026-04-20T14:59:45.791405Z,METRIC_MEM:,1116.99,MB
30-
DEFAULT,2026-04-20T14:59:46.791919Z,METRIC_MEM:,1334.91,MB
31-
DEFAULT,2026-04-20T14:59:47.792322Z,METRIC_MEM:,1531.51,MB
32-
DEFAULT,2026-04-20T14:59:48.792605Z,METRIC_MEM:,1672.36,MB
33-
DEFAULT,2026-04-20T14:59:49.793038Z,METRIC_MEM:,1945.44,MB
34-
DEFAULT,2026-04-20T14:59:50.796118Z,METRIC_MEM:,2140.77,MB
35-
DEFAULT,2026-04-20T14:59:51.793792Z,METRIC_MEM:,2344.64,MB
36-
DEFAULT,2026-04-20T14:59:52.794297Z,METRIC_MEM:,2603.11,MB
37-
DEFAULT,2026-04-20T14:59:53.795767Z,METRIC_MEM:,2983.83,MB
38-
DEFAULT,2026-04-20T14:59:54.796083Z,METRIC_MEM:,3151.56,MB
39-
DEFAULT,2026-04-20T14:59:55.822665Z,METRIC_MEM:,3624.16,MB
40-
DEFAULT,2026-04-20T14:59:56.818814Z,METRIC_MEM:,3774.27,MB
41-
DEFAULT,2026-04-20T14:59:57.818682Z,METRIC_MEM:,4308.78,MB
42-
DEFAULT,2026-04-20T14:59:58.818511Z,METRIC_MEM:,4809.82,MB
43-
DEFAULT,2026-04-20T14:59:59.821162Z,METRIC_MEM:,5383.96,MB
44-
DEFAULT,2026-04-20T15:00:00.818704Z,METRIC_MEM:,5452.28,MB
45-
DEFAULT,2026-04-20T15:00:01.819104Z,METRIC_MEM:,5468.47,MB
46-
DEFAULT,2026-04-20T15:00:02.819475Z,METRIC_MEM:,5457.18,MB
47-
DEFAULT,2026-04-20T15:00:03.819830Z,METRIC_MEM:,5447.39,MB
48-
DEFAULT,2026-04-20T15:00:04.820259Z,METRIC_MEM:,5465.26,MB
49-
DEFAULT,2026-04-20T15:00:05.820598Z,METRIC_MEM:,5463.11,MB
50-
DEFAULT,2026-04-20T15:00:06.820974Z,METRIC_MEM:,5449.82,MB
51-
DEFAULT,2026-04-20T15:00:07.821433Z,METRIC_MEM:,5462.01,MB
52-
DEFAULT,2026-04-20T15:00:08.821801Z,METRIC_MEM:,5461.89,MB
53-
DEFAULT,2026-04-20T15:00:09.822611Z,METRIC_MEM:,5466.36,MB
54-
DEFAULT,2026-04-20T15:00:10.839283Z,METRIC_MEM:,5462.5,MB
55-
DEFAULT,2026-04-20T15:00:11.826381Z,METRIC_MEM:,5461.91,MB
56-
DEFAULT,2026-04-20T15:00:12.826815Z,METRIC_MEM:,5458.66,MB
57-
DEFAULT,2026-04-20T15:00:13.827094Z,METRIC_MEM:,5472.28,MB
58-
DEFAULT,2026-04-20T15:00:14.830802Z,METRIC_MEM:,5777.54,MB
59-
DEFAULT,2026-04-20T15:00:15.834612Z,METRIC_MEM:,6242.66,MB
60-
DEFAULT,2026-04-20T15:00:16.831243Z,METRIC_MEM:,6952.15,MB
61-
DEFAULT,2026-04-20T15:00:17.832603Z,METRIC_MEM:,7086.52,MB
62-
DEFAULT,2026-04-20T15:00:18.837562Z,METRIC_MEM:,7565.95,MB
63-
DEFAULT,2026-04-20T15:00:19.832365Z,METRIC_MEM:,7538.39,MB
64-
DEFAULT,2026-04-20T15:00:20.837168Z,METRIC_MEM:,7572.7,MB
65-
DEFAULT,2026-04-20T15:00:21.833118Z,METRIC_MEM:,7471.39,MB
66-
DEFAULT,2026-04-20T15:00:22.833394Z,METRIC_MEM:,7300.56,MB
67-
DEFAULT,2026-04-20T15:00:23.834075Z,METRIC_MEM:,7132.16,MB
68-
DEFAULT,2026-04-20T15:00:24.834825Z,METRIC_MEM:,6974.58,MB
69-
DEFAULT,2026-04-20T15:00:25.835584Z,METRIC_MEM:,6812.74,MB
70-
DEFAULT,2026-04-20T15:00:26.836323Z,METRIC_MEM:,6683.75,MB
71-
DEFAULT,2026-04-20T15:00:27.837011Z,METRIC_MEM:,6570.68,MB
72-
DEFAULT,2026-04-20T15:00:28.840331Z,METRIC_MEM:,6553.34,MB
73-
DEFAULT,2026-04-20T15:00:29.842342Z,METRIC_MEM:,6449.74,MB
74-
DEFAULT,2026-04-20T15:00:30.842779Z,METRIC_MEM:,6420.25,MB
75-
DEFAULT,2026-04-20T15:00:31.843102Z,METRIC_MEM:,6447.04,MB
76-
DEFAULT,2026-04-20T15:00:32.846716Z,METRIC_MEM:,6428.24,MB
77-
DEFAULT,2026-04-20T15:00:33.850433Z,METRIC_MEM:,7085.44,MB
78-
DEFAULT,2026-04-20T15:00:34.847560Z,METRIC_MEM:,7094.02,MB
79-
DEFAULT,2026-04-20T15:00:35.847891Z,METRIC_MEM:,7108.24,MB
80-
DEFAULT,2026-04-20T15:00:36.847936Z,METRIC_MEM:,7095.18,MB
81-
DEFAULT,2026-04-20T15:00:37.847913Z,METRIC_MEM:,7092.72,MB
82-
DEFAULT,2026-04-20T15:00:38.847807Z,METRIC_MEM:,7062.34,MB
83-
DEFAULT,2026-04-20T15:00:39.853210Z,METRIC_MEM:,6921.07,MB
84-
DEFAULT,2026-04-20T15:00:40.853684Z,METRIC_MEM:,6909.97,MB
85-
DEFAULT,2026-04-20T15:00:41.854214Z,METRIC_MEM:,6891.98,MB
86-
DEFAULT,2026-04-20T15:00:42.854490Z,METRIC_MEM:,6879.31,MB
87-
DEFAULT,2026-04-20T15:00:43.855020Z,METRIC_MEM:,6877.95,MB
88-
DEFAULT,2026-04-20T15:00:44.855450Z,METRIC_MEM:,6894.8,MB
89-
DEFAULT,2026-04-20T15:00:45.855873Z,METRIC_MEM:,6756.96,MB
90-
DEFAULT,2026-04-20T15:00:46.857784Z,METRIC_MEM:,6485.72,MB
91-
DEFAULT,2026-04-20T15:00:47.856652Z,METRIC_MEM:,6450.91,MB
92-
DEFAULT,2026-04-20T15:00:48.857031Z,METRIC_MEM:,6517.63,MB
93-
DEFAULT,2026-04-20T15:00:49.862250Z,METRIC_MEM:,6513.41,MB
94-
DEFAULT,2026-04-20T15:00:50.857773Z,METRIC_MEM:,6521.28,MB
95-
DEFAULT,2026-04-20T15:00:51.858133Z,METRIC_MEM:,6505.07,MB
96-
DEFAULT,2026-04-20T15:00:52.858414Z,METRIC_MEM:,6429.95,MB
97-
DEFAULT,2026-04-20T15:00:53.858797Z,METRIC_MEM:,6476.4,MB
98-
DEFAULT,2026-04-20T15:00:54.859127Z,METRIC_MEM:,6480.01,MB
99-
DEFAULT,2026-04-20T15:00:55.859485Z,METRIC_MEM:,6481.43,MB
100-
DEFAULT,2026-04-20T15:00:56.859441Z,METRIC_MEM:,6478.38,MB
101-
DEFAULT,2026-04-20T15:00:57.859322Z,METRIC_MEM:,6479.16,MB
102-
DEFAULT,2026-04-20T15:00:58.859179Z,METRIC_MEM:,6474.57,MB
103-
DEFAULT,2026-04-20T15:00:59.859043Z,METRIC_MEM:,6344.71,MB
104-
DEFAULT,2026-04-20T15:01:00.859298Z,METRIC_MEM:,6363.68,MB
105-
DEFAULT,2026-04-20T15:01:01.859673Z,METRIC_MEM:,6307.33,MB
106-
DEFAULT,2026-04-20T15:01:02.859970Z,METRIC_MEM:,6302.04,MB
107-
DEFAULT,2026-04-20T15:01:03.860228Z,METRIC_MEM:,6297.34,MB
108-
DEFAULT,2026-04-20T15:01:04.860579Z,METRIC_MEM:,6293.2,MB
109-
DEFAULT,2026-04-20T15:01:05.860960Z,METRIC_MEM:,6287.33,MB
110-
DEFAULT,2026-04-20T15:01:06.861270Z,METRIC_MEM:,6284.43,MB
111-
DEFAULT,2026-04-20T15:01:07.861650Z,METRIC_MEM:,6284.43,MB
2+
DEFAULT,2026-04-24T06:06:58.207798Z,METRIC_MEM:,434.28,MB
3+
DEFAULT,2026-04-24T06:06:59.207850Z,METRIC_MEM:,509.68,MB
4+
DEFAULT,2026-04-24T06:07:00.208299Z,METRIC_MEM:,831.41,MB
5+
DEFAULT,2026-04-24T06:07:01.208631Z,METRIC_MEM:,961.37,MB
6+
DEFAULT,2026-04-24T06:07:02.209024Z,METRIC_MEM:,1103.34,MB
7+
DEFAULT,2026-04-24T06:07:03.209345Z,METRIC_MEM:,1188.03,MB
8+
DEFAULT,2026-04-24T06:07:04.209737Z,METRIC_MEM:,1449.39,MB
9+
DEFAULT,2026-04-24T06:07:05.210167Z,METRIC_MEM:,1590.39,MB
10+
DEFAULT,2026-04-24T06:07:06.210532Z,METRIC_MEM:,1771.91,MB
11+
DEFAULT,2026-04-24T06:07:07.210839Z,METRIC_MEM:,1914.38,MB
12+
DEFAULT,2026-04-24T06:07:08.211239Z,METRIC_MEM:,2056.89,MB
13+
DEFAULT,2026-04-24T06:07:09.211568Z,METRIC_MEM:,2175.38,MB
14+
DEFAULT,2026-04-24T06:07:10.212214Z,METRIC_MEM:,2356.97,MB
15+
DEFAULT,2026-04-24T06:07:11.212420Z,METRIC_MEM:,2531.37,MB
16+
DEFAULT,2026-04-24T06:07:12.212775Z,METRIC_MEM:,2673.6,MB
17+
DEFAULT,2026-04-24T06:07:13.223192Z,METRIC_MEM:,3255.59,MB
18+
DEFAULT,2026-04-24T06:07:14.223502Z,METRIC_MEM:,4054.9,MB
19+
DEFAULT,2026-04-24T06:07:15.223724Z,METRIC_MEM:,4033.88,MB
20+
DEFAULT,2026-04-24T06:07:16.224079Z,METRIC_MEM:,4035.61,MB
21+
DEFAULT,2026-04-24T06:07:17.223893Z,METRIC_MEM:,4035.61,MB
22+
DEFAULT,2026-04-24T06:07:18.223768Z,METRIC_MEM:,4035.61,MB
23+
DEFAULT,2026-04-24T06:07:19.223720Z,METRIC_MEM:,4037.49,MB
24+
DEFAULT,2026-04-24T06:07:20.223688Z,METRIC_MEM:,4037.49,MB
25+
DEFAULT,2026-04-24T06:07:21.224059Z,METRIC_MEM:,4037.97,MB
26+
DEFAULT,2026-04-24T06:07:22.224378Z,METRIC_MEM:,4037.97,MB
27+
DEFAULT,2026-04-24T06:07:23.224735Z,METRIC_MEM:,4037.97,MB
28+
DEFAULT,2026-04-24T06:07:24.225030Z,METRIC_MEM:,4038.95,MB
29+
DEFAULT,2026-04-24T06:07:25.226138Z,METRIC_MEM:,4038.95,MB
30+
DEFAULT,2026-04-24T06:07:26.226603Z,METRIC_MEM:,4038.89,MB
31+
DEFAULT,2026-04-24T06:07:27.226915Z,METRIC_MEM:,4038.1,MB
32+
DEFAULT,2026-04-24T06:07:28.227237Z,METRIC_MEM:,4037.22,MB
33+
DEFAULT,2026-04-24T06:07:29.227583Z,METRIC_MEM:,4038.28,MB
34+
DEFAULT,2026-04-24T06:07:30.227920Z,METRIC_MEM:,4037.22,MB
35+
DEFAULT,2026-04-24T06:07:31.228230Z,METRIC_MEM:,4037.38,MB
36+
DEFAULT,2026-04-24T06:07:32.228553Z,METRIC_MEM:,4041.57,MB
37+
DEFAULT,2026-04-24T06:07:33.228834Z,METRIC_MEM:,4041.36,MB
38+
DEFAULT,2026-04-24T06:07:34.229175Z,METRIC_MEM:,4041.36,MB
39+
DEFAULT,2026-04-24T06:07:35.229526Z,METRIC_MEM:,4042.84,MB
40+
DEFAULT,2026-04-24T06:07:36.229733Z,METRIC_MEM:,4042.84,MB
41+
DEFAULT,2026-04-24T06:07:37.229503Z,METRIC_MEM:,4046.88,MB
42+
DEFAULT,2026-04-24T06:07:38.229947Z,METRIC_MEM:,4100.14,MB
43+
DEFAULT,2026-04-24T06:07:39.229831Z,METRIC_MEM:,4143.25,MB
44+
DEFAULT,2026-04-24T06:07:40.230001Z,METRIC_MEM:,4165.57,MB
45+
DEFAULT,2026-04-24T06:07:41.230428Z,METRIC_MEM:,4168.71,MB
46+
DEFAULT,2026-04-24T06:07:42.250201Z,METRIC_MEM:,4193.07,MB
47+
DEFAULT,2026-04-24T06:07:43.253966Z,METRIC_MEM:,4207.2,MB
48+
DEFAULT,2026-04-24T06:07:44.250842Z,METRIC_MEM:,4206.1,MB
49+
DEFAULT,2026-04-24T06:07:45.251184Z,METRIC_MEM:,4256.93,MB
50+
DEFAULT,2026-04-24T06:07:46.251637Z,METRIC_MEM:,4257.46,MB
51+
DEFAULT,2026-04-24T06:07:47.252061Z,METRIC_MEM:,4273.06,MB
52+
DEFAULT,2026-04-24T06:07:48.252264Z,METRIC_MEM:,4277.84,MB
53+
DEFAULT,2026-04-24T06:07:49.252628Z,METRIC_MEM:,4287.83,MB
54+
DEFAULT,2026-04-24T06:07:50.252933Z,METRIC_MEM:,4299.75,MB
55+
DEFAULT,2026-04-24T06:07:51.253352Z,METRIC_MEM:,4305.93,MB
56+
DEFAULT,2026-04-24T06:07:52.253787Z,METRIC_MEM:,4339.72,MB
57+
DEFAULT,2026-04-24T06:07:53.262896Z,METRIC_MEM:,4354.3,MB
58+
DEFAULT,2026-04-24T06:07:54.259356Z,METRIC_MEM:,4362.78,MB
59+
DEFAULT,2026-04-24T06:07:55.259685Z,METRIC_MEM:,4385,MB
60+
DEFAULT,2026-04-24T06:07:56.259922Z,METRIC_MEM:,4385.66,MB
61+
DEFAULT,2026-04-24T06:07:57.259775Z,METRIC_MEM:,4409.23,MB
62+
DEFAULT,2026-04-24T06:07:58.259651Z,METRIC_MEM:,4411.26,MB
63+
DEFAULT,2026-04-24T06:07:59.259557Z,METRIC_MEM:,4434.75,MB
64+
DEFAULT,2026-04-24T06:08:00.259799Z,METRIC_MEM:,4459.57,MB
65+
DEFAULT,2026-04-24T06:08:01.262089Z,METRIC_MEM:,4492.48,MB
66+
DEFAULT,2026-04-24T06:08:02.262503Z,METRIC_MEM:,4493.22,MB
67+
DEFAULT,2026-04-24T06:08:03.262963Z,METRIC_MEM:,4506.8,MB
68+
DEFAULT,2026-04-24T06:08:04.263388Z,METRIC_MEM:,4540.05,MB
69+
DEFAULT,2026-04-24T06:08:05.263680Z,METRIC_MEM:,4623.99,MB
70+
DEFAULT,2026-04-24T06:08:06.264028Z,METRIC_MEM:,4698.93,MB
71+
DEFAULT,2026-04-24T06:08:07.264313Z,METRIC_MEM:,4770.75,MB
72+
DEFAULT,2026-04-24T06:08:08.264810Z,METRIC_MEM:,4872.98,MB
73+
DEFAULT,2026-04-24T06:08:09.265137Z,METRIC_MEM:,5062.45,MB
74+
DEFAULT,2026-04-24T06:08:10.265502Z,METRIC_MEM:,5209.61,MB
75+
DEFAULT,2026-04-24T06:08:11.265831Z,METRIC_MEM:,5337.89,MB
76+
DEFAULT,2026-04-24T06:08:12.270969Z,METRIC_MEM:,5616.41,MB
77+
DEFAULT,2026-04-24T06:08:13.271402Z,METRIC_MEM:,6073.16,MB
78+
DEFAULT,2026-04-24T06:08:14.271755Z,METRIC_MEM:,6514.41,MB
79+
DEFAULT,2026-04-24T06:08:15.272127Z,METRIC_MEM:,6931.82,MB
80+
DEFAULT,2026-04-24T06:08:16.273910Z,METRIC_MEM:,7545.53,MB
81+
DEFAULT,2026-04-24T06:08:17.273802Z,METRIC_MEM:,7579.41,MB
82+
DEFAULT,2026-04-24T06:08:18.273648Z,METRIC_MEM:,7575.39,MB
83+
DEFAULT,2026-04-24T06:08:19.273546Z,METRIC_MEM:,7581.73,MB
84+
DEFAULT,2026-04-24T06:08:20.273690Z,METRIC_MEM:,7569.69,MB
85+
DEFAULT,2026-04-24T06:08:21.274034Z,METRIC_MEM:,7586.38,MB
86+
DEFAULT,2026-04-24T06:08:22.274427Z,METRIC_MEM:,7584.85,MB
87+
DEFAULT,2026-04-24T06:08:23.274720Z,METRIC_MEM:,7565.12,MB
88+
DEFAULT,2026-04-24T06:08:24.275157Z,METRIC_MEM:,7512.23,MB
89+
DEFAULT,2026-04-24T06:08:25.275555Z,METRIC_MEM:,7295.88,MB
90+
DEFAULT,2026-04-24T06:08:26.276061Z,METRIC_MEM:,7148.72,MB
91+
DEFAULT,2026-04-24T06:08:27.276404Z,METRIC_MEM:,6975.2,MB
92+
DEFAULT,2026-04-24T06:08:28.277060Z,METRIC_MEM:,6634.11,MB
93+
DEFAULT,2026-04-24T06:08:29.277427Z,METRIC_MEM:,6463.36,MB
94+
DEFAULT,2026-04-24T06:08:30.277957Z,METRIC_MEM:,6270.87,MB
95+
DEFAULT,2026-04-24T06:08:31.278482Z,METRIC_MEM:,6107.61,MB
96+
DEFAULT,2026-04-24T06:08:32.279156Z,METRIC_MEM:,5950.92,MB
97+
DEFAULT,2026-04-24T06:08:33.279385Z,METRIC_MEM:,5947.23,MB
98+
DEFAULT,2026-04-24T06:08:34.279685Z,METRIC_MEM:,5924.39,MB
99+
DEFAULT,2026-04-24T06:08:35.286375Z,METRIC_MEM:,5910.64,MB
100+
DEFAULT,2026-04-24T06:08:36.283635Z,METRIC_MEM:,6774.96,MB
101+
DEFAULT,2026-04-24T06:08:37.283545Z,METRIC_MEM:,6806.27,MB
102+
DEFAULT,2026-04-24T06:08:38.283430Z,METRIC_MEM:,6821.47,MB
103+
DEFAULT,2026-04-24T06:08:39.283389Z,METRIC_MEM:,6821.45,MB
104+
DEFAULT,2026-04-24T06:08:40.283475Z,METRIC_MEM:,6897.86,MB
105+
DEFAULT,2026-04-24T06:08:41.284863Z,METRIC_MEM:,6937.82,MB
106+
DEFAULT,2026-04-24T06:08:42.284236Z,METRIC_MEM:,6847.93,MB
107+
DEFAULT,2026-04-24T06:08:43.284623Z,METRIC_MEM:,6862.59,MB
108+
DEFAULT,2026-04-24T06:08:44.285121Z,METRIC_MEM:,6866.46,MB
109+
DEFAULT,2026-04-24T06:08:45.285655Z,METRIC_MEM:,6864.15,MB
110+
DEFAULT,2026-04-24T06:08:46.286183Z,METRIC_MEM:,6852.66,MB
111+
DEFAULT,2026-04-24T06:08:47.286737Z,METRIC_MEM:,6906.88,MB
112+
DEFAULT,2026-04-24T06:08:48.287239Z,METRIC_MEM:,6609.81,MB
113+
DEFAULT,2026-04-24T06:08:49.294612Z,METRIC_MEM:,6459.63,MB
114+
DEFAULT,2026-04-24T06:08:50.291134Z,METRIC_MEM:,6522.66,MB
115+
DEFAULT,2026-04-24T06:08:51.291500Z,METRIC_MEM:,6507.25,MB
116+
DEFAULT,2026-04-24T06:08:52.291873Z,METRIC_MEM:,6512.25,MB
117+
DEFAULT,2026-04-24T06:08:53.292217Z,METRIC_MEM:,6523.08,MB
118+
DEFAULT,2026-04-24T06:08:54.292612Z,METRIC_MEM:,6523.29,MB
119+
DEFAULT,2026-04-24T06:08:55.292877Z,METRIC_MEM:,6431,MB
120+
DEFAULT,2026-04-24T06:08:56.293090Z,METRIC_MEM:,6451.77,MB
121+
DEFAULT,2026-04-24T06:08:57.293038Z,METRIC_MEM:,6456.9,MB
122+
DEFAULT,2026-04-24T06:08:58.292924Z,METRIC_MEM:,6453.93,MB
123+
DEFAULT,2026-04-24T06:08:59.292781Z,METRIC_MEM:,6450.25,MB
124+
DEFAULT,2026-04-24T06:09:00.292920Z,METRIC_MEM:,6452.43,MB
125+
DEFAULT,2026-04-24T06:09:01.293289Z,METRIC_MEM:,6449.31,MB
126+
DEFAULT,2026-04-24T06:09:02.293620Z,METRIC_MEM:,6292.76,MB
127+
DEFAULT,2026-04-24T06:09:03.293983Z,METRIC_MEM:,6290.23,MB
128+
DEFAULT,2026-04-24T06:09:04.294267Z,METRIC_MEM:,6285.38,MB
129+
DEFAULT,2026-04-24T06:09:05.294589Z,METRIC_MEM:,6281.16,MB
130+
DEFAULT,2026-04-24T06:09:06.294899Z,METRIC_MEM:,6274.43,MB
131+
DEFAULT,2026-04-24T06:09:07.295234Z,METRIC_MEM:,6274.39,MB
35.6 KB
Loading
15 KB
Loading
717 Bytes
Loading

data/README.md

Lines changed: 21 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,21 +1,32 @@
11
# Data & Synthetic Benchmarks
22

3-
This directory serves as the local state provider for the pipeline when executing in a non-cloud environment. It mimics the structure of the Google Cloud Storage (GCS) buckets, allowing for high-fidelity local simulation and performance benchmarking.
3+
This directory serves as the local state provider for the pipeline when executing in a non-cloud environment. It mimics the structure of the Google Cloud Storage (GCS) buckets.
44

55
## Synthetic Dataset
6-
To replicate the high-volume environment described in the [GCP Stress-Test Metrics (Scaling Efficiency)](/README.md#gcp-stress-test-metrics-scaling-efficiency) section, you can download the 36M-row synthetic dataset here: [**Kaggle Dataset Link**](https://www.kaggle.com/datasets/melvidabryan/e-commerce-synthetic-dataset)
6+
To replicate the high-volume environment described in the [GCP Stress-Test Metrics (Scaling Efficiency)](/README.md#gcp-stress-test-metrics-scaling-efficiency) section, you can download the 40M-row synthetic dataset here: [**Kaggle Dataset Link**](https://www.kaggle.com/datasets/melvidabryan/e-commerce-synthetic-dataset)
77

8-
>*Note: This upload contains the **Contracted Version** of the dataset. The original "Raw" statetotaling approximately 24GB of unrefined CSVs was omitted to prioritize transfer efficiency.*
8+
> *Note: This upload contains the **Contracted Version** of the dataset. The original "Raw" state, totaling approximately 26 GB of unrefined CSVs, was omitted to prioritize transfer efficiency.*
99
10-
### File Structure & Purpose
11-
The dataset is divided into two primary directories to facilitate different stages of pipeline testing:
10+
## File Structure & Purpose
11+
The dataset is divided into three primary directories to facilitate different stages of pipeline testing:
1212

1313
| Directory | Files | Description |
1414
| :--- | :--- | :--- |
15-
| `contracted/` | 110 files | **Production-Scale Test:** The full 36M row dataset (~4.04 GB) formatted to strict enterprise schema requirements. |
16-
| `raw/` | 5 files | **Delta Sample (Validation):** Small-scale samples (~10k rows each) representing **daily incoming deltas**. These files are intentionally "noisy" to exhibit the full range of injected data quality errors. |
15+
| `contracted/` | 125 files | **Production-Scale Test:** The full 40M-row dataset (~5.34 GB) formatted to strict schema requirements. |
16+
| `id_mapping/customer_id/` | 1 file | **Metadata Registry:** Central lookup mapping Customer UUIDs to Uint32 surrogate keys. |
17+
| `id_mapping/order_id/` | 40 files | **Metadata Registry (Sharded):** Fragmented lookup (40M+ keys) to test high-cardinality ID resolution. |
18+
| `id_mapping/product_id/` | 1 file | **Metadata Registry:** Central lookup mapping Product UUIDs to Uint32 surrogate keys. |
19+
| `id_mapping/seller_id/` | 1 file | **Metadata Registry:** Central lookup mapping Seller UUIDs to Uint32 surrogate keys. |
20+
| `raw/` | 5 files | **Delta Sample (Validation):** Small-scale samples (~20k rows each) representing **daily incoming deltas**. These files are intentionally "noisy" to exhibit the full range of injected data quality errors. |
1721

18-
### Included Tables
22+
---
23+
24+
### ID Mapping & Surrogate Key Simulation
25+
The `id_mapping/` directory acts as a simulated metadata registrar for surrogate key generation. The pipeline utilizes these registries to resolve raw source UUIDs into memory-efficient Uint32 identifiers while enforcing global deduplication and referential integrity.
26+
27+
To benchmark ***[`mapping`](/data_pipeline/contract/id_registrar.py) throughput and memory footprint***, the `order_id` registry is partitioned into 40 sharded files (1M rows each). This fragmentation simulates the ingestion pressure of high-cardinality transactional data (40M+ unique keys) on serverless compute. Dimension-level registries (Customer, Product, Seller) remain unfragmented, as their lower cardinality is insufficient to trigger the resource-exhaustion thresholds required for these performance benchmarks.
28+
29+
## Included Tables
1930

2031
The dataset provides a complete relational snapshot of an e-commerce ecosystem:
2132

@@ -28,7 +39,8 @@ The dataset provides a complete relational snapshot of an e-commerce ecosystem:
2839
## Local Execution Setup
2940
1. Extract the downloaded dataset archive.
3041
2. Copy the `raw/` and `contracted/` directories into this `data/` folder.
31-
3. The `RunContext` manager is configured to strictly recognize `.parquet` and `.csv` extensions; all other file types are ignored to prevent ingestion noise.
42+
3. Use the commented-out local path in [`RunContext.create()`](../data_pipeline/shared/run_context.py#L62).
43+
4. The `RunContext` manager is configured to strictly recognize `.parquet` and `.csv` extensions; all other file types are ignored to prevent ingestion noise.
3244

3345
**Execute the local pipeline:**
3446
```

data_pipeline/assembly/assembly_executor.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -145,6 +145,8 @@ def orchestrate_event_assembly(run_context: RunContext, report: Dict) -> bool:
145145

146146
except Exception as e:
147147
log_error(f"Unexpected error processing event assembly: {e}", report)
148+
report["status"] = "failed"
149+
return False
148150

149151
finally:
150152
if "lf_derived" in locals():

data_pipeline/semantic/semantic_executor.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -168,9 +168,13 @@ def orchestrate_module(
168168

169169
except FileExistsError as e:
170170
log_error(f"Unexpected table returned {table_name}: {e}", report)
171+
report["status"] = "failed"
172+
return False
171173

172174
except Exception as e:
173175
log_error(f"Unexpected error processing {table_name}: {e}", report)
176+
report["status"] = "failed"
177+
return False
174178

175179
finally:
176180
if "lf_frozen" in locals():

0 commit comments

Comments
 (0)