|
156 | 156 | "metadata": {}, |
157 | 157 | "source": [ |
158 | 158 | "---\n", |
159 | | - "## 3. Daily Registration Failures by Manager & Stage (14 days)\n", |
| 159 | + "## 3. Overall Setup Success Rate (28 days)\n", |
160 | 160 | "\n", |
161 | | - "Day-by-day failure counts per manager + stage. A spike in one stage on a specific day = regression in that code path." |
| 161 | + "Top-level health metric. If this drops, something is broken." |
162 | 162 | ] |
163 | 163 | }, |
164 | 164 | { |
|
168 | 168 | "metadata": {}, |
169 | 169 | "outputs": [], |
170 | 170 | "source": [ |
171 | | - "df = run_kql_file(client, \"03-failure-stage-daily-trend.kql\")\n", |
| 171 | + "df = run_kql_file(client, \"03-overall-setup-success-rate.kql\")\n", |
172 | 172 | "display(df)" |
173 | 173 | ] |
174 | 174 | }, |
|
178 | 178 | "metadata": {}, |
179 | 179 | "source": [ |
180 | 180 | "---\n", |
181 | | - "## 4. Overall Setup Success Rate (28 days)\n", |
182 | | - "\n", |
183 | | - "Top-level health metric. If this drops, something is broken." |
184 | | - ] |
185 | | - }, |
186 | | - { |
187 | | - "cell_type": "code", |
188 | | - "execution_count": null, |
189 | | - "id": "13", |
190 | | - "metadata": {}, |
191 | | - "outputs": [], |
192 | | - "source": [ |
193 | | - "df = run_kql_file(client, \"04-overall-setup-success-rate.kql\")\n", |
194 | | - "display(df)" |
195 | | - ] |
196 | | - }, |
197 | | - { |
198 | | - "cell_type": "markdown", |
199 | | - "id": "14", |
200 | | - "metadata": {}, |
201 | | - "source": [ |
202 | | - "---\n", |
203 | | - "## 5. Manager Availability\n", |
| 181 | + "## 4. Manager Availability\n", |
204 | 182 | "\n", |
205 | 183 | "What tools do users actually have installed? Shows registered vs skipped vs failed per manager." |
206 | 184 | ] |
207 | 185 | }, |
208 | 186 | { |
209 | 187 | "cell_type": "code", |
210 | 188 | "execution_count": null, |
211 | | - "id": "15", |
| 189 | + "id": "13", |
212 | 190 | "metadata": {}, |
213 | 191 | "outputs": [], |
214 | 192 | "source": [ |
215 | | - "df = run_kql_file(client, \"05-manager-availability.kql\")\n", |
| 193 | + "df = run_kql_file(client, \"04-manager-availability.kql\")\n", |
216 | 194 | "display(df)\n", |
217 | 195 | "\n", |
218 | 196 | "if not df.empty:\n", |
|
241 | 219 | }, |
242 | 220 | { |
243 | 221 | "cell_type": "markdown", |
244 | | - "id": "16", |
| 222 | + "id": "14", |
245 | 223 | "metadata": {}, |
246 | 224 | "source": [ |
247 | 225 | "---\n", |
248 | | - "## 6. Daily Trend (14 days)\n", |
| 226 | + "## 5. Daily Trend (14 days)\n", |
249 | 227 | "\n", |
250 | 228 | "Day-by-day trend of the setup success rate. Check after shipping a new version." |
251 | 229 | ] |
252 | 230 | }, |
253 | 231 | { |
254 | 232 | "cell_type": "code", |
255 | 233 | "execution_count": null, |
256 | | - "id": "17", |
| 234 | + "id": "15", |
257 | 235 | "metadata": {}, |
258 | 236 | "outputs": [], |
259 | 237 | "source": [ |
260 | | - "df = run_kql_file(client, \"06-daily-trend.kql\")\n", |
| 238 | + "df = run_kql_file(client, \"05-daily-trend.kql\")\n", |
261 | 239 | "display(df)\n", |
262 | 240 | "\n", |
263 | 241 | "if not df.empty:\n", |
|
276 | 254 | }, |
277 | 255 | { |
278 | 256 | "cell_type": "markdown", |
279 | | - "id": "18", |
| 257 | + "id": "16", |
280 | 258 | "metadata": {}, |
281 | 259 | "source": [ |
282 | 260 | "---\n", |
283 | | - "## 7. Error Type Distribution\n", |
| 261 | + "## 6. Error Type Distribution\n", |
284 | 262 | "\n", |
285 | 263 | "Groups all failures by error type across setup and individual managers." |
286 | 264 | ] |
287 | 265 | }, |
288 | 266 | { |
289 | 267 | "cell_type": "code", |
290 | 268 | "execution_count": null, |
291 | | - "id": "19", |
| 269 | + "id": "17", |
292 | 270 | "metadata": {}, |
293 | 271 | "outputs": [], |
294 | 272 | "source": [ |
295 | | - "df = run_kql_file(client, \"07-error-type-distribution.kql\")\n", |
| 273 | + "df = run_kql_file(client, \"06-error-type-distribution.kql\")\n", |
296 | 274 | "display(df)\n", |
297 | 275 | "\n", |
298 | 276 | "if not df.empty:\n", |
|
312 | 290 | }, |
313 | 291 | { |
314 | 292 | "cell_type": "markdown", |
315 | | - "id": "20", |
| 293 | + "id": "18", |
316 | 294 | "metadata": {}, |
317 | 295 | "source": [ |
318 | 296 | "---\n", |
319 | | - "## 8. Hang ↔ Failure Correlation\n", |
| 297 | + "## 7. Hang ↔ Failure Correlation\n", |
320 | 298 | "\n", |
321 | 299 | "Do hangs always cause failures, or do some self-recover?" |
322 | 300 | ] |
323 | 301 | }, |
324 | 302 | { |
325 | 303 | "cell_type": "code", |
326 | 304 | "execution_count": null, |
327 | | - "id": "21", |
| 305 | + "id": "19", |
328 | 306 | "metadata": {}, |
329 | 307 | "outputs": [], |
330 | 308 | "source": [ |
331 | | - "df = run_kql_file(client, \"08-hang-failure-correlation.kql\")\n", |
| 309 | + "df = run_kql_file(client, \"07-hang-failure-correlation.kql\")\n", |
332 | 310 | "display(df)" |
333 | 311 | ] |
334 | 312 | }, |
335 | 313 | { |
336 | 314 | "cell_type": "markdown", |
337 | | - "id": "22", |
| 315 | + "id": "20", |
338 | 316 | "metadata": {}, |
339 | 317 | "source": [ |
340 | 318 | "---\n", |
341 | | - "## 9. Weekly Health Summary\n", |
| 319 | + "## 8. Weekly Health Summary\n", |
342 | 320 | "\n", |
343 | 321 | "One-stop query for the weekly check. Returns all key numbers in a single row." |
344 | 322 | ] |
345 | 323 | }, |
346 | 324 | { |
347 | 325 | "cell_type": "code", |
348 | 326 | "execution_count": null, |
349 | | - "id": "23", |
| 327 | + "id": "21", |
350 | 328 | "metadata": {}, |
351 | 329 | "outputs": [], |
352 | 330 | "source": [ |
353 | | - "df = run_kql_file(client, \"09-weekly-health-summary.kql\")\n", |
| 331 | + "df = run_kql_file(client, \"08-weekly-health-summary.kql\")\n", |
354 | 332 | "display(df)" |
355 | 333 | ] |
356 | 334 | } |
357 | 335 | ], |
358 | 336 | "metadata": { |
359 | 337 | "kernelspec": { |
360 | | - "display_name": ".venv (3.13.12)", |
| 338 | + "display_name": ".venv", |
361 | 339 | "language": "python", |
362 | 340 | "name": "python3" |
363 | 341 | }, |
|
0 commit comments