Merge pull request #91 from ndycode/feat/prompt-cache-doctor

ndycode · web-flow · commit 405ef3f377ed · 2026-03-22T14:01:05.000+08:00
feat: add prompt cache diagnostics to codex-doctor
diff --git a/index.ts b/index.ts
@@ -158,6 +158,7 @@ import { paintUiText, formatUiBadge, formatUiHeader, formatUiItem, formatUiKeyVa
 import {
 	buildBeginnerChecklist,
 	buildBeginnerDoctorFindings,
+	formatPromptCacheSnapshot,
 	recommendBeginnerNextAction,
 	summarizeBeginnerAccounts,
 	type BeginnerAccountSnapshot,
@@ -278,6 +279,9 @@ export const OpenAIOAuthPlugin: Plugin = async ({ client }: PluginInput) => {
 		lastRequestAt: number | null;
 		lastError: string | null;
 		lastErrorCategory: string | null;
+		promptCacheEnabledRequests: number;
+		promptCacheMissingRequests: number;
+		lastPromptCacheKey: string | null;
 		lastSelectedAccountIndex: number | null;
 		lastQuotaKey: string | null;
 		lastSelectionSnapshot: SelectionSnapshot | null;
@@ -304,6 +308,9 @@ export const OpenAIOAuthPlugin: Plugin = async ({ client }: PluginInput) => {
 		lastRequestAt: null,
 		lastError: null,
 		lastErrorCategory: null,
+		promptCacheEnabledRequests: 0,
+		promptCacheMissingRequests: 0,
+		lastPromptCacheKey: null,
 		lastSelectedAccountIndex: null,
 		lastQuotaKey: null,
 		lastSelectionSnapshot: null,
@@ -1373,6 +1380,9 @@ export const OpenAIOAuthPlugin: Plugin = async ({ client }: PluginInput) => {
 			serverErrors: runtimeMetrics.serverErrors,
 			networkErrors: runtimeMetrics.networkErrors,
 			lastErrorCategory: runtimeMetrics.lastErrorCategory,
+			promptCacheEnabledRequests: runtimeMetrics.promptCacheEnabledRequests,
+			promptCacheMissingRequests: runtimeMetrics.promptCacheMissingRequests,
+			lastPromptCacheKey: runtimeMetrics.lastPromptCacheKey,
 		});
 
 		const formatDoctorSeverity = (
@@ -2025,6 +2035,12 @@ export const OpenAIOAuthPlugin: Plugin = async ({ client }: PluginInput) => {
 								threadIdCandidate ? `${threadIdCandidate}:${Date.now()}` : undefined,
 							);
 							runtimeMetrics.lastRequestAt = Date.now();
+							runtimeMetrics.lastPromptCacheKey = promptCacheKey ?? null;
+							if (promptCacheKey) {
+								runtimeMetrics.promptCacheEnabledRequests++;
+							} else {
+								runtimeMetrics.promptCacheMissingRequests++;
+							}
 							const retryBudget = new RetryBudgetTracker(retryBudgetLimits);
 							const consumeRetryBudget = (
 								bucket: RetryBudgetClass,
@@ -2313,20 +2329,31 @@ while (attempted.size < Math.max(1, accountCount)) {
 									: null;
 
 								if (abortSignal?.aborted) {
-									clearTimeout(fetchTimeoutId);
-									fetchController.abort(abortSignal.reason ?? new Error("Aborted by user"));
-								} else if (abortSignal && onUserAbort) {
-									abortSignal.addEventListener("abort", onUserAbort, { once: true });
-								}
+								clearTimeout(fetchTimeoutId);
+								fetchController.abort(abortSignal.reason ?? new Error("Aborted by user"));
+							} else if (abortSignal && onUserAbort) {
+								abortSignal.addEventListener("abort", onUserAbort, { once: true });
+							}
 
-								try {
+							try {
+								// Request metrics are tracked at the fetch boundary, so retries and
+								// account rotation are counted consistently. These increments are
+								// in-memory only and run on Node's single-threaded event loop, so no
+								// filesystem locking or token-redaction concerns are introduced here.
 								runtimeMetrics.totalRequests++;
 								response = await fetch(url, {
 									...requestInit,
 									headers,
 									signal: fetchController.signal,
 								});
-				} catch (networkError) {
+							} catch (networkError) {
+								if (abortSignal?.aborted && fetchController.signal.aborted) {
+									accountManager.refundToken(account, modelFamily, model);
+									if (networkError instanceof Error) {
+										throw networkError;
+									}
+									throw new Error(String(networkError));
+								}
 								const errorMsg = networkError instanceof Error ? networkError.message : String(networkError);
 								logWarn(`Network error for account ${account.index + 1}: ${errorMsg}`);
 								if (
@@ -2359,21 +2386,21 @@ while (attempted.size < Math.max(1, accountCount)) {
 								accountManager.refundToken(account, modelFamily, model);
 								accountManager.recordFailure(account, modelFamily, model);
 								break;
-								} finally {
-									clearTimeout(fetchTimeoutId);
-									if (abortSignal && onUserAbort) {
-										abortSignal.removeEventListener("abort", onUserAbort);
-									}
+							} finally {
+								clearTimeout(fetchTimeoutId);
+								if (abortSignal && onUserAbort) {
+									abortSignal.removeEventListener("abort", onUserAbort);
 								}
-											const fetchLatencyMs = Math.round(performance.now() - fetchStart);
-
-											logRequest(LOG_STAGES.RESPONSE, {
-												status: response.status,
-												ok: response.ok,
-												statusText: response.statusText,
-												latencyMs: fetchLatencyMs,
-												headers: Object.fromEntries(response.headers.entries()),
-											});
+							}
+							const fetchLatencyMs = Math.round(performance.now() - fetchStart);
+
+							logRequest(LOG_STAGES.RESPONSE, {
+								status: response.status,
+								ok: response.ok,
+								statusText: response.statusText,
+								latencyMs: fetchLatencyMs,
+								headers: Object.fromEntries(response.headers.entries()),
+							});
 
 								if (!response.ok) {
 									const contextOverflowResult = await handleContextOverflow(response, model);
@@ -5197,6 +5224,14 @@ while (attempted.size < Math.max(1, accountCount)) {
 									"muted",
 								),
 							);
+							lines.push(
+								formatUiKeyValue(
+									ui,
+									"Prompt cache",
+									formatPromptCacheSnapshot(runtime),
+									"muted",
+								),
+							);
 						}
 
 						return lines.join("\n");
@@ -5236,6 +5271,9 @@ while (attempted.size < Math.max(1, accountCount)) {
 						lines.push(
 							`  Runtime failures: failed=${runtime.failedRequests}, rateLimited=${runtime.rateLimitedResponses}, authRefreshFailed=${runtime.authRefreshFailures}, server=${runtime.serverErrors}, network=${runtime.networkErrors}`,
 						);
+						lines.push(
+							`  Prompt cache: ${formatPromptCacheSnapshot(runtime)}`,
+						);
 					}
 					return lines.join("\n");
 				},
diff --git a/lib/ui/beginner.ts b/lib/ui/beginner.ts
@@ -1,3 +1,5 @@
+import { createHash } from "node:crypto";
+
 export type BeginnerDiagnosticSeverity = "ok" | "warning" | "error";
 
 export interface BeginnerAccountSnapshot {
@@ -18,6 +20,9 @@ export interface BeginnerRuntimeSnapshot {
 	serverErrors: number;
 	networkErrors: number;
 	lastErrorCategory: string | null;
+	promptCacheEnabledRequests: number;
+	promptCacheMissingRequests: number;
+	lastPromptCacheKey: string | null;
 }
 
 export interface BeginnerChecklistItem {
@@ -47,6 +52,20 @@ export interface BeginnerAccountSummary {
 	unlabeled: number;
 }
 
+/** Masks a prompt cache key as `masked-<first 12 hex chars of its SHA-256>`; blank input yields "none". */
+export function formatPromptCacheKey(value: string | null | undefined): string {
+	const trimmedKey = value?.trim();
+	if (trimmedKey === undefined || trimmedKey === "") return "none";
+	return `masked-${createHash("sha256").update(trimmedKey).digest("hex").slice(0, 12)}`;
+}
+
+/** Renders the prompt cache counters and the masked last key as a single `key=value` summary. */
+export function formatPromptCacheSnapshot(
+	runtime: Pick<BeginnerRuntimeSnapshot, "promptCacheEnabledRequests" | "promptCacheMissingRequests" | "lastPromptCacheKey">,
+): string {
+	return [`enabled=${runtime.promptCacheEnabledRequests}`, `missing=${runtime.promptCacheMissingRequests}`, `lastKey=${formatPromptCacheKey(runtime.lastPromptCacheKey)}`].join(", ");
+}
+
 export function summarizeBeginnerAccounts(
 	accounts: BeginnerAccountSnapshot[],
 	now: number,
@@ -241,6 +260,27 @@ export function buildBeginnerDoctorFindings(input: {
 		});
 	}
 
+	if (input.runtime.totalRequests > 0) {
+		if (input.runtime.promptCacheEnabledRequests === 0) {
+			findings.push({
+				severity: "warning",
+				code: "prompt-cache-missing",
+				summary: "Recent requests did not include a prompt cache key.",
+				action:
+					"Use a session-backed OpenCode flow that forwards `prompt_cache_key` so Codex prompt caching can engage.",
+			});
+		} else if (input.runtime.promptCacheMissingRequests > 0) {
+			findings.push({
+				severity: "warning",
+				code: "prompt-cache-inconsistent",
+				summary:
+					"Prompt cache keys were present for some recent requests but missing for others.",
+				action:
+					"Keep requests on a stable session/thread path so `prompt_cache_key` stays consistent across turns.",
+			});
+		}
+	}
+
 	const failureRate = getFailureRate(input.runtime);
 	if (input.runtime.totalRequests >= 6 && failureRate >= 0.5) {
 		findings.push({
diff --git a/test/beginner-ui.test.ts b/test/beginner-ui.test.ts
@@ -1,8 +1,12 @@
 import { describe, it, expect } from "vitest";
+import { createHash } from "node:crypto";
+
 import {
 	buildBeginnerChecklist,
 	buildBeginnerDoctorFindings,
 	explainRuntimeErrorCategory,
+	formatPromptCacheKey,
+	formatPromptCacheSnapshot,
 	recommendBeginnerNextAction,
 	summarizeBeginnerAccounts,
 	type BeginnerAccountSnapshot,
@@ -19,6 +23,9 @@ const healthyRuntime: BeginnerRuntimeSnapshot = {
 	serverErrors: 0,
 	networkErrors: 0,
 	lastErrorCategory: null,
+	promptCacheEnabledRequests: 12,
+	promptCacheMissingRequests: 0,
+	lastPromptCacheKey: "ses_prompt_cache",
 };
 
 function buildAccount(
@@ -117,6 +124,55 @@ describe("buildBeginnerDoctorFindings", () => {
 		expect(findings.some((f) => f.code === "auth-refresh-failures")).toBe(true);
 		expect(findings.some((f) => f.code === "recent-error-category")).toBe(true);
 	});
+
+	it("flags missing prompt cache keys when recent requests never supplied one", () => {
+		// Five requests were made and none of them carried a prompt cache key,
+		// so the doctor is expected to report the "prompt-cache-missing" finding.
+		const runtime = {
+			...healthyRuntime,
+			totalRequests: 5,
+			promptCacheEnabledRequests: 0,
+			promptCacheMissingRequests: 5,
+			lastPromptCacheKey: null,
+		};
+		const findings = buildBeginnerDoctorFindings({ accounts: [buildAccount()], now, runtime });
+		const codes = findings.map((finding) => finding.code);
+
+		expect(codes.includes("prompt-cache-missing")).toBe(true);
+	});
+
+	it("flags inconsistent prompt cache usage when only some requests had keys", () => {
+		// Four keyed requests mixed with two unkeyed ones should surface the
+		// "prompt-cache-inconsistent" finding.
+		const runtime = {
+			...healthyRuntime,
+			totalRequests: 6,
+			promptCacheEnabledRequests: 4,
+			promptCacheMissingRequests: 2,
+			lastPromptCacheKey: null,
+		};
+		const findings = buildBeginnerDoctorFindings({ accounts: [buildAccount()], now, runtime });
+		const codes = findings.map((finding) => finding.code);
+
+		expect(codes.includes("prompt-cache-inconsistent")).toBe(true);
+	});
+
+	it("does not flag cache issues when no requests have been made", () => {
+		// With totalRequests at zero, neither prompt cache finding may be
+		// emitted, even though the missing counter is non-zero.
+		const runtime = {
+			...healthyRuntime,
+			totalRequests: 0,
+			promptCacheEnabledRequests: 0,
+			promptCacheMissingRequests: 3,
+			lastPromptCacheKey: null,
+		};
+		const findings = buildBeginnerDoctorFindings({ accounts: [buildAccount()], now, runtime });
+		const codes = findings.map((finding) => finding.code);
+
+		expect(codes.includes("prompt-cache-missing")).toBe(false);
+		expect(codes.includes("prompt-cache-inconsistent")).toBe(false);
+	});
 });
 
 describe("recommendBeginnerNextAction", () => {
@@ -175,3 +231,38 @@ describe("explainRuntimeErrorCategory", () => {
 		expect(hint).toContain("codex-doctor");
 	});
 });
+
+describe("formatPromptCacheKey", () => {
+	// The expected value is recomputed here so the tests pin the masking scheme itself.
+	const fingerprintOf = (raw: string): string =>
+		`masked-${createHash("sha256").update(raw).digest("hex").slice(0, 12)}`;
+
+	it("returns none for empty values", () => {
+		for (const blank of [null, undefined, "   "]) {
+			expect(formatPromptCacheKey(blank)).toBe("none");
+		}
+	});
+
+	it("redacts short values too", () => {
+		expect(formatPromptCacheKey("ses_1234")).toBe(fingerprintOf("ses_1234"));
+	});
+
+	it("redacts longer values to a stable masked fingerprint", () => {
+		expect(formatPromptCacheKey("ses_prompt_cache_key_123")).toBe(fingerprintOf("ses_prompt_cache_key_123"));
+	});
+});
+
+describe("formatPromptCacheSnapshot", () => {
+	it("renders a redacted prompt cache snapshot string", () => {
+		// The raw key must not appear in the rendered text; only its SHA-256 prefix may.
+		const rawKey = "ses_prompt_cache_key_123";
+		const maskedKey = `masked-${createHash("sha256").update(rawKey).digest("hex").slice(0, 12)}`;
+		const rendered = formatPromptCacheSnapshot({
+			promptCacheEnabledRequests: 4,
+			promptCacheMissingRequests: 1,
+			lastPromptCacheKey: rawKey,
+		});
+		expect(rendered).toBe(`enabled=4, missing=1, lastKey=${maskedKey}`);
+		expect(rendered).not.toContain(rawKey);
+	});
+});