feat: v4.6.0 - Context overflow handling and missing tool result injection

ndycode · ndycode · commit 58fd6ae5d8d4 · 2026-01-25T10:33:23.000+08:00
- Context Overflow Handler: Gracefully handles 'prompt too long' errors by returning a synthetic SSE response with /compact, /clear, /undo suggestions
- Missing Tool Result Injection: Detects orphaned function_call items and injects 'Operation cancelled by user' to prevent API errors
- 34 new unit tests (379 total)

Ultraworked with [Sisyphus](https://github.com/code-yeongyu/oh-my-opencode)
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -8,15 +8,27 @@ All notable changes to this project are documented here. Dates use the ISO forma
 
 ### Changed
 
-## [4.3.1] - 2026-01-23
+## [4.6.0] - 2026-01-25
+
+**Feature release**: Context overflow handling and missing tool result injection.
 
 ### Added
-- `openai-accounts-status --json` for scriptable status output with email/ID labels.
+- **Context Overflow Handler**: Gracefully handles "prompt too long" / context length exceeded errors:
+  - Returns synthetic SSE response with helpful instructions instead of raw 400 error
+  - Suggests `/compact`, `/clear`, or `/undo` commands to reduce context size
+  - Prevents OpenCode session from getting locked on context overflow
+  - New module: `lib/context-overflow.ts`
+- **Missing Tool Result Injection**: Automatically handles cancelled tool calls (ESC mid-execution):
+  - Detects orphaned `function_call` items (calls without matching outputs)
+  - Injects synthetic output: `"Operation cancelled by user"`
+  - Prevents "missing tool_result" API errors when user cancels mid-tool
+  - New function: `injectMissingToolOutputs()` in `lib/request/helpers/input-utils.ts`
+- **34 new unit tests** for context overflow and tool injection (now 379 total tests)
 
-### Changed
-- Account labels now prefer email and show ID suffix when available; list/status outputs are columnized for readability.
-- Stored account emails are trimmed/lowercased when present.
-- Dependency refresh: @opencode-ai plugin/sdk 1.1.34, hono 4.11.5, vitest 4.0.18, @types/node 25.0.10, @typescript-eslint 8.53.1.
+### Technical Details
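+- Context overflow detection applies only to HTTP 400 responses and matches the body case-insensitively against: `prompt is too long`, `prompt_too_long`, `context length exceeded`, `context_length_exceeded`, `maximum context length`, `token limit exceeded`, `too many tokens`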
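+- Synthetic SSE response (HTTP 200, `text/event-stream`) emits the full event sequence: message_start, content_block_start, content_block_delta, content_block_stop, message_delta (`stop_reason: end_turn`), message_stop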
+- Tool injection preserves message order: outputs are placed immediately after their calls
 
 ## [4.5.0] - 2026-01-25
 
@@ -48,6 +60,16 @@ All notable changes to this project are documented here. Dates use the ISO forma
 - Stale entries (>30s) are automatically cleaned up to prevent memory leaks
 - Auto-update check is non-blocking and fails silently to avoid disrupting plugin operation
 
+## [4.3.1] - 2026-01-23
+
+### Added
+- `openai-accounts-status --json` for scriptable status output with email/ID labels.
+
+### Changed
+- Account labels now prefer email and show ID suffix when available; list/status outputs are columnized for readability.
+- Stored account emails are trimmed/lowercased when present.
+- Dependency refresh: @opencode-ai plugin/sdk 1.1.34, hono 4.11.5, vitest 4.0.18, @types/node 25.0.10, @typescript-eslint 8.53.1.
+
 ## [4.4.0] - 2026-01-25
 
 **Feature release**: Intelligent rate-limit rotation with health-based account selection.
diff --git a/index.ts b/index.ts
@@ -55,6 +55,7 @@ import {
 } from "./lib/constants.js";
 import { logRequest, logDebug } from "./lib/logger.js";
 import { checkAndNotify } from "./lib/auto-update-checker.js";
+import { handleContextOverflow } from "./lib/context-overflow.js";
 import {
         AccountManager,
         extractAccountEmail,
@@ -660,10 +661,16 @@ export const OpenAIAuthPlugin: Plugin = async ({ client }: PluginInput) => {
 																											headers: Object.fromEntries(response.headers.entries()),
 																										});
 
-																											if (!response.ok) {
-																												const { response: errorResponse, rateLimit } =
-																													await handleErrorResponse(response);
-																												if (rateLimit) {
+								if (!response.ok) {
+									// Check for context overflow (400 "prompt too long") before other error handling
+									const contextOverflowResult = await handleContextOverflow(response, model);
+									if (contextOverflowResult.handled) {
+										return contextOverflowResult.response;
+									}
+
+									const { response: errorResponse, rateLimit } =
+										await handleErrorResponse(response);
+									if (rateLimit) {
 																														const { attempt, delayMs } = getRateLimitBackoff(
 																															account.index,
 																															quotaKey,
diff --git a/lib/context-overflow.ts b/lib/context-overflow.ts
@@ -0,0 +1,139 @@
+/**
+ * Context Overflow Handler
+ * 
+ * Handles "Prompt too long" / context length exceeded errors by returning
+ * a synthetic SSE response that advises the user to use /compact, /clear, or /undo.
+ * This prevents the OpenCode session from getting locked on 400 errors.
+ */
+
+import { PLUGIN_NAME } from "./constants.js";
+
+/**
+ * Error patterns that indicate context overflow
+ */
+const CONTEXT_OVERFLOW_PATTERNS = [
+  "prompt is too long",
+  "prompt_too_long",
+  "context length exceeded",
+  "context_length_exceeded",
+  "maximum context length",
+  "token limit exceeded",
+  "too many tokens",
+];
+
+/**
+ * Check if an error body indicates context overflow
+ */
+export function isContextOverflowError(status: number, bodyText: string): boolean {
+  if (status !== 400) return false;
+  if (!bodyText) return false;
+  
+  const lowerBody = bodyText.toLowerCase();
+  return CONTEXT_OVERFLOW_PATTERNS.some(pattern => lowerBody.includes(pattern));
+}
+
+/**
+ * The message shown to users when context overflow occurs
+ */
+const CONTEXT_OVERFLOW_MESSAGE = `[Plugin Notice] Context is too long for this model.
+
+Please use one of these commands to reduce context size:
+
+• **/compact** - Compress conversation history (recommended)
+• **/clear** - Start fresh with empty context
+• **/undo** - Remove recent messages
+
+Then retry your request.
+
+Alternatively, you can switch to a model with a larger context window.`;
+
+/**
+ * Creates a synthetic SSE response for context overflow errors.
+ * This returns a 200 OK with the error message as assistant text,
+ * preventing the session from getting locked.
+ */
+export function createContextOverflowResponse(model: string = "unknown"): Response {
+  const messageId = `msg_synthetic_overflow_${Date.now()}`;
+  const events: string[] = [];
+
+  // message_start
+  events.push(`event: message_start\ndata: ${JSON.stringify({
+    type: "message_start",
+    message: {
+      id: messageId,
+      type: "message",
+      role: "assistant",
+      content: [],
+      model,
+      usage: { input_tokens: 0, output_tokens: 0 },
+    },
+  })}\n\n`);
+
+  // content_block_start
+  events.push(`event: content_block_start\ndata: ${JSON.stringify({
+    type: "content_block_start",
+    index: 0,
+    content_block: { type: "text", text: "" },
+  })}\n\n`);
+
+  // content_block_delta (the actual message)
+  events.push(`event: content_block_delta\ndata: ${JSON.stringify({
+    type: "content_block_delta",
+    index: 0,
+    delta: { type: "text_delta", text: CONTEXT_OVERFLOW_MESSAGE },
+  })}\n\n`);
+
+  // content_block_stop
+  events.push(`event: content_block_stop\ndata: ${JSON.stringify({
+    type: "content_block_stop",
+    index: 0,
+  })}\n\n`);
+
+  // message_delta (end_turn)
+  events.push(`event: message_delta\ndata: ${JSON.stringify({
+    type: "message_delta",
+    delta: { stop_reason: "end_turn" },
+    usage: { output_tokens: 0 },
+  })}\n\n`);
+
+  // message_stop
+  events.push(`event: message_stop\ndata: ${JSON.stringify({
+    type: "message_stop",
+  })}\n\n`);
+
+  return new Response(events.join(""), {
+    status: 200,
+    headers: {
+      "Content-Type": "text/event-stream",
+      "X-Codex-Plugin-Synthetic": "true",
+      "X-Codex-Plugin-Error-Type": "context_overflow",
+    },
+  });
+}
+
+/**
+ * Check response for context overflow and return synthetic response if needed
+ */
+export async function handleContextOverflow(
+  response: Response,
+  model?: string,
+): Promise<{ handled: true; response: Response } | { handled: false }> {
+  if (response.status !== 400) {
+    return { handled: false };
+  }
+
+  try {
+    const bodyText = await response.clone().text();
+    if (isContextOverflowError(response.status, bodyText)) {
+      console.log(`[${PLUGIN_NAME}] Context overflow detected, returning synthetic response`);
+      return {
+        handled: true,
+        response: createContextOverflowResponse(model),
+      };
+    }
+  } catch {
+    // Ignore read errors
+  }
+
+  return { handled: false };
+}
diff --git a/lib/request/helpers/input-utils.ts b/lib/request/helpers/input-utils.ts
@@ -208,3 +208,53 @@ export const normalizeOrphanedToolOutputs = (
 		return item;
 	});
 };
+
+const CANCELLED_TOOL_OUTPUT = "Operation cancelled by user";
+
+const collectOutputCallIds = (input: InputItem[]): Set<string> => {
+	const outputCallIds = new Set<string>();
+	for (const item of input) {
+		if (
+			item.type === "function_call_output" ||
+			item.type === "local_shell_call_output" ||
+			item.type === "custom_tool_call_output"
+		) {
+			const callId = getCallId(item);
+			if (callId) outputCallIds.add(callId);
+		}
+	}
+	return outputCallIds;
+};
+
+export const injectMissingToolOutputs = (input: InputItem[]): InputItem[] => {
+	const outputCallIds = collectOutputCallIds(input);
+	const result: InputItem[] = [];
+
+	for (const item of input) {
+		result.push(item);
+
+		if (
+			item.type === "function_call" ||
+			item.type === "local_shell_call" ||
+			item.type === "custom_tool_call"
+		) {
+			const callId = getCallId(item);
+			if (callId && !outputCallIds.has(callId)) {
+				const outputType =
+					item.type === "function_call"
+						? "function_call_output"
+						: item.type === "local_shell_call"
+							? "local_shell_call_output"
+							: "custom_tool_call_output";
+
+				result.push({
+					type: outputType,
+					call_id: callId,
+					output: CANCELLED_TOOL_OUTPUT,
+				} as unknown as InputItem);
+			}
+		}
+	}
+
+	return result;
+};
diff --git a/lib/request/request-transformer.ts b/lib/request/request-transformer.ts
@@ -6,6 +6,7 @@ import { getNormalizedModel } from "./helpers/model-map.js";
 import {
 	filterOpenCodeSystemPromptsWithCachedPrompt,
 	normalizeOrphanedToolOutputs,
+	injectMissingToolOutputs,
 } from "./helpers/input-utils.js";
 import type {
 	ConfigOptions,
@@ -498,6 +499,7 @@ export async function transformRequestBody(
 		// convert them to messages to preserve context while avoiding API errors
 		if (body.input) {
 			body.input = normalizeOrphanedToolOutputs(body.input);
+			body.input = injectMissingToolOutputs(body.input);
 		}
 	}
 
diff --git a/package.json b/package.json
@@ -1,6 +1,6 @@
 {
   "name": "opencode-openai-codex-auth-multi",
-  "version": "4.5.0",
+  "version": "4.6.0",
   "description": "Fork of opencode-openai-codex-auth with multi-account rotation (ChatGPT OAuth / Codex backend)",
   "main": "./dist/index.js",
   "types": "./dist/index.d.ts",
diff --git a/test/context-overflow.test.ts b/test/context-overflow.test.ts
diff --git a/test/input-utils.test.ts b/test/input-utils.test.ts

Original file line number	Diff line number	Diff line change
`@@ -6,6 +6,7 @@ import { getNormalizedModel } from "./helpers/model-map.js";`
`6`	`6`	`import {`
`7`	`7`	`filterOpenCodeSystemPromptsWithCachedPrompt,`
`8`	`8`	`normalizeOrphanedToolOutputs,`
	`9`	`+ injectMissingToolOutputs,`
`9`	`10`	`} from "./helpers/input-utils.js";`
`10`	`11`	`import type {`
`11`	`12`	`ConfigOptions,`
`@@ -498,6 +499,7 @@ export async function transformRequestBody(`
`498`	`499`	`// convert them to messages to preserve context while avoiding API errors`
`499`	`500`	`if (body.input) {`
`500`	`501`	`body.input = normalizeOrphanedToolOutputs(body.input);`
	`502`	`+ body.input = injectMissingToolOutputs(body.input);`
`501`	`503`	`}`
`502`	`504`	`}`
`503`	`505`
Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,6 @@`
`1`	`1`	`{`
`2`	`2`	`"name": "opencode-openai-codex-auth-multi",`
`3`		`- "version": "4.5.0",`
	`3`	`+ "version": "4.6.0",`
`4`	`4`	`"description": "Fork of opencode-openai-codex-auth with multi-account rotation (ChatGPT OAuth / Codex backend)",`
`5`	`5`	`"main": "./dist/index.js",`
`6`	`6`	`"types": "./dist/index.d.ts",`