v1.7.7: remove IPC truncation cap, strip stray JSON fences from display, fix CUDA partial-layer fallback, strip echoed continuation prompt

Brendan Gray · Brendan Gray · commit 8604b167e7f7 · 2026-03-05T19:31:58.000-05:00
diff --git a/main/agenticChat.js b/main/agenticChat.js
@@ -1338,8 +1338,8 @@ function register(ctx) {
                 // Step 2: stream the accumulating content to the renderer
                 if (_tStart !== -1 && _tName && mainWindow && !mainWindow.isDestroyed()) {
                   const raw = _tb.slice(_tStart);
-                  // Cap at 3000 chars for IPC efficiency; frontend further caps at 1500 for display
-                  const paramsText = raw.length > 3000 ? raw.slice(0, 3000) + '\n…[truncated]' : raw;
+                  // Pass full raw JSON — no truncation
+                  const paramsText = raw;
                   mainWindow.webContents.send('llm-tool-generating', {
                     callIndex: _tIdx,
                     functionName: _tName,
@@ -1665,11 +1665,17 @@ function register(ctx) {
         // Strip tool-call JSON fences from the user-visible copy before accumulating.
         // fullResponseText (fed back to the model for context) keeps the raw text.
         // displayResponseText (committed to the chat message) should only have natural language.
-        // Targets: ```tool_call```, ```tool```, and ```json``` whose root object is a tool call.
-        // Tool-call fenced blocks are left in displayChunk so they appear as formatted code
-        // blocks in the chat bubble rather than being silently stripped to nothing.
-        const displayChunk = responseText
+        // Targets: ```tool_call```, ```tool```, and ```json``` blocks (duplicate visible text —
+        // proper tool call UI is rendered via the 'tool-executing' IPC channel instead).
+        let displayChunk = responseText
+          .replace(/\n?```(?:json|tool_call|tool)\b[\s\S]*?```\n?/g, '')
           .replace(/\n{3,}/g, '\n\n');
+        // Strip echoed continuation prompt — small models sometimes echo our bracketed
+        // instruction back as output instead of continuing. This is NOT a user-input classifier;
+        // it detects only our own constant continuation prompt string being reflected by the model.
+        if (continuationCount > 0) {
+          displayChunk = displayChunk.replace(/\[Continue your response[\s\S]*?\]/gi, '');
+        }
         displayResponseText += displayChunk;
 
         // ── SEAMLESS CONTINUATION ──
diff --git a/main/llmEngine.js b/main/llmEngine.js
@@ -391,8 +391,8 @@ class LLMEngine extends EventEmitter {
           // Previously only skipped when auto=0 — but auto can return a small nonzero count (e.g. 6)
           // that is still well below what a computed partial offload gives (e.g. 14).
           const _partialFallback = gpuModes.find(m => typeof m === 'number');
-          if (tryGpuMode === 'auto' && _partialFallback !== undefined && gpuLayers < _partialFallback) {
-            console.log(`[LLM] Auto returned ${gpuLayers} GPU layers (< partial fallback ${_partialFallback}) — trying explicit partial offload`);
+          if ((tryGpuMode === 'auto' || tryGpuMode === 'cuda') && _partialFallback !== undefined && gpuLayers < _partialFallback) {
+            console.log(`[LLM] ${tryGpuMode} returned ${gpuLayers} GPU layers (< partial fallback ${_partialFallback}) — trying explicit partial offload`);
             continue;
           }
         } catch (loadErr) {
diff --git a/package.json b/package.json
@@ -1,6 +1,6 @@
 {
   "name": "guide-ide",
-  "version": "1.7.6",
+  "version": "1.7.7",
   "description": "guIDE - AI-Powered Offline IDE with local LLM, RAG, MCP tools, browser automation, and integrated terminal",
   "author": {
     "name": "Brendan Gray",

Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,6 @@`
`1`	`1`	`{`
`2`	`2`	`"name": "guide-ide",`
`3`		`- "version": "1.7.6",`
	`3`	`+ "version": "1.7.7",`
`4`	`4`	`"description": "guIDE - AI-Powered Offline IDE with local LLM, RAG, MCP tools, browser automation, and integrated terminal",`
`5`	`5`	`"author": {`
`6`	`6`	`"name": "Brendan Gray",`