`getLlamaGpuTypes` now falls back to `"supported"` when no `include` value is provided:

```diff
@@ -18,6 +18,9 @@ export async function getLlamaGpuTypes(include: "supported" | "allValid"): Promi
     const platform = getPlatform();
     const arch = process.arch;
 
+    if (include == null)
+        include = "supported";
+
     if (include === "supported") {
         const gpuTypes = new Set(await getGpuTypesToUseForOption("auto"));
 
```
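The guard matters mostly for plain-JavaScript callers, where the TypeScript signature cannot stop `undefined` from reaching the function at runtime. A minimal usage sketch, assuming `getLlamaGpuTypes` is exported from the package root:

```ts
// Usage sketch — assumes the function is exported from the package root.
import {getLlamaGpuTypes} from "node-llama-cpp";

// A plain-JS caller can pass `undefined` despite the TS signature;
// with the new guard it is normalized to "supported" instead of
// silently matching neither branch of the function.
const gpuTypes = await getLlamaGpuTypes(undefined as unknown as "supported");
console.log(gpuTypes); // e.g. ["metal"] on an Apple Silicon Mac
```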
`LlamaChat`'s `GenerateResponseState.createNewEvaluationIterator` now copes with being asked to evaluate with no input tokens: instead of evaluating nothing, it logs a warning, erases the last token of the context sequence, and reevaluates that token:

```diff
@@ -26,6 +26,7 @@ import {LlamaModel} from "../LlamaModel/LlamaModel.js";
 import {getChatWrapperSegmentDefinition} from "../../utils/getChatWrapperSegmentDefinition.js";
 import {jsonDumps} from "../../chatWrappers/utils/jsonDumps.js";
 import {defaultMaxPreloadTokens} from "../LlamaChatSession/utils/LlamaChatSessionPromptCompletionEngine.js";
+import {LlamaLogLevel} from "../../bindings/types.js";
 import {
     eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy
 } from "./utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js";
@@ -3081,6 +3082,25 @@ class GenerateResponseState<const Functions extends ChatModelFunctions | undefin
     }
 
     public async createNewEvaluationIterator() {
+        if (this.tokens.length === 0) {
+            if (this.evaluationIterator != null)
+                return;
+
+            const token = this.llamaChat.sequence.contextTokens.at(-1);
+            if (token == null)
+                throw new Error("No tokens to evaluate");
+
+            this.llamaChat.sequence.model._llama._log(
+                LlamaLogLevel.warn,
+                "Attempted to evaluate with no input, reevaluating the last context sequence token"
+            );
+            await this.llamaChat.sequence.eraseContextTokenRanges([{
+                start: this.llamaChat.sequence.contextTokens.length - 1,
+                end: this.llamaChat.sequence.contextTokens.length
+            }]);
+            this.tokens = [token];
+        }
+
         if (this.evaluationIterator != null)
             await this.evaluationIterator.return();
 
```
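The idea behind the fallback: the evaluator needs at least one token of input, so when there is nothing new to evaluate, the last already-evaluated token is erased from the sequence and fed back in. A standalone sketch of that pattern, using hypothetical stand-in types rather than the library's real API:

```ts
// Hypothetical sketch of the "reevaluate the last token" fallback —
// the types and function below are illustrative, not the library's API.
type Token = number;

interface SequenceLike {
    contextTokens: Token[],
    eraseContextTokenRanges(ranges: Array<{start: number, end: number}>): Promise<void>
}

async function ensureEvaluationInput(sequence: SequenceLike, tokens: Token[]): Promise<Token[]> {
    if (tokens.length > 0)
        return tokens; // there is already something to evaluate

    const lastToken = sequence.contextTokens.at(-1);
    if (lastToken == null)
        throw new Error("No tokens to evaluate");

    // Erase the last token from the sequence state first, so feeding it
    // back in doesn't duplicate it in the context
    await sequence.eraseContextTokenRanges([{
        start: sequence.contextTokens.length - 1,
        end: sequence.contextTokens.length
    }]);
    return [lastToken];
}
```

The actual change also returns early when an evaluation iterator already exists, presumably so an in-flight evaluation is not restarted.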
`LlamaContextSequence` now clears its context-token bookkeeping right after disposing the underlying sequence; the snapshot taken beforehand is then reevaluated outside the lock:

```diff
@@ -1318,6 +1318,7 @@ export class LlamaContextSequence {
         const newSequenceTokens = this._contextTokens.slice();
         this._nextTokenIndex = 0;
         this._context._ctx.disposeSequence(this._sequenceId);
+        this._contextTokens = [];
 
         // wait for the evaluation outside the "context" lock to avoid deadlocks
         awaitPromise = this.evaluateWithoutGeneratingNewTokens(newSequenceTokens, {_skipLock: skipLock});
```
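Why the one-line addition: `newSequenceTokens` already holds a snapshot of the tokens to re-feed, and the sequence was just disposed, so the JS-side token list is emptied to mirror the now-empty sequence state until `evaluateWithoutGeneratingNewTokens` repopulates it. A rough sketch of that invariant, with hypothetical names:

```ts
// Illustrative sketch of the state invariant — names are hypothetical.
// After the underlying sequence is disposed, the bookkeeping array must
// be emptied so it mirrors the (now empty) sequence state; the snapshot
// is what gets reevaluated afterwards, outside the lock.
function snapshotAndReset(state: {contextTokens: number[]}): number[] {
    const snapshot = state.contextTokens.slice(); // tokens to re-feed
    state.contextTokens = [];                     // mirror the disposed sequence
    return snapshot;
}
```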