
Commit 5aab4bc

anandgupta42 and claude committed
fix: remove double-deduction in isOverflow for non-limit.input models
Sentry correctly flagged that the non-limit.input path was subtracting both maxOutput and the reserved 20K buffer, causing compaction to trigger 20K tokens too early for most production models. Both paths now use a single headroom = Math.max(reserved, maxOutput). For default configs (maxOutput=32K > buffer=20K) this matches the original upstream behavior, while the P0 fix for limit.input models is preserved.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
1 parent 599537e commit 5aab4bc

2 files changed: 18 additions & 16 deletions


packages/altimate-code/src/session/compaction.ts

Lines changed: 2 additions & 3 deletions
@@ -84,9 +84,8 @@ export namespace SessionCompaction {

     const maxOutput = ProviderTransform.maxOutputTokens(input.model)
     const reserved = config.compaction?.reserved ?? COMPACTION_BUFFER
-    const usable = input.model.limit.input
-      ? input.model.limit.input - Math.max(reserved, maxOutput)
-      : context - maxOutput - reserved
+    const headroom = Math.max(reserved, maxOutput)
+    const usable = (input.model.limit.input ?? context) - headroom
     return count >= usable
   }
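For reference, here is a minimal standalone sketch of the overflow check after this fix. The function shape, the COMPACTION_BUFFER value, and the model-limit interface are simplified assumptions for illustration; the real isOverflow takes { tokens, model } as shown in the tests below.

// Hypothetical, simplified sketch of the fixed check (not the real signature).
const COMPACTION_BUFFER = 20_000 // assumed default reserve, per the commit message

interface ModelLimit {
  context: number // total context window
  input?: number  // provider-published input limit, when available
  output: number
}

function isOverflow(count: number, limit: ModelLimit, maxOutput: number, reserved = COMPACTION_BUFFER): boolean {
  // Deduct headroom exactly once: whichever is larger, the reserve buffer or max output.
  const headroom = Math.max(reserved, maxOutput)
  // Prefer the explicit input limit when the provider publishes one.
  const usable = (limit.input ?? limit.context) - headroom
  return count >= usable
}

// Worked numbers from the commit message (context=100K, maxOutput=32K, buffer=20K):
//   buggy path:  100_000 - 32_000 - 20_000 = 48_000  (compaction fired 20K tokens early)
//   fixed path:  100_000 - Math.max(20_000, 32_000) = 68_000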

packages/altimate-code/test/session/compaction-loop.test.ts

Lines changed: 16 additions & 13 deletions
@@ -409,9 +409,9 @@ describe("session.compaction.isOverflow boundary conditions", () => {
       await Instance.provide({
         directory: tmp.path,
         fn: async () => {
-          // context=100K, output=32K → usable = 100K - 32K - 20K(buffer) = 48K
+          // context=100K, output=32K → headroom = max(20K, 32K) = 32K → usable = 68K
           const model = createModel({ context: 100_000, output: 32_000 })
-          const tokens = { input: 48_000, output: 0, reasoning: 0, cache: { read: 0, write: 0 } }
+          const tokens = { input: 68_000, output: 0, reasoning: 0, cache: { read: 0, write: 0 } }
           expect(await SessionCompaction.isOverflow({ tokens, model })).toBe(true)
         },
       })
@@ -423,8 +423,8 @@ describe("session.compaction.isOverflow boundary conditions", () => {
         directory: tmp.path,
         fn: async () => {
           const model = createModel({ context: 100_000, output: 32_000 })
-          // usable = 100K - 32K - 20K = 48K; count = 47999
-          const tokens = { input: 47_999, output: 0, reasoning: 0, cache: { read: 0, write: 0 } }
+          // headroom = max(20K, 32K) = 32K → usable = 68K; count = 67999
+          const tokens = { input: 67_999, output: 0, reasoning: 0, cache: { read: 0, write: 0 } }
           expect(await SessionCompaction.isOverflow({ tokens, model })).toBe(false)
         },
       })
@@ -436,12 +436,13 @@ describe("session.compaction.isOverflow boundary conditions", () => {
         directory: tmp.path,
         fn: async () => {
           const model = createModel({ context: 100_000, output: 32_000 })
-          // total=50K > usable=48K → overflow
+          // headroom = max(20K, 32K) = 32K → usable = 68K
+          // total=70K > usable=68K → overflow
           // component sum would be 10K (not overflow) — total should take precedence
           const tokens = {
             input: 5_000, output: 5_000, reasoning: 0,
             cache: { read: 0, write: 0 },
-            total: 50_000,
+            total: 70_000,
           }
           expect(await SessionCompaction.isOverflow({ tokens, model })).toBe(true)
         },
@@ -454,9 +455,10 @@ describe("session.compaction.isOverflow boundary conditions", () => {
         directory: tmp.path,
         fn: async () => {
           const model = createModel({ context: 100_000, output: 32_000 })
-          // sum = 10K + 5K + 20K + 15K = 50K > usable 48K
+          // headroom = max(20K, 32K) = 32K → usable = 68K
+          // sum = 30K + 10K + 20K + 15K = 75K > usable 68K
           const tokens = {
-            input: 10_000, output: 5_000, reasoning: 0,
+            input: 30_000, output: 10_000, reasoning: 0,
             cache: { read: 20_000, write: 15_000 },
           }
           expect(await SessionCompaction.isOverflow({ tokens, model })).toBe(true)
@@ -502,10 +504,10 @@ describe("session.compaction.isOverflow boundary conditions", () => {
       await Instance.provide({
         directory: tmp.path,
         fn: async () => {
-          // context=200K, output=32K, reserved=50K → usable=200K-32K-50K=118K
+          // context=200K, output=32K, reserved=50K → headroom=max(50K,32K)=50K → usable=150K
           const model = createModel({ context: 200_000, output: 32_000 })
-          // 120K > 118K → overflow
-          const tokens = { input: 120_000, output: 0, reasoning: 0, cache: { read: 0, write: 0 } }
+          // 151K > 150K → overflow
+          const tokens = { input: 151_000, output: 0, reasoning: 0, cache: { read: 0, write: 0 } }
           expect(await SessionCompaction.isOverflow({ tokens, model })).toBe(true)
         },
       })
@@ -523,9 +525,10 @@ describe("session.compaction.isOverflow boundary conditions", () => {
       await Instance.provide({
         directory: tmp.path,
         fn: async () => {
-          // input=200K, output=32K, reserved=50K → reserved=max(50K,32K)=50K → usable=150K
+          // input=200K, output=32K, reserved=50K → headroom=max(50K,32K)=50K → usable=150K
           const model = createModel({ context: 200_000, input: 200_000, output: 32_000 })
-          const tokens = { input: 150_000, output: 0, reasoning: 0, cache: { read: 0, write: 0 } }
+          // 151K > 150K → overflow
+          const tokens = { input: 151_000, output: 0, reasoning: 0, cache: { read: 0, write: 0 } }
           expect(await SessionCompaction.isOverflow({ tokens, model })).toBe(true)
         },
       })
