amDosion
diff --git a/‎packages/builtin-tools/src/tools/LocalMemoryRecallTool/LocalMemoryRecallTool.ts‎
Lines changed: 31 additions & 0 deletions b/‎packages/builtin-tools/src/tools/LocalMemoryRecallTool/LocalMemoryRecallTool.ts‎
Lines changed: 31 additions & 0 deletions
diff --git a/‎packages/builtin-tools/src/tools/LocalMemoryRecallTool/__tests__/LocalMemoryRecallTool.test.ts‎
Lines changed: 46 additions & 0 deletions b/‎packages/builtin-tools/src/tools/LocalMemoryRecallTool/__tests__/LocalMemoryRecallTool.test.ts‎
Lines changed: 46 additions & 0 deletions
diff --git a/‎packages/builtin-tools/src/tools/VaultHttpFetchTool/VaultHttpFetchTool.ts‎
Lines changed: 21 additions & 0 deletions b/‎packages/builtin-tools/src/tools/VaultHttpFetchTool/VaultHttpFetchTool.ts‎
Lines changed: 21 additions & 0 deletions
diff --git a/‎packages/builtin-tools/src/tools/VaultHttpFetchTool/__tests__/VaultHttpFetchTool.test.ts‎
Lines changed: 90 additions & 0 deletions b/‎packages/builtin-tools/src/tools/VaultHttpFetchTool/__tests__/VaultHttpFetchTool.test.ts‎
Lines changed: 90 additions & 0 deletions
diff --git a/‎packages/builtin-tools/src/tools/VaultHttpFetchTool/__tests__/scrub.test.ts‎
Lines changed: 29 additions & 6 deletions b/‎packages/builtin-tools/src/tools/VaultHttpFetchTool/__tests__/scrub.test.ts‎
Lines changed: 29 additions & 6 deletions
diff --git a/‎packages/builtin-tools/src/tools/VaultHttpFetchTool/scrub.ts‎
Lines changed: 33 additions & 3 deletions b/‎packages/builtin-tools/src/tools/VaultHttpFetchTool/scrub.ts‎
Lines changed: 33 additions & 3 deletions
diff --git a/‎src/commands/local-vault/__tests__/parseArgs.test.ts‎
Lines changed: 50 additions & 0 deletions b/‎src/commands/local-vault/__tests__/parseArgs.test.ts‎
Lines changed: 50 additions & 0 deletions
@@ -86,7 +86,38 @@ function deriveTurnKey(context: {
   return NO_TURN_KEY
 }
 
+/**
+ * Consume `bytes` against `turnKey`'s budget. Returns false if the budget
+ * would be exceeded (caller should refuse the fetch).
+ *
+ * M4 fix (codecov-100 audit #7): explicitly document the threading model.
+ * This bookkeeper is BEST-EFFORT and NOT thread-safe in the general sense:
+ *
+ *   1. Node (V8) and Bun (JavaScriptCore) each run JS on a single
+ *      event-loop thread, so the read-modify-write sequence here
+ *      (get → check → maybe-evict → set) is atomic with respect to
+ *      other JS on the same thread. There is NO `await` between read
+ *      and write, which guarantees no interleaving with other async
+ *      tasks on the same loop.
+ *
+ *   2. We are NOT safe under multi-process / Worker concurrency. Each
+ *      process — and each Worker thread, which evaluates its own copy
+ *      of this module — gets its own `FETCH_BUDGET_USED` Map, so the
+ *      budget is per-process/per-Worker, not global. Tools are
+ *      not currently invoked across processes within one Claude turn,
+ *      so this is acceptable.
+ *
+ *   3. The budget is a SOFT limit: a crash mid-call can leak budget,
+ *      and the FIFO eviction makes the cap a heuristic, not a hard
+ *      enforcement. The HARD enforcement is the per-fetch byte cap
+ *      (FETCH_CAP_BYTES) and the per-list byte cap, which run inside
+ *      the call() body and are independent of this counter.
+ *
+ * If we ever introduce true parallelism (Worker pools sharing this
+ * counter via SharedArrayBuffer, or off-loop tool execution), this
+ * function must be migrated to Atomics or a lock — a plain Map cannot
+ * be shared across threads.
+ */
 function consumeBudget(turnKey: string, bytes: number): boolean {
+  // Read-modify-write is atomic on the JS event loop because there is no
+  // `await` between the get and the set below.
   const used = FETCH_BUDGET_USED.get(turnKey) ?? 0
   if (used + bytes > PER_TURN_FETCH_BUDGET_BYTES) return false
   // FIFO eviction by Map insertion order (Map.keys() is insertion-ordered).
 
@@ -295,6 +295,52 @@ describe('LocalMemoryRecallTool', () => {
     expect(r3.data.error).toMatch(/budget/i)
   })
 
+  // ── M4 (codecov-100 audit #7): race / interleaving guarantees ──
+  // The audit flagged the read-modify-write in consumeBudget as a potential
+  // race. We document (and pin via test) that under the realistic JS
+  // event-loop model, concurrently-issued async fetches sharing the same
+  // turnKey settle on the correct cumulative budget — no double-charges,
+  // no torn writes — because there is no `await` between get and set in
+  // the tracker, and the tracker itself is synchronous.
+  test('M4 (audit #7): concurrent fetches with same turnKey settle on correct budget', async () => {
+    const { LocalMemoryRecallTool, _resetFetchBudgetForTest } = await import(
+      '../LocalMemoryRecallTool.js'
+    )
+    _resetFetchBudgetForTest()
+    const baseDir = join(tmpDir, 'local-memory', 'race-test')
+    mkdirSync(baseDir, { recursive: true })
+    // 5 entries of 30KB each → 150KB total. Budget=100KB. Issued in
+    // parallel with the SAME turnKey, the first 3 succeed, the rest are
+    // budget_exceeded. With 30KB charge per call: 30+30+30=90KB ok, 4th
+    // would be 120KB > 100KB → exceeded. No torn-write should let two
+    // calls past the cap.
+    for (const k of ['a', 'b', 'c', 'd', 'e']) {
+      writeFileSync(join(baseDir, `${k}.md`), 'X'.repeat(30 * 1024))
+    }
+
+    const sharedCtx = {
+      messages: [{ type: 'assistant', uuid: 'race-turn' }],
+      toolUseId: 't',
+    } as never
+
+    // Fire 5 calls in parallel via Promise.all
+    const results = await Promise.all(
+      ['a', 'b', 'c', 'd', 'e'].map(key =>
+        LocalMemoryRecallTool.call(
+          { action: 'fetch', store: 'race-test', key, preview_only: false },
+          sharedCtx,
+        ),
+      ),
+    )
+
+    const exceeded = results.filter(r => r.data.budget_exceeded === true)
+    const ok = results.filter(r => r.data.budget_exceeded !== true)
+    // Exactly 3 ok (90KB), 2 exceeded (each would have reached 120KB).
+    // Pinning the counts is the critical check: 3 × 30KB successful
+    // charges means the SUM of successful charges did NOT exceed the
+    // 100KB budget.
+    expect(ok.length).toBe(3)
+    expect(exceeded.length).toBe(2)
+  })
+
   test('M9: different turnKeys do NOT share budget', async () => {
     const { LocalMemoryRecallTool, _resetFetchBudgetForTest } = await import(
       '../LocalMemoryRecallTool.js'
 
@@ -197,6 +197,27 @@ export const VaultHttpFetchTool = buildTool({
     // again for each new host. Format: `<key>@<host>`. Hosts are taken
     // from URL parsing and lowercased; the empty-host case is unreachable
     // (HTTPS guard above already accepted the URL).
+    //
+    // M2 fix (codecov-100 audit #5): the `host` property of `URL` includes
+    // the port suffix when present (e.g. `api.example.com:8080`) and
+    // wraps IPv6 literals in square brackets (e.g. `[::1]:8080`). Both are
+    // preserved verbatim in the rule content. Two consequences worth
+    // documenting:
+    //
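+    //   1. PORTS ARE PART OF THE PERMISSION SCOPE. An allow rule for
+    //      `mykey@api.example.com:8080` does NOT also allow
+    //      `api.example.com:8443` — these are distinct origins per the
+    //      RFC 6454 same-origin rule, and we deliberately mirror that
+    //      so a model cannot pivot from a sanctioned admin port to a
+    //      different one without re-asking. Note that `URL` drops the
+    //      scheme's default port, so `https://api.example.com:443/`
+    //      yields host `api.example.com`; a rule written with `:443`
+    //      will never match and must omit the port.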
+    //
+    //   2. IPv6 BRACKET ROUND-TRIP. `new URL('https://[::1]:8080/').host`
+    //      returns `[::1]:8080` (with brackets). The `permissionRule`
+    //      validator in src/utils/settings/permissionValidation.ts is
+    //      configured to accept `[A-Fa-f0-9:]+` *inside brackets* and
+    //      allows `:port` after, so the rule round-trips. If the
+    //      validator regex is ever tightened, update this code path to
+    //      strip the brackets before composing the rule.
     const targetHost = new URL(input.url).host.toLowerCase()
     const ruleContent = `${input.vault_auth_key}@${targetHost}`
     // Also offer a wildcard rule that allows any host for a given key —
 
@@ -732,6 +732,96 @@ describe('VaultHttpFetchTool: deny/allow rule branches', () => {
     )
     expect(result.behavior).toBe('allow')
   })
+
+  // ── M2 (codecov-100 audit #5): port and IPv6 host scoping ──
+  // The `host` property of `URL` includes :port and IPv6 brackets verbatim,
+  // and the rule content is built from it directly. These tests pin that
+  // contract so any future regression that strips ports (and weakens the
+  // permission scope) or strips brackets (breaking IPv6 round-trip) is
+  // caught.
+  test('M2: distinct ports on the same host are distinct permission scopes', async () => {
+    const { VaultHttpFetchTool } = await import('../VaultHttpFetchTool.js')
+    // Allow rule scoped to port 8080. Request to port 8443 must NOT match.
+    const result = await VaultHttpFetchTool.checkPermissions!(
+      {
+        vault_auth_key: 'gh-token',
+        url: 'https://api.example.com:8443/path',
+        method: 'GET',
+        auth_scheme: 'bearer',
+        reason: 'r',
+      } as never,
+      mockToolContext({
+        permissionOverrides: {
+          alwaysAllowRules: {
+            userSettings: ['VaultHttpFetch(gh-token@api.example.com:8080)'],
+            projectSettings: [],
+            localSettings: [],
+            flagSettings: [],
+            policySettings: [],
+            cliArg: [],
+            command: [],
+          },
+        },
+      }) as never,
+    )
+    // No matching allow → falls through to ask (per docstring: bypass-immune)
+    expect(result.behavior).toBe('ask')
+  })
+
+  test('M2: same port DOES match allow rule', async () => {
+    const { VaultHttpFetchTool } = await import('../VaultHttpFetchTool.js')
+    const result = await VaultHttpFetchTool.checkPermissions!(
+      {
+        vault_auth_key: 'gh-token',
+        url: 'https://api.example.com:8080/path',
+        method: 'GET',
+        auth_scheme: 'bearer',
+        reason: 'r',
+      } as never,
+      mockToolContext({
+        permissionOverrides: {
+          alwaysAllowRules: {
+            userSettings: ['VaultHttpFetch(gh-token@api.example.com:8080)'],
+            projectSettings: [],
+            localSettings: [],
+            flagSettings: [],
+            policySettings: [],
+            cliArg: [],
+            command: [],
+          },
+        },
+      }) as never,
+    )
+    expect(result.behavior).toBe('allow')
+  })
+
+  test('M2: IPv6 literal with brackets round-trips through allow rule', async () => {
+    const { VaultHttpFetchTool } = await import('../VaultHttpFetchTool.js')
+    // new URL('https://[::1]:8080/').host === '[::1]:8080' (lowercase preserved)
+    const result = await VaultHttpFetchTool.checkPermissions!(
+      {
+        vault_auth_key: 'gh-token',
+        url: 'https://[::1]:8080/path',
+        method: 'GET',
+        auth_scheme: 'bearer',
+        reason: 'r',
+      } as never,
+      mockToolContext({
+        permissionOverrides: {
+          alwaysAllowRules: {
+            userSettings: ['VaultHttpFetch(gh-token@[::1]:8080)'],
+            projectSettings: [],
+            localSettings: [],
+            flagSettings: [],
+            policySettings: [],
+            cliArg: [],
+            command: [],
+          },
+        },
+      }) as never,
+    )
+    expect(result.behavior).toBe('allow')
+  })
 })
 
 describe('VaultHttpFetchTool: call() additional paths', () => {
 
@@ -19,18 +19,41 @@ describe('buildDerivedSecretForms', () => {
     expect(buildDerivedSecretForms('XYZ')).toEqual([])
   })
 
-  test('covers all 4 forms: raw, Bearer, base64, Basic-base64', () => {
+  test('covers all 4 forms: raw, Bearer, base64, Basic-base64 (>=8 chars)', () => {
+    // M3 (audit #6): bare-base64 form is only emitted for secrets >= 8 chars
+    // (collision risk for short secrets). Use 'helloXXX' (8 chars).
+    const forms = buildDerivedSecretForms('helloXXX')
+    const b64 = Buffer.from('helloXXX', 'utf8').toString('base64')
+    expect(forms).toContain('helloXXX')
+    expect(forms).toContain('Bearer helloXXX')
+    expect(forms).toContain(b64)
+    expect(forms).toContain(`Basic ${b64}`)
+    expect(forms.length).toBe(4)
+  })
+
+  test('M3 (audit #6): short secret (4-7 chars) omits bare-base64 form', () => {
+    // 5-char secret ('hello'). Raw + Bearer + Basic-prefixed-base64 are all
+    // emitted; bare base64 is suppressed because an encoding this short
+    // (8 chars including padding) can collide with unrelated tokens in
+    // the response body.
     const forms = buildDerivedSecretForms('hello')
+    const b64 = Buffer.from('hello', 'utf8').toString('base64')
     expect(forms).toContain('hello')
     expect(forms).toContain('Bearer hello')
-    expect(forms).toContain('aGVsbG8=') // base64('hello')
-    expect(forms).toContain('Basic aGVsbG8=')
-    expect(forms.length).toBe(4)
+    expect(forms).toContain(`Basic ${b64}`)
+    expect(forms).not.toContain(b64) // bare-base64 NOT emitted
+    expect(forms.length).toBe(3)
+  })
+
+  test('M3 (audit #6): boundary at 7 vs 8 chars', () => {
+    // 7-char: bare-base64 suppressed (3 forms)
+    expect(buildDerivedSecretForms('1234567').length).toBe(3)
+    // 8-char: bare-base64 emitted (4 forms)
+    expect(buildDerivedSecretForms('12345678').length).toBe(4)
   })
 
   test('M7: returns longest-first so callers do not need to sort', () => {
-    const forms = buildDerivedSecretForms('hello')
-    // Basic <base64> is longest, raw 'hello' is shortest
+    const forms = buildDerivedSecretForms('helloXXX')
+    // Basic <base64> is longest, raw 'helloXXX' is shortest
     for (let i = 1; i < forms.length; i++) {
       expect(forms[i]!.length).toBeLessThanOrEqual(forms[i - 1]!.length)
     }
 
@@ -34,16 +34,33 @@ const SENSITIVE_HEADER_NAMES = new Set([
 ])
 
 /**
- * Minimum secret length to scrub. Below this threshold, scrubbing causes
- * pathological output amplification — e.g. a 1-char secret 'X' on a 1MB
- * body that happens to contain many X chars produces ~10MB of [REDACTED].
+ * Minimum secret length for scrubbing the RAW form. Below this threshold,
+ * scrubbing causes pathological output amplification — e.g. a 1-char
+ * secret 'X' on a 1MB body that happens to contain many X chars produces
+ * ~10MB of [REDACTED].
  *
  * 4 chars is below any realistic secret (API tokens, OAuth tokens, JWTs,
  * passwords are all >>4). The vault store should reject sub-4-char values
  * at write time, but this is defense-in-depth at scrub time.
  */
 const MIN_SCRUB_LENGTH = 4
 
+/**
+ * Minimum secret length for scrubbing the BARE base64 form.
+ *
+ * M3 fix (codecov-100 audit #6): a 4-6 char secret encodes to only 8
+ * base64 chars (padding included), short enough to collide with
+ * naturally-occurring tokens in the response body (`x4Kp` → `eDRLcA==`,
+ * which can match unrelated short identifiers). The raw, `Bearer `- and
+ * `Basic `-prefixed forms are still scrubbed for short secrets because
+ * their substring match is much more specific (e.g. `Bearer x4Kp` is
+ * unlikely to collide). For the bare base64 form we wait until the
+ * secret is >= 8 chars (yielding >= 12 base64 chars), which is
+ * the OWASP minimum for a credential and is well clear of incidental
+ * collisions. This makes the scrub more PRECISE for short secrets, not
+ * weaker on the secret itself: we still scrub the raw secret value.
+ */
+const MIN_SCRUB_BASE64_LENGTH = 8
+
 /**
  * Compute every form the secret could appear in across response body /
  * headers / error message.
@@ -54,13 +71,26 @@ const MIN_SCRUB_LENGTH = 4
  * trusting the result is non-empty. The previous JSDoc claimed "always
  * non-empty" which was inaccurate.
  *
+ * M3 fix (codecov-100 audit #6): for short secrets (4-7 chars) we omit
+ * the bare-base64 form because its encoding (only 8 chars, padding
+ * included, for a 4-6 char secret) is short enough to collide with
+ * unrelated tokens in the response body and produce spurious
+ * [REDACTED] markers. We still emit raw + Bearer + Basic-base64
+ * because those have a longer/more-specific match shape.
+ *
  * Returned forms are sorted longest-first so callers don't need to re-sort.
  */
 export function buildDerivedSecretForms(secret: string): readonly string[] {
   // Empty or sub-threshold secrets are never scrubbed: replacing a very
   // short substring everywhere would amplify the output pathologically.
   if (!secret || secret.length < MIN_SCRUB_LENGTH) return []
   const base64 = Buffer.from(secret, 'utf8').toString('base64')
   // The prefixed forms are always emitted: the literal "Basic " / "Bearer "
   // anchor makes an accidental match in the body vanishingly unlikely.
   const forms = [`Basic ${base64}`, `Bearer ${secret}`]
   // M3 fix: the bare-base64 form is only emitted once the secret reaches
   // MIN_SCRUB_BASE64_LENGTH; shorter encodings collide with unrelated
   // short tokens in the response body.
   if (secret.length >= MIN_SCRUB_BASE64_LENGTH) forms.push(base64)
   forms.push(secret)
   // Enforce the documented longest-first contract. A fixed literal order
   // is not enough: base64 grows by ~4/3, so from 16-char secrets upward
   // (and always for 22+ chars) the bare base64 form is LONGER than
   // `Bearer <secret>`. Array.prototype.sort is stable, so forms of equal
   // length keep the insertion order above.
   return forms.sort((a, b) => b.length - a.length)
 }
 
 
@@ -93,4 +93,54 @@ describe('parseLocalVaultArgs', () => {
     const r = parseLocalVaultArgs('set -k v')
     expect(r.action).toBe('invalid')
   })
+
+  // ── M1 (codecov-100 audit #4): hyphen-like Unicode prefix rejection ──
+  // U+2212 MINUS SIGN visually looks like '-' but the shell would not
+  // round-trip it back to ASCII '-'. If we accepted such keys, the user
+  // could store them but never retrieve them via the CLI.
+  describe('M1: hyphen-like Unicode prefix rejection (audit #4)', () => {
+    test('U+2212 MINUS SIGN prefix → invalid', () => {
+      const r = parseLocalVaultArgs('set −key value')
+      expect(r.action).toBe('invalid')
+      if (r.action === 'invalid') {
+        expect(r.reason.toLowerCase()).toContain('hyphen')
+      }
+    })
+
+    test('U+2010 HYPHEN prefix → invalid', () => {
+      const r = parseLocalVaultArgs('set ‐key value')
+      expect(r.action).toBe('invalid')
+    })
+
+    test('U+2013 EN DASH prefix → invalid', () => {
+      const r = parseLocalVaultArgs('set –key value')
+      expect(r.action).toBe('invalid')
+    })
+
+    test('U+2014 EM DASH prefix → invalid', () => {
+      const r = parseLocalVaultArgs('set —key value')
+      expect(r.action).toBe('invalid')
+    })
+
+    test('U+FF0D FULLWIDTH HYPHEN-MINUS prefix → invalid', () => {
+      const r = parseLocalVaultArgs('set －key value')
+      expect(r.action).toBe('invalid')
+    })
+
+    test('non-hyphen unicode prefix is still allowed (e.g. CJK)', () => {
+      // Defensive: we only reject hyphen-like; legitimate unicode keys
+      // like '日本語' must still be accepted.
+      const r = parseLocalVaultArgs('set 日本語key value')
+      expect(r.action).toBe('set')
+      if (r.action === 'set') {
+        expect(r.key).toBe('日本語key')
+        expect(r.value).toBe('value')
+      }
+    })
+
+    test('underscore prefix is still allowed (not a hyphen)', () => {
+      const r = parseLocalVaultArgs('set _under value')
+      expect(r.action).toBe('set')
+    })
+  })
 })