Lower default cluster probe cap from 96 to 48

platypii · platypii · commit c5147f0a8b75 · 2026-06-25T19:06:59.000-07:00
A WildChat 1024-dim sweep finds 48, 72, and 96 probed lists give
statistically indistinguishable recall@10 at 1M and 3.2M (within ~1pp vs
exact scan, no consistent direction), while 48 reads ~42% fewer bytes at
scale. Only the default path (probe omitted) is affected; an explicit
probe is honored literally.
diff --git a/package.json b/package.json
@@ -50,10 +50,10 @@
     "hyparquet-writer": "0.16.1"
   },
   "devDependencies": {
-    "@types/node": "26.0.0",
+    "@types/node": "26.0.1",
     "@vitest/coverage-v8": "4.1.9",
     "eslint": "9.39.4",
-    "eslint-plugin-jsdoc": "63.0.7",
+    "eslint-plugin-jsdoc": "63.0.8",
     "typescript": "6.0.3",
     "vitest": "4.1.9"
   }
diff --git a/src/constants.js b/src/constants.js
@@ -31,12 +31,19 @@ export const defaultClusterIterations = 6
 export const defaultClusterProbeFraction = 0.25
 
 // Upper bound on clusters probed under the *default* fraction. Clusters grow
-// as ~sqrt(N)/2, so 0.25 x nlist keeps rising with N; measured recall knees
-// well before that at scale (~92% at 80-96 lists on 1M x 1024, vs 93% at the
-// uncapped 125). Capping the default trims ~25% of roundtrips and ~30% of
-// bytes above ~400k vectors for ~1pp recall. Only applies when `probe` is
-// left default; an explicit `probe` is honored literally.
-export const defaultClusterProbeCap = 96
+// as ~sqrt(N)/2, so 0.25 x nlist keeps rising with N, but the clusters needed
+// to reach the recall ceiling stay roughly flat (~25-45) regardless of N. A
+// WildChat 1024-dim sweep found 48, 72, and 96 lists give statistically
+// indistinguishable recall@10 at 1M and 3.2M (within ~1pp over 20 exact-scan
+// queries, no consistent direction). Their top-10 sets are not bit-identical:
+// over 200 queries, cap 48 matches cap 96 on ~93% (1M) to ~97% (3.2M); the
+// rest reshuffle near-ties at the list boundary without losing true neighbors.
+// Capping at 48 reads ~42% fewer bytes than 96 at scale with no measurable
+// recall loss; structurally, shrinking the cap can only lose recall, never
+// gain it, since the smaller cap probes a subset of the same clusters.
+// Residual misses are a rerankFactor limit, not a probe limit. The cap applies
+// only when `probe` is left default; an explicit `probe` is honored literally.
+export const defaultClusterProbeCap = 48
 
 // When `binary` is not specified at write time, the column is added once
 // the corpus is at least this large. Below the threshold, exact full scan
diff --git a/test/ranges.test.js b/test/ranges.test.js
@@ -38,7 +38,7 @@ describe('selectClusterRowRanges probe cap', () => {
   const query = Uint8Array.from([0, 0])
 
   it('caps the default fraction at the absolute ceiling for large nlist', () => {
-    // 0.25 * 500 = 125 clusters, but the default cap (96) should bind.
+    // 0.25 * 500 = 125 clusters, but the default cap should bind.
     const ranges = selectClusterRowRanges(makeMeta(500), query, undefined)
     expect(rowsCovered(ranges)).toBe(defaultClusterProbeCap)
   })