66 BenchmarkConfigResponseSchema ,
77 BenchmarkRoutingTableResponseSchema ,
88 BenchmarkRunsResponseSchema ,
9+ DEFAULT_BENCHMARK_ORG_ID ,
10+ DEFAULT_BENCHMARK_USER_ID ,
911 StartBenchmarkRunResponseSchema ,
1012 type BenchmarkConfig ,
1113 type BenchmarkKind ,
@@ -124,9 +126,6 @@ type DeciderModelRow = {
124126
125127type AutoDeciderModelRow = AutoBenchmarkDeciderModel ;
126128
127- const DEFAULT_BENCHMARK_USER_ID = 'ce12ef3d-ae95-4d77-b4f0-23735f0a0591' ;
128- const DEFAULT_BENCHMARK_ORG_ID = '9d278969-5453-4ae3-a51f-a8d2274a7b56' ;
129-
130129export function configToFormState ( config : BenchmarkConfig | null ) : {
131130 classifierModels : string ;
132131 deciderModels : DeciderModelRow [ ] ;
@@ -144,8 +143,8 @@ export function configToFormState(config: BenchmarkConfig | null): {
144143 autoDeciderMaxCostUsd : number ;
145144} {
146145 if ( config === null ) {
147- // No config saved yet: the worker fabricates nothing , so the form starts
148- // empty and the admin must enter and save a config before running .
146+ // No config saved yet: identity fields are overrides , so blank means the
147+ // worker uses its default benchmark user and org at run time .
149148 return {
150149 classifierModels : '' ,
151150 deciderModels : [ ] ,
@@ -154,8 +153,8 @@ export function configToFormState(config: BenchmarkConfig | null): {
154153 minAccuracy : 0.7 ,
155154 switchCostFactor : 3 ,
156155 maxConcurrency : 100 ,
157- benchmarkUserId : DEFAULT_BENCHMARK_USER_ID ,
158- benchmarkOrgId : DEFAULT_BENCHMARK_ORG_ID ,
156+ benchmarkUserId : '' ,
157+ benchmarkOrgId : '' ,
159158 classifierRepetitions : 1 ,
160159 deciderRepetitions : 1 ,
161160 classifierMaxP95LatencyMs : '1000' ,
@@ -652,37 +651,35 @@ function BenchmarkConfigEditor({
652651 </ div >
653652
654653 < div className = "grid gap-4 md:grid-cols-2" >
655- { /* Benchmark user id */ }
656654 < div className = "flex flex-col gap-1.5" >
657655 < Label htmlFor = "benchmark-user-id" className = "text-sm font-medium" >
658- Benchmark user id
656+ Benchmark user override
659657 </ Label >
660658 < Input
661659 id = "benchmark-user-id"
662660 value = { form . benchmarkUserId }
663661 onChange = { e => updateForm ( prev => ( { ...prev , benchmarkUserId : e . target . value } ) ) }
664662 className = "h-8 font-mono text-xs"
665- placeholder = "(unset)"
663+ placeholder = { `Default: ${ DEFAULT_BENCHMARK_USER_ID } ` }
666664 />
667665 < p className = "text-muted-foreground text-xs" >
668- Kilo user the decider CLI authenticates as .
666+ Leave blank to run decider benchmarks as the default benchmark user .
669667 </ p >
670668 </ div >
671669
672- { /* Benchmark org id */ }
673670 < div className = "flex flex-col gap-1.5" >
674671 < Label htmlFor = "benchmark-org-id" className = "text-sm font-medium" >
675- Benchmark org id
672+ Benchmark org override
676673 </ Label >
677674 < Input
678675 id = "benchmark-org-id"
679676 value = { form . benchmarkOrgId }
680677 onChange = { e => updateForm ( prev => ( { ...prev , benchmarkOrgId : e . target . value } ) ) }
681678 className = "h-8 font-mono text-xs"
682- placeholder = "(personal credits)"
679+ placeholder = { `Default: ${ DEFAULT_BENCHMARK_ORG_ID } ` }
683680 />
684681 < p className = "text-muted-foreground text-xs" >
685- Optional org context; when set, decider runs bill org credits .
682+ Leave blank to bill decider benchmarks to the default benchmark org .
686683 </ p >
687684 </ div >
688685 </ div >
@@ -943,6 +940,7 @@ export function RoutingTableView({ data }: { data: BenchmarkRoutingTableResponse
943940 < TableHeader >
944941 < TableRow >
945942 < TableHead > Model</ TableHead >
943+ < TableHead className = "w-36" > Reasoning effort</ TableHead >
946944 < TableHead className = "text-right" > Accuracy</ TableHead >
947945 < TableHead className = "text-right" > Avg cost</ TableHead >
948946 < TableHead className = "text-right" > Cost / accuracy</ TableHead >
@@ -955,6 +953,9 @@ export function RoutingTableView({ data }: { data: BenchmarkRoutingTableResponse
955953 < TableCell className = "max-w-56 truncate font-mono text-xs" >
956954 { c . model }
957955 </ TableCell >
956+ < TableCell className = "capitalize text-xs" >
957+ { c . reasoningEffort ?? 'default' }
958+ </ TableCell >
958959 < TableCell className = "text-right tabular-nums text-xs" >
959960 { formatAccuracy ( c . accuracy ) }
960961 </ TableCell >
0 commit comments