style: fix biome formatting

danielnaab · danielnaab · commit c44a9b788294 · 2026-05-07T05:25:43.000Z
diff --git a/src/entrypoints/cli/commands/evaluate.ts b/src/entrypoints/cli/commands/evaluate.ts
@@ -429,9 +429,7 @@ export async function evaluate(
     case 'layout': {
       const strategyId = args[1]
       if (!strategyId) {
-        console.error(
-          'Usage: evaluate layout <strategy-id> [--out-dir <path>]',
-        )
+        console.error('Usage: evaluate layout <strategy-id> [--out-dir <path>]')
         return 1
       }
 
@@ -466,11 +464,8 @@ export async function evaluate(
         return 1
       }
 
-      const {
-        layoutQualityKind,
-        setLayoutJudge,
-        createBedrockLayoutJudge,
-      } = await import('../../../services/evaluation')
+      const { layoutQualityKind, setLayoutJudge, createBedrockLayoutJudge } =
+        await import('../../../services/evaluation')
       const { OPUS_MODEL_ID } = await import('../../../services/extraction')
 
       const judge = createBedrockLayoutJudge(OPUS_MODEL_ID)
diff --git a/src/services/evaluation/index.ts b/src/services/evaluation/index.ts
@@ -11,21 +11,21 @@ export {
 export { runEvaluation } from './harness'
 // Judges
 export { createBedrockFieldJudge } from './judge'
-export { createBedrockLayoutJudge } from './layout-judge'
 // Kinds
 export {
-  layoutQualityKind,
-  setLayoutJudge,
   type LayoutJudge,
   type LayoutJudgeResponse,
   type LayoutQualityOutput,
+  layoutQualityKind,
+  setLayoutJudge,
 } from './kinds/layout-quality'
 export {
   type ExtractionOutput,
   pdfFieldExtractionKind,
 } from './kinds/pdf-field-extraction'
 export { createLlmJudgeKind } from './kinds/pdf-field-extraction-judge'
 export { shapingCommandsKind } from './kinds/shaping-commands'
+export { createBedrockLayoutJudge } from './layout-judge'
 // Layout judge prompt
 export { buildLayoutJudgePrompt } from './layout-judge-prompt'
 export { evaluationRunSchema } from './schemas'
diff --git a/src/services/evaluation/kinds/layout-quality.ts b/src/services/evaluation/kinds/layout-quality.ts
@@ -29,78 +29,76 @@ const DIMENSIONS = [
 
 let currentJudge: LayoutJudge | undefined
 
-export const layoutQualityKind: EvaluationKind<
-  LayoutQualityOutput,
-  undefined
-> = {
-  id: 'layout-quality',
-  description:
-    'Evaluates FormSpec layout quality using LLM-as-judge against a civic tech best practices rubric',
-
-  async score(output: LayoutQualityOutput): Promise<CaseMetrics> {
-    if (!currentJudge) {
-      throw new Error(
-        'layoutQualityKind: judge not set. Call setLayoutJudge() before scoring.',
-      )
-    }
-
-    const response = await currentJudge.judge(output.spec, output.formSpec)
-
-    const metrics: Record<string, number> = {}
-    let total = 0
-    let count = 0
-
-    for (const dim of DIMENSIONS) {
-      const entry = response.scores[dim]
-      if (entry) {
-        const normalized = (entry.score - 1) / 4 // 1-5 → 0-1
-        metrics[dim] = normalized
-        total += normalized
-        count++
+export const layoutQualityKind: EvaluationKind<LayoutQualityOutput, undefined> =
+  {
+    id: 'layout-quality',
+    description:
+      'Evaluates FormSpec layout quality using LLM-as-judge against a civic tech best practices rubric',
+
+    async score(output: LayoutQualityOutput): Promise<CaseMetrics> {
+      if (!currentJudge) {
+        throw new Error(
+          'layoutQualityKind: judge not set. Call setLayoutJudge() before scoring.',
+        )
       }
-    }
-
-    metrics.overall = count > 0 ? total / count : 0
-
-    return {
-      fixture: '',
-      metrics,
-      details: {
-        rawScores: response.scores,
-        pageCount: output.formSpec.pages.length,
-        fieldCount: output.spec.groups.reduce(
-          (sum, g) => sum + g.requirements.length,
-          0,
-        ),
-        groupCount: output.spec.groups.length,
-      },
-    }
-  },
-
-  summarize(cases: CaseMetrics[]): SummaryMetrics {
-    if (cases.length === 0) return { metrics: {} }
-
-    const metricKeys = new Set<string>()
-    for (const c of cases) {
-      for (const key of Object.keys(c.metrics)) metricKeys.add(key)
-    }
-
-    const metrics: Record<string, number> = {}
-    for (const key of metricKeys) {
-      let sum = 0
+
+      const response = await currentJudge.judge(output.spec, output.formSpec)
+
+      const metrics: Record<string, number> = {}
+      let total = 0
       let count = 0
-      for (const c of cases) {
-        if (key in c.metrics) {
-          sum += c.metrics[key]
+
+      for (const dim of DIMENSIONS) {
+        const entry = response.scores[dim]
+        if (entry) {
+          const normalized = (entry.score - 1) / 4 // 1-5 → 0-1
+          metrics[dim] = normalized
+          total += normalized
           count++
         }
       }
-      metrics[key] = count > 0 ? sum / count : 0
-    }
 
-    return { metrics }
-  },
-}
+      metrics.overall = count > 0 ? total / count : 0
+
+      return {
+        fixture: '',
+        metrics,
+        details: {
+          rawScores: response.scores,
+          pageCount: output.formSpec.pages.length,
+          fieldCount: output.spec.groups.reduce(
+            (sum, g) => sum + g.requirements.length,
+            0,
+          ),
+          groupCount: output.spec.groups.length,
+        },
+      }
+    },
+
+    summarize(cases: CaseMetrics[]): SummaryMetrics {
+      if (cases.length === 0) return { metrics: {} }
+
+      const metricKeys = new Set<string>()
+      for (const c of cases) {
+        for (const key of Object.keys(c.metrics)) metricKeys.add(key)
+      }
+
+      const metrics: Record<string, number> = {}
+      for (const key of metricKeys) {
+        let sum = 0
+        let count = 0
+        for (const c of cases) {
+          if (key in c.metrics) {
+            sum += c.metrics[key]
+            count++
+          }
+        }
+        metrics[key] = count > 0 ? sum / count : 0
+      }
+
+      return { metrics }
+    },
+  }
 
 export function setLayoutJudge(judge: LayoutJudge): void {
   currentJudge = judge
diff --git a/src/services/extraction/registry.ts b/src/services/extraction/registry.ts
@@ -128,7 +128,8 @@ export function createExtractorRegistry(
         'Hybrid extraction prompt with layout-aware FormSpec generation. Step 2 uses civic tech best practices (GOV.UK, USDS, Code for America) for adaptive page sizing, topic cohesion, and progressive disclosure.',
       status: 'experimental',
       courseTopics: ['evaluation', 'prompt-optimization', 'form-design'],
-      catalogPath: '/catalog/experiments/layout-quality/sonnet-hybrid-layout-v1',
+      catalogPath:
+        '/catalog/experiments/layout-quality/sonnet-hybrid-layout-v1',
       modelId: SONNET_MODEL_ID,
       pricing: { inputPer1k: 0.003, outputPer1k: 0.015 },
     },
diff --git a/test/evaluation/layout-quality.test.ts b/test/evaluation/layout-quality.test.ts
@@ -1,10 +1,10 @@
 import { describe, expect, test } from 'bun:test'
+import type { DataCollectionSpec } from '../../src/services/data-collection'
 import {
-  layoutQualityKind,
   type LayoutJudge,
+  layoutQualityKind,
   setLayoutJudge,
 } from '../../src/services/evaluation/kinds/layout-quality'
-import type { DataCollectionSpec } from '../../src/services/data-collection'
 import type { FormSpec } from '../../src/services/forms'
 
 describe('layoutQualityKind', () => {