Kilo-Org · alex-alecu · Jun 18, 2026 · Jun 18, 2026 · kilo-code-bot · Jun 18, 2026
diff --git a/apps/web/src/app/(app)/code-reviews/[reviewId]/CodeReviewDetailClient.tsx b/apps/web/src/app/(app)/code-reviews/[reviewId]/CodeReviewDetailClient.tsx
@@ -5,6 +5,7 @@ import { Button } from '@/components/ui/button';
 import { Card, CardContent, CardHeader, CardTitle } from '@/components/ui/card';
 import { PageContainer } from '@/components/layouts/PageContainer';
 import { CodeReviewStreamView } from '@/components/code-reviews/CodeReviewStreamView';
+import { formatTokenCount } from '@/lib/code-reviews/summary/usage-footer';
 import {
   ExternalLink,
   GitPullRequest,
@@ -55,6 +56,10 @@ type CodeReviewDetailClientProps = {
   reviewId: string;
 };
 
+function formatAvailableTokenCount(count: number | null): string {
+  return count == null ? '—' : formatTokenCount(count);
+}
+
 export function CodeReviewDetailClient({ reviewId }: CodeReviewDetailClientProps) {
   const trpc = useTRPC();
   const queryClient = useQueryClient();
@@ -268,12 +273,15 @@ export function CodeReviewDetailClient({ reviewId }: CodeReviewDetailClientProps
                 <dd>${(review.total_cost_musd / 1_000_000).toFixed(4)}</dd>
               </div>
             )}
-            {(review.total_tokens_in != null || review.total_tokens_out != null) && (
+            {(data.tokenUsage.input != null ||
+              data.tokenUsage.output != null ||
+              data.tokenUsage.cached != null) && (
               <div>
                 <dt className="text-muted-foreground">Tokens</dt>
-                <dd>
-                  {review.total_tokens_in?.toLocaleString() ?? '—'} in /{' '}
-                  {review.total_tokens_out?.toLocaleString() ?? '—'} out
+                <dd className="tabular-nums">
+                  Input {formatAvailableTokenCount(data.tokenUsage.input)} / Output{' '}
+                  {formatAvailableTokenCount(data.tokenUsage.output)} / Cached{' '}
+                  {formatAvailableTokenCount(data.tokenUsage.cached)}
                 </dd>
               </div>
             )}

diff --git a/apps/web/src/app/api/internal/code-review-status/[reviewId]/route.test.ts b/apps/web/src/app/api/internal/code-review-status/[reviewId]/route.test.ts
@@ -1317,6 +1317,8 @@ describe('POST /api/internal/code-review-status/[reviewId]', () => {
           model: 'anthropic/claude-sonnet-4.6',
           totalTokensIn: 100_001,
           totalTokensOut: 0,
+          totalCachedTokens: 0,
+          totalUncachedTokens: 100_001,
           totalCostMusd: 200_000,
         },
       },
@@ -1326,6 +1328,8 @@ describe('POST /api/internal/code-review-status/[reviewId]', () => {
           model: 'anthropic/claude-sonnet-4.6',
           totalTokensIn: 60_000,
           totalTokensOut: 40_000,
+          totalCachedTokens: 0,
+          totalUncachedTokens: 60_000,
           totalCostMusd: 200_000,
         },
       },
@@ -1335,6 +1339,8 @@ describe('POST /api/internal/code-review-status/[reviewId]', () => {
           model: 'anthropic/claude-sonnet-4.6',
           totalTokensIn: 100_001,
           totalTokensOut: 0,
+          totalCachedTokens: 0,
+          totalUncachedTokens: 100_001,
           totalCostMusd: 199_999,
         },
       },
@@ -1344,6 +1350,8 @@ describe('POST /api/internal/code-review-status/[reviewId]', () => {
           model: 'anthropic/claude-sonnet-4.6',
           totalTokensIn: 99_999,
           totalTokensOut: 0,
+          totalCachedTokens: 0,
+          totalUncachedTokens: 99_999,
           totalCostMusd: 200_000,
         },
       },
@@ -1575,6 +1583,8 @@ describe('POST /api/internal/code-review-status/[reviewId]', () => {
         model: 'anthropic/claude-sonnet-4.6',
         totalTokensIn: 99_999,
         totalTokensOut: 0,
+        totalCachedTokens: 0,
+        totalUncachedTokens: 99_999,
         totalCostMusd: 200_000,
       });
 
@@ -1614,6 +1624,8 @@ describe('POST /api/internal/code-review-status/[reviewId]', () => {
           model: 'anthropic/claude-sonnet-4.6',
           totalTokensIn: 99_999,
           totalTokensOut: 0,
+          totalCachedTokens: 0,
+          totalUncachedTokens: 99_999,
           totalCostMusd: 199_999,
         },
       },
@@ -2762,11 +2774,21 @@ describe('POST /api/internal/code-review-status/[reviewId]', () => {
         repository_review_instructions_used: true,
         repository_review_instructions_ref: 'main',
         repository_review_instructions_truncated: false,
+        cli_session_id: 'ses_review_with_cache',
         model: 'anthropic/claude-sonnet-4.6',
         total_tokens_in: 1000,
         total_tokens_out: 200,
+        completed_at: '2025-01-01T00:10:00Z',
       });
       mockGetCodeReviewById.mockResolvedValue(review);
+      mockGetSessionUsageFromBilling.mockResolvedValue({
+        model: 'openai/gpt-4o',
+        totalTokensIn: 1000,
+        totalTokensOut: 200,
+        totalCachedTokens: 800,
+        totalUncachedTokens: 200,
+        totalCostMusd: 100,
+      });
 
       await POST(makeRequest({ status: 'completed' }), makeParams(REVIEW_ID));
 
@@ -2783,8 +2805,23 @@ describe('POST /api/internal/code-review-status/[reviewId]', () => {
         null,
         { maxBodyCharacters: 65_536, reservedCharacters: 8 }
       );
+      expect(mockGetSessionUsageFromBilling).toHaveBeenCalledWith(
+        'ses_review_with_cache',
+        '2025-01-01T00:00:00Z',
+        '2025-01-01T00:10:00Z'
+      );
+      expect(mockUpdateCodeReviewUsage).toHaveBeenCalledWith(REVIEW_ID, {
+        totalTokensIn: 1000,
+        totalTokensOut: 200,
+        totalCostMusd: 100,
+      });
       expect(mockAppendReviewSummaryFooter).toHaveBeenCalledWith('existing body', {
-        usage: { model: 'anthropic/claude-sonnet-4.6', tokensIn: 1000, tokensOut: 200 },
+        usage: {
+          model: 'anthropic/claude-sonnet-4.6',
+          tokensIn: 200,
+          tokensOut: 200,
+          cachedTokens: 800,
+        },
         reviewGuidance: { used: true, ref: 'main', truncated: false },
       });
       expect(mockUpdateKiloReviewComment).toHaveBeenCalledWith(
@@ -2820,7 +2857,12 @@ describe('POST /api/internal/code-review-status/[reviewId]', () => {
         'https://gitlab.com'
       );
       expect(mockAppendReviewSummaryFooter).toHaveBeenCalledWith('existing note body', {
-        usage: { model: 'anthropic/claude-sonnet-4.6', tokensIn: 1000, tokensOut: 200 },
+        usage: {
+          model: 'anthropic/claude-sonnet-4.6',
+          tokensIn: 1000,
+          tokensOut: 200,
+          cachedTokens: null,
+        },
         reviewGuidance: { used: true, ref: 'main', truncated: true },
       });
       expect(mockUpdateKiloReviewNote).toHaveBeenCalledWith(

diff --git a/apps/web/src/app/api/internal/code-review-status/[reviewId]/route.ts b/apps/web/src/app/api/internal/code-review-status/[reviewId]/route.ts
@@ -573,8 +573,9 @@ const BILLING_NOTICE_BODY = `${BILLING_NOTICE_MARKER}
  * For v2 (cloud-agent-next) the orchestrator never writes usage — we
  * skip the poll and go straight to the billing tables.
  *
- * When the billing fallback is used we also back-fill the code_reviews
- * record so later reads (e.g. admin panel) don't repeat the aggregation.
+ * Billing usage is preferred when a CLI session is available because the
+ * persisted review columns do not include cache details. Raw cache-inclusive
+ * input, output, and cost totals are still back-filled for later reads.
  */
 async function getReviewUsageData(reviewId: string) {
   let review = await getCodeReviewById(reviewId);
@@ -591,21 +592,15 @@ async function getReviewUsageData(reviewId: string) {
     }
   }
 
-  if (review?.model) {
-    return {
-      model: review.model,
-      tokensIn: review.total_tokens_in ?? null,
-      tokensOut: review.total_tokens_out ?? null,
-    };
-  }
-
-  // Fallback: aggregate from billing tables (covers v2 / cloud-agent-next reviews)
   if (review?.cli_session_id && review.created_at) {
-    const billing = await getSessionUsageFromBilling(review.cli_session_id, review.created_at);
+    const billing = await getSessionUsageFromBilling(
+      review.cli_session_id,
+      review.created_at,
+      review.completed_at ?? undefined
+    );
     if (billing) {
-      // Back-fill the code_reviews record so we don't repeat this aggregation
       updateCodeReviewUsage(reviewId, {
-        model: billing.model,
+        ...(review.model == null ? { model: billing.model } : {}),
         totalTokensIn: billing.totalTokensIn,
         totalTokensOut: billing.totalTokensOut,
         totalCostMusd: billing.totalCostMusd,
@@ -614,14 +609,24 @@ async function getReviewUsageData(reviewId: string) {
       });
 
       return {
-        model: billing.model,
-        tokensIn: billing.totalTokensIn,
+        model: review.model ?? billing.model,
+        tokensIn: billing.totalUncachedTokens,
         tokensOut: billing.totalTokensOut,
+        cachedTokens: billing.totalCachedTokens,
       };
     }
   }
 
-  return { model: null, tokensIn: null, tokensOut: null };
+  if (review?.model) {
+    return {
+      model: review.model,
+      tokensIn: review.total_tokens_in ?? null,
+      tokensOut: review.total_tokens_out ?? null,
+      cachedTokens: null,
+    };
+  }
+
+  return { model: null, tokensIn: null, tokensOut: null, cachedTokens: null };
 }
 
 function getReviewGuidanceFooterData(review: CloudAgentCodeReview) {
@@ -1455,10 +1460,11 @@ export async function POST(
 
               // Summary history and footer (completed only)
               if (status === 'completed') {
-                const { model, tokensIn, tokensOut } = await getReviewUsageData(reviewId);
+                const { model, tokensIn, tokensOut, cachedTokens } =
+                  await getReviewUsageData(reviewId);
                 const usage =
                   model && tokensIn != null && tokensOut != null
-                    ? { model, tokensIn, tokensOut }
+                    ? { model, tokensIn, tokensOut, cachedTokens }
                     : undefined;
                 const reviewGuidance = getReviewGuidanceFooterData(review);
                 const summaryFooter = { usage, reviewGuidance };
@@ -1548,10 +1554,11 @@ export async function POST(
 
               // Summary history and footer (completed only)
               if (status === 'completed') {
-                const { model, tokensIn, tokensOut } = await getReviewUsageData(reviewId);
+                const { model, tokensIn, tokensOut, cachedTokens } =
+                  await getReviewUsageData(reviewId);
                 const usage =
                   model && tokensIn != null && tokensOut != null
-                    ? { model, tokensIn, tokensOut }
+                    ? { model, tokensIn, tokensOut, cachedTokens }
                     : undefined;
                 const reviewGuidance = getReviewGuidanceFooterData(review);
 

diff --git a/apps/web/src/lib/code-reviews/db/code-reviews.test.ts b/apps/web/src/lib/code-reviews/db/code-reviews.test.ts
@@ -3,9 +3,11 @@ import {
   cloud_agent_code_review_attempts,
   cloud_agent_code_reviews,
   kilocode_users,
+  microdollar_usage,
+  microdollar_usage_metadata,
   platform_integrations,
 } from '@kilocode/db/schema';
-import { eq } from 'drizzle-orm';
+import { eq, inArray } from 'drizzle-orm';
 import { insertTestUser } from '@/tests/helpers/user.helper';
 import type { User } from '@kilocode/db/schema';
 import {
@@ -14,6 +16,7 @@ import {
   createCodeReviewAttempt,
   createInfraRetryAttemptIfMissing,
   getCodeReviewAttemptForReview,
+  getSessionUsageFromBilling,
   listCodeReviewAttempts,
   updateCodeReviewAttemptForCallback,
   findPreviousCompletedReview,
@@ -618,3 +621,74 @@ describe('findPreviousCompletedReview', () => {
     ).rejects.toThrow('not found');
   });
 });
+
+describe('getSessionUsageFromBilling', () => {
+  const usageIds: string[] = [];
+
+  afterEach(async () => {
+    if (usageIds.length === 0) return;
+
+    await db
+      .delete(microdollar_usage_metadata)
+      .where(inArray(microdollar_usage_metadata.id, usageIds));
+    await db.delete(microdollar_usage).where(inArray(microdollar_usage.id, usageIds));
+    usageIds.length = 0;
+  });
+
+  it('excludes later usage when a completed review session is reused', async () => {
+    const sessionId = `ses_usage_window_${crypto.randomUUID()}`;
+    const firstUsageId = crypto.randomUUID();
+    const laterUsageId = crypto.randomUUID();
+    usageIds.push(firstUsageId, laterUsageId);
+
+    await db.insert(microdollar_usage).values([
+      {
+        id: firstUsageId,
+        kilo_user_id: 'code-review-usage-test',
+        cost: 100,
+        input_tokens: 1000,
+        output_tokens: 100,
+        cache_write_tokens: 100,
+        cache_hit_tokens: 600,
+        created_at: '2026-06-18T10:00:00.000Z',
+        model: 'anthropic/claude-sonnet-4.6',
+      },
+      {
+        id: laterUsageId,
+        kilo_user_id: 'code-review-usage-test',
+        cost: 200,
+        input_tokens: 2000,
+        output_tokens: 200,
+        cache_write_tokens: 200,
+        cache_hit_tokens: 1200,
+        created_at: '2026-06-18T12:00:00.000Z',
+        model: 'openai/gpt-4o',
+      },
+    ]);
+    await db.insert(microdollar_usage_metadata).values([
+      {
+        id: firstUsageId,
+        message_id: `msg_${firstUsageId}`,
+        session_id: sessionId,
+        created_at: '2026-06-18T10:00:00.000Z',
+      },
+      {
+        id: laterUsageId,
+        message_id: `msg_${laterUsageId}`,
+        session_id: sessionId,
+        created_at: '2026-06-18T12:00:00.000Z',
+      },
+    ]);
+
+    await expect(
+      getSessionUsageFromBilling(sessionId, '2026-06-18T09:00:00.000Z', '2026-06-18T11:00:00.000Z')
+    ).resolves.toEqual({
+      model: 'anthropic/claude-sonnet-4.6',
+      totalTokensIn: 1000,
+      totalTokensOut: 100,
+      totalCachedTokens: 700,
+      totalUncachedTokens: 300,
+      totalCostMusd: 100,
+    });
+  });
+});