feat(telemetry): add skill usage telemetry

rev-rwasilewski · rev-rwasilewski · commit 5d11123bf693 · 2026-06-19T18:26:54.000+02:00
diff --git a/README.md b/README.md
@@ -47,6 +47,7 @@ An [opencode](https://opencode.ai) plugin that exports telemetry via OpenTelemet
 | `opencode.session.cost.total` | Histogram | Total cost per session in USD, recorded on idle |
 | `opencode.model.usage` | Counter | Messages per model and provider |
 | `opencode.retry.count` | Counter | API retries observed via `session.status` events |
+| `opencode.skill.count` | Counter | Skill command invocations, counted only for commands that opencode reports with `source=skill` metadata |
 
 ### Log events
 
@@ -60,6 +61,7 @@ An [opencode](https://opencode.ai) plugin that exports telemetry via OpenTelemet
 | `api_error` | Failed assistant message (error summary, duration) |
 | `tool_result` | Tool completed or errored (duration, success, output size) |
 | `tool_decision` | Permission prompt answered (accept/reject) |
+| `skill_invoked` | Skill command invoked (includes skill name, command name, optional agent/subtask metadata, and argument length) |
 | `commit` | Git commit detected |
 
 ## Installation
@@ -165,7 +167,7 @@ Disabling a metric only stops the counter/histogram from being incremented — t
 export OPENCODE_DISABLE_METRICS="retry.count"
 
 # Disable multiple metrics
-export OPENCODE_DISABLE_METRICS="cache.count,session.duration,session.token.total,session.cost.total,model.usage,retry.count,message.count"
+export OPENCODE_DISABLE_METRICS="cache.count,session.duration,session.token.total,session.cost.total,model.usage,retry.count,message.count,skill.count"
 
 # Disable the new per-session cumulative gauge while keeping the delta counter
 export OPENCODE_DISABLE_METRICS="lines_of_code.total"
@@ -176,7 +178,7 @@ export OPENCODE_DISABLE_METRICS="lines_of_code.total"
 The following metrics are specific to opencode and have no equivalent in Claude Code's built-in monitoring. If you are using a Claude Code dashboard and want to avoid cluttering it with opencode-only metrics, you can disable them:
 
 ```bash
-export OPENCODE_DISABLE_METRICS="cache.count,session.duration,session.token.total,session.cost.total,model.usage,retry.count,message.count"
+export OPENCODE_DISABLE_METRICS="cache.count,session.duration,session.token.total,session.cost.total,model.usage,retry.count,message.count,skill.count"
 ```
 
 | Metric suffix | Why it's opencode-only |
@@ -188,6 +190,7 @@ export OPENCODE_DISABLE_METRICS="cache.count,session.duration,session.token.tota
 | `model.usage` | Per-model message counter — not emitted by Claude Code |
 | `retry.count` | API retry counter — not emitted by Claude Code |
 | `message.count` | Completed message counter — not emitted by Claude Code |
+| `skill.count` | opencode skill command counter — not emitted by Claude Code |
 
 ### Disabling OTLP logs
 
diff --git a/src/handlers/skill.ts b/src/handlers/skill.ts
@@ -0,0 +1,208 @@
+import { SeverityNumber } from "@opentelemetry/api-logs"
+import { isMetricEnabled } from "../util.ts"
+import type { HandlerContext, PluginLogger } from "../types.ts"
+
+/** Validated metadata for a catalog command whose `source` is `"skill"`. */
+type SkillCommandInfo = {
+  name: string
+  description?: string
+  agent?: string
+  subtask?: boolean
+}
+
+/** Unvalidated catalog entry; every field stays `unknown` until `rawSkillCommand` checks it. */
+type RawCommand = {
+  name?: unknown
+  source?: unknown
+  description?: unknown
+  agent?: unknown
+  subtask?: unknown
+}
+
+/** Minimal client shape this module relies on; `command.list` is optional and probed at runtime. */
+type CommandListClient = {
+  command?: {
+    list(options?: { query?: { directory?: string; workspace?: string } }): Promise<{ data?: unknown; error?: unknown } | unknown>
+  }
+}
+
+/** Input accepted by `handleCommandExecuteBefore`. */
+type CommandExecuteInput = {
+  command: string
+  sessionID: string
+  arguments: string
+}
+
+/** Result of one catalog lookup: `ok` says whether the source answered, `commands` holds the skill entries found. */
+type SkillCommandLookup = {
+  ok: boolean
+  commands: SkillCommandInfo[]
+}
+
+/**
+ * Validates one raw catalog entry and narrows it to skill metadata.
+ *
+ * @param command - Untrusted catalog entry.
+ * @returns The skill metadata, or `undefined` when the entry is not a
+ *   `source === "skill"` command or has no string `name`. Optional fields are
+ *   copied only when they have the expected primitive type.
+ */
+function rawSkillCommand(command: RawCommand): SkillCommandInfo | undefined {
+  if (command.source !== "skill") return undefined
+  const name = command.name
+  if (typeof name !== "string") return undefined
+
+  const info: SkillCommandInfo = { name }
+  const { description, agent, subtask } = command
+  if (typeof description === "string") info.description = description
+  if (typeof agent === "string") info.agent = agent
+  if (typeof subtask === "boolean") info.subtask = subtask
+  return info
+}
+
+/**
+ * Extracts the skill commands from a command-catalog response.
+ *
+ * The catalog array may arrive bare or wrapped in up to two `data` envelopes
+ * (`{ data: [...] }` or `{ data: { data: [...] } }`); both layers are peeled
+ * off before the array check.
+ *
+ * @param payload - Untrusted response body or client result.
+ * @returns Every entry accepted by `rawSkillCommand`; an empty array when the
+ *   unwrapped payload is not an array.
+ */
+function commandsFromPayload(payload: unknown): SkillCommandInfo[] {
+  let candidate: unknown = payload
+  for (let depth = 0; depth < 2; depth++) {
+    if (candidate && typeof candidate === "object" && "data" in candidate) {
+      candidate = (candidate as { data?: unknown }).data
+    }
+  }
+  if (!Array.isArray(candidate)) return []
+
+  const skills: SkillCommandInfo[] = []
+  for (const entry of candidate) {
+    // A null/undefined/primitive entry must not abort the whole catalog:
+    // reading `.source` on null would throw and discard every valid command.
+    if (entry === null || typeof entry !== "object") continue
+    const skill = rawSkillCommand(entry as RawCommand)
+    if (skill) skills.push(skill)
+  }
+  return skills
+}
+
+/**
+ * Looks up skill commands through the SDK client's `command.list` method.
+ *
+ * @param client - Client that may or may not expose `command.list`.
+ * @param directory - Optional directory forwarded as `query.directory`.
+ * @returns `ok: false` when the client has no `command.list` or the response
+ *   carries a defined `error`; otherwise `ok: true` with the parsed skills.
+ *   Rejections from `command.list` propagate to the caller.
+ */
+async function clientSkillCommands(client: CommandListClient, directory: string | undefined): Promise<SkillCommandLookup> {
+  const failed = (): SkillCommandLookup => ({ ok: false, commands: [] })
+  if (!client.command?.list) return failed()
+
+  const options = directory ? { query: { directory } } : undefined
+  const response = await client.command.list(options)
+  if (response && typeof response === "object" && "error" in response) {
+    const { error } = response as { error?: unknown }
+    if (error !== undefined) return failed()
+  }
+  return { ok: true, commands: commandsFromPayload(response) }
+}
+
+/**
+ * Fetches the command catalog directly from the server over HTTP.
+ *
+ * @param serverUrl - Base URL the endpoint path is resolved against.
+ * @param directory - Optional directory; sent as `location[directory]` for
+ *   `/api/command` and as `directory` for `/command`.
+ * @param path - Which catalog endpoint to query.
+ * @returns `ok: false` when `response.ok` is false; otherwise `ok: true` with
+ *   the parsed skills. The request is aborted after 1 second; fetch and JSON
+ *   errors propagate to the caller.
+ */
+async function rawSkillCommands(serverUrl: URL, directory: string | undefined, path: "/command" | "/api/command"): Promise<SkillCommandLookup> {
+  const endpoint = new URL(path, serverUrl)
+  if (directory) {
+    const param = path === "/api/command" ? "location[directory]" : "directory"
+    endpoint.searchParams.set(param, directory)
+  }
+
+  const abort = new AbortController()
+  const timer = setTimeout(() => abort.abort(), 1_000)
+  try {
+    const res = await fetch(endpoint, { signal: abort.signal })
+    if (res.ok) {
+      return { ok: true, commands: commandsFromPayload(await res.json()) }
+    }
+    return { ok: false, commands: [] }
+  } finally {
+    // Always release the timer, whether the request succeeded, failed or was aborted.
+    clearTimeout(timer)
+  }
+}
+
+/**
+ * Builds a cached resolver that maps command names to skill metadata.
+ *
+ * Catalog sources are tried in order (SDK client, `/command`, `/api/command`);
+ * later sources are consulted only while no skill command has been found.
+ *
+ * @param input - Client, server URL, optional directory and logger used for lookups.
+ * @returns `refresh(force)` to reload the catalog and `resolve(command)` to
+ *   look up one command, refreshing once on a cache miss.
+ */
+export function createSkillCommandResolver(input: {
+  client: CommandListClient
+  serverUrl: URL
+  directory?: string
+  log: PluginLogger
+}) {
+  const catalog = new Map<string, SkillCommandInfo>()
+  let refreshedAt = 0
+  let inFlight: Promise<void> | undefined
+
+  // Ordered lookup strategies, each paired with the debug message logged when it throws.
+  const sources: Array<{ failure: string; load: () => Promise<SkillCommandLookup> }> = [
+    {
+      failure: "otel: command catalog lookup failed",
+      load: () => clientSkillCommands(input.client, input.directory),
+    },
+    {
+      failure: "otel: raw command catalog lookup failed",
+      load: () => rawSkillCommands(input.serverUrl, input.directory, "/command"),
+    },
+    {
+      failure: "otel: v2 command catalog lookup failed",
+      load: () => rawSkillCommands(input.serverUrl, input.directory, "/api/command"),
+    },
+  ]
+
+  const loadCatalog = async (): Promise<void> => {
+    const found = new Map<string, SkillCommandInfo>()
+    let loaded = false
+    for (const source of sources) {
+      try {
+        const lookup = await source.load()
+        loaded = loaded || lookup.ok
+        for (const command of lookup.commands) {
+          found.set(command.name, command)
+        }
+      } catch (err) {
+        await input.log("debug", source.failure, {
+          error: err instanceof Error ? err.message : String(err),
+        })
+      }
+      // Fall through to the next source only while nothing has been found.
+      if (found.size > 0) break
+    }
+
+    if (!loaded) {
+      // No source answered: keep the previous cache and leave the throttle
+      // timestamp untouched, so the next call attempts a refresh again.
+      await input.log("debug", "otel: skill command catalog refresh skipped")
+      return
+    }
+
+    catalog.clear()
+    for (const [name, command] of found) catalog.set(name, command)
+    refreshedAt = Date.now()
+    await input.log("debug", "otel: skill command catalog refreshed", { count: catalog.size })
+  }
+
+  const refresh = async (force = false) => {
+    // Unforced refreshes are throttled to one successful load per 30 seconds.
+    if (!force && Date.now() - refreshedAt < 30_000) return
+    // Concurrent callers share the refresh that is already running.
+    if (inFlight) return inFlight
+    inFlight = loadCatalog().finally(() => {
+      inFlight = undefined
+    })
+    return inFlight
+  }
+
+  const resolve = async (command: string) => {
+    const cached = catalog.get(command)
+    if (cached) return cached
+    await refresh(false)
+    return catalog.get(command)
+  }
+
+  return { refresh, resolve }
+}
+
+/**
+ * Records telemetry for a command about to execute, if it resolves to a skill.
+ *
+ * Increments the skill counter (unless `skill.count` is disabled), always emits
+ * a `skill_invoked` log record, and writes an info line to the plugin log.
+ * Commands that do not resolve to a skill are ignored.
+ *
+ * @param input - Command name, session id and raw argument string.
+ * @param ctx - Handler context providing instruments, common attributes and loggers.
+ * @param resolveSkillCommand - Lookup from command name to skill metadata.
+ * @returns The result of the plugin-log call, or `undefined` for non-skill commands.
+ */
+export async function handleCommandExecuteBefore(
+  input: CommandExecuteInput,
+  ctx: HandlerContext,
+  resolveSkillCommand: (command: string) => Promise<SkillCommandInfo | undefined>,
+) {
+  const { command, sessionID } = input
+  const skill = await resolveSkillCommand(command)
+  if (!skill) return
+
+  // Optional attributes are added only when the catalog supplied them.
+  const agentAttr = skill.agent ? { agent: skill.agent } : {}
+  const subtaskAttr = skill.subtask !== undefined ? { subtask: skill.subtask } : {}
+  const attrs = {
+    ...ctx.commonAttrs,
+    "session.id": sessionID,
+    skill_name: skill.name,
+    command_name: command,
+    ...agentAttr,
+    ...subtaskAttr,
+  }
+
+  if (isMetricEnabled("skill.count", ctx)) {
+    ctx.instruments.skillCounter.add(1, attrs)
+  }
+
+  // Only the argument length is recorded, never the argument text itself.
+  const descriptionAttr = skill.description ? { description: skill.description } : {}
+  const logAttributes = {
+    "event.name": "skill_invoked",
+    ...attrs,
+    arguments_length: input.arguments.length,
+    ...descriptionAttr,
+  }
+
+  ctx.emitLog({
+    severityNumber: SeverityNumber.INFO,
+    severityText: "INFO",
+    timestamp: Date.now(),
+    observedTimestamp: Date.now(),
+    body: "skill_invoked",
+    attributes: logAttributes,
+  })
+
+  return ctx.log("info", "otel: skill_invoked", {
+    sessionID,
+    skill_name: skill.name,
+    command_name: command,
+  })
+}
diff --git a/src/index.ts b/src/index.ts
@@ -25,6 +25,7 @@ import { handleSessionCreated, handleSessionIdle, handleSessionError, handleSess
 import { handleMessageUpdated, handleMessagePartUpdated, startMessageSpan } from "./handlers/message.ts"
 import { handlePermissionUpdated, handlePermissionReplied } from "./handlers/permission.ts"
 import { handleSessionDiff, handleCommandExecuted } from "./handlers/activity.ts"
+import { createSkillCommandResolver, handleCommandExecuteBefore } from "./handlers/skill.ts"
 
 const PLUGIN_VERSION: string = (pkg as { version?: string }).version ?? "unknown"
 
@@ -33,7 +34,7 @@ const PLUGIN_VERSION: string = (pkg as { version?: string }).version ?? "unknown
  * Instruments metrics (sessions, tokens, cost, lines of code, commits, tool durations)
  * and structured log events. All instrumentation is gated on `OPENCODE_ENABLE_TELEMETRY`.
  */
-export const OtelPlugin: Plugin = async ({ project, client, directory, worktree }) => {
+export const OtelPlugin: Plugin = async ({ project, client, directory, worktree, serverUrl }) => {
   const config = loadConfig()
   const otlpHeadersHelper = resolveHelperPath(config.otlpHeadersHelper, directory, worktree)
   let minLevel: Level = "info"
@@ -139,6 +140,8 @@ export const OtelPlugin: Plugin = async ({ project, client, directory, worktree
     sessionInputs,
     messageOutputs,
   }
+  const skillCommands = createSkillCommandResolver({ client, serverUrl, directory: worktree ?? directory, log })
+  await skillCommands.refresh(true)
 
   async function shutdown() {
     await Promise.allSettled([meterProvider.shutdown(), loggerProvider.shutdown(), tracerProvider.shutdown()])
@@ -217,6 +220,10 @@ export const OtelPlugin: Plugin = async ({ project, client, directory, worktree
       })
     }),
 
+    "command.execute.before": safe("command.execute.before", async (input) => {
+      await handleCommandExecuteBefore(input, ctx, skillCommands.resolve)
+    }),
+
     event: safe("event", async ({ event }) => {
       switch (event.type) {
         case "session.created":
diff --git a/src/otel.ts b/src/otel.ts
@@ -209,5 +209,9 @@ export function createInstruments(prefix: string): Instruments {
       unit: "{subtask}",
       description: "Number of sub-agent invocations observed via subtask message parts",
     }),
+    skillCounter: meter.createCounter(`${prefix}skill.count`, {
+      unit: "{skill}",
+      description: "Number of skill command invocations observed via command execution hooks",
+    }),
   }
 }
diff --git a/src/types.ts b/src/types.ts
@@ -52,6 +52,7 @@ export type Instruments = {
   modelUsageCounter: Counter
   retryCounter: Counter
   subtaskCounter: Counter
+  skillCounter: Counter
 }
 
 /** Accumulated per-session totals used for gauge snapshots on session.idle. */
diff --git a/tests/handlers/disabled-metrics.test.ts b/tests/handlers/disabled-metrics.test.ts
@@ -2,6 +2,7 @@ import { describe, test, expect } from "bun:test"
 import { handleSessionCreated, handleSessionIdle, handleSessionStatus } from "../../src/handlers/session.ts"
 import { handleMessageUpdated, handleMessagePartUpdated } from "../../src/handlers/message.ts"
 import { handleSessionDiff, handleCommandExecuted } from "../../src/handlers/activity.ts"
+import { handleCommandExecuteBefore } from "../../src/handlers/skill.ts"
 import { makeCtx } from "../helpers.ts"
 import type { EventSessionCreated, EventSessionIdle, EventSessionStatus, EventMessageUpdated, EventMessagePartUpdated, EventSessionDiff, EventCommandExecuted } from "@opencode-ai/sdk"
 
@@ -226,13 +227,35 @@ describe("OPENCODE_DISABLE_METRICS", () => {
     })
   })
 
+  describe("skill.count disabled", () => {
+    test("does not increment skill counter", async () => {
+      const { ctx, counters } = makeCtx("proj_test", ["skill.count"])
+      await handleCommandExecuteBefore(
+        { command: "review", sessionID: "ses_1", arguments: "args" },
+        ctx,
+        async () => ({ name: "review" }),
+      )
+      expect(counters.skill.calls).toHaveLength(0)
+    })
+
+    test("still emits skill_invoked log record", async () => {
+      const { ctx, logger } = makeCtx("proj_test", ["skill.count"])
+      await handleCommandExecuteBefore(
+        { command: "review", sessionID: "ses_1", arguments: "args" },
+        ctx,
+        async () => ({ name: "review" }),
+      )
+      expect(logger.records.at(0)!.body).toBe("skill_invoked")
+    })
+  })
+
   describe("multiple disabled at once", () => {
     test("disabling all metrics stops all counter/histogram calls", async () => {
       const all = [
         "session.count", "token.usage", "cost.usage", "lines_of_code.count",
         "commit.count", "tool.duration", "cache.count", "session.duration",
         "message.count", "session.token.total", "session.cost.total",
-        "model.usage", "retry.count", "subtask.count",
+        "model.usage", "retry.count", "subtask.count", "skill.count",
       ]
       const { ctx, counters, histograms, gauges } = makeCtx("proj_test", all)
       const subtaskEvent = {
@@ -251,6 +274,11 @@ describe("OPENCODE_DISABLE_METRICS", () => {
       await handleMessagePartUpdated(makeToolPart("running"), ctx)
       await handleMessagePartUpdated(makeToolPart("completed"), ctx)
       await handleMessagePartUpdated(subtaskEvent, ctx)
+      await handleCommandExecuteBefore(
+        { command: "review", sessionID: "ses_1", arguments: "args" },
+        ctx,
+        async () => ({ name: "review" }),
+      )
 
       expect(counters.session.calls).toHaveLength(0)
       expect(counters.token.calls).toHaveLength(0)
@@ -262,6 +290,7 @@ describe("OPENCODE_DISABLE_METRICS", () => {
       expect(counters.lines.calls).toHaveLength(0)
       expect(counters.commit.calls).toHaveLength(0)
       expect(counters.subtask.calls).toHaveLength(0)
+      expect(counters.skill.calls).toHaveLength(0)
       expect(histograms.tool.calls).toHaveLength(0)
       expect(histograms.sessionDuration.calls).toHaveLength(0)
       expect(gauges.sessionToken.calls).toHaveLength(0)
diff --git a/tests/handlers/skill.test.ts b/tests/handlers/skill.test.ts
diff --git a/tests/helpers.ts b/tests/helpers.ts

Original file line number	Diff line number	Diff line change
`@@ -209,5 +209,9 @@ export function createInstruments(prefix: string): Instruments {`
`209`	`209`	`unit: "{subtask}",`
`210`	`210`	`description: "Number of sub-agent invocations observed via subtask message parts",`
`211`	`211`	`}),`
	`212`	`` + skillCounter: meter.createCounter(`${prefix}skill.count`, { ``
	`213`	`+ unit: "{skill}",`
	`214`	`+ description: "Number of skill command invocations observed via command execution hooks",`
	`215`	`+ }),`
`212`	`216`	`}`
`213`	`217`	`}`
Original file line number	Diff line number	Diff line change
`@@ -52,6 +52,7 @@ export type Instruments = {`
`52`	`52`	`modelUsageCounter: Counter`
`53`	`53`	`retryCounter: Counter`
`54`	`54`	`subtaskCounter: Counter`
	`55`	`+ skillCounter: Counter`
`55`	`56`	`}`
`56`	`57`
`57`	`58`	`/** Accumulated per-session totals used for gauge snapshots on session.idle. */`