Skip to content

Commit ed7af2a

Browse files
committed
feat(instrumentation-llamaindex): migrate to OTel 1.40 GenAI semantic conventions.
1 parent d255ea4 commit ed7af2a

File tree

10 files changed

+972
-123
lines changed


packages/instrumentation-llamaindex/package.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -42,6 +42,7 @@
4242
"@opentelemetry/instrumentation": "^0.203.0",
4343
"@opentelemetry/semantic-conventions": "^1.38.0",
4444
"@traceloop/ai-semantic-conventions": "workspace:*",
45+
"@traceloop/instrumentation-utils": "workspace:*",
4546
"lodash": "^4.17.21",
4647
"tslib": "^2.8.1"
4748
},

packages/instrumentation-llamaindex/src/custom-llm-instrumentation.ts

Lines changed: 138 additions & 64 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,3 @@
1-
import * as lodash from "lodash";
21
import type * as llamaindex from "llamaindex";
32

43
import {
@@ -13,15 +12,29 @@ import {
1312
} from "@opentelemetry/api";
1413
import { safeExecuteInTheMiddle } from "@opentelemetry/instrumentation";
1514

16-
import { SpanAttributes } from "@traceloop/ai-semantic-conventions";
1715
import {
18-
ATTR_GEN_AI_COMPLETION,
19-
ATTR_GEN_AI_PROMPT,
16+
SpanAttributes,
17+
FinishReasons,
18+
} from "@traceloop/ai-semantic-conventions";
19+
import {
20+
ATTR_GEN_AI_INPUT_MESSAGES,
21+
ATTR_GEN_AI_OPERATION_NAME,
22+
ATTR_GEN_AI_OUTPUT_MESSAGES,
23+
ATTR_GEN_AI_PROVIDER_NAME,
2024
ATTR_GEN_AI_REQUEST_MODEL,
2125
ATTR_GEN_AI_REQUEST_TOP_P,
26+
ATTR_GEN_AI_RESPONSE_FINISH_REASONS,
2227
ATTR_GEN_AI_RESPONSE_MODEL,
23-
ATTR_GEN_AI_SYSTEM,
28+
ATTR_GEN_AI_USAGE_INPUT_TOKENS,
29+
ATTR_GEN_AI_USAGE_OUTPUT_TOKENS,
30+
GEN_AI_OPERATION_NAME_VALUE_CHAT,
31+
GEN_AI_PROVIDER_NAME_VALUE_OPENAI,
2432
} from "@opentelemetry/semantic-conventions/incubating";
33+
import {
34+
formatInputMessages,
35+
formatOutputMessage,
36+
mapOpenAIContentBlock,
37+
} from "@traceloop/instrumentation-utils";
2538

2639
import { LlamaIndexInstrumentationConfig } from "./types";
2740
import { shouldSendPrompts, llmGeneratorWrapper } from "./utils";
@@ -33,9 +46,21 @@ type AsyncResponseType =
3346
| AsyncIterable<llamaindex.ChatResponseChunk>
3447
| AsyncIterable<llamaindex.CompletionResponse>;
3548

49+
const classNameToProviderName: Record<string, string> = {
50+
OpenAI: GEN_AI_PROVIDER_NAME_VALUE_OPENAI,
51+
};
52+
53+
export const openAIFinishReasonMap: Record<string, string> = {
54+
stop: FinishReasons.STOP,
55+
length: FinishReasons.LENGTH,
56+
tool_calls: FinishReasons.TOOL_CALL,
57+
content_filter: FinishReasons.CONTENT_FILTER,
58+
function_call: FinishReasons.TOOL_CALL,
59+
};
60+
3661
export class CustomLLMInstrumentation {
3762
constructor(
38-
private config: LlamaIndexInstrumentationConfig,
63+
private config: () => LlamaIndexInstrumentationConfig,
3964
private diag: DiagLogger,
4065
private tracer: () => Tracer,
4166
) {}
@@ -50,44 +75,30 @@ export class CustomLLMInstrumentation {
5075
const messages = params?.messages;
5176
const streaming = params?.stream;
5277

53-
const span = plugin
54-
.tracer()
55-
.startSpan(`llamaindex.${lodash.snakeCase(className)}.chat`, {
56-
kind: SpanKind.CLIENT,
57-
});
78+
const span = plugin.tracer().startSpan(`chat ${this.metadata.model}`, {
79+
kind: SpanKind.CLIENT,
80+
});
5881

5982
try {
60-
span.setAttribute(ATTR_GEN_AI_SYSTEM, className);
83+
span.setAttribute(
84+
ATTR_GEN_AI_PROVIDER_NAME,
85+
classNameToProviderName[className] ?? className.toLowerCase(),
86+
);
6187
span.setAttribute(ATTR_GEN_AI_REQUEST_MODEL, this.metadata.model);
62-
span.setAttribute(SpanAttributes.LLM_REQUEST_TYPE, "chat");
88+
span.setAttribute(
89+
ATTR_GEN_AI_OPERATION_NAME,
90+
GEN_AI_OPERATION_NAME_VALUE_CHAT,
91+
);
6392
span.setAttribute(ATTR_GEN_AI_REQUEST_TOP_P, this.metadata.topP);
64-
if (shouldSendPrompts(plugin.config)) {
65-
for (const messageIdx in messages) {
66-
const content = messages[messageIdx].content;
67-
if (typeof content === "string") {
68-
span.setAttribute(
69-
`${ATTR_GEN_AI_PROMPT}.${messageIdx}.content`,
70-
content as string,
71-
);
72-
} else if (
73-
(content as llamaindex.MessageContentDetail[])[0].type ===
74-
"text"
75-
) {
76-
span.setAttribute(
77-
`${ATTR_GEN_AI_PROMPT}.${messageIdx}.content`,
78-
(content as llamaindex.MessageContentTextDetail[])[0].text,
79-
);
80-
}
81-
82-
span.setAttribute(
83-
`${ATTR_GEN_AI_PROMPT}.${messageIdx}.role`,
84-
messages[messageIdx].role,
85-
);
86-
}
93+
if (shouldSendPrompts(plugin.config()) && messages) {
94+
span.setAttribute(
95+
ATTR_GEN_AI_INPUT_MESSAGES,
96+
formatInputMessages(messages, mapOpenAIContentBlock),
97+
);
8798
}
8899
} catch (e) {
89100
plugin.diag.warn(e);
90-
plugin.config.exceptionLogger?.(e);
101+
plugin.config().exceptionLogger?.(e);
91102
}
92103

93104
const execContext = trace.setSpan(context.active(), span);
@@ -138,36 +149,59 @@ export class CustomLLMInstrumentation {
138149
): T {
139150
span.setAttribute(ATTR_GEN_AI_RESPONSE_MODEL, metadata.model);
140151

141-
if (!shouldSendPrompts(this.config)) {
142-
span.setStatus({ code: SpanStatusCode.OK });
143-
span.end();
144-
return result;
145-
}
146-
147152
try {
148-
if ((result as llamaindex.ChatResponse).message) {
153+
const raw = (result as any).raw;
154+
const finishReason: string | null =
155+
raw?.choices?.[0]?.finish_reason ?? null;
156+
157+
// finish_reasons: metadata, not content — always set outside shouldSendPrompts
158+
if (finishReason != null) {
159+
span.setAttribute(ATTR_GEN_AI_RESPONSE_FINISH_REASONS, [
160+
openAIFinishReasonMap[finishReason] ?? finishReason,
161+
]);
162+
}
163+
164+
// Token usage: always set when available
165+
const usage = raw?.usage;
166+
if (usage) {
167+
span.setAttribute(ATTR_GEN_AI_USAGE_INPUT_TOKENS, usage.prompt_tokens);
168+
span.setAttribute(
169+
ATTR_GEN_AI_USAGE_OUTPUT_TOKENS,
170+
usage.completion_tokens,
171+
);
149172
span.setAttribute(
150-
`${ATTR_GEN_AI_COMPLETION}.0.role`,
151-
(result as llamaindex.ChatResponse).message.role,
173+
SpanAttributes.GEN_AI_USAGE_TOTAL_TOKENS,
174+
usage.total_tokens,
152175
);
176+
}
177+
178+
// output messages: content — always set inside shouldSendPrompts
179+
if (
180+
shouldSendPrompts(this.config()) &&
181+
(result as llamaindex.ChatResponse).message
182+
) {
153183
const content = (result as llamaindex.ChatResponse).message.content;
154-
if (typeof content === "string") {
155-
span.setAttribute(`${ATTR_GEN_AI_COMPLETION}.0.content`, content);
156-
} else if (content[0].type === "text") {
157-
span.setAttribute(
158-
`${ATTR_GEN_AI_COMPLETION}.0.content`,
159-
content[0].text,
160-
);
161-
}
162-
span.setStatus({ code: SpanStatusCode.OK });
184+
// Normalize to array so mapOpenAIContentBlock handles both string and block array
185+
const contentArray = typeof content === "string" ? [content] : content;
186+
span.setAttribute(
187+
ATTR_GEN_AI_OUTPUT_MESSAGES,
188+
formatOutputMessage(
189+
contentArray,
190+
finishReason,
191+
openAIFinishReasonMap,
192+
GEN_AI_OPERATION_NAME_VALUE_CHAT,
193+
mapOpenAIContentBlock,
194+
),
195+
);
163196
}
197+
198+
span.setStatus({ code: SpanStatusCode.OK });
164199
} catch (e) {
165200
this.diag.warn(e);
166-
this.config.exceptionLogger?.(e);
201+
this.config().exceptionLogger?.(e);
167202
}
168203

169204
span.end();
170-
171205
return result;
172206
}
173207

@@ -178,14 +212,54 @@ export class CustomLLMInstrumentation {
178212
metadata: llamaindex.LLMMetadata,
179213
): T {
180214
span.setAttribute(ATTR_GEN_AI_RESPONSE_MODEL, metadata.model);
181-
if (!shouldSendPrompts(this.config)) {
182-
span.setStatus({ code: SpanStatusCode.OK });
183-
span.end();
184-
return result;
185-
}
186215

187-
return llmGeneratorWrapper(result, execContext, (message) => {
188-
span.setAttribute(`${ATTR_GEN_AI_COMPLETION}.0.content`, message);
216+
return llmGeneratorWrapper(result, execContext, (message, lastChunk) => {
217+
try {
218+
// Extract finish_reason and usage from the last chunk's raw OpenAI
219+
// response — available when stream_options: { include_usage: true }
220+
// is set on the LLM (OpenAI sends usage in the final streaming chunk).
221+
const lastRaw = lastChunk?.raw as any;
222+
const finishReason: string | null =
223+
lastRaw?.choices?.[0]?.finish_reason ?? null;
224+
const usage = lastRaw?.usage ?? null;
225+
226+
if (finishReason != null) {
227+
span.setAttribute(ATTR_GEN_AI_RESPONSE_FINISH_REASONS, [
228+
openAIFinishReasonMap[finishReason] ?? finishReason,
229+
]);
230+
}
231+
232+
if (usage) {
233+
span.setAttribute(
234+
ATTR_GEN_AI_USAGE_INPUT_TOKENS,
235+
usage.prompt_tokens,
236+
);
237+
span.setAttribute(
238+
ATTR_GEN_AI_USAGE_OUTPUT_TOKENS,
239+
usage.completion_tokens,
240+
);
241+
span.setAttribute(
242+
SpanAttributes.GEN_AI_USAGE_TOTAL_TOKENS,
243+
usage.total_tokens,
244+
);
245+
}
246+
247+
if (shouldSendPrompts(this.config())) {
248+
span.setAttribute(
249+
ATTR_GEN_AI_OUTPUT_MESSAGES,
250+
formatOutputMessage(
251+
[message],
252+
finishReason,
253+
openAIFinishReasonMap,
254+
GEN_AI_OPERATION_NAME_VALUE_CHAT,
255+
mapOpenAIContentBlock,
256+
),
257+
);
258+
}
259+
} catch (e) {
260+
this.diag.warn(e);
261+
this.config().exceptionLogger?.(e);
262+
}
189263
span.setStatus({ code: SpanStatusCode.OK });
190264
span.end();
191265
}) as any;

packages/instrumentation-llamaindex/src/instrumentation.ts

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -41,7 +41,7 @@ export class LlamaIndexInstrumentation extends InstrumentationBase {
4141
constructor(config: LlamaIndexInstrumentationConfig = {}) {
4242
super("@traceloop/instrumentation-llamaindex", version, config);
4343
this.customLLMInstrumentation = new CustomLLMInstrumentation(
44-
this._config,
44+
() => this._config,
4545
this._diag,
4646
() => this.tracer,
4747
);

packages/instrumentation-llamaindex/src/utils.ts

Lines changed: 31 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -58,23 +58,43 @@ export async function* llmGeneratorWrapper(
5858
| AsyncIterable<llamaindex.ChatResponseChunk>
5959
| AsyncIterable<llamaindex.CompletionResponse>,
6060
ctx: Context,
61-
fn: (message: string) => void,
61+
fn: (message: string, lastChunk?: any) => void,
6262
) {
6363
let message = "";
64+
// Track the last chunk so the callback can extract usage/finish_reason from
65+
// chunk.raw — OpenAI sends these in the final streaming chunk when
66+
// stream_options: { include_usage: true } is set on the LLM.
67+
let lastChunk: any;
6468

65-
for await (const messageChunk of bindAsyncGenerator(
66-
ctx,
67-
streamingResult as AsyncGenerator,
68-
)) {
69-
if ((messageChunk as llamaindex.ChatResponseChunk).delta) {
70-
message += (messageChunk as llamaindex.ChatResponseChunk).delta;
69+
let fnCalled = false;
70+
try {
71+
for await (const messageChunk of bindAsyncGenerator(
72+
ctx,
73+
streamingResult as AsyncGenerator,
74+
)) {
75+
if ((messageChunk as llamaindex.ChatResponseChunk).delta) {
76+
message += (messageChunk as llamaindex.ChatResponseChunk).delta;
77+
}
78+
if ((messageChunk as llamaindex.CompletionResponse).text) {
79+
message += (messageChunk as llamaindex.CompletionResponse).text;
80+
}
81+
lastChunk = messageChunk;
82+
yield messageChunk;
83+
}
84+
} catch (err) {
85+
// Ensure span is finalized even if the stream throws
86+
if (!fnCalled) {
87+
fnCalled = true;
88+
fn(message, lastChunk);
7189
}
72-
if ((messageChunk as llamaindex.CompletionResponse).text) {
73-
message += (messageChunk as llamaindex.CompletionResponse).text;
90+
throw err;
91+
} finally {
92+
// Covers normal completion and early consumer exit (break/return)
93+
if (!fnCalled) {
94+
fnCalled = true;
95+
fn(message, lastChunk);
7496
}
75-
yield messageChunk;
7697
}
77-
fn(message);
7898
}
7999

80100
export function genericWrapper(
Lines changed: 58 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,58 @@
1+
/**
2+
* Unit tests for openAIFinishReasonMap.
3+
*
4+
* Each OpenAI raw finish reason value is tested individually.
5+
* Verified values from OpenAI API documentation.
6+
*/
7+
8+
import * as assert from "assert";
9+
import { FinishReasons } from "@traceloop/ai-semantic-conventions";
10+
import { openAIFinishReasonMap } from "../src/custom-llm-instrumentation";
11+
12+
const VALID_OTEL_FINISH_REASONS = new Set([
13+
FinishReasons.STOP,
14+
FinishReasons.LENGTH,
15+
FinishReasons.TOOL_CALL,
16+
FinishReasons.CONTENT_FILTER,
17+
FinishReasons.ERROR,
18+
]);
19+
20+
describe("openAIFinishReasonMap", () => {
21+
it("all mapped values are valid OTel finish reason strings", () => {
22+
for (const [raw, otel] of Object.entries(openAIFinishReasonMap)) {
23+
assert.ok(
24+
VALID_OTEL_FINISH_REASONS.has(otel),
25+
`openAIFinishReasonMap["${raw}"] = "${otel}" is not a valid OTel finish reason`,
26+
);
27+
}
28+
});
29+
30+
it('maps "stop" to stop', () => {
31+
assert.strictEqual(openAIFinishReasonMap["stop"], FinishReasons.STOP);
32+
});
33+
34+
it('maps "length" to length', () => {
35+
assert.strictEqual(openAIFinishReasonMap["length"], FinishReasons.LENGTH);
36+
});
37+
38+
it('maps "tool_calls" to tool_call', () => {
39+
assert.strictEqual(
40+
openAIFinishReasonMap["tool_calls"],
41+
FinishReasons.TOOL_CALL,
42+
);
43+
});
44+
45+
it('maps "content_filter" to content_filter', () => {
46+
assert.strictEqual(
47+
openAIFinishReasonMap["content_filter"],
48+
FinishReasons.CONTENT_FILTER,
49+
);
50+
});
51+
52+
it('maps "function_call" to tool_call (deprecated alias)', () => {
53+
assert.strictEqual(
54+
openAIFinishReasonMap["function_call"],
55+
FinishReasons.TOOL_CALL,
56+
);
57+
});
58+
});

0 commit comments

Comments (0)