fix(langchain): emit cache creation tokens (#4261)

dvirski · web-flow · commit fc33f1c16f6a · 2026-06-17T09:55:03.000+03:00
diff --git a/packages/opentelemetry-instrumentation-langchain/opentelemetry/instrumentation/langchain/span_utils.py b/packages/opentelemetry-instrumentation-langchain/opentelemetry/instrumentation/langchain/span_utils.py
@@ -393,7 +393,8 @@ def set_chat_response_usage(
     input_tokens = 0
     output_tokens = 0
     total_tokens = 0
-    cache_read_tokens = 0
+    cache_read_tokens = None
+    cache_creation_tokens = None
 
     # Early return if no generations to avoid potential issues
     if not response.generations:
@@ -423,7 +424,12 @@ def set_chat_response_usage(
                         input_token_details = generation.message.usage_metadata.get(
                             "input_token_details", {}
                         )
-                        cache_read_tokens += input_token_details.get("cache_read", 0)
+                        raw_cache_read = input_token_details.get("cache_read")
+                        if isinstance(raw_cache_read, (int, float)):
+                            cache_read_tokens = (cache_read_tokens or 0) + raw_cache_read
+                        raw_cache_creation = input_token_details.get("cache_creation")
+                        if isinstance(raw_cache_creation, (int, float)):
+                            cache_creation_tokens = (cache_creation_tokens or 0) + raw_cache_creation
     except Exception as e:
         # If there's any issue processing usage metadata, continue without it
         logger.warning("Error processing usage metadata: %s", e)
@@ -433,7 +439,8 @@ def set_chat_response_usage(
         input_tokens > 0
         or output_tokens > 0
         or total_tokens > 0
-        or cache_read_tokens > 0
+        or cache_read_tokens is not None
+        or cache_creation_tokens is not None
     ):
         _set_span_attribute(
             span,
@@ -455,6 +462,11 @@ def set_chat_response_usage(
             GenAIAttributes.GEN_AI_USAGE_CACHE_READ_INPUT_TOKENS,
             cache_read_tokens,
         )
+        _set_span_attribute(
+            span,
+            GenAIAttributes.GEN_AI_USAGE_CACHE_CREATION_INPUT_TOKENS,
+            cache_creation_tokens,
+        )
         if record_token_usage:
             vendor = span.attributes.get(GenAIAttributes.GEN_AI_PROVIDER_NAME, "langchain")