Skip to content

Commit 88f5a06

Browse files
fix: resolve regression on thought process display for ReAct Agent LLM
Thought process events were not displaying because LangchainProfilerHandler was not being invoked during LLM calls. Passing the handler via ainvoke() config was bypassed by _runnable_config, which was built once at graph construction time with no callbacks. Replace the stored _runnable_config attribute with _make_runnable_config(), which instantiates callback classes fresh on each LLM/tool call. Pass LangchainProfilerHandler as a class reference to the graph constructor so each invocation gets an isolated handler, also fixing a memory leak and concurrency issues from the previously shared instance.

Signed-off-by: Patrick Chin <8509935+thepatrickchin@users.noreply.github.com>
1 parent 27797af commit 88f5a06

4 files changed

Lines changed: 23 additions & 17 deletions

File tree

packages/nvidia_nat_langchain/src/nat/plugins/langchain/agent/base.py

Lines changed: 13 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,7 @@
1818
import logging
1919
from abc import ABC
2020
from abc import abstractmethod
21+
from collections.abc import Callable
2122
from enum import Enum
2223
from typing import Any
2324

@@ -71,7 +72,7 @@ class BaseAgent(ABC):
7172
def __init__(self,
7273
llm: BaseChatModel,
7374
tools: list[BaseTool],
74-
callbacks: list[AsyncCallbackHandler] | None = None,
75+
callbacks: list[Callable[[], AsyncCallbackHandler]] | None = None,
7576
detailed_logs: bool = False,
7677
log_response_max_chars: int = 1000) -> None:
7778
logger.debug("Initializing Agent Graph")
@@ -81,8 +82,17 @@ def __init__(self,
8182
self.detailed_logs = detailed_logs
8283
self.log_response_max_chars = log_response_max_chars
8384
self.graph = None
84-
self._runnable_config = RunnableConfig(callbacks=self.callbacks,
85-
configurable={"__pregel_runtime": DEFAULT_RUNTIME})
85+
86+
@property
87+
def _runnable_config(self) -> RunnableConfig:
88+
return self._make_runnable_config()
89+
90+
def _make_runnable_config(self) -> RunnableConfig:
91+
"""
92+
Create a fresh RunnableConfig with isolated callback instances per invocation.
93+
"""
94+
return RunnableConfig(callbacks=[c() for c in self.callbacks],
95+
configurable={"__pregel_runtime": DEFAULT_RUNTIME})
8696

8797
async def _stream_llm(self, runnable: Any, inputs: dict[str, Any]) -> AIMessage:
8898
"""

packages/nvidia_nat_langchain/src/nat/plugins/langchain/agent/dual_node.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,7 @@
1515

1616
import logging
1717
from abc import abstractmethod
18+
from collections.abc import Callable
1819

1920
from langchain_core.callbacks import AsyncCallbackHandler
2021
from langchain_core.language_models import BaseChatModel
@@ -34,7 +35,7 @@ class DualNodeAgent(BaseAgent):
3435
def __init__(self,
3536
llm: BaseChatModel,
3637
tools: list[BaseTool],
37-
callbacks: list[AsyncCallbackHandler] | None = None,
38+
callbacks: list[Callable[[], AsyncCallbackHandler]] | None = None,
3839
detailed_logs: bool = False,
3940
log_response_max_chars: int = 1000):
4041
super().__init__(llm=llm,

packages/nvidia_nat_langchain/src/nat/plugins/langchain/agent/react_agent/register.py

Lines changed: 3 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -117,7 +117,7 @@ async def react_agent_workflow(config: ReActAgentWorkflowConfig, builder: Builde
117117
llm=llm,
118118
prompt=prompt,
119119
tools=tools,
120-
callbacks=[],
120+
callbacks=[LangchainProfilerHandler],
121121
use_tool_schema=config.include_tool_input_schema_in_tool_description,
122122
detailed_logs=config.verbose,
123123
log_response_max_chars=config.log_response_max_chars,
@@ -154,12 +154,8 @@ async def _response_fn(chat_request_or_message: ChatRequestOrMessage) -> ChatRes
154154

155155
state = ReActGraphState(messages=messages)
156156

157-
# run the ReAct Agent Graph with a new callback handler instance per request
158-
state = await graph.ainvoke(state,
159-
config={
160-
'recursion_limit': (config.max_tool_calls + 1) * 2,
161-
'callbacks': [LangchainProfilerHandler()]
162-
})
157+
# run the ReAct Agent Graph
158+
state = await graph.ainvoke(state, config={'recursion_limit': (config.max_tool_calls + 1) * 2})
163159
# setting recursion_limit: 4 allows 1 tool call
164160
# - allows the ReAct Agent to perform 1 cycle / call 1 single tool,
165161
# - but stops the agent when it tries to call a tool a second time

packages/nvidia_nat_langchain/tests/agent/test_base.py

Lines changed: 5 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,6 @@
2222
from langchain_core.messages import AIMessage
2323
from langchain_core.messages import HumanMessage
2424
from langchain_core.messages import ToolMessage
25-
from langchain_core.runnables import RunnableConfig
2625
from langgraph.graph.state import CompiledStateGraph
2726

2827
from nat.plugins.langchain.agent.base import BaseAgent
@@ -40,21 +39,21 @@ def __init__(self, detailed_logs=True, log_response_max_chars=1000):
4039
self.callbacks = []
4140
self.detailed_logs = detailed_logs
4241
self.log_response_max_chars = log_response_max_chars
43-
self._runnable_config = RunnableConfig()
42+
self.graph = None
4443

4544
async def _build_graph(self, state_schema: type) -> CompiledStateGraph:
4645
"""Mock implementation."""
4746
return Mock(spec=CompiledStateGraph)
4847

4948

50-
@pytest.fixture
51-
def base_agent():
49+
@pytest.fixture(name="base_agent")
50+
def fixture_base_agent():
5251
"""Create a mock agent for testing with detailed logs enabled."""
5352
return MockBaseAgent(detailed_logs=True)
5453

5554

56-
@pytest.fixture
57-
def base_agent_no_logs():
55+
@pytest.fixture(name="base_agent_no_logs")
56+
def fixture_base_agent_no_logs():
5857
"""Create a mock agent for testing with detailed logs disabled."""
5958
return MockBaseAgent(detailed_logs=False)
6059

0 commit comments

Comments (0)