MicrosoftDocs
diff --git a/agent-framework/agents/middleware/chat-middleware.md b/agent-framework/agents/middleware/chat-middleware.md
Lines changed: 3 additions & 3 deletions
diff --git a/agent-framework/agents/middleware/defining-middleware.md b/agent-framework/agents/middleware/defining-middleware.md
Lines changed: 17 additions & 14 deletions
diff --git a/agent-framework/agents/middleware/index.md b/agent-framework/agents/middleware/index.md
Lines changed: 57 additions & 55 deletions
@@ -5,7 +5,7 @@ zone_pivot_groups: programming-languages
 author: eavanvalkenburg
 ms.topic: reference
 ms.author: edvan
-ms.date: 02/09/2026
+ms.date: 03/16/2026
 ms.service: agent-framework
 ---
 
@@ -199,7 +199,7 @@ async def security_and_override_middleware(
                         ]
                     )
 
-                    # Set terminate flag to stop execution
+                    # Raise MiddlewareTermination to stop execution after setting context.result
                     raise MiddlewareTermination
 
     # Continue to next middleware or AI execution
@@ -451,7 +451,7 @@ async def security_and_override_middleware(
                         ]
                     )
 
-                    # Set terminate flag to stop execution
+                    # Raise MiddlewareTermination to stop execution after setting context.result
                     raise MiddlewareTermination
 
     # Continue to next middleware or AI execution
 
@@ -5,7 +5,7 @@ zone_pivot_groups: programming-languages
 author: dmytrostruk
 ms.topic: tutorial
 ms.author: dmytrostruk
-ms.date: 09/29/2025
+ms.date: 03/16/2026
 ms.service: agent-framework
 ---
 
@@ -233,17 +233,19 @@ if __name__ == "__main__":
 Create a simple logging middleware to see when your agent runs:
 
 ```python
+from collections.abc import Awaitable, Callable
+
 from agent_framework import AgentContext
 
 async def logging_agent_middleware(
     context: AgentContext,
-    next: Callable[[AgentContext], Awaitable[None]],
+    call_next: Callable[[], Awaitable[None]],
 ) -> None:
     """Simple middleware that logs agent execution."""
     print("Agent starting...")
 
     # Continue to agent execution
-    await next(context)
+    await call_next()
 
     print("Agent finished!")
 ```
@@ -267,33 +269,34 @@ async def main():
 
 ## Step 4: Create Function Middleware
 
-If your agent uses functions, you can intercept function calls:
+If your agent uses functions, you can intercept function calls and set tool-only runtime values before the tool executes:
 
 ```python
+from collections.abc import Awaitable, Callable
+
 from agent_framework import FunctionInvocationContext
 
-def get_time():
+def get_time(ctx: FunctionInvocationContext) -> str:
     """Get the current time."""
     from datetime import datetime
-    return datetime.now().strftime("%H:%M:%S")
+    source = ctx.kwargs.get("request_source", "direct")
+    return f"[{source}] {datetime.now().strftime('%H:%M:%S')}"
 
-async def logging_function_middleware(
+async def inject_function_kwargs(
     context: FunctionInvocationContext,
-    next: Callable[[FunctionInvocationContext], Awaitable[None]],
+    call_next: Callable[[], Awaitable[None]],
 ) -> None:
-    """Middleware that logs function calls."""
-    print(f"Calling function: {context.function.name}")
-
-    await next(context)
+    """Middleware that adds tool-only runtime values before execution."""
+    context.kwargs.setdefault("request_source", "middleware")
 
-    print(f"Function result: {context.result}")
+    await call_next()
 
 # Add both the function and middleware to your agent
 async with AzureAIAgentClient(credential=credential).as_agent(
     name="TimeAgent",
     instructions="You can tell the current time.",
     tools=[get_time],
-    middleware=[logging_function_middleware],
+    middleware=[inject_function_kwargs],
 ) as agent:
     result = await agent.run("What time is it?")
 ```
 
@@ -5,7 +5,7 @@ zone_pivot_groups: programming-languages
 author: dmytrostruk
 ms.topic: reference
 ms.author: dmytrostruk
-ms.date: 02/17/2026
+ms.date: 03/16/2026
 ms.service: agent-framework
 ---
 
@@ -177,7 +177,7 @@ Agent Framework can be customized using three different types of middleware:
 2. **Function middleware**: Intercepts function (tool) calls made during agent execution, enabling input validation, result transformation, and execution control.
 3. **Chat middleware**: Intercepts the underlying chat requests sent to AI models, providing access to the raw messages, options, and responses.
 
-All types support both function-based and class-based implementations. When multiple middleware of the same type are registered, they form a chain where each calls the `next` callable to continue processing.
+All types support both function-based and class-based implementations. When multiple middleware of the same type are registered, they form a chain where each calls the `call_next` callback to continue processing. `call_next` does not take the context as an argument; middleware mutates the shared context object directly and then awaits `call_next()`.
 
 > [!NOTE]
 > Middleware order with mixed registration scopes:
@@ -192,29 +192,31 @@ Agent middleware intercepts and modifies agent run execution. It uses the `Agent
 
 - `agent`: The agent being invoked
 - `messages`: List of chat messages in the conversation
-- `is_streaming`: Boolean indicating if the response is streaming
+- `session`: The current agent session, if any
+- `options`: Agent run options for this invocation
+- `stream`: Boolean indicating if the response is streaming
 - `metadata`: Dictionary for storing additional data between middleware
 - `result`: The agent's response (can be modified)
-- `terminate`: Flag to stop further processing
-- `kwargs`: Additional keyword arguments passed to the agent run method
+- `kwargs`: Legacy runtime keyword arguments passed to the agent run method
+- `client_kwargs`: Client-specific runtime values for downstream chat clients
+- `function_invocation_kwargs`: Runtime values that will be forwarded to tools
 
-The `next` callable continues the middleware chain or executes the agent if it's the last middleware.
+The `call_next` callback continues the middleware chain or executes the agent if it's the last middleware.
 
 ### Function-based
 
 ```python
-async def logging_agent_middleware(
+async def inject_tool_runtime_defaults(
     context: AgentContext,
-    next: Callable[[AgentContext], Awaitable[None]],
+    call_next: Callable[[], Awaitable[None]],
 ) -> None:
-    """Agent middleware that logs execution timing."""
-    # Pre-processing: Log before agent execution
+    """Agent middleware that sets tool-only runtime defaults."""
     print("[Agent] Starting execution")
+    context.function_invocation_kwargs.setdefault("tenant", "contoso")
+    context.function_invocation_kwargs.setdefault("request_source", "agent-middleware")
 
-    # Continue to next middleware or agent execution
-    await next(context)
+    await call_next()
 
-    # Post-processing: Log after agent execution
     print("[Agent] Execution completed")
 ```
 
@@ -231,10 +233,10 @@ class LoggingAgentMiddleware(AgentMiddleware):
     async def process(
         self,
         context: AgentContext,
-        next: Callable[[AgentContext], Awaitable[None]],
+        call_next: Callable[[], Awaitable[None]],
     ) -> None:
         print("[Agent Class] Starting execution")
-        await next(context)
+        await call_next()
         print("[Agent Class] Execution completed")
 ```
 
@@ -244,29 +246,25 @@ Function middleware intercepts function calls within agents. It uses the `Functi
 
 - `function`: The function being invoked
 - `arguments`: The validated arguments for the function
+- `session`: The current agent session, if any
 - `metadata`: Dictionary for storing additional data between middleware
 - `result`: The function's return value (can be modified)
-- `terminate`: Flag to stop further processing
-- `kwargs`: Additional keyword arguments passed to the chat method that invoked this function
+- `kwargs`: Runtime keyword arguments that will be forwarded to the tool invocation
 
-The `next` callable continues to the next middleware or executes the actual function.
+The `call_next` callback continues to the next middleware or executes the actual function.
 
 ### Function-based
 
 ```python
-async def logging_function_middleware(
+async def inject_function_kwargs(
     context: FunctionInvocationContext,
-    next: Callable[[FunctionInvocationContext], Awaitable[None]],
+    call_next: Callable[[], Awaitable[None]],
 ) -> None:
-    """Function middleware that logs function execution."""
-    # Pre-processing: Log before function execution
-    print(f"[Function] Calling {context.function.name}")
+    """Function middleware that enriches tool runtime values."""
+    context.kwargs.setdefault("tenant", "contoso")
+    context.kwargs.setdefault("request_source", "function-middleware")
 
-    # Continue to next middleware or function execution
-    await next(context)
-
-    # Post-processing: Log after function execution
-    print(f"[Function] {context.function.name} completed")
+    await call_next()
 ```
 
 ### Class-based
@@ -280,10 +278,10 @@ class LoggingFunctionMiddleware(FunctionMiddleware):
     async def process(
         self,
         context: FunctionInvocationContext,
-        next: Callable[[FunctionInvocationContext], Awaitable[None]],
+        call_next: Callable[[], Awaitable[None]],
     ) -> None:
         print(f"[Function Class] Calling {context.function.name}")
-        await next(context)
+        await call_next()
         print(f"[Function Class] {context.function.name} completed")
 ```
 
@@ -294,27 +292,27 @@ Chat middleware intercepts chat requests sent to AI models. It uses the `ChatCon
 - `chat_client`: The chat client being invoked
 - `messages`: List of messages being sent to the AI service
 - `options`: The options for the chat request
-- `is_streaming`: Boolean indicating if this is a streaming invocation
+- `stream`: Boolean indicating if this is a streaming invocation
 - `metadata`: Dictionary for storing additional data between middleware
 - `result`: The chat response from the AI (can be modified)
-- `terminate`: Flag to stop further processing
 - `kwargs`: Additional keyword arguments passed to the chat client
+- `function_invocation_kwargs`: Tool-only runtime values that the chat layer forwards to tool invocations
 
-The `next` callable continues to the next middleware or sends the request to the AI service.
+The `call_next` callback continues to the next middleware or sends the request to the AI service.
 
 ### Function-based
 
 ```python
 async def logging_chat_middleware(
     context: ChatContext,
-    next: Callable[[ChatContext], Awaitable[None]],
+    call_next: Callable[[], Awaitable[None]],
 ) -> None:
     """Chat middleware that logs AI interactions."""
     # Pre-processing: Log before AI call
     print(f"[Chat] Sending {len(context.messages)} messages to AI")
 
     # Continue to next middleware or AI service
-    await next(context)
+    await call_next()
 
     # Post-processing: Log after AI response
     print("[Chat] AI response received")
@@ -331,10 +329,10 @@ class LoggingChatMiddleware(ChatMiddleware):
     async def process(
         self,
         context: ChatContext,
-        next: Callable[[ChatContext], Awaitable[None]],
+        call_next: Callable[[], Awaitable[None]],
     ) -> None:
         print(f"[Chat Class] Sending {len(context.messages)} messages to AI")
-        await next(context)
+        await call_next()
         print("[Chat Class] AI response received")
 ```
 
@@ -346,21 +344,21 @@ Decorators provide explicit middleware type declaration without requiring type a
 from agent_framework import agent_middleware, function_middleware, chat_middleware
 
 @agent_middleware
-async def simple_agent_middleware(context, next):
+async def simple_agent_middleware(context, call_next):
     print("Before agent execution")
-    await next(context)
+    await call_next()
     print("After agent execution")
 
 @function_middleware
-async def simple_function_middleware(context, next):
+async def simple_function_middleware(context, call_next):
     print(f"Calling function: {context.function.name}")
-    await next(context)
+    await call_next()
     print("Function call completed")
 
 @chat_middleware
-async def simple_chat_middleware(context, next):
+async def simple_chat_middleware(context, call_next):
     print(f"Processing {len(context.messages)} chat messages")
-    await next(context)
+    await call_next()
     print("Chat processing completed")
 ```
 
@@ -407,30 +405,34 @@ async with AzureAIAgentClient(credential=credential).as_agent(
 
 ## Middleware Termination
 
-Middleware can terminate execution early using `context.terminate`. This is useful for security checks, rate limiting, or validation failures.
+Middleware can terminate execution early by setting `context.result` and raising `MiddlewareTermination`. This is useful for security checks, rate limiting, or validation failures.
 
 ```python
+from agent_framework import AgentContext, AgentResponse, Message, MiddlewareTermination
+
 async def blocking_middleware(
     context: AgentContext,
-    next: Callable[[AgentContext], Awaitable[None]],
+    call_next: Callable[[], Awaitable[None]],
 ) -> None:
     """Middleware that blocks execution based on conditions."""
     # Check for blocked content
     last_message = context.messages[-1] if context.messages else None
     if last_message and last_message.text:
         if "blocked" in last_message.text.lower():
             print("Request blocked by middleware")
-            context.terminate = True
-            return
+            context.result = AgentResponse(
+                messages=[Message(role="assistant", text="This request was blocked by middleware.")]
+            )
+            raise MiddlewareTermination(result=context.result)
 
     # If no issues, continue normally
-    await next(context)
+    await call_next()
 ```
 
 **What termination means:**
-- Setting `context.terminate = True` signals that processing should stop
-- You can provide a custom result before terminating to give users feedback
-- The agent execution is completely skipped when middleware terminates
+- Set `context.result` before raising `MiddlewareTermination` if you want to return a custom response
+- Raising `MiddlewareTermination` stops the remainder of the middleware chain and skips the normal execution path
+- This pattern works for agent, function, and chat middleware
 
 ## Middleware Result Override
 
@@ -441,17 +443,17 @@ The result type in `context.result` depends on whether the agent invocation is s
 - **Non-streaming**: `context.result` contains an `AgentResponse` with the complete response
 - **Streaming**: `context.result` contains an async generator that yields `AgentResponseUpdate` chunks
 
-You can use `context.is_streaming` to differentiate between these scenarios and handle result overrides appropriately.
+You can use `context.stream` to differentiate between these scenarios and handle result overrides appropriately.
 
 ```python
 async def weather_override_middleware(
     context: AgentContext,
-    next: Callable[[AgentContext], Awaitable[None]]
+    call_next: Callable[[], Awaitable[None]]
 ) -> None:
     """Middleware that overrides weather results for both streaming and non-streaming."""
 
     # Execute the original agent logic
-    await next(context)
+    await call_next()
 
     # Override results if present
     if context.result is not None:
@@ -462,7 +464,7 @@ async def weather_override_middleware(
             "Great day for outdoor activities!"
         ]
 
-        if context.is_streaming:
+        if context.stream:
             # Streaming override
             async def override_stream() -> AsyncIterable[AgentResponseUpdate]:
                 for chunk in custom_message_parts:
Original file line number	Diff line number	Diff line change
`@@ -5,7 +5,7 @@ zone_pivot_groups: programming-languages`
`5`	`5`	`author: eavanvalkenburg`
`6`	`6`	`ms.topic: reference`
`7`	`7`	`ms.author: edvan`
`8`		`-ms.date: 02/09/2026`
	`8`	`+ms.date: 03/16/2026`
`9`	`9`	`ms.service: agent-framework`
`10`	`10`	`---`
`11`	`11`
`@@ -199,7 +199,7 @@ async def security_and_override_middleware(`
`199`	`199`	`]`
`200`	`200`	`)`
`201`	`201`
`202`		`- # Set terminate flag to stop execution`
	`202`	`+ # Raise MiddlewareTermination to stop execution after setting context.result`
`203`	`203`	`raise MiddlewareTermination`
`204`	`204`
`205`	`205`	`# Continue to next middleware or AI execution`
`@@ -451,7 +451,7 @@ async def security_and_override_middleware(`
`451`	`451`	`]`
`452`	`452`	`)`
`453`	`453`
`454`		`- # Set terminate flag to stop execution`
	`454`	`+ # Raise MiddlewareTermination to stop execution after setting context.result`
`455`	`455`	`raise MiddlewareTermination`
`456`	`456`
`457`	`457`	`# Continue to next middleware or AI execution`