Commit d076d5c

Merge branch 'main' into mohessie/unify_output/tool_call_accuracy
2 parents d3c4092 + a529fa5 commit d076d5c

106 files changed

Lines changed: 4415 additions & 1524 deletions

sdk/agentserver/azure-ai-agentserver-core/CHANGELOG.md

Lines changed: 46 additions & 20 deletions

```diff
@@ -1,29 +1,55 @@
 # Release History

-## 2.0.0b1 (Unreleased)
+## 2.0.0b1 (2026-04-14)

-### Features Added
-
-- `AgentServerHost` base class (Starlette subclass) with health probe (`/readiness`), graceful shutdown, and port binding.
-- Automatic OpenTelemetry tracing with Azure Monitor and OTLP exporters (included as primary dependencies).
-- `request_span()` host method and `end_span()` / `record_error()` / `trace_stream()` public functions for protocol SDK tracing.
-- Overridable tracing setup via `configure_tracing` constructor parameter.
-- `create_error_response()` utility for standard error envelope responses.
-- Cooperative mixin inheritance for multi-protocol composition.
-- Hypercorn-based ASGI server with HTTP/1.1 support.
+This is a major architectural rewrite. The package has been redesigned as a lightweight hosting
+foundation. Protocol implementations that were previously bundled in this package have moved to
+dedicated protocol packages (`azure-ai-agentserver-responses`, `azure-ai-agentserver-invocations`).
+See the [Migration Guide](https://github.com/Azure/azure-sdk-for-python/blob/main/sdk/agentserver/azure-ai-agentserver-core/MigrationGuide.md)
+for upgrading from 1.x versions.

 ### Breaking Changes

-- Renamed `AgentHost` → `AgentServerHost`; now inherits from `Starlette` directly.
-- Removed `register_routes()` — protocol packages now subclass `AgentServerHost` and pass routes via `super().__init__()`.
-- Removed lazy `app` property — `AgentServerHost` IS the ASGI app.
-- Replaced `TracingHelper` class with module-level functions (`request_span`, `end_span`, `record_error`, `trace_stream`, `configure_tracing`).
-- Replaced `ErrorResponse.create()` static method with module-level `create_error_response()` function.
-- Removed `AgentLogger` / `get_logger()` — use `logging.getLogger("azure.ai.agentserver")` directly.
-- Removed `AGENT_LOG_LEVEL` and `AGENT_GRACEFUL_SHUTDOWN_TIMEOUT` environment variable support from `Constants`.
-- Removed `leaf_customer_span_id` baggage mechanism and W3C Baggage propagation.
-- OpenTelemetry is now a required dependency (was optional `[tracing]` extras).
-- Renamed health endpoint from `/healthy` to `/readiness`.
+- **Package split**: All Responses API protocol types (models, handler decorators, SSE streaming)
+  have moved to `azure-ai-agentserver-responses`. All Invocations protocol types have moved to
+  `azure-ai-agentserver-invocations`. This package now contains only the shared hosting foundation.
+- **`FoundryCBAgent` removed**: Replaced by `AgentServerHost`, a Starlette subclass that IS the
+  ASGI app (no separate `.app` property or `register_routes()`).
+- **`AgentRunContext` removed**: Protocol packages provide their own context types
+  (`ResponseContext` in Responses, `request.state` in Invocations).
+- **`TracingHelper` class removed**: Replaced by module-level functions (`request_span`,
+  `end_span`, `record_error`, `trace_stream`) for a simpler functional API.
+- **`AgentLogger` / `get_logger()` removed**: Use `logging.getLogger("azure.ai.agentserver")`
+  directly, or rely on the SDK's automatic console logging setup.
+- **`ErrorResponse.create()` removed**: Replaced by the module-level `create_error_response()` function.
+- **Health endpoint renamed**: `/healthy` → `/readiness`.
+- **OpenTelemetry is now a required dependency** (was optional `[tracing]` extras in 1.x).
+- **Environment variables changed**: `AGENT_LOG_LEVEL` and `AGENT_GRACEFUL_SHUTDOWN_TIMEOUT` are
+  no longer read from `Constants`. Use the `log_level` and `graceful_shutdown_timeout` constructor
+  parameters instead.
+
+### Features Added
+
+- `AgentServerHost` base class with built-in health probe (`/readiness`), graceful shutdown
+  (configurable timeout), and Hypercorn-based ASGI serving.
+- Cooperative mixin inheritance for multi-protocol composition — a single server can host both
+  Responses and Invocations endpoints.
+- Automatic OpenTelemetry tracing with Azure Monitor and OTLP exporters.
+- `configure_observability` constructor parameter for overridable logging + tracing setup.
+  A console `StreamHandler` is attached to the root logger by default so user `logging.info()`
+  calls are visible without any extra configuration.
+- `request_span()` context manager for creating request-scoped OTel spans with GenAI semantic
+  convention attributes.
+- `end_span()`, `record_error()`, `flush_spans()`, `trace_stream()` public functions for the
+  protocol SDK tracing lifecycle.
+- `set_current_span()` / `detach_context()` for explicit OTel context management during
+  streaming, ensuring child spans are correctly parented.
+- `AgentConfig` dataclass for resolved configuration from environment variables (Foundry agent
+  name, version, project ID, session ID, etc.).
+- `create_error_response()` utility for standard error envelope JSON responses.
+- `build_server_version()` for constructing `x-platform-server` header segments.
+- HTTP access logging with configurable format via `access_log` and `access_log_format`
+  constructor parameters.

 ## 1.0.0b1 (2025-11-07)
```
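With `AgentLogger` and `get_logger()` removed, host logs go through the standard library `logging` module under the `azure.ai.agentserver` namespace. A minimal stdlib-only sketch of wiring up a console-style handler (the format string and the `StringIO` target are illustrative choices, not SDK defaults):

```python
import io
import logging

# Logger namespace named by the changelog; handler setup below is illustrative.
logger = logging.getLogger("azure.ai.agentserver")
logger.setLevel(logging.INFO)

buffer = io.StringIO()  # stand-in for sys.stderr so the output is inspectable
handler = logging.StreamHandler(buffer)
handler.setFormatter(logging.Formatter("%(levelname)s %(name)s: %(message)s"))
logger.addHandler(handler)

logger.info("server starting")
print(buffer.getvalue().strip())  # INFO azure.ai.agentserver: server starting
```

In an application that relies on the SDK's automatic console logging, only the `getLogger(...)` call is needed; the handler wiring here just makes the sketch self-contained.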

sdk/agentserver/azure-ai-agentserver-core/MigrationGuide.md

Lines changed: 237 additions & 0 deletions

# Guide for migrating to the new azure-ai-agentserver package architecture

This guide helps you migrate from `azure-ai-agentserver-core` 1.x to the new three-package
architecture introduced in `azure-ai-agentserver-core` 2.0.0b1.

## Table of contents

- [Migration benefits](#migration-benefits)
- [Package changes](#package-changes)
- [API changes](#api-changes)
  - [Handler registration](#handler-registration)
  - [Streaming handler](#streaming-handler)
  - [Server startup](#server-startup)
  - [Tracing](#tracing)
  - [Logging](#logging)
  - [Error responses](#error-responses)
- [Import changes](#import-changes)
- [Multi-protocol composition](#multi-protocol-composition)
- [Additional information](#additional-information)

## Migration benefits

The new package architecture provides:

- **Separation of concerns** — protocol implementations (Responses API, Invocations) are in
  dedicated packages rather than bundled into a monolithic Core package.
- **Dramatically simpler API** — the old approach required manually constructing SSE events,
  tracking sequence numbers, and building response objects. The new API provides decorator-based
  handler registration with builder methods that handle all of this automatically.
- **Type-safe event builders** — `ResponseEventStream` and its convenience generators manage
  event sequencing, output indices, and content indices. You cannot accidentally emit events in
  the wrong order.
- **Built-in convenience methods** — common patterns like "emit a text message" or "stream
  tokens" are one-liners via `ResponseEventStream` generators or `TextResponse`.
- **Zero-config startup** — `app.run()` replaces manual server configuration with sensible
  defaults including OpenTelemetry, health endpoints, and user-agent headers.
- **Multi-protocol support** — a single server can host both Responses and Invocations endpoints
  via cooperative mixin inheritance.

## Package changes

| Before | After | Notes |
|--------|-------|-------|
| `azure-ai-agentserver-core` 1.x | `azure-ai-agentserver-core` 2.x | Stripped to hosting foundation only |
| _(bundled in core)_ | `azure-ai-agentserver-responses` 1.x | New — Responses API protocol |
| _(bundled in core)_ | `azure-ai-agentserver-invocations` 1.x | New — Invocations protocol |

Update your dependencies:

```bash
# Install the protocol package you need (transitively brings in core 2.x)
pip install azure-ai-agentserver-responses

# If you also need the Invocations protocol:
pip install azure-ai-agentserver-invocations
```

> **Note:** Both `azure-ai-agentserver-responses` and `azure-ai-agentserver-invocations`
> depend on `azure-ai-agentserver-core`, so you do not need to install Core separately.

## API changes

### Handler registration

**Before (1.x):**

```python
from azure.ai.agentserver.core import FoundryCBAgent, AgentRunContext

class MyAgent(FoundryCBAgent):
    def register_routes(self):
        self.app.add_route("/responses", self.handle_create, methods=["POST"])

    async def handle_create(self, request):
        # Manually parse request, build SSE events, track sequence numbers
        ...
```

**After (2.x) — Responses protocol:**

```python
from azure.ai.agentserver.responses import (
    CreateResponse,
    ResponseContext,
    ResponsesAgentServerHost,
    TextResponse,
)

app = ResponsesAgentServerHost()

@app.response_handler
async def handle_create(request: CreateResponse, context: ResponseContext, cancellation_signal):
    input_text = await context.get_input_text()
    return TextResponse(context, request, text=f"Echo: {input_text}")

app.run()
```

**After (2.x) — Invocations protocol:**

```python
from starlette.requests import Request
from starlette.responses import JSONResponse, Response
from azure.ai.agentserver.invocations import InvocationAgentServerHost

app = InvocationAgentServerHost()

@app.invoke_handler
async def handle(request: Request) -> Response:
    data = await request.json()
    return JSONResponse({"greeting": f"Hello, {data['name']}!"})

app.run()
```

### Streaming handler

**Before (1.x):**

```python
# Manually construct every SSE event, track sequence numbers and indices
seq = 0
yield {"type": "response.created", "sequence_number": seq, "response": {...}}
seq += 1
yield {"type": "response.output_item.added", "sequence_number": seq, ...}
seq += 1
# ... many more events with manual index tracking
```

**After (2.x):**

```python
from azure.ai.agentserver.responses import (
    CreateResponse,
    ResponseContext,
    ResponseEventStream,
    ResponsesAgentServerHost,
)

app = ResponsesAgentServerHost()

@app.response_handler
async def handle_create(request: CreateResponse, context: ResponseContext, cancellation_signal):
    stream = ResponseEventStream(context, request)
    stream.emit_created()

    # All inner events (output_item.added, content_part.added, deltas, done events)
    # are emitted automatically with correct sequence numbers and indices
    async for token in get_tokens():
        for event in stream.output_item_message(token):
            yield event

    stream.emit_completed()
```

Or, for the simplest case:

```python
return TextResponse(context, request, text="Hello!")
```
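A rough mental model of what an event-stream builder does for you: each emit assigns the next sequence number internally, so callers cannot skip or reorder numbers. The class below is a plain-Python illustration of that bookkeeping, not the real `ResponseEventStream` API:

```python
from typing import Any, Dict, Iterator

class EventStreamSketch:
    """Illustrative only: auto-assigns sequence numbers so callers cannot misorder them."""

    def __init__(self) -> None:
        self._seq = 0

    def _emit(self, event_type: str, **fields: Any) -> Dict[str, Any]:
        # Every event gets the next sequence number; callers never touch it.
        event = {"type": event_type, "sequence_number": self._seq, **fields}
        self._seq += 1
        return event

    def output_item_message(self, text: str) -> Iterator[Dict[str, Any]]:
        # One call expands into the added/delta/done triple with consistent numbering.
        yield self._emit("response.output_item.added")
        yield self._emit("response.output_text.delta", delta=text)
        yield self._emit("response.output_item.done")

stream = EventStreamSketch()
events = list(stream.output_item_message("Hi"))
print([e["sequence_number"] for e in events])  # [0, 1, 2]
```

The real builder also tracks output and content indices, but the principle is the same: sequencing state lives in one place instead of in every handler.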
### Server startup

**Before (1.x):**

```python
agent = MyAgent()
agent.run()  # or manual uvicorn/hypercorn setup
```

**After (2.x):**

```python
# Responses protocol
app = ResponsesAgentServerHost()

@app.response_handler
async def handle(request, context, cancellation_signal):
    ...

app.run()  # Built-in Hypercorn server with OpenTelemetry, health endpoint, graceful shutdown
```

Configuration is via constructor parameters:

```python
app = ResponsesAgentServerHost(
    log_level="DEBUG",                    # Console log level
    graceful_shutdown_timeout=60,         # Drain period in seconds
    applicationinsights_connection_string="InstrumentationKey=...",  # Azure Monitor
    configure_observability=None,         # Disable SDK logging/tracing setup
)
```

## Import changes

| Before (1.x) | After (2.x) |
|--------------|-------------|
| `from azure.ai.agentserver.core import FoundryCBAgent` | `from azure.ai.agentserver.core import AgentServerHost` |
| `from azure.ai.agentserver.core import AgentRunContext` | `from azure.ai.agentserver.responses import ResponseContext` |
| _(n/a)_ | `from azure.ai.agentserver.responses import ResponsesAgentServerHost` |
| _(n/a)_ | `from azure.ai.agentserver.responses import TextResponse` |
| _(n/a)_ | `from azure.ai.agentserver.responses import ResponseEventStream` |
| _(n/a)_ | `from azure.ai.agentserver.invocations import InvocationAgentServerHost` |

## Multi-protocol composition

A single server can host both Responses and Invocations endpoints using cooperative
mixin inheritance:

```python
from starlette.responses import JSONResponse

from azure.ai.agentserver.invocations import InvocationAgentServerHost
from azure.ai.agentserver.responses import ResponsesAgentServerHost, TextResponse

class MyHost(InvocationAgentServerHost, ResponsesAgentServerHost):
    pass

app = MyHost()

@app.response_handler
async def handle_responses(request, context, cancellation_signal):
    return TextResponse(context, request, text="Hello from Responses!")

@app.invoke_handler
async def handle_invocations(request):
    return JSONResponse({"hello": "from Invocations!"})

app.run()
# Serves both POST /responses and POST /invocations
```
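The mixin composition relies on Python's cooperative multiple inheritance: each host class contributes its routes and then calls `super().__init__()`, so every class in the MRO runs exactly once. A toy model of the pattern with plain classes (the route strings and class names here are illustrative, not the SDK's internals):

```python
class HostBase:
    """Stands in for the shared hosting foundation."""

    def __init__(self, routes=None):
        self.routes = list(routes or [])

class InvocationsMixin(HostBase):
    def __init__(self, routes=None):
        # Contribute this protocol's route, then continue up the MRO.
        super().__init__(routes=[*(routes or []), "POST /invocations"])

class ResponsesMixin(HostBase):
    def __init__(self, routes=None):
        super().__init__(routes=[*(routes or []), "POST /responses"])

class MyHost(InvocationsMixin, ResponsesMixin):
    pass

# MRO: MyHost -> InvocationsMixin -> ResponsesMixin -> HostBase,
# so both protocols' routes end up registered on one host.
print(MyHost().routes)  # ['POST /invocations', 'POST /responses']
```

This is why the subclass body can be just `pass`: the `super().__init__()` chain does the merging.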
## Additional information

- [azure-ai-agentserver-core README](https://github.com/Azure/azure-sdk-for-python/blob/main/sdk/agentserver/azure-ai-agentserver-core/README.md)
- [azure-ai-agentserver-responses README](https://github.com/Azure/azure-sdk-for-python/blob/main/sdk/agentserver/azure-ai-agentserver-responses/README.md)
- [azure-ai-agentserver-invocations README](https://github.com/Azure/azure-sdk-for-python/blob/main/sdk/agentserver/azure-ai-agentserver-invocations/README.md)
- [Responses samples](https://github.com/Azure/azure-sdk-for-python/blob/main/sdk/agentserver/azure-ai-agentserver-responses/samples)
- [Invocations samples](https://github.com/Azure/azure-sdk-for-python/blob/main/sdk/agentserver/azure-ai-agentserver-invocations/samples)

sdk/agentserver/azure-ai-agentserver-core/azure/ai/agentserver/core/_base.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -197,7 +197,7 @@ async def _lifespan(_app: Starlette) -> AsyncGenerator[None, None]:  # noqa: RUF
                     self._graceful_shutdown_timeout,
                 )
             except Exception:  # pylint: disable=broad-exception-caught
-                logger.exception("Error in on_shutdown")
+                logger.warning("Error in on_shutdown", exc_info=True)

         # Merge routes: subclass routes (if any) + health endpoint
         all_routes: list[Any] = list(routes or [])
```

sdk/agentserver/azure-ai-agentserver-core/azure/ai/agentserver/core/_config.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -41,7 +41,7 @@
 # ======================================================================


-class AgentConfig:
+class AgentConfig:  # pylint: disable=too-many-instance-attributes
     """Resolved configuration for an agent server host.

     All values are populated from environment variables at creation time.
```

sdk/agentserver/azure-ai-agentserver-core/pyproject.toml

Lines changed: 2 additions & 1 deletion

```diff
@@ -68,7 +68,8 @@ combine-as-imports = true
 breaking = false
 mypy = true
 pyright = true
-verifytypes = true
+verifytypes = false
+latestdependency = false
 pylint = true
 type_check_samples = false
```

sdk/agentserver/azure-ai-agentserver-core/tests/test_graceful_shutdown.py

Lines changed: 1 addition & 1 deletion

```diff
@@ -189,7 +189,7 @@ async def receive():
     async def send(message):
         sent_messages.append(message)

-    with caplog.at_level(logging.ERROR, logger="azure.ai.agentserver"):
+    with caplog.at_level(logging.WARNING, logger="azure.ai.agentserver"):
         await agent(scope, receive, send)

     # The error should be logged
```
sdk/agentserver/azure-ai-agentserver-githubcopilot/pyproject.toml

Lines changed: 3 additions & 8 deletions

```diff
@@ -4,7 +4,7 @@ dynamic = ["version", "readme"]
 description = "GitHub Copilot SDK adapter for Azure AI Agent Server"
 requires-python = ">=3.11"
 authors = [
-  { name = "Microsoft Corporation", email = "azpysdkhelp@microsoft.com" },
+    { name = "Microsoft Corporation", email = "azpysdkhelp@microsoft.com" },
 ]
 license = "MIT"
 classifiers = [
@@ -32,13 +32,7 @@ requires = ["setuptools>=69", "wheel"]
 build-backend = "setuptools.build_meta"

 [tool.setuptools.packages.find]
-exclude = [
-    "tests*",
-    "samples*",
-    "doc*",
-    "azure",
-    "azure.ai",
-]
+exclude = ["tests*", "samples*", "doc*", "azure", "azure.ai"]

 [tool.setuptools.dynamic]
 version = { attr = "azure.ai.agentserver.githubcopilot._version.VERSION" }
@@ -63,6 +57,7 @@ analyze_python_version = "3.11"
 breaking = false
 pyright = false
 verifytypes = false
+latestdependency = false
 verify_keywords = false
 mindependency = false
 whl_no_aio = false
```
sdk/agentserver/azure-ai-agentserver-invocations/CHANGELOG.md

Lines changed: 1 addition & 1 deletion

```diff
@@ -1,6 +1,6 @@
 # Release History

-## 1.0.0b1 (Unreleased)
+## 1.0.0b1 (2026-04-14)

 ### Features Added
```
