From 46d4c9c0cc77038c08c4a6292313c3f237a636c8 Mon Sep 17 00:00:00 2001 From: eavanvalkenburg Date: Mon, 4 May 2026 17:31:08 +0200 Subject: [PATCH 1/6] feat(hosting): add agent-framework-hosting core package MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit New ``agent-framework-hosting`` package implementing ADR 0026 / SPEC-002: the channel-neutral host that lets a single ``Agent`` (or ``Workflow``) fan out across multiple wire protocols ("channels") behind one Starlette ASGI app. Surface (re-exported from ``agent_framework_hosting``): - ``AgentFrameworkHost`` — wraps a hostable target, mounts channels onto an ASGI app, owns per-isolation-key ``AgentSession`` reuse, threads request context (``response_id`` / ``previous_response_id``) into context providers via an ``ExitStack`` of ``bind_request_context`` calls, and exposes an opt-in Hypercorn ``serve()`` helper (extra ``[serve]``). - ``Channel`` protocol + ``ChannelContribution`` — the surface a channel package implements (routes, lifespans, identity hooks, …). - ``ChannelRequest`` / ``ChannelSession`` / ``ChannelIdentity`` / ``ChannelPush`` / ``ChannelCommand[Context]`` / ``ChannelRunHook`` / ``ChannelStreamTransformHook`` / ``DeliveryReport`` / ``HostedRunResult`` / ``ResponseTarget`` / ``ResponseTargetKind`` / ``apply_run_hook`` — channel-side dataclasses + helpers. - ``IsolationKeys`` + ``ISOLATION_HEADER_USER`` / ``..._CHAT`` + ``get/set/reset_current_isolation_keys`` — the host's ASGI middleware reads the ``x-agent-{user,chat}-isolation-key`` headers off each inbound request and exposes them to the agent stack via a ``ContextVar`` so storage-side providers (e.g. ``FoundryHostedAgentHistoryProvider``) can apply per-tenant partitioning without channels having to forward anything. Includes 45 unit tests covering the host, channel contributions, isolation contextvar, and shared types. 
Registers the package in ``python/pyproject.toml`` ``[tool.uv.sources]`` and adds the matching pyright ``executionEnvironments`` entry for tests. Hypercorn is an optional dependency (``[serve]`` extra); the soft import in ``serve()`` is annotated for pyright since it isn't on the default install. Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com> --- python/packages/hosting/LICENSE | 21 + python/packages/hosting/README.md | 59 ++ .../agent_framework_hosting/__init__.py | 74 ++ .../hosting/agent_framework_hosting/_host.py | 946 ++++++++++++++++++ .../agent_framework_hosting/_isolation.py | 76 ++ .../hosting/agent_framework_hosting/_types.py | 376 +++++++ python/packages/hosting/pyproject.toml | 107 ++ python/packages/hosting/tests/__init__.py | 0 .../hosting/tests/_workflow_fixtures.py | 43 + python/packages/hosting/tests/test_host.py | 714 +++++++++++++ python/packages/hosting/tests/test_types.py | 105 ++ python/pyproject.toml | 2 + python/uv.lock | 39 +- 13 files changed, 2558 insertions(+), 4 deletions(-) create mode 100644 python/packages/hosting/LICENSE create mode 100644 python/packages/hosting/README.md create mode 100644 python/packages/hosting/agent_framework_hosting/__init__.py create mode 100644 python/packages/hosting/agent_framework_hosting/_host.py create mode 100644 python/packages/hosting/agent_framework_hosting/_isolation.py create mode 100644 python/packages/hosting/agent_framework_hosting/_types.py create mode 100644 python/packages/hosting/pyproject.toml create mode 100644 python/packages/hosting/tests/__init__.py create mode 100644 python/packages/hosting/tests/_workflow_fixtures.py create mode 100644 python/packages/hosting/tests/test_host.py create mode 100644 python/packages/hosting/tests/test_types.py diff --git a/python/packages/hosting/LICENSE b/python/packages/hosting/LICENSE new file mode 100644 index 0000000000..9e841e7a26 --- /dev/null +++ b/python/packages/hosting/LICENSE @@ -0,0 +1,21 @@ + MIT License + + Copyright 
(c) Microsoft Corporation. + + Permission is hereby granted, free of charge, to any person obtaining a copy + of this software and associated documentation files (the "Software"), to deal + in the Software without restriction, including without limitation the rights + to use, copy, modify, merge, publish, distribute, sublicense, and/or sell + copies of the Software, and to permit persons to whom the Software is + furnished to do so, subject to the following conditions: + + The above copyright notice and this permission notice shall be included in all + copies or substantial portions of the Software. + + THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE + AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, + OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE + SOFTWARE diff --git a/python/packages/hosting/README.md b/python/packages/hosting/README.md new file mode 100644 index 0000000000..a2690b5705 --- /dev/null +++ b/python/packages/hosting/README.md @@ -0,0 +1,59 @@ +# agent-framework-hosting + +Multi-channel hosting for Microsoft Agent Framework agents. + +`agent-framework-hosting` lets you serve a single agent (or workflow) +target through one or more **channels** — pluggable adapters that +expose the target over different transports. The result is a single +Starlette ASGI application you can host anywhere (local Hypercorn, +Azure Container Apps, Foundry Hosted Agents, …). 
+ +The base package contains only the channel-neutral plumbing: + +- `AgentFrameworkHost` — the Starlette host +- `Channel` / `ChannelPush` — the channel protocols +- `ChannelRequest` / `ChannelSession` / `ChannelIdentity` / `ResponseTarget` + — the request envelope and routing primitives +- `ChannelContext` / `ChannelContribution` / `ChannelCommand` — the + channel-side hooks for invoking the target and contributing routes, + commands, and lifecycle callbacks +- `ChannelRunHook` / `ChannelStreamTransformHook` — the per-request + customization seams + +Concrete channels live in their own packages so you only install what +you use: + +| Package | Transport | +|---|---| +| `agent-framework-hosting-responses` | OpenAI Responses API | +| `agent-framework-hosting-invocations` | Foundry-native invocation envelope | +| `agent-framework-hosting-telegram` | Telegram Bot API | +| `agent-framework-hosting-activity-protocol` | Bot Framework Activity Protocol (Teams, Direct Line, Web Chat, …) | +| `agent-framework-hosting-teams` | Microsoft Teams (Teams SDK) | +| `agent-framework-hosting-entra` | Entra (OAuth) identity-link sidecar | + +## Install + +```bash +pip install agent-framework-hosting agent-framework-hosting-responses +# or with hypercorn pre-installed for the demo `host.serve(...)` helper +pip install "agent-framework-hosting[serve]" agent-framework-hosting-responses +``` + +## Quickstart + +```python +from agent_framework import ChatAgent +from agent_framework.openai import OpenAIChatClient +from agent_framework_hosting import AgentFrameworkHost +from agent_framework_hosting_responses import ResponsesChannel + +agent = ChatAgent(name="Assistant", chat_client=OpenAIChatClient()) + +host = AgentFrameworkHost(target=agent, channels=[ResponsesChannel()]) +host.serve(port=8000) +``` + +See the [hosting samples](https://github.com/microsoft/agent-framework/tree/main/python/samples/04-hosting/af-hosting) +for richer multi-channel apps (Telegram + Teams + Responses fan-out, 
+identity linking, `ResponseTarget` routing, etc.). diff --git a/python/packages/hosting/agent_framework_hosting/__init__.py b/python/packages/hosting/agent_framework_hosting/__init__.py new file mode 100644 index 0000000000..9a7cbcadad --- /dev/null +++ b/python/packages/hosting/agent_framework_hosting/__init__.py @@ -0,0 +1,74 @@ +# Copyright (c) Microsoft. All rights reserved. + +"""Multi-channel hosting for Microsoft Agent Framework agents. + +Serve a single agent target through one or more **channels** — pluggable +adapters that expose the target over different transports such as the +OpenAI Responses API, Microsoft Teams, Telegram, and others. The base +package contains only the channel-neutral plumbing; concrete channels +ship in their own packages (``agent-framework-hosting-responses``, +``agent-framework-hosting-telegram``, …) so users install only what +they need. +""" + +import importlib.metadata + +from ._host import AgentFrameworkHost, ChannelContext, logger +from ._isolation import ( + ISOLATION_HEADER_CHAT, + ISOLATION_HEADER_USER, + IsolationKeys, + get_current_isolation_keys, + reset_current_isolation_keys, + set_current_isolation_keys, +) +from ._types import ( + Channel, + ChannelCommand, + ChannelCommandContext, + ChannelContribution, + ChannelIdentity, + ChannelPush, + ChannelRequest, + ChannelRunHook, + ChannelSession, + ChannelStreamTransformHook, + DeliveryReport, + HostedRunResult, + ResponseTarget, + ResponseTargetKind, + apply_run_hook, +) + +try: + __version__ = importlib.metadata.version(__name__) +except importlib.metadata.PackageNotFoundError: + __version__ = "0.0.0" + +__all__ = [ + "ISOLATION_HEADER_CHAT", + "ISOLATION_HEADER_USER", + "AgentFrameworkHost", + "Channel", + "ChannelCommand", + "ChannelCommandContext", + "ChannelContext", + "ChannelContribution", + "ChannelIdentity", + "ChannelPush", + "ChannelRequest", + "ChannelRunHook", + "ChannelSession", + "ChannelStreamTransformHook", + "DeliveryReport", + "HostedRunResult", + 
"IsolationKeys", + "ResponseTarget", + "ResponseTargetKind", + "__version__", + "apply_run_hook", + "get_current_isolation_keys", + "logger", + "reset_current_isolation_keys", + "set_current_isolation_keys", +] diff --git a/python/packages/hosting/agent_framework_hosting/_host.py b/python/packages/hosting/agent_framework_hosting/_host.py new file mode 100644 index 0000000000..92a0b1c45c --- /dev/null +++ b/python/packages/hosting/agent_framework_hosting/_host.py @@ -0,0 +1,946 @@ +# Copyright (c) Microsoft. All rights reserved. + +"""The :class:`AgentFrameworkHost` and its :class:`ChannelContext` bridge. + +The host is a tiny Starlette wrapper: + +- ``__init__`` accepts a hostable target (``SupportsAgentRun`` agent or + ``Workflow``) and a sequence of channels. +- :meth:`AgentFrameworkHost.app` lazily builds a Starlette app by calling + every channel's ``contribute`` and mounting the returned routes under + the channel's ``path`` (empty path → mount at the app root). +- :class:`ChannelContext` exposes ``run`` / ``run_stream`` / + ``deliver_response`` for channels to invoke; the host handles + per-``isolation_key`` session caching, identity tracking, and + :class:`ResponseTarget` fan-out. + +Per SPEC-002 (and ADR-0026), the host is intentionally thin so the bulk +of channel-specific behaviour stays in the channel package. Identity +linking, link policies, response targets, background runs, and the like +are pluggable extensions that the future identity/foundry packages will +contribute on top of this surface. 
+""" + +from __future__ import annotations + +import logging +import os +import uuid +from collections.abc import Awaitable, Callable, Sequence +from contextlib import AbstractContextManager, ExitStack, asynccontextmanager +from pathlib import Path +from typing import TYPE_CHECKING, Any, AsyncIterator, cast + +from agent_framework import ( + AgentResponse, + AgentResponseUpdate, + CheckpointStorage, + Content, + FileCheckpointStorage, + Message, + ResponseStream, + SupportsAgentRun, + Workflow, + WorkflowEvent, +) +from starlette.applications import Starlette +from starlette.middleware import Middleware +from starlette.requests import Request +from starlette.responses import PlainTextResponse +from starlette.routing import BaseRoute, Mount, Route +from starlette.types import ASGIApp, Receive, Scope, Send + +from ._isolation import ( + ISOLATION_HEADER_CHAT, + ISOLATION_HEADER_USER, + IsolationKeys, + reset_current_isolation_keys, + set_current_isolation_keys, +) +from ._types import ( + Channel, + ChannelIdentity, + ChannelPush, + ChannelRequest, + DeliveryReport, + HostedRunResult, + ResponseTargetKind, +) + +if TYPE_CHECKING: + pass + +logger = logging.getLogger("agent_framework.hosting") + + +def _workflow_output_to_text(value: Any) -> str: + """Render a single workflow ``output`` payload as plain text. + + ``AgentResponse`` and ``AgentResponseUpdate`` carry text natively; + everything else is best-effort ``str()``. + """ + text = getattr(value, "text", None) + if isinstance(text, str): + return text + return str(value) + + +def _workflow_event_to_update(event: WorkflowEvent[Any]) -> AgentResponseUpdate | None: + """Map a :class:`WorkflowEvent` to a channel-friendly :class:`AgentResponseUpdate`. + + Returns ``None`` for events the host should drop (anything that is not + user-visible output). The original event is preserved on the update's + ``raw_representation`` so consumers can recover full workflow context. 
+ """ + if event.type != "output": + return None + payload: Any = event.data + if isinstance(payload, AgentResponseUpdate): + # Already a streaming update — pass through but tag the source so + # downstream hooks can tell it came from a workflow executor. + if payload.raw_representation is None: + payload.raw_representation = event + return payload + text = _workflow_output_to_text(payload) + return AgentResponseUpdate( + contents=[Content.from_text(text=text)], + role="assistant", + author_name=event.executor_id, + raw_representation=event, + ) + + +@asynccontextmanager +async def _suppress_already_consumed() -> AsyncIterator[None]: # noqa: RUF029 + """Yield, swallowing the ``RuntimeError`` ``ResponseStream`` raises on double-consume. + + The bridge stream calls ``get_final_response()`` after iterating the + workflow stream so the workflow's cleanup hooks run; on some paths the + stream considers itself already finalized and raises, which we treat + as benign — we're only after the side effect. + """ + try: + yield + except RuntimeError as exc: + logger.debug("workflow stream finalize skipped: %s", exc) + except Exception: # pragma: no cover - defensive: never let cleanup hide the real result + logger.exception("workflow stream finalize failed") + + +class _BoundResponseStream: + """Adapter that keeps an :class:`ExitStack` open across stream iteration. + + Streaming runs return a :class:`ResponseStream` synchronously, but + consumption happens later (the channel iterates). For host-bound + request context (e.g. Foundry response-id binding) to survive that + gap, we hold the stack open until the underlying stream is exhausted + or :meth:`close` is called. We forward awaitable + async-iterator + + ``get_final_response`` semantics so the channel sees a normal + ``ResponseStream``-shaped object. 
+ """ + + def __init__(self, inner: Any, stack: ExitStack) -> None: + self._inner = inner + self._stack = stack + self._closed = False + + def _close(self) -> None: + if self._closed: + return + self._closed = True + self._stack.close() + + def __await__(self) -> Any: + # ``__await__`` returns a generator; closing here would be too + # eager — we close in ``__aiter__`` finally instead. Awaitable + # consumers (rare for streams) call ``aclose()`` separately. + return self._inner.__await__() + + def __aiter__(self) -> AsyncIterator[Any]: + return self._wrap() + + async def _wrap(self) -> AsyncIterator[Any]: + try: + async for item in self._inner: + yield item + finally: + self._close() + + async def get_final_response(self) -> Any: + try: + return await self._inner.get_final_response() + finally: + self._close() + + def __getattr__(self, name: str) -> Any: + return getattr(self._inner, name) + + +class ChannelContext: + """Host-owned bridge that channels call to invoke the target.""" + + def __init__(self, host: "AgentFrameworkHost") -> None: + """Bind the context to its owning :class:`AgentFrameworkHost`. + + The host instance is the source of truth for the target, registered + channels, identity stores, sessions, and lifecycle state. Channels + only ever receive a context; they never see the host directly. + """ + self._host = host + + @property + def target(self) -> SupportsAgentRun | Workflow: + """The hostable target the channel should invoke.""" + return self._host.target + + async def run(self, request: ChannelRequest) -> HostedRunResult: + """Invoke the target for ``request`` and return a channel-neutral result.""" + return await self._host._invoke(request) # pyright: ignore[reportPrivateUsage] + + def run_stream(self, request: ChannelRequest) -> ResponseStream[AgentResponseUpdate, AgentResponse]: + """Invoke the target with ``stream=True`` and return the agent's ResponseStream. 
+ + Channels iterate the stream directly (it acts like an AsyncGenerator) + and are responsible for delivering updates to their wire protocol. + Apply per-channel ``transform_hook`` callables during iteration to + rewrite or drop individual updates before they hit the wire. + """ + return self._host._invoke_stream(request) # pyright: ignore[reportPrivateUsage] + + async def deliver_response(self, request: ChannelRequest, payload: HostedRunResult) -> DeliveryReport: + """Resolve ``request.response_target`` and push ``payload`` to each destination. + + Returns a :class:`DeliveryReport` so the originating channel knows + whether to render the agent reply on its own wire (``originating`` + included in or implied by the target) or just acknowledge dispatch. + """ + return await self._host._deliver_response(request, payload) # pyright: ignore[reportPrivateUsage] + + +class _FoundryIsolationASGIMiddleware: + """Lift the two well-known Foundry isolation headers into a contextvar. + + The Foundry Hosted Agents runtime injects + ``x-agent-{user,chat}-isolation-key`` on every inbound HTTP request. + Storage providers that need partition-aware writes (notably + :class:`FoundryHostedAgentHistoryProvider`) read those keys via + :func:`get_current_isolation_keys` to avoid every channel having to + parse Foundry-specific headers itself. We intentionally inspect + only HTTP scopes; lifespan/websocket scopes are forwarded + untouched. When neither header is present the contextvar stays at + its default ``None``, so local-dev requests behave as before. 
+ """ + + def __init__(self, app: ASGIApp) -> None: + self.app = app + + async def __call__(self, scope: Scope, receive: Receive, send: Send) -> None: + if scope["type"] != "http": + await self.app(scope, receive, send) + return + user_key: str | None = None + chat_key: str | None = None + for raw_name, raw_value in scope.get("headers") or (): + name = raw_name.decode("latin-1").lower() + if name == ISOLATION_HEADER_USER: + user_key = raw_value.decode("latin-1") or None + elif name == ISOLATION_HEADER_CHAT: + chat_key = raw_value.decode("latin-1") or None + if user_key is None and chat_key is None: + await self.app(scope, receive, send) + return + token = set_current_isolation_keys(IsolationKeys(user_key=user_key, chat_key=chat_key)) + try: + await self.app(scope, receive, send) + finally: + reset_current_isolation_keys(token) + + +class AgentFrameworkHost: + """Owns one Starlette app, one hostable target, and a sequence of channels.""" + + def __init__( + self, + target: SupportsAgentRun | Workflow, + *, + channels: Sequence[Channel], + debug: bool = False, + checkpoint_location: str | os.PathLike[str] | CheckpointStorage | None = None, + ) -> None: + """Create a host for ``target`` and its channels. + + Args: + target: The hostable target to invoke from channels — either a + ``SupportsAgentRun``-compatible agent or a ``Workflow``. The + host detects the kind and dispatches to the appropriate + execution seam (``agent.run(...)`` vs ``workflow.run(message=...)``). + For workflow targets, channels (or their ``run_hook``) are + responsible for shaping ``ChannelRequest.input`` into the + workflow start executor's typed input. + channels: The channels to expose. Each channel contributes routes + and commands that are mounted under ``channel.path`` (defaulting + to the channel name). + debug: Whether to enable Starlette's debug mode (stack traces in + responses, etc.) and per-channel debug logging. 
+ checkpoint_location: When ``target`` is a :class:`Workflow`, the + location used to persist workflow checkpoints across requests. + Either a filesystem path (``str`` / ``PathLike``) — the host + creates a per-conversation + :class:`~agent_framework.FileCheckpointStorage` rooted at + ``checkpoint_location / `` — or a + :class:`~agent_framework.CheckpointStorage` instance the host + uses as-is (caller owns scoping). Per-request behaviour: + requests without ``ChannelRequest.session.isolation_key`` + are run without checkpointing. When set on a workflow that + already has its own checkpoint storage configured + (``WorkflowBuilder(checkpoint_storage=...)``), the host + refuses to start so ownership of checkpointing is + unambiguous. Ignored for ``SupportsAgentRun`` targets (a + warning is emitted). + """ + self.target: SupportsAgentRun | Workflow = target + self._is_workflow = isinstance(target, Workflow) + self.channels = list(channels) + self._debug = debug + self._app: Starlette | None = None + self._checkpoint_location: Path | CheckpointStorage | None = None + if checkpoint_location is not None: + if not self._is_workflow: + logger.warning("checkpoint_location is set but target is not a Workflow; ignoring.") + else: + workflow: Workflow = target # type: ignore[assignment] + if workflow._runner_context.has_checkpointing(): # type: ignore[reportPrivateUsage] + raise RuntimeError( + "Workflow already has checkpoint storage configured " + "(WorkflowBuilder(checkpoint_storage=...)). The host " + "manages checkpoints when checkpoint_location is set; " + "remove one of the two configurations." + ) + if isinstance(checkpoint_location, (str, os.PathLike)): + self._checkpoint_location = Path(os.fspath(checkpoint_location)) + else: + # Anything else is treated as a CheckpointStorage instance. + # ``CheckpointStorage`` is a non-runtime-checkable Protocol, + # so we cannot ``isinstance``-check it directly. 
+ self._checkpoint_location = checkpoint_location + # Per-isolation_key session cache. The real spec backs this with a + # pluggable session store; this base host keeps it in-process. + self._sessions: dict[str, Any] = {} + # ``isolation_key -> active session_id``. Normally identical to the + # isolation_key, but ``reset_session`` rotates this to a fresh id so + # the next turn starts a new ``AgentSession`` while the old history + # remains on disk under its original session_id. + self._session_aliases: dict[str, str] = {} + # Per-isolation_key identity registry: which channels we've seen this + # user on, and which native_id they used on each. Powers + # ResponseTarget.active / .channel(name) / .channels([...]) / + # .all_linked. + # Shape: { isolation_key: { channel_name: ChannelIdentity } }. + self._identities: dict[str, dict[str, ChannelIdentity]] = {} + # (isolation_key -> last-seen channel name) for ResponseTarget.active. + self._active: dict[str, str] = {} + + @property + def app(self) -> Starlette: + """Lazily build (and cache) the Starlette application.""" + if self._app is None: + self._app = self._build_app() + return self._app + + def serve( + self, + *, + host: str = "127.0.0.1", + port: int = 8000, + workers: int = 1, + **config_kwargs: Any, + ) -> None: + """Start the host on ``host:port`` using Hypercorn. + + Hypercorn is the same ASGI server the Foundry Hosted Agents + runtime uses for production deployments, so running locally with + the same server keeps dev/prod parity (Trio fallbacks, lifespan + semantics, HTTP/2 support, …). Install with the ``serve`` extra + (``pip install agent-framework-hosting[serve]``). + + Args: + host: Interface to bind. Defaults to ``127.0.0.1``. + port: TCP port to bind. Defaults to ``8000``. + workers: Number of worker processes. Defaults to ``1``; + Hypercorn's process model only kicks in for ``>1``. 
+ **config_kwargs: Forwarded to :class:`hypercorn.config.Config` + via attribute assignment, so any documented Hypercorn + config field (e.g. ``keep_alive_timeout=...``, + ``access_log_format=...``) can be set directly. + """ + try: + import asyncio + from typing import cast as _cast + + from hypercorn.asyncio import ( # pyright: ignore[reportMissingImports] + serve as _hypercorn_serve, # pyright: ignore[reportUnknownVariableType] + ) + from hypercorn.config import Config # pyright: ignore[reportMissingImports, reportUnknownVariableType] + except ImportError as exc: # pragma: no cover - exercised at runtime + raise RuntimeError( + "AgentFrameworkHost.serve() requires hypercorn. " + "Install with `pip install agent-framework-hosting[serve]` or `pip install hypercorn`." + ) from exc + + config = Config() # pyright: ignore[reportUnknownVariableType] + config.bind = [f"{host}:{port}"] # pyright: ignore[reportUnknownMemberType] + config.workers = workers # pyright: ignore[reportUnknownMemberType] + for key, value in config_kwargs.items(): + setattr(config, key, value) # pyright: ignore[reportUnknownArgumentType] + + # Touch ``self.app`` so the lifespan startup log fires once before + # we hand off to hypercorn — gives a single, readable banner of + # what the host is exposing without requiring channels to log + # individually. + app = self.app + self._log_startup(host=host, port=port, workers=workers) + + # ``hypercorn.asyncio.serve`` has a complex partially-typed signature + # (multiple ASGI/WSGI app overloads) and its ``Scope`` definition + # diverges from Starlette's; cast both sides to ``Any`` to keep the + # call site readable without sprinkling per-error suppressions. + serve_callable = _cast(Any, _hypercorn_serve) + asyncio.run(serve_callable(app, config)) + + def reset_session(self, isolation_key: str) -> None: + """Rotate ``isolation_key`` to a fresh session id without deleting history. 
+ + Old turns are preserved on disk under their original session id and + remain accessible by passing that id explicitly (e.g. as + ``previous_response_id``). Future requests using ``isolation_key`` + get a new, empty ``AgentSession``. + """ + new_id = f"{isolation_key}#{uuid.uuid4().hex[:8]}" + self._session_aliases[isolation_key] = new_id + self._sessions.pop(isolation_key, None) + + # -- internals --------------------------------------------------------- # + + def _log_startup(self, *, host: str, port: int, workers: int) -> None: + """Emit a single human-friendly startup banner. + + Mirrors the ``AgentServerHost`` convention from + ``azure.ai.agentserver.core``: one INFO line that captures the + target type, every channel + its mount path, the bind address, + whether we're running inside a Foundry Hosted Agents container, + and the worker count. Keeps log noise low while still giving an + operator a single grep-able anchor when triaging. + """ + target_kind = "Workflow" if isinstance(self.target, Workflow) else type(self.target).__name__ + target_name = getattr(self.target, "name", None) or target_kind + channels_repr = ", ".join( + f"{ch.name}@{ch.path or '/'}" # blank path means "mounted at root" + for ch in self.channels + ) + is_hosted = bool(os.environ.get("FOUNDRY_HOSTING_ENVIRONMENT")) + logger.info( + "AgentFrameworkHost starting: target=%s (%s) bind=%s:%d workers=%d hosted=%s channels=[%s]", + target_name, + target_kind, + host, + port, + workers, + is_hosted, + channels_repr or "", + ) + + def _build_app(self) -> Starlette: + context = ChannelContext(self) + routes: list[BaseRoute] = [] + on_startup: list[Callable[[], Awaitable[None]]] = [] + on_shutdown: list[Callable[[], Awaitable[None]]] = [] + + # ``/readiness`` is the standard probe path the Foundry Hosted Agents + # runtime hits to gate traffic. 
We expose it unconditionally — once the + # ASGI app is up the host considers itself ready (channels register + # their own startup hooks and may run before the first request, but + # readiness is intentionally cheap so the platform's probe never times + # out on transient channel work). Mounted first so a channel cannot + # accidentally shadow it. + async def _readiness(_request: Request) -> PlainTextResponse: # noqa: RUF029 + """Liveness/readiness probe handler used by Foundry Hosted Agents.""" + return PlainTextResponse("ok") + + routes.append(Route("/readiness", _readiness, methods=["GET"])) + + for channel in self.channels: + contribution = channel.contribute(context) + # Channels publish routes relative to their root; mount under channel.path. + # An empty path means "mount at the app root" — useful for single-channel hosts + # that don't want a prefix (e.g. ResponsesChannel exposing POST /responses directly). + if contribution.routes: + if channel.path: + routes.append(Mount(channel.path, routes=list(contribution.routes))) + else: + routes.extend(contribution.routes) + on_startup.extend(contribution.on_startup) + on_shutdown.extend(contribution.on_shutdown) + + @asynccontextmanager + async def lifespan(_app: Starlette) -> AsyncIterator[None]: + for cb in on_startup: + await cb() + try: + yield + finally: + for cb in on_shutdown: + await cb() + + return Starlette( + debug=self._debug, + routes=routes, + lifespan=lifespan, + middleware=[Middleware(_FoundryIsolationASGIMiddleware)], + ) + + def _build_run_kwargs(self, request: ChannelRequest) -> dict[str, Any]: + # The full spec resolves a ChannelSession into an AgentSession here, + # honors session_mode, and consults LinkPolicy / ResponseTarget. This + # base host keys a per-isolation_key AgentSession off the channel's + # session hint so context providers (FileHistoryProvider, …) on the + # target see one session per end user. 
        session = None
        if request.session_mode != "disabled" and request.session is not None:
            isolation_key = request.session.isolation_key
            if isolation_key is not None and hasattr(self.target, "create_session"):
                # An alias may redirect several isolation keys onto one session id.
                session_id = self._session_aliases.get(isolation_key, isolation_key)
                session = self._sessions.get(isolation_key)
                if session is None:
                    # ``create_session`` lives on agent-typed targets but not on
                    # ``Workflow``; the ``hasattr`` above guards the call site.
                    session = self.target.create_session(  # pyright: ignore[reportAttributeAccessIssue, reportUnknownVariableType, reportUnknownMemberType]
                        session_id=session_id
                    )
                    self._sessions[isolation_key] = session  # pyright: ignore[reportUnknownArgumentType]

        run_kwargs: dict[str, Any] = {}
        if session is not None:
            run_kwargs["session"] = session
        if request.options:
            run_kwargs["options"] = request.options
        return run_kwargs

    def _log_incoming(self, request: ChannelRequest, *, stream: bool) -> None:
        """Emit a one-line INFO summary for every incoming target invocation.

        When ``debug=True`` is set on the host, also dump the channel-native
        settings the channel attached to the ``ChannelRequest`` — ``options``
        (the ChatOptions-shaped fields the channel parsed from its protocol
        payload, e.g. temperature/tools/tool_choice for Responses), plus
        ``attributes`` / ``metadata`` (the channel's protocol-specific bag,
        e.g. ``chat_id`` / ``callback_query_id`` for Telegram).
        """
        isolation_key = request.session.isolation_key if request.session is not None else None
        logger.info(
            "channel=%s op=%s stream=%s session=%s session_mode=%s",
            request.channel,
            request.operation,
            stream,
            isolation_key,
            request.session_mode,
        )
        # Copies via ``dict(...)`` so lazily-evaluated mappings render fully in logs.
        logger.debug(
            " ↳ options=%s attributes=%s metadata=%s",
            dict(request.options) if request.options else {},
            dict(request.attributes) if request.attributes else {},
            dict(request.metadata) if request.metadata else {},
        )

    def _flat_context_providers(self) -> list[Any]:
        """Flatten ``target.context_providers`` one level for duck-typed hooks.

        ``ContextProviderBase`` aggregates child providers under a
        ``providers`` attribute when wrapped (e.g. by ``ChatClientAgent``).
        We descend one level so the host catches both styles without
        forcing a particular wiring on the agent.
        """
        providers = getattr(self.target, "context_providers", None) or ()
        flat: list[Any] = []
        for entry in providers:
            children = getattr(entry, "providers", None)
            if children:
                flat.extend(children)
            else:
                flat.append(entry)
        return flat

    def _bind_request_context(self, request: ChannelRequest) -> ExitStack:
        """Bind any per-request anchors a target's context-providers expose.

        Channels announce per-request anchors (currently ``response_id``
        and ``previous_response_id``) via ``ChannelRequest.attributes``.
        Some history providers — notably the Foundry hosted-agent history
        provider — need to write storage under the same ``response_id``
        the channel surfaces on its envelope so the next turn's
        ``previous_response_id`` walks the chain. Rather than the host
        knowing about specific provider classes, we duck-type: any
        context provider on the target that exposes a
        ``bind_request_context(response_id=..., previous_response_id=...,
        **_)`` context-manager gets it called with the request's
        attribute values. Per-request platform isolation keys are handled
        separately by :class:`_FoundryIsolationASGIMiddleware` (lifted
        off the inbound headers into a contextvar) so providers don't
        depend on channels to forward them. Bindings are scoped to the
        returned :class:`ExitStack` which the caller must enter before
        invoking the target and leave after the run completes.
        """
        stack = ExitStack()
        attrs = request.attributes or {}
        response_id = attrs.get("response_id")
        # Without a response_id there is nothing to anchor — return the empty stack.
        if not isinstance(response_id, str) or not response_id:
            return stack
        previous_response_id = attrs.get("previous_response_id")
        # Non-string previous ids are treated as absent rather than forwarded.
        if previous_response_id is not None and not isinstance(previous_response_id, str):
            previous_response_id = None

        flat: list[Any] = self._flat_context_providers()

        for provider in flat:
            bind = getattr(provider, "bind_request_context", None)
            if not callable(bind):
                continue
            stack.enter_context(
                cast(
                    "AbstractContextManager[Any]",
                    bind(
                        response_id=response_id,
                        previous_response_id=previous_response_id,
                    ),
                )
            )
        return stack

    async def _invoke(self, request: ChannelRequest) -> HostedRunResult:
        """Run the target once (non-streaming) and collapse to a :class:`HostedRunResult`."""
        self._log_incoming(request, stream=False)
        self._record_identity(request)
        if self._is_workflow:
            return await self._invoke_workflow(request)
        run_kwargs = self._build_run_kwargs(request)
        with self._bind_request_context(request):
            # ``_is_workflow`` is False here so ``self.target`` is an
            # ``Agent``-shaped target whose ``.run`` returns
            # :class:`AgentResponse`. Narrow back to keep ``result.text``
            # well-typed without conditional imports of ``Agent``.
            agent_target = cast("SupportsAgentRun", self.target)
            result = await agent_target.run(self._wrap_input(request), **run_kwargs)
        return HostedRunResult(text=result.text)

    def _invoke_stream(self, request: ChannelRequest) -> ResponseStream[AgentResponseUpdate, AgentResponse]:
        """Run the target in streaming mode and hand the live stream back to the channel."""
        self._log_incoming(request, stream=True)
        self._record_identity(request)
        if self._is_workflow:
            return self._invoke_workflow_stream(request)
        run_kwargs = self._build_run_kwargs(request)
        # ``run(stream=True)`` returns a ResponseStream synchronously (it is
        # itself awaitable / async-iterable). We hand it back to the channel
        # so the channel can drive iteration and apply its transform hook.
        # Streaming flows iterate after this method returns, which is
        # *outside* a sync ``with`` block — so we wrap the underlying
        # stream in an adapter that holds the binding open across the
        # iteration lifecycle.
        binder = self._bind_request_context(request)
        return _BoundResponseStream(  # type: ignore[return-value]
            self.target.run(self._wrap_input(request), stream=True, **run_kwargs),
            binder,
        )

    def _resolve_checkpoint_storage(self, request: ChannelRequest) -> CheckpointStorage | None:
        """Build (or return) the per-request checkpoint storage, or ``None``.

        Returns ``None`` when no ``checkpoint_location`` is configured or
        when the request lacks a stable session key — without a key we
        cannot scope checkpoints per conversation, and we'd rather skip
        checkpointing than pollute a single shared store.
        """
        if self._checkpoint_location is None:
            return None
        if request.session is None or not request.session.isolation_key:
            return None
        if isinstance(self._checkpoint_location, Path):
            # One sub-directory per isolation key so conversations never share checkpoints.
            return FileCheckpointStorage(str(self._checkpoint_location / request.session.isolation_key))
        # Caller-supplied storage — used as-is; caller owns scoping.
        return self._checkpoint_location

    async def _invoke_workflow(self, request: ChannelRequest) -> HostedRunResult:
        """Dispatch to ``Workflow.run`` and collapse outputs into a ``HostedRunResult``.

        The channel's ``run_hook`` is the canonical adapter for shaping
        ``request.input`` into the workflow start executor's typed input
        (free-form text from a Telegram message, structured ``Responses``
        ``input`` items, …). When no hook is wired, ``request.input`` is
        forwarded verbatim — appropriate for workflows whose start executor
        accepts the channel's native input type (commonly ``str``).

        When ``checkpoint_location`` is configured on the host, a
        per-conversation checkpoint storage is resolved, the workflow is
        restored from its latest checkpoint (if any) and then re-run with
        the new input — mirroring the resume semantics of the Foundry
        Responses host.
        """
        # Workflows do not own session state in the agent sense and do not
        # accept ``session=`` / ``options=`` kwargs. The channel's run_hook is
        # the seam for any per-run customization; nothing flows through here.
        workflow: Workflow = self.target  # type: ignore[assignment]
        storage = self._resolve_checkpoint_storage(request)
        if storage is not None:
            latest = await storage.get_latest(workflow_name=workflow.name)
            if latest is not None:
                # Restore in-memory state from the most recent checkpoint
                # before applying the new input.
                await workflow.run(checkpoint_id=latest.checkpoint_id, checkpoint_storage=storage)
            result = await workflow.run(request.input, checkpoint_storage=storage)
        else:
            result = await workflow.run(request.input)
        outputs = result.get_outputs()
        # Joined with newlines; an output-less run yields an empty reply.
        text = "\n".join(_workflow_output_to_text(o) for o in outputs) if outputs else ""
        return HostedRunResult(text=text)

    def _invoke_workflow_stream(self, request: ChannelRequest) -> ResponseStream[AgentResponseUpdate, AgentResponse]:
        """Bridge ``Workflow.run(stream=True)`` to a channel-facing ``ResponseStream``.

        Wraps the workflow's ``ResponseStream[WorkflowEvent, WorkflowRunResult]``
        in a new ``ResponseStream[AgentResponseUpdate, AgentResponse]`` so
        channels can iterate it identically to an agent stream and apply
        their ``stream_transform_hook`` callables.

        Mapping rules:

        - ``output`` events whose ``data`` is already an
          :class:`AgentResponseUpdate` (the common case for workflows
          containing :class:`AgentExecutor`) pass through unchanged.
        - ``output`` events with any other ``data`` are wrapped into a
          single-text-content :class:`AgentResponseUpdate`.
        - All other event types (``status``, ``executor_invoked``,
          ``superstep_*``, lifecycle, …) are filtered out — channels only
          care about user-visible text. Hooks can opt back in by inspecting
          ``raw_representation`` on the produced updates.

        The original :class:`WorkflowEvent` is stashed on
        ``AgentResponseUpdate.raw_representation`` so advanced consumers
        (telemetry, debug UIs) can recover the full workflow timeline.

        Checkpoint restoration (when ``checkpoint_location`` is set) runs
        before the input stream is opened so the new turn observes the
        restored state.
        """
        workflow: Workflow = self.target  # type: ignore[assignment]
        storage = self._resolve_checkpoint_storage(request)

        async def _maybe_restore() -> None:
            # No-op when checkpointing is off or no prior checkpoint exists.
            if storage is None:
                return
            latest = await storage.get_latest(workflow_name=workflow.name)
            if latest is None:
                return
            # Drain the restoration stream so the no-op invocation actually
            # rehydrates state before the real run starts.
            async for _ in workflow.run(
                stream=True,
                checkpoint_id=latest.checkpoint_id,
                checkpoint_storage=storage,
            ):
                pass

        async def _bridge() -> AsyncIterator[AgentResponseUpdate]:
            # Restore first so the real run below observes rehydrated state.
            await _maybe_restore()
            workflow_stream = workflow.run(request.input, stream=True, checkpoint_storage=storage)
            try:
                async for event in workflow_stream:
                    update = _workflow_event_to_update(event)
                    if update is not None:
                        yield update
            finally:
                # Finalize the underlying stream even on early exit; a stream
                # the consumer already finished raises, which we suppress.
                async with _suppress_already_consumed():
                    await workflow_stream.get_final_response()

        async def _finalize(updates: Sequence[AgentResponseUpdate]) -> AgentResponse:  # noqa: RUF029
            return AgentResponse.from_updates(updates)

        return ResponseStream[AgentResponseUpdate, AgentResponse](_bridge(), finalizer=_finalize)

    def _wrap_input(self, request: ChannelRequest) -> Message | list[Message]:
        """Promote ``request.input`` to ``Message``(s) carrying channel metadata.

        Channels deliver inputs as plain text, a single ``Message``, or a list
        of ``Message`` (e.g. a Responses-API request that includes a ``system``
        instruction plus the user turn). To preserve channel provenance +
        identity + ``response_target`` on the persisted history record (and
        make it visible to context providers, evals, audits), we attach a
        ``hosting`` block under ``additional_properties``. AF's
        ``Message.to_dict`` round-trips ``additional_properties`` through any
        ``HistoryProvider`` that serializes via ``to_dict`` (e.g.
        ``FileHistoryProvider``) and the framework explicitly does *not*
        forward these fields to model providers, so they are safe to attach.

        For a list of messages we attach the metadata to the LAST message that
        will be persisted (typically the user turn) — this keeps a single,
        searchable record of where the inbound message came from.
+ """ + hosting_meta: dict[str, Any] = {"channel": request.channel} + if request.identity is not None: + hosting_meta["identity"] = { + "channel": request.identity.channel, + "native_id": request.identity.native_id, + "attributes": dict(request.identity.attributes) if request.identity.attributes else {}, + } + target = request.response_target + hosting_meta["response_target"] = { + "kind": target.kind.value, + "targets": list(target.targets), + } + + raw = request.input + if isinstance(raw, Message): + raw.additional_properties = {**(raw.additional_properties or {}), "hosting": hosting_meta} + return raw + if isinstance(raw, list) and raw and all(isinstance(m, Message) for m in raw): + messages: list[Message] = [m for m in raw if isinstance(m, Message)] + last = messages[-1] + last.additional_properties = {**(last.additional_properties or {}), "hosting": hosting_meta} + return messages + # ``raw`` is typed as ``AgentRunInputs`` (str | Content | Message | Sequence[…]). + # The remaining cases are str / Content / Mapping — wrap as a single user message. + return Message( + role="user", + contents=[raw], # type: ignore[list-item] + additional_properties={"hosting": hosting_meta}, + ) + + def _record_identity(self, request: ChannelRequest) -> None: + """Update the per-``isolation_key`` identity registry + active-channel hint. + + Called on every successful resolve. ``ResponseTarget.active`` + consumes ``self._active``; ``ResponseTarget.channel(name)`` / + ``.channels([...])`` / ``.all_linked`` consume ``self._identities``. + """ + if request.identity is None or request.session is None: + return + key = request.session.isolation_key + if not key: + return + self._identities.setdefault(key, {})[request.identity.channel] = request.identity + self._active[key] = request.identity.channel + + async def _deliver_response(self, request: ChannelRequest, payload: HostedRunResult) -> DeliveryReport: + """Resolve ``request.response_target`` and call ``ChannelPush.push`` on each. 
+ + Per SPEC-002 §"ResponseTarget": for any non-``originating`` target, + the originating channel returns an acknowledgment and the actual + agent reply lands on the destination channel(s). When a destination + cannot be resolved (no known native id) or doesn't implement + ``ChannelPush``, it is dropped and surfaced in + :class:`DeliveryReport.skipped`. If every destination drops, we + fall back to delivering on the originating channel (matching the + spec's policy default). + """ + target = request.response_target + kind = target.kind + + # Fast paths for the trivial variants. + if kind == ResponseTargetKind.ORIGINATING: + return DeliveryReport(include_originating=True) + if kind == ResponseTargetKind.NONE: + # Background-only — drop the reply on the floor for now (no + # ContinuationToken in the prototype). + return DeliveryReport(include_originating=False) + + # Build the destination set. + include_originating = False + # Each entry is (channel_name, identity_override_or_None_to_lookup). + destinations: list[tuple[str, ChannelIdentity | None]] = [] + isolation_key = request.session.isolation_key if request.session is not None else None + known = self._identities.get(isolation_key or "", {}) + + if kind == ResponseTargetKind.ACTIVE: + active = self._active.get(isolation_key or "") + if active is None or active == request.channel: + # Fall back to originating when there's no other active + # channel known (matches the "first message" case). + return DeliveryReport(include_originating=True) + destinations.append((active, known.get(active))) + + elif kind == ResponseTargetKind.ALL_LINKED: + for channel_name, identity in known.items(): + if channel_name == request.channel: + include_originating = True + continue + destinations.append((channel_name, identity)) + if not destinations and not include_originating: + # No links recorded yet — fall back. 
+ return DeliveryReport(include_originating=True) + + elif kind == ResponseTargetKind.CHANNELS: + for entry in target.targets: + if entry == "originating": + include_originating = True + continue + if ":" in entry: + channel_name, _, native_id = entry.partition(":") + if channel_name == request.channel: + # Pointing the originating channel at itself with a + # specific native id — treat as "include + # originating" since the channel will reply on its + # own wire to that user anyway. + include_originating = True + continue + destinations.append((channel_name, ChannelIdentity(channel=channel_name, native_id=native_id))) + else: + if entry == request.channel: + include_originating = True + continue + destinations.append((entry, known.get(entry))) + + # Dispatch. + by_name = {ch.name: ch for ch in self.channels} + pushed: list[str] = [] + skipped: list[str] = [] + for channel_name, dest_identity in destinations: + channel = by_name.get(channel_name) + token = f"{channel_name}:{dest_identity.native_id}" if dest_identity is not None else channel_name + if channel is None: + logger.warning("deliver_response: no channel named %r (target=%s)", channel_name, token) + skipped.append(token) + continue + if not isinstance(channel, ChannelPush): + logger.warning( + "deliver_response: channel %r does not implement ChannelPush (target=%s)", + channel_name, + token, + ) + skipped.append(token) + continue + if dest_identity is None: + logger.warning( + "deliver_response: no known identity for isolation_key=%s on channel=%s", + isolation_key, + channel_name, + ) + skipped.append(token) + continue + try: + await channel.push(dest_identity, payload) + except Exception: + logger.exception("deliver_response: push failed for target=%s", token) + skipped.append(token) + continue + pushed.append(token) + logger.info("deliver_response: pushed to %s (%d chars)", token, len(payload.text)) + + if not pushed and not include_originating: + # Spec policy: if every destination drops, deliver to 
originating. + logger.warning("deliver_response: every destination dropped — falling back to originating") + include_originating = True + + return DeliveryReport( + include_originating=include_originating, + pushed=tuple(pushed), + skipped=tuple(skipped), + ) + + +__all__ = ["AgentFrameworkHost", "ChannelContext", "logger"] diff --git a/python/packages/hosting/agent_framework_hosting/_isolation.py b/python/packages/hosting/agent_framework_hosting/_isolation.py new file mode 100644 index 0000000000..53fb2f1e54 --- /dev/null +++ b/python/packages/hosting/agent_framework_hosting/_isolation.py @@ -0,0 +1,76 @@ +# Copyright (c) Microsoft. All rights reserved. + +"""Per-request isolation keys read from inbound HTTP headers. + +The Foundry Hosted Agents runtime injects two well-known headers on every +request it forwards to the user's container: + +* ``x-agent-user-isolation-key`` — opaque per-user partition key +* ``x-agent-chat-isolation-key`` — opaque per-conversation partition key + +When the headers are present we are running inside (or being driven by) the +Foundry runtime; when they are absent we are running in plain local dev. The +host installs an ASGI middleware in :meth:`AgentFrameworkHost._build_app` +that reads both headers off every inbound HTTP request and pushes them into +the :data:`current_isolation_keys` contextvar for the duration of the +request, then resets it. Providers that need partition-aware storage (most +notably ``FoundryHostedAgentHistoryProvider``) read the contextvar via +:func:`get_current_isolation_keys` and apply the keys to their backend +calls — so app authors don't have to wire any middleware themselves and +channels stay free of Foundry-specific header knowledge. + +The contextvar holds a plain :class:`IsolationKeys` mapping; conversion to +provider-specific types (e.g. Foundry's ``IsolationContext``) happens at +the consuming provider so this module has no provider dependencies. 
+""" + +from __future__ import annotations + +from contextvars import ContextVar, Token + +__all__ = [ + "ISOLATION_HEADER_CHAT", + "ISOLATION_HEADER_USER", + "IsolationKeys", + "current_isolation_keys", + "get_current_isolation_keys", + "reset_current_isolation_keys", + "set_current_isolation_keys", +] + + +ISOLATION_HEADER_USER = "x-agent-user-isolation-key" +ISOLATION_HEADER_CHAT = "x-agent-chat-isolation-key" + + +class IsolationKeys: + """Per-request Foundry isolation keys lifted off the inbound headers.""" + + def __init__(self, user_key: str | None = None, chat_key: str | None = None) -> None: + self.user_key = user_key + self.chat_key = chat_key + + @property + def is_empty(self) -> bool: + return self.user_key is None and self.chat_key is None + + +current_isolation_keys: ContextVar[IsolationKeys | None] = ContextVar( + "agent_framework_hosting_isolation_keys", + default=None, +) + + +def get_current_isolation_keys() -> IsolationKeys | None: + """Return the isolation keys bound to the current request, if any.""" + return current_isolation_keys.get() + + +def set_current_isolation_keys(keys: IsolationKeys | None) -> Token[IsolationKeys | None]: + """Bind ``keys`` to the current async context and return a reset token.""" + return current_isolation_keys.set(keys) + + +def reset_current_isolation_keys(token: Token[IsolationKeys | None]) -> None: + """Restore the isolation contextvar to its prior value.""" + current_isolation_keys.reset(token) diff --git a/python/packages/hosting/agent_framework_hosting/_types.py b/python/packages/hosting/agent_framework_hosting/_types.py new file mode 100644 index 0000000000..7d200a3266 --- /dev/null +++ b/python/packages/hosting/agent_framework_hosting/_types.py @@ -0,0 +1,376 @@ +# Copyright (c) Microsoft. All rights reserved. + +# ``ChannelRequest`` is the only intentional dataclass here (callers use +# ``dataclasses.replace`` on it in run hooks). 
# The other types are plain
# Python classes by preference, so the "could be a dataclass" lint is muted
# at the file level.
# ruff: noqa: B903

"""Channel-neutral request envelope and channel protocol types.

These types form the boundary between the host and individual channels.
A channel parses its native payload, builds a :class:`ChannelRequest`, and
hands it to :class:`ChannelContext.run` (or ``run_stream``) on the host.
The host normalizes the request into a single agent invocation and either
returns the result to the originating channel or fans out via
:class:`ResponseTarget` to other channels that implement
:class:`ChannelPush`.

See ``docs/specs/002-python-hosting-channels.md`` for the full design.
"""

from __future__ import annotations

from collections.abc import Awaitable, Callable, Mapping, Sequence
from dataclasses import dataclass, field
from enum import Enum
from typing import TYPE_CHECKING, Any, Protocol, runtime_checkable

from agent_framework import (
    AgentResponse,
    AgentResponseUpdate,
    AgentRunInputs,
    ResponseStream,
    SupportsAgentRun,
    Workflow,
)
from starlette.routing import BaseRoute

if TYPE_CHECKING:
    from ._host import ChannelContext


# --------------------------------------------------------------------------- #
# Channel-neutral request envelope
# --------------------------------------------------------------------------- #


# Shared read-only default for optional attribute bags; never mutated.
_EMPTY_MAPPING: Mapping[str, Any] = {}


class ChannelSession:
    """Channel-supplied session hint.

    The host turns this into an ``AgentSession`` keyed by ``isolation_key`` so
    every distinct end user gets their own context-provider state (e.g. one
    ``FileHistoryProvider`` JSONL file per user).
    """

    def __init__(self, isolation_key: str | None = None) -> None:
        # ``None`` means the channel could not (or chose not to) identify the
        # caller; the host then skips session reuse for this request.
        self.isolation_key = isolation_key


class ChannelIdentity:
    """Channel-native identity the host sees on each request.

    Consumed by the host's identity registry. The host uses it for two things:

    1. Recording the active channel for an ``isolation_key`` so
       ``ResponseTarget.active`` resolves correctly.
    2. Telling :class:`ChannelPush` ``push`` recipients **where** in their
       native namespace to deliver — Telegram uses ``native_id`` as the
       chat id, Teams as the conversation/AAD id, etc.
    """

    def __init__(
        self,
        channel: str,
        native_id: str,
        attributes: Mapping[str, Any] | None = None,
    ) -> None:
        self.channel = channel
        self.native_id = native_id
        # Fall back to the shared empty mapping so callers can always iterate.
        self.attributes: Mapping[str, Any] = attributes if attributes is not None else _EMPTY_MAPPING


class ResponseTargetKind(str, Enum):
    """Discriminator for :class:`ResponseTarget` variants."""

    ORIGINATING = "originating"
    ACTIVE = "active"
    CHANNELS = "channels"
    ALL_LINKED = "all_linked"
    NONE = "none"


class ResponseTarget:
    """Per-request directive controlling **where** the host delivers the agent reply.

    Independent of ``session_mode``. Construct via the classmethod helpers or
    use the module-level singletons rather than touching ``kind`` directly.
    Variants:

    - ``ResponseTarget.originating`` (default) — synchronous response on the
      originating channel only.
    - ``ResponseTarget.active`` — push to the channel most recently observed
      for the resolved ``isolation_key``.
    - ``ResponseTarget.channel("teams")`` / ``.channels([...])`` — push to
      one or more named destinations. Each entry is either a bare channel
      name (host resolves the native id from its identity registry) or a
      ``"channel:native_id"`` token (used verbatim). The pseudo-name
      ``"originating"`` includes the originating channel in the fan-out.
    - ``ResponseTarget.all_linked`` — push to every channel where the
      resolved ``isolation_key`` has been observed.
    - ``ResponseTarget.none`` — background-only; in the prototype this just
      suppresses the originating reply (no ``ContinuationToken`` yet).

    Instances are intended to be treated as immutable; the singletons are
    shared across the process.
    """

    def __init__(
        self,
        kind: ResponseTargetKind = ResponseTargetKind.ORIGINATING,
        targets: tuple[str, ...] = (),
    ) -> None:
        self.kind = kind
        self.targets = targets

    # -- builders ---------------------------------------------------------- #

    @classmethod
    def channel(cls, name: str) -> "ResponseTarget":
        """Target a single named destination channel."""
        return cls(kind=ResponseTargetKind.CHANNELS, targets=(name,))

    @classmethod
    def channels(cls, names: Sequence[str]) -> "ResponseTarget":
        """Target an explicit list of destination channels."""
        return cls(kind=ResponseTargetKind.CHANNELS, targets=tuple(names))

    # -- value semantics --------------------------------------------------- #
    # ``ResponseTarget`` is treated as immutable, so two instances with the
    # same ``kind`` + ``targets`` are interchangeable. Tests and channel
    # parsers compare instances with ``==`` and use them as dict keys.

    def __eq__(self, other: object) -> bool:
        if not isinstance(other, ResponseTarget):
            return NotImplemented
        # ``is`` is safe for ``kind``: enum members are singletons.
        return self.kind is other.kind and self.targets == other.targets

    def __hash__(self) -> int:
        return hash((self.kind, self.targets))

    def __repr__(self) -> str:
        if self.kind is ResponseTargetKind.CHANNELS:
            return f"ResponseTarget.channels({list(self.targets)!r})"
        return f"ResponseTarget.{self.kind.value}"


# Module-level singletons so callers can write ``ResponseTarget.originating``
# (matching the spec's classmethod-style notation) without juggling Python's
# no-zero-arg-classmethod-property limitation.
ResponseTarget.originating = ResponseTarget(kind=ResponseTargetKind.ORIGINATING)  # type: ignore[attr-defined]
ResponseTarget.active = ResponseTarget(kind=ResponseTargetKind.ACTIVE)  # type: ignore[attr-defined]
ResponseTarget.all_linked = ResponseTarget(kind=ResponseTargetKind.ALL_LINKED)  # type: ignore[attr-defined]
ResponseTarget.none = ResponseTarget(kind=ResponseTargetKind.NONE)  # type: ignore[attr-defined]


@dataclass
class ChannelRequest:
    """Uniform invocation envelope every channel produces from its native payload.

    Kept as a dataclass so app authors can use ``dataclasses.replace(...)`` in
    run hooks to produce a modified envelope without re-listing every field.
    """

    channel: str
    operation: str  # e.g. "message.create", "command.invoke"
    input: AgentRunInputs
    session: ChannelSession | None = None
    options: Mapping[str, Any] | None = None
    session_mode: str = "auto"  # "auto" | "required" | "disabled"
    # ``dict`` directly as the factory — equivalent to ``lambda: {}`` but the
    # idiomatic spelling; each instance still gets its own fresh mapping.
    metadata: Mapping[str, Any] = field(default_factory=dict)
    attributes: Mapping[str, Any] = field(default_factory=dict)
    stream: bool = False
    identity: ChannelIdentity | None = None
    # The ``originating`` singleton is shared and treated as immutable, so a
    # factory returning it (rather than a fresh instance) is safe.
    response_target: ResponseTarget = field(default_factory=lambda: ResponseTarget.originating)  # type: ignore[attr-defined]


class ChannelCommand:
    """A discoverable command a channel exposes to its users (e.g. ``/reset``)."""

    def __init__(
        self,
        name: str,
        description: str,
        handle: Callable[["ChannelCommandContext"], Awaitable[None]],
    ) -> None:
        self.name = name
        self.description = description
        # Async handler the channel awaits when the command fires.
        self.handle = handle


class ChannelCommandContext:
    """Context passed to a :class:`ChannelCommand` handler."""

    def __init__(
        self,
        request: ChannelRequest,
        reply: Callable[[str], Awaitable[None]],
    ) -> None:
        self.request = request
        # Channel-provided callback that sends text back on the channel's wire.
        self.reply = reply


# Shared immutable defaults so every ``ChannelContribution()`` call does not
# allocate fresh empty tuples.
_EMPTY_ROUTES: tuple[BaseRoute, ...] = ()
_EMPTY_COMMANDS: tuple[ChannelCommand, ...] = ()
_EMPTY_LIFECYCLE: tuple[Callable[[], Awaitable[None]], ...] = ()


class ChannelContribution:
    """Routes, commands, and lifecycle hooks a channel contributes to the host."""

    def __init__(
        self,
        routes: Sequence[BaseRoute] = _EMPTY_ROUTES,
        commands: Sequence[ChannelCommand] = _EMPTY_COMMANDS,
        on_startup: Sequence[Callable[[], Awaitable[None]]] = _EMPTY_LIFECYCLE,
        on_shutdown: Sequence[Callable[[], Awaitable[None]]] = _EMPTY_LIFECYCLE,
    ) -> None:
        self.routes = routes
        self.commands = commands
        self.on_startup = on_startup
        self.on_shutdown = on_shutdown


class HostedRunResult:
    """Channel-neutral result of an agent invocation routed through the host."""

    def __init__(self, text: str) -> None:
        self.text = text


class DeliveryReport:
    """What :meth:`ChannelContext.deliver_response` did with a payload.

    The originating channel uses ``include_originating`` to decide whether
    to render the agent reply on its own wire (``True`` — default for the
    ``originating`` target, or when ``"originating"`` is one of the listed
    destinations) or to return only an acknowledgement (``False`` — when
    the target lists only out-of-band destinations).
    """

    def __init__(
        self,
        include_originating: bool,
        pushed: tuple[str, ...] = (),
        skipped: tuple[str, ...] = (),
    ) -> None:
        self.include_originating = include_originating
        self.pushed = pushed  # destination tokens delivered to (e.g. "telegram:123")
        self.skipped = skipped  # destinations resolved but skipped (no push, failed, …)


# A transform hook runs over each AgentResponseUpdate as the channel consumes
# the stream. It can return a replacement update, ``None`` to drop the update,
# or be async. Channels apply it during iteration so that channel-specific
# concerns (e.g. masking, redaction, formatting for the wire) live close to
# the channel rather than on the agent.
ChannelStreamTransformHook = Callable[
    [AgentResponseUpdate],
    "AgentResponseUpdate | Awaitable[AgentResponseUpdate | None] | None",
]


# --------------------------------------------------------------------------- #
# Channel run hook
# --------------------------------------------------------------------------- #


# Run hooks accept the channel-built ``ChannelRequest`` and return a
# (possibly modified) replacement. Channels invoke the hook with both the
# request and the channel-side context as keyword arguments — the call
# convention is ``await hook(request, target=..., protocol_request=...)``.
#
# The ergonomic minimum for a hook implementation is therefore a function
# accepting ``request`` positionally plus ``**kwargs`` and returning a
# (possibly mutated) :class:`ChannelRequest`. Hooks that need the agent
# target or the raw channel-native payload pull them off the keyword
# arguments by name (``target`` / ``protocol_request``).
#
# ``protocol_request`` is the raw, channel-native payload the channel
# parsed (the JSON body for Responses, the Telegram ``Update`` dict, the
# Bot Framework ``Activity`` for Teams). Use it when the hook needs a
# field the channel did not lift onto ``ChannelRequest`` (e.g. OpenAI's
# ``safety_identifier``, Teams' ``from.aadObjectId``, …).
ChannelRunHook = Callable[..., "Awaitable[ChannelRequest] | ChannelRequest"]


async def apply_run_hook(
    hook: ChannelRunHook,
    request: ChannelRequest,
    *,
    target: SupportsAgentRun | Workflow,
    protocol_request: Any | None,
) -> ChannelRequest:
    """Channel-side helper to invoke a :data:`ChannelRunHook` with the standard kwargs.

    Channels call this rather than calling the hook directly so the
    invocation convention (``request`` positional, ``target`` /
    ``protocol_request`` keyword) is enforced in one place.
    """
    result = hook(request, target=target, protocol_request=protocol_request)
    # Hooks may be sync or async; await only when the hook returned an awaitable.
    if isinstance(result, Awaitable):
        return await result
    return result


# --------------------------------------------------------------------------- #
# Channel protocols
# --------------------------------------------------------------------------- #


@runtime_checkable
class Channel(Protocol):
    """A pluggable adapter that exposes one transport on the host.

    Channels publish their routes, commands, and lifecycle callbacks via
    :meth:`contribute`. The host mounts them under the channel's ``path``
    (or at the app root when ``path == ""``) and gives the channel a
    :class:`ChannelContext` so it can call back into the host to invoke
    the agent target and deliver responses.
    """

    name: str
    path: str  # default mount path (e.g. "/responses"); use "" to mount routes at the app root

    def contribute(self, context: "ChannelContext") -> ChannelContribution: ...


@runtime_checkable
class ChannelPush(Protocol):
    """Optional capability: a channel that can deliver outbound messages without a prior request.

    Per SPEC-002 (req #13), channels that can do proactive delivery
    (Telegram bot proactive message, Teams proactive bot message,
    webhook callbacks, SSE broadcasts) implement ``push`` on top of the
    base :class:`Channel` protocol. Channels without push can only be
    addressed as the ``originating`` :class:`ResponseTarget`.
    """

    name: str

    async def push(self, identity: ChannelIdentity, payload: HostedRunResult) -> None: ...
+ + +__all__ = [ + "AgentResponse", + "AgentResponseUpdate", + "Channel", + "ChannelCommand", + "ChannelCommandContext", + "ChannelContribution", + "ChannelIdentity", + "ChannelPush", + "ChannelRequest", + "ChannelRunHook", + "ChannelSession", + "ChannelStreamTransformHook", + "DeliveryReport", + "HostedRunResult", + "ResponseStream", + "ResponseTarget", + "ResponseTargetKind", + "apply_run_hook", +] diff --git a/python/packages/hosting/pyproject.toml b/python/packages/hosting/pyproject.toml new file mode 100644 index 0000000000..57c79854bb --- /dev/null +++ b/python/packages/hosting/pyproject.toml @@ -0,0 +1,107 @@ +[project] +name = "agent-framework-hosting" +description = "Multi-channel hosting for Microsoft Agent Framework agents." +authors = [{ name = "Microsoft", email = "af-support@microsoft.com"}] +readme = "README.md" +requires-python = ">=3.10" +version = "1.0.0a260424" +license-files = ["LICENSE"] +urls.homepage = "https://aka.ms/agent-framework" +urls.source = "https://github.com/microsoft/agent-framework/tree/main/python" +urls.release_notes = "https://github.com/microsoft/agent-framework/releases?q=tag%3Apython-1&expanded=true" +urls.issues = "https://github.com/microsoft/agent-framework/issues" +classifiers = [ + "License :: OSI Approved :: MIT License", + "Development Status :: 3 - Alpha", + "Intended Audience :: Developers", + "Programming Language :: Python :: 3", + "Programming Language :: Python :: 3.10", + "Programming Language :: Python :: 3.11", + "Programming Language :: Python :: 3.12", + "Programming Language :: Python :: 3.13", + "Programming Language :: Python :: 3.14", + "Typing :: Typed", +] +dependencies = [ + "agent-framework-core>=1.2.0,<2", + "starlette>=0.37", +] + +[project.optional-dependencies] +serve = [ + "hypercorn>=0.17", +] + +[tool.uv] +prerelease = "if-necessary-or-explicit" +environments = [ + "sys_platform == 'darwin'", + "sys_platform == 'linux'", + "sys_platform == 'win32'" +] + +[tool.uv-dynamic-versioning] 
+fallback-version = "0.0.0" + +[tool.pytest.ini_options] +testpaths = 'tests' +addopts = "-ra -q -r fEX" +asyncio_mode = "auto" +asyncio_default_fixture_loop_scope = "function" +filterwarnings = [] +timeout = 120 +markers = [ + "integration: marks tests as integration tests that require external services", +] + +[tool.ruff] +extend = "../../pyproject.toml" + +[tool.coverage.run] +omit = [ + "**/__init__.py" +] + +[tool.pyright] +extends = "../../pyproject.toml" +include = ["agent_framework_hosting"] +exclude = ['tests'] + +[tool.mypy] +plugins = ['pydantic.mypy'] +strict = true +python_version = "3.10" +ignore_missing_imports = true +disallow_untyped_defs = true +no_implicit_optional = true +check_untyped_defs = true +warn_return_any = true +show_error_codes = true +warn_unused_ignores = false +disallow_incomplete_defs = true +disallow_untyped_decorators = true + +[tool.bandit] +targets = ["agent_framework_hosting"] +exclude_dirs = ["tests"] + +[tool.poe] +executor.type = "uv" +include = "../../shared_tasks.toml" + +[tool.poe.tasks.mypy] +help = "Run MyPy for this package." +cmd = "mypy --config-file $POE_ROOT/pyproject.toml agent_framework_hosting" + +[tool.poe.tasks.test] +help = "Run the default unit test suite for this package." +cmd = 'pytest -m "not integration" --cov=agent_framework_hosting --cov-report=term-missing:skip-covered tests' + +[build-system] +requires = ["flit-core >= 3.11,<4.0"] +build-backend = "flit_core.buildapi" + +[dependency-groups] +dev = [ + "httpx>=0.28.1", +] diff --git a/python/packages/hosting/tests/__init__.py b/python/packages/hosting/tests/__init__.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/python/packages/hosting/tests/_workflow_fixtures.py b/python/packages/hosting/tests/_workflow_fixtures.py new file mode 100644 index 0000000000..f59bb8cab8 --- /dev/null +++ b/python/packages/hosting/tests/_workflow_fixtures.py @@ -0,0 +1,43 @@ +# Copyright (c) Microsoft. All rights reserved. 
+ +"""Workflow fixtures for hosting tests. + +Defined in a module that does not use ``from __future__ import annotations`` +because the workflow handler validation reflects on real annotation objects +rather than stringified forms. +""" + +from agent_framework import Executor, Workflow, WorkflowBuilder, WorkflowContext, handler + + +class _UpperExecutor(Executor): + @handler + async def handle(self, text: str, ctx: WorkflowContext[str]) -> None: + await ctx.yield_output(text.upper()) + + +class _EchoExecutor(Executor): + @handler + async def handle(self, text: str, ctx: WorkflowContext[str]) -> None: + await ctx.yield_output(text) + + +def build_upper_workflow() -> Workflow: + return WorkflowBuilder(start_executor=_UpperExecutor(id="upper")).build() + + +def build_echo_workflow() -> Workflow: + return WorkflowBuilder(start_executor=_EchoExecutor(id="echo")).build() + + +class _MultiChunkExecutor(Executor): + """Yields three separate ``output`` events so streaming has something to chew on.""" + + @handler + async def handle(self, text: str, ctx: WorkflowContext[str]) -> None: + for chunk in (f"{text}-1", f"{text}-2", f"{text}-3"): + await ctx.yield_output(chunk) + + +def build_multi_chunk_workflow() -> Workflow: + return WorkflowBuilder(start_executor=_MultiChunkExecutor(id="multi")).build() diff --git a/python/packages/hosting/tests/test_host.py b/python/packages/hosting/tests/test_host.py new file mode 100644 index 0000000000..bb6d7d5963 --- /dev/null +++ b/python/packages/hosting/tests/test_host.py @@ -0,0 +1,714 @@ +# Copyright (c) Microsoft. All rights reserved. 
+ +"""Tests for :class:`AgentFrameworkHost` invocation, session, and delivery routing.""" + +from __future__ import annotations + +from collections.abc import AsyncIterator, Sequence +from dataclasses import dataclass, field +from typing import Any + +import pytest +from agent_framework import AgentResponseUpdate +from starlette.requests import Request +from starlette.responses import JSONResponse +from starlette.routing import BaseRoute, Route +from starlette.testclient import TestClient + +from agent_framework_hosting import ( + AgentFrameworkHost, + Channel, + ChannelContext, + ChannelContribution, + ChannelIdentity, + ChannelPush, + ChannelRequest, + ChannelSession, + HostedRunResult, + ResponseTarget, +) + + +async def _ping(_request: Request) -> JSONResponse: + return JSONResponse({"ok": True}) + + +# --------------------------------------------------------------------------- # +# Fakes # +# --------------------------------------------------------------------------- # + + +@dataclass +class _FakeAgentSession: + session_id: str | None = None + service_session_id: str | None = None + + +@dataclass +class _FakeAgentResponse: + text: str + + +class _FakeAgent: + """Minimal :class:`SupportsAgentRun` implementation that records invocations.""" + + def __init__(self, reply: str = "ok") -> None: + self._reply = reply + self.calls: list[dict[str, Any]] = [] + self.created_sessions: list[_FakeAgentSession] = [] + + def create_session(self, *, session_id: str | None = None) -> _FakeAgentSession: + s = _FakeAgentSession(session_id=session_id) + self.created_sessions.append(s) + return s + + async def run(self, messages: Any = None, *, stream: bool = False, session: Any = None, **kwargs: Any) -> Any: + self.calls.append({"messages": messages, "stream": stream, "session": session, "kwargs": kwargs}) + if stream: # pragma: no cover - not used by these tests + + async def _gen() -> AsyncIterator[Any]: + yield self._reply + + return _gen() + return 
_FakeAgentResponse(text=self._reply) + + +class _RecordingChannel: + """Minimal :class:`Channel` + :class:`ChannelPush` for routing tests.""" + + def __init__(self, name: str = "fake", path: str = "/fake", supports_push: bool = True) -> None: + self.name = name + self.path = path + self.context: ChannelContext | None = None + self.pushes: list[tuple[ChannelIdentity, HostedRunResult]] = [] + self._push_raises: Exception | None = None + self._supports_push = supports_push + # Provide a single trivial route so contribute() exercises the mount path. + self._routes: Sequence[BaseRoute] = (Route("/ping", _ping),) + + def contribute(self, context: ChannelContext) -> ChannelContribution: + self.context = context + return ChannelContribution(routes=self._routes) + + async def push(self, identity: ChannelIdentity, payload: HostedRunResult) -> None: + if self._push_raises is not None: + raise self._push_raises + self.pushes.append((identity, payload)) + + +class _NoPushChannel: + """A channel that does NOT implement :class:`ChannelPush`.""" + + def __init__(self, name: str = "nopush", path: str = "/nopush") -> None: + self.name = name + self.path = path + + def contribute(self, context: ChannelContext) -> ChannelContribution: + return ChannelContribution() + + +@dataclass +class _LifecycleChannel: + name: str = "lifecycle" + path: str = "" + started: list[str] = field(default_factory=list) + stopped: list[str] = field(default_factory=list) + + def contribute(self, context: ChannelContext) -> ChannelContribution: + async def on_start() -> None: + self.started.append("up") + + async def on_stop() -> None: + self.stopped.append("down") + + return ChannelContribution(on_startup=[on_start], on_shutdown=[on_stop]) + + +# --------------------------------------------------------------------------- # +# Host wiring # +# --------------------------------------------------------------------------- # + + +class TestHostWiring: + def test_channel_is_recognized(self) -> None: + ch = 
_RecordingChannel() + assert isinstance(ch, Channel) + assert isinstance(ch, ChannelPush) + + def test_app_mounts_channel_routes_under_path(self) -> None: + agent = _FakeAgent() + ch = _RecordingChannel(path="/fake") + host = AgentFrameworkHost(target=agent, channels=[ch]) + + with TestClient(host.app) as client: + r = client.get("/fake/ping") + assert r.status_code == 200 + assert r.json() == {"ok": True} + + def test_app_mounts_at_root_when_path_is_empty(self) -> None: + agent = _FakeAgent() + ch = _RecordingChannel(path="") + host = AgentFrameworkHost(target=agent, channels=[ch]) + + with TestClient(host.app) as client: + r = client.get("/ping") + assert r.status_code == 200 + + def test_app_is_cached(self) -> None: + host = AgentFrameworkHost(target=_FakeAgent(), channels=[_RecordingChannel()]) + assert host.app is host.app + + def test_lifespan_invokes_startup_and_shutdown(self) -> None: + agent = _FakeAgent() + ch = _LifecycleChannel() + host = AgentFrameworkHost(target=agent, channels=[ch]) + with TestClient(host.app): + assert ch.started == ["up"] + assert ch.stopped == ["down"] + + def test_app_exposes_readiness_probe(self) -> None: + host = AgentFrameworkHost(target=_FakeAgent(), channels=[_RecordingChannel()]) + with TestClient(host.app) as client: + r = client.get("/readiness") + assert r.status_code == 200 + assert r.text == "ok" + + +# --------------------------------------------------------------------------- # +# Invoke + sessions # +# --------------------------------------------------------------------------- # + + +class TestHostInvoke: + @pytest.mark.asyncio + async def test_invoke_wraps_input_with_hosting_metadata(self) -> None: + agent = _FakeAgent(reply="hello") + ch = _RecordingChannel(name="responses") + host = AgentFrameworkHost(target=agent, channels=[ch]) + # Force ``app`` build to trigger ``contribute``. 
+ _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel="responses", + operation="message.create", + input="hi", + session=ChannelSession(isolation_key="user:1"), + identity=ChannelIdentity(channel="responses", native_id="user:1"), + ) + result = await ch.context.run(req) + + assert result.text == "hello" + assert len(agent.calls) == 1 + msg = agent.calls[0]["messages"] + assert msg.role == "user" + assert msg.additional_properties["hosting"]["channel"] == "responses" + assert msg.additional_properties["hosting"]["identity"] == { + "channel": "responses", + "native_id": "user:1", + "attributes": {}, + } + assert msg.additional_properties["hosting"]["response_target"] == { + "kind": "originating", + "targets": [], + } + + @pytest.mark.asyncio + async def test_invoke_caches_session_per_isolation_key(self) -> None: + agent = _FakeAgent() + ch = _RecordingChannel() + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req_a = ChannelRequest( + channel=ch.name, operation="op", input="1", session=ChannelSession(isolation_key="alice") + ) + req_b = ChannelRequest( + channel=ch.name, operation="op", input="2", session=ChannelSession(isolation_key="alice") + ) + req_c = ChannelRequest(channel=ch.name, operation="op", input="3", session=ChannelSession(isolation_key="bob")) + + await ch.context.run(req_a) + await ch.context.run(req_b) + await ch.context.run(req_c) + + # Two distinct sessions created (alice, bob) — never re-created. 
+ assert len(agent.created_sessions) == 2 + assert agent.calls[0]["session"] is agent.calls[1]["session"] + assert agent.calls[0]["session"] is not agent.calls[2]["session"] + + @pytest.mark.asyncio + async def test_session_disabled_does_not_create_session(self) -> None: + agent = _FakeAgent() + ch = _RecordingChannel() + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel=ch.name, + operation="op", + input="x", + session=ChannelSession(isolation_key="alice"), + session_mode="disabled", + ) + await ch.context.run(req) + assert agent.created_sessions == [] + assert agent.calls[0]["session"] is None + + @pytest.mark.asyncio + async def test_reset_session_rotates_id_and_drops_cache(self) -> None: + agent = _FakeAgent() + ch = _RecordingChannel() + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest(channel=ch.name, operation="op", input="x", session=ChannelSession(isolation_key="alice")) + await ch.context.run(req) + first_session = agent.calls[-1]["session"] + assert first_session.session_id == "alice" + + host.reset_session("alice") + await ch.context.run(req) + second_session = agent.calls[-1]["session"] + # New session, new id (alias rotation), distinct object. 
+ assert second_session is not first_session + assert second_session.session_id != "alice" + assert second_session.session_id.startswith("alice#") + + @pytest.mark.asyncio + async def test_options_propagates_to_target_run(self) -> None: + agent = _FakeAgent() + ch = _RecordingChannel() + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel=ch.name, + operation="op", + input="x", + session=ChannelSession(isolation_key="alice"), + options={"temperature": 0.4}, + ) + await ch.context.run(req) + assert agent.calls[0]["kwargs"]["options"] == {"temperature": 0.4} + + +# --------------------------------------------------------------------------- # +# Workflow target # +# --------------------------------------------------------------------------- # + + +class TestHostWorkflowTarget: + """The host accepts a ``Workflow`` and dispatches to ``workflow.run(...)``.""" + + @pytest.mark.asyncio + async def test_invoke_workflow_collapses_outputs_to_hosted_run_result(self) -> None: + from tests._workflow_fixtures import build_upper_workflow + + workflow = build_upper_workflow() + ch = _RecordingChannel() + host = AgentFrameworkHost(target=workflow, channels=[ch]) + _ = host.app + assert ch.context is not None + + # The channel's run_hook is the canonical adapter from a free-form input + # to a workflow's typed input; here the start executor accepts ``str`` + # already so the channel forwards ``input`` verbatim. + req = ChannelRequest(channel="fake", operation="message.create", input="hello") + result = await ch.context.run(req) + + assert result.text == "HELLO" + # No session caching for workflow targets — Workflow has no + # ``create_session`` and the host must not invent one. 
+ assert host._sessions == {} + + @pytest.mark.asyncio + async def test_stream_workflow_yields_updates_and_finalizes(self) -> None: + from tests._workflow_fixtures import build_echo_workflow + + workflow = build_echo_workflow() + ch = _RecordingChannel() + host = AgentFrameworkHost(target=workflow, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest(channel="fake", operation="message.create", input="hi") + stream = ch.context.run_stream(req) + + updates: list[AgentResponseUpdate] = [] + async for update in stream: + updates.append(update) + + # The echo workflow yields a single ``output`` event whose payload is + # the original string; the host wraps non-update payloads into a + # one-shot ``AgentResponseUpdate`` carrying the text. + assert [u.text for u in updates] == ["hi"] + # ``raw_representation`` preserves the source ``WorkflowEvent`` so + # advanced consumers (telemetry, debug UIs) can recover the full + # workflow timeline. + assert all(u.raw_representation is not None for u in updates) + + final = await stream.get_final_response() + assert final.text == "hi" + + @pytest.mark.asyncio + async def test_stream_workflow_yields_one_update_per_output_event(self) -> None: + from tests._workflow_fixtures import build_multi_chunk_workflow + + workflow = build_multi_chunk_workflow() + ch = _RecordingChannel() + host = AgentFrameworkHost(target=workflow, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest(channel="fake", operation="message.create", input="x") + stream = ch.context.run_stream(req) + + chunks: list[str] = [] + async for update in stream: + chunks.append(update.text) + # The originating ``executor_id`` is propagated via author_name so + # multi-agent workflows can route per-author rendering downstream. 
+ assert update.author_name == "multi" + + assert chunks == ["x-1", "x-2", "x-3"] + final = await stream.get_final_response() + assert final.text == "x-1x-2x-3" + + +class TestHostWorkflowCheckpointing: + """The host scopes per-conversation checkpoints when ``checkpoint_location`` is set.""" + + def test_rejects_workflow_with_existing_checkpoint_storage(self, tmp_path: Any) -> None: + from agent_framework import InMemoryCheckpointStorage, WorkflowBuilder + + from tests._workflow_fixtures import _UpperExecutor + + workflow = WorkflowBuilder( + start_executor=_UpperExecutor(id="upper"), + checkpoint_storage=InMemoryCheckpointStorage(), + ).build() + with pytest.raises(RuntimeError, match="already has checkpoint storage"): + AgentFrameworkHost( + target=workflow, + channels=[_RecordingChannel()], + checkpoint_location=tmp_path, + ) + + def test_warns_when_target_is_agent(self, tmp_path: Any, caplog: Any) -> None: + import logging as _logging + + agent = _FakeAgent() + with caplog.at_level(_logging.WARNING, logger="agent_framework.hosting"): + host = AgentFrameworkHost(target=agent, channels=[_RecordingChannel()], checkpoint_location=tmp_path) + assert host._checkpoint_location is None + assert any("checkpoint_location" in rec.message for rec in caplog.records) + + @pytest.mark.asyncio + async def test_invoke_skips_checkpointing_when_no_isolation_key(self, tmp_path: Any) -> None: + from tests._workflow_fixtures import build_upper_workflow + + workflow = build_upper_workflow() + ch = _RecordingChannel() + host = AgentFrameworkHost(target=workflow, channels=[ch], checkpoint_location=tmp_path) + _ = host.app + assert ch.context is not None + + # No session -> no scoping key -> no checkpoint storage written. 
+ req = ChannelRequest(channel="fake", operation="message.create", input="hi") + result = await ch.context.run(req) + + assert result.text == "HI" + assert list(tmp_path.iterdir()) == [] + + @pytest.mark.asyncio + async def test_invoke_writes_checkpoint_under_isolation_key(self, tmp_path: Any) -> None: + from tests._workflow_fixtures import build_upper_workflow + + workflow = build_upper_workflow() + ch = _RecordingChannel() + host = AgentFrameworkHost(target=workflow, channels=[ch], checkpoint_location=tmp_path) + _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel="fake", + operation="message.create", + input="hi", + session=ChannelSession(isolation_key="alice"), + ) + result = await ch.context.run(req) + assert result.text == "HI" + + # FileCheckpointStorage rooted at / should + # have produced at least one checkpoint file scoped to that user. + scoped = tmp_path / "alice" + assert scoped.exists() + assert any(scoped.iterdir()), "expected at least one checkpoint to be written under the per-user dir" + + @pytest.mark.asyncio + async def test_stream_writes_checkpoint_under_isolation_key(self, tmp_path: Any) -> None: + from tests._workflow_fixtures import build_echo_workflow + + workflow = build_echo_workflow() + ch = _RecordingChannel() + host = AgentFrameworkHost(target=workflow, channels=[ch], checkpoint_location=tmp_path) + _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel="fake", + operation="message.create", + input="hi", + session=ChannelSession(isolation_key="bob"), + ) + stream = ch.context.run_stream(req) + async for _ in stream: + pass + await stream.get_final_response() + + scoped = tmp_path / "bob" + assert scoped.exists() + assert any(scoped.iterdir()) + + @pytest.mark.asyncio + async def test_caller_supplied_checkpoint_storage_used_as_is(self, tmp_path: Any) -> None: + from agent_framework import InMemoryCheckpointStorage + + from tests._workflow_fixtures import build_upper_workflow + + 
storage = InMemoryCheckpointStorage() + workflow = build_upper_workflow() + ch = _RecordingChannel() + host = AgentFrameworkHost(target=workflow, channels=[ch], checkpoint_location=storage) + _ = host.app + assert ch.context is not None + assert host._checkpoint_location is storage + + req = ChannelRequest( + channel="fake", + operation="message.create", + input="hi", + session=ChannelSession(isolation_key="carol"), + ) + await ch.context.run(req) + + # The caller-owned storage is used directly (no per-user scoping + # applied by the host); a checkpoint should appear in it. + checkpoints = await storage.list_checkpoints(workflow_name=workflow.name) + assert checkpoints, "expected the caller-supplied storage to receive a checkpoint" + # And nothing should have been written into the tmp_path tree. + assert list(tmp_path.iterdir()) == [] + + +# --------------------------------------------------------------------------- # +# Delivery routing # +# --------------------------------------------------------------------------- # + + +def _make_host_with_two_channels() -> tuple[AgentFrameworkHost, _RecordingChannel, _RecordingChannel, ChannelContext]: + agent = _FakeAgent() + a = _RecordingChannel(name="responses", path="/r") + b = _RecordingChannel(name="telegram", path="/t") + host = AgentFrameworkHost(target=agent, channels=[a, b]) + _ = host.app + assert a.context is not None + return host, a, b, a.context + + +def _record_identity_on(host: AgentFrameworkHost, isolation_key: str, channel: str, native_id: str) -> None: + """Pre-seed the host's identity registry by running a request.""" + host._identities.setdefault(isolation_key, {})[channel] = ChannelIdentity(channel=channel, native_id=native_id) + host._active[isolation_key] = channel + + +class TestDeliverResponse: + @pytest.mark.asyncio + async def test_originating_returns_include_originating(self) -> None: + _, _, _, ctx = _make_host_with_two_channels() + req = ChannelRequest(channel="responses", operation="op", 
input="x") + report = await ctx.deliver_response(req, HostedRunResult(text="reply")) + assert report.include_originating is True + assert report.pushed == () + assert report.skipped == () + + @pytest.mark.asyncio + async def test_none_suppresses_everything(self) -> None: + _, _, _, ctx = _make_host_with_two_channels() + req = ChannelRequest( + channel="responses", + operation="op", + input="x", + response_target=ResponseTarget.none, # type: ignore[attr-defined] + ) + report = await ctx.deliver_response(req, HostedRunResult(text="reply")) + assert report.include_originating is False + assert report.pushed == () + assert report.skipped == () + + @pytest.mark.asyncio + async def test_active_pushes_to_other_channel(self) -> None: + host, a, b, ctx = _make_host_with_two_channels() + # Alice was last seen on telegram. + _record_identity_on(host, "alice", "telegram", "42") + # Now she sends a message via responses; ResponseTarget.active should + # push to telegram, not back to responses. + req = ChannelRequest( + channel="responses", + operation="op", + input="x", + session=ChannelSession(isolation_key="alice"), + response_target=ResponseTarget.active, # type: ignore[attr-defined] + ) + report = await ctx.deliver_response(req, HostedRunResult(text="reply")) + assert report.include_originating is False + assert report.pushed == ("telegram:42",) + assert b.pushes and b.pushes[0][0].native_id == "42" + + @pytest.mark.asyncio + async def test_active_falls_back_to_originating_when_self(self) -> None: + host, _a, _b, ctx = _make_host_with_two_channels() + _record_identity_on(host, "alice", "responses", "user:1") + req = ChannelRequest( + channel="responses", + operation="op", + input="x", + session=ChannelSession(isolation_key="alice"), + response_target=ResponseTarget.active, # type: ignore[attr-defined] + ) + report = await ctx.deliver_response(req, HostedRunResult(text="reply")) + assert report.include_originating is True + + @pytest.mark.asyncio + async def 
test_channels_with_unknown_identity_skipped(self) -> None: + _, _, _, ctx = _make_host_with_two_channels() + # No prior identity seeded for telegram on alice. + req = ChannelRequest( + channel="responses", + operation="op", + input="x", + session=ChannelSession(isolation_key="alice"), + response_target=ResponseTarget.channel("telegram"), + ) + report = await ctx.deliver_response(req, HostedRunResult(text="reply")) + # Skipped → fallback to originating. + assert report.include_originating is True + assert report.skipped == ("telegram",) + assert report.pushed == () + + @pytest.mark.asyncio + async def test_channels_with_explicit_native_id_token(self) -> None: + _, _, b, ctx = _make_host_with_two_channels() + req = ChannelRequest( + channel="responses", + operation="op", + input="x", + response_target=ResponseTarget.channel("telegram:99"), + ) + report = await ctx.deliver_response(req, HostedRunResult(text="reply")) + assert report.pushed == ("telegram:99",) + assert report.include_originating is False + assert b.pushes[0][0].native_id == "99" + + @pytest.mark.asyncio + async def test_channels_originating_pseudo_includes_origin(self) -> None: + host, _a, _b, ctx = _make_host_with_two_channels() + _record_identity_on(host, "alice", "telegram", "42") + req = ChannelRequest( + channel="responses", + operation="op", + input="x", + session=ChannelSession(isolation_key="alice"), + response_target=ResponseTarget.channels(["originating", "telegram"]), + ) + report = await ctx.deliver_response(req, HostedRunResult(text="reply")) + assert report.include_originating is True + assert report.pushed == ("telegram:42",) + + @pytest.mark.asyncio + async def test_channels_unknown_channel_name_skipped(self) -> None: + _, _, _, ctx = _make_host_with_two_channels() + req = ChannelRequest( + channel="responses", + operation="op", + input="x", + response_target=ResponseTarget.channel("nope"), + ) + report = await ctx.deliver_response(req, HostedRunResult(text="reply")) + assert 
report.include_originating is True # fallback + assert report.skipped == ("nope",) + + @pytest.mark.asyncio + async def test_no_push_capability_skipped(self) -> None: + agent = _FakeAgent() + a = _RecordingChannel(name="responses", path="/r") + b = _NoPushChannel(name="nopush", path="/n") + host = AgentFrameworkHost(target=agent, channels=[a, b]) + _ = host.app + assert a.context is not None + # Pre-seed identity on the no-push channel so we get past the + # identity check and hit the ChannelPush check. + host._identities.setdefault("alice", {})["nopush"] = ChannelIdentity(channel="nopush", native_id="42") + req = ChannelRequest( + channel="responses", + operation="op", + input="x", + session=ChannelSession(isolation_key="alice"), + response_target=ResponseTarget.channel("nopush"), + ) + report = await a.context.deliver_response(req, HostedRunResult(text="reply")) + assert report.skipped == ("nopush:42",) + assert report.include_originating is True # fallback + + @pytest.mark.asyncio + async def test_all_linked_pushes_to_every_other_channel(self) -> None: + host, _a, b, ctx = _make_host_with_two_channels() + # Alice on responses (originating) and telegram. 
+ host._identities.setdefault("alice", {}) + host._identities["alice"]["responses"] = ChannelIdentity(channel="responses", native_id="user:1") + host._identities["alice"]["telegram"] = ChannelIdentity(channel="telegram", native_id="42") + req = ChannelRequest( + channel="responses", + operation="op", + input="x", + session=ChannelSession(isolation_key="alice"), + response_target=ResponseTarget.all_linked, # type: ignore[attr-defined] + ) + report = await ctx.deliver_response(req, HostedRunResult(text="reply")) + assert report.include_originating is True + assert report.pushed == ("telegram:42",) + assert b.pushes and b.pushes[0][1].text == "reply" + + @pytest.mark.asyncio + async def test_all_linked_no_other_channels_falls_back(self) -> None: + host, _a, _b, ctx = _make_host_with_two_channels() + req = ChannelRequest( + channel="responses", + operation="op", + input="x", + session=ChannelSession(isolation_key="alice"), + response_target=ResponseTarget.all_linked, # type: ignore[attr-defined] + ) + report = await ctx.deliver_response(req, HostedRunResult(text="reply")) + assert report.include_originating is True + assert report.pushed == () + + @pytest.mark.asyncio + async def test_push_exception_marks_skipped(self) -> None: + host, _a, b, ctx = _make_host_with_two_channels() + b._push_raises = RuntimeError("boom") # type: ignore[attr-defined] + host._identities.setdefault("alice", {})["telegram"] = ChannelIdentity(channel="telegram", native_id="42") + req = ChannelRequest( + channel="responses", + operation="op", + input="x", + session=ChannelSession(isolation_key="alice"), + response_target=ResponseTarget.channel("telegram"), + ) + report = await ctx.deliver_response(req, HostedRunResult(text="reply")) + assert report.skipped == ("telegram:42",) + assert report.include_originating is True # fallback diff --git a/python/packages/hosting/tests/test_types.py b/python/packages/hosting/tests/test_types.py new file mode 100644 index 0000000000..76531dfe49 --- /dev/null 
+++ b/python/packages/hosting/tests/test_types.py @@ -0,0 +1,105 @@ +# Copyright (c) Microsoft. All rights reserved. + +"""Tests for the channel-neutral envelope types in :mod:`agent_framework_hosting._types`.""" + +from __future__ import annotations + +from agent_framework_hosting import ( + ChannelIdentity, + ChannelRequest, + ChannelSession, + ResponseTarget, + ResponseTargetKind, +) + + +class TestResponseTarget: + def test_originating_default_singleton(self) -> None: + target = ResponseTarget.originating # type: ignore[attr-defined] + assert target.kind is ResponseTargetKind.ORIGINATING + assert target.targets == () + + def test_active_singleton(self) -> None: + target = ResponseTarget.active # type: ignore[attr-defined] + assert target.kind is ResponseTargetKind.ACTIVE + assert target.targets == () + + def test_all_linked_singleton(self) -> None: + target = ResponseTarget.all_linked # type: ignore[attr-defined] + assert target.kind is ResponseTargetKind.ALL_LINKED + + def test_none_singleton(self) -> None: + target = ResponseTarget.none # type: ignore[attr-defined] + assert target.kind is ResponseTargetKind.NONE + + def test_channel_builder_single(self) -> None: + target = ResponseTarget.channel("teams") + assert target.kind is ResponseTargetKind.CHANNELS + assert target.targets == ("teams",) + + def test_channels_builder_list(self) -> None: + target = ResponseTarget.channels(["teams", "telegram", "originating"]) + assert target.kind is ResponseTargetKind.CHANNELS + assert target.targets == ("teams", "telegram", "originating") + + def test_channels_builder_accepts_tuple(self) -> None: + target = ResponseTarget.channels(("a", "b")) + assert target.targets == ("a", "b") + + def test_target_is_hashable(self) -> None: + # Plain class — hashing falls back to identity, which is fine here: + # the two keys below are different instances (singleton vs builder). 
+ d = {ResponseTarget.originating: 1, ResponseTarget.channel("t"): 2} # type: ignore[attr-defined] + assert len(d) == 2 + + +class TestChannelRequest: + def test_required_fields_only(self) -> None: + req = ChannelRequest(channel="responses", operation="message.create", input="hi") + assert req.channel == "responses" + assert req.operation == "message.create" + assert req.input == "hi" + assert req.session is None + assert req.options is None + assert req.session_mode == "auto" + assert req.metadata == {} + assert req.attributes == {} + assert req.stream is False + assert req.identity is None + # Default response target is the originating singleton. + assert req.response_target.kind is ResponseTargetKind.ORIGINATING + + def test_default_response_target_is_originating_singleton(self) -> None: + # Every new request shares the module-level ``originating`` singleton + # by default — instances are intended to be treated as immutable, so + # sharing is safe and avoids per-request allocation. + a = ChannelRequest(channel="a", operation="op", input="x") + b = ChannelRequest(channel="b", operation="op", input="y") + assert a.response_target is ResponseTarget.originating # type: ignore[attr-defined] + assert a.response_target is b.response_target + + def test_with_session_and_identity(self) -> None: + req = ChannelRequest( + channel="telegram", + operation="message.create", + input="hi", + session=ChannelSession(isolation_key="user:42"), + identity=ChannelIdentity(channel="telegram", native_id="42"), + response_target=ResponseTarget.active, # type: ignore[attr-defined] + ) + assert req.session is not None + assert req.session.isolation_key == "user:42" + assert req.identity is not None + assert req.identity.channel == "telegram" + assert req.identity.native_id == "42" + assert req.response_target.kind is ResponseTargetKind.ACTIVE + + +class TestChannelIdentity: + def test_attributes_default_empty_mapping(self) -> None: + ident = ChannelIdentity(channel="teams", 
native_id="abc") + assert dict(ident.attributes) == {} + + def test_attributes_passthrough(self) -> None: + ident = ChannelIdentity(channel="teams", native_id="abc", attributes={"role": "user"}) + assert dict(ident.attributes) == {"role": "user"} diff --git a/python/pyproject.toml b/python/pyproject.toml index b788f48e71..406aaf6efc 100644 --- a/python/pyproject.toml +++ b/python/pyproject.toml @@ -85,6 +85,7 @@ agent-framework-foundry-hosting = { workspace = true } agent-framework-foundry-local = { workspace = true } agent-framework-gemini = { workspace = true } agent-framework-github-copilot = { workspace = true } +agent-framework-hosting = { workspace = true } agent-framework-hyperlight = { workspace = true } agent-framework-lab = { workspace = true } agent-framework-mem0 = { workspace = true } @@ -205,6 +206,7 @@ executionEnvironments = [ { root = "packages/foundry/tests", reportPrivateUsage = "none" }, { root = "packages/foundry_local/tests", reportPrivateUsage = "none" }, { root = "packages/github_copilot/tests", reportPrivateUsage = "none" }, + { root = "packages/hosting/tests", reportPrivateUsage = "none" }, { root = "packages/lab/gaia/tests", reportPrivateUsage = "none" }, { root = "packages/lab/lightning/tests", reportPrivateUsage = "none" }, { root = "packages/lab/tau2/tests", reportPrivateUsage = "none" }, diff --git a/python/uv.lock b/python/uv.lock index 85a968174a..a4b58d2270 100644 --- a/python/uv.lock +++ b/python/uv.lock @@ -47,6 +47,7 @@ members = [ "agent-framework-foundry-local", "agent-framework-gemini", "agent-framework-github-copilot", + "agent-framework-hosting", "agent-framework-hyperlight", "agent-framework-lab", "agent-framework-mem0", @@ -599,6 +600,36 @@ requires-dist = [ { name = "github-copilot-sdk", marker = "python_full_version >= '3.11'", specifier = ">=0.2.1,<=0.2.1" }, ] +[[package]] +name = "agent-framework-hosting" +version = "1.0.0a260424" +source = { editable = "packages/hosting" } +dependencies = [ + { name = 
"agent-framework-core", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" }, + { name = "starlette", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" }, +] + +[package.optional-dependencies] +serve = [ + { name = "hypercorn", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" }, +] + +[package.dev-dependencies] +dev = [ + { name = "httpx", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" }, +] + +[package.metadata] +requires-dist = [ + { name = "agent-framework-core", editable = "packages/core" }, + { name = "hypercorn", marker = "extra == 'serve'", specifier = ">=0.17" }, + { name = "starlette", specifier = ">=0.37" }, +] +provides-extras = ["serve"] + +[package.metadata.requires-dev] +dev = [{ name = "httpx", specifier = ">=0.28.1" }] + [[package]] name = "agent-framework-hyperlight" version = "1.0.0a260429" @@ -1636,7 +1667,7 @@ name = "clr-loader" version = "0.2.10" source = { registry = "https://pypi.org/simple" } dependencies = [ - { name = "cffi", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" }, + { name = "cffi", marker = "(python_full_version < '3.14' and sys_platform == 'darwin') or (python_full_version < '3.14' and sys_platform == 'linux') or (python_full_version < '3.14' and sys_platform == 'win32')" }, ] sdist = { url = "https://files.pythonhosted.org/packages/18/24/c12faf3f61614b3131b5c98d3bf0d376b49c7feaa73edca559aeb2aee080/clr_loader-0.2.10.tar.gz", hash = "sha256:81f114afbc5005bafc5efe5af1341d400e22137e275b042a8979f3feb9fc9446", size = 83605, upload-time = "2026-01-03T23:13:06.984Z" } wheels = [ @@ -5132,8 +5163,8 @@ name = "powerfx" version = "0.0.34" source = { registry = "https://pypi.org/simple" } dependencies = [ - { name = "cffi", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = 
"pythonnet", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" }, + { name = "cffi", marker = "(python_full_version < '3.14' and sys_platform == 'darwin') or (python_full_version < '3.14' and sys_platform == 'linux') or (python_full_version < '3.14' and sys_platform == 'win32')" }, + { name = "pythonnet", marker = "(python_full_version < '3.14' and sys_platform == 'darwin') or (python_full_version < '3.14' and sys_platform == 'linux') or (python_full_version < '3.14' and sys_platform == 'win32')" }, ] sdist = { url = "https://files.pythonhosted.org/packages/9f/fb/6c4bf87e0c74ca1c563921ce89ca1c5785b7576bca932f7255cdf81082a7/powerfx-0.0.34.tar.gz", hash = "sha256:956992e7afd272657ed16d80f4cad24ec95d9e4a79fb9dfa4a068a09e136af32", size = 3237555, upload-time = "2025-12-22T15:50:59.682Z" } wheels = [ @@ -5806,7 +5837,7 @@ name = "pythonnet" version = "3.0.5" source = { registry = "https://pypi.org/simple" } dependencies = [ - { name = "clr-loader", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" }, + { name = "clr-loader", marker = "(python_full_version < '3.14' and sys_platform == 'darwin') or (python_full_version < '3.14' and sys_platform == 'linux') or (python_full_version < '3.14' and sys_platform == 'win32')" }, ] sdist = { url = "https://files.pythonhosted.org/packages/9a/d6/1afd75edd932306ae9bd2c2d961d603dc2b52fcec51b04afea464f1f6646/pythonnet-3.0.5.tar.gz", hash = "sha256:48e43ca463941b3608b32b4e236db92d8d40db4c58a75ace902985f76dac21cf", size = 239212, upload-time = "2024-12-13T08:30:44.393Z" } wheels = [ From 9786cbb4c14c29dce1c84867e0877003009562d2 Mon Sep 17 00:00:00 2001 From: eavanvalkenburg Date: Wed, 6 May 2026 16:03:17 +0200 Subject: [PATCH 2/6] fix(hosting): address PR-2 review comments MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Source-code changes - _suppress_already_consumed: narrow contract — RuntimeError now logs at 
WARNING with exc_info; non-RuntimeError still logs at exception(). Docstring clarifies that any non-clean teardown is observable. - _BoundResponseStream: add aclose() and route __await__ through get_final_response() so the binding is always released — fixes contextvar leak when channels abandon the stream or use the await-the-stream convenience. - Lifespan: aggregate startup/shutdown callback errors; every callback runs, all failures are logged with their qualname, and the first error is re-raised so Starlette still aborts boot. - _build_run_kwargs: switch session-cache write to dict.setdefault so concurrent racers cannot orphan a session if create_session ever yields. - _deliver_response: introduce DeliveryReport.failed for push outages vs explicit "no link" drops; an outage no longer triggers an originating fallback so the channel can decide degraded behaviour. Test additions - tests/test_isolation.py (new): full coverage of IsolationKeys, the contextvar helpers, header constants, and end-to-end ASGI middleware lift / reset / passthrough. - tests/test_host.py: TestBindRequestContext, TestBoundResponseStream (aclose / __await__ / __getattr__ forwarding / double-close idempotency), TestWrapInputListMessages (list[Message] LAST precedence), TestLifespanAggregation (startup + shutdown). - tests/test_types.py: TestApplyRunHook (sync/async/None), and TestDeliveryReport (new failed field). - Updated test_push_exception_marks_skipped -> test_push_exception_lands_in_failed_no_fallback to match the new delivery contract. 
Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com> --- .../hosting/agent_framework_hosting/_host.py | 164 ++++- .../hosting/agent_framework_hosting/_types.py | 27 +- python/packages/hosting/tests/test_host.py | 575 +++++++++++++++++- .../packages/hosting/tests/test_isolation.py | 284 +++++++++ python/packages/hosting/tests/test_types.py | 123 ++++ 5 files changed, 1140 insertions(+), 33 deletions(-) create mode 100644 python/packages/hosting/tests/test_isolation.py diff --git a/python/packages/hosting/agent_framework_hosting/_host.py b/python/packages/hosting/agent_framework_hosting/_host.py index 92a0b1c45c..14d044235e 100644 --- a/python/packages/hosting/agent_framework_hosting/_host.py +++ b/python/packages/hosting/agent_framework_hosting/_host.py @@ -26,10 +26,10 @@ import logging import os import uuid -from collections.abc import Awaitable, Callable, Sequence +from collections.abc import AsyncIterator, Awaitable, Callable, Sequence from contextlib import AbstractContextManager, ExitStack, asynccontextmanager from pathlib import Path -from typing import TYPE_CHECKING, Any, AsyncIterator, cast +from typing import TYPE_CHECKING, Any, cast from agent_framework import ( AgentResponse, @@ -112,19 +112,37 @@ def _workflow_event_to_update(event: WorkflowEvent[Any]) -> AgentResponseUpdate @asynccontextmanager async def _suppress_already_consumed() -> AsyncIterator[None]: # noqa: RUF029 - """Yield, swallowing the ``RuntimeError`` ``ResponseStream`` raises on double-consume. + """Yield, swallowing finalizer failures so consumer cleanup never crashes the host. The bridge stream calls ``get_final_response()`` after iterating the workflow stream so the workflow's cleanup hooks run; on some paths the - stream considers itself already finalized and raises, which we treat - as benign — we're only after the side effect. + stream considers itself already finalized (or its inner stream was + closed by ``__anext__`` auto-finalization) and the finalizer raises. 
+ We are inside an async-generator ``finally`` block during teardown, + so we MUST NOT propagate — that would mask the iteration's real + result and cascade into the channel's own cleanup. We always log + with ``exc_info=True`` so the swallowed failure is observable in + operator logs (a regression in the workflow's own cleanup hooks + would otherwise vanish into a clean run). """ try: yield - except RuntimeError as exc: - logger.debug("workflow stream finalize skipped: %s", exc) - except Exception: # pragma: no cover - defensive: never let cleanup hide the real result - logger.exception("workflow stream finalize failed") + except RuntimeError: + # Documented benign cases: ``ResponseStream`` raises + # ``RuntimeError("Inner stream not available")`` on certain + # double-finalize paths, and async-iteration teardown of a + # workflow whose tasks were already cancelled can surface + # ``RuntimeError("Event loop is closed")`` here. Promoted from + # ``debug`` to ``warning`` so production deploys see the + # signal and a real bug doesn't masquerade as benign noise. + logger.warning("workflow stream finalize raised RuntimeError; cleanup skipped", exc_info=True) + except Exception: + # Anything else (checkpoint write failure, context-provider + # error in a cleanup hook, executor-side bug, …) is a real + # problem. ``logger.exception`` includes the traceback and + # routes at ERROR so it's grep-able in production. We still + # don't propagate — see the docstring. + logger.exception("workflow stream finalize raised an unexpected error; cleanup skipped") class _BoundResponseStream: @@ -134,9 +152,22 @@ class _BoundResponseStream: consumption happens later (the channel iterates). For host-bound request context (e.g. Foundry response-id binding) to survive that gap, we hold the stack open until the underlying stream is exhausted - or :meth:`close` is called. We forward awaitable + async-iterator + + or :meth:`aclose` is called. 
We forward awaitable + async-iterator + ``get_final_response`` semantics so the channel sees a normal ``ResponseStream``-shaped object. + + Lifecycle: + + * Async iteration (``async for u in stream``) — the stack is closed + in the iterator's ``finally`` after the inner stream is drained. + * ``await stream`` — convenience for ``await get_final_response()``; + the stack is closed when ``get_final_response`` runs because that + path also routes through :meth:`_close`. + * ``await stream.get_final_response()`` — closes the stack in + ``finally``. + * Manual cleanup — call :meth:`aclose` (idempotent). Safe to call + from a ``finally`` even after iteration / ``get_final_response`` + already closed the stack. """ def __init__(self, inner: Any, stack: ExitStack) -> None: @@ -150,11 +181,23 @@ def _close(self) -> None: self._closed = True self._stack.close() + async def aclose(self) -> None: + """Idempotently release the bound request context. + + Channels that abandon the stream without iterating it (e.g. + early-return on a validation failure) MUST call this in a + ``finally`` so the host-bound contextvars don't leak for the + lifetime of the host. Calling after the stack already closed + (via iteration / ``get_final_response``) is a no-op. + """ + self._close() + def __await__(self) -> Any: - # ``__await__`` returns a generator; closing here would be too - # eager — we close in ``__aiter__`` finally instead. Awaitable - # consumers (rare for streams) call ``aclose()`` separately. - return self._inner.__await__() + # Convenience: ``await stream`` ≡ ``await stream.get_final_response()``. + # We route through ``get_final_response`` so the stack closes in + # its ``finally`` block, instead of leaking the binding for the + # host's lifetime as the previous direct-await delegation did. 
+ return self.get_final_response().__await__() def __aiter__(self) -> AsyncIterator[Any]: return self._wrap() @@ -179,7 +222,7 @@ def __getattr__(self, name: str) -> Any: class ChannelContext: """Host-owned bridge that channels call to invoke the target.""" - def __init__(self, host: "AgentFrameworkHost") -> None: + def __init__(self, host: AgentFrameworkHost) -> None: """Bind the context to its owning :class:`AgentFrameworkHost`. The host instance is the source of truth for the target, registered @@ -483,13 +526,56 @@ async def _readiness(_request: Request) -> PlainTextResponse: # noqa: RUF029 @asynccontextmanager async def lifespan(_app: Starlette) -> AsyncIterator[None]: + # Run every startup callback; collect (don't propagate) so + # one bad channel doesn't leave its peers half-initialised + # AND deny us a chance to pair-up shutdown calls. After all + # callbacks have been attempted, raise the FIRST error so + # Starlette / the ASGI server still aborts boot — and log + # every other failure so operators can see them all in one + # log scrape rather than discovering them turn-by-turn. + startup_errors: list[tuple[str, BaseException]] = [] for cb in on_startup: - await cb() + try: + await cb() + except Exception as exc: + name = getattr(cb, "__qualname__", repr(cb)) + logger.exception("lifespan startup: callback %s failed", name) + startup_errors.append((name, exc)) + if startup_errors: + _, first_exc = startup_errors[0] + if len(startup_errors) > 1: + logger.error( + "lifespan startup: %d callback(s) failed; first error re-raised, " + "remaining failures already logged above (%s)", + len(startup_errors), + ", ".join(n for n, _ in startup_errors[1:]), + ) + raise first_exc try: yield finally: + # Same shape on the shutdown side: walk every callback + # so a bad one can't leave its peers leaking + # tasks/sockets/sessions, then raise the first if any + # failed so the server's exit code reflects the failure. 
+ shutdown_errors: list[tuple[str, BaseException]] = [] for cb in on_shutdown: - await cb() + try: + await cb() + except Exception as exc: + name = getattr(cb, "__qualname__", repr(cb)) + logger.exception("lifespan shutdown: callback %s failed", name) + shutdown_errors.append((name, exc)) + if shutdown_errors: + _, first_exc = shutdown_errors[0] + if len(shutdown_errors) > 1: + logger.error( + "lifespan shutdown: %d callback(s) failed; first error re-raised, " + "remaining failures already logged above (%s)", + len(shutdown_errors), + ", ".join(n for n, _ in shutdown_errors[1:]), + ) + raise first_exc return Starlette( debug=self._debug, @@ -511,12 +597,23 @@ def _build_run_kwargs(self, request: ChannelRequest) -> dict[str, Any]: session_id = self._session_aliases.get(isolation_key, isolation_key) session = self._sessions.get(isolation_key) if session is None: + # Concurrency note: ``create_session`` is sync today, + # so the get/set window has no await point and CPython + # serialises us against other tasks. ``setdefault`` is + # the atomic primitive that keeps us safe even if a + # future ``create_session`` ever yields — both racers + # would see ``session is None``, both construct a new + # session, but only the first ``setdefault`` wins; the + # loser's just-built session is discarded (one + # transient orphan max per race window) instead of + # silently overwriting a peer-bound session that + # other in-flight requests are already using. # ``create_session`` lives on agent-typed targets but not on # ``Workflow``; the ``hasattr`` above guards the call site. 
- session = self.target.create_session( # pyright: ignore[reportAttributeAccessIssue, reportUnknownVariableType, reportUnknownMemberType] + new_session = self.target.create_session( # pyright: ignore[reportAttributeAccessIssue, reportUnknownVariableType, reportUnknownMemberType] session_id=session_id ) - self._sessions[isolation_key] = session # pyright: ignore[reportUnknownArgumentType] + session = self._sessions.setdefault(isolation_key, new_session) # pyright: ignore[reportUnknownArgumentType] run_kwargs: dict[str, Any] = {} if session is not None: @@ -899,6 +996,12 @@ async def _deliver_response(self, request: ChannelRequest, payload: HostedRunRes by_name = {ch.name: ch for ch in self.channels} pushed: list[str] = [] skipped: list[str] = [] + # ``(target_token, error_summary)`` for each destination whose + # ``ChannelPush.push`` raised. Distinct from ``skipped`` so the + # caller can tell an outage (every destination push raised) from + # the documented "no link recorded" drop (no identity yet + # mapped to that channel for this isolation_key). + failed: list[tuple[str, str]] = [] for channel_name, dest_identity in destinations: channel = by_name.get(channel_name) token = f"{channel_name}:{dest_identity.native_id}" if dest_identity is not None else channel_name @@ -924,22 +1027,35 @@ async def _deliver_response(self, request: ChannelRequest, payload: HostedRunRes continue try: await channel.push(dest_identity, payload) - except Exception: + except Exception as exc: logger.exception("deliver_response: push failed for target=%s", token) - skipped.append(token) + failed.append((token, f"{type(exc).__name__}: {exc}")) continue pushed.append(token) logger.info("deliver_response: pushed to %s (%d chars)", token, len(payload.text)) if not pushed and not include_originating: - # Spec policy: if every destination drops, deliver to originating. 
- logger.warning("deliver_response: every destination dropped — falling back to originating") - include_originating = True + # Spec policy: if every destination drops *without ever + # raising*, deliver to originating so the user gets a + # response. When the drop reason is a push outage (every + # ``failed`` entry), we don't fall back — the originating + # channel can inspect ``DeliveryReport.failed`` and decide + # whether to surface a degraded reply itself rather than + # double-delivering on a flaky link. + if failed: + logger.warning( + "deliver_response: every destination push raised — surfacing failures via " + "DeliveryReport.failed (no originating fallback)" + ) + else: + logger.warning("deliver_response: every destination dropped — falling back to originating") + include_originating = True return DeliveryReport( include_originating=include_originating, pushed=tuple(pushed), skipped=tuple(skipped), + failed=tuple(failed), ) diff --git a/python/packages/hosting/agent_framework_hosting/_types.py b/python/packages/hosting/agent_framework_hosting/_types.py index 7d200a3266..04fde4e59b 100644 --- a/python/packages/hosting/agent_framework_hosting/_types.py +++ b/python/packages/hosting/agent_framework_hosting/_types.py @@ -129,12 +129,12 @@ def __init__( # -- builders ---------------------------------------------------------- # @classmethod - def channel(cls, name: str) -> "ResponseTarget": + def channel(cls, name: str) -> ResponseTarget: """Target a single named destination channel.""" return cls(kind=ResponseTargetKind.CHANNELS, targets=(name,)) @classmethod - def channels(cls, names: Sequence[str]) -> "ResponseTarget": + def channels(cls, names: Sequence[str]) -> ResponseTarget: """Target an explicit list of destination channels.""" return cls(kind=ResponseTargetKind.CHANNELS, targets=tuple(names)) @@ -194,7 +194,7 @@ def __init__( self, name: str, description: str, - handle: Callable[["ChannelCommandContext"], Awaitable[None]], + handle: 
Callable[[ChannelCommandContext], Awaitable[None]], ) -> None: self.name = name self.description = description @@ -249,6 +249,15 @@ class DeliveryReport: ``originating`` target, or when ``"originating"`` is one of the listed destinations) or to return only an acknowledgement (``False`` — when the target lists only out-of-band destinations). + + ``skipped`` and ``failed`` are intentionally distinct so callers can + tell a structural drop (no link recorded for the destination + channel — ``skipped``) from a transport / runtime failure + (``ChannelPush.push`` raised — ``failed``). A non-empty ``failed`` + indicates an outage / outage-like condition (Telegram, Teams, + expired credentials, rate limits) and is the right signal for a + caller that wants to surface a degraded reply to the originating + user instead of treating the request as fully delivered. """ def __init__( @@ -256,10 +265,18 @@ def __init__( include_originating: bool, pushed: tuple[str, ...] = (), skipped: tuple[str, ...] = (), + failed: tuple[tuple[str, str], ...] = (), ) -> None: self.include_originating = include_originating self.pushed = pushed # destination tokens delivered to (e.g. "telegram:123") - self.skipped = skipped # destinations resolved but skipped (no push, failed, …) + self.skipped = ( + skipped # destinations dropped without a push attempt (no identity / no ChannelPush / unknown channel) + ) + # destinations whose ``ChannelPush.push`` raised — each entry is + # ``(target_token, error_summary)`` so callers can distinguish + # the "all destinations down" outage case from the documented + # "no link recorded" drop case (which lands in ``skipped``). + self.failed = failed # A transform hook runs over each AgentResponseUpdate as the channel consumes @@ -335,7 +352,7 @@ class Channel(Protocol): name: str path: str # default mount path (e.g. "/responses"); use "" to mount routes at the app root - def contribute(self, context: "ChannelContext") -> ChannelContribution: ... 
+ def contribute(self, context: ChannelContext) -> ChannelContribution: ... @runtime_checkable diff --git a/python/packages/hosting/tests/test_host.py b/python/packages/hosting/tests/test_host.py index bb6d7d5963..91fe7b4fac 100644 --- a/python/packages/hosting/tests/test_host.py +++ b/python/packages/hosting/tests/test_host.py @@ -9,7 +9,7 @@ from typing import Any import pytest -from agent_framework import AgentResponseUpdate +from agent_framework import AgentResponse, AgentResponseUpdate, Content, Message, ResponseStream from starlette.requests import Request from starlette.responses import JSONResponse from starlette.routing import BaseRoute, Route @@ -698,7 +698,16 @@ async def test_all_linked_no_other_channels_falls_back(self) -> None: assert report.pushed == () @pytest.mark.asyncio - async def test_push_exception_marks_skipped(self) -> None: + async def test_push_exception_lands_in_failed_no_fallback(self) -> None: + """Push-raised destinations land in ``DeliveryReport.failed`` (with + an ``error_summary``) and do NOT trigger the originating-fallback. + + Distinct from a "no link recorded" drop — that lands in + ``skipped`` (and DOES trigger the fallback). The originating + channel is meant to inspect ``failed`` and decide whether to + surface a degraded reply itself rather than double-delivering + on a flaky link. + """ host, _a, b, ctx = _make_host_with_two_channels() b._push_raises = RuntimeError("boom") # type: ignore[attr-defined] host._identities.setdefault("alice", {})["telegram"] = ChannelIdentity(channel="telegram", native_id="42") @@ -710,5 +719,563 @@ async def test_push_exception_marks_skipped(self) -> None: response_target=ResponseTarget.channel("telegram"), ) report = await ctx.deliver_response(req, HostedRunResult(text="reply")) - assert report.skipped == ("telegram:42",) - assert report.include_originating is True # fallback + # Push raised → ``failed``, NOT ``skipped``. 
+ assert report.skipped == () + assert len(report.failed) == 1 + token, summary = report.failed[0] + assert token == "telegram:42" + assert "RuntimeError" in summary + assert "boom" in summary + # No fallback: caller decides whether to surface a degraded reply. + assert report.include_originating is False + + +# --------------------------------------------------------------------------- # +# Bind request context — duck-typed hook on context providers # +# --------------------------------------------------------------------------- # + + +from contextlib import contextmanager # noqa: E402 + + +class _RecordingContextProvider: + """Stand-in for a ``HistoryProvider`` that exposes the duck-typed + ``bind_request_context(response_id=..., previous_response_id=..., **_)`` + seam the host calls. Records (event, payload) pairs so tests can + assert call ordering relative to the agent run + stream lifecycle. + """ + + def __init__(self, *, name: str = "rec") -> None: + self.name = name + # (event, payload) tuples — events: "enter", "exit", "agent_start", + # "agent_end", "stream_yield", "stream_done". + self.events: list[tuple[str, Any]] = [] + + @contextmanager + def bind_request_context(self, **kwargs: Any) -> Any: + # Snapshot the call kwargs on enter (so tests can assert + # response_id / previous_response_id forwarding) and the same + # snapshot on exit so we can verify the SAME payload bracketed + # the agent run. + snapshot = dict(kwargs) + self.events.append(("enter", snapshot)) + try: + yield + finally: + self.events.append(("exit", snapshot)) + + +class _ProvidersAgent: + """Agent stand-in that exposes ``context_providers`` so the host's + ``_flat_context_providers`` finds the recording provider. + + Mirrors the real :class:`agent_framework.Agent.run` shape: a sync + ``def`` that returns either an ``Awaitable[AgentResponse]`` (for + ``stream=False``) or a :class:`ResponseStream` synchronously (for + ``stream=True``). 
The host's ``_invoke_stream`` relies on the sync + return so it can wrap the stream in ``_BoundResponseStream`` and + hand it to channels for later iteration. + """ + + def __init__(self, providers: Sequence[Any], *, reply: str = "ok") -> None: + self.context_providers = list(providers) + self._reply = reply + self.calls: list[dict[str, Any]] = [] + + def create_session(self, *, session_id: str | None = None) -> _FakeAgentSession: + return _FakeAgentSession(session_id=session_id) + + def run( + self, + messages: Any = None, + *, + stream: bool = False, + session: Any = None, + **kwargs: Any, + ) -> Any: + self.calls.append({"messages": messages, "stream": stream, "session": session, "kwargs": kwargs}) + + if stream: + providers = self.context_providers + updates = [ + AgentResponseUpdate(contents=[Content.from_text("chunk-1")], role="assistant"), + AgentResponseUpdate(contents=[Content.from_text("chunk-2")], role="assistant"), + ] + + async def _gen() -> AsyncIterator[AgentResponseUpdate]: + # ``agent_start`` is only recorded once iteration begins; + # if the channel abandons the stream without iterating + # we expect to see neither ``agent_start`` nor any + # ``stream_yield`` events. 
+ for prov in providers: + if isinstance(prov, _RecordingContextProvider): + prov.events.append(("agent_start", None)) + for u in updates: + for prov in providers: + if isinstance(prov, _RecordingContextProvider): + prov.events.append(("stream_yield", u.text)) + yield u + + async def _finalize(items: Sequence[AgentResponseUpdate]) -> AgentResponse: # noqa: RUF029 + for prov in providers: + if isinstance(prov, _RecordingContextProvider): + prov.events.append(("stream_done", len(items))) + return AgentResponse.from_updates(items) + + return ResponseStream[AgentResponseUpdate, AgentResponse](_gen(), finalizer=_finalize) + + async def _coro() -> _FakeAgentResponse: + for prov in self.context_providers: + if isinstance(prov, _RecordingContextProvider): + prov.events.append(("agent_start", None)) + prov.events.append(("agent_end", None)) + return _FakeAgentResponse(text=self._reply) + + return _coro() + + +class _ProviderWrapper: + """Wrap children in a ``providers`` attribute (mirrors the + ``ContextProviderBase`` aggregation shape).""" + + def __init__(self, providers: Sequence[Any]) -> None: + self.providers = list(providers) + + +class TestBindRequestContext: + """The host walks ``target.context_providers``, descends one level + when a provider exposes a ``providers`` attribute, and calls + ``bind_request_context(response_id=..., previous_response_id=...)`` + on every provider that supports it. 
Foundry response-id chaining + plugs into this exact seam — a regression that mistypes the kwarg + name, drops the descent, or fails to keep the binding open across + the agent run silently breaks chained writes.""" + + @pytest.mark.asyncio + async def test_bind_called_with_request_attributes(self) -> None: + prov = _RecordingContextProvider() + agent = _ProvidersAgent([prov]) + ch = _RecordingChannel(name="responses") + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel="responses", + operation="op", + input="hi", + session=ChannelSession(isolation_key="alice"), + attributes={"response_id": "resp_abc", "previous_response_id": "resp_prev"}, + ) + result = await ch.context.run(req) + assert result.text == "ok" + + # Bind ↔ unbind brackets the agent run. + events = [name for name, _ in prov.events] + assert events == ["enter", "agent_start", "agent_end", "exit"] + + # Both response_id and previous_response_id forwarded by name. 
+ _, enter_payload = prov.events[0] + assert enter_payload["response_id"] == "resp_abc" + assert enter_payload["previous_response_id"] == "resp_prev" + + @pytest.mark.asyncio + async def test_bind_skipped_when_no_response_id_attribute(self) -> None: + """Without a ``response_id`` attribute on the request, the host + skips the binding entirely — the contract requires one to anchor + the chain.""" + prov = _RecordingContextProvider() + agent = _ProvidersAgent([prov]) + ch = _RecordingChannel(name="responses") + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest(channel="responses", operation="op", input="hi") + await ch.context.run(req) + assert prov.events == [("agent_start", None), ("agent_end", None)] + + @pytest.mark.asyncio + async def test_bind_descends_one_level_into_providers_attribute(self) -> None: + """``ContextProviderBase`` style aggregation wraps children under + a ``providers`` attribute; the host descends one level so the + Foundry history provider gets called even when the agent + configures it via the wrapper.""" + prov = _RecordingContextProvider(name="inner") + wrapper = _ProviderWrapper([prov]) + agent = _ProvidersAgent([wrapper]) + ch = _RecordingChannel(name="responses") + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel="responses", + operation="op", + input="hi", + attributes={"response_id": "resp_xyz"}, + ) + await ch.context.run(req) + assert ("enter", {"response_id": "resp_xyz", "previous_response_id": None}) in prov.events + + @pytest.mark.asyncio + async def test_bind_held_open_until_stream_exhaustion(self) -> None: + """Streaming runs return a ``ResponseStream`` synchronously but + consumption happens later. 
The binding must survive that gap and + only release after the iterator drains so the provider sees + every yielded chunk under the bound context.""" + prov = _RecordingContextProvider() + agent = _ProvidersAgent([prov]) + ch = _RecordingChannel(name="responses") + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel="responses", + operation="op", + input="hi", + stream=True, + attributes={"response_id": "resp_stream"}, + ) + stream = ch.context.run_stream(req) + + # As soon as run_stream returns, the binding must already be open + # so any provider work that happens during iteration sees it. + names_after_create = [name for name, _ in prov.events] + assert names_after_create.count("enter") == 1 + assert "exit" not in names_after_create + + chunks: list[str] = [] + async for u in stream: + chunks.append(u.text) + assert chunks == ["chunk-1", "chunk-2"] + + # After exhaustion the binding must be released — exactly once. + names_after_drain = [name for name, _ in prov.events] + assert names_after_drain.count("enter") == 1 + assert names_after_drain.count("exit") == 1 + # Brackets surround every stream_yield. + enter_idx = names_after_drain.index("enter") + exit_idx = names_after_drain.index("exit") + yield_idxs = [i for i, name in enumerate(names_after_drain) if name == "stream_yield"] + assert all(enter_idx < i < exit_idx for i in yield_idxs) + + +# --------------------------------------------------------------------------- # +# Agent-target streaming — `_BoundResponseStream` adapter behaviour # +# --------------------------------------------------------------------------- # + + +class TestBoundResponseStream: + """The ``_BoundResponseStream`` adapter holds the bind-context + ``ExitStack`` open across iteration. 
Cover the iterator-finally + close, ``get_final_response`` close, double-close idempotence, + ``aclose()``, ``__getattr__`` forwarding, and the awaitable path + (which now routes through ``get_final_response`` so it doesn't + leak the binding).""" + + @pytest.mark.asyncio + async def test_get_final_response_closes_binding(self) -> None: + prov = _RecordingContextProvider() + agent = _ProvidersAgent([prov]) + ch = _RecordingChannel(name="responses") + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel="responses", + operation="op", + input="hi", + stream=True, + attributes={"response_id": "resp_get_final"}, + ) + stream = ch.context.run_stream(req) + # Skip iteration and go straight to ``get_final_response``; + # the adapter must drain the inner stream itself and close + # the binding in ``finally``. + final = await stream.get_final_response() + assert final.text == "chunk-1chunk-2" + names = [n for n, _ in prov.events] + assert names.count("enter") == 1 + assert names.count("exit") == 1 + + @pytest.mark.asyncio + async def test_double_close_is_idempotent(self) -> None: + prov = _RecordingContextProvider() + agent = _ProvidersAgent([prov]) + ch = _RecordingChannel(name="responses") + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel="responses", + operation="op", + input="hi", + stream=True, + attributes={"response_id": "resp_idem"}, + ) + stream = ch.context.run_stream(req) + async for _u in stream: + pass + # Iteration's finally already closed; an explicit ``aclose`` + # afterwards must be a no-op (no second exit event). 
+ await stream.aclose() # type: ignore[attr-defined] + await stream.aclose() # type: ignore[attr-defined] + names = [n for n, _ in prov.events] + assert names.count("exit") == 1 + + @pytest.mark.asyncio + async def test_aclose_releases_binding_when_stream_abandoned(self) -> None: + """A channel that abandons the stream without iterating must + be able to call ``aclose()`` so the host-bound contextvars + don't leak for the host's lifetime.""" + prov = _RecordingContextProvider() + agent = _ProvidersAgent([prov]) + ch = _RecordingChannel(name="responses") + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel="responses", + operation="op", + input="hi", + stream=True, + attributes={"response_id": "resp_abandon"}, + ) + stream = ch.context.run_stream(req) + await stream.aclose() # type: ignore[attr-defined] + + # Binding released without iterating. + names = [n for n, _ in prov.events] + assert names.count("enter") == 1 + assert names.count("exit") == 1 + # Agent never ran — we abandoned before iteration. + assert "agent_start" not in names + + @pytest.mark.asyncio + async def test_getattr_forwards_to_inner_stream(self) -> None: + """``_BoundResponseStream.__getattr__`` forwards unknown + attributes to the inner ``ResponseStream``; channels that + check, e.g., ``stream.add_result_hook(...)`` must keep working.""" + prov = _RecordingContextProvider() + agent = _ProvidersAgent([prov]) + ch = _RecordingChannel(name="responses") + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel="responses", + operation="op", + input="hi", + stream=True, + attributes={"response_id": "resp_getattr"}, + ) + stream = ch.context.run_stream(req) + # ``with_result_hook`` is a real method on ``ResponseStream``; + # if forwarding broke this would AttributeError. 
+ try: + assert callable(stream.with_result_hook) # type: ignore[attr-defined] + finally: + await stream.aclose() # type: ignore[attr-defined] + + @pytest.mark.asyncio + async def test_await_path_routes_through_get_final_response(self) -> None: + """``await stream`` is a convenience for ``await + get_final_response()``. The previous direct delegation leaked + the binding for the host's lifetime; the new routing closes the + stack in the same ``finally`` as ``get_final_response``.""" + prov = _RecordingContextProvider() + agent = _ProvidersAgent([prov]) + ch = _RecordingChannel(name="responses") + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + req = ChannelRequest( + channel="responses", + operation="op", + input="hi", + stream=True, + attributes={"response_id": "resp_await"}, + ) + stream = ch.context.run_stream(req) + final = await stream # exercises __await__ + assert final.text == "chunk-1chunk-2" + names = [n for n, _ in prov.events] + assert names.count("enter") == 1 + assert names.count("exit") == 1 + + +# --------------------------------------------------------------------------- # +# `_wrap_input` — list[Message] LAST-message metadata stamping # +# --------------------------------------------------------------------------- # + + +class TestWrapInputListMessages: + """The ``hosting`` block lands on the LAST message of a list — the + contract is load-bearing: the user turn (typically last) must + carry the channel provenance + identity for history correlation; + a regression stamping ``messages[0]`` instead silently breaks + every multi-message payload.""" + + @pytest.mark.asyncio + async def test_metadata_lands_on_last_message_only(self) -> None: + agent = _FakeAgent() + ch = _RecordingChannel(name="responses") + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + # Responses-API style: a system instruction followed by a user + # turn. 
Only the user turn (LAST) gets stamped. + system = Message(role="system", contents=[Content.from_text("be concise")]) + user = Message(role="user", contents=[Content.from_text("hi")]) + req = ChannelRequest( + channel="responses", + operation="op", + input=[system, user], + identity=ChannelIdentity(channel="responses", native_id="user:1"), + ) + await ch.context.run(req) + + forwarded = agent.calls[0]["messages"] + assert isinstance(forwarded, list) + assert len(forwarded) == 2 + # System stays clean. + assert (system.additional_properties or {}).get("hosting") is None + # User turn carries the metadata. + hosting = forwarded[-1].additional_properties["hosting"] + assert hosting["channel"] == "responses" + assert hosting["identity"]["native_id"] == "user:1" + + @pytest.mark.asyncio + async def test_single_message_payload_still_works(self) -> None: + """Regression guard: the single-``Message`` branch must be + unchanged by the LAST-of-list logic above.""" + agent = _FakeAgent() + ch = _RecordingChannel(name="responses") + host = AgentFrameworkHost(target=agent, channels=[ch]) + _ = host.app + assert ch.context is not None + + only = Message(role="user", contents=[Content.from_text("hi")]) + req = ChannelRequest(channel="responses", operation="op", input=only) + await ch.context.run(req) + forwarded = agent.calls[0]["messages"] + assert isinstance(forwarded, Message) + assert forwarded.additional_properties["hosting"]["channel"] == "responses" + + +# --------------------------------------------------------------------------- # +# Lifespan callback aggregation # +# --------------------------------------------------------------------------- # + + +class _RaisingLifecycleChannel: + """Channel whose startup OR shutdown callback raises a controlled error.""" + + def __init__(self, name: str, *, fail_on: str) -> None: + self.name = name + self.path = "" + self._fail_on = fail_on # "startup" | "shutdown" + self.start_calls: list[str] = [] + self.stop_calls: list[str] = [] + 
+ def contribute(self, _context: ChannelContext) -> ChannelContribution: + async def _start() -> None: + self.start_calls.append("up") + if self._fail_on == "startup": + raise RuntimeError(f"startup-boom-{self.name}") + + async def _stop() -> None: + self.stop_calls.append("down") + if self._fail_on == "shutdown": + raise RuntimeError(f"shutdown-boom-{self.name}") + + return ChannelContribution(on_startup=[_start], on_shutdown=[_stop]) + + +class _OkLifecycleChannel: + def __init__(self, name: str) -> None: + self.name = name + self.path = "" + self.start_calls: list[str] = [] + self.stop_calls: list[str] = [] + + def contribute(self, _context: ChannelContext) -> ChannelContribution: + async def _start() -> None: + self.start_calls.append("up") + + async def _stop() -> None: + self.stop_calls.append("down") + + return ChannelContribution(on_startup=[_start], on_shutdown=[_stop]) + + +class TestLifespanAggregation: + """One bad startup / shutdown callback must NOT abort the rest — + every channel gets a chance to wire / unwire so half-initialised + state doesn't leak. The first error is still raised so the + process exits with a failure; remaining errors are logged so + operators see them all in one log scrape.""" + + def test_shutdown_failure_does_not_skip_peer_shutdowns(self, caplog: Any) -> None: + import logging as _logging + + agent = _FakeAgent() + bad = _RaisingLifecycleChannel("bad", fail_on="shutdown") + ok1 = _OkLifecycleChannel("ok1") + ok2 = _OkLifecycleChannel("ok2") + # Order: bad first so that without aggregation, ok1+ok2 would + # never get to run their shutdown callbacks. + host = AgentFrameworkHost(target=agent, channels=[bad, ok1, ok2]) + + with caplog.at_level(_logging.ERROR, logger="agent_framework.hosting"): # noqa: SIM117 + with pytest.raises(RuntimeError, match="shutdown-boom-bad"), TestClient(host.app): + pass + + # Every channel had its shutdown attempted, even though `bad` raised. 
+ assert bad.stop_calls == ["down"] + assert ok1.stop_calls == ["down"] + assert ok2.stop_calls == ["down"] + + def test_startup_failure_aggregates_logs_and_raises_first(self, caplog: Any) -> None: + import logging as _logging + + agent = _FakeAgent() + ok1 = _OkLifecycleChannel("ok1") + bad = _RaisingLifecycleChannel("bad", fail_on="startup") + ok2 = _OkLifecycleChannel("ok2") + another_bad = _RaisingLifecycleChannel("bad2", fail_on="startup") + host = AgentFrameworkHost( + target=agent, + channels=[ok1, bad, ok2, another_bad], + ) + + with caplog.at_level(_logging.ERROR, logger="agent_framework.hosting"): # noqa: SIM117 + # The first failing callback's error is the one that + # propagates; remaining failures are logged. + with pytest.raises(RuntimeError, match="startup-boom-bad"), TestClient(host.app): + pass + + # Every startup callback ran (even ok2 / another_bad after the + # first failure) so we get a complete picture in the logs. + assert ok1.start_calls == ["up"] + assert bad.start_calls == ["up"] + assert ok2.start_calls == ["up"] + assert another_bad.start_calls == ["up"] + + # Both failures show up in operator logs. ``logger.exception`` puts + # the exception payload in ``record.exc_text``; the formatted summary + # of the second failure goes into ``record.message`` via the + # aggregate "N callback(s) failed" line. + log_messages = [rec.getMessage() for rec in caplog.records] + log_exc_texts = [rec.exc_text or "" for rec in caplog.records] + log_text = "\n".join(log_messages + log_exc_texts) + assert "startup-boom-bad" in log_text + assert "startup-boom-bad2" in log_text or "callback(s) failed" in log_text diff --git a/python/packages/hosting/tests/test_isolation.py b/python/packages/hosting/tests/test_isolation.py new file mode 100644 index 0000000000..2af73e7d53 --- /dev/null +++ b/python/packages/hosting/tests/test_isolation.py @@ -0,0 +1,284 @@ +# Copyright (c) Microsoft. All rights reserved. 
+ +"""Tests for the per-request isolation contextvar surface in +:mod:`agent_framework_hosting._isolation`. + +The isolation keys are the ONLY seam Foundry-aware providers use to +find partition keys, and the host's ASGI middleware lifts them off the +two well-known headers on every inbound HTTP request. A regression +that drops the lookup, mistypes a header name, or fails to reset the +contextvar would silently misroute writes / leak per-request state +across requests, with zero unit-test signal — so cover the surface +fully here. +""" + +from __future__ import annotations + +import asyncio + +import pytest +from starlette.requests import Request +from starlette.responses import JSONResponse +from starlette.routing import BaseRoute, Route +from starlette.testclient import TestClient + +from agent_framework_hosting import ( + Channel, + ChannelContext, + ChannelContribution, + IsolationKeys, + get_current_isolation_keys, + reset_current_isolation_keys, + set_current_isolation_keys, +) +from agent_framework_hosting._isolation import ( # pyright: ignore[reportPrivateUsage] + ISOLATION_HEADER_CHAT, + ISOLATION_HEADER_USER, + current_isolation_keys, +) + + +class TestIsolationKeys: + def test_defaults_to_none_pair(self) -> None: + keys = IsolationKeys() + assert keys.user_key is None + assert keys.chat_key is None + assert keys.is_empty is True + + def test_partial_with_only_user_is_not_empty(self) -> None: + keys = IsolationKeys(user_key="alice") + assert keys.user_key == "alice" + assert keys.chat_key is None + assert keys.is_empty is False + + def test_partial_with_only_chat_is_not_empty(self) -> None: + keys = IsolationKeys(chat_key="general") + assert keys.is_empty is False + + def test_full_pair_is_not_empty(self) -> None: + keys = IsolationKeys(user_key="alice", chat_key="general") + assert keys.is_empty is False + + +class TestContextVarHelpers: + def test_default_is_none(self) -> None: + # Each test gets a fresh contextvar value because pytest runs + # tests 
in fresh contexts. ``get`` returns the default. + assert get_current_isolation_keys() is None + + def test_set_and_get_round_trip(self) -> None: + token = set_current_isolation_keys(IsolationKeys(user_key="alice", chat_key="general")) + try: + current = get_current_isolation_keys() + assert current is not None + assert current.user_key == "alice" + assert current.chat_key == "general" + finally: + reset_current_isolation_keys(token) + # Reset restores prior value (None in the default context). + assert get_current_isolation_keys() is None + + def test_set_with_none_clears(self) -> None: + outer = set_current_isolation_keys(IsolationKeys(user_key="alice")) + try: + inner = set_current_isolation_keys(None) + try: + assert get_current_isolation_keys() is None + finally: + reset_current_isolation_keys(inner) + # Reset surfaces the outer value again. + current = get_current_isolation_keys() + assert current is not None + assert current.user_key == "alice" + finally: + reset_current_isolation_keys(outer) + + def test_module_level_contextvar_is_the_same_instance(self) -> None: + """Direct contextvar access (used by the ASGI middleware) and the + public `get_current_isolation_keys()` helper read from the SAME + underlying contextvar. A regression that introduced a second + contextvar would silently break the middleware → provider hop.""" + token = current_isolation_keys.set(IsolationKeys(user_key="bob")) + try: + via_helper = get_current_isolation_keys() + assert via_helper is not None + assert via_helper.user_key == "bob" + finally: + current_isolation_keys.reset(token) + + +class TestHeaderConstants: + """The two header names are part of the public contract — they + match the ones the Foundry Hosted Agents runtime stamps on every + inbound request. 
A typo here would silently misroute partition + writes.""" + + def test_user_header_value(self) -> None: + assert ISOLATION_HEADER_USER == "x-agent-user-isolation-key" + + def test_chat_header_value(self) -> None: + assert ISOLATION_HEADER_CHAT == "x-agent-chat-isolation-key" + + +# --------------------------------------------------------------------------- # +# End-to-end: ASGI middleware lifts the headers into the contextvar. +# --------------------------------------------------------------------------- # + + +class _IsolationProbeChannel: + """A minimal Channel that exposes a single GET route which captures + the contextvar value INSIDE the request and returns it as JSON. + + Tests use this to exercise the full middleware → contextvar → + handler hop end-to-end. + """ + + name = "probe" + path = "" + + def __init__(self) -> None: + self.captured: list[IsolationKeys | None] = [] + + async def _handler(_request: Request) -> JSONResponse: + keys = get_current_isolation_keys() + self.captured.append(keys) + payload = ( + {"user": keys.user_key, "chat": keys.chat_key} + if keys is not None + else {"user": None, "chat": None, "_present": False} + ) + return JSONResponse(payload) + + self._routes: list[BaseRoute] = [Route("/probe", _handler)] + + def contribute(self, _context: ChannelContext) -> ChannelContribution: + return ChannelContribution(routes=self._routes) + + +def _make_host_with_probe() -> tuple[object, _IsolationProbeChannel]: + from agent_framework_hosting import AgentFrameworkHost + + class _NoopAgent: + async def run(self, *_args: object, **_kwargs: object) -> object: # pragma: no cover - never called + raise RuntimeError("not invoked") + + probe = _IsolationProbeChannel() + assert isinstance(probe, Channel) + host = AgentFrameworkHost(target=_NoopAgent(), channels=[probe]) # type: ignore[arg-type] + return host, probe + + +class TestIsolationMiddlewareEndToEnd: + def test_both_headers_lifted_into_contextvar(self) -> None: + host, probe = 
_make_host_with_probe() + with TestClient(host.app) as client: # type: ignore[attr-defined] + r = client.get( + "/probe", + headers={ + ISOLATION_HEADER_USER: "alice-uid", + ISOLATION_HEADER_CHAT: "general-cid", + }, + ) + assert r.status_code == 200 + assert r.json() == {"user": "alice-uid", "chat": "general-cid"} + assert len(probe.captured) == 1 + captured = probe.captured[0] + assert captured is not None + assert captured.user_key == "alice-uid" + assert captured.chat_key == "general-cid" + + def test_only_user_header_lifted(self) -> None: + """One-header-only branch: the middleware still binds (chat=None).""" + host, probe = _make_host_with_probe() + with TestClient(host.app) as client: # type: ignore[attr-defined] + r = client.get("/probe", headers={ISOLATION_HEADER_USER: "alice-uid"}) + assert r.status_code == 200 + assert r.json() == {"user": "alice-uid", "chat": None} + + def test_only_chat_header_lifted(self) -> None: + host, probe = _make_host_with_probe() + with TestClient(host.app) as client: # type: ignore[attr-defined] + r = client.get("/probe", headers={ISOLATION_HEADER_CHAT: "general-cid"}) + assert r.status_code == 200 + assert r.json() == {"user": None, "chat": "general-cid"} + + def test_no_headers_keeps_contextvar_none(self) -> None: + """Local-dev path: with neither header present the middleware is + a no-op and the contextvar stays at its default ``None`` — + providers see "no isolation" and route to the in-memory + fallback rather than picking up stale per-request state.""" + host, probe = _make_host_with_probe() + with TestClient(host.app) as client: # type: ignore[attr-defined] + r = client.get("/probe") + assert r.status_code == 200 + assert r.json() == {"user": None, "chat": None, "_present": False} + assert probe.captured == [None] + + def test_empty_header_value_treated_as_absent(self) -> None: + """A header that's present but empty must not bind an empty key — + ``IsolationContext`` rejects empty strings on the read side.""" + host, 
probe = _make_host_with_probe() + with TestClient(host.app) as client: # type: ignore[attr-defined] + r = client.get( + "/probe", + headers={ + ISOLATION_HEADER_USER: "", + ISOLATION_HEADER_CHAT: "general-cid", + }, + ) + assert r.status_code == 200 + # Empty user header decodes to None; chat key stays bound. + assert r.json() == {"user": None, "chat": "general-cid"} + + def test_contextvar_resets_after_request(self) -> None: + """The middleware must call ``reset_current_isolation_keys`` in + a ``finally`` so per-request state never leaks across requests + or back into the calling thread's context.""" + host, probe = _make_host_with_probe() + with TestClient(host.app) as client: # type: ignore[attr-defined] + r1 = client.get("/probe", headers={ISOLATION_HEADER_USER: "alice-uid"}) + assert r1.status_code == 200 + # Reading the contextvar OUTSIDE the request scope must see + # the default — not the value the prior request bound. + assert get_current_isolation_keys() is None + # And a follow-up request without headers gets a clean + # ``None`` rather than inheriting alice-uid. + r2 = client.get("/probe") + assert r2.json() == {"user": None, "chat": None, "_present": False} + + def test_concurrent_requests_get_isolated_contextvars(self) -> None: + """Different requests run in different async contexts; binding + from request A must NOT leak into a concurrent request B.""" + host, probe = _make_host_with_probe() + + async def _drive() -> None: + # Run two requests in parallel asyncio tasks against the + # same TestClient and assert their captures don't bleed + # into each other. 
+ async def _hit(user_key: str) -> dict[str, str | None]: + with TestClient(host.app) as client: # type: ignore[attr-defined] + r = client.get("/probe", headers={ISOLATION_HEADER_USER: user_key}) + return r.json() # type: ignore[no-any-return] + + r_alice, r_bob = await asyncio.gather(_hit("alice-uid"), _hit("bob-uid")) + assert r_alice == {"user": "alice-uid", "chat": None} + assert r_bob == {"user": "bob-uid", "chat": None} + + asyncio.run(_drive()) + + +class TestNonHttpScopesPassThrough: + """The middleware intentionally only inspects ``http`` scopes; + lifespan / websocket scopes are forwarded untouched. A regression + that touched lifespan scopes here would crash boot.""" + + @pytest.mark.asyncio + async def test_lifespan_scope_does_not_consult_headers(self) -> None: + # The TestClient context manager exercises the lifespan scope + # implicitly; if the middleware tried to decode headers on a + # non-http scope this would raise. Exercise it without binding + # any contextvar work. + host, _probe = _make_host_with_probe() + with TestClient(host.app): # type: ignore[attr-defined] + # Just enter / exit; no requests. 
+ pass diff --git a/python/packages/hosting/tests/test_types.py b/python/packages/hosting/tests/test_types.py index 76531dfe49..cecc986a29 100644 --- a/python/packages/hosting/tests/test_types.py +++ b/python/packages/hosting/tests/test_types.py @@ -4,12 +4,18 @@ from __future__ import annotations +from typing import Any + +import pytest + from agent_framework_hosting import ( ChannelIdentity, ChannelRequest, ChannelSession, + DeliveryReport, ResponseTarget, ResponseTargetKind, + apply_run_hook, ) @@ -103,3 +109,120 @@ def test_attributes_default_empty_mapping(self) -> None: def test_attributes_passthrough(self) -> None: ident = ChannelIdentity(channel="teams", native_id="abc", attributes={"role": "user"}) assert dict(ident.attributes) == {"role": "user"} + + +class _DummyTarget: + """Stand-in for the ``SupportsAgentRun | Workflow`` arg `apply_run_hook` forwards. + + `apply_run_hook` doesn't introspect the target — it just forwards + it as a kwarg to the user's hook — so a bare class is enough. + """ + + +class TestApplyRunHook: + """`apply_run_hook` is the channel-side helper that invokes a + `ChannelRunHook` with the standard kwargs (`request` positional, + `target` / `protocol_request` keyword). Channels call this rather + than calling the hook directly so the convention is enforced in + one place. Cover both branching paths (sync vs async hook return) + and assert kwargs forwarding so a regression that drops `target` + or `protocol_request` is caught.""" + + @pytest.mark.asyncio + async def test_sync_hook_returning_modified_request(self) -> None: + captured: dict[str, Any] = {} + + def hook(request: ChannelRequest, **kwargs: Any) -> ChannelRequest: + # Snapshot the kwargs for the assertion below, then return a + # NEW request so we also verify the helper passes the + # replacement straight through (no merging / mutation). 
+ captured["target"] = kwargs.get("target") + captured["protocol_request"] = kwargs.get("protocol_request") + return ChannelRequest(channel=request.channel, operation="HOOK_TOUCHED", input=request.input) + + original = ChannelRequest(channel="responses", operation="op", input="hi") + target = _DummyTarget() + proto = {"raw": "payload"} + + result = await apply_run_hook(hook, original, target=target, protocol_request=proto) + + assert result is not original + assert result.operation == "HOOK_TOUCHED" + assert captured["target"] is target + assert captured["protocol_request"] is proto + + @pytest.mark.asyncio + async def test_async_hook_returning_modified_request(self) -> None: + captured: dict[str, Any] = {} + + async def hook(request: ChannelRequest, **kwargs: Any) -> ChannelRequest: + captured["target"] = kwargs.get("target") + captured["protocol_request"] = kwargs.get("protocol_request") + # Return an awaitable result to exercise the async branch + # (`isinstance(result, Awaitable) → await it`). + return ChannelRequest(channel=request.channel, operation="ASYNC_HOOK", input=request.input) + + original = ChannelRequest(channel="telegram", operation="op", input="hi") + target = _DummyTarget() + proto = {"update_id": 42} + + result = await apply_run_hook(hook, original, target=target, protocol_request=proto) + + assert result.operation == "ASYNC_HOOK" + assert captured["target"] is target + assert captured["protocol_request"] is proto + + @pytest.mark.asyncio + async def test_protocol_request_can_be_none(self) -> None: + """Channels that don't have a raw protocol payload (e.g. 
CLI / test + harness invocations) pass ``protocol_request=None``; the helper + forwards it as-is so hooks can ``if protocol_request is None`` to + gate channel-specific logic.""" + captured: dict[str, Any] = {} + + async def hook(request: ChannelRequest, **kwargs: Any) -> ChannelRequest: + captured["protocol_request"] = kwargs.get("protocol_request") + captured["protocol_request_in_kwargs"] = "protocol_request" in kwargs + return request + + await apply_run_hook( + hook, + ChannelRequest(channel="x", operation="op", input="hi"), + target=_DummyTarget(), + protocol_request=None, + ) + + assert captured["protocol_request"] is None + assert captured["protocol_request_in_kwargs"] is True + + +class TestDeliveryReport: + """`DeliveryReport.failed` distinguishes "push raised" (an outage) + from "no link recorded" (`skipped`). Assert the field exists, + defaults empty, accepts the documented shape, and that the original + `pushed` / `skipped` semantics are preserved.""" + + def test_defaults_are_empty_tuples(self) -> None: + report = DeliveryReport(include_originating=True) + assert report.include_originating is True + assert report.pushed == () + assert report.skipped == () + assert report.failed == () + + def test_failed_carries_token_and_error_summary(self) -> None: + # Channels return a (token, summary) tuple per failed push so + # the originating channel can tell "telegram outage" from + # "no link" without parsing logs. 
+ report = DeliveryReport( + include_originating=False, + pushed=("teams:42",), + skipped=("telegram",), + failed=(("telegram:99", "RuntimeError: rate limited"),), + ) + assert report.pushed == ("teams:42",) + assert report.skipped == ("telegram",) + assert len(report.failed) == 1 + token, summary = report.failed[0] + assert token == "telegram:99" + assert "RuntimeError" in summary + assert "rate limited" in summary From 64b7c608c62f4f2847ddf0758c70c1bc23b6a631 Mon Sep 17 00:00:00 2001 From: eavanvalkenburg Date: Thu, 7 May 2026 16:09:21 +0200 Subject: [PATCH 3/6] fix(hosting): address PR-2 round-2 review comments MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - Refactor workflow checkpoint restoration into shared helpers (_restore_workflow_checkpoint for blocking; the streaming sibling drains the rehydration stream) so the blocking and streaming paths rehydrate identically — clarifies the previously inline _maybe_restore by hoisting the pattern next to the blocking call site. - Document that blocking workflow output is text-only by design; richer modalities ride the streaming AgentResponseUpdate channel, which preserves all content parts. Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com> --- .../hosting/agent_framework_hosting/_host.py | 87 +++++++++++++------ 1 file changed, 62 insertions(+), 25 deletions(-) diff --git a/python/packages/hosting/agent_framework_hosting/_host.py b/python/packages/hosting/agent_framework_hosting/_host.py index 14d044235e..7b54f4609a 100644 --- a/python/packages/hosting/agent_framework_hosting/_host.py +++ b/python/packages/hosting/agent_framework_hosting/_host.py @@ -784,19 +784,43 @@ async def _invoke_workflow(self, request: ChannelRequest) -> HostedRunResult: # the seam for any per-run customization; nothing flows through here. 
workflow: Workflow = self.target # type: ignore[assignment] storage = self._resolve_checkpoint_storage(request) - if storage is not None: - latest = await storage.get_latest(workflow_name=workflow.name) - if latest is not None: - # Restore in-memory state from the most recent checkpoint - # before applying the new input. - await workflow.run(checkpoint_id=latest.checkpoint_id, checkpoint_storage=storage) - result = await workflow.run(request.input, checkpoint_storage=storage) - else: - result = await workflow.run(request.input) + await self._restore_workflow_checkpoint(workflow, storage) + result = ( + await workflow.run(request.input, checkpoint_storage=storage) + if storage is not None + else await workflow.run(request.input) + ) + # NOTE: blocking workflow output is text-only today. Richer + # modalities (image, audio, structured tool results) ride the + # streaming path via ``AgentResponseUpdate`` and are forwarded by + # the channel as content parts; channels that need full-fidelity + # output for blocking calls should drive the workflow through + # ``stream=True`` and aggregate via ``get_final_response()``. outputs = result.get_outputs() text = "\n".join(_workflow_output_to_text(o) for o in outputs) if outputs else "" return HostedRunResult(text=text) + @staticmethod + async def _restore_workflow_checkpoint( + workflow: Workflow, + storage: CheckpointStorage | None, + ) -> None: + """Rehydrate ``workflow`` from its latest checkpoint, if any. + + Shared between the blocking and streaming workflow paths so the + restore step stays in lockstep across both — both must observe + the same in-memory state when they apply the new input. + """ + if storage is None: + return + latest = await storage.get_latest(workflow_name=workflow.name) + if latest is None: + return + # The blocking restore call is a no-op invocation that just + # rehydrates state; the streaming path drains the same + # restoration stream below to achieve the same effect. 
+ await workflow.run(checkpoint_id=latest.checkpoint_id, checkpoint_storage=storage) + def _invoke_workflow_stream(self, request: ChannelRequest) -> ResponseStream[AgentResponseUpdate, AgentResponse]: """Bridge ``Workflow.run(stream=True)`` to a channel-facing ``ResponseStream``. @@ -828,23 +852,12 @@ def _invoke_workflow_stream(self, request: ChannelRequest) -> ResponseStream[Age workflow: Workflow = self.target # type: ignore[assignment] storage = self._resolve_checkpoint_storage(request) - async def _maybe_restore() -> None: - if storage is None: - return - latest = await storage.get_latest(workflow_name=workflow.name) - if latest is None: - return - # Drain the restoration stream so the no-op invocation actually - # rehydrates state before the real run starts. - async for _ in workflow.run( - stream=True, - checkpoint_id=latest.checkpoint_id, - checkpoint_storage=storage, - ): - pass - async def _bridge() -> AsyncIterator[AgentResponseUpdate]: - await _maybe_restore() + # Same restore step the blocking path runs (see + # ``_restore_workflow_checkpoint``) — kept inside the bridge + # so the in-memory state is rehydrated lazily on first + # iteration rather than at stream-construction time. + await self._restore_workflow_checkpoint_streaming(workflow, storage) workflow_stream = workflow.run(request.input, stream=True, checkpoint_storage=storage) try: async for event in workflow_stream: @@ -860,6 +873,30 @@ async def _finalize(updates: Sequence[AgentResponseUpdate]) -> AgentResponse: # return ResponseStream[AgentResponseUpdate, AgentResponse](_bridge(), finalizer=_finalize) + @staticmethod + async def _restore_workflow_checkpoint_streaming( + workflow: Workflow, + storage: CheckpointStorage | None, + ) -> None: + """Streaming-path counterpart to :meth:`_restore_workflow_checkpoint`. + + ``Workflow.run(stream=True, checkpoint_id=...)`` returns a stream + whose updates we don't care about — we just need the side-effect + of rehydration. 
Drained inline so the new-input run that follows + observes the restored state. + """ + if storage is None: + return + latest = await storage.get_latest(workflow_name=workflow.name) + if latest is None: + return + async for _ in workflow.run( + stream=True, + checkpoint_id=latest.checkpoint_id, + checkpoint_storage=storage, + ): + pass + def _wrap_input(self, request: ChannelRequest) -> Message | list[Message]: """Promote ``request.input`` to ``Message``(s) carrying channel metadata. From dccc38426c3ab38ec1216939cae65c479b33d9c2 Mon Sep 17 00:00:00 2001 From: eavanvalkenburg Date: Thu, 7 May 2026 16:21:05 +0200 Subject: [PATCH 4/6] review: address PR-4 _host.py round 2 feedback MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit These review comments were filed on PR-4 (#5640) but target lines that live in the hosting-core package (PR-2 / #5638), so the fixes land here and PR-4's stack will pick them up on rebase. - _suppress_already_consumed: narrow the RuntimeError catch to the two documented benign messages (`Inner stream not available`, `Event loop is closed`); any other RuntimeError now logs at ERROR with a full traceback so executor bugs / runner-context state errors / checkpoint RuntimeErrors during the post-run flush no longer masquerade as benign cleanup noise. Still no propagation (we're in an async-generator finally during teardown) — see the docstring. - _restore_workflow_checkpoint{,_streaming}: log a WARNING when a non-None latest checkpoint drains to zero events, so a stale or partially-written checkpoint_id surfaces as an operator signal instead of a silent state-loss. (The `deliver_response` "no destinations resolvable" vs "every destination errored" concern raised in 3198268038 is already addressed by the existing `failed` vs `skipped` distinction surfaced through `DeliveryReport.failed` — see lines 1080-1102 and the `DeliveryReport` docstring.) 
Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com> --- .../hosting/agent_framework_hosting/_host.py | 55 +++++++++++++++---- 1 file changed, 44 insertions(+), 11 deletions(-) diff --git a/python/packages/hosting/agent_framework_hosting/_host.py b/python/packages/hosting/agent_framework_hosting/_host.py index 7b54f4609a..467e90e2a4 100644 --- a/python/packages/hosting/agent_framework_hosting/_host.py +++ b/python/packages/hosting/agent_framework_hosting/_host.py @@ -127,15 +127,21 @@ async def _suppress_already_consumed() -> AsyncIterator[None]: # noqa: RUF029 """ try: yield - except RuntimeError: - # Documented benign cases: ``ResponseStream`` raises - # ``RuntimeError("Inner stream not available")`` on certain - # double-finalize paths, and async-iteration teardown of a - # workflow whose tasks were already cancelled can surface - # ``RuntimeError("Event loop is closed")`` here. Promoted from - # ``debug`` to ``warning`` so production deploys see the - # signal and a real bug doesn't masquerade as benign noise. - logger.warning("workflow stream finalize raised RuntimeError; cleanup skipped", exc_info=True) + except RuntimeError as exc: + # Narrow match: only the two documented benign messages produced + # by ``ResponseStream`` / async-iteration teardown should be + # swallowed. Anything else (executor-side ``RuntimeError`` from a + # ``raise RuntimeError(...)`` in user code, runner-context state + # error, checkpoint-store ``RuntimeError`` during the post-run + # flush, …) is a real bug and is escalated to the unexpected-error + # branch so it's logged with a full stack trace at ERROR. We + # still don't propagate (we're in an async-generator ``finally`` + # during teardown) — see the docstring. 
+ message = str(exc) + if "Inner stream not available" in message or "Event loop is closed" in message: + logger.warning("workflow stream finalize raised RuntimeError; cleanup skipped", exc_info=True) + else: + logger.exception("workflow stream finalize raised an unexpected RuntimeError; cleanup skipped") except Exception: # Anything else (checkpoint write failure, context-provider # error in a cleanup hook, executor-side bug, …) is a real @@ -810,6 +816,12 @@ async def _restore_workflow_checkpoint( Shared between the blocking and streaming workflow paths so the restore step stays in lockstep across both — both must observe the same in-memory state when they apply the new input. + + If ``storage.get_latest`` returns ``None`` (no prior checkpoint + recorded) the call is a benign no-op. A non-``None`` checkpoint + whose stored events are empty (stale or partially-written + ``checkpoint_id``) is logged at WARNING so operators can detect + the silent-state-loss case without sifting through INFO logs. """ if storage is None: return @@ -819,7 +831,15 @@ async def _restore_workflow_checkpoint( # The blocking restore call is a no-op invocation that just # rehydrates state; the streaming path drains the same # restoration stream below to achieve the same effect. - await workflow.run(checkpoint_id=latest.checkpoint_id, checkpoint_storage=storage) + result = await workflow.run(checkpoint_id=latest.checkpoint_id, checkpoint_storage=storage) + events = getattr(result, "events", None) + if events is not None and not events: + logger.warning( + "workflow checkpoint restore produced zero events " + "(workflow=%s checkpoint_id=%s) — state may not be rehydrated", + workflow.name, + latest.checkpoint_id, + ) def _invoke_workflow_stream(self, request: ChannelRequest) -> ResponseStream[AgentResponseUpdate, AgentResponse]: """Bridge ``Workflow.run(stream=True)`` to a channel-facing ``ResponseStream``. 
@@ -884,18 +904,31 @@ async def _restore_workflow_checkpoint_streaming( whose updates we don't care about — we just need the side-effect of rehydration. Drained inline so the new-input run that follows observes the restored state. + + A latest checkpoint that drains to zero events (stale or + partially-written ``checkpoint_id``) is logged at WARNING so + operators can detect the silent-state-loss case, mirroring the + blocking helper. """ if storage is None: return latest = await storage.get_latest(workflow_name=workflow.name) if latest is None: return + drained = 0 async for _ in workflow.run( stream=True, checkpoint_id=latest.checkpoint_id, checkpoint_storage=storage, ): - pass + drained += 1 + if drained == 0: + logger.warning( + "workflow checkpoint restore stream produced zero events " + "(workflow=%s checkpoint_id=%s) — state may not be rehydrated", + workflow.name, + latest.checkpoint_id, + ) def _wrap_input(self, request: ChannelRequest) -> Message | list[Message]: """Promote ``request.input`` to ``Message``(s) carrying channel metadata. From 35a3ab37d43b689a4f163e104cf878b305fbaf2a Mon Sep 17 00:00:00 2001 From: eavanvalkenburg Date: Mon, 4 May 2026 22:21:02 +0200 Subject: [PATCH 5/6] feat(hosting-activity-protocol): rename Bot Framework channel to ActivityProtocolChannel The existing Bot-Framework-via-Azure-Bot-Service channel was previously shipped under the name ``hosting-teams`` / ``TeamsChannel``. That name is misleading for what the channel actually does -- it speaks the Bot Framework Activity Protocol against Azure Bot Service, which fans out across MS Teams, Slack, Webex, Telegram-via-Bot-Service, etc., and does not provide any Teams-specific affordances. This PR renames the package atomically and frees the ``hosting-teams`` name for a future Teams-native channel built on ``microsoft-teams-apps`` (PR-5b, spec req #28). 
Renames (all in one commit): - Package: ``agent-framework-hosting-teams`` -> ``agent-framework-hosting-activity-protocol`` - Module: ``agent_framework_hosting_teams`` -> ``agent_framework_hosting_activity_protocol`` - Channel class: ``TeamsChannel`` -> ``ActivityProtocolChannel`` - Helper: ``teams_isolation_key`` -> ``activity_protocol_isolation_key`` (isolation key prefix ``teams:`` -> ``activity:``) - Channel name: ``"teams"`` -> ``"activity"``; default mount path ``/teams`` -> ``/activity`` - Internal helper: ``_parse_teams_activity`` -> ``_parse_activity`` - Worker task name + a couple of error strings updated for consistency Updates README.md and the module docstring to call out: - this is the channel-neutral Activity Protocol channel, - it surfaces what every Bot-Service-connected channel has in common (text in / text out), - a forthcoming ``agent-framework-hosting-teams`` package will layer Teams-specific affordances (adaptive cards, message extensions, dialogs, SSO, ...) on the same Bot Service transport. Workspace: registers ``agent-framework-hosting-activity-protocol`` in ``python/pyproject.toml`` and adds the matching pyright ``executionEnvironments`` entry. Behavior is unchanged. Pyright + mypy clean, 11 tests pass. 
Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com> --- .../hosting-activity-protocol/LICENSE | 21 + .../hosting-activity-protocol/README.md | 43 ++ .../__init__.py | 7 + .../_channel.py | 571 ++++++++++++++++++ .../hosting-activity-protocol/pyproject.toml | 107 ++++ .../tests/__init__.py | 0 .../tests/test_channel.py | 182 ++++++ python/pyproject.toml | 2 + python/uv.lock | 20 + 9 files changed, 953 insertions(+) create mode 100644 python/packages/hosting-activity-protocol/LICENSE create mode 100644 python/packages/hosting-activity-protocol/README.md create mode 100644 python/packages/hosting-activity-protocol/agent_framework_hosting_activity_protocol/__init__.py create mode 100644 python/packages/hosting-activity-protocol/agent_framework_hosting_activity_protocol/_channel.py create mode 100644 python/packages/hosting-activity-protocol/pyproject.toml create mode 100644 python/packages/hosting-activity-protocol/tests/__init__.py create mode 100644 python/packages/hosting-activity-protocol/tests/test_channel.py diff --git a/python/packages/hosting-activity-protocol/LICENSE b/python/packages/hosting-activity-protocol/LICENSE new file mode 100644 index 0000000000..9e841e7a26 --- /dev/null +++ b/python/packages/hosting-activity-protocol/LICENSE @@ -0,0 +1,21 @@ + MIT License + + Copyright (c) Microsoft Corporation. + + Permission is hereby granted, free of charge, to any person obtaining a copy + of this software and associated documentation files (the "Software"), to deal + in the Software without restriction, including without limitation the rights + to use, copy, modify, merge, publish, distribute, sublicense, and/or sell + copies of the Software, and to permit persons to whom the Software is + furnished to do so, subject to the following conditions: + + The above copyright notice and this permission notice shall be included in all + copies or substantial portions of the Software. 
+ + THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE + AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, + OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE + SOFTWARE diff --git a/python/packages/hosting-activity-protocol/README.md b/python/packages/hosting-activity-protocol/README.md new file mode 100644 index 0000000000..367dc666da --- /dev/null +++ b/python/packages/hosting-activity-protocol/README.md @@ -0,0 +1,43 @@ +# agent-framework-hosting-activity-protocol + +Bot Framework **Activity Protocol** channel for +[agent-framework-hosting](../hosting). Connects to **Azure Bot Service** so +the same agent can be reached from Microsoft Teams, Slack, Webex, +Telegram-via-bot-channel, and any other channel Azure Bot Service +supports — without having to learn each channel's native protocol. + +> Looking for a deeper Microsoft Teams integration with adaptive cards, +> message extensions, dialogs, SSO, etc? See the companion +> [`agent-framework-hosting-teams`](../hosting-teams) package, which is +> built on `microsoft-teams-apps` and exposes Teams-specific affordances +> on top of (still) Azure Bot Service. + +Handles inbound `message` activities, outbound replies, mid-stream +`updateActivity` edits, typing indicators, and both client-secret and +certificate credential modes for the outbound Bot Framework token. 
+ +## Usage + +```python +from agent_framework_hosting import AgentFrameworkHost +from agent_framework_hosting_activity_protocol import ActivityProtocolChannel + +host = AgentFrameworkHost( + target=my_agent, + channels=[ + ActivityProtocolChannel( + app_id="", + client_secret="", + tenant_id="botframework.com", # or your tenant id + ) + ], +) +host.serve() +``` + +For tenants that disallow client secrets, supply `certificate_path=` (and +optionally `certificate_password=`) instead. See the docstring at the top of +`_channel.py` for the openssl one-liner that generates a usable PEM. + +In dev mode (no credentials), the channel skips outbound auth so the Bot +Framework Emulator can hit the endpoint without setup. diff --git a/python/packages/hosting-activity-protocol/agent_framework_hosting_activity_protocol/__init__.py b/python/packages/hosting-activity-protocol/agent_framework_hosting_activity_protocol/__init__.py new file mode 100644 index 0000000000..4c205b4f04 --- /dev/null +++ b/python/packages/hosting-activity-protocol/agent_framework_hosting_activity_protocol/__init__.py @@ -0,0 +1,7 @@ +# Copyright (c) Microsoft. All rights reserved. + +"""Bot Framework Activity Protocol channel for :mod:`agent_framework_hosting`.""" + +from ._channel import ActivityProtocolChannel, activity_protocol_isolation_key + +__all__ = ["ActivityProtocolChannel", "activity_protocol_isolation_key"] diff --git a/python/packages/hosting-activity-protocol/agent_framework_hosting_activity_protocol/_channel.py b/python/packages/hosting-activity-protocol/agent_framework_hosting_activity_protocol/_channel.py new file mode 100644 index 0000000000..36137f35cb --- /dev/null +++ b/python/packages/hosting-activity-protocol/agent_framework_hosting_activity_protocol/_channel.py @@ -0,0 +1,571 @@ +# Copyright (c) Microsoft. All rights reserved. + +r"""Built-in channel: Bot Framework Activity Protocol (Azure Bot Service). 
+ +Activity Protocol is the Bot Framework messaging shape used by Azure Bot +Service to fan one bot endpoint out across many surfaces (Microsoft +Teams, Slack, Webex, Telegram, …). An incoming ``Activity`` is POSTed to +your bot's ``/messages`` endpoint, and you reply by POSTing one or more +``Activity`` objects back to the conversation URL the inbound activity +carried in ``serviceUrl``. Auth is an OAuth2 client-credentials token +from Entra (the legacy multi-tenant ``botframework.com`` authority for +public Bot Framework channels, or your own tenant for single-tenant +bots). + +This is the channel-neutral Activity-Protocol channel — it surfaces what +every Bot-Service-connected channel has in common (text in, text out). +For deeper Microsoft Teams affordances (adaptive cards, message +extensions, dialogs, SSO, …) on the same Bot Service transport, see the +companion ``agent-framework-hosting-teams`` package. + +This channel handles: + +- inbound ``message`` activities — text and attachments resolved to URIs, +- outbound replies via ``POST /v3/conversations/{id}/activities``, +- streaming via ``PUT /v3/conversations/{id}/activities/{id}`` mid-stream + edits (Teams supports updateActivity in personal chats and groups), +- typing indicators while the agent works, +- per-conversation isolation key ``activity:`` so a Responses + caller can resume a Teams conversation by passing the conversation id, +- two credential modes for the outbound token — **client secret** or + **certificate** (for tenants that disallow secrets) — both via + ``azure.identity.aio``, +- dev-mode auth bypass when no credentials are passed so the Bot Framework + Emulator can hit the endpoint with no credentials. + +Out of scope for the prototype: full JWT validation of inbound requests, +adaptive cards, file uploads, OAuth sign-in flows, and the Teams streaming +preview API (``StreamItem``). 
+ +Generating a certificate +------------------------ +For tenants that disallow client secrets, register a certificate on your +Bot Framework / Entra app instead. Self-signed PEM (private key + cert in +one file) is what ``azure.identity.CertificateCredential`` expects:: + + # 1. Generate a 2048-bit RSA key + self-signed cert (10y), single PEM. + openssl req -x509 -newkey rsa:2048 -nodes -days 3650 \\ + -subj "/CN=my-teams-bot" \\ + -keyout teams-bot.key -out teams-bot.crt + cat teams-bot.key teams-bot.crt > teams-bot.pem + + # 2. Upload teams-bot.crt to your Entra app under + # "Certificates & secrets" → "Certificates" → "Upload certificate". + + # 3. Point the channel at the combined PEM: + ActivityProtocolChannel( + app_id="", + tenant_id="", # or "botframework.com" for legacy bots + certificate_path="teams-bot.pem", + ) + +To encrypt the private key, drop ``-nodes`` from the openssl command and +pass ``certificate_password=`` to the channel. +""" + +from __future__ import annotations + +import asyncio +import time +from collections.abc import Awaitable, Mapping +from typing import Any + +import httpx +from agent_framework import ( + AgentResponse, + AgentResponseUpdate, + Content, + Message, + ResponseStream, +) +from agent_framework_hosting import ( + ChannelContext, + ChannelContribution, + ChannelRequest, + ChannelRunHook, + ChannelSession, + ChannelStreamTransformHook, + apply_run_hook, + logger, +) +from azure.core.credentials_async import AsyncTokenCredential +from azure.identity.aio import CertificateCredential, ClientSecretCredential +from starlette.requests import Request +from starlette.responses import JSONResponse, Response +from starlette.routing import Route + +# Bot Framework v4 multi-tenant authority used by the public Bot Framework +# channels (including Microsoft Teams). Single-tenant bots should override +# ``tenant_id`` with their own tenant. 
+_BOTFRAMEWORK_TENANT = "botframework.com" +_BOTFRAMEWORK_SCOPE = "https://api.botframework.com/.default" + + +def activity_protocol_isolation_key(conversation_id: Any) -> str: + """Build the namespaced isolation key the Teams channel writes under. + + Exposed at module scope so other channels' run hooks can opt into the + same per-conversation session (e.g. a Responses caller resuming a Teams + conversation by passing the conversation id). + """ + return f"activity:{conversation_id}" + + +def _parse_activity(activity: Mapping[str, Any]) -> Message: + """Translate one Bot Framework ``message`` Activity into an Agent Framework Message. + + Pulls the activity's ``text`` plus any image/file attachments with a + ``contentType`` and resolvable URL into ``Content`` parts. If the + activity has no usable parts an empty text part is emitted so the + caller never sees a content-less message. + """ + parts: list[Content] = [] + if (text := activity.get("text")) and isinstance(text, str): + parts.append(Content.from_text(text=text)) + + for attachment in activity.get("attachments") or []: + if not isinstance(attachment, Mapping): + continue + url = attachment.get("contentUrl") or attachment.get("content") + content_type = attachment.get("contentType") + if isinstance(url, str) and isinstance(content_type, str) and "/" in content_type: + parts.append(Content.from_uri(uri=url, media_type=content_type)) + + if not parts: + parts.append(Content.from_text(text="")) + return Message("user", parts) + + +class ActivityProtocolChannel: + """Microsoft Teams channel via Bot Framework v4 webhook. + + Streaming + --------- + When ``stream=True`` (default), the channel sends an initial placeholder + activity, then edits it in place as the agent emits ``AgentResponseUpdate`` + chunks (``PUT /v3/conversations/{id}/activities/{id}``). When ``stream=False`` + it just sends the final reply. A ``stream_transform_hook`` can rewrite or + drop individual updates before they hit the wire. 
+ """ + + name = "activity" + + def __init__( + self, + *, + path: str = "/activity", + app_id: str | None = None, + app_password: str | None = None, + certificate_path: str | None = None, + certificate_password: bytes | None = None, + tenant_id: str = _BOTFRAMEWORK_TENANT, + token_scope: str = _BOTFRAMEWORK_SCOPE, + credential: AsyncTokenCredential | None = None, + run_hook: ChannelRunHook | None = None, + send_typing_action: bool = True, + stream: bool = True, + stream_transform_hook: ChannelStreamTransformHook | None = None, + stream_edit_min_interval: float = 0.7, + ) -> None: + """Configure the Teams channel. + + Args: + path: Mount path. The webhook lives at ``{path}/messages``. + app_id: Bot Framework / Entra application (client) id. Required + whenever any credential is supplied. + app_password: Application secret for OAuth2 client credentials. + Mutually exclusive with ``certificate_path``. + certificate_path: Path to a PEM file containing **both** the + private key and the X.509 certificate. Use this for tenants + that disallow client secrets. See the module docstring for an + ``openssl`` recipe. + certificate_password: Password for the PEM private key, if any. + tenant_id: Entra tenant. Defaults to ``"botframework.com"`` for + public Bot Framework channels; pass your tenant id for + single-tenant bots. + token_scope: OAuth2 scope to request. Defaults to the Bot + Framework resource. + credential: Bring your own ``AsyncTokenCredential`` (e.g. a + ``DefaultAzureCredential`` configured elsewhere). Overrides + ``app_password`` / ``certificate_path``. + run_hook: Optional rewrite of ``ChannelRequest`` before invocation. + send_typing_action: Whether to send ``typing`` activities while + the agent runs. + stream: Whether to stream by default. ``run_hook`` can flip per + request. + stream_transform_hook: Optional rewrite of each + ``AgentResponseUpdate`` before it hits the wire. + stream_edit_min_interval: Seconds between successive in-place + edits. 
Teams is more rate-sensitive than Telegram, so default + is higher. + """ + if app_password and certificate_path: + raise ValueError("ActivityProtocolChannel: pass either app_password or certificate_path, not both.") + self.path = path + self._app_id = app_id + self._token_scope = token_scope + self._tenant_id = tenant_id + self._hook = run_hook + self._send_typing_action = send_typing_action + self._stream_default = stream + self._stream_transform_hook = stream_transform_hook + self._stream_edit_min_interval = stream_edit_min_interval + self._ctx: ChannelContext | None = None + self._http: httpx.AsyncClient | None = None + + # Build the credential up front so misconfiguration fails at construction. + self._credential: AsyncTokenCredential | None + if credential is not None: + self._credential = credential + elif app_id and certificate_path: + self._credential = CertificateCredential( + tenant_id=tenant_id, + client_id=app_id, + certificate_path=certificate_path, + password=certificate_password, + ) + elif app_id and app_password: + self._credential = ClientSecretCredential( + tenant_id=tenant_id, + client_id=app_id, + client_secret=app_password, + ) + else: + self._credential = None # dev mode + + def contribute(self, context: ChannelContext) -> ChannelContribution: + """Capture the host context and register the ``POST /messages`` webhook.""" + self._ctx = context + return ChannelContribution( + routes=[Route("/messages", self._handle, methods=["POST"])], + on_startup=[self._on_startup], + on_shutdown=[self._on_shutdown], + ) + + # -- lifecycle --------------------------------------------------------- # + + async def _on_startup(self) -> None: + """Open the outbound HTTP client and emit a startup banner. + + When no Bot Framework credential is configured we log a loud warning — + outbound replies will not authenticate, which is only acceptable + against the local Bot Framework Emulator. 
+ """ + if self._http is None: + self._http = httpx.AsyncClient(timeout=30.0) + if self._credential is None: + logger.warning( + "ActivityProtocolChannel running without credentials — outbound replies " + "will not authenticate. Use only with the Bot Framework " + "Emulator for local development." + ) + else: + cred_kind = type(self._credential).__name__ + logger.info( + "ActivityProtocolChannel listening on %s/messages (auth=%s, tenant=%s)", + self.path, + cred_kind, + self._tenant_id, + ) + + async def _on_shutdown(self) -> None: + """Close the HTTP client and best-effort close the credential. + + Credential ``close`` failures are logged but never raised — shutdown + must never be allowed to mask the original cause of an app exit. + """ + if self._http is not None: + await self._http.aclose() + if self._credential is not None: + close = getattr(self._credential, "close", None) + if close is not None: + try: + await close() + except Exception: # pragma: no cover - best-effort + logger.exception("ActivityProtocolChannel credential close failed") + + # -- token management -------------------------------------------------- # + + async def _get_token(self) -> str | None: + """Acquire (and cache) an outbound bearer token. + + ``azure.identity`` credentials cache and refresh internally, so we + just delegate. + """ + if self._credential is None: + return None + access_token = await self._credential.get_token(self._token_scope) + return access_token.token + + def _auth_headers(self, token: str | None) -> dict[str, str]: + """Return Bot Framework auth headers, or an empty dict in dev mode.""" + return {"Authorization": f"Bearer {token}"} if token else {} + + # -- request handling -------------------------------------------------- # + + async def _handle(self, request: Request) -> Response: + """Bot Framework webhook entry point. 
+ + Only ``message`` activities are processed; ``conversationUpdate``, + ``invoke``, ``typing`` and other activity types are silently + acknowledged. The webhook always returns 200 (or 202 for ignored + types) so Bot Framework can dequeue the activity even if our + downstream processing fails — failures are logged and re-tried by + the user, not by Teams. + """ + try: + activity = await request.json() + except Exception: + return JSONResponse({"error": "invalid json"}, status_code=400) + + # We accept only message activities for now. ``conversationUpdate``, + # ``invoke``, ``typing`` and friends are silently ack'd. + if activity.get("type") != "message": + return JSONResponse({}, status_code=202) + + try: + await self._process_activity(activity) + except Exception: + logger.exception("Teams activity processing failed") + # Bot Framework expects 200 OK to dequeue the activity. + return JSONResponse({}, status_code=200) + + async def _process_activity(self, activity: Mapping[str, Any]) -> None: + """Build a :class:`ChannelRequest` from a message Activity and dispatch. + + The Teams isolation key is per-conversation so all members of a + group chat share session state. Activity metadata (``reply_to_id``, + ``recipient``) is preserved so reply-as-reaction style flows can + reconstruct the original message context. 
+ """ + if self._ctx is None: # pragma: no cover - guarded by lifecycle + raise RuntimeError("activity channel not started") + conversation = activity.get("conversation") or {} + conversation_id = conversation.get("id") + service_url = activity.get("serviceUrl") + if not isinstance(conversation_id, str) or not isinstance(service_url, str): + logger.warning("Teams activity missing conversation.id or serviceUrl — dropping") + return + + parsed = _parse_activity(activity) + channel_request = ChannelRequest( + channel=self.name, + operation="message.create", + input=[parsed], + session=ChannelSession(isolation_key=activity_protocol_isolation_key(conversation_id)), + attributes={ + "conversation_id": conversation_id, + "service_url": service_url, + "from_id": (activity.get("from") or {}).get("id"), + "channel_id": activity.get("channelId"), + }, + metadata={"reply_to_id": activity.get("id"), "recipient": activity.get("recipient")}, + stream=self._stream_default, + ) + if self._hook is not None: + channel_request = await apply_run_hook( + self._hook, + channel_request, + target=self._ctx.target, + protocol_request=activity, + ) + + await self._dispatch(activity, channel_request) + + # -- outbound helpers -------------------------------------------------- # + + async def _dispatch(self, inbound: Mapping[str, Any], request: ChannelRequest) -> None: + """Run the target and ship the result back into the originating Teams conversation. + + Optionally fires a typing indicator before non-streaming runs; + streaming runs route through ``_stream_to_conversation`` which + progressively edits a single placeholder activity. 
+ """ + if self._ctx is None: # pragma: no cover - guarded by lifecycle + raise RuntimeError("activity channel not started") + if self._send_typing_action: + await self._send_typing(inbound) + + if not request.stream: + result = await self._ctx.run(request) + text = getattr(result, "text", None) or "(no response)" + await self._send_message(inbound, text) + return + + stream = self._ctx.run_stream(request) + await self._stream_to_conversation(inbound, stream) + + async def _stream_to_conversation( + self, + inbound: Mapping[str, Any], + stream: ResponseStream[AgentResponseUpdate, AgentResponse], + ) -> None: + """Iterate the stream and progressively edit a single Teams activity.""" + accumulated = "" + last_sent = "" + last_edit_at = 0.0 + activity_id: str | None = None + worker_done = asyncio.Event() + wake = asyncio.Event() + + async def send_initial_placeholder() -> None: + nonlocal activity_id, last_edit_at + try: + activity_id = await self._send_message(inbound, "…") + last_edit_at = time.monotonic() + except Exception: # pragma: no cover + logger.exception("Teams placeholder send failed") + + async def edit_worker() -> None: + nonlocal last_sent, last_edit_at + while not (worker_done.is_set() and accumulated == last_sent): + await wake.wait() + wake.clear() + if activity_id is None or accumulated == last_sent: + continue + elapsed = time.monotonic() - last_edit_at + if elapsed < self._stream_edit_min_interval: + try: + await asyncio.wait_for(wake.wait(), timeout=self._stream_edit_min_interval - elapsed) + wake.clear() + except asyncio.TimeoutError: + pass + snapshot = accumulated + if snapshot == last_sent: + continue + try: + await self._update_activity(inbound, activity_id, snapshot) + except Exception: # pragma: no cover + logger.exception("Teams interim edit failed") + last_sent = snapshot + last_edit_at = time.monotonic() + + await send_initial_placeholder() + edit_task = asyncio.create_task(edit_worker(), name="activity-edit-worker") + + try: + async 
for update in stream: + if self._stream_transform_hook is not None: + transformed = self._stream_transform_hook(update) + if isinstance(transformed, Awaitable): + transformed = await transformed + if transformed is None: + continue + update = transformed + chunk = getattr(update, "text", None) + if chunk: + accumulated += chunk + wake.set() + except Exception: + logger.exception("Teams streaming consumption failed") + finally: + worker_done.set() + wake.set() + try: + await edit_task + except Exception: # pragma: no cover + logger.exception("Teams edit worker crashed") + + try: + await stream.get_final_response() + except Exception: # pragma: no cover + logger.exception("Stream finalize failed") + + # Final flush — make sure the user sees everything that arrived after + # the worker's last edit. + if activity_id is not None and accumulated and accumulated != last_sent: + try: + await self._update_activity(inbound, activity_id, accumulated) + except Exception: # pragma: no cover + logger.exception("Teams final edit failed") + elif not accumulated and activity_id is not None: + # No text streamed — replace the placeholder with a stub so the + # user isn't left staring at "…". 
+ try: + await self._update_activity(inbound, activity_id, "(no response)") + except Exception: # pragma: no cover + logger.exception("Teams placeholder replace failed") + + # -- Bot Framework REST helpers --------------------------------------- # + + def _activity_payload(self, inbound: Mapping[str, Any], text: str) -> dict[str, Any]: + """Build the outbound Activity envelope (text-only message).""" + recipient = inbound.get("from") or {} + from_user = inbound.get("recipient") or {} + return { + "type": "message", + "from": from_user, + "recipient": recipient, + "conversation": inbound.get("conversation") or {}, + "replyToId": inbound.get("id"), + "channelId": inbound.get("channelId"), + "serviceUrl": inbound.get("serviceUrl"), + "text": text, + "textFormat": "plain", + } + + async def _send_message(self, inbound: Mapping[str, Any], text: str) -> str | None: + """POST a new Activity. Returns the assigned activity id.""" + if self._http is None: # pragma: no cover - guarded by lifecycle + raise RuntimeError("activity channel not started") + service_url = str(inbound.get("serviceUrl") or "").rstrip("/") + conversation_id = (inbound.get("conversation") or {}).get("id") + if not service_url or not isinstance(conversation_id, str): + return None + url = f"{service_url}/v3/conversations/{conversation_id}/activities" + token = await self._get_token() + response = await self._http.post( + url, json=self._activity_payload(inbound, text), headers=self._auth_headers(token) + ) + response.raise_for_status() + payload = response.json() if response.content else {} + return payload.get("id") if isinstance(payload, dict) else None + + async def _update_activity(self, inbound: Mapping[str, Any], activity_id: str, text: str) -> None: + """PUT-edit an existing Activity (Teams updateActivity).""" + if self._http is None: # pragma: no cover - guarded by lifecycle + raise RuntimeError("activity channel not started") + service_url = str(inbound.get("serviceUrl") or "").rstrip("/") + 
conversation_id = (inbound.get("conversation") or {}).get("id") + if not service_url or not isinstance(conversation_id, str): + return + url = f"{service_url}/v3/conversations/{conversation_id}/activities/{activity_id}" + token = await self._get_token() + response = await self._http.put( + url, json=self._activity_payload(inbound, text), headers=self._auth_headers(token) + ) + response.raise_for_status() + + async def _send_typing(self, inbound: Mapping[str, Any]) -> None: + """Send a Teams typing indicator; failures are logged and swallowed. + + The typing activity is purely a UX nicety — if it fails (token + expired, transient network issue, channel that doesn't support + typing) we never surface that to the user or block the actual + agent run. + """ + if self._http is None: # pragma: no cover - guarded by lifecycle + raise RuntimeError("activity channel not started") + service_url = str(inbound.get("serviceUrl") or "").rstrip("/") + conversation_id = (inbound.get("conversation") or {}).get("id") + if not service_url or not isinstance(conversation_id, str): + return + url = f"{service_url}/v3/conversations/{conversation_id}/activities" + token = await self._get_token() + try: + await self._http.post( + url, + json={ + "type": "typing", + "from": inbound.get("recipient") or {}, + "recipient": inbound.get("from") or {}, + "conversation": inbound.get("conversation") or {}, + "serviceUrl": inbound.get("serviceUrl"), + }, + headers=self._auth_headers(token), + ) + except Exception: # pragma: no cover - non-critical UX + logger.exception("Teams typing send failed") + + +__all__ = ["ActivityProtocolChannel", "activity_protocol_isolation_key"] diff --git a/python/packages/hosting-activity-protocol/pyproject.toml b/python/packages/hosting-activity-protocol/pyproject.toml new file mode 100644 index 0000000000..cd18431a07 --- /dev/null +++ b/python/packages/hosting-activity-protocol/pyproject.toml @@ -0,0 +1,107 @@ +[project] +name = 
"agent-framework-hosting-activity-protocol" +description = "Bot Framework Activity Protocol channel for agent-framework-hosting (Teams, Slack, etc. via Azure Bot Service)." +authors = [{ name = "Microsoft", email = "af-support@microsoft.com"}] +readme = "README.md" +requires-python = ">=3.10" +version = "1.0.0a260424" +license-files = ["LICENSE"] +urls.homepage = "https://aka.ms/agent-framework" +urls.source = "https://github.com/microsoft/agent-framework/tree/main/python" +urls.release_notes = "https://github.com/microsoft/agent-framework/releases?q=tag%3Apython-1&expanded=true" +urls.issues = "https://github.com/microsoft/agent-framework/issues" +classifiers = [ + "License :: OSI Approved :: MIT License", + "Development Status :: 3 - Alpha", + "Intended Audience :: Developers", + "Programming Language :: Python :: 3", + "Programming Language :: Python :: 3.10", + "Programming Language :: Python :: 3.11", + "Programming Language :: Python :: 3.12", + "Programming Language :: Python :: 3.13", + "Programming Language :: Python :: 3.14", + "Typing :: Typed", +] +dependencies = [ + "agent-framework-core>=1.2.0,<2", + "agent-framework-hosting==1.0.0a260424", + "httpx>=0.27,<1", + "azure-identity>=1.20,<2", +] + +[tool.uv] +prerelease = "if-necessary-or-explicit" +environments = [ + "sys_platform == 'darwin'", + "sys_platform == 'linux'", + "sys_platform == 'win32'" +] + +[tool.uv-dynamic-versioning] +fallback-version = "0.0.0" + +[tool.pytest.ini_options] +testpaths = 'tests' +addopts = "-ra -q -r fEX" +asyncio_mode = "auto" +asyncio_default_fixture_loop_scope = "function" +filterwarnings = [] +timeout = 120 +markers = [ + "integration: marks tests as integration tests that require external services", +] + +[tool.ruff] +extend = "../../pyproject.toml" + +[tool.coverage.run] +omit = [ + "**/__init__.py" +] + +[tool.pyright] +extends = "../../pyproject.toml" +include = ["agent_framework_hosting_activity_protocol"] +exclude = ['tests'] +# Bot Framework activities arrive 
as loosely-typed JSON-ish maps. Strict +# ``Unknown`` reporting on every ``.get(...)`` adds noise without catching +# real bugs — narrowing happens via runtime isinstance checks instead. +reportUnknownArgumentType = "none" +reportUnknownMemberType = "none" +reportUnknownVariableType = "none" +reportUnknownLambdaType = "none" +reportOptionalMemberAccess = "none" + +[tool.mypy] +plugins = ['pydantic.mypy'] +strict = true +python_version = "3.10" +ignore_missing_imports = true +disallow_untyped_defs = true +no_implicit_optional = true +check_untyped_defs = true +warn_return_any = true +show_error_codes = true +warn_unused_ignores = false +disallow_incomplete_defs = true +disallow_untyped_decorators = true + +[tool.bandit] +targets = ["agent_framework_hosting_activity_protocol"] +exclude_dirs = ["tests"] + +[tool.poe] +executor.type = "uv" +include = "../../shared_tasks.toml" + +[tool.poe.tasks.mypy] +help = "Run MyPy for this package." +cmd = "mypy --config-file $POE_ROOT/pyproject.toml agent_framework_hosting_activity_protocol" + +[tool.poe.tasks.test] +help = "Run the default unit test suite for this package." +cmd = 'pytest -m "not integration" --cov=agent_framework_hosting_activity_protocol --cov-report=term-missing:skip-covered tests' + +[build-system] +requires = ["flit-core >= 3.11,<4.0"] +build-backend = "flit_core.buildapi" diff --git a/python/packages/hosting-activity-protocol/tests/__init__.py b/python/packages/hosting-activity-protocol/tests/__init__.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/python/packages/hosting-activity-protocol/tests/test_channel.py b/python/packages/hosting-activity-protocol/tests/test_channel.py new file mode 100644 index 0000000000..64208d6902 --- /dev/null +++ b/python/packages/hosting-activity-protocol/tests/test_channel.py @@ -0,0 +1,182 @@ +# Copyright (c) Microsoft. All rights reserved. + +"""Unit tests for :mod:`agent_framework_hosting_activity_protocol`. 
+ +The Bot Framework outbound calls and azure-identity credentials are mocked +out so the suite never touches the network. Live token acquisition, +streaming edits and certificate paths are out of scope here. +""" + +from __future__ import annotations + +from dataclasses import dataclass +from typing import Any +from unittest.mock import AsyncMock, MagicMock + +import pytest +from agent_framework_hosting import AgentFrameworkHost +from starlette.testclient import TestClient + +from agent_framework_hosting_activity_protocol import ActivityProtocolChannel, activity_protocol_isolation_key +from agent_framework_hosting_activity_protocol._channel import _parse_activity + + +def test_activity_protocol_isolation_key_format() -> None: + assert activity_protocol_isolation_key("19:meeting_xyz@thread.v2") == "activity:19:meeting_xyz@thread.v2" + assert activity_protocol_isolation_key(123) == "activity:123" + + +class TestParseActivity: + def test_text_only(self) -> None: + msg = _parse_activity({"type": "message", "text": "hello"}) + assert msg.role == "user" + assert msg.text == "hello" + + def test_with_attachment(self) -> None: + msg = _parse_activity({ + "type": "message", + "text": "see this", + "attachments": [ + {"contentType": "image/png", "contentUrl": "https://example.com/x.png"}, + ], + }) + assert msg.text == "see this" + assert any((getattr(c, "uri", None) or "").endswith("/x.png") for c in msg.contents) + + def test_skips_invalid_attachments(self) -> None: + msg = _parse_activity({ + "type": "message", + "text": "hi", + "attachments": [ + "not-a-mapping", + {"contentType": "image/png"}, # no url + {"contentUrl": "https://example.com/y", "contentType": "no-slash"}, + ], + }) + assert msg.text == "hi" + # No URI content survived. 
+ assert not any(getattr(c, "uri", None) for c in msg.contents) + + +@dataclass +class _FakeAgentResponse: + text: str + + +class _FakeAgent: + def __init__(self, reply: str = "ok") -> None: + self._reply = reply + self.runs: list[Any] = [] + + def create_session(self, *, session_id: str | None = None) -> Any: + return {"session_id": session_id} + + def run(self, messages: Any = None, *, stream: bool = False, **kwargs: Any) -> Any: + self.runs.append({"messages": messages, "stream": stream, "kwargs": kwargs}) + + async def _coro() -> _FakeAgentResponse: + return _FakeAgentResponse(text=self._reply) + + return _coro() + + +def _make_teams(stream: bool = False) -> tuple[ActivityProtocolChannel, _FakeAgent]: + agent = _FakeAgent("hi there") + ch = ActivityProtocolChannel(stream=stream, send_typing_action=False) + fake_http = MagicMock() + response_mock = MagicMock() + response_mock.raise_for_status = MagicMock() + response_mock.json = MagicMock(return_value={"id": "act-1"}) + fake_http.post = AsyncMock(return_value=response_mock) + fake_http.put = AsyncMock(return_value=response_mock) + fake_http.aclose = AsyncMock() + ch._http = fake_http + return ch, agent + + +_VALID_ACTIVITY: dict[str, Any] = { + "type": "message", + "id": "in-1", + "text": "hello bot", + "conversation": {"id": "19:meeting_xyz@thread.v2"}, + "from": {"id": "user-1"}, + "recipient": {"id": "bot-1"}, + "channelId": "msteams", + "serviceUrl": "https://smba.trafficmanager.net/amer/", +} + + +class TestTeamsWebhook: + def test_message_activity_dispatches_to_agent(self) -> None: + ch, agent = _make_teams() + host = AgentFrameworkHost(target=agent, channels=[ch]) + with TestClient(host.app) as client: + r = client.post("/activity/messages", json=_VALID_ACTIVITY) + assert r.status_code == 200 + assert agent.runs, "expected the agent to be invoked" + # And the channel posted a reply back to the conversation URL. 
+ assert ch._http is not None + ch._http.post.assert_called() # type: ignore[attr-defined] + url, _ = ch._http.post.call_args[0], ch._http.post.call_args[1] # type: ignore[attr-defined] # noqa: F841 + assert "/v3/conversations/" in ch._http.post.call_args[0][0] # type: ignore[attr-defined] + + def test_non_message_activities_are_acked(self) -> None: + ch, agent = _make_teams() + host = AgentFrameworkHost(target=agent, channels=[ch]) + with TestClient(host.app) as client: + r = client.post( + "/activity/messages", + json={"type": "conversationUpdate", "conversation": {"id": "x"}}, + ) + assert r.status_code == 202 + assert not agent.runs + + def test_invalid_json_returns_400(self) -> None: + ch, agent = _make_teams() + host = AgentFrameworkHost(target=agent, channels=[ch]) + with TestClient(host.app) as client: + r = client.post( + "/activity/messages", + content=b"not-json", + headers={"content-type": "application/json"}, + ) + assert r.status_code == 400 + assert not agent.runs + + def test_message_missing_serviceurl_is_dropped(self) -> None: + ch, agent = _make_teams() + host = AgentFrameworkHost(target=agent, channels=[ch]) + bad = dict(_VALID_ACTIVITY) + bad.pop("serviceUrl") + with TestClient(host.app) as client: + r = client.post("/activity/messages", json=bad) + # Bot Framework still expects 200 to dequeue. 
+ assert r.status_code == 200 + assert not agent.runs + + +@pytest.mark.asyncio +class TestOutbound: + async def test_send_message_posts_to_conversation_url(self) -> None: + ch, _agent = _make_teams() + await ch._send_message(_VALID_ACTIVITY, "hi") + assert ch._http is not None + ch._http.post.assert_called() # type: ignore[attr-defined] + url = ch._http.post.call_args[0][0] # type: ignore[attr-defined] + assert "/v3/conversations/" in url + body = ch._http.post.call_args[1]["json"] # type: ignore[attr-defined] + assert body["text"] == "hi" + + +class TestConfig: + def test_rejects_both_secret_and_certificate(self) -> None: + with pytest.raises(ValueError, match="not both"): + ActivityProtocolChannel( + app_id="x", + app_password="s", + certificate_path="/tmp/does-not-exist.pem", + ) + + def test_dev_mode_no_credential(self) -> None: + ch = ActivityProtocolChannel() + assert ch._credential is None diff --git a/python/pyproject.toml b/python/pyproject.toml index 406aaf6efc..dac9ad7a17 100644 --- a/python/pyproject.toml +++ b/python/pyproject.toml @@ -86,6 +86,7 @@ agent-framework-foundry-local = { workspace = true } agent-framework-gemini = { workspace = true } agent-framework-github-copilot = { workspace = true } agent-framework-hosting = { workspace = true } +agent-framework-hosting-activity-protocol = { workspace = true } agent-framework-hyperlight = { workspace = true } agent-framework-lab = { workspace = true } agent-framework-mem0 = { workspace = true } @@ -207,6 +208,7 @@ executionEnvironments = [ { root = "packages/foundry_local/tests", reportPrivateUsage = "none" }, { root = "packages/github_copilot/tests", reportPrivateUsage = "none" }, { root = "packages/hosting/tests", reportPrivateUsage = "none" }, + { root = "packages/hosting-activity-protocol/tests", reportPrivateUsage = "none" }, { root = "packages/lab/gaia/tests", reportPrivateUsage = "none" }, { root = "packages/lab/lightning/tests", reportPrivateUsage = "none" }, { root = 
"packages/lab/tau2/tests", reportPrivateUsage = "none" }, diff --git a/python/uv.lock b/python/uv.lock index a4b58d2270..78ca29b424 100644 --- a/python/uv.lock +++ b/python/uv.lock @@ -48,6 +48,7 @@ members = [ "agent-framework-gemini", "agent-framework-github-copilot", "agent-framework-hosting", + "agent-framework-hosting-activity-protocol", "agent-framework-hyperlight", "agent-framework-lab", "agent-framework-mem0", @@ -630,6 +631,25 @@ provides-extras = ["serve"] [package.metadata.requires-dev] dev = [{ name = "httpx", specifier = ">=0.28.1" }] +[[package]] +name = "agent-framework-hosting-activity-protocol" +version = "1.0.0a260424" +source = { editable = "packages/hosting-activity-protocol" } +dependencies = [ + { name = "agent-framework-core", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" }, + { name = "agent-framework-hosting", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" }, + { name = "azure-identity", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" }, + { name = "httpx", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" }, +] + +[package.metadata] +requires-dist = [ + { name = "agent-framework-core", editable = "packages/core" }, + { name = "agent-framework-hosting", editable = "packages/hosting" }, + { name = "azure-identity", specifier = ">=1.20,<2" }, + { name = "httpx", specifier = ">=0.27,<1" }, +] + [[package]] name = "agent-framework-hyperlight" version = "1.0.0a260429" From f60466c6b981ed1e3a3ee4779aadd482b0d16877 Mon Sep 17 00:00:00 2001 From: eavanvalkenburg Date: Thu, 7 May 2026 16:28:00 +0200 Subject: [PATCH 6/6] review: address PR-5 round 2 feedback MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - security (#3198327004): add `service_url_allowed_hosts` constructor option (default `botframework.com` + `smba.trafficmanager.net`) and 
reject inbound activities whose `serviceUrl` host falls outside it with HTTP 400 — without this gate a malicious caller could redirect outbound replies (and the attached bearer token) to an attacker-controlled host - security (#3198324219): add `inbound_auth_validator` async callback; log a loud WARNING at startup when no validator AND no operator reverse-proxy is configured so the dev-mode bypass cannot accidentally ship to production. Document the contract: prototype intentionally does not ship JWT validation (out of scope); operators must plug a validator or terminate auth in front of the channel - retry semantics (#3198328746): distinguish transient outbound failures (httpx network errors, non-2xx from Bot Service) — return 502 so Bot Service retries — from deterministic agent failures — return 200 so Bot Service does not retry the same broken activity in a loop - bug (#3198330424): fix the placeholder-failure deadlock. When `send_initial_placeholder` fails, `activity_id` stays `None`, the edit-worker loop exit condition (`accumulated == last_sent`) is unreachable while no PUT is possible, and the worker would deadlock on `wake.wait()` forever after `worker_done` is set. 
Now: skip the worker entirely on placeholder failure and POST a single final activity at the end with whatever accumulated - tests (#3198334465, #3187178091, #3198336045): add coverage for - `_is_service_url_allowed` allow/deny matrix + webhook 400 on disallowed serviceUrl - `inbound_auth_validator` allow/deny/raises paths - outbound `Authorization: Bearer ` header presence in production mode and absence in dev mode - the streaming path (`_stream_to_conversation`): placeholder + final edit, placeholder-failure fallback (with timeout guard against deadlock regression), and empty-stream `(no response)` placeholder replacement - retry-signal differentiation: outbound `httpx.ConnectError` → 502; deterministic `ValueError` from the agent → 200 Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com> --- .../_channel.py | 170 ++++++++++-- .../tests/test_channel.py | 253 +++++++++++++++++- 2 files changed, 402 insertions(+), 21 deletions(-) diff --git a/python/packages/hosting-activity-protocol/agent_framework_hosting_activity_protocol/_channel.py b/python/packages/hosting-activity-protocol/agent_framework_hosting_activity_protocol/_channel.py index 36137f35cb..e54d9622b3 100644 --- a/python/packages/hosting-activity-protocol/agent_framework_hosting_activity_protocol/_channel.py +++ b/python/packages/hosting-activity-protocol/agent_framework_hosting_activity_protocol/_channel.py @@ -67,8 +67,9 @@ import asyncio import time -from collections.abc import Awaitable, Mapping +from collections.abc import Awaitable, Callable, Mapping from typing import Any +from urllib.parse import urlparse import httpx from agent_framework import ( @@ -100,6 +101,20 @@ _BOTFRAMEWORK_TENANT = "botframework.com" _BOTFRAMEWORK_SCOPE = "https://api.botframework.com/.default" +# Default allow-list of host suffixes the channel will POST a bearer token +# to. 
Bot Service surfaces ``serviceUrl`` per-conversation as one of these +# canonical hosts; a malicious inbound activity claiming a serviceUrl +# outside this set could otherwise exfiltrate a real Bot Framework access +# token. Operators with a private deployment (sovereign cloud, Direct Line +# only, etc.) override this via ``service_url_allowed_hosts``. +_DEFAULT_SERVICE_URL_HOSTS = ( + "botframework.com", + "smba.trafficmanager.net", +) + + +InboundAuthValidator = Callable[[Request], Awaitable[bool]] + def activity_protocol_isolation_key(conversation_id: Any) -> str: """Build the namespaced isolation key the Teams channel writes under. @@ -111,6 +126,10 @@ def activity_protocol_isolation_key(conversation_id: Any) -> str: return f"activity:{conversation_id}" +class _OutboundError(RuntimeError): + """Marker for transient outbound failures that should produce 502/retry.""" + + def _parse_activity(activity: Mapping[str, Any]) -> Message: """Translate one Bot Framework ``message`` Activity into an Agent Framework Message. @@ -166,6 +185,8 @@ def __init__( stream: bool = True, stream_transform_hook: ChannelStreamTransformHook | None = None, stream_edit_min_interval: float = 0.7, + inbound_auth_validator: InboundAuthValidator | None = None, + service_url_allowed_hosts: tuple[str, ...] = _DEFAULT_SERVICE_URL_HOSTS, ) -> None: """Configure the Teams channel. @@ -198,6 +219,30 @@ def __init__( stream_edit_min_interval: Seconds between successive in-place edits. Teams is more rate-sensitive than Telegram, so default is higher. + inbound_auth_validator: Optional async callable invoked for each + inbound webhook request **before** the activity is parsed. + Return ``True`` to allow, ``False`` to reject with HTTP 401. + The webhook endpoint accepts unauthenticated requests by + default — Bot Framework normally validates inbound calls via + the JWT in the ``Authorization`` header (see Microsoft's + bot framework auth docs). 
The prototype intentionally does + NOT ship a built-in JWT validator (key rotation, OpenID + config caching, etc. are out of scope); plug your own + validator here, or terminate auth in front of the channel + (e.g. APIM, Application Gateway). When no credentials AND + no validator are configured the channel logs a loud + warning at startup so the dev-mode bypass cannot + accidentally ship. + service_url_allowed_hosts: Host (or host suffix) allow-list the + channel will POST a bearer token to. Defaults to the public + Bot Framework host suffixes (``botframework.com`` and + ``smba.trafficmanager.net``). An inbound activity claiming a + ``serviceUrl`` outside this set is rejected — without this + gate a malicious caller could redirect outbound replies (and + the attached bearer token) to an attacker-controlled host. + Pass an extended tuple for sovereign clouds or private + deployments; pass ``()`` to disable the check entirely + (only safe with strong inbound auth). """ if app_password and certificate_path: raise ValueError("ActivityProtocolChannel: pass either app_password or certificate_path, not both.") @@ -210,6 +255,8 @@ def __init__( self._stream_default = stream self._stream_transform_hook = stream_transform_hook self._stream_edit_min_interval = stream_edit_min_interval + self._inbound_auth_validator = inbound_auth_validator + self._service_url_allowed_hosts = tuple(h.lower().lstrip(".") for h in service_url_allowed_hosts) self._ctx: ChannelContext | None = None self._http: httpx.AsyncClient | None = None @@ -250,6 +297,12 @@ async def _on_startup(self) -> None: When no Bot Framework credential is configured we log a loud warning — outbound replies will not authenticate, which is only acceptable against the local Bot Framework Emulator. 
+ + When no inbound auth validator is configured we also log a loud + warning so the dev-mode bypass cannot accidentally ship to + production: Bot Framework normally validates inbound requests via + a JWT in ``Authorization``; without that gate any caller that can + reach the webhook can drive the bot. """ if self._http is None: self._http = httpx.AsyncClient(timeout=30.0) @@ -267,6 +320,14 @@ async def _on_startup(self) -> None: cred_kind, self._tenant_id, ) + if self._inbound_auth_validator is None: + logger.warning( + "ActivityProtocolChannel %s/messages has no inbound_auth_validator — " + "the webhook will accept ANY caller. Plug an inbound_auth_validator " + "or terminate auth in front of the channel before exposing this " + "endpoint to a public network.", + self.path, + ) async def _on_shutdown(self) -> None: """Close the HTTP client and best-effort close the credential. @@ -303,16 +364,44 @@ def _auth_headers(self, token: str | None) -> dict[str, str]: # -- request handling -------------------------------------------------- # + def _is_service_url_allowed(self, service_url: str | None) -> bool: + """Return ``True`` if ``service_url`` host matches the allow-list.""" + if not self._service_url_allowed_hosts: + return True + if not service_url: + return False + try: + host = (urlparse(service_url).hostname or "").lower() + except Exception: + return False + if not host: + return False + return any(host == allowed or host.endswith(f".{allowed}") for allowed in self._service_url_allowed_hosts) + async def _handle(self, request: Request) -> Response: """Bot Framework webhook entry point. Only ``message`` activities are processed; ``conversationUpdate``, ``invoke``, ``typing`` and other activity types are silently - acknowledged. The webhook always returns 200 (or 202 for ignored - types) so Bot Framework can dequeue the activity even if our - downstream processing fails — failures are logged and re-tried by - the user, not by Teams. + acknowledged. 
Auth-rejected requests return 401, malformed JSON + returns 400, and serviceUrl outside the allow-list returns 400. + + For *transient* outbound failures (network error / non-2xx from + Bot Service / token acquisition failure) we surface 502 so Bot + Service retries the inbound activity. Non-transient failures + (parsing errors, validation errors, deterministic agent crashes) + return 200 so Bot Service does not retry the same broken + activity in a loop. """ + if self._inbound_auth_validator is not None: + try: + allowed = await self._inbound_auth_validator(request) + except Exception: + logger.exception("ActivityProtocolChannel inbound_auth_validator raised; rejecting request") + return JSONResponse({"error": "unauthorized"}, status_code=401) + if not allowed: + return JSONResponse({"error": "unauthorized"}, status_code=401) + try: activity = await request.json() except Exception: @@ -323,10 +412,27 @@ async def _handle(self, request: Request) -> Response: if activity.get("type") != "message": return JSONResponse({}, status_code=202) + service_url = activity.get("serviceUrl") + if not self._is_service_url_allowed(service_url if isinstance(service_url, str) else None): + logger.warning( + "ActivityProtocolChannel rejecting activity with serviceUrl=%r (not in allow-list)", + service_url, + ) + return JSONResponse({"error": "serviceUrl not allowed"}, status_code=400) + try: await self._process_activity(activity) + except (httpx.HTTPError, _OutboundError): + # Transient outbound failure (network error, non-2xx from Bot + # Service, token acquisition error). Surface 502 so Bot + # Service retries the inbound activity rather than dropping it. 
+ logger.exception("ActivityProtocolChannel outbound transient failure — signalling Bot Service to retry") + return JSONResponse({"error": "upstream failure"}, status_code=502) except Exception: - logger.exception("Teams activity processing failed") + # Deterministic / agent-side failure: 200 so Bot Service does + # not retry the same broken activity in a loop. Operator picks + # the failure up via logs / telemetry. + logger.exception("ActivityProtocolChannel activity processing failed") # Bot Framework expects 200 OK to dequeue the activity. return JSONResponse({}, status_code=200) @@ -400,28 +506,47 @@ async def _stream_to_conversation( inbound: Mapping[str, Any], stream: ResponseStream[AgentResponseUpdate, AgentResponse], ) -> None: - """Iterate the stream and progressively edit a single Teams activity.""" + """Iterate the stream and progressively edit a single Teams activity. + + If the initial placeholder POST fails we fall back to buffering + the whole stream and POSTing a single final message at the end. + Without that fallback the edit-loop's exit condition + ``accumulated == last_sent`` is unreachable while ``activity_id`` + is ``None`` (no PUT possible), and the worker would deadlock + forever on ``wake.wait()`` after ``worker_done`` is set. 
+ """ accumulated = "" last_sent = "" last_edit_at = 0.0 activity_id: str | None = None + placeholder_ok = False worker_done = asyncio.Event() wake = asyncio.Event() async def send_initial_placeholder() -> None: - nonlocal activity_id, last_edit_at + nonlocal activity_id, last_edit_at, placeholder_ok try: activity_id = await self._send_message(inbound, "…") last_edit_at = time.monotonic() - except Exception: # pragma: no cover - logger.exception("Teams placeholder send failed") + placeholder_ok = activity_id is not None + except Exception: + logger.exception( + "Activity placeholder send failed — falling back to single final POST", + ) + placeholder_ok = False async def edit_worker() -> None: nonlocal last_sent, last_edit_at + # When the placeholder failed we have no activity_id to PUT + # into; the loop's only useful work is exiting cleanly. Skip + # straight to that — the final flush below will POST the + # accumulated text in one shot. + if not placeholder_ok: + return while not (worker_done.is_set() and accumulated == last_sent): await wake.wait() wake.clear() - if activity_id is None or accumulated == last_sent: + if accumulated == last_sent: continue elapsed = time.monotonic() - last_edit_at if elapsed < self._stream_edit_min_interval: @@ -434,9 +559,9 @@ async def edit_worker() -> None: if snapshot == last_sent: continue try: - await self._update_activity(inbound, activity_id, snapshot) + await self._update_activity(inbound, activity_id or "", snapshot) except Exception: # pragma: no cover - logger.exception("Teams interim edit failed") + logger.exception("Activity interim edit failed") last_sent = snapshot last_edit_at = time.monotonic() @@ -457,14 +582,14 @@ async def edit_worker() -> None: accumulated += chunk wake.set() except Exception: - logger.exception("Teams streaming consumption failed") + logger.exception("Activity streaming consumption failed") finally: worker_done.set() wake.set() try: await edit_task except Exception: # pragma: no cover - 
logger.exception("Teams edit worker crashed") + logger.exception("Activity edit worker crashed") try: await stream.get_final_response() @@ -472,19 +597,26 @@ async def edit_worker() -> None: logger.exception("Stream finalize failed") # Final flush — make sure the user sees everything that arrived after - # the worker's last edit. - if activity_id is not None and accumulated and accumulated != last_sent: + # the worker's last edit. If the placeholder failed we POST a fresh + # activity here with whatever accumulated. + if not placeholder_ok: + text = accumulated or "(no response)" + try: + await self._send_message(inbound, text) + except Exception: # pragma: no cover + logger.exception("Activity fallback final send failed") + elif activity_id is not None and accumulated and accumulated != last_sent: try: await self._update_activity(inbound, activity_id, accumulated) except Exception: # pragma: no cover - logger.exception("Teams final edit failed") + logger.exception("Activity final edit failed") elif not accumulated and activity_id is not None: # No text streamed — replace the placeholder with a stub so the # user isn't left staring at "…". 
try: await self._update_activity(inbound, activity_id, "(no response)") except Exception: # pragma: no cover - logger.exception("Teams placeholder replace failed") + logger.exception("Activity placeholder replace failed") # -- Bot Framework REST helpers --------------------------------------- # diff --git a/python/packages/hosting-activity-protocol/tests/test_channel.py b/python/packages/hosting-activity-protocol/tests/test_channel.py index 64208d6902..b756afe052 100644 --- a/python/packages/hosting-activity-protocol/tests/test_channel.py +++ b/python/packages/hosting-activity-protocol/tests/test_channel.py @@ -150,8 +150,10 @@ def test_message_missing_serviceurl_is_dropped(self) -> None: bad.pop("serviceUrl") with TestClient(host.app) as client: r = client.post("/activity/messages", json=bad) - # Bot Framework still expects 200 to dequeue. - assert r.status_code == 200 + # No serviceUrl → fails the allow-list check (None doesn't match + # any allowed host suffix), surfaced as 400 so a misconfigured + # caller knows the activity was structurally invalid. 
+ assert r.status_code == 400 assert not agent.runs @@ -180,3 +182,250 @@ def test_rejects_both_secret_and_certificate(self) -> None: def test_dev_mode_no_credential(self) -> None: ch = ActivityProtocolChannel() assert ch._credential is None + + +class TestServiceUrlAllowList: + """``serviceUrl`` is supplied by the inbound activity and the channel + POSTs a real bearer token to it — anything outside the Bot Framework + host suffixes must be rejected so a malicious caller can't redirect + outbound replies to an attacker-controlled host.""" + + def test_default_allows_smba_trafficmanager(self) -> None: + ch = ActivityProtocolChannel() + assert ch._is_service_url_allowed("https://smba.trafficmanager.net/amer/") + assert ch._is_service_url_allowed("https://emea.smba.trafficmanager.net/") + assert ch._is_service_url_allowed("https://api.botframework.com/") + + def test_default_rejects_arbitrary_host(self) -> None: + ch = ActivityProtocolChannel() + assert not ch._is_service_url_allowed("https://attacker.example.com/") + assert not ch._is_service_url_allowed("https://botframework.com.attacker.com/") + assert not ch._is_service_url_allowed("") + assert not ch._is_service_url_allowed(None) + + def test_custom_allowlist(self) -> None: + ch = ActivityProtocolChannel(service_url_allowed_hosts=("internal.contoso.com",)) + assert ch._is_service_url_allowed("https://internal.contoso.com/v3/") + assert ch._is_service_url_allowed("https://eu.internal.contoso.com/") + assert not ch._is_service_url_allowed("https://smba.trafficmanager.net/") + + def test_empty_allowlist_disables_check(self) -> None: + ch = ActivityProtocolChannel(service_url_allowed_hosts=()) + assert ch._is_service_url_allowed("https://anywhere.example.org/") + + def test_webhook_rejects_disallowed_serviceurl(self) -> None: + ch, agent = _make_teams() + host = AgentFrameworkHost(target=agent, channels=[ch]) + bad = dict(_VALID_ACTIVITY) + bad["serviceUrl"] = "https://attacker.example.com/v3/" + with 
TestClient(host.app) as client: + r = client.post("/activity/messages", json=bad) + assert r.status_code == 400 + assert not agent.runs + # No outbound POST attempted with a bearer token. + assert ch._http is not None + ch._http.post.assert_not_called() # type: ignore[attr-defined] + + +class TestInboundAuthValidator: + def test_allow_passes_through(self) -> None: + async def allow(_req: Any) -> bool: + return True + + ch, agent = _make_teams() + ch._inbound_auth_validator = allow + host = AgentFrameworkHost(target=agent, channels=[ch]) + with TestClient(host.app) as client: + r = client.post("/activity/messages", json=_VALID_ACTIVITY) + assert r.status_code == 200 + assert agent.runs + + def test_reject_returns_401(self) -> None: + async def deny(_req: Any) -> bool: + return False + + ch, agent = _make_teams() + ch._inbound_auth_validator = deny + host = AgentFrameworkHost(target=agent, channels=[ch]) + with TestClient(host.app) as client: + r = client.post("/activity/messages", json=_VALID_ACTIVITY) + assert r.status_code == 401 + assert not agent.runs + + def test_validator_raises_returns_401(self) -> None: + async def boom(_req: Any) -> bool: + raise RuntimeError("validator broke") + + ch, agent = _make_teams() + ch._inbound_auth_validator = boom + host = AgentFrameworkHost(target=agent, channels=[ch]) + with TestClient(host.app) as client: + r = client.post("/activity/messages", json=_VALID_ACTIVITY) + assert r.status_code == 401 + assert not agent.runs + + +@pytest.mark.asyncio +class TestOutboundAuthHeader: + async def test_no_credential_sends_no_authorization_header(self) -> None: + ch, _agent = _make_teams() + # Default _make_teams has no credential — dev mode. 
+ await ch._send_message(_VALID_ACTIVITY, "hi") + assert ch._http is not None + headers = ch._http.post.call_args[1]["headers"] # type: ignore[attr-defined] + assert "Authorization" not in headers + + async def test_with_credential_sends_bearer_token(self) -> None: + ch, _agent = _make_teams() + # Inject a fake credential with a fixed token. + token_obj = MagicMock() + token_obj.token = "tok-abc123" + cred = MagicMock() + cred.get_token = AsyncMock(return_value=token_obj) + ch._credential = cred # type: ignore[assignment] + await ch._send_message(_VALID_ACTIVITY, "hi") + assert ch._http is not None + headers = ch._http.post.call_args[1]["headers"] # type: ignore[attr-defined] + assert headers.get("Authorization") == "Bearer tok-abc123" + + +class TestRetrySignal: + """Distinguish transient outbound failures (network / 5xx) — which + must surface 502 so Bot Service retries — from deterministic agent + failures (which must return 200 to avoid retry loops).""" + + def test_outbound_http_error_returns_502(self) -> None: + import httpx as _httpx + + ch, agent = _make_teams() + # Make _send_message raise a transient httpx error. 
+ assert ch._http is not None + ch._http.post = AsyncMock(side_effect=_httpx.ConnectError("nope")) # type: ignore[attr-defined] + host = AgentFrameworkHost(target=agent, channels=[ch]) + with TestClient(host.app) as client: + r = client.post("/activity/messages", json=_VALID_ACTIVITY) + assert r.status_code == 502 + + def test_deterministic_agent_failure_returns_200(self) -> None: + ch, agent = _make_teams() + + def boom(messages: Any = None, *, stream: bool = False, **kwargs: Any) -> Any: + async def _coro() -> Any: + raise ValueError("agent crashed") + + return _coro() + + agent.run = boom # type: ignore[assignment] + host = AgentFrameworkHost(target=agent, channels=[ch]) + with TestClient(host.app) as client: + r = client.post("/activity/messages", json=_VALID_ACTIVITY) + # Deterministic failure → 200 (Bot Service does not retry the same + # broken activity in a loop). + assert r.status_code == 200 + + +@pytest.mark.asyncio +class TestStreaming: + async def test_stream_sends_placeholder_and_edits(self) -> None: + ch, _agent = _make_teams(stream=True) + + # Build a fake stream that emits two text chunks then finalizes. + @dataclass + class _Up: + text: str + + class _Stream: + def __init__(self) -> None: + self._chunks = ["hel", "lo"] + + def __aiter__(self) -> Any: + async def gen() -> Any: + for c in self._chunks: + yield _Up(c) + + return gen() + + async def get_final_response(self) -> Any: + return _FakeAgentResponse(text="hello") + + # Use a tight throttle so the test doesn't sit on `wait_for`. + ch._stream_edit_min_interval = 0.0 + await ch._stream_to_conversation(_VALID_ACTIVITY, _Stream()) # type: ignore[arg-type] + assert ch._http is not None + # Placeholder POST + at least one final PUT. + ch._http.post.assert_called() # type: ignore[attr-defined] + ch._http.put.assert_called() # type: ignore[attr-defined] + # Final edit body carries the full accumulated text. 
+ last_put_body = ch._http.put.call_args[1]["json"] # type: ignore[attr-defined] + assert last_put_body["text"] == "hello" + + async def test_stream_placeholder_failure_falls_back_to_single_post(self) -> None: + # The bug: when send_initial_placeholder fails, activity_id stays + # None, the edit_worker can never reach its exit condition + # (`accumulated == last_sent` while no PUT possible) and the + # whole conversation deadlocks. After the fix we fall back to + # buffering the stream and POSTing a single final activity. + ch, _agent = _make_teams(stream=True) + # Make the FIRST POST (placeholder) raise; subsequent POST (final + # fallback) succeeds. + import httpx as _httpx + + ok_response = MagicMock() + ok_response.raise_for_status = MagicMock() + ok_response.json = MagicMock(return_value={"id": "act-final"}) + ok_response.content = b"{}" + post_mock = AsyncMock(side_effect=[_httpx.HTTPError("boom"), ok_response]) + assert ch._http is not None + ch._http.post = post_mock # type: ignore[attr-defined] + + @dataclass + class _Up: + text: str + + class _Stream: + def __aiter__(self) -> Any: + async def gen() -> Any: + yield _Up("partial-1") + yield _Up("-partial-2") + + return gen() + + async def get_final_response(self) -> Any: + return _FakeAgentResponse(text="partial-1-partial-2") + + ch._stream_edit_min_interval = 0.0 + # Should NOT hang. Use asyncio.wait_for with a small timeout to + # guard the test against future regressions of the deadlock. + import asyncio as _asyncio + + await _asyncio.wait_for( + ch._stream_to_conversation(_VALID_ACTIVITY, _Stream()), # type: ignore[arg-type] + timeout=2.0, + ) + # Two POSTs total: placeholder (failed) + fallback final. + assert post_mock.await_count == 2 + # Fallback POST contains the full accumulated text. 
+ fallback_body = post_mock.call_args[1]["json"] + assert fallback_body["text"] == "partial-1-partial-2" + + async def test_stream_with_no_text_replaces_placeholder(self) -> None: + ch, _agent = _make_teams(stream=True) + + class _EmptyStream: + def __aiter__(self) -> Any: + async def gen() -> Any: + if False: + yield None # type: ignore[unreachable] + + return gen() + + async def get_final_response(self) -> Any: + return _FakeAgentResponse(text="") + + ch._stream_edit_min_interval = 0.0 + await ch._stream_to_conversation(_VALID_ACTIVITY, _EmptyStream()) # type: ignore[arg-type] + # The placeholder PUT-replaces with "(no response)" so the user + # isn't left staring at "…". + assert ch._http is not None + last_put_body = ch._http.put.call_args[1]["json"] # type: ignore[attr-defined] + assert last_put_body["text"] == "(no response)"