From c4b681e26b820b89fbf96a600f350f85c8a1cba0 Mon Sep 17 00:00:00 2001
From: eavanvalkenburg <github@vanvalkenburg.eu>
Date: Thu, 2 Jul 2026 16:45:08 +0200
Subject: [PATCH 1/7] Add Python hosting protocol helper surface

Introduce AgentFrameworkState and SessionStore for app-owned hosting routes, add Responses run conversion/rendering helpers, and update the local Responses sample to use native FastAPI routing with streaming support.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 python/packages/hosting-responses/README.md   |  50 +-
 .../__init__.py                               |  10 +
 .../_parsing.py                               | 785 +++++++++++++++++-
 .../tests/hosting_responses/test_parsing.py   | 129 +++
 python/packages/hosting/README.md             | 120 +--
 .../agent_framework_hosting/__init__.py       |   5 +
 .../hosting/agent_framework_hosting/_state.py | 222 +++++
 .../hosting/tests/hosting/test_state.py       | 138 +++
 .../samples/04-hosting/af-hosting/README.md   |   2 +-
 .../af-hosting/local_responses/README.md      |  44 +-
 .../af-hosting/local_responses/app.py         | 153 ++--
 .../local_responses/call_server_af.py         |  14 +-
 .../af-hosting/local_responses/pyproject.toml |   3 +-
 13 files changed, 1471 insertions(+), 204 deletions(-)
 create mode 100644 python/packages/hosting/agent_framework_hosting/_state.py
 create mode 100644 python/packages/hosting/tests/hosting/test_state.py

diff --git a/python/packages/hosting-responses/README.md b/python/packages/hosting-responses/README.md
index ae03d364af3..956d59f516f 100644
--- a/python/packages/hosting-responses/README.md
+++ b/python/packages/hosting-responses/README.md
@@ -1,21 +1,49 @@
 # agent-framework-hosting-responses
 
-OpenAI Responses-shaped channel for `agent-framework-hosting`.
+OpenAI Responses-shaped helpers for app-owned Agent Framework hosting.
 
-Exposes a single `POST /responses` endpoint that accepts the OpenAI
-Responses API request body and returns either a Responses-shaped JSON
-body or a Server-Sent-Events stream when `stream=True`.
+This package provides the Responses-specific conversion layer:
+
+- `responses_to_run(...)` — convert a Responses request body into Agent
+  Framework run values.
+- `responses_session_id(...)` — extract a prior `resp_*` response id or
+  `conv_*` conversation id from the request body when present.
+- `create_response_id(...)` — mint a Responses-shaped response id.
+- `responses_from_run(...)` — convert an `AgentResponse` into a
+  Responses-compatible JSON payload.
+- `responses_stream_events_from_run(...)` — convert an Agent Framework
+  `ResponseStream` into Responses-compatible SSE events.
+
+Your web framework code (FastAPI, Starlette, Django, Azure Functions, ...) owns route
+registration, authentication, status codes, response construction, and background work.
 
 ```python
-from agent_framework.openai import OpenAIChatClient
-from agent_framework_hosting import AgentFrameworkHost
-from agent_framework_hosting_responses import ResponsesChannel
+from agent_framework_hosting import AgentFrameworkState, SessionStore
+from agent_framework_hosting_responses import (
+    create_response_id,
+    responses_from_run,
+    responses_session_id,
+    responses_to_run,
+)
+from fastapi import Body, FastAPI
+from fastapi.responses import JSONResponse
+
+app = FastAPI()
+state = AgentFrameworkState(agent, session_store=SessionStore)  # agent: your Agent Framework agent, built elsewhere
 
-agent = OpenAIChatClient().as_agent(name="Assistant")
 
-host = AgentFrameworkHost(target=agent, channels=[ResponsesChannel()])
-host.serve(port=8000)
+@app.post("/responses")
+async def responses(body: dict = Body(...)) -> JSONResponse:
+    run = responses_to_run(body)
+    session_id = responses_session_id(body)
+    response_id = create_response_id()
+    result = await (await state.get_target()).run(
+        run["messages"],
+        session=await state.get_session(session_id or response_id),
+        options=run["options"],
+    )
+    return JSONResponse(responses_from_run(result, response_id=response_id, session_id=session_id))
 ```
 
-The base host plumbing lives in
+The base execution-state helpers live in
 [`agent-framework-hosting`](https://pypi.org/project/agent-framework-hosting/).
diff --git a/python/packages/hosting-responses/agent_framework_hosting_responses/__init__.py b/python/packages/hosting-responses/agent_framework_hosting_responses/__init__.py
index cd221b56824..eea77e876a8 100644
--- a/python/packages/hosting-responses/agent_framework_hosting_responses/__init__.py
+++ b/python/packages/hosting-responses/agent_framework_hosting_responses/__init__.py
@@ -6,9 +6,14 @@
 
 from ._channel import ResponsesChannel
 from ._parsing import (
+    create_response_id,
     messages_from_responses_input,
     parse_responses_identity,
     parse_responses_request,
+    responses_from_run,
+    responses_session_id,
+    responses_stream_events_from_run,
+    responses_to_run,
 )
 
 try:
@@ -19,7 +24,12 @@
 __all__ = [
     "ResponsesChannel",
     "__version__",
+    "create_response_id",
     "messages_from_responses_input",
     "parse_responses_identity",
     "parse_responses_request",
+    "responses_from_run",
+    "responses_session_id",
+    "responses_stream_events_from_run",
+    "responses_to_run",
 ]
diff --git a/python/packages/hosting-responses/agent_framework_hosting_responses/_parsing.py b/python/packages/hosting-responses/agent_framework_hosting_responses/_parsing.py
index fa742c55563..72c8d632118 100644
--- a/python/packages/hosting-responses/agent_framework_hosting_responses/_parsing.py
+++ b/python/packages/hosting-responses/agent_framework_hosting_responses/_parsing.py
@@ -15,11 +15,30 @@
 
 from __future__ import annotations
 
-from collections.abc import Mapping
+import json
+import time
+import uuid
+from collections.abc import AsyncIterator, Mapping, Sequence
 from typing import Any, cast
 
-from agent_framework import Content, Message
-from agent_framework_hosting import ChannelIdentity, ChannelSession
+from agent_framework import AgentResponse, AgentResponseUpdate, ChatOptions, Content, Message, ResponseStream
+from agent_framework_hosting import AgentRunArgs, ChannelIdentity, ChannelSession
+from openai.types.responses import (
+    Response as OpenAIResponse,
+)
+from openai.types.responses import (
+    ResponseFunctionToolCall,
+    ResponseFunctionToolCallOutputItem,
+    ResponseInputFile,
+    ResponseInputImage,
+    ResponseInputText,
+    ResponseOutputItem,
+    ResponseOutputMessage,
+    ResponseOutputText,
+)
+from pydantic import TypeAdapter, ValidationError
+
+_RESPONSE_OUTPUT_ITEM_ADAPTER: TypeAdapter[Any] = TypeAdapter(ResponseOutputItem)
 
 # OpenAI Responses field name → Agent Framework ChatOptions field name.
 _RESPONSES_OPTION_REMAP = {
@@ -29,6 +48,7 @@
 # Fields the Responses transport owns; they are consumed separately and must
 # not also appear in options.
 _RESPONSES_TRANSPORT_KEYS = frozenset({"input", "stream", "previous_response_id"})
+_RESPONSES_RUN_TRANSPORT_KEYS = frozenset({"input", "stream", "previous_response_id", "conversation_id"})
 
 
 def parse_responses_identity(body: Mapping[str, Any], channel_name: str) -> ChannelIdentity | None:
@@ -149,8 +169,767 @@ def parse_responses_request(
     return messages, options, session
 
 
+def create_response_id() -> str:
+    """Create a Responses-shaped response id."""
+    return f"resp_{uuid.uuid4().hex}"
+
+
+def responses_session_id(body: Mapping[str, Any]) -> str | None:
+    """Return the Responses session id from request body, if present.
+
+    ``previous_response_id`` (normally ``resp_*``) takes precedence over
+    ``conversation_id`` (normally ``conv_*``); prefixes are not validated here.
+    Callers choose whether this request-derived value is trusted for their route and deployment.
+
+    Args:
+        body: OpenAI Responses-shaped request body.
+
+    Returns:
+        Previous response id, conversation id, or ``None``.
+    """
+    previous_response_id = body.get("previous_response_id")
+    if isinstance(previous_response_id, str) and previous_response_id:
+        return previous_response_id
+    conversation_id = body.get("conversation_id")
+    if isinstance(conversation_id, str) and conversation_id:
+        return conversation_id
+    return None
+
+
+def responses_to_run(body: Mapping[str, Any]) -> AgentRunArgs:
+    """Convert a Responses request body into Agent Framework run values.
+
+    Args:
+        body: OpenAI Responses-shaped request body.
+
+    Returns:
+        Arguments corresponding to ``Agent.run``.
+
+    Raises:
+        ValueError: If the request body has invalid ``input``.
+    """
+    messages = messages_from_responses_input(body.get("input"))
+    options: dict[str, Any] = {}
+    for key, value in body.items():
+        if key in _RESPONSES_RUN_TRANSPORT_KEYS or value is None:
+            continue
+        options[_RESPONSES_OPTION_REMAP.get(key, key)] = value
+    return AgentRunArgs(
+        messages=messages,
+        options=cast("ChatOptions[Any]", options),
+        stream=bool(body.get("stream", False)),
+    )
+
+
+def responses_from_run(
+    result: AgentResponse[Any],
+    *,
+    response_id: str,
+    session_id: str | None = None,
+) -> dict[str, Any]:
+    """Convert an Agent Framework response into a Responses payload.
+
+    Args:
+        result: Agent response returned by a run.
+
+    Keyword Args:
+        response_id: Id for the response being created.
+        session_id: Optional prior ``resp_*`` or ``conv_*`` session id. Only an
+            id starting with ``conv_`` is rendered, as ``conversation.id``; any
+            other value is left out of the payload.
+
+    Returns:
+        Responses-compatible JSON payload.
+    """
+    output_items = _result_to_output_items(result, status="completed")
+    response_kwargs: dict[str, Any] = {
+        "id": response_id,
+        "object": "response",
+        "created_at": int(time.time()),
+        "status": "completed",
+        "model": _model_from_result(result),
+        "output": output_items,
+        "parallel_tool_calls": False,
+        "tool_choice": "auto",
+        "tools": [],
+        "metadata": {},
+    }
+    if session_id is not None and session_id.startswith("conv_"):
+        response_kwargs["conversation"] = {"id": session_id}
+    return _response_payload(OpenAIResponse(**response_kwargs))
+
+
+def _model_from_result(result: Any) -> str:
+    model = getattr(result, "model", None)
+    if isinstance(model, str) and model:
+        return model
+    raw = getattr(result, "raw_representation", None)
+    raw_model = getattr(raw, "model", None)
+    if isinstance(raw_model, str) and raw_model:
+        return raw_model
+    additional_properties = getattr(result, "additional_properties", None)
+    if isinstance(additional_properties, Mapping):
+        additional_model = cast(Mapping[str, Any], additional_properties).get("model")
+        if isinstance(additional_model, str) and additional_model:
+            return additional_model
+    return "agent"
+
+
+def _result_to_output_items(result: Any, *, status: str) -> list[ResponseOutputItem]:
+    """Render an agent or workflow result as Responses output items."""
+    messages = getattr(result, "messages", None)
+    if isinstance(messages, Sequence) and not isinstance(messages, (str, bytes, bytearray)):
+        return _messages_to_output_items(cast("Sequence[Any]", messages), status=status)
+
+    if isinstance(result, Message):
+        return _messages_to_output_items([result], status=status)
+    if isinstance(result, Content):
+        return _contents_to_output_items([result], status=status)
+
+    get_outputs = getattr(result, "get_outputs", None)
+    if callable(get_outputs):
+        output_items: list[ResponseOutputItem] = []
+        for output in cast("Sequence[Any]", get_outputs()):
+            output_items.extend(_output_to_output_items(output, status=status))
+        return output_items
+
+    text = getattr(result, "text", None)
+    if isinstance(text, str):
+        return _text_output_items(text, status=status)
+    return _text_output_items(_result_to_text(result), status=status)
+
+
+def _output_to_output_items(output: Any, *, status: str) -> list[ResponseOutputItem]:
+    if isinstance(output, Message):
+        return _messages_to_output_items([output], status=status)
+    if isinstance(output, Content):
+        return _contents_to_output_items([output], status=status)
+    messages = getattr(output, "messages", None)
+    if isinstance(messages, Sequence) and not isinstance(messages, (str, bytes, bytearray)):
+        return _messages_to_output_items(cast("Sequence[Any]", messages), status=status)
+    text = getattr(output, "text", None)
+    if isinstance(text, str):
+        return _text_output_items(text, status=status)
+    return _text_output_items(str(output), status=status)
+
+
+def _messages_to_output_items(messages: Sequence[Any], *, status: str) -> list[ResponseOutputItem]:
+    output_items: list[ResponseOutputItem] = []
+    message_contents: list[Content] = []
+
+    for message in messages:
+        if not isinstance(message, Message):
+            if message_contents:
+                output_items.extend(_contents_to_output_items(message_contents, status=status))
+                message_contents.clear()
+            output_items.extend(_output_to_output_items(message, status=status))
+            continue
+        message_contents.extend(message.contents)
+
+    if message_contents:
+        output_items.extend(_contents_to_output_items(message_contents, status=status))
+
+    return output_items
+
+
+def _contents_to_output_items(
+    contents: Sequence[Content],
+    *,
+    status: str,
+    seen_raw_items: dict[tuple[str, str], int] | None = None,
+) -> list[ResponseOutputItem]:
+    output_items: list[ResponseOutputItem] = []
+    message_content: list[Any] = []
+    seen: dict[tuple[str, str], int] = seen_raw_items if seen_raw_items is not None else {}
+
+    def flush_message() -> None:
+        if not message_content:
+            return
+        output_items.append(_message_output_item(message_content, status=status))
+        message_content.clear()
+
+    content_list = list(contents)
+    index = 0
+    while index < len(content_list):
+        content = content_list[index]
+        raw_item = _raw_response_output_item(content.raw_representation)
+        if raw_item is not None:
+            raw_key = _response_output_item_key(raw_item)
+            if raw_key in seen:
+                output_items[seen[raw_key]] = raw_item
+            else:
+                flush_message()
+                seen[raw_key] = len(output_items)
+                output_items.append(raw_item)
+            index += 1
+            continue
+
+        next_content = content_list[index + 1] if index + 1 < len(content_list) else None
+        if _is_matching_code_interpreter_result(content, next_content):
+            flush_message()
+            output_items.append(_code_interpreter_output_item(content, status=status, result_content=next_content))
+            index += 2
+            continue
+        if _is_matching_image_generation_result(content, next_content):
+            flush_message()
+            output_items.append(_image_generation_output_item(content, status=status, result_content=next_content))
+            index += 2
+            continue
+        if _is_matching_mcp_result(content, next_content):
+            flush_message()
+            output_items.append(_mcp_call_output_item(content, status=status, result_content=next_content))
+            index += 2
+            continue
+
+        match content.type:
+            case "text":
+                message_content.append(_message_text_content(content))
+            case "text_reasoning":
+                flush_message()
+                output_items.append(_reasoning_output_item(content, status=status))
+            case "function_call":
+                flush_message()
+                output_items.append(_function_call_output_item(content, status=status))
+            case "function_result":
+                flush_message()
+                output_items.append(_function_result_output_item(content, status=status))
+            case "code_interpreter_tool_call" | "code_interpreter_tool_result":
+                flush_message()
+                output_items.append(_code_interpreter_output_item(content, status=status))
+            case "image_generation_tool_call" | "image_generation_tool_result":
+                flush_message()
+                output_items.append(_image_generation_output_item(content, status=status))
+            case "mcp_server_tool_call":
+                flush_message()
+                output_items.append(_mcp_call_output_item(content, status=status))
+            case "mcp_server_tool_result":
+                flush_message()
+                output_items.append(_mcp_result_output_item(content, status=status))
+            case "shell_tool_call":
+                flush_message()
+                output_items.append(_shell_call_output_item(content, status=status))
+            case "shell_tool_result":
+                flush_message()
+                output_items.append(_shell_result_output_item(content, status=status))
+            case "function_approval_request":
+                flush_message()
+                output_items.append(_function_approval_request_output_item(content))
+            case "function_approval_response":
+                flush_message()
+                output_items.append(_function_approval_response_output_item(content))
+            case "data" | "uri" | "hosted_file":
+                flush_message()
+                output_items.append(_media_content_output_item(content, status=status))
+            case "error":
+                message_content.append(ResponseOutputText(type="output_text", text=str(content), annotations=[]))
+            case _:
+                flush_message()
+                output_items.extend(_text_output_items(json.dumps(content.to_dict(), default=str), status=status))
+        index += 1
+
+    flush_message()
+    return output_items
+
+
+def _is_matching_code_interpreter_result(content: Content, next_content: Content | None) -> bool:
+    return (
+        content.type == "code_interpreter_tool_call"
+        and next_content is not None
+        and next_content.type == "code_interpreter_tool_result"
+        and content.call_id == next_content.call_id
+    )
+
+
+def _is_matching_image_generation_result(content: Content, next_content: Content | None) -> bool:
+    return (
+        content.type == "image_generation_tool_call"
+        and next_content is not None
+        and next_content.type == "image_generation_tool_result"
+        and content.image_id == next_content.image_id
+    )
+
+
+def _is_matching_mcp_result(content: Content, next_content: Content | None) -> bool:
+    return (
+        content.type == "mcp_server_tool_call"
+        and next_content is not None
+        and next_content.type == "mcp_server_tool_result"
+        and content.call_id == next_content.call_id
+    )
+
+
+def _message_status(status: str) -> str:
+    return status if status in ("in_progress", "completed", "incomplete") else "incomplete"
+
+
+def _text_output_items(text: str, *, status: str, message_id: str | None = None) -> list[ResponseOutputItem]:
+    return [
+        _message_output_item(
+            [ResponseOutputText(type="output_text", text=text, annotations=[])],
+            status=status,
+            message_id=message_id,
+        )
+    ]
+
+
+def _message_output_item(content: Sequence[Any], *, status: str, message_id: str | None = None) -> ResponseOutputItem:
+    return cast(
+        ResponseOutputItem,
+        ResponseOutputMessage(
+            id=message_id or f"msg_{uuid.uuid4().hex}",
+            type="message",
+            role="assistant",
+            status=_message_status(status),  # type: ignore[arg-type]
+            content=list(content),
+        ),
+    )
+
+
+def _message_text_content(content: Content) -> Any:
+    raw_type = _raw_type(content.raw_representation)
+    if raw_type in ("output_text", "refusal"):
+        return content.raw_representation
+    return ResponseOutputText(type="output_text", text=content.text or "", annotations=[])
+
+
+def _reasoning_output_item(content: Content, *, status: str) -> ResponseOutputItem:
+    item_data: dict[str, Any] = {
+        "id": content.id or f"rs_{uuid.uuid4().hex}",
+        "type": "reasoning",
+        "summary": [],
+        "status": _message_status(status),
+    }
+    if content.text:
+        item_data["content"] = [{"type": "reasoning_text", "text": content.text}]
+    if content.protected_data:
+        item_data["encrypted_content"] = content.protected_data
+    return _response_output_item(item_data)
+
+
+def _function_call_output_item(content: Content, *, status: str) -> ResponseOutputItem:
+    return cast(
+        ResponseOutputItem,
+        ResponseFunctionToolCall(
+            id=content.additional_properties.get("fc_id") if content.additional_properties else None,
+            type="function_call",
+            call_id=content.call_id or f"call_{uuid.uuid4().hex}",
+            name=content.name or "tool",
+            arguments=_arguments_to_str(content.arguments),
+            status=_message_status(status),  # type: ignore[arg-type]
+        ),
+    )
+
+
+def _function_result_output_item(content: Content, *, status: str) -> ResponseOutputItem:
+    if content.exception:
+        output: str | list[Any] = content.exception
+    elif output_parts := _content_parts_to_input_items(content.items):
+        output = output_parts
+    elif isinstance(content.result, str):
+        output = content.result
+    elif content.result is None:
+        output = ""
+    else:
+        output = json.dumps(content.result, default=str)
+    return cast(
+        ResponseOutputItem,
+        ResponseFunctionToolCallOutputItem(
+            id=f"fcout_{uuid.uuid4().hex}",
+            type="function_call_output",
+            call_id=content.call_id or f"call_{uuid.uuid4().hex}",
+            output=output,
+            status=_message_status(status),  # type: ignore[arg-type]
+        ),
+    )
+
+
+def _code_interpreter_output_item(
+    content: Content,
+    *,
+    status: str,
+    result_content: Content | None = None,
+) -> ResponseOutputItem:
+    output_parts: list[dict[str, Any]] = []
+    outputs_value: Any = result_content.outputs if result_content is not None else content.outputs
+    if isinstance(outputs_value, Sequence) and not isinstance(outputs_value, (str, bytes, bytearray)):
+        for item in cast(Sequence[Any], outputs_value):
+            if isinstance(item, Content) and item.type == "text":
+                output_parts.append({"type": "logs", "logs": item.text or ""})
+            elif isinstance(item, Content) and item.type in ("data", "uri") and item.uri:
+                output_parts.append({"type": "image", "url": item.uri})
+
+    return _response_output_item({
+        "id": _content_item_id(content, result_content) or f"ci_{uuid.uuid4().hex}",
+        "type": "code_interpreter_call",
+        "code": _content_sequence_text(content.inputs),
+        "container_id": str(_content_property(content, result_content, "container_id") or "agent_framework"),
+        "outputs": output_parts or None,
+        "status": _code_interpreter_status(status),
+    })
+
+
+def _image_generation_output_item(
+    content: Content,
+    *,
+    status: str,
+    result_content: Content | None = None,
+) -> ResponseOutputItem:
+    result_source = result_content.outputs if result_content is not None else content.outputs
+    image_id = content.image_id or (result_content.image_id if result_content is not None else None)
+    return _response_output_item({
+        "id": image_id or f"ig_{uuid.uuid4().hex}",
+        "type": "image_generation_call",
+        "result": _image_generation_result(result_source),
+        "status": _image_generation_status(status),
+    })
+
+
+def _mcp_call_output_item(
+    content: Content,
+    *,
+    status: str,
+    result_content: Content | None = None,
+) -> ResponseOutputItem:
+    return _response_output_item({
+        "id": content.call_id or f"mcp_{uuid.uuid4().hex}",
+        "type": "mcp_call",
+        "server_label": content.server_name or "default",
+        "name": content.tool_name or "tool",
+        "arguments": _arguments_to_str(content.arguments),
+        "output": _stringify_output(result_content.output) if result_content is not None else None,
+        "status": _mcp_status(status),
+    })
+
+
+def _mcp_result_output_item(content: Content, *, status: str) -> ResponseOutputItem:
+    return _response_output_item({
+        "id": content.call_id or f"mcp_{uuid.uuid4().hex}",
+        "type": "mcp_call",
+        "server_label": content.server_name or "default",
+        "name": content.tool_name or "tool",
+        "arguments": "",
+        "output": _stringify_output(content.output),
+        "status": _mcp_status(status),
+    })
+
+
+def _shell_call_output_item(content: Content, *, status: str) -> ResponseOutputItem:
+    return _response_output_item({
+        "id": content.additional_properties.get("item_id") or f"shell_{uuid.uuid4().hex}",
+        "type": "shell_call",
+        "call_id": content.call_id or f"call_{uuid.uuid4().hex}",
+        "action": {
+            "commands": content.commands or [],
+            "timeout_ms": content.timeout_ms,
+            "max_output_length": content.max_output_length,
+        },
+        "environment": {"type": "local"},
+        "status": _message_status(status),
+    })
+
+
+def _shell_result_output_item(content: Content, *, status: str) -> ResponseOutputItem:
+    outputs: list[dict[str, Any]] = []
+    outputs_value: Any = content.outputs
+    if isinstance(outputs_value, Sequence) and not isinstance(outputs_value, (str, bytes, bytearray)):
+        for item in cast(Sequence[Any], outputs_value):
+            if not isinstance(item, Content):
+                continue
+            outcome = {"type": "timeout"} if item.timed_out else {"type": "exit", "exit_code": item.exit_code or 0}
+            outputs.append({"stdout": item.stdout or "", "stderr": item.stderr or "", "outcome": outcome})
+
+    return _response_output_item({
+        "id": content.additional_properties.get("item_id") or f"shellout_{uuid.uuid4().hex}",
+        "type": "shell_call_output",
+        "call_id": content.call_id or f"call_{uuid.uuid4().hex}",
+        "output": outputs,
+        "max_output_length": content.max_output_length,
+        "status": _message_status(status),
+    })
+
+
+def _function_approval_request_output_item(content: Content) -> ResponseOutputItem:
+    function_call = content.function_call
+    return _response_output_item({
+        "id": content.id or f"approval_{uuid.uuid4().hex}",
+        "type": "mcp_approval_request",
+        "server_label": (
+            function_call.additional_properties.get("server_label", "agent_framework")
+            if function_call is not None
+            else "agent_framework"
+        ),
+        "name": function_call.name if function_call is not None and function_call.name else "tool",
+        "arguments": _arguments_to_str(function_call.arguments if function_call is not None else None),
+    })
+
+
+def _function_approval_response_output_item(content: Content) -> ResponseOutputItem:
+    return _response_output_item({
+        "id": content.id or f"approval_{uuid.uuid4().hex}",
+        "type": "mcp_approval_response",
+        "approval_request_id": content.id or "",
+        "approve": bool(content.approved),
+    })
+
+
+def _media_content_output_item(content: Content, *, status: str) -> ResponseOutputItem:
+    parts = _content_parts_to_input_items([content])
+    if parts:
+        return cast(
+            ResponseOutputItem,
+            ResponseFunctionToolCallOutputItem(
+                id=f"content_{uuid.uuid4().hex}",
+                type="function_call_output",
+                call_id=f"content_{uuid.uuid4().hex}",
+                output=parts,
+                status=_message_status(status),  # type: ignore[arg-type]
+            ),
+        )
+    return _text_output_items(json.dumps(content.to_dict(), default=str), status=status)[0]
+
+
+def _content_parts_to_input_items(contents: Sequence[Content] | None) -> list[Any]:
+    if not contents:
+        return []
+
+    parts: list[Any] = []
+    for content in contents:
+        match content.type:
+            case "text":
+                parts.append(ResponseInputText(type="input_text", text=content.text or ""))
+            case "data" | "uri":
+                if not content.uri:
+                    continue
+                if _is_image_content(content):
+                    parts.append(ResponseInputImage(type="input_image", image_url=content.uri, detail="auto"))
+                else:
+                    parts.append(ResponseInputFile(type="input_file", file_url=content.uri))
+            case "hosted_file":
+                if content.file_id:
+                    parts.append(ResponseInputFile(type="input_file", file_id=content.file_id))
+            case _:
+                parts.append(ResponseInputText(type="input_text", text=json.dumps(content.to_dict(), default=str)))
+    return parts
+
+
+def _content_sequence_text(contents: Sequence[Content] | None) -> str | None:
+    if not contents:
+        return None
+    text = "".join(content.text or "" for content in contents if content.type == "text")
+    return text or None
+
+
+def _is_image_content(content: Content) -> bool:
+    media_type = content.media_type or ""
+    if media_type.startswith("image/"):
+        return True
+    return (content.uri or "").startswith("data:image/")
+
+
+def _image_generation_result(outputs: Any) -> str | None:
+    if isinstance(outputs, Content):
+        return _image_generation_content_result(outputs)
+    if isinstance(outputs, Sequence) and not isinstance(outputs, (str, bytes, bytearray)):
+        for output in cast(Sequence[Any], outputs):
+            if isinstance(output, Content) and (result := _image_generation_content_result(output)):
+                return result
+    if isinstance(outputs, str):
+        return outputs
+    return None
+
+
+def _image_generation_content_result(content: Content) -> str | None:
+    uri = content.uri
+    if not uri:
+        return None
+    if ";base64," in uri:
+        return uri.split(";base64,", 1)[1]
+    return uri
+
+
+def _content_item_id(content: Content, result_content: Content | None = None) -> str | None:
+    item_id = content.additional_properties.get("item_id")
+    if isinstance(item_id, str) and item_id:
+        return item_id
+    if result_content is not None:
+        result_item_id = result_content.additional_properties.get("item_id")
+        if isinstance(result_item_id, str) and result_item_id:
+            return result_item_id
+    return content.call_id or (result_content.call_id if result_content is not None else None)
+
+
+def _content_property(content: Content, result_content: Content | None, key: str) -> Any:
+    if key in content.additional_properties:
+        return content.additional_properties[key]
+    if result_content is not None and key in result_content.additional_properties:
+        return result_content.additional_properties[key]
+    return None
+
+
+def _code_interpreter_status(status: str) -> str:
+    if status in ("in_progress", "completed", "incomplete", "failed"):
+        return status
+    return "incomplete"
+
+
+def _image_generation_status(status: str) -> str:
+    if status in ("in_progress", "completed", "failed"):
+        return status
+    return "failed"
+
+
+def _mcp_status(status: str) -> str:
+    """Pass through recognised MCP call statuses; map anything else to ``"incomplete"``."""
+    recognised = ("in_progress", "completed", "incomplete", "failed")
+    return status if status in recognised else "incomplete"
+
+
+def _arguments_to_str(arguments: Any | None) -> str:
+    """Render call arguments as a string: ``""`` for ``None``, strings as-is, otherwise JSON."""
+    if isinstance(arguments, str):
+        return arguments
+    # Values JSON cannot encode natively are stringified via ``default=str``.
+    return "" if arguments is None else json.dumps(arguments, default=str)
+
+
+def _stringify_output(output: Any) -> str:
+    """Flatten an output to text: ``None`` -> ``""``, strings as-is, sequences joined, the rest as JSON."""
+    if output is None or isinstance(output, str):
+        return output or ""
+    is_sequence = isinstance(output, Sequence) and not isinstance(output, (bytes, bytearray))
+    if not is_sequence:
+        return json.dumps(output, default=str)
+    return "".join(map(_stringify_output, cast(Sequence[Any], output)))
+
+
+def _raw_response_output_item(raw: Any) -> ResponseOutputItem | None:
+    """Validate ``raw`` as a Responses output item; ``None`` when it has no type or fails validation."""
+    typed = _raw_type(raw) is not None
+    try:
+        return cast(ResponseOutputItem, _RESPONSE_OUTPUT_ITEM_ADAPTER.validate_python(raw)) if typed else None
+    except ValidationError:
+        return None
+
+
+def _response_output_item(value: Mapping[str, Any]) -> ResponseOutputItem:
+    return cast(ResponseOutputItem, _RESPONSE_OUTPUT_ITEM_ADAPTER.validate_python(value))  # errors are not caught here
+
+
+def _response_output_item_key(item: ResponseOutputItem) -> tuple[str, str]:
+    """Build a ``(type, identifier)`` key, using ``id(item)`` when the item has no usable id."""
+    identifier = getattr(item, "id", None) or getattr(item, "call_id", None)
+    if not (isinstance(identifier, str) and identifier):
+        identifier = str(id(item))
+    return _raw_type(item) or "unknown", identifier
+
+
+def _raw_type(raw: Any) -> str | None:
+    """Return the string ``type`` of ``raw``, or ``None`` when it has none."""
+    # A string ``type`` attribute takes precedence ...
+    found = getattr(raw, "type", None)
+    if isinstance(found, str):
+        return found
+    # ... otherwise a mapping may carry it under the "type" key.
+    found = cast(Mapping[str, Any], raw).get("type") if isinstance(raw, Mapping) else None
+    return found if isinstance(found, str) else None
+
+
+def _result_to_text(result: Any) -> str:
+    """Extract text from a run result: its ``text``, else its joined outputs, else ``str(result)``."""
+    direct = getattr(result, "text", None)
+    if isinstance(direct, str):
+        return direct
+    outputs_getter = getattr(result, "get_outputs", None)
+    pieces = map(_output_to_text, cast(Sequence[Any], outputs_getter())) if callable(outputs_getter) else None
+    return str(result) if pieces is None else "".join(pieces)
+
+
+def _output_to_text(output: Any) -> str:
+    """Return ``output.text`` when it is a string; otherwise fall back to ``str(output)``."""
+    # A missing or non-string ``text`` attribute is ignored.
+    candidate = getattr(output, "text", None)
+    return candidate if isinstance(candidate, str) else str(output)
+
+
+def _response_payload(response: OpenAIResponse) -> dict[str, Any]:
+    """Dump the response to a JSON-mode dict without ``None`` fields, truncating a float ``created_at``."""
+    dumped = response.model_dump(mode="json", exclude_none=True)
+    if isinstance(dumped.get("created_at"), float):
+        dumped["created_at"] = int(dumped["created_at"])
+    return dumped
+
+
+def _sse_event(event_type: str, payload: Mapping[str, Any]) -> str:
+    """Format one Server-Sent Event: an ``event:`` line, a ``data:`` line of compact JSON, then a blank line."""
+    return f"event: {event_type}\ndata: {_json_dumps(payload)}\n\n"
+
+
+def _json_dumps(payload: Mapping[str, Any]) -> str:
+    """Serialize a Responses SSE payload as compact JSON (``,`` and ``:`` separators without spaces)."""
+    return json.dumps(payload, separators=(",", ":"))
+
+
+async def responses_stream_events_from_run(
+    stream: ResponseStream[AgentResponseUpdate, AgentResponse[Any]],
+    *,
+    response_id: str,
+    session_id: str | None = None,
+) -> AsyncIterator[str]:
+    """Render an Agent Framework response stream as Responses-style SSE frames.
+
+    One ``response.created`` frame is emitted first, then one
+    ``response.output_text.delta`` frame per update that carries text, and
+    finally a ``response.completed`` frame built from the final response.
+
+    Args:
+        stream: Agent Framework response stream returned by ``agent.run(...,
+            stream=True)``.
+
+    Keyword Args:
+        response_id: Id for the response being created.
+        session_id: Optional prior ``resp_*`` or ``conv_*`` session id.
+
+    Yields:
+        Server-Sent Event strings.
+    """
+    created_event = "response.created"
+    delta_event = "response.output_text.delta"
+    completed_event = "response.completed"
+
+    # Placeholder response envelope announced before any update is consumed.
+    initial_response = {
+        "id": response_id,
+        "object": "response",
+        "created_at": int(time.time()),
+        "status": "in_progress",
+        "model": "agent",
+        "output": [],
+    }
+    yield _sse_event(created_event, {"type": created_event, "response": initial_response})
+
+    async for update in stream:
+        chunk = update.text
+        if not chunk:
+            # Updates without text produce no frame.
+            continue
+        yield _sse_event(delta_event, {"type": delta_event, "delta": chunk})
+
+    # The completed frame embeds the fully rendered response for the finished run.
+    finished = await stream.get_final_response()
+    rendered = responses_from_run(finished, response_id=response_id, session_id=session_id)
+    yield _sse_event(
+        completed_event,
+        {"type": completed_event, "response": rendered},
+    )
+
+
 __all__ = [
+    "create_response_id",
     "messages_from_responses_input",
     "parse_responses_identity",
     "parse_responses_request",
+    "responses_from_run",
+    "responses_session_id",
+    "responses_stream_events_from_run",
+    "responses_to_run",
 ]
diff --git a/python/packages/hosting-responses/tests/hosting_responses/test_parsing.py b/python/packages/hosting-responses/tests/hosting_responses/test_parsing.py
index bdc65058066..6fd749d898e 100644
--- a/python/packages/hosting-responses/tests/hosting_responses/test_parsing.py
+++ b/python/packages/hosting-responses/tests/hosting_responses/test_parsing.py
@@ -4,12 +4,20 @@
 
 from __future__ import annotations
 
+from collections.abc import AsyncIterator, Sequence
+
 import pytest
+from agent_framework import AgentResponse, AgentResponseUpdate, Content, Message, ResponseStream
 
 from agent_framework_hosting_responses import (
+    create_response_id,
     messages_from_responses_input,
     parse_responses_identity,
     parse_responses_request,
+    responses_from_run,
+    responses_session_id,
+    responses_stream_events_from_run,
+    responses_to_run,
 )
 
 
@@ -167,3 +175,124 @@ def test_returns_none_when_absent(self) -> None:
 
     def test_returns_none_for_non_string(self) -> None:
         assert parse_responses_identity({"safety_identifier": 42}, "responses") is None
+
+
+class TestResponsesRunHelpers:  # covers id/session helpers, request conversion, and response rendering
+    def test_create_response_id_shape(self) -> None:
+        response_id = create_response_id()
+
+        assert response_id.startswith("resp_")
+
+    def test_responses_session_id_prefers_previous_response(self) -> None:
+        assert responses_session_id({"previous_response_id": "resp_1", "conversation_id": "conv_1"}) == "resp_1"
+
+    def test_responses_session_id_uses_conversation_id(self) -> None:
+        assert responses_session_id({"conversation_id": "conv_1"}) == "conv_1"
+
+    def test_responses_session_id_returns_none_when_absent(self) -> None:
+        assert responses_session_id({"input": "hi"}) is None
+
+    def test_responses_to_run_returns_messages_options_and_stream(self) -> None:
+        run = responses_to_run({
+            "input": "hi",
+            "stream": True,
+            "previous_response_id": "resp_1",
+            "conversation_id": "conv_1",
+            "max_output_tokens": 32,
+            "model": "gpt-x",
+        })
+
+        assert run["messages"][0].text == "hi"
+        assert run["stream"] is True
+        assert run["options"] == {"max_tokens": 32, "model": "gpt-x"}  # max_output_tokens -> max_tokens
+
+    def test_responses_from_run_returns_response_payload(self) -> None:
+        result = AgentResponse(
+            messages=Message(role="assistant", contents=[Content.from_text("hello")]),
+            additional_properties={"model": "test-model"},
+        )
+
+        payload = responses_from_run(result, response_id="resp_new")
+
+        assert payload["id"] == "resp_new"
+        assert payload["model"] == "test-model"
+        assert payload["output"][0]["content"][0]["text"] == "hello"
+
+    def test_responses_from_run_preserves_multimodal_output_items(self) -> None:
+        result = AgentResponse(
+            messages=Message(
+                role="assistant",
+                contents=[
+                    Content.from_text_reasoning(id="rs_1", text="checking"),
+                    Content.from_function_call("call_1", "collect_media", arguments={"city": "Seattle"}),
+                    Content.from_function_result(
+                        "call_1",
+                        result=[
+                            Content.from_text("caption"),
+                            Content.from_uri("https://example.com/cat.png", media_type="image/png"),
+                            Content.from_hosted_file("file_pdf", media_type="application/pdf"),
+                        ],
+                    ),
+                    Content.from_text("done"),
+                ],
+            )
+        )
+
+        payload = responses_from_run(result, response_id="resp_new")
+
+        output = payload["output"]
+        assert [item["type"] for item in output] == [  # one output item per content, in content order
+            "reasoning",
+            "function_call",
+            "function_call_output",
+            "message",
+        ]
+        assert output[0]["content"][0]["text"] == "checking"
+        assert output[1]["name"] == "collect_media"
+        assert output[1]["arguments"] == '{"city": "Seattle"}'  # dict arguments arrive JSON-encoded
+        assert output[2]["output"] == [
+            {"text": "caption", "type": "input_text"},
+            {"detail": "auto", "type": "input_image", "image_url": "https://example.com/cat.png"},
+            {"type": "input_file", "file_id": "file_pdf"},
+        ]
+        assert output[3]["content"][0]["text"] == "done"
+
+    def test_responses_from_run_maps_conversation_session(self) -> None:
+        result = AgentResponse(messages=Message(role="assistant", contents=[Content.from_text("hello")]))
+
+        payload = responses_from_run(result, response_id="resp_new", session_id="conv_1")
+
+        assert payload["conversation"] == {"id": "conv_1"}  # the ``conv_1`` session id is echoed here
+
+    def test_responses_from_run_omits_previous_response_session(self) -> None:
+        result = AgentResponse(messages=Message(role="assistant", contents=[Content.from_text("hello")]))
+
+        payload = responses_from_run(result, response_id="resp_new", session_id="resp_1")
+
+        assert "conversation" not in payload  # the ``resp_1`` session id is not echoed as a conversation
+
+    async def test_responses_stream_events_from_run(self) -> None:
+        async def updates() -> AsyncIterator[AgentResponseUpdate]:
+            yield AgentResponseUpdate(contents=[Content.from_text("hel")], role="assistant")
+            yield AgentResponseUpdate(contents=[Content.from_text("lo")], role="assistant")
+
+        def finalizer(items: Sequence[AgentResponseUpdate]) -> AgentResponse:
+            return AgentResponse.from_updates(items)
+
+        stream = ResponseStream(updates(), finalizer=finalizer)
+
+        events = [
+            event
+            async for event in responses_stream_events_from_run(
+                stream,
+                response_id="resp_new",
+                session_id="conv_1",
+            )
+        ]
+
+        assert events[0].startswith("event: response.created")
+        assert "response.output_text.delta" in events[1]  # one delta event per text update
+        assert "hel" in events[1]
+        assert "lo" in events[2]
+        assert events[-1].startswith("event: response.completed")
+        assert '"conversation":{"id":"conv_1"}' in events[-1]  # compact JSON, no spaces after separators
diff --git a/python/packages/hosting/README.md b/python/packages/hosting/README.md
index d08be242d1f..944325b95c1 100644
--- a/python/packages/hosting/README.md
+++ b/python/packages/hosting/README.md
@@ -1,122 +1,40 @@
 # agent-framework-hosting
 
-Multi-channel hosting for Microsoft Agent Framework agents.
+Shared execution-state helpers for app-owned Agent Framework hosting.
 
-`agent-framework-hosting` lets you serve a single agent or workflow target
-through one or more **channels**. The host owns one Starlette ASGI app,
-route/lifecycle composition, and per-`isolation_key` session resolution.
-Each channel owns its protocol parsing and response rendering.
+This package keeps Agent Framework state separate from web-framework concerns:
 
-The base package contains only channel-neutral plumbing:
+- `AgentFrameworkState` — stores an agent/workflow target and optional session
+  state for routes that the app owns.
+- `SessionStore` — maps an app-selected session id to an `AgentSession` for
+  non-persisted servers.
+- Existing experimental channel-hosting types remain available while the package
+  is unreleased, but the v1 direction is protocol helpers plus app-owned routes.
 
-- `AgentFrameworkHost` — the Starlette host.
-- `Channel` — the channel protocol.
-- `ChannelRequest` / `ChannelSession` / `ChannelIdentity` — the request
-  envelope and optional channel metadata.
-- `ChannelContext` / `ChannelContribution` / `ChannelCommand` — channel-side
-  hooks for invoking the target and contributing routes, commands, and
-  lifecycle callbacks.
-- `ChannelRunHook` / `ChannelResponseHook` / `ChannelStreamUpdateHook` —
-  host-invoked customization seams.
-
-`ChannelStreamUpdateHook` applies to streamed updates only. It is not a
-substitute for final-response redaction.
-
-Concrete channels live in their own packages so you only install what you use:
-
-| Package | Transport |
-|---|---|
-| `agent-framework-hosting-responses` | OpenAI Responses API |
-
-Additional channel packages can build on the same host contract without adding
-their protocol dependencies to the base package.
-
-## Install
-
-```bash
-pip install agent-framework-hosting agent-framework-hosting-responses
-# or with Hypercorn pre-installed for the demo `host.serve(...)` helper
-pip install "agent-framework-hosting[serve]" agent-framework-hosting-responses
-# add the [disk] extra to persist reset-session aliases
-pip install "agent-framework-hosting[disk]"
-```
+Use FastAPI, Starlette, Azure Functions, Django, or another framework for route
+registration, auth, middleware, response construction, and background work.
 
 ## Quickstart
 
 ```python
 from agent_framework.openai import OpenAIChatClient
-from agent_framework_hosting import AgentFrameworkHost, Channel
+from agent_framework_hosting import AgentFrameworkState, SessionStore
 
 agent = OpenAIChatClient().as_agent(name="Assistant")
+state = AgentFrameworkState(agent, session_store=SessionStore)
 
-# Add channels from sibling packages, e.g. `agent-framework-hosting-responses`
-# exposes a `ResponsesChannel` that serves the OpenAI Responses API.
-channels: list[Channel] = []
-
-host = AgentFrameworkHost(target=agent, channels=channels)
-host.serve(port=8000)
-```
-
-## Session state and workflow checkpoints
-
-By default the host keeps live `AgentSession` objects and reset-session aliases
-in memory. Channels opt into continuity by setting
-`ChannelRequest.session = ChannelSession(isolation_key=...)`; requests with the
-same isolation key reuse the same host-created session.
-
-The host treats `isolation_key` as an opaque partition key. Each channel or
-hosting environment decides where that key comes from:
-
-- protocol headers supplied by a trusted platform,
-- request body fields such as a previous response or conversation ID,
-- route/path parameters,
-- channel-native metadata such as chat/user IDs, or
-- environment-provided context in an ephemeral host.
-
-The host should be able to carry any of those sources as long as the channel or
-platform has already authenticated and authorized the caller before passing the
-key to `ChannelSession`.
-
-The built-in request-context helper recognizes the `x-agent-user-isolation-key`
-and `x-agent-chat-isolation-key` header names because some hosting
-environments, including Foundry Hosted Agents, already use them. Reusing those
-header names does **not** mean `agent-framework-hosting` is the supported way to
-run on Foundry Hosted Agents; use `agent-framework-foundry-hosting` for that
-hosting surface.
-
-For long-running deployments that need `reset_session(...)` aliases to survive
-restart, pass `state_dir`:
-
-```python
-host = AgentFrameworkHost(
-    target=agent,
-    channels=channels,
-    state_dir="./.host-state",
-)
+session = await state.get_session("conversation-1")
+result = await (await state.get_target()).run("Hello", session=session)
 ```
 
-This creates `./.host-state/sessions/` and stores only lightweight alias
-bookkeeping. Live `AgentSession` objects are still rehydrated lazily by the
-configured history provider on the next turn.
-
-For workflow targets, `checkpoint_location=...` is the clearest way to enable
-checkpoint persistence. As a convenience, `state_dir="./.host-state"` also
-derives `./.host-state/checkpoints/` for workflow targets. Use the mapping form
-when you want only one component:
+Targets can be direct instances, synchronous factories, asynchronous factories,
+or awaitables:
 
 ```python
-from agent_framework_hosting import HostStatePaths
-
-host = AgentFrameworkHost(
-    target=workflow,
-    channels=channels,
-    state_dir=HostStatePaths(
-        sessions="/var/lib/myapp/sessions",
-        checkpoints="/var/lib/myapp/checkpoints",
-    ),
-)
+state = AgentFrameworkState(create_agent)  # cached by default
+state = AgentFrameworkState(create_agent, cache_target=False)
 ```
 
 Cross-channel identity linking, multicast delivery, background runs,
 continuation tokens, and durable delivery runners are follow-up enhancements,
-not part of this v1 host contract.
+not part of this v1 state surface.
diff --git a/python/packages/hosting/agent_framework_hosting/__init__.py b/python/packages/hosting/agent_framework_hosting/__init__.py
index ab78ccd4b9e..cb5ed5567fd 100644
--- a/python/packages/hosting/agent_framework_hosting/__init__.py
+++ b/python/packages/hosting/agent_framework_hosting/__init__.py
@@ -20,6 +20,7 @@
     reset_current_isolation_keys,
     set_current_isolation_keys,
 )
+from ._state import AgentFrameworkState, AgentRunArgs, SessionStore, WorkflowRunArgs
 from ._types import (
     Channel,
     ChannelCommand,
@@ -44,6 +45,8 @@
     "ISOLATION_HEADER_CHAT",
     "ISOLATION_HEADER_USER",
     "AgentFrameworkHost",
+    "AgentFrameworkState",
+    "AgentRunArgs",
     "Channel",
     "ChannelCommand",
     "ChannelCommandContext",
@@ -58,6 +61,8 @@
     "HostStatePaths",
     "HostedRunResult",
     "IsolationKeys",
+    "SessionStore",
+    "WorkflowRunArgs",
     "__version__",
     "get_current_isolation_keys",
     "logger",
diff --git a/python/packages/hosting/agent_framework_hosting/_state.py b/python/packages/hosting/agent_framework_hosting/_state.py
new file mode 100644
index 00000000000..86b4ae49125
--- /dev/null
+++ b/python/packages/hosting/agent_framework_hosting/_state.py
@@ -0,0 +1,222 @@
+# Copyright (c) Microsoft. All rights reserved.
+
+from __future__ import annotations
+
+import inspect
+from collections.abc import Awaitable, Callable, Mapping
+from typing import Any, Generic, TypedDict, TypeVar
+
+from agent_framework import AgentRunInputs, AgentSession, ChatOptions, SupportsAgentRun, Workflow
+
+
+class SessionStore:
+    """In-memory ``AgentSession`` registry for non-persisted servers.
+
+    Sessions are keyed by an application-selected id, which the store treats
+    as an opaque partition key. Deciding whether that id came from a trusted
+    request field, platform context, or other route-local state is left to
+    the caller.
+    """
+
+    def __init__(self, agent: SupportsAgentRun) -> None:
+        """Create an empty store bound to ``agent``.
+
+        Args:
+            agent: The agent asked to create a session the first time a
+                session id is seen.
+        """
+        self._sessions: dict[str, AgentSession] = {}
+        self.agent = agent
+
+    async def get(self, session_id: str) -> AgentSession:
+        """Look up the session for ``session_id``, creating it on first use.
+
+        Args:
+            session_id: Opaque app-selected session id.
+
+        Returns:
+            The cached or newly created ``AgentSession``.
+
+        Raises:
+            ValueError: If ``session_id`` is empty.
+        """
+        if not session_id:
+            raise ValueError("session_id must be a non-empty string")
+        if session_id in self._sessions:
+            return self._sessions[session_id]
+        return self._sessions.setdefault(session_id, self.agent.create_session(session_id=session_id))
+
+    async def reset(self, session_id: str) -> None:
+        """Drop the stored session for ``session_id``; unknown ids are ignored.
+
+        Args:
+            session_id: Opaque app-selected session id.
+
+        Raises:
+            ValueError: If ``session_id`` is empty.
+        """
+        if not session_id:
+            raise ValueError("session_id must be a non-empty string")
+        self._sessions.pop(session_id, None)
+
+
+TargetT = TypeVar("TargetT", SupportsAgentRun, Workflow)  # constrained to an agent or a workflow target
+SessionStoreFactory = Callable[[SupportsAgentRun], SessionStore]  # builds a store from an agent target
+
+
+class AgentRunArgs(TypedDict):
+    """Arguments prepared for ``Agent.run``."""
+
+    messages: AgentRunInputs  # NOTE(review): presumably the run input messages - confirm against callers
+    options: ChatOptions[Any]  # NOTE(review): presumably the chat options for the run - confirm
+    stream: bool  # NOTE(review): presumably whether a streaming run is requested - confirm
+
+
+class WorkflowRunArgs(TypedDict):
+    """Arguments prepared for ``Workflow.run``."""
+
+    message: Any | None  # NOTE(review): presumably the workflow input; ``None`` is allowed by the type
+    responses: Mapping[str, Any] | None  # NOTE(review): presumably keyed replies to pending requests - confirm
+    stream: bool  # NOTE(review): presumably whether a streaming run is requested - confirm
+
+
+class AgentFrameworkState(Generic[TargetT]):
+    """Shared execution state for app-owned hosting routes.
+
+    ``AgentFrameworkState`` intentionally does not own routes, middleware,
+    protocol dispatch, or native SDK calls. Web frameworks keep those concerns;
+    this object holds the Agent Framework target and optional session store that
+    route code may share.
+    """
+
+    def __init__(
+        self,
+        target: TargetT | Awaitable[TargetT] | Callable[[], TargetT | Awaitable[TargetT]],
+        *,
+        session_store: SessionStore | type[SessionStore] | SessionStoreFactory | None = None,
+        cache_target: bool = True,
+    ) -> None:
+        """Create shared state for ``target``.
+
+        Args:
+            target: Agent or workflow target used by route code. May be a
+                target instance, a synchronous factory, an asynchronous factory,
+                or an awaitable target.
+
+        Keyword Args:
+            session_store: Existing store, store class, or factory. When omitted
+                and ``target`` is an agent, an in-memory ``SessionStore`` is
+                created. Workflow targets do not get a default session store.
+            cache_target: Whether to cache a resolved callable/awaitable target.
+                Defaults to ``True`` so expensive target setup happens once.
+
+        Raises:
+            ValueError: If ``cache_target=False`` is used with a one-shot
+                awaitable target.
+            TypeError: If any ``session_store`` is supplied for a target
+                instance that is not an agent.
+        """
+        if not cache_target and inspect.isawaitable(target):
+            raise ValueError("cache_target=False requires a target instance or callable target factory")
+        self._target_source = target
+        self._cache_target = cache_target
+        self._cached_target: TargetT | None = None
+        self._session_store_source = session_store
+        self._cached_session_store = session_store if isinstance(session_store, SessionStore) else None
+        if not callable(target) and not inspect.isawaitable(target):  # plain instance: usable without awaiting
+            self._cached_target = target
+            if self._cached_session_store is None and isinstance(target, SupportsAgentRun):
+                self._cached_session_store = self._init_session_store(target, session_store)
+            elif session_store is not None and not isinstance(target, SupportsAgentRun):
+                raise TypeError("session_store requires an agent target that supports create_session")
+
+    async def get_target(self) -> TargetT:
+        """Return the resolved target.
+
+        Returns:
+            The target instance. Callable and awaitable targets are resolved
+            first; the result is cached unless ``cache_target`` is ``False``.
+        """
+        if self._cache_target and self._cached_target is not None:
+            return self._cached_target
+
+        target = self._target_source() if callable(self._target_source) else self._target_source
+        if inspect.isawaitable(target):  # async factory result or an awaitable passed directly
+            target = await target
+        if self._cache_target:
+            self._cached_target = target
+        return target
+
+    async def get_session_store(self) -> SessionStore:
+        """Return the session store for the current target.
+
+        Returns:
+            The configured or lazily created ``SessionStore``.
+
+        Raises:
+            TypeError: If the resolved target is not an agent target.
+        """
+        if self._cached_session_store is not None:
+            return self._cached_session_store
+
+        target = await self.get_target()
+        store = self._init_session_store(target, self._session_store_source)
+        if self._cache_target:  # without caching, each call builds a store for the freshly resolved target
+            self._cached_session_store = store
+        return store
+
+    async def get_session(self, session_id: str) -> AgentSession:
+        """Return the session for ``session_id`` from the current store.
+
+        Args:
+            session_id: Opaque app-selected session id.
+
+        Returns:
+            The cached or newly created ``AgentSession``.
+        """
+        store = await self.get_session_store()
+        return await store.get(session_id)
+
+    async def reset_session(self, session_id: str) -> None:
+        """Forget the current session for ``session_id``.
+
+        Args:
+            session_id: Opaque app-selected session id.
+        """
+        store = await self.get_session_store()
+        await store.reset(session_id)
+
+    @property
+    def target(self) -> TargetT:
+        """Return a synchronously available target.
+
+        Raises:
+            RuntimeError: If the target is a callable or awaitable that has not
+                been resolved with :meth:`get_target`.
+        """
+        if self._cached_target is not None:
+            return self._cached_target
+        if not callable(self._target_source) and not inspect.isawaitable(self._target_source):
+            return self._target_source
+        raise RuntimeError("target is resolved asynchronously; use `await state.get_target()`")
+
+    @property
+    def session_store(self) -> SessionStore | None:
+        """Return a synchronously available session store, if one is cached."""
+        return self._cached_session_store
+
+    def _init_session_store(
+        self,
+        target: TargetT,
+        session_store: SessionStore | type[SessionStore] | SessionStoreFactory | None,
+    ) -> SessionStore:
+        if isinstance(session_store, SessionStore):  # an existing store is used as-is
+            return session_store
+
+        if not isinstance(target, SupportsAgentRun):
+            raise TypeError("session_store requires an agent target that supports create_session")
+
+        if session_store is None:  # default: in-memory store bound to the agent
+            return SessionStore(target)
+
+        return session_store(target)  # store class or factory, called with the agent
diff --git a/python/packages/hosting/tests/hosting/test_state.py b/python/packages/hosting/tests/hosting/test_state.py
new file mode 100644
index 00000000000..8626c6c2e44
--- /dev/null
+++ b/python/packages/hosting/tests/hosting/test_state.py
@@ -0,0 +1,138 @@
+# Copyright (c) Microsoft. All rights reserved.
+
+from __future__ import annotations
+
+from typing import Any
+
+import pytest
+from agent_framework import AgentResponse, AgentSession, Message
+
+from agent_framework_hosting import AgentFrameworkState, SessionStore
+
+
+class _FakeAgent:
+    """Minimal agent target for state tests."""
+
+    id = "fake-agent"
+    name = "Fake Agent"
+    description = "Fake agent for tests"
+
+    def __init__(self) -> None:
+        self.created_sessions: list[AgentSession] = []  # every session handed out by create_session
+
+    def create_session(self, *, session_id: str | None = None) -> AgentSession:
+        session = AgentSession(session_id=session_id)
+        self.created_sessions.append(session)  # recorded so tests can count creations
+        return session
+
+    def get_session(self, service_session_id: str, *, session_id: str | None = None) -> AgentSession:
+        return AgentSession(session_id=session_id, service_session_id=service_session_id)
+
+    async def run(self, messages: Any = None, **_: Any) -> AgentResponse:
+        return AgentResponse(messages=Message(role="assistant", contents=["ok"]))  # fixed reply; input is ignored
+
+
+class TestSessionStore:  # get/reset behaviour of the in-memory store
+    async def test_get_reuses_session_for_same_id(self) -> None:
+        agent = _FakeAgent()
+        store = SessionStore(agent)
+
+        first = await store.get("session-1")
+        second = await store.get("session-1")
+
+        assert first is second
+        assert first.session_id == "session-1"
+        assert len(agent.created_sessions) == 1  # the second get must not create a new session
+
+    async def test_reset_forgets_session(self) -> None:
+        agent = _FakeAgent()
+        store = SessionStore(agent)
+
+        first = await store.get("session-1")
+        await store.reset("session-1")
+        second = await store.get("session-1")
+
+        assert first is not second
+        assert len(agent.created_sessions) == 2  # reset forces a fresh session on the next get
+
+    async def test_empty_session_id_raises(self) -> None:
+        store = SessionStore(_FakeAgent())
+
+        with pytest.raises(ValueError, match="session_id"):
+            await store.get("")
+        with pytest.raises(ValueError, match="session_id"):
+            await store.reset("")
+
+
+class TestAgentFrameworkState:  # target resolution, caching, and session-store wiring
+    def test_default_session_store_for_agent(self) -> None:
+        agent = _FakeAgent()
+        state = AgentFrameworkState(agent)
+
+        assert state.target is agent
+        assert isinstance(state.session_store, SessionStore)  # created eagerly for an agent instance
+
+    def test_accepts_session_store_instance(self) -> None:
+        agent = _FakeAgent()
+        store = SessionStore(agent)
+        state = AgentFrameworkState(agent, session_store=store)
+
+        assert state.target is agent
+        assert state.session_store is store
+
+    def test_accepts_session_store_factory(self) -> None:
+        agent = _FakeAgent()
+
+        def factory(target: Any) -> SessionStore:
+            return SessionStore(target)
+
+        state = AgentFrameworkState(agent, session_store=factory)
+
+        assert isinstance(state.session_store, SessionStore)
+
+    async def test_callable_target_cached_by_default(self) -> None:
+        calls = 0
+
+        def create_agent() -> _FakeAgent:
+            nonlocal calls
+            calls += 1
+            return _FakeAgent()
+
+        state = AgentFrameworkState(create_agent)
+
+        first = await state.get_target()
+        second = await state.get_target()
+
+        assert first is second
+        assert calls == 1  # the factory runs only once when caching is on
+
+    async def test_callable_target_cache_can_be_disabled(self) -> None:
+        calls = 0
+
+        def create_agent() -> _FakeAgent:
+            nonlocal calls
+            calls += 1
+            return _FakeAgent()
+
+        state = AgentFrameworkState(create_agent, cache_target=False)
+
+        first = await state.get_target()
+        second = await state.get_target()
+
+        assert first is not second
+        assert calls == 2  # the factory runs on every call when caching is off
+
+    async def test_async_callable_target(self) -> None:
+        async def create_agent() -> _FakeAgent:
+            return _FakeAgent()
+
+        state = AgentFrameworkState(create_agent)
+
+        assert isinstance(await state.get_target(), _FakeAgent)
+
+    async def test_get_session_resolves_target_and_store(self) -> None:
+        state = AgentFrameworkState(lambda: _FakeAgent())  # factory target: the store is built lazily
+
+        session = await state.get_session("session-1")
+
+        assert session.session_id == "session-1"
diff --git a/python/samples/04-hosting/af-hosting/README.md b/python/samples/04-hosting/af-hosting/README.md
index c21ebbecd5e..367dfcabc71 100644
--- a/python/samples/04-hosting/af-hosting/README.md
+++ b/python/samples/04-hosting/af-hosting/README.md
@@ -10,7 +10,7 @@ its own package. This first sample set includes
 
 | Sample | What it shows | Packaging |
 |---|---|---|
-| [`local_responses/`](./local_responses) | The minimal shape: one agent + one `@tool` + `ResponsesChannel` + a single `run_hook` that strips caller-supplied options and forces a `reasoning` preset. | **Local only.** Start here to learn the run-hook seam. |
+| [`local_responses/`](./local_responses) | The minimal shape: one agent + one `@tool` + native FastAPI route + Responses helper functions + `SessionStore`. | **Local only.** Start here to learn the helper seam. |
 | [`local_responses_workflow/`](./local_responses_workflow) | A 4-step `Workflow` (typed `SloganBrief` intake → writer → legal → formatter) hosted behind the Responses channel via a `run_hook` that parses inbound text/JSON into the workflow's typed input. The host writes per-conversation checkpoints via `checkpoint_location=…`. Demonstrates workflow targets + structured input adaptation + resume-across-turns. Includes a `call_server.rest` file with REST examples. | **Local only.** |
 | [`local_telegram/`](./local_telegram) | Telegram bot with `@tool`, `FileHistoryProvider`, `run_hook`, and slash commands (`/new`, `/whoami`, `/weather`). Pure Telegram — no HTTP endpoint. | **Local only.** Start here to learn the Telegram channel. |
 | [`local_multi_channel/`](./local_multi_channel) | Same agent behind two channels at once: `ResponsesChannel` + `TelegramChannel`. Shared `FileHistoryProvider` enables cross-channel session resumption (resume a Telegram chat from the Responses endpoint by passing the Telegram isolation key as `previous_response_id`). | **Local only.** |
diff --git a/python/samples/04-hosting/af-hosting/local_responses/README.md b/python/samples/04-hosting/af-hosting/local_responses/README.md
index e4b08f408c9..2ffcf5642da 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/README.md
+++ b/python/samples/04-hosting/af-hosting/local_responses/README.md
@@ -1,19 +1,29 @@
-# local_responses — Responses-only with a settings-altering hook
+# local_responses — Responses helpers with native FastAPI routes
 
-The smallest end-to-end `agent-framework-hosting` shape: one Foundry
-agent with a `@tool`, one `ResponsesChannel`, one `run_hook`. Useful as
-the entry-point sample for understanding the **channel run-hook** seam
-without any multi-channel or identity-link concerns.
+The smallest end-to-end Responses hosting shape: one Foundry agent with a
+`@tool`, one native FastAPI route, a small `SessionStore`, and the Responses
+helper functions:
 
-What the run hook demonstrates:
+- `responses_to_run(...)`
+- `responses_session_id(...)`
+- `create_response_id(...)`
+- `responses_from_run(...)`
 
-- **Strips** caller-supplied `model` / `temperature` / `store` so the
-  host owns the backing deployment and persistence settings.
-- **Forces** a `reasoning` preset (`effort=medium`, `summary=auto`) on
-  every turn — caller-side overrides are ignored.
+The sample demonstrates the lighter hosting direction. Agent Framework provides
+the run conversion and session-state pieces; FastAPI owns route registration,
+request bodies, response objects, and server startup.
 
-`app:app` is a module-level Starlette ASGI app; recommended local launch
-is Hypercorn.
+What the route demonstrates:
+
+- **Strips** caller-supplied `model` / `temperature` / `store` so the app owns
+  deployment and persistence settings.
+- **Forces** a `reasoning` preset (`effort=medium`, `summary=auto`) on every
+  turn.
+- Produces the AF messages, options, and session id that the route passes to
+  `agent.run(...)`.
+
+`app:app` is a module-level FastAPI ASGI app; recommended local launch is
+Hypercorn.
 
 ## Run
 
@@ -40,14 +50,14 @@ uv sync --group dev
 # Plain OpenAI SDK call:
 uv run python call_server.py
 
-# The client intentionally omits `model`; the host chooses the backing
-# deployment from FOUNDRY_MODEL.
+# The client intentionally omits `model`; the app chooses the backing deployment
+# from FOUNDRY_MODEL.
 
-# The script then sends a second turn, "And what about Amsterdam?",
-# using the first `response.id` as `previous_response_id`.
+# The script then sends a second turn, "And what about Amsterdam?", using the
+# first `response.id` as `previous_response_id`.
 
 # Same two-turn interaction through an Agent Framework Agent backed by
-# OpenAIChatClient, with streaming enabled:
+# OpenAIChatClient:
 uv run python call_server_af.py
 ```
 
diff --git a/python/samples/04-hosting/af-hosting/local_responses/app.py b/python/samples/04-hosting/af-hosting/local_responses/app.py
index 73313614748..e00caa5ccc9 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/app.py
+++ b/python/samples/04-hosting/af-hosting/local_responses/app.py
@@ -1,28 +1,19 @@
 # Copyright (c) Microsoft. All rights reserved.
 
-"""Minimal Responses-only hosting sample.
+"""Minimal Responses-only hosting sample with native FastAPI routes.
 
-Single agent with one ``@tool`` (``lookup_weather``), single channel
-(``ResponsesChannel``), one ``run_hook`` that demonstrates the
-settings-mutation seam over caller-supplied options.
+This sample demonstrates the helper-first hosting shape:
 
-What the hook does
-------------------
-On every Responses request the hook receives the ``ChannelRequest`` that
-the channel built from the inbound HTTP body. It:
-
-- strips ``model`` (the host owns the backing deployment), ``store``
-  (this agent owns persistence), and ``temperature`` (the configured
-  model may not honor it),
-- forces a ``reasoning`` effort + summary preset so the deployed surface
-  is consistent regardless of what the caller sent.
-
-The hook is the documented escape hatch over the uniform
-``ChannelRequest`` envelope.
+1. ``agent-framework-hosting-responses`` converts Responses request/response
+   payloads to and from Agent Framework run values.
+2. ``agent-framework-hosting`` owns shared execution state via
+   ``AgentFrameworkState`` and ``SessionStore``.
+3. FastAPI owns the route, request parsing, policy decisions, and response
+   object.
 
 Run
 ---
-``app`` is a module-level Starlette ASGI app. Recommended local launch::
+``app`` is a module-level FastAPI ASGI app. Recommended local launch::
 
     uv sync
     az login
@@ -42,16 +33,26 @@
 
 from __future__ import annotations
 
+import asyncio
 import os
-from dataclasses import replace
 from pathlib import Path
-from typing import Annotated
+from typing import Annotated, Any, cast
 
-from agent_framework import Agent, FileHistoryProvider, tool
+from agent_framework import Agent, FileHistoryProvider, ResponseStream, tool
 from agent_framework_foundry import FoundryChatClient
-from agent_framework_hosting import AgentFrameworkHost, ChannelRequest
-from agent_framework_hosting_responses import ResponsesChannel
+from agent_framework_hosting import AgentFrameworkState, SessionStore
+from agent_framework_hosting_responses import (
+    create_response_id,
+    responses_from_run,
+    responses_session_id,
+    responses_stream_events_from_run,
+    responses_to_run,
+)
 from azure.identity.aio import DefaultAzureCredential
+from fastapi import Body, FastAPI, HTTPException
+from fastapi.responses import JSONResponse, StreamingResponse
+from hypercorn.asyncio import serve
+from hypercorn.config import Config
 
 SESSIONS_DIR = Path(__file__).resolve().parent / "storage" / "sessions"
 SESSIONS_DIR.mkdir(parents=True, exist_ok=True)
@@ -71,37 +72,9 @@ def lookup_weather(
     return reports.get(location, f"{location} is sunny with a high of {high_temp}°C.")
 
 
-# the run hook defines what you want to allow the user to passthrough when they call your host
-# since the responses clients can call with all of the responses options,
-# you can decide with this run_hook which of those: are rejected
-# which are passed through, which are altered, which are added.
-# In this sample below, we are removing, model, temperature and store if set
-# and we add reasoning, but note that this could also be set on the Agent itself
-# the difference is that this option is specific to the Responses channel
-# so if you want to differentiate between options over channels
-# you would set the option in the run_hook, if it needs to be the same (like store)
-# you would set it in the agent.
-def run_hook(request: ChannelRequest, **_: object) -> ChannelRequest:
-    """Strip caller-supplied options the host should own and force a
-    reasoning preset."""
-    options = dict(request.options or {})
-
-    # The host owns the backing deployment; the agent's default_options
-    # own ``store``; the model may not honor ``temperature``. Strip them
-    # so the caller can't override.
-    options.pop("model", None)
-    options.pop("temperature", None)
-    options.pop("store", None)
-
-    # Force a consistent reasoning preset on every turn.
-    options["reasoning"] = {"effort": "medium", "summary": "auto"}
-
-    return replace(request, options=options or None)
-
-
-def build_host() -> AgentFrameworkHost:
-    # Here we define how our agent should run, with tools, options, etc:
-    agent = Agent(
+def create_agent() -> Agent:
+    """Create the sample weather agent."""
+    return Agent(
         client=FoundryChatClient(credential=DefaultAzureCredential()),
         name="WeatherAgent",
         instructions=(
@@ -112,15 +85,75 @@ def build_host() -> AgentFrameworkHost:
         context_providers=[FileHistoryProvider(SESSIONS_DIR)],
         default_options={"store": False},
     )
-    return AgentFrameworkHost(
-        target=agent,
-        channels=[ResponsesChannel(run_hook=run_hook)],
-        debug=True,
+
+
+app = FastAPI()
+state = AgentFrameworkState(create_agent, session_store=SessionStore)
+
+
+@app.post("/responses")
+async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | StreamingResponse:  # noqa: B008
+    """Handle one OpenAI Responses-shaped request."""
+    run = responses_to_run(body)
+    session_id = responses_session_id(body)
+    response_id = create_response_id()
+
+    options = dict(run["options"])
+    # App-specific policy: caller cannot pick deployment/persistence settings,
+    # and this sample forces a consistent reasoning preset.
+    options.pop("model", None)
+    options.pop("temperature", None)
+    options.pop("store", None)
+    options["reasoning"] = {"effort": "medium", "summary": "auto"}
+    options_for_run = cast(Any, options)
+
+    target = cast(Agent[Any], await state.get_target())
+    session = await state.get_session(session_id or response_id)
+    if run["stream"]:
+        stream = target.run(
+            run["messages"],
+            stream=True,
+            session=session,
+            options=options_for_run,
+        )
+        if not isinstance(stream, ResponseStream):
+            raise HTTPException(status_code=500, detail="agent did not return a response stream")
+        return StreamingResponse(
+            responses_stream_events_from_run(
+                stream,
+                response_id=response_id,
+                session_id=session_id,
+            ),
+            media_type="text/event-stream",
+        )
+
+    result = await target.run(
+        run["messages"],
+        session=session,
+        options=options_for_run,
+    )
+    return JSONResponse(
+        responses_from_run(
+            result,
+            response_id=response_id,
+            session_id=session_id,
+        )
     )
 
 
-app = build_host().app
+async def main() -> None:
+    """Run the sample with Hypercorn for local development."""
+    config = Config()
+    config.bind = [f"0.0.0.0:{int(os.environ.get('PORT', '8000'))}"]
+    await serve(cast(Any, app), config)
 
 
 if __name__ == "__main__":
-    build_host().serve(host="0.0.0.0", port=int(os.environ.get("PORT", "8000")))
+    asyncio.run(main())
+
+"""
+Sample output (client side, as printed by call_server_af.py):
+User: What is the weather in Tokyo?
+Agent: Tokyo is clear with a high of 18°C.
+Response ID: resp_...
+"""
diff --git a/python/samples/04-hosting/af-hosting/local_responses/call_server_af.py b/python/samples/04-hosting/af-hosting/local_responses/call_server_af.py
index 91e8d3aa6fd..3c93a88c748 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/call_server_af.py
+++ b/python/samples/04-hosting/af-hosting/local_responses/call_server_af.py
@@ -3,8 +3,8 @@
 """Agent Framework agent client for the local_responses sample.
 
 Creates a local :class:`agent_framework.Agent` backed by
-:class:`agent_framework.openai.OpenAIChatClient`, points that client at the
-hosted ``/responses`` endpoint, and streams both turns:
+:class:`agent_framework.openai.OpenAIChatClient` and points that client at the
+hosted ``/responses`` endpoint for both turns:
 
 1. ``What is the weather in Tokyo?``
 2. ``And what about Amsterdam?``
@@ -45,14 +45,8 @@ async def main() -> None:
 
     for prompt in PROMPTS:
         print(f"User: {prompt}")
-        stream = agent.run(prompt, stream=True, session=session)
-        print("Agent: ", end="", flush=True)
-        async for update in stream:
-            if update.text:
-                print(update.text, end="", flush=True)
-
-        response = await stream.get_final_response()
-        print("\n")
+        response = await agent.run(prompt, session=session)
+        print(f"Agent: {response.text}\n")
         print(f"Response ID: {response.response_id}\n")
 
 
diff --git a/python/samples/04-hosting/af-hosting/local_responses/pyproject.toml b/python/samples/04-hosting/af-hosting/local_responses/pyproject.toml
index f301dd6bfc4..adb6550ac2a 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/pyproject.toml
+++ b/python/samples/04-hosting/af-hosting/local_responses/pyproject.toml
@@ -1,7 +1,7 @@
 [project]
 name = "agent-framework-hosting-sample-local-responses"
 version = "0.0.1"
-description = "Minimal Responses-only local hosting sample with a settings-altering run hook."
+description = "Minimal Responses-only local hosting sample with native FastAPI routes."
 requires-python = ">=3.10"
 dependencies = [
     "agent-framework-foundry",
@@ -9,6 +9,7 @@ dependencies = [
     "agent-framework-hosting-responses",
     "azure-identity",
     "aiohttp>=3.13.5",
+    "fastapi>=0.115.0,<0.138.1",
     "hypercorn>=0.17",
 ]
 

From c679bb934064a2163d4eabb8d311d0642a930b59 Mon Sep 17 00:00:00 2001
From: eavanvalkenburg <github@vanvalkenburg.eu>
Date: Thu, 2 Jul 2026 18:22:00 +0200
Subject: [PATCH 2/7] Fix CI failures, session continuity, and streaming model
 reporting

- Fix TargetT TypeVar solving in AgentFrameworkState: split __init__
  into per-shape overloads (instance/sync factory/async factory/awaitable)
  since a bound TypeVar combined with one big Callable/Awaitable union
  parameter was unsolvable across pyright/pyrefly/ty/zuban.
- Fix _FakeAgent test fixtures to structurally satisfy SupportsAgentRun
  (matching attribute types and overloaded run()), which the above surfaced.
- Add SessionStore.put() to alias an additional session id to an
  already-resolved session, and use it in the local_responses sample to fix
  a real session-continuity bug: previous_response_id rotates every turn,
  so without aliasing the newly minted response id, turn 3+ of a
  conversation silently lost all prior history. Verified against a live
  Foundry model across a 3-turn conversation.
- Fix responses_stream_events_from_run to report the real model instead of
  the "agent" fallback: AgentResponse.from_updates never carries a raw
  representation forward, so capture model from the individual streamed
  updates' raw representations instead. Verified live.
- Add response_model=None to the sample's FastAPI route (it could not boot
  at all: FastAPI tried to build a Pydantic response model from the
  JSONResponse | StreamingResponse return annotation).
- Map responses_to_run's ValueError to HTTP 400 instead of a 500.
- Add HTTP round-trip integration tests (packages/hosting-responses) that
  exercise the same FastAPI + AgentFrameworkState + Responses helper wiring
  as the sample via httpx.ASGITransport, including a regression test for
  the session-continuity fix.
- Add Workflow-target test coverage, SessionStore.put/reset_session tests,
  and TypeError-path coverage to packages/hosting/tests/hosting/test_state.py.
- Extend call_server.py / call_server_af.py to a third conversation turn so
  they actually exercise the continuity chain (previous scripts stopped at
  turn 2, which would never have revealed the bug above).

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../_parsing.py                               |  26 +-
 .../packages/hosting-responses/pyproject.toml |   6 +
 .../hosting_responses/test_http_round_trip.py | 265 ++++++++++++++++++
 .../tests/hosting_responses/test_parsing.py   |   6 +-
 python/packages/hosting/README.md             |   6 +-
 .../hosting/agent_framework_hosting/_state.py |  67 ++++-
 .../hosting/tests/hosting/test_state.py       | 135 ++++++++-
 .../af-hosting/local_responses/README.md      |  12 +-
 .../af-hosting/local_responses/app.py         |  28 +-
 .../af-hosting/local_responses/call_server.py |  16 +-
 .../local_responses/call_server_af.py         |  13 +-
 python/uv.lock                                |  12 +
 12 files changed, 561 insertions(+), 31 deletions(-)
 create mode 100644 python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py

diff --git a/python/packages/hosting-responses/agent_framework_hosting_responses/_parsing.py b/python/packages/hosting-responses/agent_framework_hosting_responses/_parsing.py
index 72c8d632118..c391aeb979a 100644
--- a/python/packages/hosting-responses/agent_framework_hosting_responses/_parsing.py
+++ b/python/packages/hosting-responses/agent_framework_hosting_responses/_parsing.py
@@ -259,6 +259,21 @@ def responses_from_run(
     return _response_payload(OpenAIResponse(**response_kwargs))
 
 
+def _model_from_update(update: AgentResponseUpdate) -> str | None:
+    """Best-effort model id from one streamed update's raw representation.
+
+    ``AgentResponse.from_updates`` does not carry a chunk's raw representation
+    forward onto the finalized response (see ``_finalize_response`` in core),
+    so ``_model_from_result`` can never find a model for a streamed result.
+    Each ``AgentResponseUpdate`` still has its own raw chat chunk, which
+    usually reports the model, so the streaming SSE helper captures it here
+    instead.
+    """
+    raw = update.raw_representation
+    model = getattr(raw, "model", None)
+    return model if isinstance(model, str) and model else None
+
+
 def _model_from_result(result: Any) -> str:
     model = getattr(result, "model", None)
     if isinstance(model, str) and model:
@@ -903,7 +918,10 @@ async def responses_stream_events_from_run(
         },
     )
 
+    model: str | None = None
     async for update in stream:
+        if model is None:
+            model = _model_from_update(update)
         if update.text:
             yield _sse_event(
                 "response.output_text.delta",
@@ -914,11 +932,17 @@ async def responses_stream_events_from_run(
             )
 
     final = await stream.get_final_response()
+    payload = responses_from_run(final, response_id=response_id, session_id=session_id)
+    if model is not None:
+        # The finalized `AgentResponse` never carries a raw representation
+        # (see `_model_from_update`), so prefer the model observed on the
+        # stream's own chunks over `responses_from_run`'s "agent" fallback.
+        payload["model"] = model
     yield _sse_event(
         "response.completed",
         {
             "type": "response.completed",
-            "response": responses_from_run(final, response_id=response_id, session_id=session_id),
+            "response": payload,
         },
     )
 
diff --git a/python/packages/hosting-responses/pyproject.toml b/python/packages/hosting-responses/pyproject.toml
index a8b96654d21..82806d9ebaa 100644
--- a/python/packages/hosting-responses/pyproject.toml
+++ b/python/packages/hosting-responses/pyproject.toml
@@ -28,6 +28,12 @@ dependencies = [
     "openai>=1.99.0,<3",
 ]
 
+[dependency-groups]
+dev = [
+    "fastapi>=0.115.0,<0.138.1",
+    "httpx>=0.28.1",
+]
+
 [tool.uv]
 prerelease = "if-necessary-or-explicit"
 environments = [
diff --git a/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py b/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
new file mode 100644
index 00000000000..4955f3040d2
--- /dev/null
+++ b/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
@@ -0,0 +1,265 @@
+# Copyright (c) Microsoft. All rights reserved.
+
+"""HTTP round-trip tests: POST -> FastAPI route -> JSON/SSE response.
+
+These exercise the same wiring as the `local_responses` sample: helpers from
+`agent_framework_hosting_responses` convert between the Responses protocol and
+Agent Framework run values, `agent_framework_hosting`'s `AgentFrameworkState` /
+`SessionStore` hold shared execution state, and a small FastAPI route owns
+everything else (parsing, policy, response construction). Requests go through
+`httpx.AsyncClient` with `ASGITransport` -- no real server process or live
+model is involved.
+"""
+
+from __future__ import annotations
+
+import json
+from collections.abc import AsyncIterator, Awaitable, Mapping
+from typing import Any, Literal, overload
+
+import httpx
+from agent_framework import (
+    AgentResponse,
+    AgentResponseUpdate,
+    AgentRunInputs,
+    AgentSession,
+    Content,
+    Message,
+    ResponseStream,
+)
+from agent_framework_hosting import AgentFrameworkState, SessionStore
+from fastapi import Body, FastAPI, HTTPException
+from fastapi.responses import JSONResponse, StreamingResponse
+
+from agent_framework_hosting_responses import (
+    create_response_id,
+    responses_from_run,
+    responses_session_id,
+    responses_stream_events_from_run,
+    responses_to_run,
+)
+
+
+class _StubAgent:
+    """Deterministic ``SupportsAgentRun`` stub that tracks session continuity.
+
+    Each call records the ``session_id`` of the ``AgentSession`` it was
+    invoked with and a per-session turn counter, so tests can assert that a
+    chain of requests reused one session instead of silently starting fresh
+    ones.
+    """
+
+    id = "stub-agent"
+    name: str | None = "stub-agent"
+    description: str | None = "stub agent for HTTP round-trip tests"
+
+    def __init__(self) -> None:
+        self.session_ids_seen: list[str | None] = []
+        self.turn_counts: dict[str | None, int] = {}
+
+    def create_session(self, *, session_id: str | None = None) -> AgentSession:
+        return AgentSession(session_id=session_id)
+
+    def get_session(self, service_session_id: str, *, session_id: str | None = None) -> AgentSession:
+        return AgentSession(session_id=session_id, service_session_id=service_session_id)
+
+    @overload
+    def run(
+        self,
+        messages: AgentRunInputs | None = None,
+        *,
+        stream: Literal[False] = ...,
+        session: AgentSession | None = None,
+        function_invocation_kwargs: Mapping[str, Any] | None = None,
+        client_kwargs: Mapping[str, Any] | None = None,
+    ) -> Awaitable[AgentResponse[Any]]: ...
+
+    @overload
+    def run(
+        self,
+        messages: AgentRunInputs | None = None,
+        *,
+        stream: Literal[True],
+        session: AgentSession | None = None,
+        function_invocation_kwargs: Mapping[str, Any] | None = None,
+        client_kwargs: Mapping[str, Any] | None = None,
+    ) -> ResponseStream[AgentResponseUpdate, AgentResponse[Any]]: ...
+
+    def run(
+        self,
+        messages: AgentRunInputs | None = None,
+        *,
+        stream: bool = False,
+        session: AgentSession | None = None,
+        function_invocation_kwargs: Mapping[str, Any] | None = None,
+        client_kwargs: Mapping[str, Any] | None = None,
+    ) -> Awaitable[AgentResponse[Any]] | ResponseStream[AgentResponseUpdate, AgentResponse[Any]]:
+        session_id = session.session_id if session is not None else None
+        self.session_ids_seen.append(session_id)
+        self.turn_counts[session_id] = self.turn_counts.get(session_id, 0) + 1
+        text = f"turn {self.turn_counts[session_id]} for session {session_id}"
+
+        if stream:
+
+            async def _stream() -> AsyncIterator[AgentResponseUpdate]:
+                yield AgentResponseUpdate(contents=[Content.from_text(text=text)], role="assistant")
+
+            return ResponseStream(_stream(), finalizer=lambda updates: AgentResponse.from_updates(updates))
+
+        async def _get_response() -> AgentResponse[Any]:
+            return AgentResponse(messages=Message(role="assistant", contents=[Content.from_text(text=text)]))
+
+        return _get_response()
+
+
+def _build_app(agent: _StubAgent) -> FastAPI:
+    """Build a minimal FastAPI app mirroring the `local_responses` sample's route."""
+    app = FastAPI()
+    state = AgentFrameworkState(agent, session_store=SessionStore)
+
+    @app.post("/responses", response_model=None)
+    async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | StreamingResponse:  # noqa: B008
+        try:
+            run = responses_to_run(body)
+        except ValueError as exc:
+            raise HTTPException(status_code=400, detail=str(exc)) from exc
+        session_id = responses_session_id(body)
+        response_id = create_response_id()
+
+        target = await state.get_target()
+        store = await state.get_session_store()
+        lookup_id = session_id or response_id
+        session = await store.get(lookup_id)
+        if response_id != lookup_id:
+            # Alias the newly minted response id to this turn's session, same
+            # as the sample, so the next `previous_response_id` still resolves.
+            await store.put(response_id, session)
+
+        if run["stream"]:
+            stream = target.run(run["messages"], stream=True, session=session)
+            if not isinstance(stream, ResponseStream):
+                raise HTTPException(status_code=500, detail="agent did not return a response stream")
+            return StreamingResponse(
+                responses_stream_events_from_run(stream, response_id=response_id, session_id=session_id),
+                media_type="text/event-stream",
+            )
+
+        result = await target.run(run["messages"], session=session)
+        return JSONResponse(responses_from_run(result, response_id=response_id, session_id=session_id))
+
+    return app
+
+
+async def _post(app: FastAPI, payload: dict[str, Any]) -> httpx.Response:
+    """Send a POST /responses request through the ASGI app, no real socket involved."""
+    transport = httpx.ASGITransport(app=app)
+    async with httpx.AsyncClient(transport=transport, base_url="http://test") as client:
+        return await client.post("/responses", json=payload, timeout=30)
+
+
+def _parse_sse_events(body: str) -> list[dict[str, Any]]:
+    """Parse SSE text into a list of `{"event": ..., "data": ...}` dicts."""
+    events: list[dict[str, Any]] = []
+    for block in body.split("\n\n"):
+        if not block.strip():
+            continue
+        event_type: str | None = None
+        data: str | None = None
+        for line in block.split("\n"):
+            if line.startswith("event: "):
+                event_type = line[len("event: ") :]
+            elif line.startswith("data: "):
+                data = line[len("data: ") :]
+        if event_type is not None and data is not None:
+            events.append({"event": event_type, "data": json.loads(data)})
+    return events
+
+
+class TestNonStreamingRoundTrip:
+    async def test_returns_responses_shaped_payload(self) -> None:
+        app = _build_app(_StubAgent())
+        response = await _post(app, {"input": "hello"})
+
+        assert response.status_code == 200
+        payload = response.json()
+        assert payload["object"] == "response"
+        assert payload["status"] == "completed"
+        assert payload["id"].startswith("resp_")
+        assert any(item["type"] == "message" for item in payload["output"])
+
+    async def test_invalid_input_returns_400_not_500(self) -> None:
+        app = _build_app(_StubAgent())
+        response = await _post(app, {})
+
+        assert response.status_code == 400
+        assert "input" in response.json()["detail"]
+
+
+class TestStreamingRoundTrip:
+    async def test_stream_emits_created_delta_and_completed_events(self) -> None:
+        app = _build_app(_StubAgent())
+        response = await _post(app, {"input": "hello", "stream": True})
+
+        assert response.status_code == 200
+        assert "text/event-stream" in response.headers["content-type"]
+
+        events = _parse_sse_events(response.text)
+        event_types = [e["event"] for e in events]
+        assert event_types[0] == "response.created"
+        assert event_types[-1] == "response.completed"
+        assert "response.output_text.delta" in event_types
+
+        completed = events[-1]["data"]["response"]
+        assert completed["status"] == "completed"
+        assert completed["id"].startswith("resp_")
+
+
+class TestSessionContinuity:
+    """Regression coverage for the `previous_response_id` aliasing fix.
+
+    `previous_response_id` rotates every turn. Without aliasing the newly
+    minted response id to the same session, turn 3 would silently resolve to
+    a brand-new, empty session instead of the one from turns 1-2.
+    """
+
+    async def test_previous_response_id_chain_preserves_session_across_three_turns(self) -> None:
+        agent = _StubAgent()
+        app = _build_app(agent)
+
+        turn1 = await _post(app, {"input": "hi"})
+        assert turn1.status_code == 200
+        turn2 = await _post(app, {"input": "still there?", "previous_response_id": turn1.json()["id"]})
+        assert turn2.status_code == 200
+        turn3 = await _post(app, {"input": "still there?", "previous_response_id": turn2.json()["id"]})
+        assert turn3.status_code == 200
+
+        assert len(agent.session_ids_seen) == 3
+        # All three turns must have run against the same underlying session,
+        # not three independent ones.
+        first_session_id = agent.session_ids_seen[0]
+        assert first_session_id is not None
+        assert agent.session_ids_seen == [first_session_id] * 3
+        assert agent.turn_counts[first_session_id] == 3
+
+    async def test_conversation_id_preserves_session_across_turns(self) -> None:
+        agent = _StubAgent()
+        app = _build_app(agent)
+
+        turn1 = await _post(app, {"input": "hi", "conversation_id": "conv_stable"})
+        assert turn1.status_code == 200
+        turn2 = await _post(app, {"input": "still there?", "conversation_id": "conv_stable"})
+        assert turn2.status_code == 200
+
+        assert agent.session_ids_seen == ["conv_stable", "conv_stable"]
+        assert agent.turn_counts["conv_stable"] == 2
+
+    async def test_unrelated_requests_get_independent_sessions(self) -> None:
+        agent = _StubAgent()
+        app = _build_app(agent)
+
+        first = await _post(app, {"input": "hi"})
+        second = await _post(app, {"input": "unrelated"})
+
+        assert first.status_code == 200
+        assert second.status_code == 200
+        assert agent.session_ids_seen[0] != agent.session_ids_seen[1]
diff --git a/python/packages/hosting-responses/tests/hosting_responses/test_parsing.py b/python/packages/hosting-responses/tests/hosting_responses/test_parsing.py
index 6fd749d898e..5aaebf4b5fe 100644
--- a/python/packages/hosting-responses/tests/hosting_responses/test_parsing.py
+++ b/python/packages/hosting-responses/tests/hosting_responses/test_parsing.py
@@ -5,6 +5,7 @@
 from __future__ import annotations
 
 from collections.abc import AsyncIterator, Sequence
+from typing import cast
 
 import pytest
 from agent_framework import AgentResponse, AgentResponseUpdate, Content, Message, ResponseStream
@@ -202,7 +203,10 @@ def test_responses_to_run_returns_messages_options_and_stream(self) -> None:
             "model": "gpt-x",
         })
 
-        assert run["messages"][0].text == "hi"
+        # `responses_to_run` always produces a `list[Message]`; the TypedDict
+        # field is typed as the wider `Agent.run` input shape, so narrow here.
+        messages = cast("list[Message]", run["messages"])
+        assert messages[0].text == "hi"
         assert run["stream"] is True
         assert run["options"] == {"max_tokens": 32, "model": "gpt-x"}
 
diff --git a/python/packages/hosting/README.md b/python/packages/hosting/README.md
index 944325b95c1..032fddd3908 100644
--- a/python/packages/hosting/README.md
+++ b/python/packages/hosting/README.md
@@ -7,7 +7,11 @@ This package keeps Agent Framework state separate from web-framework concerns:
 - `AgentFrameworkState` — stores an agent/workflow target and optional session
   state for routes that the app owns.
 - `SessionStore` — maps an app-selected session id to an `AgentSession` for
-  non-persisted servers.
+  non-persisted servers. `get`/`reset` manage a session by its own id; `put`
+  aliases an *additional* id to an already-resolved session — useful when a
+  protocol's continuation id rotates every turn (for example, OpenAI
+  Responses' `previous_response_id`) and a later request needs to resolve the
+  new id back to the same conversation.
 - Existing experimental channel-hosting types remain available while the package
   is unreleased, but the v1 direction is protocol helpers plus app-owned routes.
 
diff --git a/python/packages/hosting/agent_framework_hosting/_state.py b/python/packages/hosting/agent_framework_hosting/_state.py
index 86b4ae49125..cb6aa6218b7 100644
--- a/python/packages/hosting/agent_framework_hosting/_state.py
+++ b/python/packages/hosting/agent_framework_hosting/_state.py
@@ -4,7 +4,7 @@
 
 import inspect
 from collections.abc import Awaitable, Callable, Mapping
-from typing import Any, Generic, TypedDict, TypeVar
+from typing import Any, Generic, TypedDict, TypeVar, overload
 
 from agent_framework import AgentRunInputs, AgentSession, ChatOptions, SupportsAgentRun, Workflow
 
@@ -59,8 +59,29 @@ async def reset(self, session_id: str) -> None:
             raise ValueError("session_id must be a non-empty string")
         self._sessions.pop(session_id, None)
 
+    async def put(self, session_id: str, session: AgentSession) -> None:
+        """Associate an existing ``session`` with an additional ``session_id``.
 
-TargetT = TypeVar("TargetT", SupportsAgentRun, Workflow)
+        Use this to alias a rotating protocol id (for example, a freshly
+        minted response id) to a session that was already looked up under a
+        different, prior id. Protocols whose continuation id changes every
+        turn (such as OpenAI Responses' ``previous_response_id`` chaining)
+        need this so a later request referencing the new id still resolves
+        to the same conversation instead of starting a fresh session.
+
+        Args:
+            session_id: Opaque app-selected session id to associate.
+            session: The session to associate with ``session_id``.
+
+        Raises:
+            ValueError: If ``session_id`` is empty.
+        """
+        if not session_id:
+            raise ValueError("session_id must be a non-empty string")
+        self._sessions[session_id] = session
+
+
+TargetT = TypeVar("TargetT", bound="SupportsAgentRun | Workflow")
 SessionStoreFactory = Callable[[SupportsAgentRun], SessionStore]
 
 
@@ -89,6 +110,48 @@ class AgentFrameworkState(Generic[TargetT]):
     route code may share.
     """
 
+    # `target` accepts an instance, a sync/async factory, or a bare awaitable.
+    # Each shape is declared as its own overload rather than one big union
+    # because type checkers struggle to bind `TargetT` when it appears both
+    # bare and inside `Callable`/`Awaitable` alternatives in a single union
+    # parameter (observed as inference failures across pyright, pyrefly, ty,
+    # and zuban).
+    @overload
+    def __init__(
+        self,
+        target: TargetT,
+        *,
+        session_store: SessionStore | type[SessionStore] | SessionStoreFactory | None = None,
+        cache_target: bool = True,
+    ) -> None: ...
+
+    @overload
+    def __init__(
+        self,
+        target: Callable[[], TargetT],
+        *,
+        session_store: SessionStore | type[SessionStore] | SessionStoreFactory | None = None,
+        cache_target: bool = True,
+    ) -> None: ...
+
+    @overload
+    def __init__(
+        self,
+        target: Callable[[], Awaitable[TargetT]],
+        *,
+        session_store: SessionStore | type[SessionStore] | SessionStoreFactory | None = None,
+        cache_target: bool = True,
+    ) -> None: ...
+
+    @overload
+    def __init__(
+        self,
+        target: Awaitable[TargetT],
+        *,
+        session_store: SessionStore | type[SessionStore] | SessionStoreFactory | None = None,
+        cache_target: bool = True,
+    ) -> None: ...
+
     def __init__(
         self,
         target: TargetT | Awaitable[TargetT] | Callable[[], TargetT | Awaitable[TargetT]],
diff --git a/python/packages/hosting/tests/hosting/test_state.py b/python/packages/hosting/tests/hosting/test_state.py
index 8626c6c2e44..f09c9b9f758 100644
--- a/python/packages/hosting/tests/hosting/test_state.py
+++ b/python/packages/hosting/tests/hosting/test_state.py
@@ -2,20 +2,47 @@
 
 from __future__ import annotations
 
-from typing import Any
+import importlib
+from collections.abc import AsyncIterator, Awaitable, Mapping
+from typing import Any, Literal, overload
 
 import pytest
-from agent_framework import AgentResponse, AgentSession, Message
+from agent_framework import (
+    AgentResponse,
+    AgentResponseUpdate,
+    AgentRunInputs,
+    AgentSession,
+    Content,
+    Message,
+    ResponseStream,
+    Workflow,
+)
 
 from agent_framework_hosting import AgentFrameworkState, SessionStore
 
 
+def _workflow_fixture(name: str) -> Any:
+    """Load a fixture from ``_workflow_fixtures.py`` via the ``conftest``-registered alias.
+
+    Mirrors ``test_host.py``'s helper: the local ``conftest.py`` registers
+    ``_workflow_fixtures.py`` under the collision-proof name
+    ``hosting_workflow_fixtures`` so it stays importable in both
+    package-local and aggregate pytest runs.
+    """
+    return getattr(importlib.import_module("hosting_workflow_fixtures"), name)
+
+
 class _FakeAgent:
-    """Minimal agent target for state tests."""
+    """Minimal agent target for state tests.
+
+    Declares ``run`` with the same two overloads as ``SupportsAgentRun`` (one
+    per ``stream`` value) so it satisfies the protocol under static type
+    checking, not just at runtime.
+    """
 
-    id = "fake-agent"
-    name = "Fake Agent"
-    description = "Fake agent for tests"
+    id: str = "fake-agent"
+    name: str | None = "Fake Agent"
+    description: str | None = "Fake agent for tests"
 
     def __init__(self) -> None:
         self.created_sessions: list[AgentSession] = []
@@ -28,8 +55,48 @@ def create_session(self, *, session_id: str | None = None) -> AgentSession:
     def get_session(self, service_session_id: str, *, session_id: str | None = None) -> AgentSession:
         return AgentSession(session_id=session_id, service_session_id=service_session_id)
 
-    async def run(self, messages: Any = None, **_: Any) -> AgentResponse:
-        return AgentResponse(messages=Message(role="assistant", contents=["ok"]))
+    @overload
+    def run(
+        self,
+        messages: AgentRunInputs | None = None,
+        *,
+        stream: Literal[False] = ...,
+        session: AgentSession | None = None,
+        function_invocation_kwargs: Mapping[str, Any] | None = None,
+        client_kwargs: Mapping[str, Any] | None = None,
+    ) -> Awaitable[AgentResponse[Any]]: ...
+
+    @overload
+    def run(
+        self,
+        messages: AgentRunInputs | None = None,
+        *,
+        stream: Literal[True],
+        session: AgentSession | None = None,
+        function_invocation_kwargs: Mapping[str, Any] | None = None,
+        client_kwargs: Mapping[str, Any] | None = None,
+    ) -> ResponseStream[AgentResponseUpdate, AgentResponse[Any]]: ...
+
+    def run(
+        self,
+        messages: AgentRunInputs | None = None,
+        *,
+        stream: bool = False,
+        session: AgentSession | None = None,
+        function_invocation_kwargs: Mapping[str, Any] | None = None,
+        client_kwargs: Mapping[str, Any] | None = None,
+    ) -> Awaitable[AgentResponse[Any]] | ResponseStream[AgentResponseUpdate, AgentResponse[Any]]:
+        if stream:
+
+            async def _stream() -> AsyncIterator[AgentResponseUpdate]:
+                yield AgentResponseUpdate(contents=[Content.from_text(text="ok")], role="assistant")
+
+            return ResponseStream(_stream(), finalizer=lambda updates: AgentResponse.from_updates(updates))
+
+        async def _get_response() -> AgentResponse[Any]:
+            return AgentResponse(messages=Message(role="assistant", contents=[Content.from_text(text="ok")]))
+
+        return _get_response()
 
 
 class TestSessionStore:
@@ -63,6 +130,24 @@ async def test_empty_session_id_raises(self) -> None:
         with pytest.raises(ValueError, match="session_id"):
             await store.reset("")
 
+    async def test_put_aliases_new_id_to_existing_session(self) -> None:
+        agent = _FakeAgent()
+        store = SessionStore(agent)
+
+        session = await store.get("resp_1")
+        await store.put("resp_2", session)
+
+        assert await store.get("resp_2") is session
+        # Aliasing did not create a second session via the agent.
+        assert len(agent.created_sessions) == 1
+
+    async def test_put_empty_session_id_raises(self) -> None:
+        store = SessionStore(_FakeAgent())
+        session = await store.get("resp_1")
+
+        with pytest.raises(ValueError, match="session_id"):
+            await store.put("", session)
+
 
 class TestAgentFrameworkState:
     def test_default_session_store_for_agent(self) -> None:
@@ -136,3 +221,37 @@ async def test_get_session_resolves_target_and_store(self) -> None:
         session = await state.get_session("session-1")
 
         assert session.session_id == "session-1"
+
+    async def test_reset_session_forgets_session(self) -> None:
+        agent = _FakeAgent()
+        state = AgentFrameworkState(agent)
+
+        first = await state.get_session("session-1")
+        await state.reset_session("session-1")
+        second = await state.get_session("session-1")
+
+        assert first is not second
+        assert len(agent.created_sessions) == 2
+
+    def test_session_store_for_non_agent_target_raises_type_error(self) -> None:
+        workflow = _workflow_fixture("build_echo_workflow")()
+
+        with pytest.raises(TypeError, match="session_store requires an agent target"):
+            AgentFrameworkState(workflow, session_store=SessionStore)
+
+    async def test_workflow_target_has_no_default_session_store(self) -> None:
+        workflow: Workflow = _workflow_fixture("build_echo_workflow")()
+        state = AgentFrameworkState(workflow)
+
+        assert await state.get_target() is workflow
+        assert state.session_store is None
+        with pytest.raises(TypeError, match="session_store requires an agent target"):
+            await state.get_session_store()
+
+    async def test_workflow_target_resolved_from_factory(self) -> None:
+        build_echo_workflow = _workflow_fixture("build_echo_workflow")
+
+        state = AgentFrameworkState(build_echo_workflow)
+
+        target = await state.get_target()
+        assert isinstance(target, Workflow)
diff --git a/python/samples/04-hosting/af-hosting/local_responses/README.md b/python/samples/04-hosting/af-hosting/local_responses/README.md
index 2ffcf5642da..31e4a2d5412 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/README.md
+++ b/python/samples/04-hosting/af-hosting/local_responses/README.md
@@ -21,6 +21,10 @@ What the route demonstrates:
   turn.
 - Produces the AF messages, options, and session id that the route passes to
   `agent.run(...)`.
+- **Aliases** each newly minted response id to the session it was just
+  resolved from. OpenAI's `previous_response_id` rotates every turn, so
+  without this alias step turn 3+ of a conversation would silently resolve to
+  a brand-new, empty session instead of the one from earlier turns.
 
 `app:app` is a module-level FastAPI ASGI app; recommended local launch is
 Hypercorn.
@@ -53,10 +57,12 @@ uv run python call_server.py
 # The client intentionally omits `model`; the app chooses the backing deployment
 # from FOUNDRY_MODEL.
 
-# The script then sends a second turn, "And what about Amsterdam?", using the
-# first `response.id` as `previous_response_id`.
+# The script then sends two more turns, each continuing from the previous
+# turn's `response.id` as `previous_response_id`. The third turn compares the
+# cities from the first two turns, so it only succeeds if the server still
+# remembers that far back in the chain.
 
-# Same two-turn interaction through an Agent Framework Agent backed by
+# Same three-turn interaction through an Agent Framework Agent backed by
 # OpenAIChatClient:
 uv run python call_server_af.py
 ```
diff --git a/python/samples/04-hosting/af-hosting/local_responses/app.py b/python/samples/04-hosting/af-hosting/local_responses/app.py
index e00caa5ccc9..bc399539612 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/app.py
+++ b/python/samples/04-hosting/af-hosting/local_responses/app.py
@@ -91,10 +91,13 @@ def create_agent() -> Agent:
 state = AgentFrameworkState(create_agent, session_store=SessionStore)
 
 
-@app.post("/responses")
+@app.post("/responses", response_model=None)
 async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | StreamingResponse:  # noqa: B008
     """Handle one OpenAI Responses-shaped request."""
-    run = responses_to_run(body)
+    try:
+        run = responses_to_run(body)
+    except ValueError as exc:
+        raise HTTPException(status_code=400, detail=str(exc)) from exc
     session_id = responses_session_id(body)
     response_id = create_response_id()
 
@@ -108,7 +111,16 @@ async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | Streamin
     options_for_run = cast(Any, options)
 
     target = cast(Agent[Any], await state.get_target())
-    session = await state.get_session(session_id or response_id)
+    store = await state.get_session_store()
+    lookup_id = session_id or response_id
+    session = await store.get(lookup_id)
+    if response_id != lookup_id:
+        # `previous_response_id` chaining rotates its id every turn. Alias the
+        # newly minted response id to this turn's session so the next
+        # request (which will send this response's id back as its
+        # `previous_response_id`) still resolves to the same conversation
+        # instead of silently starting a new one.
+        await store.put(response_id, session)
     if run["stream"]:
         stream = target.run(
             run["messages"],
@@ -151,9 +163,7 @@ async def main() -> None:
 if __name__ == "__main__":
     asyncio.run(main())
 
-"""
-Sample output:
-User: What is the weather in Tokyo?
-Agent: Tokyo is clear with a high of 18°C.
-Response ID: resp_...
-"""
+# Sample output:
+# User: What is the weather in Tokyo?
+# Agent: Tokyo is clear with a high of 18°C.
+# Response ID: resp_...
diff --git a/python/samples/04-hosting/af-hosting/local_responses/call_server.py b/python/samples/04-hosting/af-hosting/local_responses/call_server.py
index 7066e9e7ac5..648e7fc9868 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/call_server.py
+++ b/python/samples/04-hosting/af-hosting/local_responses/call_server.py
@@ -15,8 +15,10 @@
 
     uv run python call_server.py
 
-The script sends a follow-up turn ("And what about Amsterdam?") using the
-first response's ``response.id`` as ``previous_response_id``.
+The script sends two follow-up turns, each continuing from the previous
+turn's ``response.id`` as ``previous_response_id``. The third turn compares
+the cities from the first *two* turns, so it also exercises session
+continuity across a rotating response id chain, not just a single hop.
 """
 
 from __future__ import annotations
@@ -26,6 +28,7 @@
 BASE_URL = "http://127.0.0.1:8000"
 PROMPT = "What is the weather in Tokyo?"
 FOLLOW_UP_PROMPT = "And what about Amsterdam?"
+THIRD_PROMPT = "Which of the two cities we just discussed is warmer?"
 
 
 def main() -> None:
@@ -46,6 +49,15 @@ def main() -> None:
     print(f"Agent: {follow_up.output_text}")
     print(f"Response ID: {follow_up.id}")
 
+    third = client.responses.create(
+        input=THIRD_PROMPT,
+        previous_response_id=follow_up.id,
+    )
+    print()
+    print(f"User: {THIRD_PROMPT}")
+    print(f"Agent: {third.output_text}")
+    print(f"Response ID: {third.id}")
+
 
 if __name__ == "__main__":
     main()
diff --git a/python/samples/04-hosting/af-hosting/local_responses/call_server_af.py b/python/samples/04-hosting/af-hosting/local_responses/call_server_af.py
index 3c93a88c748..078087c0912 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/call_server_af.py
+++ b/python/samples/04-hosting/af-hosting/local_responses/call_server_af.py
@@ -4,14 +4,18 @@
 
 Creates a local :class:`agent_framework.Agent` backed by
 :class:`agent_framework.openai.OpenAIChatClient` and points that client at the
-hosted ``/responses`` endpoint for both turns:
+hosted ``/responses`` endpoint for all turns:
 
 1. ``What is the weather in Tokyo?``
 2. ``And what about Amsterdam?``
+3. ``Which of the two cities we just discussed is warmer?``
 
-Both turns use the same :class:`agent_framework.AgentSession`; the first
-turn binds the hosted response id to the session, and the second turn
-continues through that session.
+All turns use the same :class:`agent_framework.AgentSession`; the first turn
+binds the hosted response id to the session, and later turns continue through
+that session via a chain of rotating ``previous_response_id`` values. The
+third turn only makes sense if the server still remembers the first turn, so
+it also exercises session continuity across that whole chain, not just a
+single hop.
 
 Start the server first (in another shell)::
 
@@ -33,6 +37,7 @@
 PROMPTS = [
     "What is the weather in Tokyo?",
     "And what about Amsterdam?",
+    "Which of the two cities we just discussed is warmer?",
 ]
 
 
diff --git a/python/uv.lock b/python/uv.lock
index 0fe3298f2a3..af07359e37d 100644
--- a/python/uv.lock
+++ b/python/uv.lock
@@ -677,6 +677,12 @@ dependencies = [
     { name = "openai", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" },
 ]
 
+[package.dev-dependencies]
+dev = [
+    { name = "fastapi", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" },
+    { name = "httpx", marker = "sys_platform == 'darwin' or sys_platform == 'linux' or sys_platform == 'win32'" },
+]
+
 [package.metadata]
 requires-dist = [
     { name = "agent-framework-core", editable = "packages/core" },
@@ -684,6 +690,12 @@ requires-dist = [
     { name = "openai", specifier = ">=1.99.0,<3" },
 ]
 
+[package.metadata.requires-dev]
+dev = [
+    { name = "fastapi", specifier = ">=0.115.0,<0.138.1" },
+    { name = "httpx", specifier = ">=0.28.1" },
+]
+
 [[package]]
 name = "agent-framework-hosting-telegram"
 version = "1.0.0a260625"

From 2d3d920c0da17f72e2c7c19a5cff151b403c7d8a Mon Sep 17 00:00:00 2001
From: eavanvalkenburg <github@vanvalkenburg.eu>
Date: Fri, 3 Jul 2026 10:03:57 +0200
Subject: [PATCH 3/7] Simplify session-continuity aliasing: fold put() into
 get()

Per feedback: the growth of SessionStore was not the problem -- it's
intentional, since OpenAI's previous_response_id is designed to let a
caller continue (fork) from any earlier response, not just the latest
one, so every response id has to stay independently resolvable. That
part stays as-is.

What was too complex was the call site: routes had to manually fetch a
session and then conditionally alias it with a separate put() call.
Folded that into a single get(session_id, alias=...) call instead:

- SessionStore.get() gains an optional `alias` keyword that registers an
  additional id for the same session in the same call (no-op if alias is
  None or equal to session_id). Removed the separate put() method.
- AgentFrameworkState.get_session() passes `alias` through.
- local_responses sample and the HTTP round-trip integration tests now
  do `await state.get_session(lookup_id, alias=response_id)` instead of
  pulling the store out and orchestrating get()/put() by hand.
- Documented that this in-memory SessionStore intentionally never evicts
  (by design, to support forking), and that a storage-backed replacement
  (Redis, a database, ...) is responsible for its own TTL/eviction
  policy.

Verified against a live Foundry model across a 3-turn previous_response_id
chain after the simplification.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../hosting_responses/test_http_round_trip.py |  9 +--
 python/packages/hosting/README.md             | 19 +++++--
 .../hosting/agent_framework_hosting/_state.py | 55 ++++++++++---------
 .../hosting/tests/hosting/test_state.py       | 15 ++++-
 .../af-hosting/local_responses/README.md      |  8 ++-
 .../af-hosting/local_responses/app.py         | 14 ++---
 6 files changed, 69 insertions(+), 51 deletions(-)

diff --git a/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py b/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
index 4955f3040d2..c7c5ee4159d 100644
--- a/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
+++ b/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
@@ -127,13 +127,10 @@ async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | Streamin
         response_id = create_response_id()
 
         target = await state.get_target()
-        store = await state.get_session_store()
         lookup_id = session_id or response_id
-        session = await store.get(lookup_id)
-        if response_id != lookup_id:
-            # Alias the newly minted response id to this turn's session, same
-            # as the sample, so the next `previous_response_id` still resolves.
-            await store.put(response_id, session)
+        # Alias the newly minted response id to this turn's session, same as
+        # the sample, so a later `previous_response_id` still resolves.
+        session = await state.get_session(lookup_id, alias=response_id)
 
         if run["stream"]:
             stream = target.run(run["messages"], stream=True, session=session)
diff --git a/python/packages/hosting/README.md b/python/packages/hosting/README.md
index 032fddd3908..06e960edb73 100644
--- a/python/packages/hosting/README.md
+++ b/python/packages/hosting/README.md
@@ -7,17 +7,26 @@ This package keeps Agent Framework state separate from web-framework concerns:
 - `AgentFrameworkState` — stores an agent/workflow target and optional session
   state for routes that the app owns.
 - `SessionStore` — maps an app-selected session id to an `AgentSession` for
-  non-persisted servers. `get`/`reset` manage a session by its own id; `put`
-  aliases an *additional* id to an already-resolved session — useful when a
-  protocol's continuation id rotates every turn (for example, OpenAI
-  Responses' `previous_response_id`) and a later request needs to resolve the
-  new id back to the same conversation.
+  non-persisted servers. `get(session_id, alias=...)` resolves (creating if
+  needed) and, in the same call, can register an *additional* id for the same
+  session — useful when a protocol's continuation id rotates every turn (for
+  example, OpenAI Responses' `previous_response_id`, which by design lets a
+  caller continue from any earlier point, not just the latest turn) and a
+  later request needs to resolve the new id back to the same conversation.
+  `reset` forgets only the id it is given; other ids aliased to the same session still resolve to it.
 - Existing experimental channel-hosting types remain available while the package
   is unreleased, but the v1 direction is protocol helpers plus app-owned routes.
 
 Use FastAPI, Starlette, Azure Functions, Django, or another framework for route
 registration, auth, middleware, response construction, and background work.
 
+> The built-in `SessionStore` is an in-memory `dict` with no eviction — every
+> id it has ever seen (including aliases) stays resolvable until it is `reset`
+> or the process exits, which is intentional for the reasons above. If you back
+> a `SessionStore`-shaped store with real storage (Redis, a database, ...), you
+> are responsible for that store's own TTL/eviction policy; this reference
+> implementation does not model that concern.
+
 ## Quickstart
 
 ```python
diff --git a/python/packages/hosting/agent_framework_hosting/_state.py b/python/packages/hosting/agent_framework_hosting/_state.py
index cb6aa6218b7..007e55397d8 100644
--- a/python/packages/hosting/agent_framework_hosting/_state.py
+++ b/python/packages/hosting/agent_framework_hosting/_state.py
@@ -16,6 +16,16 @@ class SessionStore:
     instances. The id is an opaque partition key; callers are responsible for
     deciding whether it came from a trusted request field, platform context, or
     other route-local state.
+
+    This reference implementation is a plain ``dict`` with no eviction: every
+    id ever seen stays resolvable until :meth:`reset` or process exit. That is
+    intentional here (protocols such as OpenAI Responses'
+    ``previous_response_id`` let a caller continue from *any* earlier point in
+    a conversation, not just the latest turn, so every id needs to stay
+    independently addressable -- see :meth:`get`'s ``alias`` argument).
+    A storage-backed replacement (Redis, a database, ...) should apply its own
+    TTL/eviction policy for these ids; this in-memory store does not model
+    that concern.
     """
 
     def __init__(self, agent: SupportsAgentRun) -> None:
@@ -28,12 +38,21 @@ def __init__(self, agent: SupportsAgentRun) -> None:
         self.agent = agent
         self._sessions: dict[str, AgentSession] = {}
 
-    async def get(self, session_id: str) -> AgentSession:
+    async def get(self, session_id: str, *, alias: str | None = None) -> AgentSession:
         """Return the session for ``session_id``, creating it when needed.
 
         Args:
             session_id: Opaque app-selected session id.
 
+        Keyword Args:
+            alias: Optional additional id to register for the same session in
+                one call, for example a freshly minted id that the next
+                request will present instead of ``session_id``. A no-op when
+                ``alias`` is ``None``, empty, or equal to ``session_id``. Callers that
+                want a single stable key for a whole conversation instead of
+                per-turn aliases should use a stable id (such as a
+                ``conversation_id``) as ``session_id`` and skip ``alias``.
+
         Returns:
             The cached or newly created ``AgentSession``.
 
@@ -44,7 +63,10 @@ async def get(self, session_id: str) -> AgentSession:
             raise ValueError("session_id must be a non-empty string")
         if session_id not in self._sessions:
             self._sessions[session_id] = self.agent.create_session(session_id=session_id)
-        return self._sessions[session_id]
+        session = self._sessions[session_id]
+        if alias and alias != session_id:
+            self._sessions[alias] = session
+        return session
 
     async def reset(self, session_id: str) -> None:
         """Forget the current session for ``session_id``.
@@ -59,27 +81,6 @@ async def reset(self, session_id: str) -> None:
             raise ValueError("session_id must be a non-empty string")
         self._sessions.pop(session_id, None)
 
-    async def put(self, session_id: str, session: AgentSession) -> None:
-        """Associate an existing ``session`` with an additional ``session_id``.
-
-        Use this to alias a rotating protocol id (for example, a freshly
-        minted response id) to a session that was already looked up under a
-        different, prior id. Protocols whose continuation id changes every
-        turn (such as OpenAI Responses' ``previous_response_id`` chaining)
-        need this so a later request referencing the new id still resolves
-        to the same conversation instead of starting a fresh session.
-
-        Args:
-            session_id: Opaque app-selected session id to associate.
-            session: The session to associate with ``session_id``.
-
-        Raises:
-            ValueError: If ``session_id`` is empty.
-        """
-        if not session_id:
-            raise ValueError("session_id must be a non-empty string")
-        self._sessions[session_id] = session
-
 
 TargetT = TypeVar("TargetT", bound="SupportsAgentRun | Workflow")
 SessionStoreFactory = Callable[[SupportsAgentRun], SessionStore]
@@ -228,17 +229,21 @@ async def get_session_store(self) -> SessionStore:
             self._cached_session_store = store
         return store
 
-    async def get_session(self, session_id: str) -> AgentSession:
+    async def get_session(self, session_id: str, *, alias: str | None = None) -> AgentSession:
         """Return the session for ``session_id`` from the current store.
 
         Args:
             session_id: Opaque app-selected session id.
 
+        Keyword Args:
+            alias: Optional additional id to register for the same session in
+                one call. See :meth:`SessionStore.get`.
+
         Returns:
             The cached or newly created ``AgentSession``.
         """
         store = await self.get_session_store()
-        return await store.get(session_id)
+        return await store.get(session_id, alias=alias)
 
     async def reset_session(self, session_id: str) -> None:
         """Forget the current session for ``session_id``.
diff --git a/python/packages/hosting/tests/hosting/test_state.py b/python/packages/hosting/tests/hosting/test_state.py
index f09c9b9f758..f920803bd2c 100644
--- a/python/packages/hosting/tests/hosting/test_state.py
+++ b/python/packages/hosting/tests/hosting/test_state.py
@@ -135,18 +135,27 @@ async def test_put_aliases_new_id_to_existing_session(self) -> None:
         store = SessionStore(agent)
 
         session = await store.get("resp_1")
-        await store.put("resp_2", session)
+        aliased = await store.get("resp_1", alias="resp_2")
 
+        assert aliased is session
         assert await store.get("resp_2") is session
         # Aliasing did not create a second session via the agent.
         assert len(agent.created_sessions) == 1
 
+    async def test_alias_equal_to_session_id_is_a_no_op(self) -> None:
+        agent = _FakeAgent()
+        store = SessionStore(agent)
+
+        session = await store.get("resp_1", alias="resp_1")
+
+        assert session.session_id == "resp_1"
+        assert len(agent.created_sessions) == 1
+
     async def test_put_empty_session_id_raises(self) -> None:
         store = SessionStore(_FakeAgent())
-        session = await store.get("resp_1")
 
         with pytest.raises(ValueError, match="session_id"):
-            await store.put("", session)
+            await store.get("", alias="resp_2")
 
 
 class TestAgentFrameworkState:
diff --git a/python/samples/04-hosting/af-hosting/local_responses/README.md b/python/samples/04-hosting/af-hosting/local_responses/README.md
index 31e4a2d5412..943c040d5db 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/README.md
+++ b/python/samples/04-hosting/af-hosting/local_responses/README.md
@@ -22,9 +22,11 @@ What the route demonstrates:
 - Produces the AF messages, options, and session id that the route passes to
   `agent.run(...)`.
 - **Aliases** each newly minted response id to the session it was just
-  resolved from. OpenAI's `previous_response_id` rotates every turn, so
-  without this alias step turn 3+ of a conversation would silently resolve to
-  a brand-new, empty session instead of the one from earlier turns.
+  resolved from, via `state.get_session(lookup_id, alias=response_id)`.
+  OpenAI's `previous_response_id` rotates every turn *by design* — it lets a
+  caller continue from any earlier response, not just the latest one — so
+  every response id needs to stay independently resolvable, not just the
+  most recent.
 
 `app:app` is a module-level FastAPI ASGI app; recommended local launch is
 Hypercorn.
diff --git a/python/samples/04-hosting/af-hosting/local_responses/app.py b/python/samples/04-hosting/af-hosting/local_responses/app.py
index bc399539612..3b692ec98d9 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/app.py
+++ b/python/samples/04-hosting/af-hosting/local_responses/app.py
@@ -111,16 +111,12 @@ async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | Streamin
     options_for_run = cast(Any, options)
 
     target = cast(Agent[Any], await state.get_target())
-    store = await state.get_session_store()
     lookup_id = session_id or response_id
-    session = await store.get(lookup_id)
-    if response_id != lookup_id:
-        # `previous_response_id` chaining rotates its id every turn. Alias the
-        # newly minted response id to this turn's session so the next
-        # request (which will send this response's id back as its
-        # `previous_response_id`) still resolves to the same conversation
-        # instead of silently starting a new one.
-        await store.put(response_id, session)
+    # `previous_response_id` chaining rotates its id every turn, and OpenAI's
+    # Responses API deliberately lets a caller continue from *any* earlier
+    # response, not just the latest one -- so the newly minted response id
+    # also needs to resolve back to this session on a later request.
+    session = await state.get_session(lookup_id, alias=response_id)
     if run["stream"]:
         stream = target.run(
             run["messages"],

From 76c4faad240a726db4f03e1292ec8453e43a1a93 Mon Sep 17 00:00:00 2001
From: eavanvalkenburg <github@vanvalkenburg.eu>
Date: Fri, 3 Jul 2026 11:22:12 +0200
Subject: [PATCH 4/7] Refine hosting state helpers

Split the shared state surface into AgentState and WorkflowState, keep SessionStore and CheckpointStore as plain storage, and make state helpers responsible for get-or-create behavior. Update the Responses sample and HTTP round-trip tests to store the post-run session explicitly under the minted response id, and accept WorkflowBuilder/orchestration-style builders through a structural build() protocol.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 python/packages/hosting-responses/README.md   |   8 +-
 .../hosting_responses/test_http_round_trip.py |  23 +-
 python/packages/hosting/README.md             |  81 +++-
 .../agent_framework_hosting/__init__.py       |  15 +-
 .../hosting/agent_framework_hosting/_state.py | 434 +++++++++++-------
 .../tests/hosting/_workflow_fixtures.py       |   5 +
 .../hosting/tests/hosting/test_state.py       | 251 ++++++----
 .../af-hosting/local_responses/README.md      |   5 +-
 .../af-hosting/local_responses/app.py         |  35 +-
 9 files changed, 571 insertions(+), 286 deletions(-)

diff --git a/python/packages/hosting-responses/README.md b/python/packages/hosting-responses/README.md
index 956d59f516f..dd6a121a30e 100644
--- a/python/packages/hosting-responses/README.md
+++ b/python/packages/hosting-responses/README.md
@@ -18,7 +18,7 @@ FastAPI/Starlette/Django/Azure Functions code owns route registration,
 authentication, status codes, response construction, and background work.
 
 ```python
-from agent_framework_hosting import AgentFrameworkState, SessionStore
+from agent_framework_hosting import AgentState
 from agent_framework_hosting_responses import (
     create_response_id,
     responses_from_run,
@@ -29,7 +29,7 @@ from fastapi import Body, FastAPI
 from fastapi.responses import JSONResponse
 
 app = FastAPI()
-state = AgentFrameworkState(agent, session_store=SessionStore)
+state = AgentState(agent)
 
 
 @app.post("/responses")
@@ -37,11 +37,13 @@ async def responses(body: dict = Body(...)) -> JSONResponse:
     run = responses_to_run(body)
     session_id = responses_session_id(body)
     response_id = create_response_id()
+    session = await state.get_or_create_session(session_id or response_id)
     result = await (await state.get_target()).run(
         run["messages"],
-        session=await state.get_session(session_id or response_id),
+        session=session,
         options=run["options"],
     )
+    await state.session_store.set(response_id, session)
     return JSONResponse(responses_from_run(result, response_id=response_id, session_id=session_id))
 ```
 
diff --git a/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py b/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
index c7c5ee4159d..f1efb1616bc 100644
--- a/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
+++ b/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
@@ -4,7 +4,7 @@
 
 These exercise the same wiring as the `local_responses` sample: helpers from
 `agent_framework_hosting_responses` convert between the Responses protocol and
-Agent Framework run values, `agent_framework_hosting`'s `AgentFrameworkState` /
+Agent Framework run values, `agent_framework_hosting`'s `AgentState` /
 `SessionStore` hold shared execution state, and a small FastAPI route owns
 everything else (parsing, policy, response construction). Requests go through
 `httpx.AsyncClient` with `ASGITransport` -- no real server process or live
@@ -27,7 +27,7 @@
     Message,
     ResponseStream,
 )
-from agent_framework_hosting import AgentFrameworkState, SessionStore
+from agent_framework_hosting import AgentState
 from fastapi import Body, FastAPI, HTTPException
 from fastapi.responses import JSONResponse, StreamingResponse
 
@@ -115,7 +115,7 @@ async def _get_response() -> AgentResponse[Any]:
 def _build_app(agent: _StubAgent) -> FastAPI:
     """Build a minimal FastAPI app mirroring the `local_responses` sample's route."""
     app = FastAPI()
-    state = AgentFrameworkState(agent, session_store=SessionStore)
+    state = AgentState(agent)
 
     @app.post("/responses", response_model=None)
     async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | StreamingResponse:  # noqa: B008
@@ -128,20 +128,29 @@ async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | Streamin
 
         target = await state.get_target()
         lookup_id = session_id or response_id
-        # Alias the newly minted response id to this turn's session, same as
-        # the sample, so a later `previous_response_id` still resolves.
-        session = await state.get_session(lookup_id, alias=response_id)
+        session = await state.get_or_create_session(lookup_id)
 
         if run["stream"]:
             stream = target.run(run["messages"], stream=True, session=session)
             if not isinstance(stream, ResponseStream):
                 raise HTTPException(status_code=500, detail="agent did not return a response stream")
+
+            async def stream_events() -> AsyncIterator[str]:
+                async for event in responses_stream_events_from_run(
+                    stream,
+                    response_id=response_id,
+                    session_id=session_id,
+                ):
+                    yield event
+                await state.session_store.set(response_id, session)
+
             return StreamingResponse(
-                responses_stream_events_from_run(stream, response_id=response_id, session_id=session_id),
+                stream_events(),
                 media_type="text/event-stream",
             )
 
         result = await target.run(run["messages"], session=session)
+        await state.session_store.set(response_id, session)
         return JSONResponse(responses_from_run(result, response_id=response_id, session_id=session_id))
 
     return app
diff --git a/python/packages/hosting/README.md b/python/packages/hosting/README.md
index 06e960edb73..5217ac39e94 100644
--- a/python/packages/hosting/README.md
+++ b/python/packages/hosting/README.md
@@ -4,50 +4,89 @@ Shared execution-state helpers for app-owned Agent Framework hosting.
 
 This package keeps Agent Framework state separate from web-framework concerns:
 
-- `AgentFrameworkState` — stores an agent/workflow target and optional session
-  state for routes that the app owns.
-- `SessionStore` — maps an app-selected session id to an `AgentSession` for
-  non-persisted servers. `get(session_id, alias=...)` resolves (creating if
-  needed) and, in the same call, can register an *additional* id for the same
-  session — useful when a protocol's continuation id rotates every turn (for
-  example, OpenAI Responses' `previous_response_id`, which by design lets a
-  caller continue from any earlier point, not just the latest turn) and a
-  later request needs to resolve the new id back to the same conversation.
-  `reset` forgets a session by its own id.
+- `AgentState` — pairs an agent target with a `SessionStore`
+  (`session_id -> AgentSession`).
+- `WorkflowState` — pairs a workflow target with a `CheckpointStore`
+  (`session_id -> CheckpointStorage`).
+
+Both stores are plain storage: `get`/`set`/`delete` by an app-selected id,
+nothing more. Neither one knows how to create a new value for an id it
+hasn't seen before — use `AgentState.get_or_create_session(...)` /
+`WorkflowState.get_or_create_checkpoint_storage(...)` for that, since only
+the state object has both the store and the resolved target.
+
 - Existing experimental channel-hosting types remain available while the package
   is unreleased, but the v1 direction is protocol helpers plus app-owned routes.
 
 Use FastAPI, Starlette, Azure Functions, Django, or another framework for route
 registration, auth, middleware, response construction, and background work.
 
-> The built-in `SessionStore` is an in-memory `dict` with no eviction — every
-> id it has ever seen (including aliases) stays resolvable for the life of the
-> process, which is intentional for the reasons above. If you back a
-> `SessionStore`-shaped store with real storage (Redis, a database, ...), you
-> are responsible for that store's own TTL/eviction policy; this reference
-> implementation does not model that concern.
+> The built-in `SessionStore` / `CheckpointStore` are in-memory `dict`s with
+> no eviction — every id ever stored stays resolvable for the life of the
+> process. That is intentional: protocols such as OpenAI Responses'
+> `previous_response_id` are designed to let a caller continue from *any*
+> earlier point in a conversation, not just the latest turn, so every id
+> handed out needs to stay independently resolvable. If you back either
+> store with real storage (Redis, a database, ...), you are responsible for
+> that store's own TTL/eviction policy; these in-memory reference
+> implementations do not model that concern.
 
 ## Quickstart
 
 ```python
 from agent_framework.openai import OpenAIChatClient
-from agent_framework_hosting import AgentFrameworkState, SessionStore
+from agent_framework_hosting import AgentState
 
 agent = OpenAIChatClient().as_agent(name="Assistant")
-state = AgentFrameworkState(agent, session_store=SessionStore)
+state = AgentState(agent)
 
-session = await state.get_session("conversation-1")
+session = await state.get_or_create_session("conversation-1")
 result = await (await state.get_target()).run("Hello", session=session)
 ```
 
+If a protocol mints a new continuation id on every response, store the session
+under that new id explicitly, after `run(...)` returns. `run(...)` may update the
+session, so the object you store should be the post-run one:
+
+```python
+session = await state.get_or_create_session(previous_response_id)
+result = await (await state.get_target()).run("Hello", session=session)
+await state.session_store.set(response_id, session)
+```
+
 Targets can be direct instances, synchronous factories, asynchronous factories,
 or awaitables:
 
 ```python
-state = AgentFrameworkState(create_agent)  # cached by default
-state = AgentFrameworkState(create_agent, cache_target=False)
+state = AgentState(create_agent)  # cached by default
+state = AgentState(create_agent, cache_target=False)
+```
+
+`WorkflowState` mirrors this shape for workflow targets:
+
+```python
+from agent_framework_hosting import WorkflowState
+
+state = WorkflowState(create_workflow)
+storage = await state.get_or_create_checkpoint_storage("conversation-1")
+result = await (await state.get_target()).run("Hello", checkpoint_storage=storage)
 ```
 
+`WorkflowState` also accepts an unbuilt workflow builder directly:
+
+```python
+from agent_framework import WorkflowBuilder
+from agent_framework_hosting import WorkflowState
+
+builder = WorkflowBuilder(start_executor=executor)
+state = WorkflowState(builder)  # calls builder.build() when the target is resolved
+```
+
+This is structural: orchestration builders from `agent_framework_orchestrations`
+(`SequentialBuilder`, `ConcurrentBuilder`, `HandoffBuilder`, `GroupChatBuilder`,
+and `MagenticBuilder`) also work because they expose the same zero-argument
+`build() -> Workflow` method.
+
 Cross-channel identity linking, multicast delivery, background runs,
 continuation tokens, and durable delivery runners are follow-up enhancements,
 not part of this v1 state surface.
diff --git a/python/packages/hosting/agent_framework_hosting/__init__.py b/python/packages/hosting/agent_framework_hosting/__init__.py
index cb5ed5567fd..99d98367573 100644
--- a/python/packages/hosting/agent_framework_hosting/__init__.py
+++ b/python/packages/hosting/agent_framework_hosting/__init__.py
@@ -20,7 +20,15 @@
     reset_current_isolation_keys,
     set_current_isolation_keys,
 )
-from ._state import AgentFrameworkState, AgentRunArgs, SessionStore, WorkflowRunArgs
+from ._state import (
+    AgentRunArgs,
+    AgentState,
+    CheckpointStore,
+    SessionStore,
+    SupportsBuild,
+    WorkflowRunArgs,
+    WorkflowState,
+)
 from ._types import (
     Channel,
     ChannelCommand,
@@ -45,8 +53,8 @@
     "ISOLATION_HEADER_CHAT",
     "ISOLATION_HEADER_USER",
     "AgentFrameworkHost",
-    "AgentFrameworkState",
     "AgentRunArgs",
+    "AgentState",
     "Channel",
     "ChannelCommand",
     "ChannelCommandContext",
@@ -58,11 +66,14 @@
     "ChannelRunHook",
     "ChannelSession",
     "ChannelStreamUpdateHook",
+    "CheckpointStore",
     "HostStatePaths",
     "HostedRunResult",
     "IsolationKeys",
     "SessionStore",
+    "SupportsBuild",
     "WorkflowRunArgs",
+    "WorkflowState",
     "__version__",
     "get_current_isolation_keys",
     "logger",
diff --git a/python/packages/hosting/agent_framework_hosting/_state.py b/python/packages/hosting/agent_framework_hosting/_state.py
index 007e55397d8..a16a30c4706 100644
--- a/python/packages/hosting/agent_framework_hosting/_state.py
+++ b/python/packages/hosting/agent_framework_hosting/_state.py
@@ -1,75 +1,126 @@
 # Copyright (c) Microsoft. All rights reserved.
 
+"""Shared execution state for app-owned hosting routes.
+
+Two independent state holders, one per target kind, since agents and
+workflows keep different continuation state:
+
+- ``AgentState`` pairs an agent target with a ``SessionStore``
+  (``session_id -> AgentSession``).
+- ``WorkflowState`` pairs a workflow target with a ``CheckpointStore``
+  (``session_id -> CheckpointStorage``).
+
+Both stores are plain storage: they only get/set/delete what they are given.
+Neither one knows how to create a new value for a ``session_id`` it hasn't
+seen before -- that is the corresponding state object's job (see
+``AgentState.get_or_create_session`` / ``WorkflowState.get_or_create_checkpoint_storage``),
+since only the state object has both the store and the resolved target.
+"""
+
 from __future__ import annotations
 
 import inspect
 from collections.abc import Awaitable, Callable, Mapping
-from typing import Any, Generic, TypedDict, TypeVar, overload
+from typing import Any, Generic, Protocol, TypedDict, TypeVar, cast, runtime_checkable
 
-from agent_framework import AgentRunInputs, AgentSession, ChatOptions, SupportsAgentRun, Workflow
+from agent_framework import (
+    AgentRunInputs,
+    AgentSession,
+    ChatOptions,
+    CheckpointStorage,
+    InMemoryCheckpointStorage,
+    SupportsAgentRun,
+    Workflow,
+)
 
 
 class SessionStore:
-    """In-memory session lookup for non-persisted servers.
-
-    The store maps application-selected session ids to ``AgentSession``
-    instances. The id is an opaque partition key; callers are responsible for
-    deciding whether it came from a trusted request field, platform context, or
-    other route-local state.
-
-    This reference implementation is a plain ``dict`` with no eviction: every
-    id ever seen stays resolvable for the life of the process. That is
-    intentional here (protocols such as OpenAI Responses'
-    ``previous_response_id`` let a caller continue from *any* earlier point in
-    a conversation, not just the latest turn, so every id needs to stay
-    independently addressable -- see :meth:`get`'s ``alias`` argument).
-    A storage-backed replacement (Redis, a database, ...) should apply its own
-    TTL/eviction policy for these ids; this in-memory store does not model
-    that concern.
+    """Plain in-memory ``session_id -> AgentSession`` lookup.
+
+    This store only stores and retrieves; it does not create sessions. Use
+    :meth:`AgentState.get_or_create_session` for that -- it resolves the
+    agent target and calls ``target.create_session(...)`` the first time a
+    given ``session_id`` is seen, then stores the result here.
+
+    No eviction: every id ever stored stays resolvable for the life of the
+    process. That is intentional -- protocols such as OpenAI Responses'
+    ``previous_response_id`` are designed to let a caller continue from *any*
+    earlier point in a conversation, not just the latest turn, so every id
+    that has been handed out needs to stay independently resolvable. If you
+    back a ``SessionStore``-shaped store with real storage (Redis, a
+    database, ...), you are responsible for that store's own TTL/eviction
+    policy; this in-memory reference implementation does not model that
+    concern.
     """
 
-    def __init__(self, agent: SupportsAgentRun) -> None:
-        """Create a session store for ``agent``.
+    def __init__(self) -> None:
+        """Create an empty session store."""
+        self._sessions: dict[str, AgentSession] = {}
+
+    async def get(self, session_id: str) -> AgentSession | None:
+        """Return the stored session for ``session_id``, or ``None`` if absent.
 
         Args:
-            agent: The agent that creates sessions when a session id is first
-                observed.
+            session_id: Opaque app-selected session id.
+
+        Raises:
+            ValueError: If ``session_id`` is empty.
         """
-        self.agent = agent
-        self._sessions: dict[str, AgentSession] = {}
+        if not session_id:
+            raise ValueError("session_id must be a non-empty string")
+        return self._sessions.get(session_id)
 
-    async def get(self, session_id: str, *, alias: str | None = None) -> AgentSession:
-        """Return the session for ``session_id``, creating it when needed.
+    async def set(self, session_id: str, session: AgentSession) -> None:
+        """Store ``session`` under ``session_id``, replacing any existing entry.
 
         Args:
             session_id: Opaque app-selected session id.
+            session: The session to store.
 
-        Keyword Args:
-            alias: Optional additional id to register for the same session in
-                one call, for example a freshly minted id that the next
-                request will present instead of ``session_id``. A no-op when
-                ``alias`` is ``None`` or equal to ``session_id``. Callers that
-                want a single stable key for a whole conversation instead of
-                per-turn aliases should use a stable id (such as a
-                ``conversation_id``) as ``session_id`` and skip ``alias``.
+        Raises:
+            ValueError: If ``session_id`` is empty.
+        """
+        if not session_id:
+            raise ValueError("session_id must be a non-empty string")
+        self._sessions[session_id] = session
 
-        Returns:
-            The cached or newly created ``AgentSession``.
+    async def delete(self, session_id: str) -> None:
+        """Forget the stored session for ``session_id``, if any.
+
+        Args:
+            session_id: Opaque app-selected session id.
 
         Raises:
             ValueError: If ``session_id`` is empty.
         """
         if not session_id:
             raise ValueError("session_id must be a non-empty string")
-        if session_id not in self._sessions:
-            self._sessions[session_id] = self.agent.create_session(session_id=session_id)
-        session = self._sessions[session_id]
-        if alias and alias != session_id:
-            self._sessions[alias] = session
-        return session
+        self._sessions.pop(session_id, None)
+
+
+class CheckpointStore:
+    """Plain in-memory ``session_id -> CheckpointStorage`` lookup.
 
-    async def reset(self, session_id: str) -> None:
-        """Forget the current session for ``session_id``.
+    Maps an app-selected session id to a :class:`CheckpointStorage` scoped to
+    that conversation. This store only stores and retrieves; it does not
+    decide which checkpoint within that storage to resume from. Use
+    :meth:`WorkflowState.get_or_create_checkpoint_storage` to create a fresh
+    ``CheckpointStorage`` the first time a given ``session_id`` is seen.
+
+    Resuming a prior run is a separate, run-time decision the route makes:
+    call ``storage.get_latest(workflow_name=...)`` yourself and pass its
+    ``checkpoint_id`` into ``workflow.run(checkpoint_id=..., checkpoint_storage=storage)``.
+
+    No eviction, for the same reason as :class:`SessionStore` -- see that
+    class's docstring.
+    """
+
+    def __init__(self) -> None:
+        """Create an empty checkpoint store."""
+        self._storages: dict[str, CheckpointStorage] = {}
+
+    async def get(self, session_id: str) -> CheckpointStorage | None:
+        """Return the stored checkpoint storage for ``session_id``, or ``None`` if absent.
 
         Args:
             session_id: Opaque app-selected session id.
@@ -79,11 +130,52 @@ async def reset(self, session_id: str) -> None:
         """
         if not session_id:
             raise ValueError("session_id must be a non-empty string")
-        self._sessions.pop(session_id, None)
+        return self._storages.get(session_id)
 
+    async def set(self, session_id: str, storage: CheckpointStorage) -> None:
+        """Store ``storage`` under ``session_id``, replacing any existing entry.
 
-TargetT = TypeVar("TargetT", bound="SupportsAgentRun | Workflow")
-SessionStoreFactory = Callable[[SupportsAgentRun], SessionStore]
+        Args:
+            session_id: Opaque app-selected session id.
+            storage: The checkpoint storage to store.
+
+        Raises:
+            ValueError: If ``session_id`` is empty.
+        """
+        if not session_id:
+            raise ValueError("session_id must be a non-empty string")
+        self._storages[session_id] = storage
+
+    async def delete(self, session_id: str) -> None:
+        """Forget the stored checkpoint storage for ``session_id``, if any.
+
+        Args:
+            session_id: Opaque app-selected session id.
+
+        Raises:
+            ValueError: If ``session_id`` is empty.
+        """
+        if not session_id:
+            raise ValueError("session_id must be a non-empty string")
+        self._storages.pop(session_id, None)
+
+
+AgentT = TypeVar("AgentT", bound=SupportsAgentRun)
+WorkflowT = TypeVar("WorkflowT", bound=Workflow)
+
+
+@runtime_checkable
+class SupportsBuild(Protocol):
+    """A builder that produces a ``Workflow`` via a zero-argument ``build()``.
+
+    Matches ``agent_framework.WorkflowBuilder`` and the orchestration
+    builders in ``agent_framework_orchestrations`` (``ConcurrentBuilder``,
+    ``GroupChatBuilder``, ``HandoffBuilder``, ``MagenticBuilder``,
+    ``SequentialBuilder``) structurally, without ``agent-framework-hosting``
+    depending on either package.
+    """
+
+    def build(self) -> Workflow: ...
 
 
 class AgentRunArgs(TypedDict):
@@ -102,99 +194,49 @@ class WorkflowRunArgs(TypedDict):
     stream: bool
 
 
-class AgentFrameworkState(Generic[TargetT]):
-    """Shared execution state for app-owned hosting routes.
+class AgentState(Generic[AgentT]):
+    """Shared execution state for app-owned agent hosting routes.
 
-    ``AgentFrameworkState`` intentionally does not own routes, middleware,
-    protocol dispatch, or native SDK calls. Web frameworks keep those concerns;
-    this object holds the Agent Framework target and optional session store that
-    route code may share.
+    Holds the Agent Framework agent target and a :class:`SessionStore` that
+    route code may share. Does not own routes, middleware, protocol
+    dispatch, or native SDK calls -- web frameworks keep those concerns.
     """
 
-    # `target` accepts an instance, a sync/async factory, or a bare awaitable.
-    # Each shape is declared as its own overload rather than one big union
-    # because type checkers struggle to bind `TargetT` when it appears both
-    # bare and inside `Callable`/`Awaitable` alternatives in a single union
-    # parameter (observed as inference failures across pyright, pyrefly, ty,
-    # and zuban).
-    @overload
-    def __init__(
-        self,
-        target: TargetT,
-        *,
-        session_store: SessionStore | type[SessionStore] | SessionStoreFactory | None = None,
-        cache_target: bool = True,
-    ) -> None: ...
-
-    @overload
     def __init__(
         self,
-        target: Callable[[], TargetT],
+        target: AgentT | Awaitable[AgentT] | Callable[[], AgentT | Awaitable[AgentT]],
         *,
-        session_store: SessionStore | type[SessionStore] | SessionStoreFactory | None = None,
-        cache_target: bool = True,
-    ) -> None: ...
-
-    @overload
-    def __init__(
-        self,
-        target: Callable[[], Awaitable[TargetT]],
-        *,
-        session_store: SessionStore | type[SessionStore] | SessionStoreFactory | None = None,
-        cache_target: bool = True,
-    ) -> None: ...
-
-    @overload
-    def __init__(
-        self,
-        target: Awaitable[TargetT],
-        *,
-        session_store: SessionStore | type[SessionStore] | SessionStoreFactory | None = None,
-        cache_target: bool = True,
-    ) -> None: ...
-
-    def __init__(
-        self,
-        target: TargetT | Awaitable[TargetT] | Callable[[], TargetT | Awaitable[TargetT]],
-        *,
-        session_store: SessionStore | type[SessionStore] | SessionStoreFactory | None = None,
+        session_store: SessionStore | None = None,
         cache_target: bool = True,
     ) -> None:
         """Create shared state for ``target``.
 
         Args:
-            target: Agent or workflow target used by route code. May be a
-                target instance, a synchronous factory, an asynchronous factory,
-                or an awaitable target.
+            target: Agent target used by route code. May be a target
+                instance, a synchronous factory, an asynchronous factory, or
+                an awaitable target.
 
         Keyword Args:
-            session_store: Existing store, store class, or factory. When omitted
-                and ``target`` is an agent, an in-memory ``SessionStore`` is
-                created. Workflow targets do not get a default session store.
-            cache_target: Whether to cache a resolved callable/awaitable target.
-                Defaults to ``True`` so expensive target setup happens once.
+            session_store: Existing store to use. Defaults to a fresh
+                in-memory :class:`SessionStore`.
+            cache_target: Whether to cache a resolved callable/awaitable
+                target. Defaults to ``True`` so expensive target setup
+                happens once.
 
         Raises:
             ValueError: If ``cache_target=False`` is used with a one-shot
                 awaitable target.
-            TypeError: If a session store class/factory is supplied for a
-                workflow target.
         """
         if not cache_target and inspect.isawaitable(target):
             raise ValueError("cache_target=False requires a target instance or callable target factory")
         self._target_source = target
         self._cache_target = cache_target
-        self._cached_target: TargetT | None = None
-        self._session_store_source = session_store
-        self._cached_session_store = session_store if isinstance(session_store, SessionStore) else None
+        self._cached_target: AgentT | None = None
         if not callable(target) and not inspect.isawaitable(target):
             self._cached_target = target
-            if self._cached_session_store is None and isinstance(target, SupportsAgentRun):
-                self._cached_session_store = self._init_session_store(target, session_store)
-            elif session_store is not None and not isinstance(target, SupportsAgentRun):
-                raise TypeError("session_store requires an agent target that supports create_session")
+        self._session_store: SessionStore = session_store if session_store is not None else SessionStore()
 
-    async def get_target(self) -> TargetT:
+    async def get_target(self) -> AgentT:
         """Return the resolved target.
 
         Returns:
@@ -211,51 +253,115 @@ async def get_target(self) -> TargetT:
             self._cached_target = target
         return target
 
-    async def get_session_store(self) -> SessionStore:
-        """Return the session store for the current target.
-
-        Returns:
-            The configured or lazily created ``SessionStore``.
+    @property
+    def target(self) -> AgentT:
+        """Return a synchronously available target.
 
         Raises:
-            TypeError: If the resolved target is not an agent target.
+            RuntimeError: If the target is a callable or awaitable that has not
+                been resolved with :meth:`get_target`.
         """
-        if self._cached_session_store is not None:
-            return self._cached_session_store
+        if self._cached_target is not None:
+            return self._cached_target
+        if not callable(self._target_source) and not inspect.isawaitable(self._target_source):
+            return self._target_source
+        raise RuntimeError("target is resolved asynchronously; use `await state.get_target()`")
 
-        target = await self.get_target()
-        store = self._init_session_store(target, self._session_store_source)
-        if self._cache_target:
-            self._cached_session_store = store
-        return store
+    @property
+    def session_store(self) -> SessionStore:
+        """Return the session store for this state."""
+        return self._session_store
 
-    async def get_session(self, session_id: str, *, alias: str | None = None) -> AgentSession:
-        """Return the session for ``session_id`` from the current store.
+    async def get_or_create_session(self, session_id: str) -> AgentSession:
+        """Return the session for ``session_id``, creating and storing one if missing.
 
         Args:
             session_id: Opaque app-selected session id.
 
-        Keyword Args:
-            alias: Optional additional id to register for the same session in
-                one call. See :meth:`SessionStore.get`.
-
         Returns:
-            The cached or newly created ``AgentSession``.
+            The stored or newly created ``AgentSession``.
         """
-        store = await self.get_session_store()
-        return await store.get(session_id, alias=alias)
+        session = await self._session_store.get(session_id)
+        if session is None:
+            target = await self.get_target()
+            session = target.create_session(session_id=session_id)
+            await self._session_store.set(session_id, session)
+        return session
 
-    async def reset_session(self, session_id: str) -> None:
-        """Forget the current session for ``session_id``.
+
+class WorkflowState(Generic[WorkflowT]):
+    """Shared execution state for app-owned workflow hosting routes.
+
+    Holds the Agent Framework workflow target and a :class:`CheckpointStore`
+    that route code may share. Does not own routes, middleware, protocol
+    dispatch, or native SDK calls -- web frameworks keep those concerns.
+    """
+
+    def __init__(
+        self,
+        target: WorkflowT | SupportsBuild | Awaitable[WorkflowT] | Callable[[], WorkflowT | Awaitable[WorkflowT]],
+        *,
+        checkpoint_store: CheckpointStore | None = None,
+        cache_target: bool = True,
+    ) -> None:
+        """Create shared state for ``target``.
 
         Args:
-            session_id: Opaque app-selected session id.
+            target: Workflow target used by route code. May be a target
+                instance, a ``WorkflowBuilder``-shaped builder (see
+                :class:`SupportsBuild`; the state calls ``build()`` for you),
+                a synchronous factory, an asynchronous factory, or an
+                awaitable target.
+
+        Keyword Args:
+            checkpoint_store: Existing store to use. Defaults to a fresh
+                in-memory :class:`CheckpointStore`.
+            cache_target: Whether to cache a resolved callable/awaitable/built
+                target. Defaults to ``True`` so expensive target setup
+                happens once.
+
+        Raises:
+            ValueError: If ``cache_target=False`` is used with a one-shot
+                awaitable target.
         """
-        store = await self.get_session_store()
-        await store.reset(session_id)
+        if isinstance(target, SupportsBuild):
+            # WorkflowBuilder (and the orchestration builders) are not
+            # themselves callable or awaitable, so normalize to the bound
+            # `build` method -- the resolution logic below already knows how
+            # to treat a zero-arg factory. `build()` is typed to return the
+            # `Workflow` base class rather than this instance's narrower
+            # `WorkflowT`, but it is the same object the caller asked for.
+            target = cast("Callable[[], WorkflowT]", target.build)
+        if not cache_target and inspect.isawaitable(target):
+            raise ValueError("cache_target=False requires a target instance or callable target factory")
+        self._target_source = target
+        self._cache_target = cache_target
+        self._cached_target: WorkflowT | None = None
+        if not callable(target) and not inspect.isawaitable(target):
+            self._cached_target = target
+        self._checkpoint_store: CheckpointStore = (
+            checkpoint_store if checkpoint_store is not None else CheckpointStore()
+        )
+
+    async def get_target(self) -> WorkflowT:
+        """Return the resolved target.
+
+        Returns:
+            The target instance. Callable and awaitable targets are resolved
+            first and cached by default.
+        """
+        if self._cache_target and self._cached_target is not None:
+            return self._cached_target
+
+        target = self._target_source() if callable(self._target_source) else self._target_source
+        if inspect.isawaitable(target):
+            target = await target
+        if self._cache_target:
+            self._cached_target = target
+        return target
 
     @property
-    def target(self) -> TargetT:
+    def target(self) -> WorkflowT:
         """Return a synchronously available target.
 
         Raises:
@@ -269,22 +375,30 @@ def target(self) -> TargetT:
         raise RuntimeError("target is resolved asynchronously; use `await state.get_target()`")
 
     @property
-    def session_store(self) -> SessionStore | None:
-        """Return a synchronously available session store, if one is cached."""
-        return self._cached_session_store
-
-    def _init_session_store(
-        self,
-        target: TargetT,
-        session_store: SessionStore | type[SessionStore] | SessionStoreFactory | None,
-    ) -> SessionStore:
-        if isinstance(session_store, SessionStore):
-            return session_store
-
-        if not isinstance(target, SupportsAgentRun):
-            raise TypeError("session_store requires an agent target that supports create_session")
+    def checkpoint_store(self) -> CheckpointStore:
+        """Return the checkpoint store for this state."""
+        return self._checkpoint_store
+
+    async def get_or_create_checkpoint_storage(self, session_id: str) -> CheckpointStorage:
+        """Return the checkpoint storage for ``session_id``, creating and storing one if missing.
+
+        Unlike an agent, a ``Workflow`` has no ``create_session``-style
+        factory method, so "creating" storage for a new ``session_id`` means
+        allocating a fresh, empty :class:`InMemoryCheckpointStorage` -- there
+        is nothing to restore yet. Pass the returned storage into
+        ``workflow.run(checkpoint_storage=...)``. To resume a prior run for
+        this ``session_id`` instead of starting fresh, call
+        ``storage.get_latest(workflow_name=...)`` yourself first and pass its
+        ``checkpoint_id`` into ``workflow.run(checkpoint_id=..., checkpoint_storage=...)``.
 
-        if session_store is None:
-            return SessionStore(target)
+        Args:
+            session_id: Opaque app-selected session id.
 
-        return session_store(target)
+        Returns:
+            The stored or newly created ``CheckpointStorage``.
+        """
+        storage = await self._checkpoint_store.get(session_id)
+        if storage is None:
+            storage = InMemoryCheckpointStorage()
+            await self._checkpoint_store.set(session_id, storage)
+        return storage
diff --git a/python/packages/hosting/tests/hosting/_workflow_fixtures.py b/python/packages/hosting/tests/hosting/_workflow_fixtures.py
index d797e743d92..72addb7dff8 100644
--- a/python/packages/hosting/tests/hosting/_workflow_fixtures.py
+++ b/python/packages/hosting/tests/hosting/_workflow_fixtures.py
@@ -32,6 +32,11 @@ def build_echo_workflow() -> Workflow:
     return WorkflowBuilder(start_executor=_EchoExecutor(id="echo")).build()
 
 
+def echo_workflow_builder() -> WorkflowBuilder:
+    """Return an *unbuilt* echo ``WorkflowBuilder``, for testing builder-shaped targets."""
+    return WorkflowBuilder(start_executor=_EchoExecutor(id="echo"))
+
+
 class _MultiChunkExecutor(Executor):
     """Yields three separate ``output`` events so streaming has something to chew on."""
 
diff --git a/python/packages/hosting/tests/hosting/test_state.py b/python/packages/hosting/tests/hosting/test_state.py
index f920803bd2c..f94afdaf65d 100644
--- a/python/packages/hosting/tests/hosting/test_state.py
+++ b/python/packages/hosting/tests/hosting/test_state.py
@@ -13,12 +13,13 @@
     AgentRunInputs,
     AgentSession,
     Content,
+    InMemoryCheckpointStorage,
     Message,
     ResponseStream,
     Workflow,
 )
 
-from agent_framework_hosting import AgentFrameworkState, SessionStore
+from agent_framework_hosting import AgentState, CheckpointStore, SessionStore, WorkflowState
 
 
 def _workflow_fixture(name: str) -> Any:
@@ -100,90 +101,112 @@ async def _get_response() -> AgentResponse[Any]:
 
 
 class TestSessionStore:
-    async def test_get_reuses_session_for_same_id(self) -> None:
-        agent = _FakeAgent()
-        store = SessionStore(agent)
+    async def test_get_returns_none_for_missing_id(self) -> None:
+        store = SessionStore()
 
-        first = await store.get("session-1")
-        second = await store.get("session-1")
+        assert await store.get("session-1") is None
 
-        assert first is second
-        assert first.session_id == "session-1"
-        assert len(agent.created_sessions) == 1
+    async def test_set_then_get_returns_stored_session(self) -> None:
+        store = SessionStore()
+        session = AgentSession(session_id="session-1")
 
-    async def test_reset_forgets_session(self) -> None:
-        agent = _FakeAgent()
-        store = SessionStore(agent)
+        await store.set("session-1", session)
 
-        first = await store.get("session-1")
-        await store.reset("session-1")
-        second = await store.get("session-1")
+        assert await store.get("session-1") is session
 
-        assert first is not second
-        assert len(agent.created_sessions) == 2
+    async def test_set_can_store_same_session_under_additional_id(self) -> None:
+        store = SessionStore()
+        session = AgentSession(session_id="resp_1")
+
+        await store.set("resp_1", session)
+        await store.set("resp_2", session)
+
+        assert await store.get("resp_1") is session
+        assert await store.get("resp_2") is session
+
+    async def test_set_replaces_existing_entry(self) -> None:
+        store = SessionStore()
+        first = AgentSession(session_id="session-1")
+        second = AgentSession(session_id="session-1")
+
+        await store.set("session-1", first)
+        await store.set("session-1", second)
+
+        assert await store.get("session-1") is second
+
+    async def test_delete_forgets_session(self) -> None:
+        store = SessionStore()
+        await store.set("session-1", AgentSession(session_id="session-1"))
+
+        await store.delete("session-1")
+
+        assert await store.get("session-1") is None
+
+    async def test_delete_missing_id_is_a_no_op(self) -> None:
+        store = SessionStore()
+
+        await store.delete("never-stored")
 
     async def test_empty_session_id_raises(self) -> None:
-        store = SessionStore(_FakeAgent())
+        store = SessionStore()
+        session = AgentSession(session_id="session-1")
 
         with pytest.raises(ValueError, match="session_id"):
             await store.get("")
         with pytest.raises(ValueError, match="session_id"):
-            await store.reset("")
+            await store.set("", session)
+        with pytest.raises(ValueError, match="session_id"):
+            await store.delete("")
 
-    async def test_put_aliases_new_id_to_existing_session(self) -> None:
-        agent = _FakeAgent()
-        store = SessionStore(agent)
 
-        session = await store.get("resp_1")
-        aliased = await store.get("resp_1", alias="resp_2")
+class TestCheckpointStore:
+    async def test_get_returns_none_for_missing_id(self) -> None:
+        store = CheckpointStore()
 
-        assert aliased is session
-        assert await store.get("resp_2") is session
-        # Aliasing did not create a second session via the agent.
-        assert len(agent.created_sessions) == 1
+        assert await store.get("session-1") is None
 
-    async def test_alias_equal_to_session_id_is_a_no_op(self) -> None:
-        agent = _FakeAgent()
-        store = SessionStore(agent)
+    async def test_set_then_get_returns_stored_storage(self) -> None:
+        store = CheckpointStore()
+        storage = InMemoryCheckpointStorage()
 
-        session = await store.get("resp_1", alias="resp_1")
+        await store.set("session-1", storage)
 
-        assert session.session_id == "resp_1"
-        assert len(agent.created_sessions) == 1
+        assert await store.get("session-1") is storage
+
+    async def test_delete_forgets_storage(self) -> None:
+        store = CheckpointStore()
+        await store.set("session-1", InMemoryCheckpointStorage())
 
-    async def test_put_empty_session_id_raises(self) -> None:
-        store = SessionStore(_FakeAgent())
+        await store.delete("session-1")
 
+        assert await store.get("session-1") is None
+
+    async def test_empty_session_id_raises(self) -> None:
+        store = CheckpointStore()
+        storage = InMemoryCheckpointStorage()
+
+        with pytest.raises(ValueError, match="session_id"):
+            await store.get("")
         with pytest.raises(ValueError, match="session_id"):
-            await store.get("", alias="resp_2")
+            await store.set("", storage)
+        with pytest.raises(ValueError, match="session_id"):
+            await store.delete("")
 
 
-class TestAgentFrameworkState:
-    def test_default_session_store_for_agent(self) -> None:
+class TestAgentState:
+    def test_default_session_store_is_fresh_in_memory_store(self) -> None:
         agent = _FakeAgent()
-        state = AgentFrameworkState(agent)
+        state = AgentState(agent)
 
         assert state.target is agent
         assert isinstance(state.session_store, SessionStore)
 
     def test_accepts_session_store_instance(self) -> None:
-        agent = _FakeAgent()
-        store = SessionStore(agent)
-        state = AgentFrameworkState(agent, session_store=store)
+        store = SessionStore()
+        state = AgentState(_FakeAgent(), session_store=store)
 
-        assert state.target is agent
         assert state.session_store is store
 
-    def test_accepts_session_store_factory(self) -> None:
-        agent = _FakeAgent()
-
-        def factory(target: Any) -> SessionStore:
-            return SessionStore(target)
-
-        state = AgentFrameworkState(agent, session_store=factory)
-
-        assert isinstance(state.session_store, SessionStore)
-
     async def test_callable_target_cached_by_default(self) -> None:
         calls = 0
 
@@ -192,7 +215,7 @@ def create_agent() -> _FakeAgent:
             calls += 1
             return _FakeAgent()
 
-        state = AgentFrameworkState(create_agent)
+        state = AgentState(create_agent)
 
         first = await state.get_target()
         second = await state.get_target()
@@ -208,7 +231,7 @@ def create_agent() -> _FakeAgent:
             calls += 1
             return _FakeAgent()
 
-        state = AgentFrameworkState(create_agent, cache_target=False)
+        state = AgentState(create_agent, cache_target=False)
 
         first = await state.get_target()
         second = await state.get_target()
@@ -220,47 +243,117 @@ async def test_async_callable_target(self) -> None:
         async def create_agent() -> _FakeAgent:
             return _FakeAgent()
 
-        state = AgentFrameworkState(create_agent)
+        state = AgentState(create_agent)
 
         assert isinstance(await state.get_target(), _FakeAgent)
 
-    async def test_get_session_resolves_target_and_store(self) -> None:
-        state = AgentFrameworkState(lambda: _FakeAgent())
+    def test_cache_target_false_rejects_bare_awaitable(self) -> None:
+        async def create_agent() -> _FakeAgent:
+            return _FakeAgent()
+
+        coro = create_agent()
+        try:
+            with pytest.raises(ValueError, match="cache_target=False"):
+                AgentState(coro, cache_target=False)
+        finally:
+            coro.close()
+
+    async def test_get_or_create_session_creates_and_stores_once(self) -> None:
+        agent = _FakeAgent()
+        state = AgentState(agent)
 
-        session = await state.get_session("session-1")
+        first = await state.get_or_create_session("session-1")
+        second = await state.get_or_create_session("session-1")
 
-        assert session.session_id == "session-1"
+        assert first is second
+        assert first.session_id == "session-1"
+        assert len(agent.created_sessions) == 1
 
-    async def test_reset_session_forgets_session(self) -> None:
+    async def test_get_or_create_session_reuses_a_session_set_directly_on_the_store(self) -> None:
         agent = _FakeAgent()
-        state = AgentFrameworkState(agent)
+        state = AgentState(agent)
+        pre_existing = AgentSession(session_id="session-1")
+        await state.session_store.set("session-1", pre_existing)
 
-        first = await state.get_session("session-1")
-        await state.reset_session("session-1")
-        second = await state.get_session("session-1")
+        session = await state.get_or_create_session("session-1")
+
+        assert session is pre_existing
+        assert len(agent.created_sessions) == 0
 
-        assert first is not second
-        assert len(agent.created_sessions) == 2
 
-    def test_session_store_for_non_agent_target_raises_type_error(self) -> None:
+class TestWorkflowState:
+    def test_default_checkpoint_store_is_fresh_in_memory_store(self) -> None:
         workflow = _workflow_fixture("build_echo_workflow")()
+        state: WorkflowState[Workflow] = WorkflowState(workflow)
 
-        with pytest.raises(TypeError, match="session_store requires an agent target"):
-            AgentFrameworkState(workflow, session_store=SessionStore)
+        assert state.target is workflow
+        assert isinstance(state.checkpoint_store, CheckpointStore)
 
-    async def test_workflow_target_has_no_default_session_store(self) -> None:
-        workflow: Workflow = _workflow_fixture("build_echo_workflow")()
-        state = AgentFrameworkState(workflow)
+    def test_accepts_checkpoint_store_instance(self) -> None:
+        workflow = _workflow_fixture("build_echo_workflow")()
+        store = CheckpointStore()
+        state: WorkflowState[Workflow] = WorkflowState(workflow, checkpoint_store=store)
 
-        assert await state.get_target() is workflow
-        assert state.session_store is None
-        with pytest.raises(TypeError, match="session_store requires an agent target"):
-            await state.get_session_store()
+        assert state.checkpoint_store is store
 
     async def test_workflow_target_resolved_from_factory(self) -> None:
         build_echo_workflow = _workflow_fixture("build_echo_workflow")
 
-        state = AgentFrameworkState(build_echo_workflow)
+        state: WorkflowState[Workflow] = WorkflowState(build_echo_workflow)
 
         target = await state.get_target()
         assert isinstance(target, Workflow)
+
+    async def test_accepts_workflow_builder_instance_directly(self) -> None:
+        """A ``WorkflowBuilder`` is not itself callable or awaitable; the state must
+        recognize its ``build()`` method and call it, not cache the raw builder."""
+        builder = _workflow_fixture("echo_workflow_builder")()
+
+        state: WorkflowState[Workflow] = WorkflowState(builder)
+
+        target = await state.get_target()
+        assert isinstance(target, Workflow)
+        assert state.target is target
+
+    async def test_workflow_builder_is_built_once_and_cached_by_default(self) -> None:
+        builder = _workflow_fixture("echo_workflow_builder")()
+        state: WorkflowState[Workflow] = WorkflowState(builder)
+
+        first = await state.get_target()
+        second = await state.get_target()
+
+        assert first is second
+
+    async def test_accepts_orchestration_style_builder_without_importing_orchestrations(self) -> None:
+        """``SupportsBuild`` is structural: any object with a zero-arg ``build() -> Workflow``
+        is accepted, matching ``agent_framework_orchestrations``' builders without this
+        package depending on that one."""
+        workflow = _workflow_fixture("build_echo_workflow")()
+
+        class _FakeOrchestrationBuilder:
+            def build(self) -> Workflow:
+                return workflow
+
+        state: WorkflowState[Workflow] = WorkflowState(_FakeOrchestrationBuilder())
+
+        assert await state.get_target() is workflow
+
+    async def test_get_or_create_checkpoint_storage_creates_and_stores_once(self) -> None:
+        workflow = _workflow_fixture("build_echo_workflow")()
+        state: WorkflowState[Workflow] = WorkflowState(workflow)
+
+        first = await state.get_or_create_checkpoint_storage("session-1")
+        second = await state.get_or_create_checkpoint_storage("session-1")
+
+        assert first is second
+        assert isinstance(first, InMemoryCheckpointStorage)
+
+    async def test_get_or_create_checkpoint_storage_reuses_storage_set_directly_on_the_store(self) -> None:
+        workflow = _workflow_fixture("build_echo_workflow")()
+        state: WorkflowState[Workflow] = WorkflowState(workflow)
+        pre_existing = InMemoryCheckpointStorage()
+        await state.checkpoint_store.set("session-1", pre_existing)
+
+        storage = await state.get_or_create_checkpoint_storage("session-1")
+
+        assert storage is pre_existing
diff --git a/python/samples/04-hosting/af-hosting/local_responses/README.md b/python/samples/04-hosting/af-hosting/local_responses/README.md
index 943c040d5db..24b552e117d 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/README.md
+++ b/python/samples/04-hosting/af-hosting/local_responses/README.md
@@ -21,8 +21,9 @@ What the route demonstrates:
   turn.
 - Produces the AF messages, options, and session id that the route passes to
   `agent.run(...)`.
-- **Aliases** each newly minted response id to the session it was just
-  resolved from, via `state.get_session(lookup_id, alias=response_id)`.
+- **Stores** the just-resolved session under each newly minted response id,
+  via `state.session_store.set(response_id, session)` after
+  `agent.run(...)` has updated the session.
   OpenAI's `previous_response_id` rotates every turn *by design* — it lets a
   caller continue from any earlier response, not just the latest one — so
   every response id needs to stay independently resolvable, not just the
diff --git a/python/samples/04-hosting/af-hosting/local_responses/app.py b/python/samples/04-hosting/af-hosting/local_responses/app.py
index 3b692ec98d9..9aec83fb452 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/app.py
+++ b/python/samples/04-hosting/af-hosting/local_responses/app.py
@@ -7,7 +7,7 @@
 1. ``agent-framework-hosting-responses`` converts Responses request/response
    payloads to and from Agent Framework run values.
 2. ``agent-framework-hosting`` owns shared execution state via
-   ``AgentFrameworkState`` and ``SessionStore``.
+   ``AgentState`` and ``SessionStore``.
 3. FastAPI owns the route, request parsing, policy decisions, and response
    object.
 
@@ -35,12 +35,13 @@
 
 import asyncio
 import os
+from collections.abc import AsyncIterator
 from pathlib import Path
 from typing import Annotated, Any, cast
 
 from agent_framework import Agent, FileHistoryProvider, ResponseStream, tool
 from agent_framework_foundry import FoundryChatClient
-from agent_framework_hosting import AgentFrameworkState, SessionStore
+from agent_framework_hosting import AgentState
 from agent_framework_hosting_responses import (
     create_response_id,
     responses_from_run,
@@ -88,7 +89,7 @@ def create_agent() -> Agent:
 
 
 app = FastAPI()
-state = AgentFrameworkState(create_agent, session_store=SessionStore)
+state = AgentState(create_agent)
 
 
 @app.post("/responses", response_model=None)
@@ -110,13 +111,9 @@ async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | Streamin
     options["reasoning"] = {"effort": "medium", "summary": "auto"}
     options_for_run = cast(Any, options)
 
-    target = cast(Agent[Any], await state.get_target())
+    target = await state.get_target()
     lookup_id = session_id or response_id
-    # `previous_response_id` chaining rotates its id every turn, and OpenAI's
-    # Responses API deliberately lets a caller continue from *any* earlier
-    # response, not just the latest one -- so the newly minted response id
-    # also needs to resolve back to this session on a later request.
-    session = await state.get_session(lookup_id, alias=response_id)
+    session = await state.get_or_create_session(lookup_id)
     if run["stream"]:
         stream = target.run(
             run["messages"],
@@ -126,12 +123,22 @@ async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | Streamin
         )
         if not isinstance(stream, ResponseStream):
             raise HTTPException(status_code=500, detail="agent did not return a response stream")
-        return StreamingResponse(
-            responses_stream_events_from_run(
+
+        async def stream_events() -> AsyncIterator[str]:
+            async for event in responses_stream_events_from_run(
                 stream,
                 response_id=response_id,
                 session_id=session_id,
-            ),
+            ):
+                yield event
+            # `agent.run(..., stream=True)` updates the session while the stream
+            # is consumed/finalized. Store it under the newly minted response id
+            # after finalization so a later `previous_response_id` can restore
+            # this exact continuation point.
+            await state.session_store.set(response_id, session)
+
+        return StreamingResponse(
+            stream_events(),
             media_type="text/event-stream",
         )
 
@@ -140,6 +147,10 @@ async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | Streamin
         session=session,
         options=options_for_run,
     )
+    # `agent.run(...)` updates the session. Store it under the newly minted
+    # response id after the run so `previous_response_id=response_id` continues
+    # from this exact point.
+    await state.session_store.set(response_id, session)
     return JSONResponse(
         responses_from_run(
             result,

From 1e2899e85097502a4ecee8a37eb87875f75a3c30 Mon Sep 17 00:00:00 2001
From: eavanvalkenburg <github@vanvalkenburg.eu>
Date: Fri, 3 Jul 2026 11:34:14 +0200
Subject: [PATCH 5/7] Fix hosting state test protocol fakes

Widen fake agents' get_session service_session_id parameter to match the SupportsAgentRun protocol under the Python 3.11 test typing checkers.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../tests/hosting_responses/test_http_round_trip.py             | 2 +-
 python/packages/hosting/tests/hosting/test_state.py             | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py b/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
index f1efb1616bc..5eefcd3d4f3 100644
--- a/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
+++ b/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
@@ -60,7 +60,7 @@ def __init__(self) -> None:
     def create_session(self, *, session_id: str | None = None) -> AgentSession:
         return AgentSession(session_id=session_id)
 
-    def get_session(self, service_session_id: str, *, session_id: str | None = None) -> AgentSession:
+    def get_session(self, service_session_id: Any, *, session_id: str | None = None) -> AgentSession:
         return AgentSession(session_id=session_id, service_session_id=service_session_id)
 
     @overload
diff --git a/python/packages/hosting/tests/hosting/test_state.py b/python/packages/hosting/tests/hosting/test_state.py
index f94afdaf65d..121bb2c76cd 100644
--- a/python/packages/hosting/tests/hosting/test_state.py
+++ b/python/packages/hosting/tests/hosting/test_state.py
@@ -53,7 +53,7 @@ def create_session(self, *, session_id: str | None = None) -> AgentSession:
         self.created_sessions.append(session)
         return session
 
-    def get_session(self, service_session_id: str, *, session_id: str | None = None) -> AgentSession:
+    def get_session(self, service_session_id: Any, *, session_id: str | None = None) -> AgentSession:
         return AgentSession(session_id=session_id, service_session_id=service_session_id)
 
     @overload

From c92472b7b8032ee71ed380547270c0fc65811de7 Mon Sep 17 00:00:00 2001
From: eavanvalkenburg <github@vanvalkenburg.eu>
Date: Fri, 3 Jul 2026 14:47:50 +0200
Subject: [PATCH 6/7] Simplify Responses stream helper naming

Rename responses_stream_events_from_run to responses_stream_from_run across exports, tests, docs, and the local Responses sample to align with the generic <protocol>_stream_from_run helper convention.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 python/packages/hosting-responses/README.md                 | 2 +-
 .../agent_framework_hosting_responses/__init__.py           | 4 ++--
 .../agent_framework_hosting_responses/_parsing.py           | 4 ++--
 .../tests/hosting_responses/test_http_round_trip.py         | 4 ++--
 .../tests/hosting_responses/test_parsing.py                 | 6 +++---
 python/samples/04-hosting/af-hosting/local_responses/app.py | 4 ++--
 6 files changed, 12 insertions(+), 12 deletions(-)

diff --git a/python/packages/hosting-responses/README.md b/python/packages/hosting-responses/README.md
index dd6a121a30e..5ba00d2f470 100644
--- a/python/packages/hosting-responses/README.md
+++ b/python/packages/hosting-responses/README.md
@@ -11,7 +11,7 @@ This package provides the Responses-specific conversion layer:
 - `create_response_id(...)` — mint a Responses-shaped response id.
 - `responses_from_run(...)` — convert an `AgentResponse` into a
   Responses-compatible JSON payload.
-- `responses_stream_events_from_run(...)` — convert an Agent Framework
+- `responses_stream_from_run(...)` — convert an Agent Framework
   `ResponseStream` into Responses-compatible SSE events.
 
 FastAPI/Starlette/Django/Azure Functions code owns route registration,
diff --git a/python/packages/hosting-responses/agent_framework_hosting_responses/__init__.py b/python/packages/hosting-responses/agent_framework_hosting_responses/__init__.py
index eea77e876a8..26ee8da69e7 100644
--- a/python/packages/hosting-responses/agent_framework_hosting_responses/__init__.py
+++ b/python/packages/hosting-responses/agent_framework_hosting_responses/__init__.py
@@ -12,7 +12,7 @@
     parse_responses_request,
     responses_from_run,
     responses_session_id,
-    responses_stream_events_from_run,
+    responses_stream_from_run,
     responses_to_run,
 )
 
@@ -30,6 +30,6 @@
     "parse_responses_request",
     "responses_from_run",
     "responses_session_id",
-    "responses_stream_events_from_run",
+    "responses_stream_from_run",
     "responses_to_run",
 ]
diff --git a/python/packages/hosting-responses/agent_framework_hosting_responses/_parsing.py b/python/packages/hosting-responses/agent_framework_hosting_responses/_parsing.py
index c391aeb979a..9af4a1c9fb4 100644
--- a/python/packages/hosting-responses/agent_framework_hosting_responses/_parsing.py
+++ b/python/packages/hosting-responses/agent_framework_hosting_responses/_parsing.py
@@ -884,7 +884,7 @@ def _json_dumps(payload: Mapping[str, Any]) -> str:
     return json.dumps(payload, separators=(",", ":"))
 
 
-async def responses_stream_events_from_run(
+async def responses_stream_from_run(
     stream: ResponseStream[AgentResponseUpdate, AgentResponse[Any]],
     *,
     response_id: str,
@@ -954,6 +954,6 @@ async def responses_stream_events_from_run(
     "parse_responses_request",
     "responses_from_run",
     "responses_session_id",
-    "responses_stream_events_from_run",
+    "responses_stream_from_run",
     "responses_to_run",
 ]
diff --git a/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py b/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
index 5eefcd3d4f3..96ea1663ca6 100644
--- a/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
+++ b/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
@@ -35,7 +35,7 @@
     create_response_id,
     responses_from_run,
     responses_session_id,
-    responses_stream_events_from_run,
+    responses_stream_from_run,
     responses_to_run,
 )
 
@@ -136,7 +136,7 @@ async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | Streamin
                 raise HTTPException(status_code=500, detail="agent did not return a response stream")
 
             async def stream_events() -> AsyncIterator[str]:
-                async for event in responses_stream_events_from_run(
+                async for event in responses_stream_from_run(
                     stream,
                     response_id=response_id,
                     session_id=session_id,
diff --git a/python/packages/hosting-responses/tests/hosting_responses/test_parsing.py b/python/packages/hosting-responses/tests/hosting_responses/test_parsing.py
index 5aaebf4b5fe..6fa100415c1 100644
--- a/python/packages/hosting-responses/tests/hosting_responses/test_parsing.py
+++ b/python/packages/hosting-responses/tests/hosting_responses/test_parsing.py
@@ -17,7 +17,7 @@
     parse_responses_request,
     responses_from_run,
     responses_session_id,
-    responses_stream_events_from_run,
+    responses_stream_from_run,
     responses_to_run,
 )
 
@@ -275,7 +275,7 @@ def test_responses_from_run_omits_previous_response_session(self) -> None:
 
         assert "conversation" not in payload
 
-    async def test_responses_stream_events_from_run(self) -> None:
+    async def test_responses_stream_from_run(self) -> None:
         async def updates() -> AsyncIterator[AgentResponseUpdate]:
             yield AgentResponseUpdate(contents=[Content.from_text("hel")], role="assistant")
             yield AgentResponseUpdate(contents=[Content.from_text("lo")], role="assistant")
@@ -287,7 +287,7 @@ def finalizer(items: Sequence[AgentResponseUpdate]) -> AgentResponse:
 
         events = [
             event
-            async for event in responses_stream_events_from_run(
+            async for event in responses_stream_from_run(
                 stream,
                 response_id="resp_new",
                 session_id="conv_1",
diff --git a/python/samples/04-hosting/af-hosting/local_responses/app.py b/python/samples/04-hosting/af-hosting/local_responses/app.py
index 9aec83fb452..ef91927cbf2 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/app.py
+++ b/python/samples/04-hosting/af-hosting/local_responses/app.py
@@ -46,7 +46,7 @@
     create_response_id,
     responses_from_run,
     responses_session_id,
-    responses_stream_events_from_run,
+    responses_stream_from_run,
     responses_to_run,
 )
 from azure.identity.aio import DefaultAzureCredential
@@ -125,7 +125,7 @@ async def responses(body: dict[str, Any] = Body(...)) -> JSONResponse | Streamin
             raise HTTPException(status_code=500, detail="agent did not return a response stream")
 
         async def stream_events() -> AsyncIterator[str]:
-            async for event in responses_stream_events_from_run(
+            async for event in responses_stream_from_run(
                 stream,
                 response_id=response_id,
                 session_id=session_id,

From 32f771fd1668b06d94d3a968e0c13bdf902753f6 Mon Sep 17 00:00:00 2001
From: eavanvalkenburg <github@vanvalkenburg.eu>
Date: Fri, 3 Jul 2026 15:06:06 +0200
Subject: [PATCH 7/7] Add state-level storage setters

Add AgentState.set_session and WorkflowState.set_checkpoint_storage so app code can pair get-or-create helpers with explicit post-run storage without reaching into the underlying stores. Update Responses docs, tests, and sample to use state.set_session.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 python/packages/hosting-responses/README.md    |  2 +-
 .../hosting_responses/test_http_round_trip.py  |  4 ++--
 python/packages/hosting/README.md              |  2 +-
 .../hosting/agent_framework_hosting/_state.py  | 18 ++++++++++++++++++
 .../hosting/tests/hosting/test_state.py        |  8 ++++----
 .../af-hosting/local_responses/README.md       |  2 +-
 .../af-hosting/local_responses/app.py          |  4 ++--
 7 files changed, 29 insertions(+), 11 deletions(-)

diff --git a/python/packages/hosting-responses/README.md b/python/packages/hosting-responses/README.md
index 5ba00d2f470..47246f02252 100644
--- a/python/packages/hosting-responses/README.md
+++ b/python/packages/hosting-responses/README.md
@@ -43,7 +43,7 @@ async def responses(body: dict = Body(...)) -> JSONResponse:
         session=session,
         options=run["options"],
     )
-    await state.session_store.set(response_id, session)
+    await state.set_session(response_id, session)
     return JSONResponse(responses_from_run(result, response_id=response_id, session_id=session_id))
 ```
 
diff --git a/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py b/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
index 96ea1663ca6..8c0039228cb 100644
--- a/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
+++ b/python/packages/hosting-responses/tests/hosting_responses/test_http_round_trip.py
@@ -142,7 +142,7 @@ async def stream_events() -> AsyncIterator[str]:
                     session_id=session_id,
                 ):
                     yield event
-                await state.session_store.set(response_id, session)
+                await state.set_session(response_id, session)
 
             return StreamingResponse(
                 stream_events(),
@@ -150,7 +150,7 @@ async def stream_events() -> AsyncIterator[str]:
             )
 
         result = await target.run(run["messages"], session=session)
-        await state.session_store.set(response_id, session)
+        await state.set_session(response_id, session)
         return JSONResponse(responses_from_run(result, response_id=response_id, session_id=session_id))
 
     return app
diff --git a/python/packages/hosting/README.md b/python/packages/hosting/README.md
index 5217ac39e94..096762fa0c4 100644
--- a/python/packages/hosting/README.md
+++ b/python/packages/hosting/README.md
@@ -51,7 +51,7 @@ the post-run object:
 ```python
 session = await state.get_or_create_session(previous_response_id)
 result = await (await state.get_target()).run("Hello", session=session)
-await state.session_store.set(response_id, session)
+await state.set_session(response_id, session)
 ```
 
 Targets can be direct instances, synchronous factories, asynchronous factories,
diff --git a/python/packages/hosting/agent_framework_hosting/_state.py b/python/packages/hosting/agent_framework_hosting/_state.py
index a16a30c4706..bbe07d965c6 100644
--- a/python/packages/hosting/agent_framework_hosting/_state.py
+++ b/python/packages/hosting/agent_framework_hosting/_state.py
@@ -288,6 +288,15 @@ async def get_or_create_session(self, session_id: str) -> AgentSession:
             await self._session_store.set(session_id, session)
         return session
 
+    async def set_session(self, session_id: str, session: AgentSession) -> None:
+        """Store ``session`` under ``session_id`` in this state's session store.
+
+        Args:
+            session_id: Opaque app-selected session id.
+            session: Session to store.
+        """
+        await self._session_store.set(session_id, session)
+
 
 class WorkflowState(Generic[WorkflowT]):
     """Shared execution state for app-owned workflow hosting routes.
@@ -402,3 +411,12 @@ async def get_or_create_checkpoint_storage(self, session_id: str) -> CheckpointS
             storage = InMemoryCheckpointStorage()
             await self._checkpoint_store.set(session_id, storage)
         return storage
+
+    async def set_checkpoint_storage(self, session_id: str, storage: CheckpointStorage) -> None:
+        """Store ``storage`` under ``session_id`` in this state's checkpoint store.
+
+        Args:
+            session_id: Opaque app-selected session id.
+            storage: Checkpoint storage to store.
+        """
+        await self._checkpoint_store.set(session_id, storage)
diff --git a/python/packages/hosting/tests/hosting/test_state.py b/python/packages/hosting/tests/hosting/test_state.py
index 121bb2c76cd..6f34d214134 100644
--- a/python/packages/hosting/tests/hosting/test_state.py
+++ b/python/packages/hosting/tests/hosting/test_state.py
@@ -269,11 +269,11 @@ async def test_get_or_create_session_creates_and_stores_once(self) -> None:
         assert first.session_id == "session-1"
         assert len(agent.created_sessions) == 1
 
-    async def test_get_or_create_session_reuses_a_session_set_directly_on_the_store(self) -> None:
+    async def test_get_or_create_session_reuses_a_session_set_on_the_state(self) -> None:
         agent = _FakeAgent()
         state = AgentState(agent)
         pre_existing = AgentSession(session_id="session-1")
-        await state.session_store.set("session-1", pre_existing)
+        await state.set_session("session-1", pre_existing)
 
         session = await state.get_or_create_session("session-1")
 
@@ -348,11 +348,11 @@ async def test_get_or_create_checkpoint_storage_creates_and_stores_once(self) ->
         assert first is second
         assert isinstance(first, InMemoryCheckpointStorage)
 
-    async def test_get_or_create_checkpoint_storage_reuses_storage_set_directly_on_the_store(self) -> None:
+    async def test_get_or_create_checkpoint_storage_reuses_storage_set_on_the_state(self) -> None:
         workflow = _workflow_fixture("build_echo_workflow")()
         state: WorkflowState[Workflow] = WorkflowState(workflow)
         pre_existing = InMemoryCheckpointStorage()
-        await state.checkpoint_store.set("session-1", pre_existing)
+        await state.set_checkpoint_storage("session-1", pre_existing)
 
         storage = await state.get_or_create_checkpoint_storage("session-1")
 
diff --git a/python/samples/04-hosting/af-hosting/local_responses/README.md b/python/samples/04-hosting/af-hosting/local_responses/README.md
index 24b552e117d..9c1c2e8d163 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/README.md
+++ b/python/samples/04-hosting/af-hosting/local_responses/README.md
@@ -22,7 +22,7 @@ What the route demonstrates:
 - Produces the AF messages, options, and session id that the route passes to
   `agent.run(...)`.
 - **Stores** each newly minted response id for the session it was just
-  resolved from, via `state.session_store.set(response_id, session)` after
+  resolved from, via `state.set_session(response_id, session)` after
   `agent.run(...)` has updated the session.
   OpenAI's `previous_response_id` rotates every turn *by design* — it lets a
   caller continue from any earlier response, not just the latest one — so
diff --git a/python/samples/04-hosting/af-hosting/local_responses/app.py b/python/samples/04-hosting/af-hosting/local_responses/app.py
index ef91927cbf2..c55c8c84079 100644
--- a/python/samples/04-hosting/af-hosting/local_responses/app.py
+++ b/python/samples/04-hosting/af-hosting/local_responses/app.py
@@ -135,7 +135,7 @@ async def stream_events() -> AsyncIterator[str]:
             # is consumed/finalized. Store it under the newly minted response id
             # after finalization so a later `previous_response_id` can restore
             # this exact continuation point.
-            await state.session_store.set(response_id, session)
+            await state.set_session(response_id, session)
 
         return StreamingResponse(
             stream_events(),
@@ -150,7 +150,7 @@ async def stream_events() -> AsyncIterator[str]:
     # `agent.run(...)` updates the session. Store it under the newly minted
     # response id after the run so `previous_response_id=response_id` continues
     # from this exact point.
-    await state.session_store.set(response_id, session)
+    await state.set_session(response_id, session)
     return JSONResponse(
         responses_from_run(
             result,