From d1ad30744a6b9eca41c33b5bb2011b3939cbc97f Mon Sep 17 00:00:00 2001
From: Andrey Buzin <contactbuzin@gmail.com>
Date: Mon, 2 Mar 2026 14:01:25 -0800
Subject: [PATCH 01/10] Wire tool approval into AI SDK UI protocol

---
 src/vercel_ai_sdk/__init__.py             |  3 +-
 src/vercel_ai_sdk/agent/__init__.py       |  4 +-
 src/vercel_ai_sdk/agent/agent.py          | 10 +--
 src/vercel_ai_sdk/ai_sdk_ui/adapter.py    | 64 +++++++++++++++++
 src/vercel_ai_sdk/ai_sdk_ui/ui_message.py | 24 +++++--
 src/vercel_ai_sdk/core/hooks.py           | 23 ++++--
 tests/ai_sdk_ui/test_adapter.py           | 87 ++++++++++++++++++++++-
 7 files changed, 192 insertions(+), 23 deletions(-)

diff --git a/src/vercel_ai_sdk/__init__.py b/src/vercel_ai_sdk/__init__.py
index 79028cac..35f444d2 100644
--- a/src/vercel_ai_sdk/__init__.py
+++ b/src/vercel_ai_sdk/__init__.py
@@ -1,7 +1,7 @@
 from . import ai_gateway, ai_sdk_ui, anthropic, mcp, openai
 from .core import telemetry
 from .core.checkpoint import Checkpoint
-from .core.hooks import Hook, hook
+from .core.hooks import Hook, ToolApproval, hook
 from .core.llm import LanguageModel
 
 # Re-export core types
@@ -51,6 +51,7 @@
     "StreamResult",
     "Hook",
     "HookPart",
+    "ToolApproval",
     "StructuredOutputPart",
     "Checkpoint",
     # Functions
diff --git a/src/vercel_ai_sdk/agent/__init__.py b/src/vercel_ai_sdk/agent/__init__.py
index 4b349261..ed06c24a 100644
--- a/src/vercel_ai_sdk/agent/__init__.py
+++ b/src/vercel_ai_sdk/agent/__init__.py
@@ -1,4 +1,4 @@
 from . import local, proto, tools, vercel
-from .agent import Agent, ToolApproval
+from .agent import Agent
 
-__all__ = ["Agent", "ToolApproval", "proto", "tools", "local", "vercel"]
+__all__ = ["Agent", "proto", "tools", "local", "vercel"]
diff --git a/src/vercel_ai_sdk/agent/agent.py b/src/vercel_ai_sdk/agent/agent.py
index 8e3b4b2a..c7140613 100644
--- a/src/vercel_ai_sdk/agent/agent.py
+++ b/src/vercel_ai_sdk/agent/agent.py
@@ -4,20 +4,12 @@
 import dataclasses
 from typing import Any
 
-import pydantic
-
 import vercel_ai_sdk as ai
 
 from . import proto
 from .tools import BUILTIN_TOOLS, _filesystem
 
 
-@ai.hook
-class ToolApproval(pydantic.BaseModel):
-    granted: bool
-    reason: str | None = None
-
-
 @dataclasses.dataclass
 class Agent:
     """
@@ -48,7 +40,7 @@ async def _execute_tool(
         """
         # TODO: mypy doesn't support class decorators that change the class type —
         # @ai.hook returns type[Hook[T]] but mypy still sees the original BaseModel.
-        approval = await ToolApproval.create(  # type: ignore[attr-defined]
+        approval = await ai.ToolApproval.create(  # type: ignore[attr-defined]
             f"approve_{tc.tool_call_id}",
             metadata={"tool_name": tc.tool_name, "tool_args": tc.tool_args},
         )
diff --git a/src/vercel_ai_sdk/ai_sdk_ui/adapter.py b/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
index ed080f1a..f050e3d6 100644
--- a/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
+++ b/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
@@ -11,6 +11,7 @@
 from typing import Any, Literal
 
 from .. import core
+from ..core import hooks
 from . import protocol, ui_message
 
 # ============================================================================
@@ -69,6 +70,7 @@ def __init__(self) -> None:
         self.started_tool_calls: set[str] = set()
         self.emitted_tool_results: set[str] = set()
         self.pending_tool_calls: set[str] = set()
+        self.emitted_approval_requests: set[str] = set()
 
     def close_open_blocks(self) -> list[protocol.UIMessageStreamPart]:
         """Close any open reasoning/text blocks, returning parts to emit."""
@@ -94,6 +96,7 @@ def reset_tool_tracking(self) -> None:
         self.started_tool_calls = set()
         self.emitted_tool_results = set()
         self.pending_tool_calls = set()
+        self.emitted_approval_requests = set()
 
     def begin_message(
         self, msg: core.messages.Message
@@ -130,6 +133,22 @@ def begin_message(
         return parts
 
 
+def _tool_call_id_from_approval_hook(
+    hook_part: core.messages.HookPart,
+) -> str | None:
+    """Extract tool_call_id from a ToolApproval HookPart.
+
+    Returns the tool_call_id if this is a ToolApproval hook whose hook_id
+    follows the ``approve_{tool_call_id}`` convention, otherwise None.
+    """
+    if hook_part.hook_type != hooks.ToolApproval.hook_type:  # type: ignore[attr-defined]
+        return None
+    prefix = "approve_"
+    if hook_part.hook_id.startswith(prefix):
+        return hook_part.hook_id[len(prefix) :]
+    return None
+
+
 async def to_ui_message_stream(
     messages: AsyncIterable[core.messages.Message],
 ) -> AsyncGenerator[protocol.UIMessageStreamPart]:
@@ -256,6 +275,33 @@ async def to_ui_message_stream(
                                 output=result,
                             )
 
+            # Pass 3: Hook-based tool approvals
+            for msg_part in msg.parts:
+                if not isinstance(msg_part, core.messages.HookPart):
+                    continue
+                approval_tc_id = _tool_call_id_from_approval_hook(msg_part)
+                if approval_tc_id is None:
+                    continue
+
+                if msg_part.status == "pending":
+                    if approval_tc_id not in state.emitted_approval_requests:
+                        state.emitted_approval_requests.add(approval_tc_id)
+                        yield protocol.ToolApprovalRequestPart(
+                            approval_id=msg_part.hook_id,
+                            tool_call_id=approval_tc_id,
+                        )
+                elif msg_part.status == "resolved":
+                    resolution = msg_part.resolution or {}
+                    if not resolution.get("granted", False):
+                        yield protocol.ToolOutputDeniedPart(
+                            tool_call_id=approval_tc_id,
+                        )
+                elif msg_part.status == "cancelled":
+                    yield protocol.ToolOutputErrorPart(
+                        tool_call_id=approval_tc_id,
+                        error_text="Hook cancelled",
+                    )
+
     # Final cleanup
     for part in state.finish_step():
         yield part
@@ -333,6 +379,10 @@ def to_messages(
 ) -> list[core.messages.Message]:
     """Convert AI SDK v6 UI messages to internal Message format.
 
+    As a side-effect, tool parts in ``approval-responded`` state trigger
+    ``ToolApproval.resolve()`` so the agent loop can resume execution
+    without the caller needing to handle approval routing explicitly.
+
     Args:
         ui_messages: List of UIMessage objects from the AI SDK v6 frontend.
 
@@ -375,6 +425,20 @@ def to_messages(
                             result=_normalize_tool_result(tp.output),
                         )
                     )
+                    # Side-effect: resolve ToolApproval hooks from approval
+                    # responses so the agent loop can resume execution.
+                    if (
+                        tp.state == "approval-responded"
+                        and tp.approval is not None
+                        and tp.approval.approved is not None
+                    ):
+                        hooks.ToolApproval.resolve(  # type: ignore[attr-defined]
+                            tp.approval.id,
+                            {
+                                "granted": tp.approval.approved,
+                                "reason": tp.approval.reason,
+                            },
+                        )
 
                 case (
                     ui_message.UIStepStartPart()
diff --git a/src/vercel_ai_sdk/ai_sdk_ui/ui_message.py b/src/vercel_ai_sdk/ai_sdk_ui/ui_message.py
index cb87d9d2..f1a15a34 100644
--- a/src/vercel_ai_sdk/ai_sdk_ui/ui_message.py
+++ b/src/vercel_ai_sdk/ai_sdk_ui/ui_message.py
@@ -37,11 +37,11 @@ class UIReasoningPart(pydantic.BaseModel):
 # Tool invocation states in AI SDK v6:
 # - "input-streaming": Tool arguments are being streamed
 # - "input-available": Tool arguments are complete, ready for execution
-# - "approval-requested": Tool requires user approval (TODO: approval workflow)
-# - "approval-responded": User has responded to approval (TODO: approval workflow)
+# - "approval-requested": Tool requires user approval before execution
+# - "approval-responded": User has responded to approval request
 # - "output-available": Tool has been executed, result is available
 # - "output-error": Tool execution failed
-# - "output-denied": Tool execution was denied by user (TODO: approval workflow)
+# - "output-denied": Tool execution was denied by user
 UIToolInvocationState = Literal[
     "input-streaming",
     "input-available",
@@ -78,6 +78,21 @@ class UIStepStartPart(pydantic.BaseModel):
     type: Literal["step-start"]
 
 
+class UIToolApproval(pydantic.BaseModel):
+    """Approval state on a tool part (AI SDK v6 protocol).
+
+    Present when a tool requires user approval before execution.
+    ``id`` matches the hook label used by the ToolApproval hook.
+    ``approved`` is None while awaiting a response, True/False after.
+    """
+
+    model_config = pydantic.ConfigDict(populate_by_name=True)
+
+    id: str
+    approved: bool | None = None
+    reason: str | None = None
+
+
 class UIToolPart(pydantic.BaseModel):
     """Tool part with dynamic type pattern: tool-{toolName}.
 
@@ -95,8 +110,7 @@ class UIToolPart(pydantic.BaseModel):
     input: str | dict[str, Any] | None = None  # JSON string or parsed dict
     output: Any | None = None
     error_text: str | None = pydantic.Field(default=None, alias="errorText")
-    # TODO: title, providerExecuted, preliminary fields
-    # TODO: approval workflow (approval object)
+    approval: UIToolApproval | None = None
 
     @property
     def tool_name(self) -> str:
diff --git a/src/vercel_ai_sdk/core/hooks.py b/src/vercel_ai_sdk/core/hooks.py
index 17a1c1f3..f4001d5e 100644
--- a/src/vercel_ai_sdk/core/hooks.py
+++ b/src/vercel_ai_sdk/core/hooks.py
@@ -72,7 +72,7 @@ class Hook[T: pydantic.BaseModel]:
     """
 
     _schema: ClassVar[type[pydantic.BaseModel]]
-    _hook_type: ClassVar[str]
+    hook_type: ClassVar[str]
 
     @classmethod
     async def create(cls, label: str, metadata: dict[str, Any] | None = None) -> T:
@@ -113,7 +113,7 @@ async def create(cls, label: str, metadata: dict[str, Any] | None = None) -> T:
         future: asyncio.Future[dict[str, Any]] = asyncio.Future()
         suspension = rt_mod.HookSuspension(
             label=label,
-            hook_type=cls._hook_type,
+            hook_type=cls.hook_type,
             metadata=metadata or {},
             future=future,
         )
@@ -142,7 +142,7 @@ async def create(cls, label: str, metadata: dict[str, Any] | None = None) -> T:
                 parts=[
                     messages_.HookPart(
                         hook_id=label,
-                        hook_type=cls._hook_type,
+                        hook_type=cls.hook_type,
                         status="resolved",
                         metadata=hook_metadata,
                         resolution=resolution,
@@ -215,7 +215,7 @@ async def cancel(cls, label: str, reason: str | None = None) -> None:
                 parts=[
                     messages_.HookPart(
                         hook_id=label,
-                        hook_type=cls._hook_type,
+                        hook_type=cls.hook_type,
                         status="cancelled",
                         metadata=hook_metadata,
                     )
@@ -235,9 +235,22 @@ def hook[T: pydantic.BaseModel](cls: type[T]) -> type[Hook[T]]:
         (Hook,),
         {
             "_schema": cls,
-            "_hook_type": cls.__name__,
+            "hook_type": cls.__name__,
             "__doc__": cls.__doc__,
         },
     )
 
     return hook_impl
+
+
+@hook
+class ToolApproval(pydantic.BaseModel):
+    """Prewired hook for tool call approval.
+
+    Used by the AI SDK UI adapter to bridge the protocol's
+    tool-approval-request / approval-responded flow to the
+    hook system.
+    """
+
+    granted: bool
+    reason: str | None = None
diff --git a/tests/ai_sdk_ui/test_adapter.py b/tests/ai_sdk_ui/test_adapter.py
index 94de6bf7..68af026e 100644
--- a/tests/ai_sdk_ui/test_adapter.py
+++ b/tests/ai_sdk_ui/test_adapter.py
@@ -8,7 +8,7 @@
 
 import vercel_ai_sdk as ai
 from vercel_ai_sdk.ai_sdk_ui import adapter, ui_message
-from vercel_ai_sdk.core import messages
+from vercel_ai_sdk.core import hooks, messages
 
 from ..conftest import MockLLM
 
@@ -492,3 +492,88 @@ def test_ui_skips_unsupported_parts() -> None:
 
     internal = adapter.to_messages([ui_msg])
     assert len(internal[0].parts) == 2
+
+
+# -----------------------------------------------------------------------------
+# Tool approval (human-in-the-loop) tests
+# -----------------------------------------------------------------------------
+
+
+@pytest.mark.asyncio
+async def test_tool_approval_hook_emits_approval_request() -> None:
+    """Pending ToolApproval HookPart emits tool-approval-request on the wire."""
+    msgs = [
+        # Tool pending (args complete, awaiting approval)
+        messages.Message(
+            id="msg-1",
+            role="assistant",
+            parts=[
+                messages.ToolPart(
+                    tool_call_id="tc-1",
+                    tool_name="rm_rf",
+                    tool_args='{"path": "/"}',
+                    status="pending",
+                    state="done",
+                ),
+            ],
+        ),
+        # Hook pending (approval requested)
+        messages.Message(
+            id="msg-1",
+            role="assistant",
+            parts=[
+                messages.HookPart(
+                    hook_id="approve_tc-1",
+                    hook_type=hooks.ToolApproval.hook_type,  # type: ignore[attr-defined]
+                    status="pending",
+                    metadata={"tool_name": "rm_rf", "tool_args": '{"path": "/"}'},
+                ),
+            ],
+        ),
+    ]
+
+    event_types = await get_event_types(msgs)
+    assert event_types == [
+        "start",
+        "start-step",
+        "tool-input-start",
+        "tool-input-available",
+        "tool-approval-request",
+        "finish-step",
+        "finish",
+    ]
+
+
+def test_approval_responded_resolves_hook() -> None:
+    """to_messages() resolves the ToolApproval hook for approval-responded parts."""
+    label = "approve_tc-42"
+    raw_messages = [
+        {
+            "id": "msg-1",
+            "role": "assistant",
+            "parts": [
+                {
+                    "type": "tool-dangerous_action",
+                    "toolCallId": "tc-42",
+                    "state": "approval-responded",
+                    "input": '{"x": 1}',
+                    "approval": {
+                        "id": label,
+                        "approved": True,
+                        "reason": "looks safe",
+                    },
+                }
+            ],
+        },
+    ]
+
+    # Clean up any leftover state from other tests
+    hooks._pending_resolutions.pop(label, None)
+
+    ui_msgs = [ui_message.UIMessage.model_validate(m) for m in raw_messages]
+    adapter.to_messages(ui_msgs)
+
+    # The side-effect should have pre-registered the resolution
+    assert label in hooks._pending_resolutions
+    resolution = hooks._pending_resolutions.pop(label)
+    assert resolution == {"granted": True, "reason": "looks safe"}

From f5ec3b5ab4855ef720dd8eddbab06a4083c4b35c Mon Sep 17 00:00:00 2001
From: Andrey Buzin <contactbuzin@gmail.com>
Date: Mon, 2 Mar 2026 16:06:03 -0800
Subject: [PATCH 02/10] Ensure the baseline example app works

---
 examples/fastapi-vite/backend/__init__.py     |  1 -
 examples/fastapi-vite/backend/main.py         | 66 ++++++++++++++++---
 examples/fastapi-vite/backend/pyproject.toml  |  6 +-
 .../fastapi-vite/backend/routes/__init__.py   |  1 -
 examples/fastapi-vite/backend/routes/chat.py  | 60 -----------------
 examples/fastapi-vite/backend/uv.lock         | 63 ++++++++++++++++--
 examples/fastapi-vite/frontend/vite.config.ts |  5 --
 7 files changed, 121 insertions(+), 81 deletions(-)
 delete mode 100644 examples/fastapi-vite/backend/__init__.py
 delete mode 100644 examples/fastapi-vite/backend/routes/__init__.py
 delete mode 100644 examples/fastapi-vite/backend/routes/chat.py

diff --git a/examples/fastapi-vite/backend/__init__.py b/examples/fastapi-vite/backend/__init__.py
deleted file mode 100644
index 7f831694..00000000
--- a/examples/fastapi-vite/backend/__init__.py
+++ /dev/null
@@ -1 +0,0 @@
-# Backend package
diff --git a/examples/fastapi-vite/backend/main.py b/examples/fastapi-vite/backend/main.py
index 7aa8cf42..9ce7211a 100644
--- a/examples/fastapi-vite/backend/main.py
+++ b/examples/fastapi-vite/backend/main.py
@@ -1,15 +1,25 @@
 """FastAPI application entry point."""
 
+from __future__ import annotations
+
+from collections.abc import AsyncGenerator
+
+import agent
 import fastapi
 import fastapi.middleware.cors
-from routes import chat
+import fastapi.responses
+import pydantic
+import storage
 
-api = fastapi.FastAPI(
+import vercel_ai_sdk as ai
+import vercel_ai_sdk.ai_sdk_ui
+
+app = fastapi.FastAPI(
     title="py-ai-fastapi-chat",
     description="Chat demo using Python Vercel AI SDK",
 )
 
-api.add_middleware(
+app.add_middleware(
     fastapi.middleware.cors.CORSMiddleware,
     allow_origins=["*"],
     allow_credentials=True,
@@ -17,14 +27,54 @@
     allow_headers=["*"],
 )
 
-api.include_router(chat.router)
-
 
-@api.get("/health")
+@app.get("/health")
 async def health() -> dict[str, str]:
     """Health check endpoint."""
     return {"status": "ok"}
 
 
-app = fastapi.FastAPI()
-app.mount("/api", api)
+file_storage = storage.FileStorage()
+
+
+class ChatRequest(pydantic.BaseModel):
+    """Request body for the chat endpoint."""
+
+    messages: list[ai.ai_sdk_ui.UIMessage]
+    session_id: str | None = None
+
+
+@app.post("/chat")
+async def chat(request: ChatRequest) -> fastapi.responses.StreamingResponse:
+    """Handle chat requests and stream responses."""
+    messages = ai.ai_sdk_ui.to_messages(request.messages)
+    session_id = request.session_id or "default"
+    checkpoint_key = f"checkpoint:{session_id}"
+
+    llm = agent.get_llm()
+
+    # Checkpoints resume an *interrupted* run (e.g. a hook that needed
+    # user input in serverless mode).  Each normal chat turn is a fresh
+    # run — the frontend carries the full message history — so we only
+    # load a checkpoint when one was saved from a previous incomplete run.
+    saved = await file_storage.get(checkpoint_key)
+    checkpoint = ai.Checkpoint.model_validate(saved) if saved else None
+
+    result = ai.run(agent.graph, llm, messages, agent.TOOLS, checkpoint=checkpoint)
+
+    async def stream_response() -> AsyncGenerator[str]:
+        async for chunk in ai.ai_sdk_ui.to_sse_stream(result):
+            yield chunk
+
+        # If the run completed (no pending hooks), clear the checkpoint
+        # so the next request starts fresh.  If hooks are pending, save
+        # the checkpoint so the next request can resume from here.
+        if result.pending_hooks:
+            await file_storage.put(checkpoint_key, result.checkpoint.model_dump())
+        else:
+            await file_storage.delete(checkpoint_key)
+
+    return fastapi.responses.StreamingResponse(
+        stream_response(),
+        headers=ai.ai_sdk_ui.UI_MESSAGE_STREAM_HEADERS,
+    )
diff --git a/examples/fastapi-vite/backend/pyproject.toml b/examples/fastapi-vite/backend/pyproject.toml
index 1909ae57..a98fb231 100644
--- a/examples/fastapi-vite/backend/pyproject.toml
+++ b/examples/fastapi-vite/backend/pyproject.toml
@@ -5,5 +5,9 @@ description = "Chat demo using Python Vercel AI SDK with FastAPI"
 requires-python = ">=3.12"
 dependencies = [
     "fastapi[standard]>=0.128.1",
-    "vercel-ai-sdk>=0.0.1.dev5",
+    "vercel-ai-sdk",
+    # "vercel-ai-sdk>=0.0.1.dev5",
 ]
+
+[tool.uv.sources]
+vercel-ai-sdk = { path = "../../.." }
diff --git a/examples/fastapi-vite/backend/routes/__init__.py b/examples/fastapi-vite/backend/routes/__init__.py
deleted file mode 100644
index d212dab6..00000000
--- a/examples/fastapi-vite/backend/routes/__init__.py
+++ /dev/null
@@ -1 +0,0 @@
-# Routes package
diff --git a/examples/fastapi-vite/backend/routes/chat.py b/examples/fastapi-vite/backend/routes/chat.py
deleted file mode 100644
index 69b95d88..00000000
--- a/examples/fastapi-vite/backend/routes/chat.py
+++ /dev/null
@@ -1,60 +0,0 @@
-"""Chat route — streams LLM responses via the AI SDK UI protocol."""
-
-from __future__ import annotations
-
-from collections.abc import AsyncGenerator
-
-import agent
-import fastapi
-import fastapi.responses
-import pydantic
-import storage
-
-import vercel_ai_sdk as ai
-import vercel_ai_sdk.ai_sdk_ui
-
-router = fastapi.APIRouter()
-file_storage = storage.FileStorage()
-
-
-class ChatRequest(pydantic.BaseModel):
-    """Request body for the chat endpoint."""
-
-    messages: list[ai.ai_sdk_ui.UIMessage]
-    session_id: str | None = None
-
-
-@router.post("/chat")
-async def chat(request: ChatRequest) -> fastapi.responses.StreamingResponse:
-    """Handle chat requests and stream responses."""
-    messages = ai.ai_sdk_ui.to_messages(request.messages)
-    session_id = request.session_id or "default"
-    checkpoint_key = f"checkpoint:{session_id}"
-
-    llm = agent.get_llm()
-
-    # Checkpoints resume an *interrupted* run (e.g. a hook that needed
-    # user input in serverless mode).  Each normal chat turn is a fresh
-    # run — the frontend carries the full message history — so we only
-    # load a checkpoint when one was saved from a previous incomplete run.
-    saved = await file_storage.get(checkpoint_key)
-    checkpoint = ai.Checkpoint.model_validate(saved) if saved else None
-
-    result = ai.run(agent.graph, llm, messages, agent.TOOLS, checkpoint=checkpoint)
-
-    async def stream_response() -> AsyncGenerator[str]:
-        async for chunk in ai.ai_sdk_ui.to_sse_stream(result):
-            yield chunk
-
-        # If the run completed (no pending hooks), clear the checkpoint
-        # so the next request starts fresh.  If hooks are pending, save
-        # the checkpoint so the next request can resume from here.
-        if result.pending_hooks:
-            await file_storage.put(checkpoint_key, result.checkpoint.model_dump())
-        else:
-            await file_storage.delete(checkpoint_key)
-
-    return fastapi.responses.StreamingResponse(
-        stream_response(),
-        headers=ai.ai_sdk_ui.UI_MESSAGE_STREAM_HEADERS,
-    )
diff --git a/examples/fastapi-vite/backend/uv.lock b/examples/fastapi-vite/backend/uv.lock
index f27e1630..8075cde9 100644
--- a/examples/fastapi-vite/backend/uv.lock
+++ b/examples/fastapi-vite/backend/uv.lock
@@ -460,6 +460,18 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/0e/61/66938bbb5fc52dbdf84594873d5b51fb1f7c7794e9c0f5bd885f30bc507b/idna-3.11-py3-none-any.whl", hash = "sha256:771a87f49d9defaf64091e6e6fe9c18d4833f140bd19464795bc32d966ca37ea", size = 71008, upload-time = "2025-10-12T14:55:18.883Z" },
 ]
 
+[[package]]
+name = "importlib-metadata"
+version = "8.7.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "zipp" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/f3/49/3b30cad09e7771a4982d9975a8cbf64f00d4a1ececb53297f1d9a7be1b10/importlib_metadata-8.7.1.tar.gz", hash = "sha256:49fef1ae6440c182052f407c8d34a68f72efc36db9ca90dc0113398f2fdde8bb", size = 57107, upload-time = "2025-12-21T10:00:19.278Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/fa/5e/f8e9a1d23b9c20a551a8a02ea3637b4642e22c2626e3a13a9a29cdea99eb/importlib_metadata-8.7.1-py3-none-any.whl", hash = "sha256:5a1f80bf1daa489495071efbb095d75a634cf28a8bc299581244063b53176151", size = 27865, upload-time = "2025-12-21T10:00:18.329Z" },
+]
+
 [[package]]
 name = "jinja2"
 version = "3.1.6"
@@ -695,6 +707,19 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/b5/a0/cf4297aa51bbc21e83ef0ac018947fa06aea8f2364aad7c96cbf148590e6/openai-2.20.0-py3-none-any.whl", hash = "sha256:38d989c4b1075cd1f76abc68364059d822327cf1a932531d429795f4fc18be99", size = 1098479, upload-time = "2026-02-10T19:02:52.157Z" },
 ]
 
+[[package]]
+name = "opentelemetry-api"
+version = "1.39.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "importlib-metadata" },
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/97/b9/3161be15bb8e3ad01be8be5a968a9237c3027c5be504362ff800fca3e442/opentelemetry_api-1.39.1.tar.gz", hash = "sha256:fbde8c80e1b937a2c61f20347e91c0c18a1940cecf012d62e65a7caf08967c9c", size = 65767, upload-time = "2025-12-11T13:32:39.182Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/cf/df/d3f1ddf4bb4cb50ed9b1139cc7b1c54c34a1e7ce8fd1b9a37c0d1551a6bd/opentelemetry_api-1.39.1-py3-none-any.whl", hash = "sha256:2edd8463432a7f8443edce90972169b195e7d6a05500cd29e6d13898187c9950", size = 66356, upload-time = "2025-12-11T13:32:17.304Z" },
+]
+
 [[package]]
 name = "py-ai-fastapi-chat"
 version = "0.1.0"
@@ -707,7 +732,7 @@ dependencies = [
 [package.metadata]
 requires-dist = [
     { name = "fastapi", extras = ["standard"], specifier = ">=0.128.1" },
-    { name = "vercel-ai-sdk", specifier = ">=0.0.1.dev5" },
+    { name = "vercel-ai-sdk", directory = "../../../" },
 ]
 
 [[package]]
@@ -1319,18 +1344,37 @@ wheels = [
 [[package]]
 name = "vercel-ai-sdk"
 version = "0.0.1.dev5"
-source = { registry = "https://pypi.org/simple" }
+source = { directory = "../../../" }
 dependencies = [
     { name = "anthropic" },
     { name = "httpx" },
     { name = "mcp" },
     { name = "openai" },
+    { name = "opentelemetry-api" },
     { name = "pydantic" },
     { name = "vercel" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/b0/dd/3b399134076883247582af3919d5fbd38c9e270a42005fa27d1472705dd1/vercel_ai_sdk-0.0.1.dev5.tar.gz", hash = "sha256:998814780fc6163000be1b29e48dacbe710adb8a765636867bd6dd5a6b9b41b0", size = 37870, upload-time = "2026-02-25T16:31:01.844Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/c5/7a/f50dd25ed596c07c2222f2abd81c413169534904bfc4e735b1a5e7084870/vercel_ai_sdk-0.0.1.dev5-py3-none-any.whl", hash = "sha256:22de26c8b667738a825f812aa5b7042d741dd905033c16b3515f6123cd220245", size = 50938, upload-time = "2026-02-25T16:31:00.175Z" },
+
+[package.metadata]
+requires-dist = [
+    { name = "anthropic", specifier = ">=0.83.0" },
+    { name = "httpx", specifier = ">=0.28.1" },
+    { name = "mcp", specifier = ">=1.18.0" },
+    { name = "openai", specifier = ">=2.14.0" },
+    { name = "opentelemetry-api", specifier = ">=1.0" },
+    { name = "pydantic", specifier = ">=2.12.5" },
+    { name = "vercel", specifier = ">=0.3.8" },
+]
+
+[package.metadata.requires-dev]
+dev = [
+    { name = "mypy", specifier = ">=1.11" },
+    { name = "opentelemetry-sdk", specifier = ">=1.0" },
+    { name = "pytest", specifier = ">=8.0" },
+    { name = "pytest-asyncio", specifier = ">=0.24" },
+    { name = "python-dotenv", specifier = ">=1.2.1" },
+    { name = "rich", specifier = ">=14.2.0" },
+    { name = "ruff", specifier = ">=0.8" },
 ]
 
 [[package]]
@@ -1464,3 +1508,12 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/9f/3e/28135a24e384493fa804216b79a6a6759a38cc4ff59118787b9fb693df93/websockets-16.0-cp314-cp314t-win_amd64.whl", hash = "sha256:b14dc141ed6d2dde437cddb216004bcac6a1df0935d79656387bd41632ba0bbd", size = 178531, upload-time = "2026-01-10T09:23:35.016Z" },
     { url = "https://files.pythonhosted.org/packages/6f/28/258ebab549c2bf3e64d2b0217b973467394a9cea8c42f70418ca2c5d0d2e/websockets-16.0-py3-none-any.whl", hash = "sha256:1637db62fad1dc833276dded54215f2c7fa46912301a24bd94d45d46a011ceec", size = 171598, upload-time = "2026-01-10T09:23:45.395Z" },
 ]
+
+[[package]]
+name = "zipp"
+version = "3.23.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/e3/02/0f2892c661036d50ede074e376733dca2ae7c6eb617489437771209d4180/zipp-3.23.0.tar.gz", hash = "sha256:a07157588a12518c9d4034df3fbbee09c814741a33ff63c05fa29d26a2404166", size = 25547, upload-time = "2025-06-08T17:06:39.4Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/2e/54/647ade08bf0db230bfea292f893923872fd20be6ac6f53b2b936ba839d75/zipp-3.23.0-py3-none-any.whl", hash = "sha256:071652d6115ed432f5ce1d34c336c0adfd6a884660d1e9712a256d3d3bd4b14e", size = 10276, upload-time = "2025-06-08T17:06:38.034Z" },
+]
diff --git a/examples/fastapi-vite/frontend/vite.config.ts b/examples/fastapi-vite/frontend/vite.config.ts
index 39d31769..0cca23e1 100644
--- a/examples/fastapi-vite/frontend/vite.config.ts
+++ b/examples/fastapi-vite/frontend/vite.config.ts
@@ -11,9 +11,4 @@ export default defineConfig({
       '@': path.resolve(__dirname, './src'),
     },
   },
-  server: {
-    proxy: {
-      '/api': 'http://localhost:8000',
-    },
-  },
 })

From 8ca7b54849ad037e9269309d6c2569e58372beed Mon Sep 17 00:00:00 2001
From: Andrey Buzin <contactbuzin@gmail.com>
Date: Mon, 2 Mar 2026 17:22:47 -0800
Subject: [PATCH 03/10] Make human-in-the-loop work in the fastapi-vite example

---
 examples/fastapi-vite/README.md               |  17 +++
 examples/fastapi-vite/backend/agent.py        |  52 ++++++-
 examples/fastapi-vite/backend/main.py         |  67 +++++++--
 examples/fastapi-vite/frontend/src/App.tsx    |  80 +++++++++--
 .../components/ai-elements/confirmation.tsx   | 131 ++++++++++++++++++
 src/vercel_ai_sdk/ai_sdk_ui/adapter.py        |  18 +++
 6 files changed, 340 insertions(+), 25 deletions(-)
 create mode 100644 examples/fastapi-vite/frontend/src/components/ai-elements/confirmation.tsx

diff --git a/examples/fastapi-vite/README.md b/examples/fastapi-vite/README.md
index 7f75c5e5..e8552512 100644
--- a/examples/fastapi-vite/README.md
+++ b/examples/fastapi-vite/README.md
@@ -1,12 +1,29 @@
 # fastapi-chat
 
 Chat demo using the Python Vercel AI SDK with a FastAPI backend and React frontend.
+Includes **human-in-the-loop tool approval** — every tool call is gated
+behind user confirmation before execution.
 
 ## Stack
 
 - **Backend:** FastAPI + vercel-ai-sdk (Python 3.12)
 - **Frontend:** Vite + React + AI SDK UI + AI Elements
 
+## Human-in-the-Loop
+
+The agent graph in `backend/agent.py` uses the `ToolApproval` hook to
+suspend execution whenever the LLM wants to call a tool.  The flow is:
+
+1. LLM emits a tool call
+2. Backend creates a `ToolApproval` hook — this emits a
+   `tool-approval-request` event on the SSE stream and suspends execution
+3. The frontend renders Approve / Reject buttons via the
+   `<Confirmation>` component (from AI Elements)
+4. When the user clicks a button, `addToolApprovalResponse()` patches
+   the message and sends a new request with the decision
+5. The backend resumes from the checkpoint and either executes the tool
+   or marks it as denied
+
 ## Setup
 
 ```bash
diff --git a/examples/fastapi-vite/backend/agent.py b/examples/fastapi-vite/backend/agent.py
index 94ecd714..023a66d2 100644
--- a/examples/fastapi-vite/backend/agent.py
+++ b/examples/fastapi-vite/backend/agent.py
@@ -1,5 +1,10 @@
-"""Agent logic for the chat demo."""
+"""Agent logic for the chat demo.
 
+Demonstrates human-in-the-loop tool approval using ToolApproval hooks.
+Every tool call is gated behind user approval before execution.
+"""
+
+import asyncio
 from typing import Any
 
 import vercel_ai_sdk as ai
@@ -19,16 +24,49 @@ def get_llm() -> ai.LanguageModel:
 TOOLS: list[ai.Tool[..., Any]] = [talk_to_mothership]
 
 
+async def _execute_with_approval(
+    tc: ai.ToolPart, message: ai.Message | None = None
+) -> None:
+    """Execute a tool call only after the user grants approval.
+
+    Creates a ToolApproval hook that suspends execution until the
+    frontend responds with an approve/reject decision.
+    """
+    approval = await ai.ToolApproval.create(  # type: ignore[attr-defined]
+        f"approve_{tc.tool_call_id}",
+        metadata={"tool_name": tc.tool_name, "tool_args": tc.tool_args},
+    )
+
+    if approval.granted:
+        await ai.execute_tool(tc, message=message)
+    else:
+        tc.set_error("Tool call was denied by the user.")
+
+
 async def graph(
     llm: ai.LanguageModel,
     messages: list[ai.Message],
     tools: list[ai.Tool[..., Any]],
 ) -> ai.StreamResult:
-    """
-    Agent graph: stream LLM, execute tools, repeat until done.
+    """Agent graph with human-in-the-loop tool approval.
 
-    This is a plain async function that goes through the Runtime queue
-    via stream_loop. When hooks are added later, they slot in here
-    between tool calls — no structural change needed.
+    Loops: stream LLM -> request approval -> execute tools -> repeat.
+    The ToolApproval hook suspends execution and emits a
+    tool-approval-request event on the SSE stream.  The frontend displays
+    Approve / Reject buttons and sends the decision back on the next request.
     """
-    return await ai.stream_loop(llm, messages, tools)
+    local_messages = list(messages)
+
+    while True:
+        result = await ai.stream_step(llm, local_messages, tools)
+
+        if not result.tool_calls:
+            return result
+
+        last_msg = result.last_message
+        assert last_msg is not None
+        local_messages.append(last_msg)
+
+        await asyncio.gather(
+            *(_execute_with_approval(tc, message=last_msg) for tc in result.tool_calls)
+        )
diff --git a/examples/fastapi-vite/backend/main.py b/examples/fastapi-vite/backend/main.py
index 9ce7211a..8175dbbb 100644
--- a/examples/fastapi-vite/backend/main.py
+++ b/examples/fastapi-vite/backend/main.py
@@ -44,6 +44,29 @@ class ChatRequest(pydantic.BaseModel):
     session_id: str | None = None
 
 
+def _has_matching_approval(
+    ui_messages: list[ai.ai_sdk_ui.UIMessage],
+    pending_hooks: list[str],
+) -> bool:
+    """True when the incoming messages resolve at least one pending hook.
+
+    Hook labels follow the ``approve_{tool_call_id}`` convention set by
+    ``_execute_with_approval`` in the agent graph.
+    """
+    pending = set(pending_hooks)
+    for msg in ui_messages:
+        for part in msg.parts:
+            state = getattr(part, "state", None)
+            tcid = getattr(part, "tool_call_id", None)
+            if (
+                state == "approval-responded"
+                and tcid is not None
+                and f"approve_{tcid}" in pending
+            ):
+                return True
+    return False
+
+
 @app.post("/chat")
 async def chat(request: ChatRequest) -> fastapi.responses.StreamingResponse:
     """Handle chat requests and stream responses."""
@@ -53,24 +76,48 @@ async def chat(request: ChatRequest) -> fastapi.responses.StreamingResponse:
 
     llm = agent.get_llm()
 
-    # Checkpoints resume an *interrupted* run (e.g. a hook that needed
-    # user input in serverless mode).  Each normal chat turn is a fresh
-    # run — the frontend carries the full message history — so we only
-    # load a checkpoint when one was saved from a previous incomplete run.
+    # Only load a checkpoint when this request is actually resuming
+    # an interrupted run — i.e. the frontend is sending back an
+    # approval response that matches a pending hook.  Otherwise
+    # discard stale checkpoints so fresh turns aren't poisoned.
+    checkpoint = None
     saved = await file_storage.get(checkpoint_key)
-    checkpoint = ai.Checkpoint.model_validate(saved) if saved else None
+    if saved:
+        pending = saved.get("pending_hooks", [])
+        if _has_matching_approval(request.messages, pending):
+            checkpoint = ai.Checkpoint.model_validate(saved["checkpoint"])
+            # The frontend sends the full message history including the
+            # assistant message from the interrupted run.  The checkpoint
+            # will replay that same step, so strip the trailing assistant
+            # message to avoid sending a duplicate tool_use to the LLM.
+            if messages and messages[-1].role == "assistant":
+                messages = messages[:-1]
+        else:
+            await file_storage.delete(checkpoint_key)
 
-    result = ai.run(agent.graph, llm, messages, agent.TOOLS, checkpoint=checkpoint)
+    result = ai.run(
+        agent.graph,
+        llm,
+        messages,
+        agent.TOOLS,
+        checkpoint=checkpoint,
+        cancel_on_hooks=True,
+    )
 
     async def stream_response() -> AsyncGenerator[str]:
         async for chunk in ai.ai_sdk_ui.to_sse_stream(result):
             yield chunk
 
-        # If the run completed (no pending hooks), clear the checkpoint
-        # so the next request starts fresh.  If hooks are pending, save
-        # the checkpoint so the next request can resume from here.
+        # Save checkpoint + pending hook labels so the next request
+        # can decide whether it's a resume or a fresh turn.
         if result.pending_hooks:
-            await file_storage.put(checkpoint_key, result.checkpoint.model_dump())
+            await file_storage.put(
+                checkpoint_key,
+                {
+                    "checkpoint": result.checkpoint.model_dump(),
+                    "pending_hooks": list(result.pending_hooks.keys()),
+                },
+            )
         else:
             await file_storage.delete(checkpoint_key)
 
diff --git a/examples/fastapi-vite/frontend/src/App.tsx b/examples/fastapi-vite/frontend/src/App.tsx
index a7142590..0fedfd98 100644
--- a/examples/fastapi-vite/frontend/src/App.tsx
+++ b/examples/fastapi-vite/frontend/src/App.tsx
@@ -1,8 +1,21 @@
 import { useChat } from "@ai-sdk/react";
-import { DefaultChatTransport } from "ai";
+import {
+  DefaultChatTransport,
+  lastAssistantMessageIsCompleteWithApprovalResponses,
+} from "ai";
 import type { ToolUIPart } from "ai";
+import { CheckIcon, XIcon } from "lucide-react";
 import { Fragment } from "react";
 
+import {
+  Confirmation,
+  ConfirmationAccepted,
+  ConfirmationAction,
+  ConfirmationActions,
+  ConfirmationRejected,
+  ConfirmationRequest,
+  ConfirmationTitle,
+} from "@/components/ai-elements/confirmation";
 import {
   Conversation,
   ConversationContent,
@@ -29,11 +42,16 @@ import {
 import { TooltipProvider } from "@/components/ui/tooltip";
 
 export default function App() {
-  const { messages, sendMessage, status, stop } = useChat({
-    transport: new DefaultChatTransport({
-      api: "/api/chat",
-    }),
-  });
+  const { messages, sendMessage, addToolApprovalResponse, status, stop } =
+    useChat({
+      transport: new DefaultChatTransport({
+        api: "/api/chat",
+      }),
+      // After the user approves/rejects a tool, automatically send the
+      // updated messages back to the backend so it can resume execution.
+      sendAutomaticallyWhen:
+        lastAssistantMessageIsCompleteWithApprovalResponses,
+    });
 
   const isLoading = status === "submitted" || status === "streaming";
 
@@ -63,7 +81,8 @@ export default function App() {
                       // Handle tool parts (type starts with "tool-")
                       if (part.type.startsWith("tool-")) {
                         const toolPart = part as ToolUIPart;
-                        const isComplete = toolPart.state === "output-available";
+                        const isComplete =
+                          toolPart.state === "output-available";
 
                         return (
                           <Tool
@@ -76,6 +95,51 @@ export default function App() {
                             />
                             <ToolContent>
                               <ToolInput input={toolPart.input} />
+
+                              {/* Human-in-the-loop approval UI */}
+                              <Confirmation
+                                approval={toolPart.approval}
+                                state={toolPart.state}
+                              >
+                                <ConfirmationTitle>
+                                  <ConfirmationRequest>
+                                    Allow this tool to run?
+                                  </ConfirmationRequest>
+                                  <ConfirmationAccepted>
+                                    <CheckIcon className="size-4 text-green-500" />
+                                    <span>Approved</span>
+                                  </ConfirmationAccepted>
+                                  <ConfirmationRejected>
+                                    <XIcon className="size-4 text-destructive" />
+                                    <span>Rejected</span>
+                                  </ConfirmationRejected>
+                                </ConfirmationTitle>
+                                <ConfirmationActions>
+                                  <ConfirmationAction
+                                    variant="outline"
+                                    onClick={() =>
+                                      addToolApprovalResponse({
+                                        id: toolPart.approval!.id,
+                                        approved: false,
+                                      })
+                                    }
+                                  >
+                                    Reject
+                                  </ConfirmationAction>
+                                  <ConfirmationAction
+                                    variant="default"
+                                    onClick={() =>
+                                      addToolApprovalResponse({
+                                        id: toolPart.approval!.id,
+                                        approved: true,
+                                      })
+                                    }
+                                  >
+                                    Approve
+                                  </ConfirmationAction>
+                                </ConfirmationActions>
+                              </Confirmation>
+
                               <ToolOutput
                                 output={toolPart.output}
                                 errorText={toolPart.errorText}
@@ -86,7 +150,7 @@ export default function App() {
                       }
 
                       // Handle text parts
-                        if (part.type === "text") {
+                      if (part.type === "text") {
                         return (
                           <Message
                             key={`${message.id}-${partIndex}`}
diff --git a/examples/fastapi-vite/frontend/src/components/ai-elements/confirmation.tsx b/examples/fastapi-vite/frontend/src/components/ai-elements/confirmation.tsx
new file mode 100644
index 00000000..c537d1d3
--- /dev/null
+++ b/examples/fastapi-vite/frontend/src/components/ai-elements/confirmation.tsx
@@ -0,0 +1,131 @@
+"use client";
+
+import type { ToolUIPart } from "ai";
+import type { ComponentProps, ReactNode } from "react";
+
+import { Button } from "@/components/ui/button";
+import { cn } from "@/lib/utils";
+import { createContext, useContext } from "react";
+
+/* ------------------------------------------------------------------ */
+/* Context                                                             */
+/* ------------------------------------------------------------------ */
+
+type ToolUIPartApproval = ToolUIPart["approval"];
+
+interface ConfirmationContextValue {
+  approval: ToolUIPartApproval;
+  state: ToolUIPart["state"];
+}
+
+const ConfirmationContext = createContext<ConfirmationContextValue | null>(null);
+
+const useConfirmation = () => {
+  const ctx = useContext(ConfirmationContext);
+  if (!ctx) throw new Error("Confirmation components must be used within <Confirmation>");
+  return ctx;
+};
+
+/* ------------------------------------------------------------------ */
+/* <Confirmation>                                                      */
+/* ------------------------------------------------------------------ */
+
+export type ConfirmationProps = ComponentProps<"div"> & {
+  approval?: ToolUIPartApproval;
+  state: ToolUIPart["state"];
+};
+
+export const Confirmation = ({
+  className,
+  approval,
+  state,
+  children,
+  ...props
+}: ConfirmationProps) => {
+  if (!approval || state === "input-streaming" || state === "input-available") {
+    return null;
+  }
+
+  return (
+    <ConfirmationContext.Provider value={{ approval, state }}>
+      <div
+        className={cn(
+          "flex flex-col gap-2 rounded-md border p-3 text-sm",
+          className,
+        )}
+        {...props}
+      >
+        {children}
+      </div>
+    </ConfirmationContext.Provider>
+  );
+};
+
+/* ------------------------------------------------------------------ */
+/* <ConfirmationTitle>                                                 */
+/* ------------------------------------------------------------------ */
+
+export type ConfirmationTitleProps = ComponentProps<"p">;
+
+export const ConfirmationTitle = ({
+  className,
+  ...props
+}: ConfirmationTitleProps) => (
+  <p className={cn("inline-flex items-center gap-2", className)} {...props} />
+);
+
+/* ------------------------------------------------------------------ */
+/* State-conditional wrappers                                          */
+/* ------------------------------------------------------------------ */
+
+export const ConfirmationRequest = ({ children }: { children?: ReactNode }) => {
+  const { state } = useConfirmation();
+  return state === "approval-requested" ? <>{children}</> : null;
+};
+
+export const ConfirmationAccepted = ({ children }: { children?: ReactNode }) => {
+  const { approval, state } = useConfirmation();
+  const show =
+    approval?.approved === true &&
+    (state === "approval-responded" ||
+      state === "output-available" ||
+      state === "output-denied");
+  return show ? <>{children}</> : null;
+};
+
+export const ConfirmationRejected = ({ children }: { children?: ReactNode }) => {
+  const { approval, state } = useConfirmation();
+  const show =
+    approval?.approved === false &&
+    (state === "approval-responded" ||
+      state === "output-available" ||
+      state === "output-denied");
+  return show ? <>{children}</> : null;
+};
+
+/* ------------------------------------------------------------------ */
+/* Actions                                                             */
+/* ------------------------------------------------------------------ */
+
+export type ConfirmationActionsProps = ComponentProps<"div">;
+
+export const ConfirmationActions = ({
+  className,
+  ...props
+}: ConfirmationActionsProps) => {
+  const { state } = useConfirmation();
+  if (state !== "approval-requested") return null;
+
+  return (
+    <div
+      className={cn("flex items-center justify-end gap-2 self-end", className)}
+      {...props}
+    />
+  );
+};
+
+export type ConfirmationActionProps = ComponentProps<typeof Button>;
+
+export const ConfirmationAction = (props: ConfirmationActionProps) => (
+  <Button size="sm" type="button" {...props} />
+);
diff --git a/src/vercel_ai_sdk/ai_sdk_ui/adapter.py b/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
index f050e3d6..0dff4d94 100644
--- a/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
+++ b/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
@@ -149,6 +149,17 @@ def _tool_call_id_from_approval_hook(
     return None
 
 
+def _is_tool_approval_hook_message(msg: core.messages.Message) -> bool:
+    """True if this message contains only ToolApproval HookParts."""
+    if not msg.parts:
+        return False
+    return all(
+        isinstance(p, core.messages.HookPart)
+        and _tool_call_id_from_approval_hook(p) is not None
+        for p in msg.parts
+    )
+
+
 async def to_ui_message_stream(
     messages: AsyncIterable[core.messages.Message],
 ) -> AsyncGenerator[protocol.UIMessageStreamPart]:
@@ -161,6 +172,13 @@ async def to_ui_message_stream(
     state = _StreamState()
 
     async for msg in messages:
+        # Tool-approval hook messages are emitted by the Runtime as
+        # separate Message objects (with their own id).  To the frontend
+        # they belong to the *same* step as the tool call, so we pin
+        # the message id to avoid creating a spurious step boundary.
+        if _is_tool_approval_hook_message(msg) and state.message_id:
+            msg = msg.model_copy(update={"id": state.message_id})
+
         for part in state.begin_message(msg):
             yield part
 

From 2f176d9f0dc898e640b4acbd6bd54a745a512639 Mon Sep 17 00:00:00 2001
From: Andrey Buzin <contactbuzin@gmail.com>
Date: Mon, 2 Mar 2026 17:57:16 -0800
Subject: [PATCH 04/10] Update tests to correctly reflect the UI protocol for
 tool approval

---
 tests/ai_sdk_ui/test_adapter.py | 104 ++++++++++++++++++++++++++++++--
 1 file changed, 100 insertions(+), 4 deletions(-)

diff --git a/tests/ai_sdk_ui/test_adapter.py b/tests/ai_sdk_ui/test_adapter.py
index 68af026e..5eb92981 100644
--- a/tests/ai_sdk_ui/test_adapter.py
+++ b/tests/ai_sdk_ui/test_adapter.py
@@ -2,6 +2,7 @@
 Based on: .reference/ai/packages/ai/src/ui/process-ui-message-stream.test.ts
 """
 
+import asyncio
 from collections.abc import AsyncGenerator
 
 import pytest
@@ -10,7 +11,7 @@
 from vercel_ai_sdk.ai_sdk_ui import adapter, ui_message
 from vercel_ai_sdk.core import hooks, messages
 
-from ..conftest import MockLLM
+from ..conftest import MockLLM, tool_msg
 
 
 async def get_event_types(msgs: list[messages.Message]) -> list[str]:
@@ -501,7 +502,14 @@ def test_ui_skips_unsupported_parts() -> None:
 
 @pytest.mark.asyncio
 async def test_tool_approval_hook_emits_approval_request() -> None:
-    """Pending ToolApproval HookPart emits tool-approval-request on the wire."""
+    """Pending ToolApproval HookPart emits tool-approval-request on the wire.
+
+    The HookPart message uses a *different* id from the tool message,
+    matching what the Runtime actually does (it creates an ad-hoc Message
+    with its own auto-generated id at runtime.py:452).  The adapter must
+    keep both in the same step so the frontend's sendAutomaticallyWhen
+    helper can find the tool part when the user responds to the approval.
+    """
     msgs = [
         # Tool pending (args complete, awaiting approval)
         messages.Message(
@@ -517,9 +525,10 @@ async def test_tool_approval_hook_emits_approval_request() -> None:
                 ),
             ],
         ),
-        # Hook pending (approval requested)
+        # Hook pending (approval requested) — different message id,
+        # just like the Runtime produces at runtime.py:452.
         messages.Message(
-            id="msg-1",
+            id="hook-msg-1",
             role="assistant",
             parts=[
                 messages.HookPart(
@@ -533,6 +542,8 @@ async def test_tool_approval_hook_emits_approval_request() -> None:
     ]
 
     event_types = await get_event_types(msgs)
+    # tool-approval-request must be in the SAME step as the tool input —
+    # no extra start-step/finish-step between them.
     assert event_types == [
         "start",
         "start-step",
@@ -577,3 +588,88 @@ def test_approval_responded_resolves_hook() -> None:
     assert label in hooks._pending_resolutions
     resolution = hooks._pending_resolutions.pop(label)
     assert resolution == {"granted": True, "reason": "looks safe"}
+
+
+@pytest.mark.asyncio
+async def test_runtime_tool_approval_same_step() -> None:
+    """E2E: tool-approval-request must land in the same SSE step as the tool call.
+
+    Runs a graph with ToolApproval through ai.run(cancel_on_hooks=True),
+    collects runtime messages, streams through the adapter, and asserts
+    that no spurious step boundary appears between tool-input-available
+    and tool-approval-request.
+
+    This is the test that would have caught the bug where the Runtime's
+    HookPart message (which has a different id from the LLM message)
+    caused the adapter to open a new step.
+    """
+
+    @ai.tool
+    async def dangerous_action(path: str) -> str:
+        """Do something dangerous."""
+        return f"deleted {path}"
+
+    async def graph(llm: ai.LanguageModel) -> None:
+        result = await ai.stream_step(
+            llm,
+            ai.make_messages(system="You are helpful.", user="delete /tmp"),
+            [dangerous_action],
+        )
+        if not result.tool_calls:
+            return
+
+        last_msg = result.last_message
+        assert last_msg is not None
+
+        async def approve_and_execute(tc: ai.ToolPart) -> None:
+            approval = await ai.ToolApproval.create(  # type: ignore[attr-defined]
+                f"approve_{tc.tool_call_id}",
+                metadata={"tool_name": tc.tool_name},
+            )
+            if approval.granted:
+                await ai.execute_tool(tc, message=last_msg)
+            else:
+                tc.set_error("denied")
+
+        await asyncio.gather(*(approve_and_execute(tc) for tc in result.tool_calls))
+
+    mock_llm = MockLLM(
+        [
+            [
+                tool_msg(
+                    tc_id="tc-1",
+                    name="dangerous_action",
+                    args='{"path": "/tmp"}',
+                )
+            ],
+        ]
+    )
+
+    runtime_messages: list[messages.Message] = []
+    result = ai.run(graph, mock_llm, cancel_on_hooks=True)
+    async for msg in result:
+        runtime_messages.append(msg)
+
+    # The run should have a pending hook (approval not yet granted)
+    assert "approve_tc-1" in result.pending_hooks
+
+    # Stream through UI adapter
+    event_types = [
+        p.type
+        async for p in adapter.to_ui_message_stream(_async_iter(runtime_messages))
+    ]
+
+    # tool-approval-request must be in the SAME step as tool-input.
+    # If a spurious step boundary sneaks in, we'd see:
+    #   [..., "tool-input-available", "finish-step", "start-step",
+    #    "tool-approval-request", ...]
+    # which breaks the frontend's sendAutomaticallyWhen helper.
+    assert event_types == [
+        "start",
+        "start-step",
+        "tool-input-start",
+        "tool-input-available",
+        "tool-approval-request",
+        "finish-step",
+        "finish",
+    ]

From 62b99a0e63444cb61c7640e947d0bf2dabaa507c Mon Sep 17 00:00:00 2001
From: Andrey Buzin <contactbuzin@gmail.com>
Date: Tue, 3 Mar 2026 12:03:56 -0800
Subject: [PATCH 05/10] Fix the Anthropic adapter and AI SDK UI bug causing
 message corruption

---
 src/vercel_ai_sdk/ai_sdk_ui/adapter.py  |  56 ++++-
 src/vercel_ai_sdk/anthropic/__init__.py |  65 ++++--
 src/vercel_ai_sdk/openai/__init__.py    |  22 +-
 tests/ai_sdk_ui/test_adapter.py         |  42 ++--
 tests/anthropic/test_anthropic.py       | 275 ++++++++++++++++++++++++
 5 files changed, 407 insertions(+), 53 deletions(-)
 create mode 100644 tests/anthropic/test_anthropic.py

diff --git a/src/vercel_ai_sdk/ai_sdk_ui/adapter.py b/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
index 0dff4d94..9d1b98e2 100644
--- a/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
+++ b/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
@@ -474,12 +474,56 @@ def to_messages(
                 "User and system messages require non-empty content."
             )
 
-        result.append(
-            core.messages.Message(
-                id=ui_msg.id,
-                role=ui_msg.role,
-                parts=internal_parts,
+        # The UI sends one assistant message per conversation turn, but a
+        # single turn may span multiple stream_loop iterations (e.g.
+        # [text, tool(done), text, tool(done), text]).  LLM APIs expect
+        # one message per iteration, so split at completed-tool boundaries.
+        if ui_msg.role == "assistant":
+            result.extend(_split_assistant_parts(internal_parts, msg_id=ui_msg.id))
+        else:
+            result.append(
+                core.messages.Message(
+                    id=ui_msg.id,
+                    role=ui_msg.role,
+                    parts=internal_parts,
+                )
             )
-        )
 
     return result
+
+
+def _split_assistant_parts(
+    parts: list[core.messages.Part],
+    msg_id: str,
+) -> list[core.messages.Message]:
+    """Split assistant parts at completed-tool → non-tool boundaries.
+
+    Returns one ``Message`` per ``stream_loop`` iteration so that LLM
+    adapters receive correctly-shaped single-iteration messages.
+    """
+    messages: list[core.messages.Message] = []
+    current: list[core.messages.Part] = []
+    has_completed_tool = False
+
+    for part in parts:
+        if has_completed_tool and not isinstance(part, core.messages.ToolPart):
+            messages.append(
+                core.messages.Message(role="assistant", parts=current, id=msg_id)
+            )
+            current = []
+            has_completed_tool = False
+
+        current.append(part)
+
+        if isinstance(part, core.messages.ToolPart) and part.status in (
+            "result",
+            "error",
+        ):
+            has_completed_tool = True
+
+    if current:
+        messages.append(
+            core.messages.Message(role="assistant", parts=current, id=msg_id)
+        )
+
+    return messages
diff --git a/src/vercel_ai_sdk/anthropic/__init__.py b/src/vercel_ai_sdk/anthropic/__init__.py
index bce6f5f6..f0be21f8 100644
--- a/src/vercel_ai_sdk/anthropic/__init__.py
+++ b/src/vercel_ai_sdk/anthropic/__init__.py
@@ -28,12 +28,16 @@ def _messages_to_anthropic(
 ) -> tuple[str | None, list[dict[str, Any]]]:
     """Convert internal messages to Anthropic API format.
 
-    Returns (system_prompt, messages) tuple since Anthropic handles system differently.
+    Returns (system_prompt, messages) tuple since Anthropic handles
+    system prompts separately.
 
-    Handles the unified ToolPart model where tool calls and results are in the same
-    assistant message. Converts back to Anthropic's expected format:
-    - tool_use blocks in assistant messages
-    - tool_result blocks in user messages (after the assistant message)
+    Converts to the Anthropic wire format:
+
+    - ``tool_use`` blocks in assistant messages
+    - ``tool_result`` blocks in user messages (immediately after)
+
+    A final merge pass ensures strictly alternating roles (Anthropic
+    rejects consecutive same-role messages).
     """
     system_prompt: str | None = None
     result: list[dict[str, Any]] = []
@@ -49,8 +53,6 @@ def _messages_to_anthropic(
 
             for part in msg.parts:
                 if isinstance(part, core.messages.ReasoningPart):
-                    # Only include thinking blocks if we have the signature
-                    # (required by Anthropic API for multi-turn conversations)
                     if part.signature:
                         content.append(
                             {
@@ -62,7 +64,6 @@ def _messages_to_anthropic(
                 elif isinstance(part, core.messages.TextPart):
                     content.append({"type": "text", "text": part.text})
                 elif isinstance(part, core.messages.ToolPart):
-                    # tool_args is a JSON string, but Anthropic expects input as a dict
                     tool_input = json.loads(part.tool_args) if part.tool_args else {}
                     content.append(
                         {
@@ -72,12 +73,13 @@ def _messages_to_anthropic(
                             "input": tool_input,
                         }
                     )
-                    # If tool has completed (success or error), collect for user message
-                    if part.status in ("result", "error") and part.result is not None:
+                    if part.status in ("result", "error"):
                         entry: dict[str, Any] = {
                             "type": "tool_result",
                             "tool_use_id": part.tool_call_id,
-                            "content": str(part.result),
+                            "content": str(part.result)
+                            if part.result is not None
+                            else "",
                         }
                         if part.status == "error":
                             entry["is_error"] = True
@@ -85,8 +87,6 @@ def _messages_to_anthropic(
 
             if content:
                 result.append({"role": "assistant", "content": content})
-
-            # Emit tool results as a separate user message (Anthropic API format)
             if tool_results:
                 result.append({"role": "user", "content": tool_results})
         else:
@@ -96,9 +96,48 @@ def _messages_to_anthropic(
             )
             result.append({"role": "user", "content": content_text})
 
+    # Merge consecutive same-role messages (e.g. synthetic user(tool_result)
+    # followed by a real user message).
+    result = _merge_consecutive_roles(result)
+
     return system_prompt, result
 
 
+def _merge_consecutive_roles(
+    messages: list[dict[str, Any]],
+) -> list[dict[str, Any]]:
+    """Merge consecutive messages that share the same role.
+
+    Anthropic requires strictly alternating user/assistant roles.  When
+    our conversion emits a synthetic ``user`` message for ``tool_result``
+    blocks followed by a real ``user`` message, they must be merged.
+
+    Content is normalized to list-of-blocks so heterogeneous content
+    (tool_result dicts + text strings) can coexist.
+    """
+    if not messages:
+        return messages
+
+    merged: list[dict[str, Any]] = [messages[0]]
+
+    for msg in messages[1:]:
+        if msg["role"] == merged[-1]["role"]:
+            prev = _to_content_list(merged[-1]["content"])
+            cur = _to_content_list(msg["content"])
+            merged[-1]["content"] = prev + cur
+        else:
+            merged.append(msg)
+
+    return merged
+
+
+def _to_content_list(content: Any) -> list[dict[str, Any]]:
+    """Normalize Anthropic message content to list-of-blocks format."""
+    if isinstance(content, list):
+        return list(content)
+    return [{"type": "text", "text": content}]
+
+
 class AnthropicModel(core.llm.LanguageModel):
     """Anthropic adapter with native extended thinking support."""
 
diff --git a/src/vercel_ai_sdk/openai/__init__.py b/src/vercel_ai_sdk/openai/__init__.py
index 1b42b50e..545a76e0 100644
--- a/src/vercel_ai_sdk/openai/__init__.py
+++ b/src/vercel_ai_sdk/openai/__init__.py
@@ -29,14 +29,13 @@ def _tools_to_openai(tools: Sequence[core.tools.ToolLike]) -> list[dict[str, Any
 def _messages_to_openai(messages: list[core.messages.Message]) -> list[dict[str, Any]]:
     """Convert internal messages to OpenAI API format.
 
-    The Vercel AI Gateway preserves reasoning details across interactions,
-    normalizing formats from different providers. This is useful for tool
-    calling workflows where the model needs to resume its thought process.
+    Converts to the OpenAI wire format:
+
+    - ``tool_calls`` on assistant messages
+    - tool results as separate ``role: "tool"`` messages
 
-    Handles the unified ToolPart model where tool calls and results are in the same
-    assistant message. Converts back to OpenAI's expected format:
-    - tool_calls in assistant messages
-    - tool results as separate tool role messages
+    The Vercel AI Gateway preserves reasoning details across interactions,
+    normalizing formats from different providers.
 
     See: https://vercel.com/docs/ai-gateway/openai-compat/advanced
     """
@@ -64,21 +63,20 @@ def _messages_to_openai(messages: list[core.messages.Message]) -> list[dict[str,
                             },
                         }
                     )
-                    # If tool has completed (success or error),
-                    # collect for tool messages
-                    if part.status in ("result", "error") and part.result is not None:
+                    if part.status in ("result", "error"):
                         tool_results.append(
                             {
                                 "role": "tool",
                                 "tool_call_id": part.tool_call_id,
-                                "content": str(part.result),
+                                "content": str(part.result)
+                                if part.result is not None
+                                else "",
                             }
                         )
 
             entry: dict[str, Any] = {"role": "assistant"}
             if content:
                 entry["content"] = content
-            # Include reasoning for multi-turn context (gateway preserves this)
             if reasoning:
                 entry["reasoning"] = reasoning
             if tool_calls:
diff --git a/tests/ai_sdk_ui/test_adapter.py b/tests/ai_sdk_ui/test_adapter.py
index 5eb92981..d5197534 100644
--- a/tests/ai_sdk_ui/test_adapter.py
+++ b/tests/ai_sdk_ui/test_adapter.py
@@ -419,33 +419,31 @@ def test_ui_to_internal_two_turn_with_tool() -> None:
     # Convert to internal format
     internal = adapter.to_messages(ui_messages)
 
-    # Verify conversion
-    assert len(internal) == 3
+    # The single UI assistant message contains [text, tool(done), text] from
+    # two stream_loop iterations.  to_messages splits at the tool-result
+    # boundary so LLM adapters receive one message per iteration.
+    assert len(internal) == 4
     assert internal[0].role == "user"
     assert internal[0].text == "when will the robots take over?"
 
+    # First iteration: text + tool call
     assert internal[1].role == "assistant"
-    # Should have text parts (non-empty) and tool part
-    # step-start and empty text parts should be skipped
-    text_parts = [p for p in internal[1].parts if isinstance(p, messages.TextPart)]
-    tool_parts = internal[1].tool_calls
-
-    assert len(text_parts) == 2  # Two non-empty text parts
-    assert (
-        text_parts[0].text
-        == "I'll check with the mothership about this important question."
+    assert internal[1].text == (
+        "I'll check with the mothership about this important question."
     )
-    assert text_parts[1].text == "The mothership has spoken: Soon."
-
-    assert len(tool_parts) == 1
-    assert tool_parts[0].tool_name == "talk_to_mothership"
-    assert tool_parts[0].tool_call_id == "toolu_01FiXNXhq1kHx4TegRjSaJyv"
-    assert tool_parts[0].status == "result"  # output-available maps to result
-    # Non-dict results are wrapped in {"value": ...} for internal ToolPart compatibility
-    assert tool_parts[0].result == {"value": "Soon."}
-
-    assert internal[2].role == "user"
-    assert internal[2].text == "this is a test run. can you remember the first turn?"
+    assert len(internal[1].tool_calls) == 1
+    assert internal[1].tool_calls[0].tool_name == "talk_to_mothership"
+    assert internal[1].tool_calls[0].tool_call_id == "toolu_01FiXNXhq1kHx4TegRjSaJyv"
+    assert internal[1].tool_calls[0].status == "result"
+    assert internal[1].tool_calls[0].result == {"value": "Soon."}
+
+    # Second iteration: follow-up text
+    assert internal[2].role == "assistant"
+    assert internal[2].text == "The mothership has spoken: Soon."
+    assert len(internal[2].tool_calls) == 0
+
+    assert internal[3].role == "user"
+    assert internal[3].text == "this is a test run. can you remember the first turn?"
 
 
 def test_ui_tool_part_with_dict_input() -> None:
diff --git a/tests/anthropic/test_anthropic.py b/tests/anthropic/test_anthropic.py
new file mode 100644
index 00000000..42127961
--- /dev/null
+++ b/tests/anthropic/test_anthropic.py
@@ -0,0 +1,275 @@
+"""Anthropic provider: _messages_to_anthropic conversion tests."""
+
+from vercel_ai_sdk.anthropic import _messages_to_anthropic
+from vercel_ai_sdk.core.messages import Message, ReasoningPart, TextPart, ToolPart
+
+
+def test_tool_result_none_still_emits_tool_result():
+    """A tool that returns None must still produce a tool_result block.
+
+    Regression: when part.result is None the converter skipped the tool_result,
+    leaving a tool_use without a matching tool_result.  Anthropic rejects this
+    with: "tool_use ids were found without tool_result blocks immediately after".
+    """
+    tool_part = ToolPart(
+        tool_call_id="toolu_01abc",
+        tool_name="send_notification",
+        tool_args="{}",
+    )
+    tool_part.set_result(None)  # tool returned None (fire-and-forget style)
+
+    messages = [
+        Message(role="assistant", parts=[tool_part]),
+    ]
+
+    _system, anthropic_msgs = _messages_to_anthropic(messages)
+
+    # Should have: assistant message with tool_use, then user message with tool_result
+    assert len(anthropic_msgs) == 2, (
+        f"Expected 2 messages (assistant + user/tool_result), got {len(anthropic_msgs)}: {anthropic_msgs}"
+    )
+
+    assistant_msg = anthropic_msgs[0]
+    assert assistant_msg["role"] == "assistant"
+    assert any(block["type"] == "tool_use" for block in assistant_msg["content"])
+
+    user_msg = anthropic_msgs[1]
+    assert user_msg["role"] == "user"
+    tool_results = [b for b in user_msg["content"] if b["type"] == "tool_result"]
+    assert len(tool_results) == 1
+    assert tool_results[0]["tool_use_id"] == "toolu_01abc"
+
+
+def test_tool_with_normal_result():
+    """Baseline: a tool with a normal result produces the correct pair."""
+    tool_part = ToolPart(
+        tool_call_id="toolu_02xyz",
+        tool_name="get_weather",
+        tool_args='{"city": "SF"}',
+    )
+    tool_part.set_result({"temp": 62})
+
+    messages = [
+        Message(role="assistant", parts=[tool_part]),
+    ]
+
+    _system, anthropic_msgs = _messages_to_anthropic(messages)
+
+    assert len(anthropic_msgs) == 2
+    assert anthropic_msgs[1]["content"][0]["content"] == "{'temp': 62}"
+
+
+def test_tool_error_produces_tool_result():
+    """Tool errors must also produce a tool_result block (with is_error=True)."""
+    tool_part = ToolPart(
+        tool_call_id="toolu_03err",
+        tool_name="failing_tool",
+        tool_args="{}",
+    )
+    tool_part.set_error("Connection timeout")
+
+    messages = [
+        Message(role="assistant", parts=[tool_part]),
+    ]
+
+    _system, anthropic_msgs = _messages_to_anthropic(messages)
+
+    assert len(anthropic_msgs) == 2
+    tool_result = anthropic_msgs[1]["content"][0]
+    assert tool_result["type"] == "tool_result"
+    assert tool_result["is_error"] is True
+    assert tool_result["content"] == "Connection timeout"
+
+
+def test_multiple_tools_one_returns_none():
+    """When one of several tools returns None, all must have tool_results."""
+    tool_a = ToolPart(
+        tool_call_id="toolu_a",
+        tool_name="tool_a",
+        tool_args="{}",
+    )
+    tool_a.set_result("some result")
+
+    tool_b = ToolPart(
+        tool_call_id="toolu_b",
+        tool_name="tool_b",
+        tool_args="{}",
+    )
+    tool_b.set_result(None)  # returns None
+
+    messages = [
+        Message(role="assistant", parts=[tool_a, tool_b]),
+    ]
+
+    _system, anthropic_msgs = _messages_to_anthropic(messages)
+
+    assert len(anthropic_msgs) == 2
+
+    # Both tool_use blocks in assistant message
+    tool_uses = [b for b in anthropic_msgs[0]["content"] if b["type"] == "tool_use"]
+    assert len(tool_uses) == 2
+
+    # Both tool_result blocks in user message
+    tool_results = [
+        b for b in anthropic_msgs[1]["content"] if b["type"] == "tool_result"
+    ]
+    assert len(tool_results) == 2
+
+    result_ids = {r["tool_use_id"] for r in tool_results}
+    assert result_ids == {"toolu_a", "toolu_b"}
+
+
+# -- Multi-turn: consecutive user messages (tool_result + next user) -------
+
+
+def test_multi_turn_no_consecutive_same_role_messages():
+    """Multi-turn with tools must not produce consecutive same-role messages.
+
+    Regression: when a previous assistant turn includes a tool call (with
+    result), _messages_to_anthropic emits:
+      [assistant(tool_use)] [user(tool_result)] [user(next question)]
+    The two consecutive user messages violate Anthropic's alternating-role
+    requirement, causing: "tool_use ids were found without tool_result
+    blocks immediately after".
+
+    The tool_result user message must be merged with the following user
+    message (or otherwise avoid consecutive same-role messages).
+    """
+    tool = ToolPart(
+        tool_call_id="toolu_01abc",
+        tool_name="talk_to_mothership",
+        tool_args='{"question": "when?"}',
+    )
+    tool.set_result({"value": "Soon."})
+
+    messages = [
+        Message(role="user", parts=[TextPart(text="when will the robots take over?")]),
+        Message(
+            role="assistant",
+            parts=[
+                TextPart(text="I'll check with the mothership."),
+                tool,
+                TextPart(text="The mothership has spoken: Soon."),
+            ],
+        ),
+        Message(
+            role="user",
+            parts=[TextPart(text="can you remember the first turn?")],
+        ),
+    ]
+
+    _system, anthropic_msgs = _messages_to_anthropic(messages)
+
+    # Verify no consecutive same-role messages
+    for i in range(1, len(anthropic_msgs)):
+        assert anthropic_msgs[i]["role"] != anthropic_msgs[i - 1]["role"], (
+            f"Consecutive same-role messages at indices {i - 1} and {i}: "
+            f"both are '{anthropic_msgs[i]['role']}'. "
+            f"Full messages: {anthropic_msgs}"
+        )
+
+
+def test_multi_turn_tool_result_before_user_merged():
+    """When tool_result (user) is followed by a user message, they merge.
+
+    The merged user message should contain both the tool_result blocks
+    and the text content from the following user message.
+    """
+    tool = ToolPart(
+        tool_call_id="toolu_01abc",
+        tool_name="get_weather",
+        tool_args='{"city": "SF"}',
+    )
+    tool.set_result("Sunny, 62F")
+
+    messages = [
+        Message(role="user", parts=[TextPart(text="what's the weather?")]),
+        Message(role="assistant", parts=[tool]),
+        Message(role="user", parts=[TextPart(text="thanks, what about tomorrow?")]),
+    ]
+
+    _system, anthropic_msgs = _messages_to_anthropic(messages)
+
+    # Should be: user, assistant, user (tool_result + text)
+    assert len(anthropic_msgs) == 3
+    assert anthropic_msgs[0]["role"] == "user"
+    assert anthropic_msgs[1]["role"] == "assistant"
+    assert anthropic_msgs[2]["role"] == "user"
+
+    # The merged user message should contain the tool_result
+    user_content = anthropic_msgs[2]["content"]
+    assert isinstance(user_content, list)
+    tool_results = [b for b in user_content if b.get("type") == "tool_result"]
+    assert len(tool_results) == 1
+    assert tool_results[0]["tool_use_id"] == "toolu_01abc"
+
+
+def test_stream_loop_second_iteration_messages():
+    """Simulates what stream_loop sends on the 2nd LLM call in a multi-turn.
+
+    After the first stream_step returns a tool call, stream_loop appends
+    the assistant message (now with status=result after execute_tool) and
+    calls stream_step again.  The messages must not have consecutive
+    same-role entries.
+    """
+    tool = ToolPart(
+        tool_call_id="toolu_01abc",
+        tool_name="talk_to_mothership",
+        tool_args='{"question": "test"}',
+    )
+    tool.set_result("answer")
+
+    # These are the messages that stream_loop would pass to the 2nd stream_step:
+    # original user messages + assistant message from 1st step (with tool result)
+    messages = [
+        Message(role="user", parts=[TextPart(text="ask the mothership")]),
+        Message(role="assistant", parts=[tool]),
+        # No user message follows — this is the loop, not a new user turn
+    ]
+
+    _system, anthropic_msgs = _messages_to_anthropic(messages)
+
+    # Should be: user, assistant(tool_use), user(tool_result)
+    assert len(anthropic_msgs) == 3
+    assert anthropic_msgs[0]["role"] == "user"
+    assert anthropic_msgs[1]["role"] == "assistant"
+    assert anthropic_msgs[2]["role"] == "user"
+
+    # Verify the tool_result is present
+    tool_results = [
+        b for b in anthropic_msgs[2]["content"] if b.get("type") == "tool_result"
+    ]
+    assert len(tool_results) == 1
+
+
+def test_pending_tool_does_not_emit_tool_result():
+    """A tool with status='pending' must not produce a tool_result block.
+
+    When stream_step returns a message mid-stream (before tool execution),
+    the ToolPart has status='pending'.  The converter must emit only
+    the tool_use block — no tool_result.
+    """
+    tool = ToolPart(
+        tool_call_id="toolu_pending",
+        tool_name="slow_tool",
+        tool_args='{"x": 1}',
+    )
+    # Don't call set_result — status stays "pending"
+
+    messages = [
+        Message(role="user", parts=[TextPart(text="do something")]),
+        Message(role="assistant", parts=[tool]),
+    ]
+
+    _system, anthropic_msgs = _messages_to_anthropic(messages)
+
+    # assistant message with tool_use, but NO user message with tool_result
+    assert len(anthropic_msgs) == 2
+    assert anthropic_msgs[0]["role"] == "user"
+    assert anthropic_msgs[1]["role"] == "assistant"
+    assert any(b["type"] == "tool_use" for b in anthropic_msgs[1]["content"])
+
+    # No tool_result anywhere
+    for msg in anthropic_msgs:
+        if isinstance(msg["content"], list):
+            assert not any(b.get("type") == "tool_result" for b in msg["content"])

From 8ce149332468a68379e9bb9b79a1ca520a71f82b Mon Sep 17 00:00:00 2001
From: Andrey Buzin <contactbuzin@gmail.com>
Date: Tue, 3 Mar 2026 14:24:07 -0800
Subject: [PATCH 06/10] Update the checkpoint API to tuck in staleness checking
 logic

---
 examples/fastapi-vite/backend/main.py  | 48 ++------------------------
 src/vercel_ai_sdk/__init__.py          |  3 +-
 src/vercel_ai_sdk/ai_sdk_ui/adapter.py | 13 +++++++
 src/vercel_ai_sdk/core/checkpoint.py   |  9 +++++
 src/vercel_ai_sdk/core/runtime.py      | 21 ++++++++++-
 5 files changed, 47 insertions(+), 47 deletions(-)

diff --git a/examples/fastapi-vite/backend/main.py b/examples/fastapi-vite/backend/main.py
index 8175dbbb..d34322f4 100644
--- a/examples/fastapi-vite/backend/main.py
+++ b/examples/fastapi-vite/backend/main.py
@@ -44,29 +44,6 @@ class ChatRequest(pydantic.BaseModel):
     session_id: str | None = None
 
 
-def _has_matching_approval(
-    ui_messages: list[ai.ai_sdk_ui.UIMessage],
-    pending_hooks: list[str],
-) -> bool:
-    """True when the incoming messages resolve at least one pending hook.
-
-    Hook labels follow the ``approve_{tool_call_id}`` convention set by
-    ``_execute_with_approval`` in the agent graph.
-    """
-    pending = set(pending_hooks)
-    for msg in ui_messages:
-        for part in msg.parts:
-            state = getattr(part, "state", None)
-            tcid = getattr(part, "tool_call_id", None)
-            if (
-                state == "approval-responded"
-                and tcid is not None
-                and f"approve_{tcid}" in pending
-            ):
-                return True
-    return False
-
-
 @app.post("/chat")
 async def chat(request: ChatRequest) -> fastapi.responses.StreamingResponse:
     """Handle chat requests and stream responses."""
@@ -76,24 +53,10 @@ async def chat(request: ChatRequest) -> fastapi.responses.StreamingResponse:
 
     llm = agent.get_llm()
 
-    # Only load a checkpoint when this request is actually resuming
-    # an interrupted run — i.e. the frontend is sending back an
-    # approval response that matches a pending hook.  Otherwise
-    # discard stale checkpoints so fresh turns aren't poisoned.
     checkpoint = None
     saved = await file_storage.get(checkpoint_key)
     if saved:
-        pending = saved.get("pending_hooks", [])
-        if _has_matching_approval(request.messages, pending):
-            checkpoint = ai.Checkpoint.model_validate(saved["checkpoint"])
-            # The frontend sends the full message history including the
-            # assistant message from the interrupted run.  The checkpoint
-            # will replay that same step, so strip the trailing assistant
-            # message to avoid sending a duplicate tool_use to the LLM.
-            if messages and messages[-1].role == "assistant":
-                messages = messages[:-1]
-        else:
-            await file_storage.delete(checkpoint_key)
+        checkpoint = ai.Checkpoint.model_validate(saved)
 
     result = ai.run(
         agent.graph,
@@ -108,15 +71,10 @@ async def stream_response() -> AsyncGenerator[str]:
         async for chunk in ai.ai_sdk_ui.to_sse_stream(result):
             yield chunk
 
-        # Save checkpoint + pending hook labels so the next request
-        # can decide whether it's a resume or a fresh turn.
-        if result.pending_hooks:
+        if result.checkpoint.pending_hooks:
             await file_storage.put(
                 checkpoint_key,
-                {
-                    "checkpoint": result.checkpoint.model_dump(),
-                    "pending_hooks": list(result.pending_hooks.keys()),
-                },
+                result.checkpoint.model_dump(),
             )
         else:
             await file_storage.delete(checkpoint_key)
diff --git a/src/vercel_ai_sdk/__init__.py b/src/vercel_ai_sdk/__init__.py
index 35f444d2..3d175a1f 100644
--- a/src/vercel_ai_sdk/__init__.py
+++ b/src/vercel_ai_sdk/__init__.py
@@ -1,6 +1,6 @@
 from . import ai_gateway, ai_sdk_ui, anthropic, mcp, openai
 from .core import telemetry
-from .core.checkpoint import Checkpoint
+from .core.checkpoint import Checkpoint, PendingHookInfo
 from .core.hooks import Hook, ToolApproval, hook
 from .core.llm import LanguageModel
 
@@ -54,6 +54,7 @@
     "ToolApproval",
     "StructuredOutputPart",
     "Checkpoint",
+    "PendingHookInfo",
     # Functions
     "tool",
     "stream",
diff --git a/src/vercel_ai_sdk/ai_sdk_ui/adapter.py b/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
index 9d1b98e2..8c60508f 100644
--- a/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
+++ b/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
@@ -401,6 +401,10 @@ def to_messages(
     ``ToolApproval.resolve()`` so the agent loop can resume execution
     without the caller needing to handle approval routing explicitly.
 
+    When approvals are resolved, the trailing assistant message is
+    automatically stripped.  The checkpoint will replay that step, so
+    including it would send duplicate tool-use content to the LLM.
+
     Args:
         ui_messages: List of UIMessage objects from the AI SDK v6 frontend.
 
@@ -408,6 +412,7 @@ def to_messages(
         List of internal Message objects ready for use with the runtime.
     """
     result: list[core.messages.Message] = []
+    resolved_any_approval = False
 
     for ui_msg in ui_messages:
         internal_parts: list[core.messages.Part] = []
@@ -457,6 +462,7 @@ def to_messages(
                                 "reason": tp.approval.reason,
                             },
                         )
+                        resolved_any_approval = True
 
                 case (
                     ui_message.UIStepStartPart()
@@ -489,6 +495,13 @@ def to_messages(
                 )
             )
 
+    # When resuming from a checkpoint (approvals were resolved above),
+    # the frontend sends the full history including the assistant message
+    # from the interrupted run.  The checkpoint replays that step, so
+    # strip the trailing assistant message to avoid duplicate tool-use.
+    if resolved_any_approval and result and result[-1].role == "assistant":
+        result = result[:-1]
+
     return result
 
 
diff --git a/src/vercel_ai_sdk/core/checkpoint.py b/src/vercel_ai_sdk/core/checkpoint.py
index b49629d3..40499440 100644
--- a/src/vercel_ai_sdk/core/checkpoint.py
+++ b/src/vercel_ai_sdk/core/checkpoint.py
@@ -33,7 +33,16 @@ class HookEvent(pydantic.BaseModel):
     resolution: dict[str, Any]
 
 
+class PendingHookInfo(pydantic.BaseModel):
+    """A hook that was suspended but not resolved when the run ended."""
+
+    label: str  # hook label; run() looks it up among pending resolutions
+    hook_type: str  # hook_type of the pending suspension it was built from
+    metadata: dict[str, Any] = {}  # metadata of that pending suspension
+
+
 class Checkpoint(pydantic.BaseModel):
     steps: list[StepEvent] = []
     tools: list[ToolEvent] = []
     hooks: list[HookEvent] = []
+    pending_hooks: list[PendingHookInfo] = []
diff --git a/src/vercel_ai_sdk/core/runtime.py b/src/vercel_ai_sdk/core/runtime.py
index 5c32114c..bee4e71d 100644
--- a/src/vercel_ai_sdk/core/runtime.py
+++ b/src/vercel_ai_sdk/core/runtime.py
@@ -162,6 +162,14 @@ def get_checkpoint(self) -> checkpoint_.Checkpoint:
             steps=list(self._checkpoint.steps) + self._step_log,
             tools=list(self._checkpoint.tools) + self._tool_log,
             hooks=list(self._checkpoint.hooks) + self._hook_log,
+            pending_hooks=[
+                checkpoint_.PendingHookInfo(
+                    label=sus.label,
+                    hook_type=sus.hook_type,
+                    metadata=sus.metadata,
+                )
+                for sus in self._pending_hooks.values()
+            ],
         )
 
 
@@ -388,8 +396,19 @@ def run(
     """
     result = RunResult()
 
+    # Discard stale checkpoints: if the checkpoint has pending hooks but
+    # none of them have been resolved (via Hook.resolve() / to_messages()),
+    # this isn't a resume — it's a fresh turn with an outdated checkpoint.
+    effective_checkpoint = checkpoint
+    if checkpoint and checkpoint.pending_hooks:
+        has_resolution = any(
+            ph.label in hooks_._pending_resolutions for ph in checkpoint.pending_hooks
+        )
+        if not has_resolution:
+            effective_checkpoint = None
+
     async def _generate() -> AsyncGenerator[messages_.Message]:
-        runtime = Runtime(checkpoint=checkpoint)
+        runtime = Runtime(checkpoint=effective_checkpoint)
         result._runtime = runtime
         token_runtime = _runtime.set(runtime)
         token_run_id = telemetry_.start_run()

From ac417a5e2374e857bacda47326194ee5f1711f97 Mon Sep 17 00:00:00 2001
From: Andrey Buzin <contactbuzin@gmail.com>
Date: Tue, 3 Mar 2026 14:53:01 -0800
Subject: [PATCH 07/10] Add logging for magic checkpoint behaviors

---
 src/vercel_ai_sdk/ai_sdk_ui/adapter.py |  6 +++++
 src/vercel_ai_sdk/core/runtime.py      | 32 +++++++++++++++++++++++---
 2 files changed, 35 insertions(+), 3 deletions(-)

diff --git a/src/vercel_ai_sdk/ai_sdk_ui/adapter.py b/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
index 8c60508f..f39e1fd8 100644
--- a/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
+++ b/src/vercel_ai_sdk/ai_sdk_ui/adapter.py
@@ -6,6 +6,7 @@
 
 import dataclasses
 import json
+import logging
 import uuid
 from collections.abc import AsyncGenerator, AsyncIterable
 from typing import Any, Literal
@@ -14,6 +15,8 @@
 from ..core import hooks
 from . import protocol, ui_message
 
+logger = logging.getLogger(__name__)
+
 # ============================================================================
 # Serialization utilities
 # ============================================================================
@@ -500,6 +503,9 @@ def to_messages(
     # from the interrupted run.  The checkpoint replays that step, so
     # strip the trailing assistant message to avoid duplicate tool-use.
     if resolved_any_approval and result and result[-1].role == "assistant":
+        logger.info(
+            "Stripping trailing assistant message (checkpoint will replay this step)"
+        )
         result = result[:-1]
 
     return result
diff --git a/src/vercel_ai_sdk/core/runtime.py b/src/vercel_ai_sdk/core/runtime.py
index bee4e71d..c5d94a12 100644
--- a/src/vercel_ai_sdk/core/runtime.py
+++ b/src/vercel_ai_sdk/core/runtime.py
@@ -4,11 +4,14 @@
 import contextvars
 import dataclasses
 import json
+import logging
 from collections.abc import AsyncGenerator, Awaitable, Callable, Coroutine, Sequence
 from typing import Any, get_type_hints
 
 import pydantic
 
+logger = logging.getLogger(__name__)
+
 from .. import mcp
 from . import checkpoint as checkpoint_
 from . import hooks as hooks_
@@ -117,6 +120,7 @@ def try_replay_step(self) -> streams_.StreamResult | None:
         if self._step_index < len(self._checkpoint.steps):
             event = self._checkpoint.steps[self._step_index]
             self._step_index += 1
+            logger.info("Replaying step %d from checkpoint", event.index)
             return event.to_stream_result()
         return None
 
@@ -132,7 +136,14 @@ def record_step(self, result: streams_.StreamResult) -> None:
 
     def try_replay_tool(self, tool_call_id: str) -> checkpoint_.ToolEvent | None:
         """Return the cached ToolEvent if available, else None."""
-        return self._tool_replay.get(tool_call_id)
+        event = self._tool_replay.get(tool_call_id)
+        if event is not None:
+            logger.info(
+                "Replaying tool %s (call_id=%s) from checkpoint",
+                event.tool_call_id,
+                tool_call_id,
+            )
+        return event
 
     def record_tool(
         self, tool_call_id: str, result: Any, *, status: str = "result"
@@ -146,7 +157,10 @@ def record_tool(
     # ── Replay / record: hooks ────────────────────────────────────
 
     def get_hook_resolution(self, label: str) -> dict[str, Any] | None:
-        return self._hook_replay.get(label)
+        resolution = self._hook_replay.get(label)
+        if resolution is not None:
+            logger.info("Resolving hook '%s' from checkpoint", label)
+        return resolution
 
     def record_hook(self, label: str, resolution: dict[str, Any]) -> None:
         self._hook_log.append(checkpoint_.HookEvent(label=label, resolution=resolution))
@@ -401,11 +415,23 @@ def run(
     # this isn't a resume — it's a fresh turn with an outdated checkpoint.
     effective_checkpoint = checkpoint
     if checkpoint and checkpoint.pending_hooks:
+        pending_labels = [ph.label for ph in checkpoint.pending_hooks]
         has_resolution = any(
-            ph.label in hooks_._pending_resolutions for ph in checkpoint.pending_hooks
+            label in hooks_._pending_resolutions for label in pending_labels
         )
         if not has_resolution:
+            logger.info(
+                "Discarding stale checkpoint: pending hooks %s have no "
+                "matching resolutions",
+                pending_labels,
+            )
             effective_checkpoint = None
+        else:
+            logger.info(
+                "Resuming from checkpoint with %d pending hook(s): %s",
+                len(pending_labels),
+                pending_labels,
+            )
 
     async def _generate() -> AsyncGenerator[messages_.Message]:
         runtime = Runtime(checkpoint=effective_checkpoint)

From 2922ffcf6206fb1dcfb20b7a10d6ebaec1784de4 Mon Sep 17 00:00:00 2001
From: Andrey Buzin <contactbuzin@gmail.com>
Date: Tue, 3 Mar 2026 14:56:42 -0800
Subject: [PATCH 08/10] Fix lint and type check

---
 src/vercel_ai_sdk/core/runtime.py |  4 ++--
 tests/anthropic/test_anthropic.py | 21 +++++++++++----------
 2 files changed, 13 insertions(+), 12 deletions(-)

diff --git a/src/vercel_ai_sdk/core/runtime.py b/src/vercel_ai_sdk/core/runtime.py
index c5d94a12..2f6ac3e0 100644
--- a/src/vercel_ai_sdk/core/runtime.py
+++ b/src/vercel_ai_sdk/core/runtime.py
@@ -10,8 +10,6 @@
 
 import pydantic
 
-logger = logging.getLogger(__name__)
-
 from .. import mcp
 from . import checkpoint as checkpoint_
 from . import hooks as hooks_
@@ -21,6 +19,8 @@
 from . import telemetry as telemetry_
 from . import tools as tools_
 
+logger = logging.getLogger(__name__)
+
 # ── Queue item types ──────────────────────────────────────────────
 
 
diff --git a/tests/anthropic/test_anthropic.py b/tests/anthropic/test_anthropic.py
index 42127961..53d5d69b 100644
--- a/tests/anthropic/test_anthropic.py
+++ b/tests/anthropic/test_anthropic.py
@@ -1,10 +1,10 @@
 """Anthropic provider: _messages_to_anthropic conversion tests."""
 
 from vercel_ai_sdk.anthropic import _messages_to_anthropic
-from vercel_ai_sdk.core.messages import Message, ReasoningPart, TextPart, ToolPart
+from vercel_ai_sdk.core.messages import Message, TextPart, ToolPart
 
 
-def test_tool_result_none_still_emits_tool_result():
+def test_tool_result_none_still_emits_tool_result() -> None:
     """A tool that returns None must still produce a tool_result block.
 
     Regression: when part.result is None the converter skipped the tool_result,
@@ -26,7 +26,8 @@ def test_tool_result_none_still_emits_tool_result():
 
     # Should have: assistant message with tool_use, then user message with tool_result
     assert len(anthropic_msgs) == 2, (
-        f"Expected 2 messages (assistant + user/tool_result), got {len(anthropic_msgs)}: {anthropic_msgs}"
+        f"Expected 2 messages (assistant + user/tool_result), "
+        f"got {len(anthropic_msgs)}: {anthropic_msgs}"
     )
 
     assistant_msg = anthropic_msgs[0]
@@ -40,7 +41,7 @@ def test_tool_result_none_still_emits_tool_result():
     assert tool_results[0]["tool_use_id"] == "toolu_01abc"
 
 
-def test_tool_with_normal_result():
+def test_tool_with_normal_result() -> None:
     """Baseline: a tool with a normal result produces the correct pair."""
     tool_part = ToolPart(
         tool_call_id="toolu_02xyz",
@@ -59,7 +60,7 @@ def test_tool_with_normal_result():
     assert anthropic_msgs[1]["content"][0]["content"] == "{'temp': 62}"
 
 
-def test_tool_error_produces_tool_result():
+def test_tool_error_produces_tool_result() -> None:
     """Tool errors must also produce a tool_result block (with is_error=True)."""
     tool_part = ToolPart(
         tool_call_id="toolu_03err",
@@ -81,7 +82,7 @@ def test_tool_error_produces_tool_result():
     assert tool_result["content"] == "Connection timeout"
 
 
-def test_multiple_tools_one_returns_none():
+def test_multiple_tools_one_returns_none() -> None:
     """When one of several tools returns None, all must have tool_results."""
     tool_a = ToolPart(
         tool_call_id="toolu_a",
@@ -122,7 +123,7 @@ def test_multiple_tools_one_returns_none():
 # -- Multi-turn: consecutive user messages (tool_result + next user) -------
 
 
-def test_multi_turn_no_consecutive_same_role_messages():
+def test_multi_turn_no_consecutive_same_role_messages() -> None:
     """Multi-turn with tools must not produce consecutive same-role messages.
 
     Regression: when a previous assistant turn includes a tool call (with
@@ -169,7 +170,7 @@ def test_multi_turn_no_consecutive_same_role_messages():
         )
 
 
-def test_multi_turn_tool_result_before_user_merged():
+def test_multi_turn_tool_result_before_user_merged() -> None:
     """When tool_result (user) is followed by a user message, they merge.
 
     The merged user message should contain both the tool_result blocks
@@ -204,7 +205,7 @@ def test_multi_turn_tool_result_before_user_merged():
     assert tool_results[0]["tool_use_id"] == "toolu_01abc"
 
 
-def test_stream_loop_second_iteration_messages():
+def test_stream_loop_second_iteration_messages() -> None:
     """Simulates what stream_loop sends on the 2nd LLM call in a multi-turn.
 
     After the first stream_step returns a tool call, stream_loop appends
@@ -242,7 +243,7 @@ def test_stream_loop_second_iteration_messages():
     assert len(tool_results) == 1
 
 
-def test_pending_tool_does_not_emit_tool_result():
+def test_pending_tool_does_not_emit_tool_result() -> None:
     """A tool with status='pending' must not produce a tool_result block.
 
     When stream_step returns a message mid-stream (before tool execution),

From c8a1292a495e29752cb15d4410a4c46e589b8818 Mon Sep 17 00:00:00 2001
From: Andrey Buzin <contactbuzin@gmail.com>
Date: Tue, 3 Mar 2026 14:58:28 -0800
Subject: [PATCH 09/10] Revert Python deps in the fastapi-vite example

---
 examples/fastapi-vite/backend/pyproject.toml |  5 +-
 examples/fastapi-vite/backend/uv.lock        | 63 ++------------------
 2 files changed, 6 insertions(+), 62 deletions(-)

diff --git a/examples/fastapi-vite/backend/pyproject.toml b/examples/fastapi-vite/backend/pyproject.toml
index a98fb231..3fa5b347 100644
--- a/examples/fastapi-vite/backend/pyproject.toml
+++ b/examples/fastapi-vite/backend/pyproject.toml
@@ -5,9 +5,6 @@ description = "Chat demo using Python Vercel AI SDK with FastAPI"
 requires-python = ">=3.12"
 dependencies = [
     "fastapi[standard]>=0.128.1",
-    "vercel-ai-sdk",
-    # "vercel-ai-sdk>=0.0.1.dev5",
+    "vercel-ai-sdk>=0.0.1.dev5",
 ]
 
-[tool.uv.sources]
-vercel-ai-sdk = { path = "../../.." }
diff --git a/examples/fastapi-vite/backend/uv.lock b/examples/fastapi-vite/backend/uv.lock
index 8075cde9..f27e1630 100644
--- a/examples/fastapi-vite/backend/uv.lock
+++ b/examples/fastapi-vite/backend/uv.lock
@@ -460,18 +460,6 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/0e/61/66938bbb5fc52dbdf84594873d5b51fb1f7c7794e9c0f5bd885f30bc507b/idna-3.11-py3-none-any.whl", hash = "sha256:771a87f49d9defaf64091e6e6fe9c18d4833f140bd19464795bc32d966ca37ea", size = 71008, upload-time = "2025-10-12T14:55:18.883Z" },
 ]
 
-[[package]]
-name = "importlib-metadata"
-version = "8.7.1"
-source = { registry = "https://pypi.org/simple" }
-dependencies = [
-    { name = "zipp" },
-]
-sdist = { url = "https://files.pythonhosted.org/packages/f3/49/3b30cad09e7771a4982d9975a8cbf64f00d4a1ececb53297f1d9a7be1b10/importlib_metadata-8.7.1.tar.gz", hash = "sha256:49fef1ae6440c182052f407c8d34a68f72efc36db9ca90dc0113398f2fdde8bb", size = 57107, upload-time = "2025-12-21T10:00:19.278Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/fa/5e/f8e9a1d23b9c20a551a8a02ea3637b4642e22c2626e3a13a9a29cdea99eb/importlib_metadata-8.7.1-py3-none-any.whl", hash = "sha256:5a1f80bf1daa489495071efbb095d75a634cf28a8bc299581244063b53176151", size = 27865, upload-time = "2025-12-21T10:00:18.329Z" },
-]
-
 [[package]]
 name = "jinja2"
 version = "3.1.6"
@@ -707,19 +695,6 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/b5/a0/cf4297aa51bbc21e83ef0ac018947fa06aea8f2364aad7c96cbf148590e6/openai-2.20.0-py3-none-any.whl", hash = "sha256:38d989c4b1075cd1f76abc68364059d822327cf1a932531d429795f4fc18be99", size = 1098479, upload-time = "2026-02-10T19:02:52.157Z" },
 ]
 
-[[package]]
-name = "opentelemetry-api"
-version = "1.39.1"
-source = { registry = "https://pypi.org/simple" }
-dependencies = [
-    { name = "importlib-metadata" },
-    { name = "typing-extensions" },
-]
-sdist = { url = "https://files.pythonhosted.org/packages/97/b9/3161be15bb8e3ad01be8be5a968a9237c3027c5be504362ff800fca3e442/opentelemetry_api-1.39.1.tar.gz", hash = "sha256:fbde8c80e1b937a2c61f20347e91c0c18a1940cecf012d62e65a7caf08967c9c", size = 65767, upload-time = "2025-12-11T13:32:39.182Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/cf/df/d3f1ddf4bb4cb50ed9b1139cc7b1c54c34a1e7ce8fd1b9a37c0d1551a6bd/opentelemetry_api-1.39.1-py3-none-any.whl", hash = "sha256:2edd8463432a7f8443edce90972169b195e7d6a05500cd29e6d13898187c9950", size = 66356, upload-time = "2025-12-11T13:32:17.304Z" },
-]
-
 [[package]]
 name = "py-ai-fastapi-chat"
 version = "0.1.0"
@@ -732,7 +707,7 @@ dependencies = [
 [package.metadata]
 requires-dist = [
     { name = "fastapi", extras = ["standard"], specifier = ">=0.128.1" },
-    { name = "vercel-ai-sdk", directory = "../../../" },
+    { name = "vercel-ai-sdk", specifier = ">=0.0.1.dev5" },
 ]
 
 [[package]]
@@ -1344,37 +1319,18 @@ wheels = [
 [[package]]
 name = "vercel-ai-sdk"
 version = "0.0.1.dev5"
-source = { directory = "../../../" }
+source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "anthropic" },
     { name = "httpx" },
     { name = "mcp" },
     { name = "openai" },
-    { name = "opentelemetry-api" },
     { name = "pydantic" },
     { name = "vercel" },
 ]
-
-[package.metadata]
-requires-dist = [
-    { name = "anthropic", specifier = ">=0.83.0" },
-    { name = "httpx", specifier = ">=0.28.1" },
-    { name = "mcp", specifier = ">=1.18.0" },
-    { name = "openai", specifier = ">=2.14.0" },
-    { name = "opentelemetry-api", specifier = ">=1.0" },
-    { name = "pydantic", specifier = ">=2.12.5" },
-    { name = "vercel", specifier = ">=0.3.8" },
-]
-
-[package.metadata.requires-dev]
-dev = [
-    { name = "mypy", specifier = ">=1.11" },
-    { name = "opentelemetry-sdk", specifier = ">=1.0" },
-    { name = "pytest", specifier = ">=8.0" },
-    { name = "pytest-asyncio", specifier = ">=0.24" },
-    { name = "python-dotenv", specifier = ">=1.2.1" },
-    { name = "rich", specifier = ">=14.2.0" },
-    { name = "ruff", specifier = ">=0.8" },
+sdist = { url = "https://files.pythonhosted.org/packages/b0/dd/3b399134076883247582af3919d5fbd38c9e270a42005fa27d1472705dd1/vercel_ai_sdk-0.0.1.dev5.tar.gz", hash = "sha256:998814780fc6163000be1b29e48dacbe710adb8a765636867bd6dd5a6b9b41b0", size = 37870, upload-time = "2026-02-25T16:31:01.844Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/c5/7a/f50dd25ed596c07c2222f2abd81c413169534904bfc4e735b1a5e7084870/vercel_ai_sdk-0.0.1.dev5-py3-none-any.whl", hash = "sha256:22de26c8b667738a825f812aa5b7042d741dd905033c16b3515f6123cd220245", size = 50938, upload-time = "2026-02-25T16:31:00.175Z" },
 ]
 
 [[package]]
@@ -1508,12 +1464,3 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/9f/3e/28135a24e384493fa804216b79a6a6759a38cc4ff59118787b9fb693df93/websockets-16.0-cp314-cp314t-win_amd64.whl", hash = "sha256:b14dc141ed6d2dde437cddb216004bcac6a1df0935d79656387bd41632ba0bbd", size = 178531, upload-time = "2026-01-10T09:23:35.016Z" },
     { url = "https://files.pythonhosted.org/packages/6f/28/258ebab549c2bf3e64d2b0217b973467394a9cea8c42f70418ca2c5d0d2e/websockets-16.0-py3-none-any.whl", hash = "sha256:1637db62fad1dc833276dded54215f2c7fa46912301a24bd94d45d46a011ceec", size = 171598, upload-time = "2026-01-10T09:23:45.395Z" },
 ]
-
-[[package]]
-name = "zipp"
-version = "3.23.0"
-source = { registry = "https://pypi.org/simple" }
-sdist = { url = "https://files.pythonhosted.org/packages/e3/02/0f2892c661036d50ede074e376733dca2ae7c6eb617489437771209d4180/zipp-3.23.0.tar.gz", hash = "sha256:a07157588a12518c9d4034df3fbbee09c814741a33ff63c05fa29d26a2404166", size = 25547, upload-time = "2025-06-08T17:06:39.4Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/2e/54/647ade08bf0db230bfea292f893923872fd20be6ac6f53b2b936ba839d75/zipp-3.23.0-py3-none-any.whl", hash = "sha256:071652d6115ed432f5ce1d34c336c0adfd6a884660d1e9712a256d3d3bd4b14e", size = 10276, upload-time = "2025-06-08T17:06:38.034Z" },
-]

From 841876655d507f50790531be63c9699957e77029 Mon Sep 17 00:00:00 2001
From: Andrey Buzin <contactbuzin@gmail.com>
Date: Tue, 3 Mar 2026 15:01:50 -0800
Subject: [PATCH 10/10] Bump the version

---
 pyproject.toml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pyproject.toml b/pyproject.toml
index 12d92534..2e58843b 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "vercel-ai-sdk"
-version = "0.0.1.dev5"
+version = "0.0.1.dev6"
 description = "The AI Toolkit for Python"
 readme = "README.md"
 authors = [