diff --git a/pydantic_ai_slim/pydantic_ai/models/__init__.py b/pydantic_ai_slim/pydantic_ai/models/__init__.py index aef137cc29..aef39920fa 100644 --- a/pydantic_ai_slim/pydantic_ai/models/__init__.py +++ b/pydantic_ai_slim/pydantic_ai/models/__init__.py @@ -545,6 +545,90 @@ def prompted_output_instructions(self) -> str | None: __repr__ = _utils.dataclasses_no_defaults_repr +@dataclass +class _ResolvedToolChoice: + """Provider-agnostic resolved tool choice. + + This is the result of validating and resolving the user's `tool_choice` setting. + Providers should map this to their API-specific format. + """ + + mode: Literal['none', 'auto', 'required', 'specific'] + """The resolved tool choice mode.""" + + tool_names: list[str] = field(default_factory=list) + """For 'specific' mode, the list of tool names to force. Empty for other modes.""" + + def filter_tools( + self, + function_tools: list[ToolDefinition], + output_tools: list[ToolDefinition], + ) -> list[ToolDefinition]: + """Filter tools based on the resolved mode. + + - 'none': only output_tools + - 'required': only function_tools + - 'specific': specified function_tools + output_tools + - 'auto': all tools + """ + if self.mode == 'none': + return list(output_tools) + elif self.mode == 'required': + return list(function_tools) + elif self.mode == 'specific': + allowed = set(self.tool_names) + return [t for t in function_tools if t.name in allowed] + list(output_tools) + else: # 'auto' + return [*function_tools, *output_tools] + + +def _resolve_tool_choice( # pyright: ignore[reportUnusedFunction] + model_settings: ModelSettings | None, + model_request_parameters: ModelRequestParameters, +) -> _ResolvedToolChoice | None: + """Resolve and validate tool_choice from model settings. + + This centralizes the common logic for handling tool_choice across all providers: + - Validates tool names in list[str] against available function_tools + - Returns a provider-agnostic _ResolvedToolChoice for the provider to map to their API format + + Args: + model_settings: The model settings containing tool_choice. + model_request_parameters: The request parameters containing tool definitions. + + Returns: + _ResolvedToolChoice if an explicit tool_choice was provided and validated, + None if tool_choice was not set (provider should use default behavior based on allow_text_output). + + Raises: + UserError: If tool names in list[str] are invalid. + """ + user_tool_choice = (model_settings or {}).get('tool_choice') + + if user_tool_choice is None: + return None + + if user_tool_choice == 'none': + return _ResolvedToolChoice(mode='none') + + if user_tool_choice in ('auto', 'required'): + return _ResolvedToolChoice(mode=user_tool_choice) + + if isinstance(user_tool_choice, list): + if not user_tool_choice: + return _ResolvedToolChoice(mode='none') + function_tool_names = {t.name for t in model_request_parameters.function_tools} + invalid_names = set(user_tool_choice) - function_tool_names + if invalid_names: + raise UserError( + f'Invalid tool names in `tool_choice`: {invalid_names}. 
' + f'Available function tools: {function_tool_names or "none"}' + ) + return _ResolvedToolChoice(mode='specific', tool_names=list(user_tool_choice)) + + return None # pragma: no cover + + class Model(ABC): """Abstract class for a model.""" diff --git a/pydantic_ai_slim/pydantic_ai/models/anthropic.py b/pydantic_ai_slim/pydantic_ai/models/anthropic.py index 2c7ff578d5..cde31928f6 100644 --- a/pydantic_ai_slim/pydantic_ai/models/anthropic.py +++ b/pydantic_ai_slim/pydantic_ai/models/anthropic.py @@ -1,6 +1,7 @@ from __future__ import annotations as _annotations import io +import warnings from collections.abc import AsyncGenerator, AsyncIterable, AsyncIterator from contextlib import asynccontextmanager from dataclasses import dataclass, field, replace @@ -42,7 +43,15 @@ from ..providers.anthropic import AsyncAnthropicClient from ..settings import ModelSettings, merge_model_settings from ..tools import ToolDefinition -from . import Model, ModelRequestParameters, StreamedResponse, check_allow_model_requests, download_item, get_user_agent +from . import ( + Model, + ModelRequestParameters, + StreamedResponse, + _resolve_tool_choice, # pyright: ignore[reportPrivateUsage] + check_allow_model_requests, + download_item, + get_user_agent, +) _FINISH_REASON_MAP: dict[BetaStopReason, FinishReason] = { 'end_turn': 'stop', @@ -386,11 +395,9 @@ async def _messages_create( This is the last step before sending the request to the API. Most preprocessing has happened in `prepare_request()`. """ - tools = self._get_tools(model_request_parameters, model_settings) + tools, tool_choice = self._infer_tool_choice(model_settings, model_request_parameters) tools, mcp_servers, builtin_tool_betas = self._add_builtin_tools(tools, model_request_parameters) - tool_choice = self._infer_tool_choice(tools, model_settings, model_request_parameters) - system_prompt, anthropic_messages = await self._map_message(messages, model_request_parameters, model_settings) self._limit_cache_points(system_prompt, anthropic_messages, tools) output_format = self._native_output_format(model_request_parameters) @@ -474,11 +481,9 @@ async def _messages_count_tokens( raise UserError('AsyncAnthropicBedrock client does not support `count_tokens` api.') # standalone function to make it easier to override - tools = self._get_tools(model_request_parameters, model_settings) + tools, tool_choice = self._infer_tool_choice(model_settings, model_request_parameters) tools, mcp_servers, builtin_tool_betas = self._add_builtin_tools(tools, model_request_parameters) - tool_choice = self._infer_tool_choice(tools, model_settings, model_request_parameters) - system_prompt, anthropic_messages = await self._map_message(messages, model_request_parameters, model_settings) self._limit_cache_points(system_prompt, anthropic_messages, tools) output_format = self._native_output_format(model_request_parameters) @@ -584,22 +589,6 @@ async def _process_streamed_response( _provider_url=self._provider.base_url, ) - def _get_tools( - self, model_request_parameters: ModelRequestParameters, model_settings: AnthropicModelSettings - ) -> list[BetaToolUnionParam]: - tools: list[BetaToolUnionParam] = [ - self._map_tool_definition(r) for r in model_request_parameters.tool_defs.values() - ] - - # Add cache_control to the last tool if enabled - if tools and (cache_tool_defs := model_settings.get('anthropic_cache_tool_definitions')): - # If True, use '5m'; otherwise use the specified ttl value - ttl: Literal['5m', '1h'] = '5m' if cache_tool_defs is True else cache_tool_defs - last_tool 
= tools[-1] - last_tool['cache_control'] = self._build_cache_control(ttl) - - return tools - def _add_builtin_tools( self, tools: list[BetaToolUnionParam], model_request_parameters: ModelRequestParameters ) -> tuple[list[BetaToolUnionParam], list[BetaRequestMCPServerURLDefinitionParam], set[str]]: @@ -663,26 +652,91 @@ def _add_builtin_tools( ) return tools, mcp_servers, beta_features - def _infer_tool_choice( + def _infer_tool_choice( # noqa: C901 self, - tools: list[BetaToolUnionParam], model_settings: AnthropicModelSettings, model_request_parameters: ModelRequestParameters, - ) -> BetaToolChoiceParam | None: - if not tools: - return None + ) -> tuple[list[BetaToolUnionParam], BetaToolChoiceParam | None]: + """Determine which tools to send and the API tool_choice value. + + Returns: + A tuple of (filtered_tools, tool_choice). + """ + thinking_enabled = model_settings.get('anthropic_thinking') is not None + function_tools = model_request_parameters.function_tools + output_tools = model_request_parameters.output_tools + + resolved = _resolve_tool_choice(model_settings, model_request_parameters) + + if resolved is None: + tool_defs_to_send = [*function_tools, *output_tools] else: - tool_choice: BetaToolChoiceParam + tool_defs_to_send = resolved.filter_tools(function_tools, output_tools) + + # Map ToolDefinitions to Anthropic format + tools: list[BetaToolUnionParam] = [self._map_tool_definition(t) for t in tool_defs_to_send] + + # Add cache_control to the last tool if enabled + if tools and (cache_tool_defs := model_settings.get('anthropic_cache_tool_definitions')): + ttl: Literal['5m', '1h'] = '5m' if cache_tool_defs is True else cache_tool_defs + last_tool = tools[-1] + last_tool['cache_control'] = self._build_cache_control(ttl) + + if not tools: + return tools, None + tool_choice: BetaToolChoiceParam + + if resolved is None: if not model_request_parameters.allow_text_output: tool_choice = {'type': 'any'} else: tool_choice = {'type': 'auto'} - if 'parallel_tool_calls' in model_settings: - tool_choice['disable_parallel_tool_use'] = not model_settings['parallel_tool_calls'] + elif resolved.mode == 'auto': + if not model_request_parameters.allow_text_output: + tool_choice = {'type': 'any'} + else: + tool_choice = {'type': 'auto'} + + elif resolved.mode == 'required': + if thinking_enabled: + raise UserError( + "tool_choice='required' is not supported with Anthropic thinking mode. " + 'Use `output_type=NativeOutput(...)` or `PromptedOutput(...)` instead.' + ) + tool_choice = {'type': 'any'} + + elif resolved.mode == 'none': + if len(output_tools) == 1: + tool_choice = {'type': 'tool', 'name': output_tools[0].name} + else: + warnings.warn( + "Anthropic only supports forcing a single tool. Falling back to 'auto' for multiple output tools." + ) + tool_choice = {'type': 'auto'} + + elif resolved.mode == 'specific': + if thinking_enabled: + raise UserError( + 'Forcing specific tools is not supported with Anthropic thinking mode. ' + 'Use `output_type=NativeOutput(...)` or `PromptedOutput(...)` instead.' + ) + if len(resolved.tool_names) == 1: + tool_choice = {'type': 'tool', 'name': resolved.tool_names[0]} + else: + warnings.warn( + "Anthropic only supports forcing a single tool. Falling back to 'any' for multiple specific tools." 
+ ) + tool_choice = {'type': 'any'} + + else: + assert_never(resolved.mode) + + if 'parallel_tool_calls' in model_settings: + tool_choice['disable_parallel_tool_use'] = not model_settings['parallel_tool_calls'] - return tool_choice + return tools, tool_choice async def _map_message( # noqa: C901 self, @@ -887,9 +941,10 @@ async def _map_message( # noqa: C901 system_prompt_parts.insert(0, instructions) system_prompt = '\n\n'.join(system_prompt_parts) + ttl: Literal['5m', '1h'] # Add cache_control to the last message content if anthropic_cache_messages is enabled if anthropic_messages and (cache_messages := model_settings.get('anthropic_cache_messages')): - ttl: Literal['5m', '1h'] = '5m' if cache_messages is True else cache_messages + ttl = '5m' if cache_messages is True else cache_messages m = anthropic_messages[-1] content = m['content'] if isinstance(content, str): @@ -909,7 +964,7 @@ async def _map_message( # noqa: C901 # If anthropic_cache_instructions is enabled, return system prompt as a list with cache_control if system_prompt and (cache_instructions := model_settings.get('anthropic_cache_instructions')): # If True, use '5m'; otherwise use the specified ttl value - ttl: Literal['5m', '1h'] = '5m' if cache_instructions is True else cache_instructions + ttl = '5m' if cache_instructions is True else cache_instructions system_prompt_blocks = [ BetaTextBlockParam( type='text', diff --git a/pydantic_ai_slim/pydantic_ai/models/bedrock.py b/pydantic_ai_slim/pydantic_ai/models/bedrock.py index 1424d2cb58..50a83333a8 100644 --- a/pydantic_ai_slim/pydantic_ai/models/bedrock.py +++ b/pydantic_ai_slim/pydantic_ai/models/bedrock.py @@ -2,6 +2,7 @@ import functools import typing +import warnings from collections.abc import AsyncIterator, Iterable, Iterator, Mapping from contextlib import asynccontextmanager from dataclasses import dataclass, field @@ -41,7 +42,13 @@ ) from pydantic_ai._run_context import RunContext from pydantic_ai.exceptions import ModelAPIError, ModelHTTPError, UserError -from pydantic_ai.models import Model, ModelRequestParameters, StreamedResponse, download_item +from pydantic_ai.models import ( + Model, + ModelRequestParameters, + StreamedResponse, + _resolve_tool_choice, # pyright: ignore[reportPrivateUsage] + download_item, +) from pydantic_ai.providers import Provider, infer_provider from pydantic_ai.providers.bedrock import BEDROCK_GEO_PREFIXES, BedrockModelProfile from pydantic_ai.settings import ModelSettings @@ -254,9 +261,6 @@ def system(self) -> str: """The model provider.""" return self._provider.name - def _get_tools(self, model_request_parameters: ModelRequestParameters) -> list[ToolTypeDef]: - return [self._map_tool_definition(r) for r in model_request_parameters.tool_defs.values()] - @staticmethod def _map_tool_definition(f: ToolDefinition) -> ToolTypeDef: tool_spec: ToolSpecificationTypeDef = {'name': f.name, 'inputSchema': {'json': f.parameters_json_schema}} @@ -422,7 +426,7 @@ async def _messages_create( 'inferenceConfig': inference_config, } - tool_config = self._map_tool_config(model_request_parameters) + tool_config = self._map_tool_config(model_request_parameters, model_settings) if tool_config: params['toolConfig'] = tool_config @@ -478,17 +482,58 @@ def _map_inference_config( return inference_config - def _map_tool_config(self, model_request_parameters: ModelRequestParameters) -> ToolConfigurationTypeDef | None: - tools = self._get_tools(model_request_parameters) - if not tools: + def _map_tool_config( + self, + model_request_parameters: 
ModelRequestParameters, + model_settings: BedrockModelSettings | None, + ) -> ToolConfigurationTypeDef | None: + resolved = _resolve_tool_choice(model_settings, model_request_parameters) + function_tools = model_request_parameters.function_tools + output_tools = model_request_parameters.output_tools + + if resolved is None: + tool_defs_to_send = [*function_tools, *output_tools] + else: + tool_defs_to_send = resolved.filter_tools(function_tools, output_tools) + + if not tool_defs_to_send: return None + tools = [self._map_tool_definition(t) for t in tool_defs_to_send] tool_choice: ToolChoiceTypeDef - if not model_request_parameters.allow_text_output: + + if resolved is None: + # Default behavior: infer from allow_text_output + if not model_request_parameters.allow_text_output: + tool_choice = {'any': {}} + else: + tool_choice = {'auto': {}} + + elif resolved.mode == 'auto': + if not model_request_parameters.allow_text_output: + tool_choice = {'any': {}} + else: + tool_choice = {'auto': {}} + + elif resolved.mode == 'required': tool_choice = {'any': {}} - else: + + elif resolved.mode == 'none': + # We've already filtered to only output tools, use 'auto' to let model choose tool_choice = {'auto': {}} + elif resolved.mode == 'specific': + if not resolved.tool_names: # pragma: no cover + raise RuntimeError('Internal error: resolved.tool_names is empty for specific tool choice.') + if len(resolved.tool_names) == 1: + tool_choice = {'tool': {'name': resolved.tool_names[0]}} + else: + warnings.warn("Bedrock only supports forcing a single tool. Falling back to 'any'.") + tool_choice = {'any': {}} + + else: + assert_never(resolved.mode) + tool_config: ToolConfigurationTypeDef = {'tools': tools} if tool_choice and BedrockModelProfile.from_profile(self.profile).bedrock_supports_tool_choice: tool_config['toolChoice'] = tool_choice diff --git a/pydantic_ai_slim/pydantic_ai/models/google.py b/pydantic_ai_slim/pydantic_ai/models/google.py index bf3ba0206d..0a7458037b 100644 --- a/pydantic_ai_slim/pydantic_ai/models/google.py +++ b/pydantic_ai_slim/pydantic_ai/models/google.py @@ -46,6 +46,7 @@ Model, ModelRequestParameters, StreamedResponse, + _resolve_tool_choice, # pyright: ignore[reportPrivateUsage] check_allow_model_requests, download_item, get_user_agent, @@ -336,16 +337,16 @@ async def request_stream( response = await self._generate_content(messages, True, model_settings, model_request_parameters) yield await self._process_streamed_response(response, model_request_parameters) # type: ignore - def _get_tools( + def _get_builtin_tools( self, model_request_parameters: ModelRequestParameters - ) -> tuple[list[ToolDict] | None, ImageConfigDict | None]: - tools: list[ToolDict] = [ - ToolDict(function_declarations=[_function_declaration_from_tool(t)]) - for t in model_request_parameters.tool_defs.values() - ] + ) -> tuple[list[ToolDict], ImageConfigDict | None]: + """Get Google-specific builtin tools (web search, code execution, etc.). + Returns: + A tuple of (builtin_tools, image_config). + """ + tools: list[ToolDict] = [] image_config: ImageConfigDict | None = None - if model_request_parameters.builtin_tools: if model_request_parameters.function_tools: raise UserError('Google does not support function tools and built-in tools at the same time.') @@ -368,20 +369,82 @@ def _get_tools( raise UserError( f'`{tool.__class__.__name__}` is not supported by `GoogleModel`. If it should be, please file an issue.' 
) - return tools or None, image_config + return tools, image_config def _get_tool_config( - self, model_request_parameters: ModelRequestParameters, tools: list[ToolDict] | None - ) -> ToolConfigDict | None: - if not model_request_parameters.allow_text_output and tools: - names: list[str] = [] - for tool in tools: - for function_declaration in tool.get('function_declarations') or []: - if name := function_declaration.get('name'): # pragma: no branch - names.append(name) - return _tool_config(names) + self, + model_request_parameters: ModelRequestParameters, + model_settings: GoogleModelSettings, + ) -> tuple[list[ToolDict] | None, ToolConfigDict | None, ImageConfigDict | None]: + """Determine which tools to send and the API tool config. + + Returns: + A tuple of (filtered_tools, tool_config, image_config). + """ + function_tools = model_request_parameters.function_tools + output_tools = model_request_parameters.output_tools + builtin_tools, image_config = self._get_builtin_tools(model_request_parameters) + + resolved = _resolve_tool_choice(model_settings, model_request_parameters) + + if resolved is None: + tool_defs_to_send = [*function_tools, *output_tools] else: - return None + tool_defs_to_send = resolved.filter_tools(function_tools, output_tools) + tools: list[ToolDict] = [ + ToolDict(function_declarations=[_function_declaration_from_tool(t)]) for t in tool_defs_to_send + ] + + tools.extend(builtin_tools) + + if not tools: + return None, None, image_config + + tool_config: ToolConfigDict | None + + if resolved is None: + if not model_request_parameters.allow_text_output: + tool_config = ToolConfigDict( + function_calling_config=FunctionCallingConfigDict(mode=FunctionCallingConfigMode.ANY) + ) + else: + tool_config = None + + elif resolved.mode == 'auto': + if not model_request_parameters.allow_text_output: + tool_config = ToolConfigDict( + function_calling_config=FunctionCallingConfigDict(mode=FunctionCallingConfigMode.ANY) + ) + else: + tool_config = ToolConfigDict( + function_calling_config=FunctionCallingConfigDict(mode=FunctionCallingConfigMode.AUTO) + ) + + elif resolved.mode == 'required': + tool_config = ToolConfigDict( + function_calling_config=FunctionCallingConfigDict(mode=FunctionCallingConfigMode.ANY) + ) + + elif resolved.mode == 'none': + tool_config = ToolConfigDict( + function_calling_config=FunctionCallingConfigDict( + mode=FunctionCallingConfigMode.ANY, + allowed_function_names=[t.name for t in output_tools], + ) + ) + + elif resolved.mode == 'specific': + tool_config = ToolConfigDict( + function_calling_config=FunctionCallingConfigDict( + mode=FunctionCallingConfigMode.ANY, + allowed_function_names=resolved.tool_names, + ) + ) + + else: + assert_never(resolved.mode) + + return tools, tool_config, image_config @overload async def _generate_content( @@ -427,7 +490,7 @@ async def _build_content_and_config( model_settings: GoogleModelSettings, model_request_parameters: ModelRequestParameters, ) -> tuple[list[ContentUnionDict], GenerateContentConfigDict]: - tools, image_config = self._get_tools(model_request_parameters) + tools, tool_config, image_config = self._get_tool_config(model_request_parameters, model_settings) if model_request_parameters.function_tools and not self.profile.supports_tools: raise UserError('Tools are not supported by this model.') @@ -446,8 +509,6 @@ async def _build_content_and_config( if not self.profile.supports_json_object_output: raise UserError('JSON output is not supported by this model.') response_mime_type = 'application/json' - - 
tool_config = self._get_tool_config(model_request_parameters, tools) system_instruction, contents = await self._map_messages(messages, model_request_parameters) modalities = [Modality.TEXT.value] @@ -950,12 +1011,6 @@ def _function_declaration_from_tool(tool: ToolDefinition) -> FunctionDeclaration return f -def _tool_config(function_names: list[str]) -> ToolConfigDict: - mode = FunctionCallingConfigMode.ANY - function_calling_config = FunctionCallingConfigDict(mode=mode, allowed_function_names=function_names) - return ToolConfigDict(function_calling_config=function_calling_config) - - def _metadata_as_usage(response: GenerateContentResponse, provider: str, provider_url: str) -> usage.RequestUsage: metadata = response.usage_metadata if metadata is None: diff --git a/pydantic_ai_slim/pydantic_ai/models/groq.py b/pydantic_ai_slim/pydantic_ai/models/groq.py index 780ee0b305..66428bafae 100644 --- a/pydantic_ai_slim/pydantic_ai/models/groq.py +++ b/pydantic_ai_slim/pydantic_ai/models/groq.py @@ -1,5 +1,6 @@ from __future__ import annotations as _annotations +import warnings from collections.abc import AsyncIterable, AsyncIterator, Iterable from contextlib import asynccontextmanager from dataclasses import dataclass, field @@ -47,6 +48,7 @@ Model, ModelRequestParameters, StreamedResponse, + _resolve_tool_choice, # pyright: ignore[reportPrivateUsage] check_allow_model_requests, get_user_agent, ) @@ -56,6 +58,8 @@ from groq.types import chat from groq.types.chat.chat_completion_content_part_image_param import ImageURL from groq.types.chat.chat_completion_message import ExecutedTool + from groq.types.chat.chat_completion_named_tool_choice_param import ChatCompletionNamedToolChoiceParam + from groq.types.chat.chat_completion_tool_choice_option_param import ChatCompletionToolChoiceOptionParam except ImportError as _import_error: raise ImportError( 'Please install `groq` to use the Groq model, ' @@ -263,14 +267,8 @@ async def _completions_create( model_settings: GroqModelSettings, model_request_parameters: ModelRequestParameters, ) -> chat.ChatCompletion | AsyncStream[chat.ChatCompletionChunk]: - tools = self._get_tools(model_request_parameters) + tools, tool_choice = self._get_tool_choice(model_settings, model_request_parameters) tools += self._get_builtin_tools(model_request_parameters) - if not tools: - tool_choice: Literal['none', 'required', 'auto'] | None = None - elif not model_request_parameters.allow_text_output: - tool_choice = 'required' - else: - tool_choice = 'auto' groq_messages = self._map_messages(messages, model_request_parameters) @@ -373,8 +371,67 @@ async def _process_streamed_response( _provider_name=self._provider.name, ) - def _get_tools(self, model_request_parameters: ModelRequestParameters) -> list[chat.ChatCompletionToolParam]: - return [self._map_tool_definition(r) for r in model_request_parameters.tool_defs.values()] + def _get_tool_choice( + self, + model_settings: GroqModelSettings, + model_request_parameters: ModelRequestParameters, + ) -> tuple[list[chat.ChatCompletionToolParam], ChatCompletionToolChoiceOptionParam | None]: + """Determine which tools to send and the API tool_choice value. + + Returns: + A tuple of (filtered_tools, tool_choice). 
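+
+            For example, `tool_choice=['get_weather']` (a hypothetical tool name) is sent as
+            `ChatCompletionNamedToolChoiceParam(type='function', function={'name': 'get_weather'})`,
+            and only that tool (plus any output tools) is included in the request.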
+ """ + function_tools = model_request_parameters.function_tools + output_tools = model_request_parameters.output_tools + + resolved = _resolve_tool_choice(model_settings, model_request_parameters) + + if resolved is None: + tool_defs_to_send = [*function_tools, *output_tools] + else: + tool_defs_to_send = resolved.filter_tools(function_tools, output_tools) + tools: list[chat.ChatCompletionToolParam] = [self._map_tool_definition(t) for t in tool_defs_to_send] + + if not tools: + return tools, None + + tool_choice: ChatCompletionToolChoiceOptionParam + + if resolved is None: + if not model_request_parameters.allow_text_output: + tool_choice = 'required' + else: + tool_choice = 'auto' + + elif resolved.mode == 'auto': + if not model_request_parameters.allow_text_output: + tool_choice = 'required' + else: + tool_choice = 'auto' + + elif resolved.mode == 'required': + tool_choice = 'required' + + elif resolved.mode == 'none': + tool_choice = ChatCompletionNamedToolChoiceParam( + type='function', + function={'name': output_tools[0].name}, + ) + + elif resolved.mode == 'specific': + if len(resolved.tool_names) == 1: + tool_choice = ChatCompletionNamedToolChoiceParam( + type='function', + function={'name': resolved.tool_names[0]}, + ) + else: + warnings.warn("Groq only supports forcing a single tool. Falling back to 'required'.") + tool_choice = 'required' + + else: + assert_never(resolved.mode) + + return tools, tool_choice def _get_builtin_tools( self, model_request_parameters: ModelRequestParameters diff --git a/pydantic_ai_slim/pydantic_ai/models/huggingface.py b/pydantic_ai_slim/pydantic_ai/models/huggingface.py index f439b3ccb6..b29641bafe 100644 --- a/pydantic_ai_slim/pydantic_ai/models/huggingface.py +++ b/pydantic_ai_slim/pydantic_ai/models/huggingface.py @@ -45,6 +45,7 @@ Model, ModelRequestParameters, StreamedResponse, + _resolve_tool_choice, # pyright: ignore[reportPrivateUsage] check_allow_model_requests, ) @@ -52,10 +53,12 @@ import aiohttp from huggingface_hub import ( AsyncInferenceClient, + ChatCompletionInputFunctionName, ChatCompletionInputMessage, ChatCompletionInputMessageChunk, ChatCompletionInputTool, ChatCompletionInputToolCall, + ChatCompletionInputToolChoiceClass, ChatCompletionInputURL, ChatCompletionOutput, ChatCompletionOutputMessage, @@ -220,14 +223,7 @@ async def _completions_create( model_settings: HuggingFaceModelSettings, model_request_parameters: ModelRequestParameters, ) -> ChatCompletionOutput | AsyncIterable[ChatCompletionStreamOutput]: - tools = self._get_tools(model_request_parameters) - - if not tools: - tool_choice: Literal['none', 'required', 'auto'] | None = None - elif not model_request_parameters.allow_text_output: - tool_choice = 'required' - else: - tool_choice = 'auto' + tools, tool_choice = self._get_tool_choice(model_settings, model_request_parameters) if model_request_parameters.builtin_tools: raise UserError('HuggingFace does not support built-in tools') @@ -319,8 +315,63 @@ async def _process_streamed_response( _provider_name=self._provider.name, ) - def _get_tools(self, model_request_parameters: ModelRequestParameters) -> list[ChatCompletionInputTool]: - return [self._map_tool_definition(r) for r in model_request_parameters.tool_defs.values()] + def _get_tool_choice( + self, + model_settings: HuggingFaceModelSettings, + model_request_parameters: ModelRequestParameters, + ) -> tuple[ + list[ChatCompletionInputTool], + Literal['none', 'required', 'auto'] | ChatCompletionInputToolChoiceClass | None, + ]: + """Get tools and tool choice for the 
model. + + Returns a tuple of (tools, tool_choice). + """ + resolved = _resolve_tool_choice(model_settings, model_request_parameters) + function_tools = model_request_parameters.function_tools + output_tools = model_request_parameters.output_tools + + if resolved is None: + tool_defs_to_send = [*function_tools, *output_tools] + else: + tool_defs_to_send = resolved.filter_tools(function_tools, output_tools) + + if not tool_defs_to_send: + return [], None + + tools = [self._map_tool_definition(r) for r in tool_defs_to_send] + tool_choice: Literal['none', 'required', 'auto'] | ChatCompletionInputToolChoiceClass | None + + # Determine tool_choice value + if resolved is None: + # Default behavior: infer from allow_text_output + if not model_request_parameters.allow_text_output: + tool_choice = 'required' + else: + tool_choice = 'auto' + elif resolved.mode == 'auto': + if not model_request_parameters.allow_text_output: + tool_choice = 'required' + else: + tool_choice = 'auto' + elif resolved.mode == 'required': + tool_choice = 'required' + elif resolved.mode == 'none': + tool_choice = ChatCompletionInputToolChoiceClass( + function=ChatCompletionInputFunctionName(name=output_tools[0].name) # pyright: ignore[reportCallIssue] + ) + elif resolved.mode == 'specific': + if len(resolved.tool_names) == 1: + tool_choice = ChatCompletionInputToolChoiceClass( + function=ChatCompletionInputFunctionName(name=resolved.tool_names[0]) # pyright: ignore[reportCallIssue] + ) + else: + # HuggingFace only supports forcing a single tool + tool_choice = 'required' + else: + assert_never(resolved.mode) + + return tools, tool_choice async def _map_messages( self, messages: list[ModelMessage], model_request_parameters: ModelRequestParameters diff --git a/pydantic_ai_slim/pydantic_ai/models/mistral.py b/pydantic_ai_slim/pydantic_ai/models/mistral.py index 2a3752c370..88d3fdb685 100644 --- a/pydantic_ai_slim/pydantic_ai/models/mistral.py +++ b/pydantic_ai_slim/pydantic_ai/models/mistral.py @@ -45,6 +45,7 @@ Model, ModelRequestParameters, StreamedResponse, + _resolve_tool_choice, # pyright: ignore[reportPrivateUsage] check_allow_model_requests, get_user_agent, ) @@ -227,13 +228,15 @@ async def _completions_create( if model_request_parameters.builtin_tools: raise UserError('Mistral does not support built-in tools') + tools, tool_choice = self._get_tool_choice(model_request_parameters, model_settings) + try: response = await self.client.chat.complete_async( model=str(self._model_name), messages=self._map_messages(messages, model_request_parameters), n=1, - tools=self._map_function_and_output_tools_definition(model_request_parameters) or UNSET, - tool_choice=self._get_tool_choice(model_request_parameters), + tools=tools or UNSET, + tool_choice=tool_choice, stream=False, max_tokens=model_settings.get('max_tokens', UNSET), temperature=model_settings.get('temperature', UNSET), @@ -266,14 +269,16 @@ async def _stream_completions_create( if model_request_parameters.builtin_tools: raise UserError('Mistral does not support built-in tools') - if model_request_parameters.function_tools: - # Function Calling + tools, tool_choice = self._get_tool_choice(model_request_parameters, model_settings) + + if tools: + # Function Calling mode (with filtered tools) response = await self.client.chat.stream_async( model=str(self._model_name), messages=mistral_messages, n=1, - tools=self._map_function_and_output_tools_definition(model_request_parameters) or UNSET, - tool_choice=self._get_tool_choice(model_request_parameters), + tools=tools, + 
tool_choice=tool_choice, temperature=model_settings.get('temperature', UNSET), top_p=model_settings.get('top_p', 1), max_tokens=model_settings.get('max_tokens', UNSET), @@ -284,9 +289,9 @@ async def _stream_completions_create( http_headers={'User-Agent': get_user_agent()}, ) - elif model_request_parameters.output_tools: + elif model_request_parameters.output_tools: # pragma: no cover # TODO: Port to native "manual JSON" mode - # Json Mode + # Json Mode (only output tools, no function tools filtered in) parameters_json_schemas = [tool.parameters_json_schema for tool in model_request_parameters.output_tools] user_output_format_message = self._generate_user_output_format(parameters_json_schemas) mistral_messages.append(user_output_format_message) @@ -302,7 +307,7 @@ async def _stream_completions_create( ) else: - # Stream Mode + # Stream Mode (no tools at all) response = await self.client.chat.stream_async( model=str(self._model_name), messages=mistral_messages, @@ -312,37 +317,68 @@ async def _stream_completions_create( assert response, 'A unexpected empty response from Mistral.' return response - def _get_tool_choice(self, model_request_parameters: ModelRequestParameters) -> MistralToolChoiceEnum | None: - """Get tool choice for the model. + def _get_tool_choice( + self, + model_request_parameters: ModelRequestParameters, + model_settings: MistralModelSettings, + ) -> tuple[list[MistralTool] | None, MistralToolChoiceEnum | None]: + """Get tools and tool choice for the model. + + Returns a tuple of (tools, tool_choice): + - tools: List of MistralTool definitions to send, or None if no tools + - tool_choice: "auto", "any", "none", "required", or None + Tool choice semantics: - "auto": Default mode. Model decides if it uses the tool or not. - "any": Select any tool. - "none": Prevents tool use. - "required": Forces tool use. """ - if not model_request_parameters.function_tools and not model_request_parameters.output_tools: - return None - elif not model_request_parameters.allow_text_output: - return 'required' + resolved = _resolve_tool_choice(model_settings, model_request_parameters) + function_tools = model_request_parameters.function_tools + output_tools = model_request_parameters.output_tools + + if resolved is None: + tool_defs_to_send = [*function_tools, *output_tools] else: - return 'auto' + tool_defs_to_send = resolved.filter_tools(function_tools, output_tools) - def _map_function_and_output_tools_definition( - self, model_request_parameters: ModelRequestParameters - ) -> list[MistralTool] | None: - """Map function and output tools to MistralTool format. + if not tool_defs_to_send: + return None, None - Returns None if both function_tools and output_tools are empty. 
- """ tools = [ MistralTool( function=MistralFunction( name=r.name, parameters=r.parameters_json_schema, description=r.description or '' ) ) - for r in model_request_parameters.tool_defs.values() + for r in tool_defs_to_send ] - return tools if tools else None + + # Determine tool_choice value + if resolved is None: + # Default behavior: infer from allow_text_output + if not model_request_parameters.allow_text_output: + tool_choice: MistralToolChoiceEnum = 'required' + else: + tool_choice = 'auto' + elif resolved.mode == 'auto': + if not model_request_parameters.allow_text_output: + tool_choice = 'required' + else: + tool_choice = 'auto' + elif resolved.mode == 'required': + tool_choice = 'required' + elif resolved.mode == 'none': + # We've filtered to output tools only, use 'required' if there are output tools + tool_choice = 'required' if output_tools else 'none' + elif resolved.mode == 'specific': + # Mistral doesn't support specific tool forcing, use 'required' + tool_choice = 'required' + else: + assert_never(resolved.mode) + + return tools, tool_choice def _process_response(self, response: MistralChatCompletionResponse) -> ModelResponse: """Process a non-streamed response, and prepare a message to return.""" diff --git a/pydantic_ai_slim/pydantic_ai/models/openai.py b/pydantic_ai_slim/pydantic_ai/models/openai.py index 61c8df132b..dda658f1f7 100644 --- a/pydantic_ai_slim/pydantic_ai/models/openai.py +++ b/pydantic_ai_slim/pydantic_ai/models/openai.py @@ -52,7 +52,15 @@ from ..providers import Provider, infer_provider from ..settings import ModelSettings from ..tools import ToolDefinition -from . import Model, ModelRequestParameters, StreamedResponse, check_allow_model_requests, download_item, get_user_agent +from . import ( + Model, + ModelRequestParameters, + StreamedResponse, + _resolve_tool_choice, # pyright: ignore[reportPrivateUsage] + check_allow_model_requests, + download_item, + get_user_agent, +) try: from openai import NOT_GIVEN, APIConnectionError, APIStatusError, AsyncOpenAI, AsyncStream @@ -67,6 +75,8 @@ chat_completion_chunk, chat_completion_token_logprob, ) + from openai.types.chat.chat_completion_allowed_tool_choice_param import ChatCompletionAllowedToolChoiceParam + from openai.types.chat.chat_completion_allowed_tools_param import ChatCompletionAllowedToolsParam from openai.types.chat.chat_completion_content_part_image_param import ImageURL from openai.types.chat.chat_completion_content_part_input_audio_param import InputAudio from openai.types.chat.chat_completion_content_part_param import File, FileFile @@ -75,19 +85,24 @@ from openai.types.chat.chat_completion_message_function_tool_call_param import ( ChatCompletionMessageFunctionToolCallParam, ) + from openai.types.chat.chat_completion_named_tool_choice_param import ChatCompletionNamedToolChoiceParam from openai.types.chat.chat_completion_prediction_content_param import ChatCompletionPredictionContentParam + from openai.types.chat.chat_completion_tool_choice_option_param import ChatCompletionToolChoiceOptionParam from openai.types.chat.completion_create_params import ( WebSearchOptions, WebSearchOptionsUserLocation, WebSearchOptionsUserLocationApproximate, ) from openai.types.responses import ComputerToolParam, FileSearchToolParam, WebSearchToolParam + from openai.types.responses.response_create_params import ToolChoice as ResponsesToolChoice from openai.types.responses.response_input_param import FunctionCallOutput, Message from openai.types.responses.response_reasoning_item_param import ( Content as 
ReasoningContent, Summary as ReasoningSummary, ) from openai.types.responses.response_status import ResponseStatus + from openai.types.responses.tool_choice_allowed_param import ToolChoiceAllowedParam + from openai.types.responses.tool_choice_function_param import ToolChoiceFunctionParam from openai.types.shared import ReasoningEffort from openai.types.shared_params import Reasoning except ImportError as _import_error: @@ -535,19 +550,9 @@ async def _completions_create( model_settings: OpenAIChatModelSettings, model_request_parameters: ModelRequestParameters, ) -> chat.ChatCompletion | AsyncStream[ChatCompletionChunk]: - tools = self._get_tools(model_request_parameters) + tools, tool_choice = self._get_tool_choice(model_settings, model_request_parameters) web_search_options = self._get_web_search_options(model_request_parameters) - if not tools: - tool_choice: Literal['none', 'required', 'auto'] | None = None - elif ( - not model_request_parameters.allow_text_output - and OpenAIModelProfile.from_profile(self.profile).openai_supports_tool_choice_required - ): - tool_choice = 'required' - else: - tool_choice = 'auto' - openai_messages = await self._map_messages(messages, model_request_parameters) response_format: chat.completion_create_params.ResponseFormat | None = None @@ -743,8 +748,93 @@ def _streamed_response_cls(self) -> type[OpenAIStreamedResponse]: def _map_usage(self, response: chat.ChatCompletion) -> usage.RequestUsage: return _map_usage(response, self._provider.name, self._provider.base_url, self.model_name) - def _get_tools(self, model_request_parameters: ModelRequestParameters) -> list[chat.ChatCompletionToolParam]: - return [self._map_tool_definition(r) for r in model_request_parameters.tool_defs.values()] + def _get_tool_choice( + self, + model_settings: OpenAIChatModelSettings, + model_request_parameters: ModelRequestParameters, + ) -> tuple[list[chat.ChatCompletionToolParam], ChatCompletionToolChoiceOptionParam | None]: + """Determine which tools to send and the API tool_choice value. + + Returns: + A tuple of (filtered_tools, tool_choice). 
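+
+            For example, `tool_choice=['get_weather']` (a hypothetical tool name) is sent as
+            `ChatCompletionNamedToolChoiceParam(type='function', function={'name': 'get_weather'})`;
+            multiple names fall back to an `allowed_tools` choice.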
+ """ + function_tools = model_request_parameters.function_tools + output_tools = model_request_parameters.output_tools + openai_profile = OpenAIModelProfile.from_profile(self.profile) + + resolved = _resolve_tool_choice(model_settings, model_request_parameters) + + if resolved is None: + tool_defs_to_send = [*function_tools, *output_tools] + else: + tool_defs_to_send = resolved.filter_tools(function_tools, output_tools) + + tools: list[chat.ChatCompletionToolParam] = [self._map_tool_definition(t) for t in tool_defs_to_send] + + if not tools: + return tools, None + + tool_choice: ChatCompletionToolChoiceOptionParam + + if resolved is None: + if not model_request_parameters.allow_text_output and openai_profile.openai_supports_tool_choice_required: + tool_choice = 'required' + else: + tool_choice = 'auto' + + elif resolved.mode == 'auto': + if not model_request_parameters.allow_text_output and openai_profile.openai_supports_tool_choice_required: + tool_choice = 'required' + else: + tool_choice = 'auto' + + elif resolved.mode == 'required': + if openai_profile.openai_supports_tool_choice_required: + tool_choice = 'required' + else: + warnings.warn( + f"tool_choice='required' is not supported by model {self.model_name!r}, falling back to 'auto'", + UserWarning, + stacklevel=6, + ) + tool_choice = 'auto' + + elif resolved.mode == 'none': + if len(output_tools) == 1: + tool_choice = ChatCompletionNamedToolChoiceParam( + type='function', function={'name': output_tools[0].name} + ) + else: + allowed_mode: Literal['auto', 'required'] = ( + 'required' if not model_request_parameters.allow_text_output else 'auto' + ) + tool_choice = ChatCompletionAllowedToolChoiceParam( + type='allowed_tools', + allowed_tools=ChatCompletionAllowedToolsParam( + mode=allowed_mode, + tools=[{'type': 'function', 'function': {'name': t.name}} for t in output_tools], + ), + ) + + elif resolved.mode == 'specific': + if len(resolved.tool_names) == 1: + tool_choice = ChatCompletionNamedToolChoiceParam( + type='function', function={'name': resolved.tool_names[0]} + ) + else: + allowed_mode = 'required' if not model_request_parameters.allow_text_output else 'auto' + tool_choice = ChatCompletionAllowedToolChoiceParam( + type='allowed_tools', + allowed_tools=ChatCompletionAllowedToolsParam( + mode=allowed_mode, + tools=[{'type': 'function', 'function': {'name': n}} for n in resolved.tool_names], + ), + ) + + else: + assert_never(resolved.mode) + + return tools, tool_choice def _get_web_search_options(self, model_request_parameters: ModelRequestParameters) -> WebSearchOptions | None: for tool in model_request_parameters.builtin_tools: @@ -1340,25 +1430,20 @@ async def _responses_create( model_request_parameters: ModelRequestParameters, ) -> AsyncStream[responses.ResponseStreamEvent]: ... 
- async def _responses_create( # noqa: C901 + async def _responses_create( self, messages: list[ModelRequest | ModelResponse], stream: bool, model_settings: OpenAIResponsesModelSettings, model_request_parameters: ModelRequestParameters, ) -> responses.Response | AsyncStream[responses.ResponseStreamEvent]: - tools = ( + function_tools, tool_choice = self._get_responses_tool_choice(model_settings, model_request_parameters) + tools: list[responses.ToolParam] = ( self._get_builtin_tools(model_request_parameters) + list(model_settings.get('openai_builtin_tools', [])) - + self._get_tools(model_request_parameters) + + function_tools ) profile = OpenAIModelProfile.from_profile(self.profile) - if not tools: - tool_choice: Literal['none', 'required', 'auto'] | None = None - elif not model_request_parameters.allow_text_output and profile.openai_supports_tool_choice_required: - tool_choice = 'required' - else: - tool_choice = 'auto' previous_response_id = model_settings.get('openai_previous_response_id') if previous_response_id == 'auto': @@ -1468,8 +1553,82 @@ def _get_reasoning(self, model_settings: OpenAIResponsesModelSettings) -> Reason return OMIT return Reasoning(effort=reasoning_effort, summary=reasoning_summary) - def _get_tools(self, model_request_parameters: ModelRequestParameters) -> list[responses.FunctionToolParam]: - return [self._map_tool_definition(r) for r in model_request_parameters.tool_defs.values()] + def _get_responses_tool_choice( + self, + model_settings: OpenAIResponsesModelSettings, + model_request_parameters: ModelRequestParameters, + ) -> tuple[list[responses.FunctionToolParam], ResponsesToolChoice | None]: + """Determine which tools to send and the API tool_choice value. + + Returns: + A tuple of (filtered_function_tools, tool_choice). + Note: builtin tools are handled separately and should be added to this list. 
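+
+            For example, `tool_choice=['get_weather']` (a hypothetical tool name) is sent as
+            `ToolChoiceFunctionParam(type='function', name='get_weather')`; multiple names map to
+            a `ToolChoiceAllowedParam` with `type='allowed_tools'`.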
+ """ + function_tools = model_request_parameters.function_tools + output_tools = model_request_parameters.output_tools + openai_profile = OpenAIModelProfile.from_profile(self.profile) + + resolved = _resolve_tool_choice(model_settings, model_request_parameters) + + if resolved is None: + tool_defs_to_send = [*function_tools, *output_tools] + else: + tool_defs_to_send = resolved.filter_tools(function_tools, output_tools) + tools: list[responses.FunctionToolParam] = [self._map_tool_definition(t) for t in tool_defs_to_send] + + tool_choice: ResponsesToolChoice | None + + if resolved is None: + if not model_request_parameters.allow_text_output and openai_profile.openai_supports_tool_choice_required: + tool_choice = 'required' + else: + tool_choice = 'auto' + + elif resolved.mode == 'auto': + if not model_request_parameters.allow_text_output and openai_profile.openai_supports_tool_choice_required: + tool_choice = 'required' + else: + tool_choice = 'auto' + + elif resolved.mode == 'required': + if openai_profile.openai_supports_tool_choice_required: + tool_choice = 'required' + else: + warnings.warn( + f"tool_choice='required' is not supported by model {self.model_name!r}, falling back to 'auto'", + UserWarning, + stacklevel=6, + ) + tool_choice = 'auto' + + elif resolved.mode == 'none': + if len(output_tools) == 1: + tool_choice = ToolChoiceFunctionParam(type='function', name=output_tools[0].name) + else: + allowed_mode: Literal['auto', 'required'] = ( + 'required' if not model_request_parameters.allow_text_output else 'auto' + ) + tool_choice = ToolChoiceAllowedParam( + type='allowed_tools', + mode=allowed_mode, + tools=[{'type': 'function', 'name': t.name} for t in output_tools], + ) + + elif resolved.mode == 'specific': + if len(resolved.tool_names) == 1: + tool_choice = ToolChoiceFunctionParam(type='function', name=resolved.tool_names[0]) + else: + allowed_mode = 'required' if not model_request_parameters.allow_text_output else 'auto' + tool_choice = ToolChoiceAllowedParam( + type='allowed_tools', + mode=allowed_mode, + tools=[{'type': 'function', 'name': n} for n in resolved.tool_names], + ) + + else: + assert_never(resolved.mode) + + return tools, tool_choice def _get_builtin_tools(self, model_request_parameters: ModelRequestParameters) -> list[responses.ToolParam]: tools: list[responses.ToolParam] = [] diff --git a/pydantic_ai_slim/pydantic_ai/settings.py b/pydantic_ai_slim/pydantic_ai/settings.py index 6941eb1ab3..dabd4b0333 100644 --- a/pydantic_ai_slim/pydantic_ai/settings.py +++ b/pydantic_ai_slim/pydantic_ai/settings.py @@ -1,5 +1,7 @@ from __future__ import annotations +from typing import Literal + from httpx import Timeout from typing_extensions import TypedDict @@ -7,8 +9,10 @@ class ModelSettings(TypedDict, total=False): """Settings to configure an LLM. - Here we include only settings which apply to multiple models / model providers, + Includes only settings which apply to multiple models / model providers, though not all of these settings are supported by all models. + + All types must be JSON-serializable. """ max_tokens: int @@ -88,6 +92,30 @@ class ModelSettings(TypedDict, total=False): * Anthropic """ + tool_choice: Literal['none', 'required', 'auto'] | list[str] | None + """Control which function tools the model can use. + + This setting affects both which tools are sent to the model and the API tool_choice parameter. + Output tools (used for structured output) are managed separately and remain available when needed. 
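+
+    For example, `model_settings={'tool_choice': ['get_weather']}` restricts the next request to a
+    hypothetical `get_weather` function tool (plus any output tools) and forces the model to call one of them.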
+ + * `None` (default): All tools sent, tool_choice determined by output configuration + * `'auto'`: All tools sent, model decides whether to use them + * `'required'`: Only function tools sent (no output tools), model must use one + * `'none'`: Only output tools sent (no function tools), or no tools if none needed + * `list[str]`: Only specified function tools sent (plus output tools), model must use one + * `[]` (empty list): Treated as `'none'` + + Supported by: + + * OpenAI + * Anthropic (note: `'required'` and specific tools not supported with thinking/extended thinking) + * Gemini + * Groq + * Mistral + * HuggingFace + * Bedrock + """ + seed: int """The random seed to use for the model, theoretically allowing for deterministic results. diff --git a/tests/models/anthropic/cassettes/test_tool_choice/test_tool_choice_auto_live.yaml b/tests/models/anthropic/cassettes/test_tool_choice/test_tool_choice_auto_live.yaml new file mode 100644 index 0000000000..66e668551b --- /dev/null +++ b/tests/models/anthropic/cassettes/test_tool_choice/test_tool_choice_auto_live.yaml @@ -0,0 +1,79 @@ +interactions: +- request: + headers: + accept: + - application/json + accept-encoding: + - gzip, deflate + connection: + - keep-alive + content-length: + - '369' + content-type: + - application/json + host: + - api.anthropic.com + method: POST + parsed_body: + max_tokens: 4096 + messages: + - content: + - text: What is 2+2? + type: text + role: user + model: claude-haiku-4-5 + stream: false + tool_choice: + type: auto + tools: + - description: Get the weather for a city. + input_schema: + additionalProperties: false + properties: + city: + type: string + required: + - city + type: object + name: get_weather + uri: https://api.anthropic.com/v1/messages?beta=true + response: + headers: + connection: + - keep-alive + content-length: + - '521' + content-type: + - application/json + retry-after: + - '14' + strict-transport-security: + - max-age=31536000; includeSubDomains; preload + transfer-encoding: + - chunked + parsed_body: + content: + - text: |- + 2 + 2 = 4 + + This is a simple arithmetic problem. I don't need to use any tools to answer this basic math question. + type: text + id: msg_01MPRAkxA9ciXHJpJwp7Vrd9 + model: claude-haiku-4-5-20251001 + role: assistant + stop_reason: end_turn + stop_sequence: null + type: message + usage: + cache_creation: + ephemeral_1h_input_tokens: 0 + ephemeral_5m_input_tokens: 0 + cache_creation_input_tokens: 0 + cache_read_input_tokens: 0 + input_tokens: 571 + output_tokens: 36 + service_tier: standard + status: + code: 200 + message: OK +version: 1 diff --git a/tests/models/anthropic/cassettes/test_tool_choice/test_tool_choice_none_live.yaml b/tests/models/anthropic/cassettes/test_tool_choice/test_tool_choice_none_live.yaml new file mode 100644 index 0000000000..ab6a9828b4 --- /dev/null +++ b/tests/models/anthropic/cassettes/test_tool_choice/test_tool_choice_none_live.yaml @@ -0,0 +1,79 @@ +interactions: +- request: + headers: + accept: + - application/json + accept-encoding: + - gzip, deflate + connection: + - keep-alive + content-length: + - '369' + content-type: + - application/json + host: + - api.anthropic.com + method: POST + parsed_body: + max_tokens: 4096 + messages: + - content: + - text: What is 2+2? + type: text + role: user + model: claude-haiku-4-5 + stream: false + tool_choice: + type: none + tools: + - description: Get the weather for a city. 
+ input_schema: + additionalProperties: false + properties: + city: + type: string + required: + - city + type: object + name: get_weather + uri: https://api.anthropic.com/v1/messages?beta=true + response: + headers: + connection: + - keep-alive + content-length: + - '480' + content-type: + - application/json + retry-after: + - '45' + strict-transport-security: + - max-age=31536000; includeSubDomains; preload + transfer-encoding: + - chunked + parsed_body: + content: + - text: |- + 2 + 2 = 4 + + This is a simple arithmetic problem. The sum of 2 and 2 is 4. + type: text + id: msg_01SXvsFVTX8YH6EuEmvTgEiW + model: claude-haiku-4-5-20251001 + role: assistant + stop_reason: end_turn + stop_sequence: null + type: message + usage: + cache_creation: + ephemeral_1h_input_tokens: 0 + ephemeral_5m_input_tokens: 0 + cache_creation_input_tokens: 0 + cache_read_input_tokens: 0 + input_tokens: 571 + output_tokens: 35 + service_tier: standard + status: + code: 200 + message: OK +version: 1 diff --git a/tests/models/anthropic/cassettes/test_tool_choice/test_tool_choice_required_live.yaml b/tests/models/anthropic/cassettes/test_tool_choice/test_tool_choice_required_live.yaml new file mode 100644 index 0000000000..3977646c12 --- /dev/null +++ b/tests/models/anthropic/cassettes/test_tool_choice/test_tool_choice_required_live.yaml @@ -0,0 +1,187 @@ +interactions: +- request: + headers: + accept: + - application/json + accept-encoding: + - gzip, deflate + connection: + - keep-alive + content-length: + - '640' + content-type: + - application/json + host: + - api.anthropic.com + method: POST + parsed_body: + max_tokens: 4096 + messages: + - content: + - text: What is the temperature in Paris? Use the weather tool and return the temperature as a number. + type: text + role: user + model: claude-haiku-4-5 + stream: false + tool_choice: + type: any + tools: + - description: Get the weather for a city. + input_schema: + additionalProperties: false + properties: + city: + type: string + required: + - city + type: object + name: get_weather + - description: The final response which ends this conversation + input_schema: + properties: + response: + type: integer + required: + - response + type: object + name: final_result + uri: https://api.anthropic.com/v1/messages?beta=true + response: + headers: + connection: + - keep-alive + content-length: + - '484' + content-type: + - application/json + retry-after: + - '53' + strict-transport-security: + - max-age=31536000; includeSubDomains; preload + transfer-encoding: + - chunked + parsed_body: + content: + - id: toolu_01D3gpU1tfJop7nGMdNfcRsx + input: + city: Paris + name: get_weather + type: tool_use + id: msg_01Fsv9kDABeC5Au7dB6uvE8R + model: claude-haiku-4-5-20251001 + role: assistant + stop_reason: tool_use + stop_sequence: null + type: message + usage: + cache_creation: + ephemeral_1h_input_tokens: 0 + ephemeral_5m_input_tokens: 0 + cache_creation_input_tokens: 0 + cache_read_input_tokens: 0 + input_tokens: 730 + output_tokens: 38 + service_tier: standard + status: + code: 200 + message: OK +- request: + headers: + accept: + - application/json + accept-encoding: + - gzip, deflate + connection: + - keep-alive + content-length: + - '945' + content-type: + - application/json + host: + - api.anthropic.com + method: POST + parsed_body: + max_tokens: 4096 + messages: + - content: + - text: What is the temperature in Paris? Use the weather tool and return the temperature as a number. 
+ type: text + role: user + - content: + - id: toolu_01D3gpU1tfJop7nGMdNfcRsx + input: + city: Paris + name: get_weather + type: tool_use + role: assistant + - content: + - content: The weather in Paris is sunny and 72°F. + is_error: false + tool_use_id: toolu_01D3gpU1tfJop7nGMdNfcRsx + type: tool_result + role: user + model: claude-haiku-4-5 + stream: false + tool_choice: + type: any + tools: + - description: Get the weather for a city. + input_schema: + additionalProperties: false + properties: + city: + type: string + required: + - city + type: object + name: get_weather + - description: The final response which ends this conversation + input_schema: + properties: + response: + type: integer + required: + - response + type: object + name: final_result + uri: https://api.anthropic.com/v1/messages?beta=true + response: + headers: + connection: + - keep-alive + content-length: + - '484' + content-type: + - application/json + retry-after: + - '50' + strict-transport-security: + - max-age=31536000; includeSubDomains; preload + transfer-encoding: + - chunked + parsed_body: + content: + - id: toolu_01Q9UEiNVmpbMtSxtML7zdMo + input: + response: 72 + name: final_result + type: tool_use + id: msg_01AmQc9gZFMuunfaLmVoF5T5 + model: claude-haiku-4-5-20251001 + role: assistant + stop_reason: tool_use + stop_sequence: null + type: message + usage: + cache_creation: + ephemeral_1h_input_tokens: 0 + ephemeral_5m_input_tokens: 0 + cache_creation_input_tokens: 0 + cache_read_input_tokens: 0 + input_tokens: 806 + output_tokens: 38 + service_tier: standard + status: + code: 200 + message: OK +version: 1 diff --git a/tests/models/anthropic/cassettes/test_tool_choice/test_tool_choice_specific_live.yaml b/tests/models/anthropic/cassettes/test_tool_choice/test_tool_choice_specific_live.yaml new file mode 100644 index 0000000000..24d4832a82 --- /dev/null +++ b/tests/models/anthropic/cassettes/test_tool_choice/test_tool_choice_specific_live.yaml @@ -0,0 +1,191 @@ +interactions: +- request: + headers: + accept: + - application/json + accept-encoding: + - gzip, deflate + connection: + - keep-alive + content-length: + - '580' + content-type: + - application/json + host: + - api.anthropic.com + method: POST + parsed_body: + max_tokens: 4096 + messages: + - content: + - text: What is 2+2? + type: text + role: user + model: claude-haiku-4-5 + stream: false + tool_choice: + name: get_weather + type: tool + tools: + - description: Get the weather for a city. + input_schema: + additionalProperties: false + properties: + city: + type: string + required: + - city + type: object + name: get_weather + - description: Get the current time in a city. 
+ input_schema: + additionalProperties: false + properties: + city: + type: string + required: + - city + type: object + name: get_time + uri: https://api.anthropic.com/v1/messages?beta=true + response: + headers: + connection: + - keep-alive + content-length: + - '488' + content-type: + - application/json + retry-after: + - '47' + strict-transport-security: + - max-age=31536000; includeSubDomains; preload + transfer-encoding: + - chunked + parsed_body: + content: + - id: toolu_01GMZox9yeNRGPMasr4G2sb8 + input: + city: + name: get_weather + type: tool_use + id: msg_01DPYqAxNvskqyAt1TodvqCf + model: claude-haiku-4-5-20251001 + role: assistant + stop_reason: tool_use + stop_sequence: null + type: message + usage: + cache_creation: + ephemeral_1h_input_tokens: 0 + ephemeral_5m_input_tokens: 0 + cache_creation_input_tokens: 0 + cache_read_input_tokens: 0 + input_tokens: 730 + output_tokens: 34 + service_tier: standard + status: + code: 200 + message: OK +- request: + headers: + accept: + - application/json + accept-encoding: + - gzip, deflate + connection: + - keep-alive + content-length: + - '893' + content-type: + - application/json + host: + - api.anthropic.com + method: POST + parsed_body: + max_tokens: 4096 + messages: + - content: + - text: What is 2+2? + type: text + role: user + - content: + - id: toolu_01GMZox9yeNRGPMasr4G2sb8 + input: + city: + name: get_weather + type: tool_use + role: assistant + - content: + - content: The weather in is sunny and 72°F. + is_error: false + tool_use_id: toolu_01GMZox9yeNRGPMasr4G2sb8 + type: tool_result + role: user + model: claude-haiku-4-5 + stream: false + tool_choice: + name: get_weather + type: tool + tools: + - description: Get the weather for a city. + input_schema: + additionalProperties: false + properties: + city: + type: string + required: + - city + type: object + name: get_weather + - description: Get the current time in a city. 
+ input_schema: + additionalProperties: false + properties: + city: + type: string + required: + - city + type: object + name: get_time + uri: https://api.anthropic.com/v1/messages?beta=true + response: + headers: + connection: + - keep-alive + content-length: + - '488' + content-type: + - application/json + retry-after: + - '44' + strict-transport-security: + - max-age=31536000; includeSubDomains; preload + transfer-encoding: + - chunked + parsed_body: + content: + - id: toolu_01AuG2J1q864E4YSXa6HUUsh + input: + city: + name: get_weather + type: tool_use + id: msg_012REmAsZn5D4TYHohRmPDGV + model: claude-haiku-4-5-20251001 + role: assistant + stop_reason: tool_use + stop_sequence: null + type: message + usage: + cache_creation: + ephemeral_1h_input_tokens: 0 + ephemeral_5m_input_tokens: 0 + cache_creation_input_tokens: 0 + cache_read_input_tokens: 0 + input_tokens: 810 + output_tokens: 34 + service_tier: standard + status: + code: 200 + message: OK +version: 1 diff --git a/tests/models/anthropic/test_tool_choice.py b/tests/models/anthropic/test_tool_choice.py new file mode 100644 index 0000000000..be9796d788 --- /dev/null +++ b/tests/models/anthropic/test_tool_choice.py @@ -0,0 +1,97 @@ +"""Tests for Anthropic tool_choice setting.""" + +from __future__ import annotations as _annotations + +import pytest + +from pydantic_ai import Agent + +from ...conftest import try_import + +with try_import() as imports_successful: + from pydantic_ai.models.anthropic import AnthropicModel + from pydantic_ai.providers.anthropic import AnthropicProvider + +pytestmark = [ + pytest.mark.skipif(not imports_successful(), reason='anthropic not installed'), + pytest.mark.anyio, + pytest.mark.vcr, +] + + +async def test_tool_choice_auto_live(allow_model_requests: None, anthropic_api_key: str): + """Test tool_choice='auto' allows model to decide whether to use tools.""" + m = AnthropicModel('claude-haiku-4-5', provider=AnthropicProvider(api_key=anthropic_api_key)) + agent = Agent(m) + + @agent.tool_plain + def get_weather(city: str) -> str: + """Get the weather for a city.""" + return f'The weather in {city} is sunny and 72°F.' # pragma: no cover + + result = await agent.run('What is 2+2?', model_settings={'tool_choice': 'auto'}) + assert result.output is not None + assert '4' in result.output + + +async def test_tool_choice_required_live(allow_model_requests: None, anthropic_api_key: str): + """Test tool_choice='required' forces model to use a tool.""" + m = AnthropicModel('claude-haiku-4-5', provider=AnthropicProvider(api_key=anthropic_api_key)) + agent = Agent(m) + + @agent.tool_plain + def get_weather(city: str) -> str: + """Get the weather for a city.""" + return f'The weather in {city} is sunny and 72°F.' + + result = await agent.run( + 'What is the temperature in Paris? Use the weather tool and return the temperature as a number.', + output_type=int, + model_settings={'tool_choice': 'required'}, + ) + assert result.output == 72 + + +async def test_tool_choice_none_live(allow_model_requests: None, anthropic_api_key: str): + """Test tool_choice='none' prevents model from using function tools.""" + m = AnthropicModel('claude-haiku-4-5', provider=AnthropicProvider(api_key=anthropic_api_key)) + agent = Agent(m) + + @agent.tool_plain + def get_weather(city: str) -> str: + """Get the weather for a city.""" + return f'The weather in {city} is sunny and 72°F.' 
# pragma: no cover
+
+    result = await agent.run(
+        'What is 2+2?',
+        model_settings={'tool_choice': 'none'},
+    )
+    assert result.output is not None
+    assert '4' in result.output
+
+
+async def test_tool_choice_specific_live(allow_model_requests: None, anthropic_api_key: str):
+    """Test tool_choice=['tool_name'] forces the model to use the named tool."""
+    from pydantic_ai import UsageLimits
+    from pydantic_ai.exceptions import UsageLimitExceeded
+
+    m = AnthropicModel('claude-haiku-4-5', provider=AnthropicProvider(api_key=anthropic_api_key))
+    agent = Agent(m)
+
+    @agent.tool_plain
+    def get_weather(city: str) -> str:
+        """Get the weather for a city."""
+        return f'The weather in {city} is sunny and 72°F.'
+
+    @agent.tool_plain
+    def get_time(city: str) -> str:
+        """Get the current time in a city."""
+        return f'The time in {city} is 3:00 PM.'  # pragma: no cover
+
+    # The agent is forced to call get_weather on every request, even though it's unrelated
+    # to the prompt, so it can never produce a final response and the request limit is hit.
+    with pytest.raises(UsageLimitExceeded):
+        await agent.run(
+            'What is 2+2?',
+            model_settings={'tool_choice': ['get_weather']},
+            usage_limits=UsageLimits(request_limit=2),
+        )
diff --git a/tests/models/cassettes/test_anthropic/test_anthropic_web_fetch_tool.yaml b/tests/models/cassettes/test_anthropic/test_anthropic_web_fetch_tool.yaml
index 2992be928b..f25007369b 100644
--- a/tests/models/cassettes/test_anthropic/test_anthropic_web_fetch_tool.yaml
+++ b/tests/models/cassettes/test_anthropic/test_anthropic_web_fetch_tool.yaml
@@ -42,24 +42,23 @@ interactions:
      connection:
      - keep-alive
      content-length:
-      - '21807'
+      - '34284'
      content-type:
      - application/json
      retry-after:
-      - '39'
+      - '52'
      strict-transport-security:
      - max-age=31536000; includeSubDomains; preload
      transfer-encoding:
      - chunked
    parsed_body:
      content:
-      - signature: EsIDCkYICRgCKkAKi/j4a8lGN12CjyS27ZXcPkXHGyTbn1vJENJz+AjinyTnsrynMEhidWT5IMNAs0TDgwSwPLNmgq4MsPkVekB8EgxetaK+Nhg8wUdhTEAaDMukODgr3JaYHZwVEiIwgKBckFLJ/C7wCD9oGCIECbqpaeEuWQ8BH3Hev6wpuc+66Wu7AJM1jGH60BpsUovnKqkCrHNq6b1SDT41cm2w7cyxZggrX6crzYh0fAkZ+VC6FBjy6mJikZtX6reKD+064KZ4F1oe4Qd40EBp/wHvD7oPV/fhGut1fzwl48ZgB8uzJb3tHr9MBjs4PVTsvKstpHKpOo6NLvCknQJ/0730OTENp/JOR6h6RUl6kMl5OrHTvsDEYpselUBPtLikm9p4t+d8CxqGm/B1kg1wN3FGJK31PD3veYIOO4hBirFPXWd+AiB1rZP++2QjToZ9lD2xqP/Q3vWEU+/Ryp6uzaRFWPVQkIr+mzpIaJsYuKDiyduxF4LD/hdMTV7IVDtconeQIPQJRhuO6nICBEuqb0uIotPDnCU6iI2l9OyEeKJM0RS6/NTNG8DZnvyVJ8gGKbtZKSHK6KKsdH0f7d+DGAE=
-        thinking: |-
-          The user is asking me to fetch the content from https://ai.pydantic.dev and return only the first sentence on that page. I need to use the web_fetch tool to get the content from this URL, then identify the first sentence and return only that sentence.
-
-          Let me fetch the page first.
+      - signature: EooDCkYIChgCKkBe6ddqCwT1CKptPg14EIIaDdq/qCKZucUmb9w4ci/O5pSzheW3Vv33pkeqmFPrcr4l5CWAVM/xaV7NjHNwOPohEgza8xxqBGZ7jds5BzMaDFyd3dP3X5SSgPSg7SIwfyJLZ+yYCfCrpsgV77T7Ay6iBvfLp0ZaSb+ph+2YkSSVAxFDodWxWyv5DiVHRLJnKvEBcESvFzbas8bML22jelhD1nxGiyr6GGBCjavRGaz6LpPExc03FEa9qS0YEvAniVkVxLJprdDcW4Sm2/lLTh6TRiiicyELomVYxI4FrK1R981pA9ZdDgP8iE3YmcvhvvVJpxgUK+6Tr0LJSq5GgnlcPVEcXc+PYzqLNwlHiH+Vm9bPVs/N/JhfYBPKKREWgtXQBvpsxDM8f5Rj6569D7K3oKZ7Dbglc8eWyn1KFYHV4R+sXc4XOHJDPWuEjgW5/aYUfnP5yDlscfTHDgfrZVy7se8rjgtnpwLNstk7GbLUzgIft6p7hTTUIGB7icopfZtoahgB
+        thinking: The user wants me to fetch the content from https://ai.pydantic.dev and return only the first sentence.
+          I need to use the web_fetch tool to get the content from this URL, then identify the first sentence and return
+          only that.
type: thinking - - id: srvtoolu_01So85wNUocinTvFfgKCfQeb + - id: srvtoolu_01MSZmtbzt6NmQizTETf3GPF input: url: https://ai.pydantic.dev name: web_fetch @@ -67,300 +66,291 @@ interactions: - content: content: source: - data: |- - Pydantic AI - GenAI Agent Framework, the Pydantic way - Pydantic AI is a Python agent framework designed to help you quickly, confidently, and painlessly build production grade applications and workflows with Generative AI. - FastAPI revolutionized web development by offering an innovative and ergonomic design, built on the foundation of [Pydantic Validation](https://docs.pydantic.dev) and modern Python features like type hints. - Yet despite virtually every Python agent framework and LLM library using Pydantic Validation, when we began to use LLMs in [Pydantic Logfire](https://pydantic.dev/logfire), we couldn't find anything that gave us the same feeling. - We built Pydantic AI with one simple aim: to bring that FastAPI feeling to GenAI app and agent development. - Why use Pydantic AI - - - Built by the Pydantic Team: - [Pydantic Validation](https://docs.pydantic.dev/latest/)is the validation layer of the OpenAI SDK, the Google ADK, the Anthropic SDK, LangChain, LlamaIndex, AutoGPT, Transformers, CrewAI, Instructor and many more. Why use the derivative when you can go straight to the source? - - Model-agnostic: Supports virtually every - [model](models/overview/)and provider: OpenAI, Anthropic, Gemini, DeepSeek, Grok, Cohere, Mistral, and Perplexity; Azure AI Foundry, Amazon Bedrock, Google Vertex AI, Ollama, LiteLLM, Groq, OpenRouter, Together AI, Fireworks AI, Cerebras, Hugging Face, GitHub, Heroku, Vercel, Nebius, OVHcloud, and Outlines. If your favorite model or provider is not listed, you can easily implement a[custom model](models/overview/#custom-models). - - Seamless Observability: Tightly - [integrates](logfire/)with[Pydantic Logfire](https://pydantic.dev/logfire), our general-purpose OpenTelemetry observability platform, for real-time debugging, evals-based performance monitoring, and behavior, tracing, and cost tracking. If you already have an observability platform that supports OTel, you can[use that too](logfire/#alternative-observability-backends). - - Fully Type-safe: Designed to give your IDE or AI coding agent as much context as possible for auto-completion and - [type checking](agents/#static-type-checking), moving entire classes of errors from runtime to write-time for a bit of that Rust "if it compiles, it works" feel. - - Powerful Evals: Enables you to systematically test and - [evaluate](evals/)the performance and accuracy of the agentic systems you build, and monitor the performance over time in Pydantic Logfire. - - MCP, A2A, and UI: Integrates the - [Model Context Protocol](mcp/overview/),[Agent2Agent](a2a/), and various[UI event stream](ui/overview/)standards to give your agent access to external tools and data, let it interoperate with other agents, and build interactive applications with streaming event-based communication. - - Human-in-the-Loop Tool Approval: Easily lets you flag that certain tool calls - [require approval](deferred-tools/#human-in-the-loop-tool-approval)before they can proceed, possibly depending on tool call arguments, conversation history, or user preferences. 
- - Durable Execution: Enables you to build - [durable agents](durable_execution/overview/)that can preserve their progress across transient API failures and application errors or restarts, and handle long-running, asynchronous, and human-in-the-loop workflows with production-grade reliability. - - Streamed Outputs: Provides the ability to - [stream](output/#streamed-results)structured output continuously, with immediate validation, ensuring real time access to generated data. - - Graph Support: Provides a powerful way to define - [graphs](graph/)using type hints, for use in complex applications where standard control flow can degrade to spaghetti code. - Realistically though, no list is going to be as convincing as [giving it a try](#next-steps) and seeing how it makes you feel! - Sign up for our newsletter, The Pydantic Stack, with updates & tutorials on Pydantic AI, Logfire, and Pydantic: - Hello World Example - Here's a minimal example of Pydantic AI: - [Learn about Gateway](gateway)hello_world.py - from pydantic_ai import Agent - agent = Agent( # (1)! - 'gateway/anthropic:claude-sonnet-4-0', - instructions='Be concise, reply with one sentence.', # (2)! - ) - result = agent.run_sync('Where does "hello world" come from?') # (3)! - print(result.output) - """ - The first known use of "hello, world" was in a 1974 textbook about the C programming language. - """ - - We configure the agent to use - [Anthropic's Claude Sonnet 4.0](api/models/anthropic/)model, but you can also set the model when running the agent. - Register static - [instructions](agents/#instructions)using a keyword argument to the agent. [Run the agent](agents/#running-agents)synchronously, starting a conversation with the LLM. - from pydantic_ai import Agent - agent = Agent( # (1)! - 'anthropic:claude-sonnet-4-0', - instructions='Be concise, reply with one sentence.', # (2)! - ) - result = agent.run_sync('Where does "hello world" come from?') # (3)! - print(result.output) - """ - The first known use of "hello, world" was in a 1974 textbook about the C programming language. - """ - - We configure the agent to use - [Anthropic's Claude Sonnet 4.0](api/models/anthropic/)model, but you can also set the model when running the agent. - Register static - [instructions](agents/#instructions)using a keyword argument to the agent. [Run the agent](agents/#running-agents)synchronously, starting a conversation with the LLM. - (This example is complete, it can be run "as is", assuming you've [installed the pydantic_ai package](install/)) - The exchange will be very short: Pydantic AI will send the instructions and the user prompt to the LLM, and the model will return a text response. - Not very interesting yet, but we can easily add [tools](tools/), [dynamic instructions](agents/#instructions), and [structured outputs](output/) to build more powerful agents. - Tools & Dependency Injection Example - Here is a concise example using Pydantic AI to build a support agent for a bank: - [Learn about Gateway](gateway)bank_support.py - from dataclasses import dataclass - from pydantic import BaseModel, Field - from pydantic_ai import Agent, RunContext - from bank_database import DatabaseConn - @dataclass - class SupportDependencies: # (3)! - customer_id: int - db: DatabaseConn # (12)! - class SupportOutput(BaseModel): # (13)! 
- support_advice: str = Field(description='Advice returned to the customer') - block_card: bool = Field(description="Whether to block the customer's card") - risk: int = Field(description='Risk level of query', ge=0, le=10) - support_agent = Agent( # (1)! - 'gateway/openai:gpt-5', # (2)! - deps_type=SupportDependencies, - output_type=SupportOutput, # (9)! - instructions=( # (4)! - 'You are a support agent in our bank, give the ' - 'customer support and judge the risk level of their query.' - ), - ) - @support_agent.instructions # (5)! - async def add_customer_name(ctx: RunContext[SupportDependencies]) -> str: - customer_name = await ctx.deps.db.customer_name(id=ctx.deps.customer_id) - return f"The customer's name is {customer_name!r}" - @support_agent.tool # (6)! - async def customer_balance( - ctx: RunContext[SupportDependencies], include_pending: bool - ) -> float: - """Returns the customer's current account balance.""" # (7)! - return await ctx.deps.db.customer_balance( - id=ctx.deps.customer_id, - include_pending=include_pending, - ) - ... # (11)! - async def main(): - deps = SupportDependencies(customer_id=123, db=DatabaseConn()) - result = await support_agent.run('What is my balance?', deps=deps) # (8)! - print(result.output) # (10)! - """ - support_advice='Hello John, your current account balance, including pending transactions, is $123.45.' block_card=False risk=1 - """ - result = await support_agent.run('I just lost my card!', deps=deps) - print(result.output) - """ - support_advice="I'm sorry to hear that, John. We are temporarily blocking your card to prevent unauthorized transactions." block_card=True risk=8 - """ - - This - [agent](agents/)will act as first-tier support in a bank. Agents are generic in the type of dependencies they accept and the type of output they return. In this case, the support agent has typeAgent[SupportDependencies, SupportOutput] - . - Here we configure the agent to use - [OpenAI's GPT-5 model](api/models/openai/), you can also set the model when running the agent. - The - SupportDependencies - dataclass is used to pass data, connections, and logic into the model that will be needed when running[instructions](agents/#instructions)and[tool](tools/)functions. Pydantic AI's system of dependency injection provides a[type-safe](agents/#static-type-checking)way to customise the behavior of your agents, and can be especially useful when running[unit tests](testing/)and evals. - Static - [instructions](agents/#instructions)can be registered with theto the agent.instructions - keyword argument - Dynamic - [instructions](agents/#instructions)can be registered with thedecorator, and can make use of dependency injection. Dependencies are carried via the@agent.instructions - argument, which is parameterized with theRunContext - deps_type - from above. If the type annotation here is wrong, static type checkers will catch it. - The - decorator let you register functions which the LLM may call while responding to a user. Again, dependencies are carried via@agent.tool - , any other arguments become the tool schema passed to the LLM. Pydantic is used to validate these arguments, and errors are passed back to the LLM so it can retry.RunContext - - The docstring of a tool is also passed to the LLM as the description of the tool. Parameter descriptions are - [extracted](tools/#function-tools-and-schema)from the docstring and added to the parameter schema sent to the LLM. 
[Run the agent](agents/#running-agents)asynchronously, conducting a conversation with the LLM until a final response is reached. Even in this fairly simple case, the agent will exchange multiple messages with the LLM as tools are called to retrieve an output.- The response from the agent will be guaranteed to be a - SupportOutput - . If validation fails[reflection](agents/#reflection-and-self-correction), the agent is prompted to try again. - The output will be validated with Pydantic to guarantee it is a - SupportOutput - , since the agent is generic, it'll also be typed as aSupportOutput - to aid with static type checking. - In a real use case, you'd add more tools and longer instructions to the agent to extend the context it's equipped with and support it can provide. - - This is a simple sketch of a database connection, used to keep the example short and readable. In reality, you'd be connecting to an external database (e.g. PostgreSQL) to get information about customers. - - This - [Pydantic](https://docs.pydantic.dev)model is used to constrain the structured data returned by the agent. From this simple definition, Pydantic builds the JSON Schema that tells the LLM how to return the data, and performs validation to guarantee the data is correct at the end of the run. - from dataclasses import dataclass - from pydantic import BaseModel, Field - from pydantic_ai import Agent, RunContext - from bank_database import DatabaseConn - @dataclass - class SupportDependencies: # (3)! - customer_id: int - db: DatabaseConn # (12)! - class SupportOutput(BaseModel): # (13)! - support_advice: str = Field(description='Advice returned to the customer') - block_card: bool = Field(description="Whether to block the customer's card") - risk: int = Field(description='Risk level of query', ge=0, le=10) - support_agent = Agent( # (1)! - 'openai:gpt-5', # (2)! - deps_type=SupportDependencies, - output_type=SupportOutput, # (9)! - instructions=( # (4)! - 'You are a support agent in our bank, give the ' - 'customer support and judge the risk level of their query.' - ), - ) - @support_agent.instructions # (5)! - async def add_customer_name(ctx: RunContext[SupportDependencies]) -> str: - customer_name = await ctx.deps.db.customer_name(id=ctx.deps.customer_id) - return f"The customer's name is {customer_name!r}" - @support_agent.tool # (6)! - async def customer_balance( - ctx: RunContext[SupportDependencies], include_pending: bool - ) -> float: - """Returns the customer's current account balance.""" # (7)! - return await ctx.deps.db.customer_balance( - id=ctx.deps.customer_id, - include_pending=include_pending, - ) - ... # (11)! - async def main(): - deps = SupportDependencies(customer_id=123, db=DatabaseConn()) - result = await support_agent.run('What is my balance?', deps=deps) # (8)! - print(result.output) # (10)! - """ - support_advice='Hello John, your current account balance, including pending transactions, is $123.45.' block_card=False risk=1 - """ - result = await support_agent.run('I just lost my card!', deps=deps) - print(result.output) - """ - support_advice="I'm sorry to hear that, John. We are temporarily blocking your card to prevent unauthorized transactions." block_card=True risk=8 - """ - - This - [agent](agents/)will act as first-tier support in a bank. Agents are generic in the type of dependencies they accept and the type of output they return. In this case, the support agent has typeAgent[SupportDependencies, SupportOutput] - . 
- Here we configure the agent to use - [OpenAI's GPT-5 model](api/models/openai/), you can also set the model when running the agent. - The - SupportDependencies - dataclass is used to pass data, connections, and logic into the model that will be needed when running[instructions](agents/#instructions)and[tool](tools/)functions. Pydantic AI's system of dependency injection provides a[type-safe](agents/#static-type-checking)way to customise the behavior of your agents, and can be especially useful when running[unit tests](testing/)and evals. - Static - [instructions](agents/#instructions)can be registered with theto the agent.instructions - keyword argument - Dynamic - [instructions](agents/#instructions)can be registered with thedecorator, and can make use of dependency injection. Dependencies are carried via the@agent.instructions - argument, which is parameterized with theRunContext - deps_type - from above. If the type annotation here is wrong, static type checkers will catch it. - The - decorator let you register functions which the LLM may call while responding to a user. Again, dependencies are carried via@agent.tool - , any other arguments become the tool schema passed to the LLM. Pydantic is used to validate these arguments, and errors are passed back to the LLM so it can retry.RunContext - - The docstring of a tool is also passed to the LLM as the description of the tool. Parameter descriptions are - [extracted](tools/#function-tools-and-schema)from the docstring and added to the parameter schema sent to the LLM. [Run the agent](agents/#running-agents)asynchronously, conducting a conversation with the LLM until a final response is reached. Even in this fairly simple case, the agent will exchange multiple messages with the LLM as tools are called to retrieve an output.- The response from the agent will be guaranteed to be a - SupportOutput - . If validation fails[reflection](agents/#reflection-and-self-correction), the agent is prompted to try again. - The output will be validated with Pydantic to guarantee it is a - SupportOutput - , since the agent is generic, it'll also be typed as aSupportOutput - to aid with static type checking. - In a real use case, you'd add more tools and longer instructions to the agent to extend the context it's equipped with and support it can provide. - - This is a simple sketch of a database connection, used to keep the example short and readable. In reality, you'd be connecting to an external database (e.g. PostgreSQL) to get information about customers. - - This - [Pydantic](https://docs.pydantic.dev)model is used to constrain the structured data returned by the agent. From this simple definition, Pydantic builds the JSON Schema that tells the LLM how to return the data, and performs validation to guarantee the data is correct at the end of the run. - Complete bank_support.py - example - The code included here is incomplete for the sake of brevity (the definition of DatabaseConn - is missing); you can find the complete bank_support.py - example [here](examples/bank-support/). - Instrumentation with Pydantic Logfire - Even a simple agent with just a handful of tools can result in a lot of back-and-forth with the LLM, making it nearly impossible to be confident of what's going on just from reading the code. To understand the flow of the above runs, we can watch the agent in action using Pydantic Logfire. 
- To do this, we need to [set up Logfire](logfire/#using-logfire), and add the following to our code: - [Learn about Gateway](gateway)bank_support_with_logfire.py - ... - from pydantic_ai import Agent, RunContext - from bank_database import DatabaseConn - import logfire - logfire.configure() # (1)! - logfire.instrument_pydantic_ai() # (2)! - logfire.instrument_asyncpg() # (3)! - ... - support_agent = Agent( - 'gateway/openai:gpt-5', - deps_type=SupportDependencies, - output_type=SupportOutput, - system_prompt=( - 'You are a support agent in our bank, give the ' - 'customer support and judge the risk level of their query.' - ), - ) - - Configure the Logfire SDK, this will fail if project is not set up. - - This will instrument all Pydantic AI agents used from here on out. If you want to instrument only a specific agent, you can pass the - to the agent.instrument=True - keyword argument - In our demo, - DatabaseConn - usesto connect to a PostgreSQL database, soasyncpg - is used to log the database queries.logfire.instrument_asyncpg() - ... - from pydantic_ai import Agent, RunContext - from bank_database import DatabaseConn - import logfire - logfire.configure() # (1)! - logfire.instrument_pydantic_ai() # (2)! - logfire.instrument_asyncpg() # (3)! - ... - support_agent = Agent( - 'openai:gpt-5', - deps_type=SupportDependencies, - output_type=SupportOutput, - system_prompt=( - 'You are a support agent in our bank, give the ' - 'customer support and judge the risk level of their query.' - ), - ) - - Configure the Logfire SDK, this will fail if project is not set up. - - This will instrument all Pydantic AI agents used from here on out. If you want to instrument only a specific agent, you can pass the - to the agent.instrument=True - keyword argument - In our demo, - DatabaseConn - usesto connect to a PostgreSQL database, soasyncpg - is used to log the database queries.logfire.instrument_asyncpg() - That's enough to get the following view of your agent in action: - See [Monitoring and Performance](logfire/) to learn more. - llms.txt - The Pydantic AI documentation is available in the [llms.txt](https://llmstxt.org/) format. - This format is defined in Markdown and suited for LLMs and AI coding assistants and agents. - Two formats are available: - : a file containing a brief description of the project, along with links to the different sections of the documentation. The structure of this file is described in detailsllms.txt - [here](https://llmstxt.org/#format).: Similar to thellms-full.txt - llms.txt - file, but every link content is included. Note that this file may be too large for some LLMs. - As of today, these files are not automatically leveraged by IDEs or coding agents, but they will use it if you provide a link or the full text. - Next Steps - To try Pydantic AI for yourself, [install it](install/) and follow the instructions [in the examples](examples/setup/). - Read the [docs](agents/) to learn more about building applications with Pydantic AI. - Read the [API Reference](api/agent/) to understand Pydantic AI's interface. - Join [ Slack](https://logfire.pydantic.dev/docs/join-slack/) or file an issue on [ GitHub](https://github.com/pydantic/pydantic-ai/issues) if you have any questions. + data: "Pydantic AI\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n \n\n\n\n\n\n[Skip to content](#pydantic-ai)\n\n**[Pydantic + AI Gateway](/gateway) is now available! 
\U0001F680\nEnterprise-ready AI model routing: One key for all your + models with real-time monitoring and budget control that works.**\n\n[![logo](img/logo-white.svg)](. \"Pydantic + AI\")\n\n\n\n\nPydantic AI\n\nPydantic AI\n\n\n\n\n\n\n\nType to start searching\n\n[pydantic/pydantic-ai](https://github.com/pydantic/pydantic-ai + \"Go to repository\")\n\n[![logo](img/logo-white.svg)](. \"Pydantic AI\")\nPydantic AI\n\n[pydantic/pydantic-ai](https://github.com/pydantic/pydantic-ai + \"Go to repository\")\n\n* Pydantic AI\n\n [Pydantic AI](.)\n\n\n\n Table of contents\n + [Why use Pydantic + AI](#why-use-pydantic-ai)\n + [Hello World Example](#hello-world-example)\n + [Tools & Dependency Injection + Example](#tools-dependency-injection-example)\n + [Instrumentation with Pydantic Logfire](#instrumentation-with-pydantic-logfire)\n + \ + [llms.txt](#llmstxt)\n + [Next Steps](#next-steps)\n* [Installation](install/)\n* [Getting Help](help/)\n* + [Troubleshooting](troubleshooting/)\n* [Pydantic AI Gateway](gateway/)\n* Documentation\n\n\n\n\n Documentation\n + \ + Core Concepts\n\n\n\n\n Core Concepts\n - [Agents](agents/)\n - [Dependencies](dependencies/)\n + \ - [Function Tools](tools/)\n - [Output](output/)\n - [Messages and chat history](message-history/)\n + \ - [Direct Model Requests](direct/)\n + Models & Providers\n\n\n\n\n Models & Providers\n - [Overview](models/overview/)\n + \ - [OpenAI](models/openai/)\n - [Anthropic](models/anthropic/)\n - [Google](models/google/)\n - + [Bedrock](models/bedrock/)\n - [Cohere](models/cohere/)\n - [Groq](models/groq/)\n - [Hugging Face](models/huggingface/)\n + \ - [Mistral](models/mistral/)\n - [OpenRouter](models/openrouter/)\n - [Outlines](models/outlines/)\n + \ + Tools & Toolsets\n\n\n\n\n Tools & Toolsets\n - [Function Tools](tools/)\n - [Advanced Tool Features](tools-advanced/)\n + \ - [Toolsets](toolsets/)\n - [Deferred Tools](deferred-tools/)\n - [Built-in Tools](builtin-tools/)\n + \ - [Common Tools](common-tools/)\n - [Third-Party Tools](third-party-tools/)\n + Advanced Features\n\n\n\n\n + \ Advanced Features\n - [Image, Audio, Video & Document Input](input/)\n - [Thinking](thinking/)\n + \ - [HTTP Request Retries](retries/)\n + MCP\n\n\n\n\n MCP\n - [Overview](mcp/overview/)\n - [Client](mcp/client/)\n + \ - [FastMCP Client](mcp/fastmcp-client/)\n - [Server](mcp/server/)\n + [Multi-Agent Patterns](multi-agent-applications/)\n + \ + [Testing](testing/)\n* Pydantic Evals\n\n\n\n\n Pydantic Evals\n + [Overview](evals/)\n + Getting Started\n\n\n\n\n + \ Getting Started\n - [Quick Start](evals/quick-start/)\n - [Core Concepts](evals/core-concepts/)\n + \ + Evaluators\n\n\n\n\n Evaluators\n - [Overview](evals/evaluators/overview/)\n - [Built-in Evaluators](evals/evaluators/built-in/)\n + \ - [LLM Judge](evals/evaluators/llm-judge/)\n - [Custom Evaluators](evals/evaluators/custom/)\n - + [Span-Based](evals/evaluators/span-based/)\n + How-To Guides\n\n\n\n\n How-To Guides\n - [Logfire Integration](evals/how-to/logfire-integration/)\n + \ - [Dataset Management](evals/how-to/dataset-management/)\n - [Dataset Serialization](evals/how-to/dataset-serialization/)\n + \ - [Concurrency & Performance](evals/how-to/concurrency/)\n - [Retry Strategies](evals/how-to/retry-strategies/)\n + \ - [Metrics & Attributes](evals/how-to/metrics-attributes/)\n + Examples\n\n\n\n\n Examples\n - + [Simple Validation](evals/examples/simple-validation/)\n* Pydantic Graph\n\n\n\n\n Pydantic Graph\n + [Overview](graph/)\n + \ + [Beta API](graph/beta/)\n\n Beta API\n - 
[Steps](graph/beta/steps/)\n - [Joins & Reducers](graph/beta/joins/)\n + \ - [Decisions](graph/beta/decisions/)\n - [Parallel Execution](graph/beta/parallel/)\n* Integrations\n\n\n\n\n + \ Integrations\n + [Debugging & Monitoring with Pydantic Logfire](logfire/)\n + Durable Execution\n\n\n\n\n + \ Durable Execution\n - [Overview](durable_execution/overview/)\n - [Temporal](durable_execution/temporal/)\n + \ - [DBOS](durable_execution/dbos/)\n - [Prefect](durable_execution/prefect/)\n + UI Event Streams\n\n\n\n\n + \ UI Event Streams\n - [Overview](ui/overview/)\n - [AG-UI](ui/ag-ui/)\n - [Vercel AI](ui/vercel-ai/)\n + \ + [Agent2Agent (A2A)](a2a/)\n* Related Packages\n\n\n\n\n Related Packages\n + [Clai](cli/)\n* Examples\n\n\n\n\n + \ Examples\n + [Setup](examples/setup/)\n + Getting Started\n\n\n\n\n Getting Started\n - [Pydantic + Model](examples/pydantic-model/)\n - [Weather agent](examples/weather-agent/)\n + Conversational Agents\n\n\n\n\n + \ Conversational Agents\n - [Chat App with FastAPI](examples/chat-app/)\n - [Bank support](examples/bank-support/)\n + \ + Data & Analytics\n\n\n\n\n Data & Analytics\n - [SQL Generation](examples/sql-gen/)\n - [Data + Analyst](examples/data-analyst/)\n - [RAG](examples/rag/)\n + Streaming\n\n\n\n\n Streaming\n - + [Stream markdown](examples/stream-markdown/)\n - [Stream whales](examples/stream-whales/)\n + Complex + Workflows\n\n\n\n\n Complex Workflows\n - [Flight booking](examples/flight-booking/)\n - [Question + Graph](examples/question-graph/)\n + Business Applications\n\n\n\n\n Business Applications\n - [Slack + Lead Qualifier with Modal](examples/slack-lead-qualifier/)\n + UI Examples\n\n\n\n\n UI Examples\n - + [Agent User Interaction (AG-UI)](examples/ag-ui/)\n* API Reference\n\n\n\n\n API Reference\n + pydantic\\_ai\n\n\n\n\n + \ pydantic\\_ai\n - [pydantic\\_ai.agent](api/agent/)\n - [pydantic\\_ai.tools](api/tools/)\n - + [pydantic\\_ai.toolsets](api/toolsets/)\n - [pydantic\\_ai.builtin\\_tools](api/builtin_tools/)\n - + [pydantic\\_ai.common\\_tools](api/common_tools/)\n - [pydantic\\_ai.durable\\_exec](api/durable_exec/)\n + \ - [pydantic\\_ai.output](api/output/)\n - [pydantic\\_ai.result](api/result/)\n - [pydantic\\_ai.messages](api/messages/)\n + \ - [pydantic\\_ai.exceptions](api/exceptions/)\n - [pydantic\\_ai.settings](api/settings/)\n - [pydantic\\_ai.usage](api/usage/)\n + \ - [pydantic\\_ai.mcp](api/mcp/)\n - [pydantic\\_ai.format\\_prompt](api/format_prompt/)\n - [pydantic\\_ai.direct](api/direct/)\n + \ - [pydantic\\_ai.ext](api/ext/)\n - [pydantic\\_ai.models.anthropic](api/models/anthropic/)\n - + [pydantic\\_ai.models](api/models/base/)\n - [pydantic\\_ai.models.bedrock](api/models/bedrock/)\n - + [pydantic\\_ai.models.cohere](api/models/cohere/)\n - [pydantic\\_ai.models.fallback](api/models/fallback/)\n + \ - [pydantic\\_ai.models.function](api/models/function/)\n - [pydantic\\_ai.models.google](api/models/google/)\n + \ - [pydantic\\_ai.models.groq](api/models/groq/)\n - [pydantic\\_ai.models.huggingface](api/models/huggingface/)\n + \ - [pydantic\\_ai.models.instrumented](api/models/instrumented/)\n - [pydantic\\_ai.models.mcp\\_sampling](api/models/mcp-sampling/)\n + \ - [pydantic\\_ai.models.mistral](api/models/mistral/)\n - [pydantic\\_ai.models.openai](api/models/openai/)\n + \ - [pydantic\\_ai.models.openrouter](api/models/openrouter/)\n - [pydantic\\_ai.models.outlines](api/models/outlines/)\n + \ - [pydantic\\_ai.models.test](api/models/test/)\n - [pydantic\\_ai.models.wrapper](api/models/wrapper/)\n + \ - 
[pydantic\\_ai.profiles](api/profiles/)\n - [pydantic\\_ai.providers](api/providers/)\n - [pydantic\\_ai.retries](api/retries/)\n + \ - [pydantic\\_ai.run](api/run/)\n - [pydantic\\_ai.ag\\_ui](api/ag_ui/)\n - [pydantic\\_ai.ui](api/ui/base/)\n + \ - [pydantic\\_ai.ui.ag\\_ui](api/ui/ag_ui/)\n - [pydantic\\_ai.ui.vercel\\_ai](api/ui/vercel_ai/)\n + \ + pydantic\\_evals\n\n\n\n\n pydantic\\_evals\n - [pydantic\\_evals.dataset](api/pydantic_evals/dataset/)\n + \ - [pydantic\\_evals.evaluators](api/pydantic_evals/evaluators/)\n - [pydantic\\_evals.reporting](api/pydantic_evals/reporting/)\n + \ - [pydantic\\_evals.otel](api/pydantic_evals/otel/)\n - [pydantic\\_evals.generation](api/pydantic_evals/generation/)\n + \ + pydantic\\_graph\n\n\n\n\n pydantic\\_graph\n - [pydantic\\_graph](api/pydantic_graph/graph/)\n + \ - [pydantic\\_graph.nodes](api/pydantic_graph/nodes/)\n - [pydantic\\_graph.persistence](api/pydantic_graph/persistence/)\n + \ - [pydantic\\_graph.mermaid](api/pydantic_graph/mermaid/)\n - [pydantic\\_graph.exceptions](api/pydantic_graph/exceptions/)\n + \ - Beta API\n\n\n\n\n Beta API\n * [pydantic\\_graph.beta](api/pydantic_graph/beta/)\n * + [pydantic\\_graph.beta.graph](api/pydantic_graph/beta_graph/)\n * [pydantic\\_graph.beta.graph\\_builder](api/pydantic_graph/beta_graph_builder/)\n + \ * [pydantic\\_graph.beta.step](api/pydantic_graph/beta_step/)\n * [pydantic\\_graph.beta.join](api/pydantic_graph/beta_join/)\n + \ * [pydantic\\_graph.beta.decision](api/pydantic_graph/beta_decision/)\n * [pydantic\\_graph.beta.node](api/pydantic_graph/beta_node/)\n + \ + fasta2a\n\n\n\n\n fasta2a\n - [fasta2a](api/fasta2a/)\n* Project\n\n\n\n\n Project\n + [Contributing](contributing/)\n + \ + [Upgrade Guide](changelog/)\n + [Version policy](version-policy/)\n\nTable of contents\n\n* [Why use + Pydantic AI](#why-use-pydantic-ai)\n* [Hello World Example](#hello-world-example)\n* [Tools & Dependency Injection + Example](#tools-dependency-injection-example)\n* [Instrumentation with Pydantic Logfire](#instrumentation-with-pydantic-logfire)\n* + [llms.txt](#llmstxt)\n* [Next Steps](#next-steps)\n\n# Pydantic AI\n\n![Pydantic AI](./img/pydantic-ai-dark.svg#only-dark)\n\n![Pydantic + AI](./img/pydantic-ai-light.svg#only-light)\n\n*GenAI Agent Framework, the Pydantic way*\n\n[![CI](https://github.com/pydantic/pydantic-ai/actions/workflows/ci.yml/badge.svg?event=push)](https://github.com/pydantic/pydantic-ai/actions/workflows/ci.yml?query=branch%3Amain)\n[![Coverage](https://coverage-badge.samuelcolvin.workers.dev/pydantic/pydantic-ai.svg)](https://coverage-badge.samuelcolvin.workers.dev/redirect/pydantic/pydantic-ai)\n[![PyPI](https://img.shields.io/pypi/v/pydantic-ai.svg)](https://pypi.python.org/pypi/pydantic-ai)\n[![versions](https://img.shields.io/pypi/pyversions/pydantic-ai.svg)](https://github.com/pydantic/pydantic-ai)\n[![license](https://img.shields.io/github/license/pydantic/pydantic-ai.svg)](https://github.com/pydantic/pydantic-ai/blob/main/LICENSE)\n[![Join + Slack](https://img.shields.io/badge/Slack-Join%20Slack-4A154B?logo=slack)](https://logfire.pydantic.dev/docs/join-slack/)\n\nPydantic + AI is a Python agent framework designed to help you\nquickly, confidently, and painlessly build production + grade applications and workflows with Generative AI.\n\nFastAPI revolutionized web development by offering + an innovative and ergonomic design, built on the foundation of [Pydantic Validation](https://docs.pydantic.dev) + and modern Python features like type hints.\n\nYet despite virtually 
every Python agent framework and LLM + library using Pydantic Validation, when we began to use LLMs in [Pydantic Logfire](https://pydantic.dev/logfire), + we couldn't find anything that gave us the same feeling.\n\nWe built Pydantic AI with one simple aim: to bring + that FastAPI feeling to GenAI app and agent development.\n\n## Why use Pydantic AI\n\n1. **Built by the Pydantic + Team**:\n [Pydantic Validation](https://docs.pydantic.dev/latest/) is the validation layer of the OpenAI + SDK, the Google ADK, the Anthropic SDK, LangChain, LlamaIndex, AutoGPT, Transformers, CrewAI, Instructor and + many more. *Why use the derivative when you can go straight to the source?* ![\U0001F603](https://cdn.jsdelivr.net/gh/jdecked/twemoji@15.1.0/assets/svg/1f603.svg + \":smiley:\")\n2. **Model-agnostic**:\n Supports virtually every [model](models/overview/) and provider: + OpenAI, Anthropic, Gemini, DeepSeek, Grok, Cohere, Mistral, and Perplexity; Azure AI Foundry, Amazon Bedrock, + Google Vertex AI, Ollama, LiteLLM, Groq, OpenRouter, Together AI, Fireworks AI, Cerebras, Hugging Face, GitHub, + Heroku, Vercel, Nebius, OVHcloud, and Outlines. If your favorite model or provider is not listed, you can + easily implement a [custom model](models/overview/#custom-models).\n3. **Seamless Observability**:\n Tightly + [integrates](logfire/) with [Pydantic Logfire](https://pydantic.dev/logfire), our general-purpose OpenTelemetry + observability platform, for real-time debugging, evals-based performance monitoring, and behavior, tracing, + and cost tracking. If you already have an observability platform that supports OTel, you can [use that too](logfire/#alternative-observability-backends).\n4. + **Fully Type-safe**:\n Designed to give your IDE or AI coding agent as much context as possible for auto-completion + and [type checking](agents/#static-type-checking), moving entire classes of errors from runtime to write-time + for a bit of that Rust \"if it compiles, it works\" feel.\n5. **Powerful Evals**:\n Enables you to systematically + test and [evaluate](evals/) the performance and accuracy of the agentic systems you build, and monitor the + performance over time in Pydantic Logfire.\n6. **MCP, A2A, and UI**:\n Integrates the [Model Context Protocol](mcp/overview/), + [Agent2Agent](a2a/), and various [UI event stream](ui/overview/) standards to give your agent access to external + tools and data, let it interoperate with other agents, and build interactive applications with streaming event-based + communication.\n7. **Human-in-the-Loop Tool Approval**:\n Easily lets you flag that certain tool calls [require + approval](deferred-tools/#human-in-the-loop-tool-approval) before they can proceed, possibly depending on + tool call arguments, conversation history, or user preferences.\n8. **Durable Execution**:\n Enables you + to build [durable agents](durable_execution/overview/) that can preserve their progress across transient API + failures and application errors or restarts, and handle long-running, asynchronous, and human-in-the-loop + workflows with production-grade reliability.\n9. **Streamed Outputs**:\n Provides the ability to [stream](output/#streamed-results) + structured output continuously, with immediate validation, ensuring real time access to generated data.\n10. 
+ **Graph Support**:\n Provides a powerful way to define [graphs](graph/) using type hints, for use in complex + applications where standard control flow can degrade to spaghetti code.\n\nRealistically though, no list is + going to be as convincing as [giving it a try](#next-steps) and seeing how it makes you feel!\n\n**Sign up + for our newsletter, *The Pydantic Stack*, with updates & tutorials on Pydantic AI, Logfire, and Pydantic:**\n\nSubscribe\n\n## + Hello World Example\n\nHere's a minimal example of Pydantic AI:\n\nWith Pydantic AI GatewayDirectly to Provider + API\n\n[Learn about Gateway](../gateway) hello\\_world.py\n\n```\nfrom pydantic_ai import Agent\n\nagent = + Agent( # (1)!\n 'gateway/anthropic:claude-sonnet-4-0',\n instructions='Be concise, reply with one sentence.', + \ # (2)!\n)\n\nresult = agent.run_sync('Where does \"hello world\" come from?') # (3)!\nprint(result.output)\n\"\"\"\nThe + first known use of \"hello, world\" was in a 1974 textbook about the C programming language.\n\"\"\"\n```\n\n1. + We configure the agent to use [Anthropic's Claude Sonnet 4.0](api/models/anthropic/) model, but you can also + set the model when running the agent.\n2. Register static [instructions](agents/#instructions) using a keyword + argument to the agent.\n3. [Run the agent](agents/#running-agents) synchronously, starting a conversation + with the LLM.\n\nhello\\_world.py\n\n```\nfrom pydantic_ai import Agent\n\nagent = Agent( # (1)!\n 'anthropic:claude-sonnet-4-0',\n + \ instructions='Be concise, reply with one sentence.', # (2)!\n)\n\nresult = agent.run_sync('Where does + \"hello world\" come from?') # (3)!\nprint(result.output)\n\"\"\"\nThe first known use of \"hello, world\" + was in a 1974 textbook about the C programming language.\n\"\"\"\n```\n\n1. We configure the agent to use + [Anthropic's Claude Sonnet 4.0](api/models/anthropic/) model, but you can also set the model when running + the agent.\n2. Register static [instructions](agents/#instructions) using a keyword argument to the agent.\n3. 
+ [Run the agent](agents/#running-agents) synchronously, starting a conversation with the LLM.\n\n*(This example + is complete, it can be run \"as is\", assuming you've [installed the `pydantic_ai` package](install/))*\n\nThe + exchange will be very short: Pydantic AI will send the instructions and the user prompt to the LLM, and the + model will return a text response.\n\nNot very interesting yet, but we can easily add [tools](tools/), [dynamic + instructions](agents/#instructions), and [structured outputs](output/) to build more powerful agents.\n\n## + Tools & Dependency Injection Example\n\nHere is a concise example using Pydantic AI to build a support agent + for a bank:\n\nWith Pydantic AI GatewayDirectly to Provider API\n\n[Learn about Gateway](../gateway) bank\\_support.py\n\n```\nfrom + dataclasses import dataclass\n\nfrom pydantic import BaseModel, Field\nfrom pydantic_ai import Agent, RunContext\n\nfrom + bank_database import DatabaseConn\n\n\n@dataclass\nclass SupportDependencies: # (3)!\n customer_id: int\n + \ db: DatabaseConn # (12)!\n\n\nclass SupportOutput(BaseModel): # (13)!\n support_advice: str = Field(description='Advice + returned to the customer')\n block_card: bool = Field(description=\"Whether to block the customer's card\")\n + \ risk: int = Field(description='Risk level of query', ge=0, le=10)\n\n\nsupport_agent = Agent( # (1)!\n + \ 'gateway/openai:gpt-5', # (2)!\n deps_type=SupportDependencies,\n output_type=SupportOutput, # + (9)!\n instructions=( # (4)!\n 'You are a support agent in our bank, give the '\n 'customer + support and judge the risk level of their query.'\n ),\n)\n\n\n@support_agent.instructions # (5)!\nasync + def add_customer_name(ctx: RunContext[SupportDependencies]) -> str:\n customer_name = await ctx.deps.db.customer_name(id=ctx.deps.customer_id)\n + \ return f\"The customer's name is {customer_name!r}\"\n\n\n@support_agent.tool # (6)!\nasync def customer_balance(\n + \ ctx: RunContext[SupportDependencies], include_pending: bool\n) -> float:\n \"\"\"Returns the customer's + current account balance.\"\"\" # (7)!\n return await ctx.deps.db.customer_balance(\n id=ctx.deps.customer_id,\n + \ include_pending=include_pending,\n )\n\n\n... # (11)!\n\n\nasync def main():\n deps = SupportDependencies(customer_id=123, + db=DatabaseConn())\n result = await support_agent.run('What is my balance?', deps=deps) # (8)!\n print(result.output) + \ # (10)!\n \"\"\"\n support_advice='Hello John, your current account balance, including pending transactions, + is $123.45.' block_card=False risk=1\n \"\"\"\n\n result = await support_agent.run('I just lost my card!', + deps=deps)\n print(result.output)\n \"\"\"\n support_advice=\"I'm sorry to hear that, John. We are + temporarily blocking your card to prevent unauthorized transactions.\" block_card=True risk=8\n \"\"\"\n```\n\n1. + This [agent](agents/) will act as first-tier support in a bank. Agents are generic in the type of dependencies + they accept and the type of output they return. In this case, the support agent has type `Agent[SupportDependencies, + SupportOutput]`.\n2. Here we configure the agent to use [OpenAI's GPT-5 model](api/models/openai/), you can + also set the model when running the agent.\n3. The `SupportDependencies` dataclass is used to pass data, connections, + and logic into the model that will be needed when running [instructions](agents/#instructions) and [tool](tools/) + functions. 
Pydantic AI's system of dependency injection provides a [type-safe](agents/#static-type-checking) + way to customise the behavior of your agents, and can be especially useful when running [unit tests](testing/) + and evals.\n4. Static [instructions](agents/#instructions) can be registered with the [`instructions` keyword + argument](api/agent/#pydantic_ai.agent.Agent.__init__) to the agent.\n5. Dynamic [instructions](agents/#instructions) + can be registered with the [`@agent.instructions`](api/agent/#pydantic_ai.agent.Agent.instructions) decorator, + and can make use of dependency injection. Dependencies are carried via the [`RunContext`](api/tools/#pydantic_ai.tools.RunContext) + argument, which is parameterized with the `deps_type` from above. If the type annotation here is wrong, static + type checkers will catch it.\n6. The [`@agent.tool`](tools/) decorator let you register functions which the + LLM may call while responding to a user. Again, dependencies are carried via [`RunContext`](api/tools/#pydantic_ai.tools.RunContext), + any other arguments become the tool schema passed to the LLM. Pydantic is used to validate these arguments, + and errors are passed back to the LLM so it can retry.\n7. The docstring of a tool is also passed to the LLM + as the description of the tool. Parameter descriptions are [extracted](tools/#function-tools-and-schema) from + the docstring and added to the parameter schema sent to the LLM.\n8. [Run the agent](agents/#running-agents) + asynchronously, conducting a conversation with the LLM until a final response is reached. Even in this fairly + simple case, the agent will exchange multiple messages with the LLM as tools are called to retrieve an output.\n9. + The response from the agent will be guaranteed to be a `SupportOutput`. If validation fails [reflection](agents/#reflection-and-self-correction), + the agent is prompted to try again.\n10. The output will be validated with Pydantic to guarantee it is a `SupportOutput`, + since the agent is generic, it'll also be typed as a `SupportOutput` to aid with static type checking.\n11. + In a real use case, you'd add more tools and longer instructions to the agent to extend the context it's equipped + with and support it can provide.\n12. This is a simple sketch of a database connection, used to keep the example + short and readable. In reality, you'd be connecting to an external database (e.g. PostgreSQL) to get information + about customers.\n13. This [Pydantic](https://docs.pydantic.dev) model is used to constrain the structured + data returned by the agent. 
From this simple definition, Pydantic builds the JSON Schema that tells the LLM + how to return the data, and performs validation to guarantee the data is correct at the end of the run.\n\nbank\\_support.py\n\n```\nfrom + dataclasses import dataclass\n\nfrom pydantic import BaseModel, Field\nfrom pydantic_ai import Agent, RunContext\n\nfrom + bank_database import DatabaseConn\n\n\n@dataclass\nclass SupportDependencies: # (3)!\n customer_id: int\n + \ db: DatabaseConn # (12)!\n\n\nclass SupportOutput(BaseModel): # (13)!\n support_advice: str = Field(description='Advice + returned to the customer')\n block_card: bool = Field(description=\"Whether to block the customer's card\")\n + \ risk: int = Field(description='Risk level of query', ge=0, le=10)\n\n\nsupport_agent = Agent( # (1)!\n + \ 'openai:gpt-5', # (2)!\n deps_type=SupportDependencies,\n output_type=SupportOutput, # (9)!\n + \ instructions=( # (4)!\n 'You are a support agent in our bank, give the '\n 'customer support + and judge the risk level of their query.'\n ),\n)\n\n\n@support_agent.instructions # (5)!\nasync def add_customer_name(ctx: + RunContext[SupportDependencies]) -> str:\n customer_name = await ctx.deps.db.customer_name(id=ctx.deps.customer_id)\n + \ return f\"The customer's name is {customer_name!r}\"\n\n\n@support_agent.tool # (6)!\nasync def customer_balance(\n + \ ctx: RunContext[SupportDependencies], include_pending: bool\n) -> float:\n \"\"\"Returns the customer's + current account balance.\"\"\" # (7)!\n return await ctx.deps.db.customer_balance(\n id=ctx.deps.customer_id,\n + \ include_pending=include_pending,\n )\n\n\n... # (11)!\n\n\nasync def main():\n deps = SupportDependencies(customer_id=123, + db=DatabaseConn())\n result = await support_agent.run('What is my balance?', deps=deps) # (8)!\n print(result.output) + \ # (10)!\n \"\"\"\n support_advice='Hello John, your current account balance, including pending transactions, + is $123.45.' block_card=False risk=1\n \"\"\"\n\n result = await support_agent.run('I just lost my card!', + deps=deps)\n print(result.output)\n \"\"\"\n support_advice=\"I'm sorry to hear that, John. We are + temporarily blocking your card to prevent unauthorized transactions.\" block_card=True risk=8\n \"\"\"\n```\n\n1. + This [agent](agents/) will act as first-tier support in a bank. Agents are generic in the type of dependencies + they accept and the type of output they return. In this case, the support agent has type `Agent[SupportDependencies, + SupportOutput]`.\n2. Here we configure the agent to use [OpenAI's GPT-5 model](api/models/openai/), you can + also set the model when running the agent.\n3. The `SupportDependencies` dataclass is used to pass data, connections, + and logic into the model that will be needed when running [instructions](agents/#instructions) and [tool](tools/) + functions. Pydantic AI's system of dependency injection provides a [type-safe](agents/#static-type-checking) + way to customise the behavior of your agents, and can be especially useful when running [unit tests](testing/) + and evals.\n4. Static [instructions](agents/#instructions) can be registered with the [`instructions` keyword + argument](api/agent/#pydantic_ai.agent.Agent.__init__) to the agent.\n5. Dynamic [instructions](agents/#instructions) + can be registered with the [`@agent.instructions`](api/agent/#pydantic_ai.agent.Agent.instructions) decorator, + and can make use of dependency injection. 
Dependencies are carried via the [`RunContext`](api/tools/#pydantic_ai.tools.RunContext) + argument, which is parameterized with the `deps_type` from above. If the type annotation here is wrong, static + type checkers will catch it.\n6. The [`@agent.tool`](tools/) decorator let you register functions which the + LLM may call while responding to a user. Again, dependencies are carried via [`RunContext`](api/tools/#pydantic_ai.tools.RunContext), + any other arguments become the tool schema passed to the LLM. Pydantic is used to validate these arguments, + and errors are passed back to the LLM so it can retry.\n7. The docstring of a tool is also passed to the LLM + as the description of the tool. Parameter descriptions are [extracted](tools/#function-tools-and-schema) from + the docstring and added to the parameter schema sent to the LLM.\n8. [Run the agent](agents/#running-agents) + asynchronously, conducting a conversation with the LLM until a final response is reached. Even in this fairly + simple case, the agent will exchange multiple messages with the LLM as tools are called to retrieve an output.\n9. + The response from the agent will be guaranteed to be a `SupportOutput`. If validation fails [reflection](agents/#reflection-and-self-correction), + the agent is prompted to try again.\n10. The output will be validated with Pydantic to guarantee it is a `SupportOutput`, + since the agent is generic, it'll also be typed as a `SupportOutput` to aid with static type checking.\n11. + In a real use case, you'd add more tools and longer instructions to the agent to extend the context it's equipped + with and support it can provide.\n12. This is a simple sketch of a database connection, used to keep the example + short and readable. In reality, you'd be connecting to an external database (e.g. PostgreSQL) to get information + about customers.\n13. This [Pydantic](https://docs.pydantic.dev) model is used to constrain the structured + data returned by the agent. From this simple definition, Pydantic builds the JSON Schema that tells the LLM + how to return the data, and performs validation to guarantee the data is correct at the end of the run.\n\nComplete + `bank_support.py` example\n\nThe code included here is incomplete for the sake of brevity (the definition + of `DatabaseConn` is missing); you can find the complete `bank_support.py` example [here](examples/bank-support/).\n\n## + Instrumentation with Pydantic Logfire\n\nEven a simple agent with just a handful of tools can result in a + lot of back-and-forth with the LLM, making it nearly impossible to be confident of what's going on just from + reading the code.\nTo understand the flow of the above runs, we can watch the agent in action using Pydantic + Logfire.\n\nTo do this, we need to [set up Logfire](logfire/#using-logfire), and add the following to our + code:\n\nWith Pydantic AI GatewayDirectly to Provider API\n\n[Learn about Gateway](../gateway) bank\\_support\\_with\\_logfire.py\n\n```\n...\nfrom + pydantic_ai import Agent, RunContext\n\nfrom bank_database import DatabaseConn\n\nimport logfire\n\nlogfire.configure() + \ # (1)!\nlogfire.instrument_pydantic_ai() # (2)!\nlogfire.instrument_asyncpg() # (3)!\n\n...\n\nsupport_agent + = Agent(\n 'gateway/openai:gpt-5',\n deps_type=SupportDependencies,\n output_type=SupportOutput,\n + \ system_prompt=(\n 'You are a support agent in our bank, give the '\n 'customer support and + judge the risk level of their query.'\n ),\n)\n```\n\n1. 
Configure the Logfire SDK, this will fail if project + is not set up.\n2. This will instrument all Pydantic AI agents used from here on out. If you want to instrument + only a specific agent, you can pass the [`instrument=True` keyword argument](api/agent/#pydantic_ai.agent.Agent.__init__) + to the agent.\n3. In our demo, `DatabaseConn` uses `asyncpg` to connect to a PostgreSQL database, so [`logfire.instrument_asyncpg()`](https://magicstack.github.io/asyncpg/current/) + is used to log the database queries.\n\nbank\\_support\\_with\\_logfire.py\n\n```\n...\nfrom pydantic_ai import + Agent, RunContext\n\nfrom bank_database import DatabaseConn\n\nimport logfire\n\nlogfire.configure() # (1)!\nlogfire.instrument_pydantic_ai() + \ # (2)!\nlogfire.instrument_asyncpg() # (3)!\n\n...\n\nsupport_agent = Agent(\n 'openai:gpt-5',\n deps_type=SupportDependencies,\n + \ output_type=SupportOutput,\n system_prompt=(\n 'You are a support agent in our bank, give the + '\n 'customer support and judge the risk level of their query.'\n ),\n)\n```\n\n1. Configure the + Logfire SDK, this will fail if project is not set up.\n2. This will instrument all Pydantic AI agents used + from here on out. If you want to instrument only a specific agent, you can pass the [`instrument=True` keyword + argument](api/agent/#pydantic_ai.agent.Agent.__init__) to the agent.\n3. In our demo, `DatabaseConn` uses + `asyncpg` to connect to a PostgreSQL database, so [`logfire.instrument_asyncpg()`](https://magicstack.github.io/asyncpg/current/) + is used to log the database queries.\n\nThat's enough to get the following view of your agent in action:\n\nSee + [Monitoring and Performance](logfire/) to learn more.\n\n## `llms.txt`\n\nThe Pydantic AI documentation is + available in the [llms.txt](https://llmstxt.org/) format.\nThis format is defined in Markdown and suited for + LLMs and AI coding assistants and agents.\n\nTwo formats are available:\n\n* [`llms.txt`](https://ai.pydantic.dev/llms.txt): + a file containing a brief description\n of the project, along with links to the different sections of the + documentation. The structure\n of this file is described in details [here](https://llmstxt.org/#format).\n* + [`llms-full.txt`](https://ai.pydantic.dev/llms-full.txt): Similar to the `llms.txt` file,\n but every link + content is included. Note that this file may be too large for some LLMs.\n\nAs of today, these files are not + automatically leveraged by IDEs or coding agents, but they will use it if you provide a link or the full text.\n\n## + Next Steps\n\nTo try Pydantic AI for yourself, [install it](install/) and follow the instructions [in the + examples](examples/setup/).\n\nRead the [docs](agents/) to learn more about building applications with Pydantic + AI.\n\nRead the [API Reference](api/agent/) to understand Pydantic AI's interface.\n\nJoin [Slack](https://logfire.pydantic.dev/docs/join-slack/) + or file an issue on [GitHub](https://github.com/pydantic/pydantic-ai/issues) if you have any questions.\n\n\n\n© + Pydantic Services Inc. 
2024 to present" media_type: text/plain type: text title: Pydantic AI type: document - retrieved_at: '2025-11-14T23:34:21.151000+00:00' + retrieved_at: '2025-12-08T15:05:59.571000+00:00' type: web_fetch_result url: https://ai.pydantic.dev - tool_use_id: srvtoolu_01So85wNUocinTvFfgKCfQeb + tool_use_id: srvtoolu_01MSZmtbzt6NmQizTETf3GPF type: web_fetch_tool_result - text: Pydantic AI is a Python agent framework designed to help you quickly, confidently, and painlessly build production grade applications and workflows with Generative AI. type: text - id: msg_014MfQbsguyfo8X7ffezhM5Q + id: msg_015NpiPXidB2wEH4VhabzwgC model: claude-sonnet-4-20250514 role: assistant stop_reason: end_turn @@ -372,8 +362,8 @@ interactions: ephemeral_5m_input_tokens: 0 cache_creation_input_tokens: 0 cache_read_input_tokens: 0 - input_tokens: 7262 - output_tokens: 171 + input_tokens: 11440 + output_tokens: 158 server_tool_use: web_fetch_requests: 1 web_search_requests: 0 @@ -390,7 +380,7 @@ interactions: connection: - keep-alive content-length: - - '21997' + - '34473' content-type: - application/json host: @@ -404,13 +394,12 @@ interactions: type: text role: user - content: - - signature: EsIDCkYICRgCKkAKi/j4a8lGN12CjyS27ZXcPkXHGyTbn1vJENJz+AjinyTnsrynMEhidWT5IMNAs0TDgwSwPLNmgq4MsPkVekB8EgxetaK+Nhg8wUdhTEAaDMukODgr3JaYHZwVEiIwgKBckFLJ/C7wCD9oGCIECbqpaeEuWQ8BH3Hev6wpuc+66Wu7AJM1jGH60BpsUovnKqkCrHNq6b1SDT41cm2w7cyxZggrX6crzYh0fAkZ+VC6FBjy6mJikZtX6reKD+064KZ4F1oe4Qd40EBp/wHvD7oPV/fhGut1fzwl48ZgB8uzJb3tHr9MBjs4PVTsvKstpHKpOo6NLvCknQJ/0730OTENp/JOR6h6RUl6kMl5OrHTvsDEYpselUBPtLikm9p4t+d8CxqGm/B1kg1wN3FGJK31PD3veYIOO4hBirFPXWd+AiB1rZP++2QjToZ9lD2xqP/Q3vWEU+/Ryp6uzaRFWPVQkIr+mzpIaJsYuKDiyduxF4LD/hdMTV7IVDtconeQIPQJRhuO6nICBEuqb0uIotPDnCU6iI2l9OyEeKJM0RS6/NTNG8DZnvyVJ8gGKbtZKSHK6KKsdH0f7d+DGAE= - thinking: |- - The user is asking me to fetch the content from https://ai.pydantic.dev and return only the first sentence on that page. I need to use the web_fetch tool to get the content from this URL, then identify the first sentence and return only that sentence. - - Let me fetch the page first. + - signature: EooDCkYIChgCKkBe6ddqCwT1CKptPg14EIIaDdq/qCKZucUmb9w4ci/O5pSzheW3Vv33pkeqmFPrcr4l5CWAVM/xaV7NjHNwOPohEgza8xxqBGZ7jds5BzMaDFyd3dP3X5SSgPSg7SIwfyJLZ+yYCfCrpsgV77T7Ay6iBvfLp0ZaSb+ph+2YkSSVAxFDodWxWyv5DiVHRLJnKvEBcESvFzbas8bML22jelhD1nxGiyr6GGBCjavRGaz6LpPExc03FEa9qS0YEvAniVkVxLJprdDcW4Sm2/lLTh6TRiiicyELomVYxI4FrK1R981pA9ZdDgP8iE3YmcvhvvVJpxgUK+6Tr0LJSq5GgnlcPVEcXc+PYzqLNwlHiH+Vm9bPVs/N/JhfYBPKKREWgtXQBvpsxDM8f5Rj6569D7K3oKZ7Dbglc8eWyn1KFYHV4R+sXc4XOHJDPWuEjgW5/aYUfnP5yDlscfTHDgfrZVy7se8rjgtnpwLNstk7GbLUzgIft6p7hTTUIGB7icopfZtoahgB + thinking: The user wants me to fetch the content from https://ai.pydantic.dev and return only the first sentence. + I need to use the web_fetch tool to get the content from this URL, then identify the first sentence and return + only that. type: thinking - - id: srvtoolu_01So85wNUocinTvFfgKCfQeb + - id: srvtoolu_01MSZmtbzt6NmQizTETf3GPF input: url: https://ai.pydantic.dev name: web_fetch @@ -419,295 +408,290 @@ interactions: content: citations: null source: - data: |- - Pydantic AI - GenAI Agent Framework, the Pydantic way - Pydantic AI is a Python agent framework designed to help you quickly, confidently, and painlessly build production grade applications and workflows with Generative AI. - FastAPI revolutionized web development by offering an innovative and ergonomic design, built on the foundation of [Pydantic Validation](https://docs.pydantic.dev) and modern Python features like type hints. 
- Yet despite virtually every Python agent framework and LLM library using Pydantic Validation, when we began to use LLMs in [Pydantic Logfire](https://pydantic.dev/logfire), we couldn't find anything that gave us the same feeling. - We built Pydantic AI with one simple aim: to bring that FastAPI feeling to GenAI app and agent development. - Why use Pydantic AI - - - Built by the Pydantic Team: - [Pydantic Validation](https://docs.pydantic.dev/latest/)is the validation layer of the OpenAI SDK, the Google ADK, the Anthropic SDK, LangChain, LlamaIndex, AutoGPT, Transformers, CrewAI, Instructor and many more. Why use the derivative when you can go straight to the source? - - Model-agnostic: Supports virtually every - [model](models/overview/)and provider: OpenAI, Anthropic, Gemini, DeepSeek, Grok, Cohere, Mistral, and Perplexity; Azure AI Foundry, Amazon Bedrock, Google Vertex AI, Ollama, LiteLLM, Groq, OpenRouter, Together AI, Fireworks AI, Cerebras, Hugging Face, GitHub, Heroku, Vercel, Nebius, OVHcloud, and Outlines. If your favorite model or provider is not listed, you can easily implement a[custom model](models/overview/#custom-models). - - Seamless Observability: Tightly - [integrates](logfire/)with[Pydantic Logfire](https://pydantic.dev/logfire), our general-purpose OpenTelemetry observability platform, for real-time debugging, evals-based performance monitoring, and behavior, tracing, and cost tracking. If you already have an observability platform that supports OTel, you can[use that too](logfire/#alternative-observability-backends). - - Fully Type-safe: Designed to give your IDE or AI coding agent as much context as possible for auto-completion and - [type checking](agents/#static-type-checking), moving entire classes of errors from runtime to write-time for a bit of that Rust "if it compiles, it works" feel. - - Powerful Evals: Enables you to systematically test and - [evaluate](evals/)the performance and accuracy of the agentic systems you build, and monitor the performance over time in Pydantic Logfire. - - MCP, A2A, and UI: Integrates the - [Model Context Protocol](mcp/overview/),[Agent2Agent](a2a/), and various[UI event stream](ui/overview/)standards to give your agent access to external tools and data, let it interoperate with other agents, and build interactive applications with streaming event-based communication. - - Human-in-the-Loop Tool Approval: Easily lets you flag that certain tool calls - [require approval](deferred-tools/#human-in-the-loop-tool-approval)before they can proceed, possibly depending on tool call arguments, conversation history, or user preferences. - - Durable Execution: Enables you to build - [durable agents](durable_execution/overview/)that can preserve their progress across transient API failures and application errors or restarts, and handle long-running, asynchronous, and human-in-the-loop workflows with production-grade reliability. - - Streamed Outputs: Provides the ability to - [stream](output/#streamed-results)structured output continuously, with immediate validation, ensuring real time access to generated data. - - Graph Support: Provides a powerful way to define - [graphs](graph/)using type hints, for use in complex applications where standard control flow can degrade to spaghetti code. - Realistically though, no list is going to be as convincing as [giving it a try](#next-steps) and seeing how it makes you feel! 
- Sign up for our newsletter, The Pydantic Stack, with updates & tutorials on Pydantic AI, Logfire, and Pydantic: - Hello World Example - Here's a minimal example of Pydantic AI: - [Learn about Gateway](gateway)hello_world.py - from pydantic_ai import Agent - agent = Agent( # (1)! - 'gateway/anthropic:claude-sonnet-4-0', - instructions='Be concise, reply with one sentence.', # (2)! - ) - result = agent.run_sync('Where does "hello world" come from?') # (3)! - print(result.output) - """ - The first known use of "hello, world" was in a 1974 textbook about the C programming language. - """ - - We configure the agent to use - [Anthropic's Claude Sonnet 4.0](api/models/anthropic/)model, but you can also set the model when running the agent. - Register static - [instructions](agents/#instructions)using a keyword argument to the agent. [Run the agent](agents/#running-agents)synchronously, starting a conversation with the LLM. - from pydantic_ai import Agent - agent = Agent( # (1)! - 'anthropic:claude-sonnet-4-0', - instructions='Be concise, reply with one sentence.', # (2)! - ) - result = agent.run_sync('Where does "hello world" come from?') # (3)! - print(result.output) - """ - The first known use of "hello, world" was in a 1974 textbook about the C programming language. - """ - - We configure the agent to use - [Anthropic's Claude Sonnet 4.0](api/models/anthropic/)model, but you can also set the model when running the agent. - Register static - [instructions](agents/#instructions)using a keyword argument to the agent. [Run the agent](agents/#running-agents)synchronously, starting a conversation with the LLM. - (This example is complete, it can be run "as is", assuming you've [installed the pydantic_ai package](install/)) - The exchange will be very short: Pydantic AI will send the instructions and the user prompt to the LLM, and the model will return a text response. - Not very interesting yet, but we can easily add [tools](tools/), [dynamic instructions](agents/#instructions), and [structured outputs](output/) to build more powerful agents. - Tools & Dependency Injection Example - Here is a concise example using Pydantic AI to build a support agent for a bank: - [Learn about Gateway](gateway)bank_support.py - from dataclasses import dataclass - from pydantic import BaseModel, Field - from pydantic_ai import Agent, RunContext - from bank_database import DatabaseConn - @dataclass - class SupportDependencies: # (3)! - customer_id: int - db: DatabaseConn # (12)! - class SupportOutput(BaseModel): # (13)! - support_advice: str = Field(description='Advice returned to the customer') - block_card: bool = Field(description="Whether to block the customer's card") - risk: int = Field(description='Risk level of query', ge=0, le=10) - support_agent = Agent( # (1)! - 'gateway/openai:gpt-5', # (2)! - deps_type=SupportDependencies, - output_type=SupportOutput, # (9)! - instructions=( # (4)! - 'You are a support agent in our bank, give the ' - 'customer support and judge the risk level of their query.' - ), - ) - @support_agent.instructions # (5)! - async def add_customer_name(ctx: RunContext[SupportDependencies]) -> str: - customer_name = await ctx.deps.db.customer_name(id=ctx.deps.customer_id) - return f"The customer's name is {customer_name!r}" - @support_agent.tool # (6)! - async def customer_balance( - ctx: RunContext[SupportDependencies], include_pending: bool - ) -> float: - """Returns the customer's current account balance.""" # (7)! 
- return await ctx.deps.db.customer_balance( - id=ctx.deps.customer_id, - include_pending=include_pending, - ) - ... # (11)! - async def main(): - deps = SupportDependencies(customer_id=123, db=DatabaseConn()) - result = await support_agent.run('What is my balance?', deps=deps) # (8)! - print(result.output) # (10)! - """ - support_advice='Hello John, your current account balance, including pending transactions, is $123.45.' block_card=False risk=1 - """ - result = await support_agent.run('I just lost my card!', deps=deps) - print(result.output) - """ - support_advice="I'm sorry to hear that, John. We are temporarily blocking your card to prevent unauthorized transactions." block_card=True risk=8 - """ - - This - [agent](agents/)will act as first-tier support in a bank. Agents are generic in the type of dependencies they accept and the type of output they return. In this case, the support agent has typeAgent[SupportDependencies, SupportOutput] - . - Here we configure the agent to use - [OpenAI's GPT-5 model](api/models/openai/), you can also set the model when running the agent. - The - SupportDependencies - dataclass is used to pass data, connections, and logic into the model that will be needed when running[instructions](agents/#instructions)and[tool](tools/)functions. Pydantic AI's system of dependency injection provides a[type-safe](agents/#static-type-checking)way to customise the behavior of your agents, and can be especially useful when running[unit tests](testing/)and evals. - Static - [instructions](agents/#instructions)can be registered with theto the agent.instructions - keyword argument - Dynamic - [instructions](agents/#instructions)can be registered with thedecorator, and can make use of dependency injection. Dependencies are carried via the@agent.instructions - argument, which is parameterized with theRunContext - deps_type - from above. If the type annotation here is wrong, static type checkers will catch it. - The - decorator let you register functions which the LLM may call while responding to a user. Again, dependencies are carried via@agent.tool - , any other arguments become the tool schema passed to the LLM. Pydantic is used to validate these arguments, and errors are passed back to the LLM so it can retry.RunContext - - The docstring of a tool is also passed to the LLM as the description of the tool. Parameter descriptions are - [extracted](tools/#function-tools-and-schema)from the docstring and added to the parameter schema sent to the LLM. [Run the agent](agents/#running-agents)asynchronously, conducting a conversation with the LLM until a final response is reached. Even in this fairly simple case, the agent will exchange multiple messages with the LLM as tools are called to retrieve an output.- The response from the agent will be guaranteed to be a - SupportOutput - . If validation fails[reflection](agents/#reflection-and-self-correction), the agent is prompted to try again. - The output will be validated with Pydantic to guarantee it is a - SupportOutput - , since the agent is generic, it'll also be typed as aSupportOutput - to aid with static type checking. - In a real use case, you'd add more tools and longer instructions to the agent to extend the context it's equipped with and support it can provide. - - This is a simple sketch of a database connection, used to keep the example short and readable. In reality, you'd be connecting to an external database (e.g. PostgreSQL) to get information about customers. 
- - This - [Pydantic](https://docs.pydantic.dev)model is used to constrain the structured data returned by the agent. From this simple definition, Pydantic builds the JSON Schema that tells the LLM how to return the data, and performs validation to guarantee the data is correct at the end of the run. - from dataclasses import dataclass - from pydantic import BaseModel, Field - from pydantic_ai import Agent, RunContext - from bank_database import DatabaseConn - @dataclass - class SupportDependencies: # (3)! - customer_id: int - db: DatabaseConn # (12)! - class SupportOutput(BaseModel): # (13)! - support_advice: str = Field(description='Advice returned to the customer') - block_card: bool = Field(description="Whether to block the customer's card") - risk: int = Field(description='Risk level of query', ge=0, le=10) - support_agent = Agent( # (1)! - 'openai:gpt-5', # (2)! - deps_type=SupportDependencies, - output_type=SupportOutput, # (9)! - instructions=( # (4)! - 'You are a support agent in our bank, give the ' - 'customer support and judge the risk level of their query.' - ), - ) - @support_agent.instructions # (5)! - async def add_customer_name(ctx: RunContext[SupportDependencies]) -> str: - customer_name = await ctx.deps.db.customer_name(id=ctx.deps.customer_id) - return f"The customer's name is {customer_name!r}" - @support_agent.tool # (6)! - async def customer_balance( - ctx: RunContext[SupportDependencies], include_pending: bool - ) -> float: - """Returns the customer's current account balance.""" # (7)! - return await ctx.deps.db.customer_balance( - id=ctx.deps.customer_id, - include_pending=include_pending, - ) - ... # (11)! - async def main(): - deps = SupportDependencies(customer_id=123, db=DatabaseConn()) - result = await support_agent.run('What is my balance?', deps=deps) # (8)! - print(result.output) # (10)! - """ - support_advice='Hello John, your current account balance, including pending transactions, is $123.45.' block_card=False risk=1 - """ - result = await support_agent.run('I just lost my card!', deps=deps) - print(result.output) - """ - support_advice="I'm sorry to hear that, John. We are temporarily blocking your card to prevent unauthorized transactions." block_card=True risk=8 - """ - - This - [agent](agents/)will act as first-tier support in a bank. Agents are generic in the type of dependencies they accept and the type of output they return. In this case, the support agent has typeAgent[SupportDependencies, SupportOutput] - . - Here we configure the agent to use - [OpenAI's GPT-5 model](api/models/openai/), you can also set the model when running the agent. - The - SupportDependencies - dataclass is used to pass data, connections, and logic into the model that will be needed when running[instructions](agents/#instructions)and[tool](tools/)functions. Pydantic AI's system of dependency injection provides a[type-safe](agents/#static-type-checking)way to customise the behavior of your agents, and can be especially useful when running[unit tests](testing/)and evals. - Static - [instructions](agents/#instructions)can be registered with theto the agent.instructions - keyword argument - Dynamic - [instructions](agents/#instructions)can be registered with thedecorator, and can make use of dependency injection. Dependencies are carried via the@agent.instructions - argument, which is parameterized with theRunContext - deps_type - from above. If the type annotation here is wrong, static type checkers will catch it. 
- The - decorator let you register functions which the LLM may call while responding to a user. Again, dependencies are carried via@agent.tool - , any other arguments become the tool schema passed to the LLM. Pydantic is used to validate these arguments, and errors are passed back to the LLM so it can retry.RunContext - - The docstring of a tool is also passed to the LLM as the description of the tool. Parameter descriptions are - [extracted](tools/#function-tools-and-schema)from the docstring and added to the parameter schema sent to the LLM. [Run the agent](agents/#running-agents)asynchronously, conducting a conversation with the LLM until a final response is reached. Even in this fairly simple case, the agent will exchange multiple messages with the LLM as tools are called to retrieve an output.- The response from the agent will be guaranteed to be a - SupportOutput - . If validation fails[reflection](agents/#reflection-and-self-correction), the agent is prompted to try again. - The output will be validated with Pydantic to guarantee it is a - SupportOutput - , since the agent is generic, it'll also be typed as aSupportOutput - to aid with static type checking. - In a real use case, you'd add more tools and longer instructions to the agent to extend the context it's equipped with and support it can provide. - - This is a simple sketch of a database connection, used to keep the example short and readable. In reality, you'd be connecting to an external database (e.g. PostgreSQL) to get information about customers. - - This - [Pydantic](https://docs.pydantic.dev)model is used to constrain the structured data returned by the agent. From this simple definition, Pydantic builds the JSON Schema that tells the LLM how to return the data, and performs validation to guarantee the data is correct at the end of the run. - Complete bank_support.py - example - The code included here is incomplete for the sake of brevity (the definition of DatabaseConn - is missing); you can find the complete bank_support.py - example [here](examples/bank-support/). - Instrumentation with Pydantic Logfire - Even a simple agent with just a handful of tools can result in a lot of back-and-forth with the LLM, making it nearly impossible to be confident of what's going on just from reading the code. To understand the flow of the above runs, we can watch the agent in action using Pydantic Logfire. - To do this, we need to [set up Logfire](logfire/#using-logfire), and add the following to our code: - [Learn about Gateway](gateway)bank_support_with_logfire.py - ... - from pydantic_ai import Agent, RunContext - from bank_database import DatabaseConn - import logfire - logfire.configure() # (1)! - logfire.instrument_pydantic_ai() # (2)! - logfire.instrument_asyncpg() # (3)! - ... - support_agent = Agent( - 'gateway/openai:gpt-5', - deps_type=SupportDependencies, - output_type=SupportOutput, - system_prompt=( - 'You are a support agent in our bank, give the ' - 'customer support and judge the risk level of their query.' - ), - ) - - Configure the Logfire SDK, this will fail if project is not set up. - - This will instrument all Pydantic AI agents used from here on out. If you want to instrument only a specific agent, you can pass the - to the agent.instrument=True - keyword argument - In our demo, - DatabaseConn - usesto connect to a PostgreSQL database, soasyncpg - is used to log the database queries.logfire.instrument_asyncpg() - ... 
- from pydantic_ai import Agent, RunContext - from bank_database import DatabaseConn - import logfire - logfire.configure() # (1)! - logfire.instrument_pydantic_ai() # (2)! - logfire.instrument_asyncpg() # (3)! - ... - support_agent = Agent( - 'openai:gpt-5', - deps_type=SupportDependencies, - output_type=SupportOutput, - system_prompt=( - 'You are a support agent in our bank, give the ' - 'customer support and judge the risk level of their query.' - ), - ) - - Configure the Logfire SDK, this will fail if project is not set up. - - This will instrument all Pydantic AI agents used from here on out. If you want to instrument only a specific agent, you can pass the - to the agent.instrument=True - keyword argument - In our demo, - DatabaseConn - usesto connect to a PostgreSQL database, soasyncpg - is used to log the database queries.logfire.instrument_asyncpg() - That's enough to get the following view of your agent in action: - See [Monitoring and Performance](logfire/) to learn more. - llms.txt - The Pydantic AI documentation is available in the [llms.txt](https://llmstxt.org/) format. - This format is defined in Markdown and suited for LLMs and AI coding assistants and agents. - Two formats are available: - : a file containing a brief description of the project, along with links to the different sections of the documentation. The structure of this file is described in detailsllms.txt - [here](https://llmstxt.org/#format).: Similar to thellms-full.txt - llms.txt - file, but every link content is included. Note that this file may be too large for some LLMs. - As of today, these files are not automatically leveraged by IDEs or coding agents, but they will use it if you provide a link or the full text. - Next Steps - To try Pydantic AI for yourself, [install it](install/) and follow the instructions [in the examples](examples/setup/). - Read the [docs](agents/) to learn more about building applications with Pydantic AI. - Read the [API Reference](api/agent/) to understand Pydantic AI's interface. - Join [ Slack](https://logfire.pydantic.dev/docs/join-slack/) or file an issue on [ GitHub](https://github.com/pydantic/pydantic-ai/issues) if you have any questions. + data: "Pydantic AI\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n \n\n\n\n\n\n[Skip to content](#pydantic-ai)\n\n**[Pydantic + AI Gateway](/gateway) is now available! \U0001F680\nEnterprise-ready AI model routing: One key for all your + models with real-time monitoring and budget control that works.**\n\n[![logo](img/logo-white.svg)](. \"Pydantic + AI\")\n\n\n\n\nPydantic AI\n\nPydantic AI\n\n\n\n\n\n\n\nType to start searching\n\n[pydantic/pydantic-ai](https://github.com/pydantic/pydantic-ai + \"Go to repository\")\n\n[![logo](img/logo-white.svg)](. 
\"Pydantic AI\")\nPydantic AI\n\n[pydantic/pydantic-ai](https://github.com/pydantic/pydantic-ai + \"Go to repository\")\n\n* Pydantic AI\n\n [Pydantic AI](.)\n\n\n\n Table of contents\n + [Why use Pydantic + AI](#why-use-pydantic-ai)\n + [Hello World Example](#hello-world-example)\n + [Tools & Dependency Injection + Example](#tools-dependency-injection-example)\n + [Instrumentation with Pydantic Logfire](#instrumentation-with-pydantic-logfire)\n + \ + [llms.txt](#llmstxt)\n + [Next Steps](#next-steps)\n* [Installation](install/)\n* [Getting Help](help/)\n* + [Troubleshooting](troubleshooting/)\n* [Pydantic AI Gateway](gateway/)\n* Documentation\n\n\n\n\n Documentation\n + \ + Core Concepts\n\n\n\n\n Core Concepts\n - [Agents](agents/)\n - [Dependencies](dependencies/)\n + \ - [Function Tools](tools/)\n - [Output](output/)\n - [Messages and chat history](message-history/)\n + \ - [Direct Model Requests](direct/)\n + Models & Providers\n\n\n\n\n Models & Providers\n - [Overview](models/overview/)\n + \ - [OpenAI](models/openai/)\n - [Anthropic](models/anthropic/)\n - [Google](models/google/)\n - + [Bedrock](models/bedrock/)\n - [Cohere](models/cohere/)\n - [Groq](models/groq/)\n - [Hugging Face](models/huggingface/)\n + \ - [Mistral](models/mistral/)\n - [OpenRouter](models/openrouter/)\n - [Outlines](models/outlines/)\n + \ + Tools & Toolsets\n\n\n\n\n Tools & Toolsets\n - [Function Tools](tools/)\n - [Advanced Tool + Features](tools-advanced/)\n - [Toolsets](toolsets/)\n - [Deferred Tools](deferred-tools/)\n - + [Built-in Tools](builtin-tools/)\n - [Common Tools](common-tools/)\n - [Third-Party Tools](third-party-tools/)\n + \ + Advanced Features\n\n\n\n\n Advanced Features\n - [Image, Audio, Video & Document Input](input/)\n + \ - [Thinking](thinking/)\n - [HTTP Request Retries](retries/)\n + MCP\n\n\n\n\n MCP\n - [Overview](mcp/overview/)\n + \ - [Client](mcp/client/)\n - [FastMCP Client](mcp/fastmcp-client/)\n - [Server](mcp/server/)\n + \ + [Multi-Agent Patterns](multi-agent-applications/)\n + [Testing](testing/)\n* Pydantic Evals\n\n\n\n\n + \ Pydantic Evals\n + [Overview](evals/)\n + Getting Started\n\n\n\n\n Getting Started\n - [Quick + Start](evals/quick-start/)\n - [Core Concepts](evals/core-concepts/)\n + Evaluators\n\n\n\n\n Evaluators\n + \ - [Overview](evals/evaluators/overview/)\n - [Built-in Evaluators](evals/evaluators/built-in/)\n + \ - [LLM Judge](evals/evaluators/llm-judge/)\n - [Custom Evaluators](evals/evaluators/custom/)\n - + [Span-Based](evals/evaluators/span-based/)\n + How-To Guides\n\n\n\n\n How-To Guides\n - [Logfire + Integration](evals/how-to/logfire-integration/)\n - [Dataset Management](evals/how-to/dataset-management/)\n + \ - [Dataset Serialization](evals/how-to/dataset-serialization/)\n - [Concurrency & Performance](evals/how-to/concurrency/)\n + \ - [Retry Strategies](evals/how-to/retry-strategies/)\n - [Metrics & Attributes](evals/how-to/metrics-attributes/)\n + \ + Examples\n\n\n\n\n Examples\n - [Simple Validation](evals/examples/simple-validation/)\n* Pydantic + Graph\n\n\n\n\n Pydantic Graph\n + [Overview](graph/)\n + [Beta API](graph/beta/)\n\n Beta API\n - + [Steps](graph/beta/steps/)\n - [Joins & Reducers](graph/beta/joins/)\n - [Decisions](graph/beta/decisions/)\n + \ - [Parallel Execution](graph/beta/parallel/)\n* Integrations\n\n\n\n\n Integrations\n + [Debugging + & Monitoring with Pydantic Logfire](logfire/)\n + Durable Execution\n\n\n\n\n Durable Execution\n - + [Overview](durable_execution/overview/)\n - 
[Temporal](durable_execution/temporal/)\n - [DBOS](durable_execution/dbos/)\n + \ - [Prefect](durable_execution/prefect/)\n + UI Event Streams\n\n\n\n\n UI Event Streams\n - [Overview](ui/overview/)\n + \ - [AG-UI](ui/ag-ui/)\n - [Vercel AI](ui/vercel-ai/)\n + [Agent2Agent (A2A)](a2a/)\n* Related Packages\n\n\n\n\n + \ Related Packages\n + [Clai](cli/)\n* Examples\n\n\n\n\n Examples\n + [Setup](examples/setup/)\n + + Getting Started\n\n\n\n\n Getting Started\n - [Pydantic Model](examples/pydantic-model/)\n - [Weather + agent](examples/weather-agent/)\n + Conversational Agents\n\n\n\n\n Conversational Agents\n - [Chat + App with FastAPI](examples/chat-app/)\n - [Bank support](examples/bank-support/)\n + Data & Analytics\n\n\n\n\n + \ Data & Analytics\n - [SQL Generation](examples/sql-gen/)\n - [Data Analyst](examples/data-analyst/)\n + \ - [RAG](examples/rag/)\n + Streaming\n\n\n\n\n Streaming\n - [Stream markdown](examples/stream-markdown/)\n + \ - [Stream whales](examples/stream-whales/)\n + Complex Workflows\n\n\n\n\n Complex Workflows\n - + [Flight booking](examples/flight-booking/)\n - [Question Graph](examples/question-graph/)\n + Business + Applications\n\n\n\n\n Business Applications\n - [Slack Lead Qualifier with Modal](examples/slack-lead-qualifier/)\n + \ + UI Examples\n\n\n\n\n UI Examples\n - [Agent User Interaction (AG-UI)](examples/ag-ui/)\n* API + Reference\n\n\n\n\n API Reference\n + pydantic\\_ai\n\n\n\n\n pydantic\\_ai\n - [pydantic\\_ai.agent](api/agent/)\n + \ - [pydantic\\_ai.tools](api/tools/)\n - [pydantic\\_ai.toolsets](api/toolsets/)\n - [pydantic\\_ai.builtin\\_tools](api/builtin_tools/)\n + \ - [pydantic\\_ai.common\\_tools](api/common_tools/)\n - [pydantic\\_ai.durable\\_exec](api/durable_exec/)\n + \ - [pydantic\\_ai.output](api/output/)\n - [pydantic\\_ai.result](api/result/)\n - [pydantic\\_ai.messages](api/messages/)\n + \ - [pydantic\\_ai.exceptions](api/exceptions/)\n - [pydantic\\_ai.settings](api/settings/)\n - + [pydantic\\_ai.usage](api/usage/)\n - [pydantic\\_ai.mcp](api/mcp/)\n - [pydantic\\_ai.format\\_prompt](api/format_prompt/)\n + \ - [pydantic\\_ai.direct](api/direct/)\n - [pydantic\\_ai.ext](api/ext/)\n - [pydantic\\_ai.models.anthropic](api/models/anthropic/)\n + \ - [pydantic\\_ai.models](api/models/base/)\n - [pydantic\\_ai.models.bedrock](api/models/bedrock/)\n + \ - [pydantic\\_ai.models.cohere](api/models/cohere/)\n - [pydantic\\_ai.models.fallback](api/models/fallback/)\n + \ - [pydantic\\_ai.models.function](api/models/function/)\n - [pydantic\\_ai.models.google](api/models/google/)\n + \ - [pydantic\\_ai.models.groq](api/models/groq/)\n - [pydantic\\_ai.models.huggingface](api/models/huggingface/)\n + \ - [pydantic\\_ai.models.instrumented](api/models/instrumented/)\n - [pydantic\\_ai.models.mcp\\_sampling](api/models/mcp-sampling/)\n + \ - [pydantic\\_ai.models.mistral](api/models/mistral/)\n - [pydantic\\_ai.models.openai](api/models/openai/)\n + \ - [pydantic\\_ai.models.openrouter](api/models/openrouter/)\n - [pydantic\\_ai.models.outlines](api/models/outlines/)\n + \ - [pydantic\\_ai.models.test](api/models/test/)\n - [pydantic\\_ai.models.wrapper](api/models/wrapper/)\n + \ - [pydantic\\_ai.profiles](api/profiles/)\n - [pydantic\\_ai.providers](api/providers/)\n - [pydantic\\_ai.retries](api/retries/)\n + \ - [pydantic\\_ai.run](api/run/)\n - [pydantic\\_ai.ag\\_ui](api/ag_ui/)\n - [pydantic\\_ai.ui](api/ui/base/)\n + \ - [pydantic\\_ai.ui.ag\\_ui](api/ui/ag_ui/)\n - [pydantic\\_ai.ui.vercel\\_ai](api/ui/vercel_ai/)\n + \ + 
pydantic\\_evals\n\n\n\n\n pydantic\\_evals\n - [pydantic\\_evals.dataset](api/pydantic_evals/dataset/)\n + \ - [pydantic\\_evals.evaluators](api/pydantic_evals/evaluators/)\n - [pydantic\\_evals.reporting](api/pydantic_evals/reporting/)\n + \ - [pydantic\\_evals.otel](api/pydantic_evals/otel/)\n - [pydantic\\_evals.generation](api/pydantic_evals/generation/)\n + \ + pydantic\\_graph\n\n\n\n\n pydantic\\_graph\n - [pydantic\\_graph](api/pydantic_graph/graph/)\n + \ - [pydantic\\_graph.nodes](api/pydantic_graph/nodes/)\n - [pydantic\\_graph.persistence](api/pydantic_graph/persistence/)\n + \ - [pydantic\\_graph.mermaid](api/pydantic_graph/mermaid/)\n - [pydantic\\_graph.exceptions](api/pydantic_graph/exceptions/)\n + \ - Beta API\n\n\n\n\n Beta API\n * [pydantic\\_graph.beta](api/pydantic_graph/beta/)\n * + [pydantic\\_graph.beta.graph](api/pydantic_graph/beta_graph/)\n * [pydantic\\_graph.beta.graph\\_builder](api/pydantic_graph/beta_graph_builder/)\n + \ * [pydantic\\_graph.beta.step](api/pydantic_graph/beta_step/)\n * [pydantic\\_graph.beta.join](api/pydantic_graph/beta_join/)\n + \ * [pydantic\\_graph.beta.decision](api/pydantic_graph/beta_decision/)\n * [pydantic\\_graph.beta.node](api/pydantic_graph/beta_node/)\n + \ + fasta2a\n\n\n\n\n fasta2a\n - [fasta2a](api/fasta2a/)\n* Project\n\n\n\n\n Project\n + [Contributing](contributing/)\n + \ + [Upgrade Guide](changelog/)\n + [Version policy](version-policy/)\n\nTable of contents\n\n* [Why use + Pydantic AI](#why-use-pydantic-ai)\n* [Hello World Example](#hello-world-example)\n* [Tools & Dependency + Injection Example](#tools-dependency-injection-example)\n* [Instrumentation with Pydantic Logfire](#instrumentation-with-pydantic-logfire)\n* + [llms.txt](#llmstxt)\n* [Next Steps](#next-steps)\n\n# Pydantic AI\n\n![Pydantic AI](./img/pydantic-ai-dark.svg#only-dark)\n\n![Pydantic + AI](./img/pydantic-ai-light.svg#only-light)\n\n*GenAI Agent Framework, the Pydantic way*\n\n[![CI](https://github.com/pydantic/pydantic-ai/actions/workflows/ci.yml/badge.svg?event=push)](https://github.com/pydantic/pydantic-ai/actions/workflows/ci.yml?query=branch%3Amain)\n[![Coverage](https://coverage-badge.samuelcolvin.workers.dev/pydantic/pydantic-ai.svg)](https://coverage-badge.samuelcolvin.workers.dev/redirect/pydantic/pydantic-ai)\n[![PyPI](https://img.shields.io/pypi/v/pydantic-ai.svg)](https://pypi.python.org/pypi/pydantic-ai)\n[![versions](https://img.shields.io/pypi/pyversions/pydantic-ai.svg)](https://github.com/pydantic/pydantic-ai)\n[![license](https://img.shields.io/github/license/pydantic/pydantic-ai.svg)](https://github.com/pydantic/pydantic-ai/blob/main/LICENSE)\n[![Join + Slack](https://img.shields.io/badge/Slack-Join%20Slack-4A154B?logo=slack)](https://logfire.pydantic.dev/docs/join-slack/)\n\nPydantic + AI is a Python agent framework designed to help you\nquickly, confidently, and painlessly build production + grade applications and workflows with Generative AI.\n\nFastAPI revolutionized web development by offering + an innovative and ergonomic design, built on the foundation of [Pydantic Validation](https://docs.pydantic.dev) + and modern Python features like type hints.\n\nYet despite virtually every Python agent framework and LLM + library using Pydantic Validation, when we began to use LLMs in [Pydantic Logfire](https://pydantic.dev/logfire), + we couldn't find anything that gave us the same feeling.\n\nWe built Pydantic AI with one simple aim: to + bring that FastAPI feeling to GenAI app and agent development.\n\n## Why use Pydantic 
AI\n\n1. **Built by + the Pydantic Team**:\n [Pydantic Validation](https://docs.pydantic.dev/latest/) is the validation layer + of the OpenAI SDK, the Google ADK, the Anthropic SDK, LangChain, LlamaIndex, AutoGPT, Transformers, CrewAI, + Instructor and many more. *Why use the derivative when you can go straight to the source?* ![\U0001F603](https://cdn.jsdelivr.net/gh/jdecked/twemoji@15.1.0/assets/svg/1f603.svg + \":smiley:\")\n2. **Model-agnostic**:\n Supports virtually every [model](models/overview/) and provider: + OpenAI, Anthropic, Gemini, DeepSeek, Grok, Cohere, Mistral, and Perplexity; Azure AI Foundry, Amazon Bedrock, + Google Vertex AI, Ollama, LiteLLM, Groq, OpenRouter, Together AI, Fireworks AI, Cerebras, Hugging Face, + GitHub, Heroku, Vercel, Nebius, OVHcloud, and Outlines. If your favorite model or provider is not listed, + you can easily implement a [custom model](models/overview/#custom-models).\n3. **Seamless Observability**:\n + \ Tightly [integrates](logfire/) with [Pydantic Logfire](https://pydantic.dev/logfire), our general-purpose + OpenTelemetry observability platform, for real-time debugging, evals-based performance monitoring, and behavior, + tracing, and cost tracking. If you already have an observability platform that supports OTel, you can [use + that too](logfire/#alternative-observability-backends).\n4. **Fully Type-safe**:\n Designed to give your + IDE or AI coding agent as much context as possible for auto-completion and [type checking](agents/#static-type-checking), + moving entire classes of errors from runtime to write-time for a bit of that Rust \"if it compiles, it works\" + feel.\n5. **Powerful Evals**:\n Enables you to systematically test and [evaluate](evals/) the performance + and accuracy of the agentic systems you build, and monitor the performance over time in Pydantic Logfire.\n6. + **MCP, A2A, and UI**:\n Integrates the [Model Context Protocol](mcp/overview/), [Agent2Agent](a2a/), and + various [UI event stream](ui/overview/) standards to give your agent access to external tools and data, + let it interoperate with other agents, and build interactive applications with streaming event-based communication.\n7. + **Human-in-the-Loop Tool Approval**:\n Easily lets you flag that certain tool calls [require approval](deferred-tools/#human-in-the-loop-tool-approval) + before they can proceed, possibly depending on tool call arguments, conversation history, or user preferences.\n8. + **Durable Execution**:\n Enables you to build [durable agents](durable_execution/overview/) that can preserve + their progress across transient API failures and application errors or restarts, and handle long-running, + asynchronous, and human-in-the-loop workflows with production-grade reliability.\n9. **Streamed Outputs**:\n + \ Provides the ability to [stream](output/#streamed-results) structured output continuously, with immediate + validation, ensuring real time access to generated data.\n10. 
**Graph Support**:\n Provides a powerful + way to define [graphs](graph/) using type hints, for use in complex applications where standard control + flow can degrade to spaghetti code.\n\nRealistically though, no list is going to be as convincing as [giving + it a try](#next-steps) and seeing how it makes you feel!\n\n**Sign up for our newsletter, *The Pydantic + Stack*, with updates & tutorials on Pydantic AI, Logfire, and Pydantic:**\n\nSubscribe\n\n## Hello World + Example\n\nHere's a minimal example of Pydantic AI:\n\nWith Pydantic AI GatewayDirectly to Provider API\n\n[Learn + about Gateway](../gateway) hello\\_world.py\n\n```\nfrom pydantic_ai import Agent\n\nagent = Agent( # (1)!\n + \ 'gateway/anthropic:claude-sonnet-4-0',\n instructions='Be concise, reply with one sentence.', # + (2)!\n)\n\nresult = agent.run_sync('Where does \"hello world\" come from?') # (3)!\nprint(result.output)\n\"\"\"\nThe + first known use of \"hello, world\" was in a 1974 textbook about the C programming language.\n\"\"\"\n```\n\n1. + We configure the agent to use [Anthropic's Claude Sonnet 4.0](api/models/anthropic/) model, but you can + also set the model when running the agent.\n2. Register static [instructions](agents/#instructions) using + a keyword argument to the agent.\n3. [Run the agent](agents/#running-agents) synchronously, starting a conversation + with the LLM.\n\nhello\\_world.py\n\n```\nfrom pydantic_ai import Agent\n\nagent = Agent( # (1)!\n 'anthropic:claude-sonnet-4-0',\n + \ instructions='Be concise, reply with one sentence.', # (2)!\n)\n\nresult = agent.run_sync('Where does + \"hello world\" come from?') # (3)!\nprint(result.output)\n\"\"\"\nThe first known use of \"hello, world\" + was in a 1974 textbook about the C programming language.\n\"\"\"\n```\n\n1. We configure the agent to use + [Anthropic's Claude Sonnet 4.0](api/models/anthropic/) model, but you can also set the model when running + the agent.\n2. Register static [instructions](agents/#instructions) using a keyword argument to the agent.\n3. 
+ [Run the agent](agents/#running-agents) synchronously, starting a conversation with the LLM.\n\n*(This example + is complete, it can be run \"as is\", assuming you've [installed the `pydantic_ai` package](install/))*\n\nThe + exchange will be very short: Pydantic AI will send the instructions and the user prompt to the LLM, and + the model will return a text response.\n\nNot very interesting yet, but we can easily add [tools](tools/), + [dynamic instructions](agents/#instructions), and [structured outputs](output/) to build more powerful agents.\n\n## + Tools & Dependency Injection Example\n\nHere is a concise example using Pydantic AI to build a support agent + for a bank:\n\nWith Pydantic AI GatewayDirectly to Provider API\n\n[Learn about Gateway](../gateway) bank\\_support.py\n\n```\nfrom + dataclasses import dataclass\n\nfrom pydantic import BaseModel, Field\nfrom pydantic_ai import Agent, RunContext\n\nfrom + bank_database import DatabaseConn\n\n\n@dataclass\nclass SupportDependencies: # (3)!\n customer_id: + int\n db: DatabaseConn # (12)!\n\n\nclass SupportOutput(BaseModel): # (13)!\n support_advice: str + = Field(description='Advice returned to the customer')\n block_card: bool = Field(description=\"Whether + to block the customer's card\")\n risk: int = Field(description='Risk level of query', ge=0, le=10)\n\n\nsupport_agent + = Agent( # (1)!\n 'gateway/openai:gpt-5', # (2)!\n deps_type=SupportDependencies,\n output_type=SupportOutput, + \ # (9)!\n instructions=( # (4)!\n 'You are a support agent in our bank, give the '\n 'customer + support and judge the risk level of their query.'\n ),\n)\n\n\n@support_agent.instructions # (5)!\nasync + def add_customer_name(ctx: RunContext[SupportDependencies]) -> str:\n customer_name = await ctx.deps.db.customer_name(id=ctx.deps.customer_id)\n + \ return f\"The customer's name is {customer_name!r}\"\n\n\n@support_agent.tool # (6)!\nasync def customer_balance(\n + \ ctx: RunContext[SupportDependencies], include_pending: bool\n) -> float:\n \"\"\"Returns the customer's + current account balance.\"\"\" # (7)!\n return await ctx.deps.db.customer_balance(\n id=ctx.deps.customer_id,\n + \ include_pending=include_pending,\n )\n\n\n... # (11)!\n\n\nasync def main():\n deps = SupportDependencies(customer_id=123, + db=DatabaseConn())\n result = await support_agent.run('What is my balance?', deps=deps) # (8)!\n print(result.output) + \ # (10)!\n \"\"\"\n support_advice='Hello John, your current account balance, including pending transactions, + is $123.45.' block_card=False risk=1\n \"\"\"\n\n result = await support_agent.run('I just lost my + card!', deps=deps)\n print(result.output)\n \"\"\"\n support_advice=\"I'm sorry to hear that, John. + We are temporarily blocking your card to prevent unauthorized transactions.\" block_card=True risk=8\n \"\"\"\n```\n\n1. + This [agent](agents/) will act as first-tier support in a bank. Agents are generic in the type of dependencies + they accept and the type of output they return. In this case, the support agent has type `Agent[SupportDependencies, + SupportOutput]`.\n2. Here we configure the agent to use [OpenAI's GPT-5 model](api/models/openai/), you + can also set the model when running the agent.\n3. The `SupportDependencies` dataclass is used to pass data, + connections, and logic into the model that will be needed when running [instructions](agents/#instructions) + and [tool](tools/) functions. 
Pydantic AI's system of dependency injection provides a [type-safe](agents/#static-type-checking) + way to customise the behavior of your agents, and can be especially useful when running [unit tests](testing/) + and evals.\n4. Static [instructions](agents/#instructions) can be registered with the [`instructions` keyword + argument](api/agent/#pydantic_ai.agent.Agent.__init__) to the agent.\n5. Dynamic [instructions](agents/#instructions) + can be registered with the [`@agent.instructions`](api/agent/#pydantic_ai.agent.Agent.instructions) decorator, + and can make use of dependency injection. Dependencies are carried via the [`RunContext`](api/tools/#pydantic_ai.tools.RunContext) + argument, which is parameterized with the `deps_type` from above. If the type annotation here is wrong, + static type checkers will catch it.\n6. The [`@agent.tool`](tools/) decorator let you register functions + which the LLM may call while responding to a user. Again, dependencies are carried via [`RunContext`](api/tools/#pydantic_ai.tools.RunContext), + any other arguments become the tool schema passed to the LLM. Pydantic is used to validate these arguments, + and errors are passed back to the LLM so it can retry.\n7. The docstring of a tool is also passed to the + LLM as the description of the tool. Parameter descriptions are [extracted](tools/#function-tools-and-schema) + from the docstring and added to the parameter schema sent to the LLM.\n8. [Run the agent](agents/#running-agents) + asynchronously, conducting a conversation with the LLM until a final response is reached. Even in this fairly + simple case, the agent will exchange multiple messages with the LLM as tools are called to retrieve an output.\n9. + The response from the agent will be guaranteed to be a `SupportOutput`. If validation fails [reflection](agents/#reflection-and-self-correction), + the agent is prompted to try again.\n10. The output will be validated with Pydantic to guarantee it is a + `SupportOutput`, since the agent is generic, it'll also be typed as a `SupportOutput` to aid with static + type checking.\n11. In a real use case, you'd add more tools and longer instructions to the agent to extend + the context it's equipped with and support it can provide.\n12. This is a simple sketch of a database connection, + used to keep the example short and readable. In reality, you'd be connecting to an external database (e.g. + PostgreSQL) to get information about customers.\n13. This [Pydantic](https://docs.pydantic.dev) model is + used to constrain the structured data returned by the agent. 
From this simple definition, Pydantic builds + the JSON Schema that tells the LLM how to return the data, and performs validation to guarantee the data + is correct at the end of the run.\n\nbank\\_support.py\n\n```\nfrom dataclasses import dataclass\n\nfrom + pydantic import BaseModel, Field\nfrom pydantic_ai import Agent, RunContext\n\nfrom bank_database import + DatabaseConn\n\n\n@dataclass\nclass SupportDependencies: # (3)!\n customer_id: int\n db: DatabaseConn + \ # (12)!\n\n\nclass SupportOutput(BaseModel): # (13)!\n support_advice: str = Field(description='Advice + returned to the customer')\n block_card: bool = Field(description=\"Whether to block the customer's card\")\n + \ risk: int = Field(description='Risk level of query', ge=0, le=10)\n\n\nsupport_agent = Agent( # (1)!\n + \ 'openai:gpt-5', # (2)!\n deps_type=SupportDependencies,\n output_type=SupportOutput, # (9)!\n + \ instructions=( # (4)!\n 'You are a support agent in our bank, give the '\n 'customer + support and judge the risk level of their query.'\n ),\n)\n\n\n@support_agent.instructions # (5)!\nasync + def add_customer_name(ctx: RunContext[SupportDependencies]) -> str:\n customer_name = await ctx.deps.db.customer_name(id=ctx.deps.customer_id)\n + \ return f\"The customer's name is {customer_name!r}\"\n\n\n@support_agent.tool # (6)!\nasync def customer_balance(\n + \ ctx: RunContext[SupportDependencies], include_pending: bool\n) -> float:\n \"\"\"Returns the customer's + current account balance.\"\"\" # (7)!\n return await ctx.deps.db.customer_balance(\n id=ctx.deps.customer_id,\n + \ include_pending=include_pending,\n )\n\n\n... # (11)!\n\n\nasync def main():\n deps = SupportDependencies(customer_id=123, + db=DatabaseConn())\n result = await support_agent.run('What is my balance?', deps=deps) # (8)!\n print(result.output) + \ # (10)!\n \"\"\"\n support_advice='Hello John, your current account balance, including pending transactions, + is $123.45.' block_card=False risk=1\n \"\"\"\n\n result = await support_agent.run('I just lost my + card!', deps=deps)\n print(result.output)\n \"\"\"\n support_advice=\"I'm sorry to hear that, John. + We are temporarily blocking your card to prevent unauthorized transactions.\" block_card=True risk=8\n \"\"\"\n```\n\n1. + This [agent](agents/) will act as first-tier support in a bank. Agents are generic in the type of dependencies + they accept and the type of output they return. In this case, the support agent has type `Agent[SupportDependencies, + SupportOutput]`.\n2. Here we configure the agent to use [OpenAI's GPT-5 model](api/models/openai/), you + can also set the model when running the agent.\n3. The `SupportDependencies` dataclass is used to pass data, + connections, and logic into the model that will be needed when running [instructions](agents/#instructions) + and [tool](tools/) functions. Pydantic AI's system of dependency injection provides a [type-safe](agents/#static-type-checking) + way to customise the behavior of your agents, and can be especially useful when running [unit tests](testing/) + and evals.\n4. Static [instructions](agents/#instructions) can be registered with the [`instructions` keyword + argument](api/agent/#pydantic_ai.agent.Agent.__init__) to the agent.\n5. Dynamic [instructions](agents/#instructions) + can be registered with the [`@agent.instructions`](api/agent/#pydantic_ai.agent.Agent.instructions) decorator, + and can make use of dependency injection. 
Dependencies are carried via the [`RunContext`](api/tools/#pydantic_ai.tools.RunContext) + argument, which is parameterized with the `deps_type` from above. If the type annotation here is wrong, + static type checkers will catch it.\n6. The [`@agent.tool`](tools/) decorator let you register functions + which the LLM may call while responding to a user. Again, dependencies are carried via [`RunContext`](api/tools/#pydantic_ai.tools.RunContext), + any other arguments become the tool schema passed to the LLM. Pydantic is used to validate these arguments, + and errors are passed back to the LLM so it can retry.\n7. The docstring of a tool is also passed to the + LLM as the description of the tool. Parameter descriptions are [extracted](tools/#function-tools-and-schema) + from the docstring and added to the parameter schema sent to the LLM.\n8. [Run the agent](agents/#running-agents) + asynchronously, conducting a conversation with the LLM until a final response is reached. Even in this fairly + simple case, the agent will exchange multiple messages with the LLM as tools are called to retrieve an output.\n9. + The response from the agent will be guaranteed to be a `SupportOutput`. If validation fails [reflection](agents/#reflection-and-self-correction), + the agent is prompted to try again.\n10. The output will be validated with Pydantic to guarantee it is a + `SupportOutput`, since the agent is generic, it'll also be typed as a `SupportOutput` to aid with static + type checking.\n11. In a real use case, you'd add more tools and longer instructions to the agent to extend + the context it's equipped with and support it can provide.\n12. This is a simple sketch of a database connection, + used to keep the example short and readable. In reality, you'd be connecting to an external database (e.g. + PostgreSQL) to get information about customers.\n13. This [Pydantic](https://docs.pydantic.dev) model is + used to constrain the structured data returned by the agent. From this simple definition, Pydantic builds + the JSON Schema that tells the LLM how to return the data, and performs validation to guarantee the data + is correct at the end of the run.\n\nComplete `bank_support.py` example\n\nThe code included here is incomplete + for the sake of brevity (the definition of `DatabaseConn` is missing); you can find the complete `bank_support.py` + example [here](examples/bank-support/).\n\n## Instrumentation with Pydantic Logfire\n\nEven a simple agent + with just a handful of tools can result in a lot of back-and-forth with the LLM, making it nearly impossible + to be confident of what's going on just from reading the code.\nTo understand the flow of the above runs, + we can watch the agent in action using Pydantic Logfire.\n\nTo do this, we need to [set up Logfire](logfire/#using-logfire), + and add the following to our code:\n\nWith Pydantic AI GatewayDirectly to Provider API\n\n[Learn about Gateway](../gateway) + bank\\_support\\_with\\_logfire.py\n\n```\n...\nfrom pydantic_ai import Agent, RunContext\n\nfrom bank_database + import DatabaseConn\n\nimport logfire\n\nlogfire.configure() # (1)!\nlogfire.instrument_pydantic_ai() # + (2)!\nlogfire.instrument_asyncpg() # (3)!\n\n...\n\nsupport_agent = Agent(\n 'gateway/openai:gpt-5',\n + \ deps_type=SupportDependencies,\n output_type=SupportOutput,\n system_prompt=(\n 'You are + a support agent in our bank, give the '\n 'customer support and judge the risk level of their query.'\n + \ ),\n)\n```\n\n1. 
Configure the Logfire SDK, this will fail if project is not set up.\n2. This will instrument + all Pydantic AI agents used from here on out. If you want to instrument only a specific agent, you can pass + the [`instrument=True` keyword argument](api/agent/#pydantic_ai.agent.Agent.__init__) to the agent.\n3. + In our demo, `DatabaseConn` uses `asyncpg` to connect to a PostgreSQL database, so [`logfire.instrument_asyncpg()`](https://magicstack.github.io/asyncpg/current/) + is used to log the database queries.\n\nbank\\_support\\_with\\_logfire.py\n\n```\n...\nfrom pydantic_ai + import Agent, RunContext\n\nfrom bank_database import DatabaseConn\n\nimport logfire\n\nlogfire.configure() + \ # (1)!\nlogfire.instrument_pydantic_ai() # (2)!\nlogfire.instrument_asyncpg() # (3)!\n\n...\n\nsupport_agent + = Agent(\n 'openai:gpt-5',\n deps_type=SupportDependencies,\n output_type=SupportOutput,\n system_prompt=(\n + \ 'You are a support agent in our bank, give the '\n 'customer support and judge the risk level + of their query.'\n ),\n)\n```\n\n1. Configure the Logfire SDK, this will fail if project is not set up.\n2. + This will instrument all Pydantic AI agents used from here on out. If you want to instrument only a specific + agent, you can pass the [`instrument=True` keyword argument](api/agent/#pydantic_ai.agent.Agent.__init__) + to the agent.\n3. In our demo, `DatabaseConn` uses `asyncpg` to connect to a PostgreSQL database, so [`logfire.instrument_asyncpg()`](https://magicstack.github.io/asyncpg/current/) + is used to log the database queries.\n\nThat's enough to get the following view of your agent in action:\n\nSee + [Monitoring and Performance](logfire/) to learn more.\n\n## `llms.txt`\n\nThe Pydantic AI documentation + is available in the [llms.txt](https://llmstxt.org/) format.\nThis format is defined in Markdown and suited + for LLMs and AI coding assistants and agents.\n\nTwo formats are available:\n\n* [`llms.txt`](https://ai.pydantic.dev/llms.txt): + a file containing a brief description\n of the project, along with links to the different sections of the + documentation. The structure\n of this file is described in details [here](https://llmstxt.org/#format).\n* + [`llms-full.txt`](https://ai.pydantic.dev/llms-full.txt): Similar to the `llms.txt` file,\n but every link + content is included. Note that this file may be too large for some LLMs.\n\nAs of today, these files are + not automatically leveraged by IDEs or coding agents, but they will use it if you provide a link or the + full text.\n\n## Next Steps\n\nTo try Pydantic AI for yourself, [install it](install/) and follow the instructions + [in the examples](examples/setup/).\n\nRead the [docs](agents/) to learn more about building applications + with Pydantic AI.\n\nRead the [API Reference](api/agent/) to understand Pydantic AI's interface.\n\nJoin + \ [Slack](https://logfire.pydantic.dev/docs/join-slack/) or file an issue on [GitHub](https://github.com/pydantic/pydantic-ai/issues) + if you have any questions.\n\n\n\n© Pydantic Services Inc. 
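The recorded page notes that the `bank_support.py` listing omits the definition of `DatabaseConn`. A minimal in-memory stand-in is sketched below; it is hypothetical and only implements the two methods the example actually calls, where a real implementation would query an external database such as PostgreSQL:

```
from dataclasses import dataclass


@dataclass
class _Customer:
    name: str
    balance: float


class DatabaseConn:
    """Hypothetical in-memory stub with one hard-coded customer, for local experimentation."""

    _customers = {123: _Customer(name='John', balance=123.45)}

    async def customer_name(self, *, id: int) -> str:
        return self._customers[id].name

    async def customer_balance(self, *, id: int, include_pending: bool) -> float:
        # The stub ignores include_pending; a real implementation would include
        # or exclude pending transactions based on this flag.
        return self._customers[id].balance
```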
2024 to present" media_type: text/plain type: text title: Pydantic AI type: document - retrieved_at: '2025-11-14T23:34:21.151000+00:00' + retrieved_at: '2025-12-08T15:05:59.571000+00:00' type: web_fetch_result url: https://ai.pydantic.dev - tool_use_id: srvtoolu_01So85wNUocinTvFfgKCfQeb + tool_use_id: srvtoolu_01MSZmtbzt6NmQizTETf3GPF type: web_fetch_tool_result - text: Pydantic AI is a Python agent framework designed to help you quickly, confidently, and painlessly build production grade applications and workflows with Generative AI. @@ -738,37 +722,49 @@ interactions: connection: - keep-alive content-length: - - '3150' + - '4730' content-type: - application/json retry-after: - - '36' + - '47' strict-transport-security: - max-age=31536000; includeSubDomains; preload transfer-encoding: - chunked parsed_body: content: - - signature: ErIHCkYICRgCKkDZrwipmaxoEat4WffzPSjVzIuSQWM2sHE6FLC2wt5S2qiJN2MQh//EImuLE9I2ssZjTMxGXZV+esnf5ipnzbvnEgxfcXs2ax8vnLdroxMaDCpqvdPKpCP3Qi0txCIw55NdOjY30P3/yRL9RF8sPGioyitlzkhSpf+PuC3YXwz4N0hoy8zVY1MHecwc60vcKpkGxtZsfqmAuJwjeGRr/Ugxcxd69+0X/Y9pojMiklNHq9otW+ehDX0rR0EzfdN/2jNOs3bOrzfy9jmvYE5FU2c5e0JpMP3LH0LrFvZYkSh7RkbhYuHvrOqohlE3BhpflrszowmiozUk+aG4wSqx5Dtxo9W7jfeU4wduy6OyEFdIqdYdTMR8VVf9Qnd5bLX4rY09xcGQc4JcX2mFjdSR2WgEJM7p5lytlN5unH3selWBVPbCj7ogU8DbT9zhY3zkDW1dMt2vNbWNaY4gVrLwi42qBJvjC5eJTADckvXAt+MCT9AAe1kmH9NlsgBnRy13O4lhXv9SPNDfk2tU5Tdco4h/I/fXh+WuPe6/MKk+tJuoBQTGVQ5ryFmomsNiwhwtLbQ44fLVHhyqEKSEdo/107xvbzhjmY/MAzn1Pmc9rd+OhFsjUCvgqI8cWNc/E694eJqg3J2S+I6YRzG3d2tR7laUivf+J38c2XmwSyXfdRoJpyZ9TixubpPk04WSchdFlEkxPBGEWLDkWOVL1PG5ztY48di7EzM1tvAwiT1BOxl4WRZ78Ewc+C5BVHwT658rIrcKJXXI/zBMsoReQT9xsRhpozbb576wNXggJdZsd2ysQY0O6Pihz54emwigm+zPbO5n8HvlrGKf6dSsrwusUJ1BIY4wI6qjz7gweRryReDEvEzMT8Ul4mIrigRy4yL2w+03qAclz8oGwxinMvcu8vJzXg+uRm/WbOgyco4gTPQiN4NcXbzwhVtJlNWZYXCiiMb/i6IXuOzZmSjI7LqxLubD9RgOy/2890RLvVJQBBVnOowW8q+iE93CoVBr1l5D54opLS9fHYcM7ezV0Ul34qMu6K0uoBG0+aLVlZHKEecN2/VE4fh0zYEDaeqRZfNH2gnAGmokdmPtEHlp33pvJ0IFDAbxKq2CVFFdB+lCGlaLQuZ5v6Mhq4b6H8DjaGZqo/vcB/MK4pr/F1SRjLzSHyh7Ey4ogBYSOXWfaeXQiZZFoEfxIUG9PzofIA1CCFk+eZSG7bGY4wXe2Whhh5bs+cJ3duYI9SL+49WBABgB + - signature: 
+      - signature: EoMLCkYIChgCKkAJqNs+Sem70XQqD4BTpMDThWZMMjR2WEgJKIlYvj4B8noeoZolpVe9rsKZqYy37KFQfVlgKVvznIhNoGYABCGdEgzfs4fFZUkmJ8pta9saDHNxHH70HOLepd+lICIwfnIjiGn76xEZI5AhKLCBCXvVWIaOJvYwmyZ2XTRot7v9VHCdnqpM3dS5NeU/BL6wKuoJpOdesmsKzzPUz2OpeaaCrD+0CDnHdzIHv1tM6kXMJvqrj4boQ+OE/s5FcFWwGArl0/SW3NwT11RoqFQQVI2ekTF8EqFIoixUBnRhwGEk+LauI+f429lKWoEvKP7bNAWrsu3j+jbBRNevFAk2BmfoDP9bfZtLAh1y/9topi6x5xvFNR4nNk/pXnkQLMjwAwjq63e4YZzxg3mMZ4e1Rzoyb18c6/TQgvZMYog87HCyWf+yJS9zVQxbl33szJcujnG6EHYRHw33Kb3/z73Sedv+FJgGf4oC1U9CPB1jErLkbhBb48yxpCdU1AZH+1jzgE4Gt1wY2yax7zG53m7IYvuELSM4H2mR9yF/V3WdmhTad8cOb1MtNek7JTsGPxxPd/FqKVLCl8vGXLz8W6GUzbSrtXtk0gnoiWoWbPzAj92K285k7fN7SfgsQPPhJseoDQg7CRL7tdU6xKYph0AsWsjPcv0x0xNwEW5L5uSMFgEZUmponS/pKOJYxuO9HcanU2GRyN91YEa3KrQDye8Pjei01iL/tVUYmQ4xHxCruNFbY7fVSqlYmc2r68sixCjSi8it3/MrR9ZtMZ8ujU9S50raPoP9Vy6fkfodP0BEEKADC/tSuZuDIr4TpZrtlLOIhDOzmzIV6+5biyQhDT28xypeASOv+M4KMjMaGIenZWMr0p2ER/xtK0Q+z9pNGBSDsP1E5jGjMxs25lObHkw8WHpssPf6hzEfxRYMAUriB+NHAuWfvro3pc+T8/yEWw31iW8vLwgZ0FdO3rabvCl0rIo6Wcu1pozHN63TSOP2p8vLtzWUEvOjLb0mR5BJgqZ8yqa3jyt1DrNyivXUuXlw0xqOcZwwWB5y1a2QDKAY5uzI37oEntLYCJ0fcyy0/stQiy5kbQbzDgIyQje9+NpT7CcoH6MURuR9QnUJ33K7/D+LzI7YUSJo8zT5szNhYov9m54+4klKTDnjuYGtFlT6tivkEdkybLPXSlKtrmvHZNCoJkZ3qlK5POwVJYTbLqm73INRttG+mPD3fH7GLLgF3eHvJOq0VzvXYT0j31tSe+zrPskwEqbl/ghPUR579KbQeWMmi9AeyD1F/MBUFf7nBqu27yCcH0oje+LjEN4sE1A9RPCXXdPC1zFPVgwfoSR/IR7xCRvL4Dp70QxBRujzZW008wRg2AXR+l5Dfz+OSfh4hCXg91GnVZmq8iNSL77yfwwK9o3EK48REbRV+ezJ3DQFeUrkDSw8tXCnpCtqIL/L74s7e0OYbgxpITrKEkOt4eMhTbWJY6JgwhUdViVKhdlf1OU6WRyOptZl1kRtKm7khQZ7ThSEaIDdRsndHR8cRBhHV+h31wKw6bgMvOQmqvAdljPXGPqkDLKDDrGkTMHn2fyHxRmCm24edSpNkBtIzyzMwlG9k33UP4ITly7vkcQCXxP+TD9qXdD33i/WzYYdiu5Vhfdxhxo9kUPDcUzp03eqBm2BetsXdva2+Nk0wy6ozUF+1wlqdMYBhf/JkorunuSB+dLW1lnp+c7GVRWKOWvljncJ0I6uWFD8B/kcH4eIQx49Cb0bZf2rDgVXqAkwKaBptupW6+AdDZfCB5Cs9DCXUVgFHSGljeCn2Rbelig68ncUwxio53luA3ldtfE8QV4uGSOf11OW0mnKOS6GHDro0SggtvsuL3eoVhgB
        thinking: |-
-          The user is asking about what framework is mentioned on the Pydantic AI page that I just fetched. Looking at the content, I can see several frameworks mentioned:
+          The user is asking about what framework is mentioned on the page I just fetched from https://ai.pydantic.dev. Let me look through the content to identify the frameworks mentioned.
+
+          Looking at the content, I can see several frameworks mentioned:
+
+          1. **Pydantic AI** - This is the main framework the page is about. It's described as "a Python agent framework designed to help you quickly, confidently, and painlessly build production grade applications and workflows with Generative AI."
+
+          2. **FastAPI** - The page mentions "FastAPI revolutionized web development by offering an innovative and ergonomic design, built on the foundation of Pydantic Validation and modern Python features like type hints." It also says "We built Pydantic AI with one simple aim: to bring that FastAPI feeling to GenAI app and agent development."
-          1. Pydantic AI itself - described as "a Python agent framework"
-          2. FastAPI - mentioned as having "revolutionized web development by offering an innovative and ergonomic design"
-          3. Various other frameworks/libraries mentioned like LangChain, LlamaIndex, AutoGPT, Transformers, CrewAI, Instructor
-          4. Pydantic Validation is mentioned as being used by many frameworks
-          5. OpenTelemetry is mentioned in relation to observability
+          3. **Pydantic Validation** - Mentioned as the foundation that FastAPI is built on.
+
-          But the most prominently featured framework that seems to be the main comparison point is FastAPI, as the page talks about bringing "that FastAPI feeling to GenAI app and agent development."
+          4. **Other frameworks mentioned in passing**: LangChain, LlamaIndex, AutoGPT, Transformers, CrewAI, Instructor (these are mentioned as examples of libraries that use Pydantic Validation)
+
+          The primary framework the page is about is **Pydantic AI**, but it also prominently mentions **FastAPI** as an inspiration and comparison point.
        type: thinking
-      - text: "Based on the page I fetched, the main framework it mentions and compares itself to is **FastAPI**. The page
-          states that \"FastAPI revolutionized web development by offering an innovative and ergonomic design\" and that Pydantic
-          AI was built with the aim \"to bring that FastAPI feeling to GenAI app and agent development.\"\n\nThe page also
-          mentions several other frameworks and libraries including:\n- LangChain\n- LlamaIndex \n- AutoGPT\n- Transformers\n-
-          CrewAI\n- Instructor\n\nIt notes that \"virtually every Python agent framework and LLM library\" uses Pydantic Validation,
-          which is the foundation that Pydantic AI builds upon."
+      - text: |-
+          Based on the page I fetched, several frameworks are mentioned:
+
+          **Primary framework:**
+          - **Pydantic AI** - The main subject of the page, described as "a Python agent framework designed to help you quickly, confidently, and painlessly build production grade applications and workflows with Generative AI."
+
+          **Key comparison framework:**
+          - **FastAPI** - Prominently mentioned as the inspiration, with the page stating: "FastAPI revolutionized web development by offering an innovative and ergonomic design, built on the foundation of Pydantic Validation and modern Python features like type hints" and "We built Pydantic AI with one simple aim: to bring that FastAPI feeling to GenAI app and agent development."
+
+          **Other frameworks mentioned:**
+          - **Pydantic Validation** (the foundation both are built on)
+          - **LangChain, LlamaIndex, AutoGPT, Transformers, CrewAI, Instructor** (mentioned as examples of libraries that use Pydantic Validation)
+
+          The page positions Pydantic AI as bringing the same innovative and ergonomic design philosophy that made FastAPI successful to the GenAI and agent development space.
        type: text
-      id: msg_01SJJ9cZeR6yBpdy3Lf1Lx5i
+      id: msg_01Ea11Z69qskEERXpgbimoGg
      model: claude-sonnet-4-20250514
      role: assistant
      stop_reason: end_turn
@@ -780,8 +776,8 @@ interactions:
          ephemeral_5m_input_tokens: 0
        cache_creation_input_tokens: 0
        cache_read_input_tokens: 0
-        input_tokens: 6346
-        output_tokens: 354
+        input_tokens: 10537
+        output_tokens: 568
        service_tier: standard
    status:
      code: 200
diff --git a/tests/models/cassettes/test_anthropic/test_anthropic_web_fetch_tool_stream.yaml b/tests/models/cassettes/test_anthropic/test_anthropic_web_fetch_tool_stream.yaml
index d03bb3a332..9dbd8d8ed3 100644
--- a/tests/models/cassettes/test_anthropic/test_anthropic_web_fetch_tool_stream.yaml
+++ b/tests/models/cassettes/test_anthropic/test_anthropic_web_fetch_tool_stream.yaml
@@ -8,7 +8,7 @@ interactions:
      connection:
      - keep-alive
      content-length:
-      - '361'
+      - '466'
      content-type:
      - application/json
      host:
@@ -29,168 +29,327 @@ interactions:
      tool_choice:
        type: auto
      tools:
-      - name: web_fetch
+      - allowed_domains: null
+        blocked_domains: null
+        citations: null
+        max_content_tokens: null
+        max_uses: null
+        name: web_fetch
        type: web_fetch_20250910
    uri: https://api.anthropic.com/v1/messages?beta=true
  response:
    body:
-      string: |+
-        event: message_start
-        data: {"type":"message_start","message":{"model":"claude-sonnet-4-20250514","id":"msg_015eAVGKhBrs95jUkYb2BaDt","type":"message","role":"assistant","content":[],"stop_reason":null,"stop_sequence":null,"usage":{"input_tokens":899,"cache_creation_input_tokens":0,"cache_read_input_tokens":0,"cache_creation":{"ephemeral_5m_input_tokens":0,"ephemeral_1h_input_tokens":0},"output_tokens":3,"service_tier":"standard"}} }
-
-        event: content_block_start
-        data: {"type":"content_block_start","index":0,"content_block":{"type":"thinking","thinking":"","signature":""} }
-
-        event: content_block_delta
-        data: {"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":"The user wants"} }
-
-        event: ping
-        data: {"type": "ping"}
-
-        event: content_block_delta
-        data: {"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":" me to fetch"} }
-
-        event: content_block_delta
-        data: {"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":" the content"} }
-
-        event: content_block_delta
-        data: {"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":" from the URL https"} }
-
-        event: content_block_delta
-        data: {"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":"://ai.pydantic.dev"} }
-
-        event: content_block_delta
-        data: {"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":" and provide"} }
-
-        event: content_block_delta
-        data: {"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":" only"} }
-
-        event: content_block_delta
-        data: {"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":" the first sentence from"} }
-
-        event: content_block_delta
-        data: {"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":" that page."} }
-
-        event: content_block_delta
-        data: {"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":" I need to use the web_fetch"} }
-
-        event: content_block_delta
-        data: {"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":" tool to"} }
-
-        event: content_block_delta
-        data:
{"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":" get the content from"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":0,"delta":{"type":"thinking_delta","thinking":" this URL."} } - - event: content_block_delta - data: {"type":"content_block_delta","index":0,"delta":{"type":"signature_delta","signature":"EusCCkYICRgCKkAG/7zhRcmUoiMtml5iZUXVv3nqupp8kgk0nrq9zOoklaXzVCnrb9kwLNWGETIcCaAnLd0cd0ESwjslkVKdV9n8EgxKKdu8LlEvh9VGIWIaDAJ2Ja2NEacp1Am6jSIwyNO36tV+Sj+q6dWf79U+3KOIa1khXbIYarpkIViCuYQaZwpJ4Vtedrd7dLWTY2d5KtIB9Pug5UPuvepSOjyhxLaohtGxmdvZN8crGwBdTJYF9GHSli/rzvkR6CpH+ixd8iSopwFcsJgQ3j68fr/yD7cHmZ06jU3LaESVEBwTHnlK0ABiYnGvD3SvX6PgImMSQxQ1ThARFTA7DePoWw+z5DI0L2vgSun2qTYHkmGxzaEskhNIBlK9r7wS3tVcO0Di4lD/rhYV61tklL2NBWJqvm7ZCtJTN09CzPFJy7HDkg7bSINVL4kuu9gTWEtb/o40tw1b+sO62UcfxQTVFQ4Cj8D8XFZbGAE="} } - - event: content_block_stop - data: {"type":"content_block_stop","index":0 } - - event: content_block_start - data: {"type":"content_block_start","index":1,"content_block":{"type":"server_tool_use","id":"srvtoolu_018ADaxdJjyZ8HXtF3sTBPNk","name":"web_fetch","input":{}} } - - event: content_block_delta - data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":""} } - - event: content_block_delta - data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":"{\"url\": \""} } - - event: content_block_delta - data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":"https://ai"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":".p"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":"yd"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":"antic.dev\"}"} } - - event: content_block_stop - data: {"type":"content_block_stop","index":1 } - - event: content_block_start - data: {"type":"content_block_start","index":2,"content_block":{"type":"web_fetch_tool_result","tool_use_id":"srvtoolu_018ADaxdJjyZ8HXtF3sTBPNk","content":{"type":"web_fetch_result","url":"https://ai.pydantic.dev","retrieved_at":"2025-11-14T23:34:21.151000+00:00","content":{"type":"document","source":{"type":"text","media_type":"text/plain","data":"Pydantic AI\nGenAI Agent Framework, the Pydantic way\nPydantic AI is a Python agent framework designed to help you quickly, confidently, and painlessly build production grade applications and workflows with Generative AI.\nFastAPI revolutionized web development by offering an innovative and ergonomic design, built on the foundation of [Pydantic Validation](https://docs.pydantic.dev) and modern Python features like type hints.\nYet despite virtually every Python agent framework and LLM library using Pydantic Validation, when we began to use LLMs in [Pydantic Logfire](https://pydantic.dev/logfire), we couldn't find anything that gave us the same feeling.\nWe built Pydantic AI with one simple aim: to bring that FastAPI feeling to GenAI app and agent development.\nWhy use Pydantic AI\n-\nBuilt by the Pydantic Team:\n[Pydantic Validation](https://docs.pydantic.dev/latest/)is the validation layer of the OpenAI SDK, the Google ADK, the Anthropic SDK, LangChain, LlamaIndex, AutoGPT, Transformers, CrewAI, Instructor and many more. 
Why use the derivative when you can go straight to the source? -\nModel-agnostic: Supports virtually every\n[model](models/overview/)and provider: OpenAI, Anthropic, Gemini, DeepSeek, Grok, Cohere, Mistral, and Perplexity; Azure AI Foundry, Amazon Bedrock, Google Vertex AI, Ollama, LiteLLM, Groq, OpenRouter, Together AI, Fireworks AI, Cerebras, Hugging Face, GitHub, Heroku, Vercel, Nebius, OVHcloud, and Outlines. If your favorite model or provider is not listed, you can easily implement a[custom model](models/overview/#custom-models). -\nSeamless Observability: Tightly\n[integrates](logfire/)with[Pydantic Logfire](https://pydantic.dev/logfire), our general-purpose OpenTelemetry observability platform, for real-time debugging, evals-based performance monitoring, and behavior, tracing, and cost tracking. If you already have an observability platform that supports OTel, you can[use that too](logfire/#alternative-observability-backends). -\nFully Type-safe: Designed to give your IDE or AI coding agent as much context as possible for auto-completion and\n[type checking](agents/#static-type-checking), moving entire classes of errors from runtime to write-time for a bit of that Rust \"if it compiles, it works\" feel. -\nPowerful Evals: Enables you to systematically test and\n[evaluate](evals/)the performance and accuracy of the agentic systems you build, and monitor the performance over time in Pydantic Logfire. -\nMCP, A2A, and UI: Integrates the\n[Model Context Protocol](mcp/overview/),[Agent2Agent](a2a/), and various[UI event stream](ui/overview/)standards to give your agent access to external tools and data, let it interoperate with other agents, and build interactive applications with streaming event-based communication. -\nHuman-in-the-Loop Tool Approval: Easily lets you flag that certain tool calls\n[require approval](deferred-tools/#human-in-the-loop-tool-approval)before they can proceed, possibly depending on tool call arguments, conversation history, or user preferences. -\nDurable Execution: Enables you to build\n[durable agents](durable_execution/overview/)that can preserve their progress across transient API failures and application errors or restarts, and handle long-running, asynchronous, and human-in-the-loop workflows with production-grade reliability. -\nStreamed Outputs: Provides the ability to\n[stream](output/#streamed-results)structured output continuously, with immediate validation, ensuring real time access to generated data. -\nGraph Support: Provides a powerful way to define\n[graphs](graph/)using type hints, for use in complex applications where standard control flow can degrade to spaghetti code.\nRealistically though, no list is going to be as convincing as [giving it a try](#next-steps) and seeing how it makes you feel!\nSign up for our newsletter, The Pydantic Stack, with updates & tutorials on Pydantic AI, Logfire, and Pydantic:\nHello World Example\nHere's a minimal example of Pydantic AI:\n[Learn about Gateway](gateway)hello_world.py\nfrom pydantic_ai import Agent\nagent = Agent( # (1)!\n'gateway/anthropic:claude-sonnet-4-0',\ninstructions='Be concise, reply with one sentence.', # (2)!\n)\nresult = agent.run_sync('Where does \"hello world\" come from?') # (3)!\nprint(result.output)\n\"\"\"\nThe first known use of \"hello, world\" was in a 1974 textbook about the C programming language.\n\"\"\"\n- We configure the agent to use\n[Anthropic's Claude Sonnet 4.0](api/models/anthropic/)model, but you can also set the model when running the agent. 
- Register static\n[instructions](agents/#instructions)using a keyword argument to the agent. [Run the agent](agents/#running-agents)synchronously, starting a conversation with the LLM.\nfrom pydantic_ai import Agent\nagent = Agent( # (1)!\n'anthropic:claude-sonnet-4-0',\ninstructions='Be concise, reply with one sentence.', # (2)!\n)\nresult = agent.run_sync('Where does \"hello world\" come from?') # (3)!\nprint(result.output)\n\"\"\"\nThe first known use of \"hello, world\" was in a 1974 textbook about the C programming language.\n\"\"\"\n- We configure the agent to use\n[Anthropic's Claude Sonnet 4.0](api/models/anthropic/)model, but you can also set the model when running the agent. - Register static\n[instructions](agents/#instructions)using a keyword argument to the agent. [Run the agent](agents/#running-agents)synchronously, starting a conversation with the LLM.\n(This example is complete, it can be run \"as is\", assuming you've [installed the pydantic_ai package](install/))\nThe exchange will be very short: Pydantic AI will send the instructions and the user prompt to the LLM, and the model will return a text response.\nNot very interesting yet, but we can easily add [tools](tools/), [dynamic instructions](agents/#instructions), and [structured outputs](output/) to build more powerful agents.\nTools & Dependency Injection Example\nHere is a concise example using Pydantic AI to build a support agent for a bank:\n[Learn about Gateway](gateway)bank_support.py\nfrom dataclasses import dataclass\nfrom pydantic import BaseModel, Field\nfrom pydantic_ai import Agent, RunContext\nfrom bank_database import DatabaseConn\n@dataclass\nclass SupportDependencies: # (3)!\ncustomer_id: int\ndb: DatabaseConn # (12)!\nclass SupportOutput(BaseModel): # (13)!\nsupport_advice: str = Field(description='Advice returned to the customer')\nblock_card: bool = Field(description=\"Whether to block the customer's card\")\nrisk: int = Field(description='Risk level of query', ge=0, le=10)\nsupport_agent = Agent( # (1)!\n'gateway/openai:gpt-5', # (2)!\ndeps_type=SupportDependencies,\noutput_type=SupportOutput, # (9)!\ninstructions=( # (4)!\n'You are a support agent in our bank, give the '\n'customer support and judge the risk level of their query.'\n),\n)\n@support_agent.instructions # (5)!\nasync def add_customer_name(ctx: RunContext[SupportDependencies]) -> str:\ncustomer_name = await ctx.deps.db.customer_name(id=ctx.deps.customer_id)\nreturn f\"The customer's name is {customer_name!r}\"\n@support_agent.tool # (6)!\nasync def customer_balance(\nctx: RunContext[SupportDependencies], include_pending: bool\n) -> float:\n\"\"\"Returns the customer's current account balance.\"\"\" # (7)!\nreturn await ctx.deps.db.customer_balance(\nid=ctx.deps.customer_id,\ninclude_pending=include_pending,\n)\n... # (11)!\nasync def main():\ndeps = SupportDependencies(customer_id=123, db=DatabaseConn())\nresult = await support_agent.run('What is my balance?', deps=deps) # (8)!\nprint(result.output) # (10)!\n\"\"\"\nsupport_advice='Hello John, your current account balance, including pending transactions, is $123.45.' block_card=False risk=1\n\"\"\"\nresult = await support_agent.run('I just lost my card!', deps=deps)\nprint(result.output)\n\"\"\"\nsupport_advice=\"I'm sorry to hear that, John. We are temporarily blocking your card to prevent unauthorized transactions.\" block_card=True risk=8\n\"\"\"\n- This\n[agent](agents/)will act as first-tier support in a bank. 
Agents are generic in the type of dependencies they accept and the type of output they return. In this case, the support agent has typeAgent[SupportDependencies, SupportOutput]\n. - Here we configure the agent to use\n[OpenAI's GPT-5 model](api/models/openai/), you can also set the model when running the agent. - The\nSupportDependencies\ndataclass is used to pass data, connections, and logic into the model that will be needed when running[instructions](agents/#instructions)and[tool](tools/)functions. Pydantic AI's system of dependency injection provides a[type-safe](agents/#static-type-checking)way to customise the behavior of your agents, and can be especially useful when running[unit tests](testing/)and evals. - Static\n[instructions](agents/#instructions)can be registered with theto the agent.instructions\nkeyword argument - Dynamic\n[instructions](agents/#instructions)can be registered with thedecorator, and can make use of dependency injection. Dependencies are carried via the@agent.instructions\nargument, which is parameterized with theRunContext\ndeps_type\nfrom above. If the type annotation here is wrong, static type checkers will catch it. - The\ndecorator let you register functions which the LLM may call while responding to a user. Again, dependencies are carried via@agent.tool\n, any other arguments become the tool schema passed to the LLM. Pydantic is used to validate these arguments, and errors are passed back to the LLM so it can retry.RunContext\n- The docstring of a tool is also passed to the LLM as the description of the tool. Parameter descriptions are\n[extracted](tools/#function-tools-and-schema)from the docstring and added to the parameter schema sent to the LLM. [Run the agent](agents/#running-agents)asynchronously, conducting a conversation with the LLM until a final response is reached. Even in this fairly simple case, the agent will exchange multiple messages with the LLM as tools are called to retrieve an output.- The response from the agent will be guaranteed to be a\nSupportOutput\n. If validation fails[reflection](agents/#reflection-and-self-correction), the agent is prompted to try again. - The output will be validated with Pydantic to guarantee it is a\nSupportOutput\n, since the agent is generic, it'll also be typed as aSupportOutput\nto aid with static type checking. - In a real use case, you'd add more tools and longer instructions to the agent to extend the context it's equipped with and support it can provide.\n- This is a simple sketch of a database connection, used to keep the example short and readable. In reality, you'd be connecting to an external database (e.g. PostgreSQL) to get information about customers.\n- This\n[Pydantic](https://docs.pydantic.dev)model is used to constrain the structured data returned by the agent. 
From this simple definition, Pydantic builds the JSON Schema that tells the LLM how to return the data, and performs validation to guarantee the data is correct at the end of the run.\nfrom dataclasses import dataclass\nfrom pydantic import BaseModel, Field\nfrom pydantic_ai import Agent, RunContext\nfrom bank_database import DatabaseConn\n@dataclass\nclass SupportDependencies: # (3)!\ncustomer_id: int\ndb: DatabaseConn # (12)!\nclass SupportOutput(BaseModel): # (13)!\nsupport_advice: str = Field(description='Advice returned to the customer')\nblock_card: bool = Field(description=\"Whether to block the customer's card\")\nrisk: int = Field(description='Risk level of query', ge=0, le=10)\nsupport_agent = Agent( # (1)!\n'openai:gpt-5', # (2)!\ndeps_type=SupportDependencies,\noutput_type=SupportOutput, # (9)!\ninstructions=( # (4)!\n'You are a support agent in our bank, give the '\n'customer support and judge the risk level of their query.'\n),\n)\n@support_agent.instructions # (5)!\nasync def add_customer_name(ctx: RunContext[SupportDependencies]) -> str:\ncustomer_name = await ctx.deps.db.customer_name(id=ctx.deps.customer_id)\nreturn f\"The customer's name is {customer_name!r}\"\n@support_agent.tool # (6)!\nasync def customer_balance(\nctx: RunContext[SupportDependencies], include_pending: bool\n) -> float:\n\"\"\"Returns the customer's current account balance.\"\"\" # (7)!\nreturn await ctx.deps.db.customer_balance(\nid=ctx.deps.customer_id,\ninclude_pending=include_pending,\n)\n... # (11)!\nasync def main():\ndeps = SupportDependencies(customer_id=123, db=DatabaseConn())\nresult = await support_agent.run('What is my balance?', deps=deps) # (8)!\nprint(result.output) # (10)!\n\"\"\"\nsupport_advice='Hello John, your current account balance, including pending transactions, is $123.45.' block_card=False risk=1\n\"\"\"\nresult = await support_agent.run('I just lost my card!', deps=deps)\nprint(result.output)\n\"\"\"\nsupport_advice=\"I'm sorry to hear that, John. We are temporarily blocking your card to prevent unauthorized transactions.\" block_card=True risk=8\n\"\"\"\n- This\n[agent](agents/)will act as first-tier support in a bank. Agents are generic in the type of dependencies they accept and the type of output they return. In this case, the support agent has typeAgent[SupportDependencies, SupportOutput]\n. - Here we configure the agent to use\n[OpenAI's GPT-5 model](api/models/openai/), you can also set the model when running the agent. - The\nSupportDependencies\ndataclass is used to pass data, connections, and logic into the model that will be needed when running[instructions](agents/#instructions)and[tool](tools/)functions. Pydantic AI's system of dependency injection provides a[type-safe](agents/#static-type-checking)way to customise the behavior of your agents, and can be especially useful when running[unit tests](testing/)and evals. - Static\n[instructions](agents/#instructions)can be registered with theto the agent.instructions\nkeyword argument - Dynamic\n[instructions](agents/#instructions)can be registered with thedecorator, and can make use of dependency injection. Dependencies are carried via the@agent.instructions\nargument, which is parameterized with theRunContext\ndeps_type\nfrom above. If the type annotation here is wrong, static type checkers will catch it. - The\ndecorator let you register functions which the LLM may call while responding to a user. Again, dependencies are carried via@agent.tool\n, any other arguments become the tool schema passed to the LLM. 
Pydantic is used to validate these arguments, and errors are passed back to the LLM so it can retry.RunContext\n- The docstring of a tool is also passed to the LLM as the description of the tool. Parameter descriptions are\n[extracted](tools/#function-tools-and-schema)from the docstring and added to the parameter schema sent to the LLM. [Run the agent](agents/#running-agents)asynchronously, conducting a conversation with the LLM until a final response is reached. Even in this fairly simple case, the agent will exchange multiple messages with the LLM as tools are called to retrieve an output.- The response from the agent will be guaranteed to be a\nSupportOutput\n. If validation fails[reflection](agents/#reflection-and-self-correction), the agent is prompted to try again. - The output will be validated with Pydantic to guarantee it is a\nSupportOutput\n, since the agent is generic, it'll also be typed as aSupportOutput\nto aid with static type checking. - In a real use case, you'd add more tools and longer instructions to the agent to extend the context it's equipped with and support it can provide.\n- This is a simple sketch of a database connection, used to keep the example short and readable. In reality, you'd be connecting to an external database (e.g. PostgreSQL) to get information about customers.\n- This\n[Pydantic](https://docs.pydantic.dev)model is used to constrain the structured data returned by the agent. From this simple definition, Pydantic builds the JSON Schema that tells the LLM how to return the data, and performs validation to guarantee the data is correct at the end of the run.\nComplete bank_support.py\nexample\nThe code included here is incomplete for the sake of brevity (the definition of DatabaseConn\nis missing); you can find the complete bank_support.py\nexample [here](examples/bank-support/).\nInstrumentation with Pydantic Logfire\nEven a simple agent with just a handful of tools can result in a lot of back-and-forth with the LLM, making it nearly impossible to be confident of what's going on just from reading the code. To understand the flow of the above runs, we can watch the agent in action using Pydantic Logfire.\nTo do this, we need to [set up Logfire](logfire/#using-logfire), and add the following to our code:\n[Learn about Gateway](gateway)bank_support_with_logfire.py\n...\nfrom pydantic_ai import Agent, RunContext\nfrom bank_database import DatabaseConn\nimport logfire\nlogfire.configure() # (1)!\nlogfire.instrument_pydantic_ai() # (2)!\nlogfire.instrument_asyncpg() # (3)!\n...\nsupport_agent = Agent(\n'gateway/openai:gpt-5',\ndeps_type=SupportDependencies,\noutput_type=SupportOutput,\nsystem_prompt=(\n'You are a support agent in our bank, give the '\n'customer support and judge the risk level of their query.'\n),\n)\n- Configure the Logfire SDK, this will fail if project is not set up.\n- This will instrument all Pydantic AI agents used from here on out. 
If you want to instrument only a specific agent, you can pass the\nto the agent.instrument=True\nkeyword argument - In our demo,\nDatabaseConn\nusesto connect to a PostgreSQL database, soasyncpg\nis used to log the database queries.logfire.instrument_asyncpg()\n...\nfrom pydantic_ai import Agent, RunContext\nfrom bank_database import DatabaseConn\nimport logfire\nlogfire.configure() # (1)!\nlogfire.instrument_pydantic_ai() # (2)!\nlogfire.instrument_asyncpg() # (3)!\n...\nsupport_agent = Agent(\n'openai:gpt-5',\ndeps_type=SupportDependencies,\noutput_type=SupportOutput,\nsystem_prompt=(\n'You are a support agent in our bank, give the '\n'customer support and judge the risk level of their query.'\n),\n)\n- Configure the Logfire SDK, this will fail if project is not set up.\n- This will instrument all Pydantic AI agents used from here on out. If you want to instrument only a specific agent, you can pass the\nto the agent.instrument=True\nkeyword argument - In our demo,\nDatabaseConn\nusesto connect to a PostgreSQL database, soasyncpg\nis used to log the database queries.logfire.instrument_asyncpg()\nThat's enough to get the following view of your agent in action:\nSee [Monitoring and Performance](logfire/) to learn more.\nllms.txt\nThe Pydantic AI documentation is available in the [llms.txt](https://llmstxt.org/) format.\nThis format is defined in Markdown and suited for LLMs and AI coding assistants and agents.\nTwo formats are available:\n: a file containing a brief description of the project, along with links to the different sections of the documentation. The structure of this file is described in detailsllms.txt\n[here](https://llmstxt.org/#format).: Similar to thellms-full.txt\nllms.txt\nfile, but every link content is included. Note that this file may be too large for some LLMs.\nAs of today, these files are not automatically leveraged by IDEs or coding agents, but they will use it if you provide a link or the full text.\nNext Steps\nTo try Pydantic AI for yourself, [install it](install/) and follow the instructions [in the examples](examples/setup/).\nRead the [docs](agents/) to learn more about building applications with Pydantic AI.\nRead the [API Reference](api/agent/) to understand Pydantic AI's interface.\nJoin [ Slack](https://logfire.pydantic.dev/docs/join-slack/) or file an issue on [ GitHub](https://github.com/pydantic/pydantic-ai/issues) if you have any questions."},"title":"Pydantic AI"}}} } - - event: content_block_stop - data: {"type":"content_block_stop","index":2 } - - event: content_block_start - data: {"type":"content_block_start","index":3,"content_block":{"type":"text","text":""} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":"P"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":"ydantic AI is a"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":" Python"}} - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":" agent"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":" framework"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":" designe"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":"d to help"} 
} - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":" you quickly"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":","} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":" confi"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":"dently,"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":" and pain"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":"lessly build production"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":" grade"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":" applications"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":" an"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":"d workflows"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":" with"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":" Gener"} } - - event: content_block_delta - data: {"type":"content_block_delta","index":3,"delta":{"type":"text_delta","text":"ative AI."} } - - event: content_block_stop - data: {"type":"content_block_stop","index":3 } - - event: message_delta - data: {"type":"message_delta","delta":{"stop_reason":"end_turn","stop_sequence":null},"usage":{"input_tokens":7244,"cache_creation_input_tokens":0,"cache_read_input_tokens":0,"output_tokens":153,"server_tool_use":{"web_search_requests":0,"web_fetch_requests":1}} } - - event: message_stop - data: {"type":"message_stop" } - + string: "event: message_start\ndata: {\"type\":\"message_start\",\"message\":{\"model\":\"claude-sonnet-4-20250514\",\"id\":\"msg_01JxeuU5zQRPduCDXsDQhMry\",\"type\":\"message\",\"role\":\"assistant\",\"content\":[],\"stop_reason\":null,\"stop_sequence\":null,\"usage\":{\"input_tokens\":899,\"cache_creation_input_tokens\":0,\"cache_read_input_tokens\":0,\"cache_creation\":{\"ephemeral_5m_input_tokens\":0,\"ephemeral_1h_input_tokens\":0},\"output_tokens\":8,\"service_tier\":\"standard\"}} + \ }\n\nevent: content_block_start\ndata: {\"type\":\"content_block_start\",\"index\":0,\"content_block\":{\"type\":\"thinking\",\"thinking\":\"\",\"signature\":\"\"} + \ }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\"The + user is asking for the first sentence\"} }\n\nevent: ping\ndata: {\"type\": \"ping\"}\n\nevent: content_block_delta\ndata: + {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\" on a specific\"} + \ }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\" + web page. 
I need to use the\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\" + web_fetch tool to get\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\" + the content from that URL an\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\"d + then identify\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\" + the first sentence.\\n\\nThe\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\" + URL provide\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\"d + is https\"}}\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\"://ai.pydantic.dev\"} + }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\" + -\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\" + this appears to be a vali\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\"d + URL with\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\" + the\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\" + https\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\" + schema\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\" + include\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\"d.\"} + \ }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"thinking_delta\",\"thinking\":\"\"} + \ }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":0,\"delta\":{\"type\":\"signature_delta\",\"signature\":\"EsADCkYIChgCKkA58AqPyRf+zhQwXZM7L/AlQu/MXqlBYT9D+Iin18ScuuGOJF9C0G2tTRtuap+cryX9hT5kc/qcUYlnIb9Vm8BfEgzmZTiT2aAYFcrlsqwaDPzuOGNFvVPoClWurCIwmtlSAwBmrVAOblmM9pdEC3LDbBdJ43qZlP3EHrxuV+Z7/XxW9raDXU4Kz0Ug+GiEKqcC+uDpVdQEtTxJYYxouugfzpunt5grRDUECpgdkXY0u8Hy8XhfwaIkEOmkY8RckI9fqatCczffZ4fWztKzw1Nygxqmox7NgZhw+NBuliEjr3Mm1L+bKbDuOxsjMlOrl2fRMNIupBiJWVP+qiStetD1mF+8+qEjb01vHaWUjScsNhmxus4+zJGVu9CyV42rnw9pb4v3w4vvuaBxw3GpanyXjbRaOP/L5v16kxIM/tZzJb8TQw8R8rFnIWPLSKZ2mT/r5js1A+f3DKb41dEe8T21JyZCR5PkBoWP+xmvxzbp9/zCl3CeVfGXG18NtigQwo2yvi0N4TC4sGHmcAMKafbvt+TwJODEmBBYBW/zYaqUyYjxhz04g29Ji2WKqUQf+8eg+SSbfc8LcBgB\"} + \ }\n\nevent: content_block_stop\ndata: {\"type\":\"content_block_stop\",\"index\":0 }\n\nevent: + content_block_start\ndata: 
{\"type\":\"content_block_start\",\"index\":1,\"content_block\":{\"type\":\"server_tool_use\",\"id\":\"srvtoolu_011CmugtvU55veq6jzEtGtnt\",\"name\":\"web_fetch\",\"input\":{}} + \ }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":1,\"delta\":{\"type\":\"input_json_delta\",\"partial_json\":\"\"} + \ }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":1,\"delta\":{\"type\":\"input_json_delta\",\"partial_json\":\"{\\\"ur\"} + }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":1,\"delta\":{\"type\":\"input_json_delta\",\"partial_json\":\"l\\\": + \\\"htt\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":1,\"delta\":{\"type\":\"input_json_delta\",\"partial_json\":\"ps://ai\"} + \ }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":1,\"delta\":{\"type\":\"input_json_delta\",\"partial_json\":\".pydantic\"} + \ }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":1,\"delta\":{\"type\":\"input_json_delta\",\"partial_json\":\".dev\\\"}\"} + \ }\n\nevent: content_block_stop\ndata: {\"type\":\"content_block_stop\",\"index\":1 }\n\nevent: + content_block_start\ndata: {\"type\":\"content_block_start\",\"index\":2,\"content_block\":{\"type\":\"web_fetch_tool_result\",\"tool_use_id\":\"srvtoolu_011CmugtvU55veq6jzEtGtnt\",\"content\":{\"type\":\"web_fetch_result\",\"url\":\"https://ai.pydantic.dev\",\"retrieved_at\":\"2025-12-08T15:05:59.571000+00:00\",\"content\":{\"type\":\"document\",\"source\":{\"type\":\"text\",\"media_type\":\"text/plain\",\"data\":\"Pydantic + AI\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n \\n\\n\\n\\n\\n\\n[Skip to content](#pydantic-ai)\\n\\n**[Pydantic + AI Gateway](/gateway) is now available! \U0001F680\\nEnterprise-ready AI model routing: One key for all your models + with real-time monitoring and budget control that works.**\\n\\n[![logo](img/logo-white.svg)](. \\\"Pydantic AI\\\")\\n\\n\\n\\n\\nPydantic + AI\\n\\nPydantic AI\\n\\n\\n\\n\\n\\n\\n\\nType to start searching\\n\\n[pydantic/pydantic-ai](https://github.com/pydantic/pydantic-ai + \\\"Go to repository\\\")\\n\\n[![logo](img/logo-white.svg)](. 
\\\"Pydantic AI\\\")\\nPydantic AI\\n\\n[pydantic/pydantic-ai](https://github.com/pydantic/pydantic-ai + \\\"Go to repository\\\")\\n\\n* Pydantic AI\\n\\n [Pydantic AI](.)\\n\\n\\n\\n Table of contents\\n + [Why use + Pydantic AI](#why-use-pydantic-ai)\\n + [Hello World Example](#hello-world-example)\\n + [Tools & Dependency Injection + Example](#tools-dependency-injection-example)\\n + [Instrumentation with Pydantic Logfire](#instrumentation-with-pydantic-logfire)\\n + \ + [llms.txt](#llmstxt)\\n + [Next Steps](#next-steps)\\n* [Installation](install/)\\n* [Getting Help](help/)\\n* + [Troubleshooting](troubleshooting/)\\n* [Pydantic AI Gateway](gateway/)\\n* Documentation\\n\\n\\n\\n\\n Documentation\\n + \ + Core Concepts\\n\\n\\n\\n\\n Core Concepts\\n - [Agents](agents/)\\n - [Dependencies](dependencies/)\\n + \ - [Function Tools](tools/)\\n - [Output](output/)\\n - [Messages and chat history](message-history/)\\n + \ - [Direct Model Requests](direct/)\\n + Models & Providers\\n\\n\\n\\n\\n Models & Providers\\n - [Overview](models/overview/)\\n + \ - [OpenAI](models/openai/)\\n - [Anthropic](models/anthropic/)\\n - [Google](models/google/)\\n - [Bedrock](models/bedrock/)\\n + \ - [Cohere](models/cohere/)\\n - [Groq](models/groq/)\\n - [Hugging Face](models/huggingface/)\\n - [Mistral](models/mistral/)\\n + \ - [OpenRouter](models/openrouter/)\\n - [Outlines](models/outlines/)\\n + Tools & Toolsets\\n\\n\\n\\n\\n + \ Tools & Toolsets\\n - [Function Tools](tools/)\\n - [Advanced Tool Features](tools-advanced/)\\n - [Toolsets](toolsets/)\\n + \ - [Deferred Tools](deferred-tools/)\\n - [Built-in Tools](builtin-tools/)\\n - [Common Tools](common-tools/)\\n + \ - [Third-Party Tools](third-party-tools/)\\n + Advanced Features\\n\\n\\n\\n\\n Advanced Features\\n - + [Image, Audio, Video & Document Input](input/)\\n - [Thinking](thinking/)\\n - [HTTP Request Retries](retries/)\\n + \ + MCP\\n\\n\\n\\n\\n MCP\\n - [Overview](mcp/overview/)\\n - [Client](mcp/client/)\\n - [FastMCP Client](mcp/fastmcp-client/)\\n + \ - [Server](mcp/server/)\\n + [Multi-Agent Patterns](multi-agent-applications/)\\n + [Testing](testing/)\\n* + Pydantic Evals\\n\\n\\n\\n\\n Pydantic Evals\\n + [Overview](evals/)\\n + Getting Started\\n\\n\\n\\n\\n Getting + Started\\n - [Quick Start](evals/quick-start/)\\n - [Core Concepts](evals/core-concepts/)\\n + Evaluators\\n\\n\\n\\n\\n + \ Evaluators\\n - [Overview](evals/evaluators/overview/)\\n - [Built-in Evaluators](evals/evaluators/built-in/)\\n + \ - [LLM Judge](evals/evaluators/llm-judge/)\\n - [Custom Evaluators](evals/evaluators/custom/)\\n - [Span-Based](evals/evaluators/span-based/)\\n + \ + How-To Guides\\n\\n\\n\\n\\n How-To Guides\\n - [Logfire Integration](evals/how-to/logfire-integration/)\\n + \ - [Dataset Management](evals/how-to/dataset-management/)\\n - [Dataset Serialization](evals/how-to/dataset-serialization/)\\n + \ - [Concurrency & Performance](evals/how-to/concurrency/)\\n - [Retry Strategies](evals/how-to/retry-strategies/)\\n + \ - [Metrics & Attributes](evals/how-to/metrics-attributes/)\\n + Examples\\n\\n\\n\\n\\n Examples\\n - [Simple + Validation](evals/examples/simple-validation/)\\n* Pydantic Graph\\n\\n\\n\\n\\n Pydantic Graph\\n + [Overview](graph/)\\n + \ + [Beta API](graph/beta/)\\n\\n Beta API\\n - [Steps](graph/beta/steps/)\\n - [Joins & Reducers](graph/beta/joins/)\\n + \ - [Decisions](graph/beta/decisions/)\\n - [Parallel Execution](graph/beta/parallel/)\\n* Integrations\\n\\n\\n\\n\\n + \ Integrations\\n + [Debugging & Monitoring 
with Pydantic Logfire](logfire/)\\n + Durable Execution\\n\\n\\n\\n\\n + \ Durable Execution\\n - [Overview](durable_execution/overview/)\\n - [Temporal](durable_execution/temporal/)\\n + \ - [DBOS](durable_execution/dbos/)\\n - [Prefect](durable_execution/prefect/)\\n + UI Event Streams\\n\\n\\n\\n\\n + \ UI Event Streams\\n - [Overview](ui/overview/)\\n - [AG-UI](ui/ag-ui/)\\n - [Vercel AI](ui/vercel-ai/)\\n + \ + [Agent2Agent (A2A)](a2a/)\\n* Related Packages\\n\\n\\n\\n\\n Related Packages\\n + [Clai](cli/)\\n* Examples\\n\\n\\n\\n\\n + \ Examples\\n + [Setup](examples/setup/)\\n + Getting Started\\n\\n\\n\\n\\n Getting Started\\n - [Pydantic + Model](examples/pydantic-model/)\\n - [Weather agent](examples/weather-agent/)\\n + Conversational Agents\\n\\n\\n\\n\\n + \ Conversational Agents\\n - [Chat App with FastAPI](examples/chat-app/)\\n - [Bank support](examples/bank-support/)\\n + \ + Data & Analytics\\n\\n\\n\\n\\n Data & Analytics\\n - [SQL Generation](examples/sql-gen/)\\n - [Data + Analyst](examples/data-analyst/)\\n - [RAG](examples/rag/)\\n + Streaming\\n\\n\\n\\n\\n Streaming\\n - + [Stream markdown](examples/stream-markdown/)\\n - [Stream whales](examples/stream-whales/)\\n + Complex Workflows\\n\\n\\n\\n\\n + \ Complex Workflows\\n - [Flight booking](examples/flight-booking/)\\n - [Question Graph](examples/question-graph/)\\n + \ + Business Applications\\n\\n\\n\\n\\n Business Applications\\n - [Slack Lead Qualifier with Modal](examples/slack-lead-qualifier/)\\n + \ + UI Examples\\n\\n\\n\\n\\n UI Examples\\n - [Agent User Interaction (AG-UI)](examples/ag-ui/)\\n* API Reference\\n\\n\\n\\n\\n + \ API Reference\\n + pydantic\\\\_ai\\n\\n\\n\\n\\n pydantic\\\\_ai\\n - [pydantic\\\\_ai.agent](api/agent/)\\n + \ - [pydantic\\\\_ai.tools](api/tools/)\\n - [pydantic\\\\_ai.toolsets](api/toolsets/)\\n - [pydantic\\\\_ai.builtin\\\\_tools](api/builtin_tools/)\\n + \ - [pydantic\\\\_ai.common\\\\_tools](api/common_tools/)\\n - [pydantic\\\\_ai.durable\\\\_exec](api/durable_exec/)\\n + \ - [pydantic\\\\_ai.output](api/output/)\\n - [pydantic\\\\_ai.result](api/result/)\\n - [pydantic\\\\_ai.messages](api/messages/)\\n + \ - [pydantic\\\\_ai.exceptions](api/exceptions/)\\n - [pydantic\\\\_ai.settings](api/settings/)\\n - [pydantic\\\\_ai.usage](api/usage/)\\n + \ - [pydantic\\\\_ai.mcp](api/mcp/)\\n - [pydantic\\\\_ai.format\\\\_prompt](api/format_prompt/)\\n - [pydantic\\\\_ai.direct](api/direct/)\\n + \ - [pydantic\\\\_ai.ext](api/ext/)\\n - [pydantic\\\\_ai.models.anthropic](api/models/anthropic/)\\n - [pydantic\\\\_ai.models](api/models/base/)\\n + \ - [pydantic\\\\_ai.models.bedrock](api/models/bedrock/)\\n - [pydantic\\\\_ai.models.cohere](api/models/cohere/)\\n + \ - [pydantic\\\\_ai.models.fallback](api/models/fallback/)\\n - [pydantic\\\\_ai.models.function](api/models/function/)\\n + \ - [pydantic\\\\_ai.models.google](api/models/google/)\\n - [pydantic\\\\_ai.models.groq](api/models/groq/)\\n + \ - [pydantic\\\\_ai.models.huggingface](api/models/huggingface/)\\n - [pydantic\\\\_ai.models.instrumented](api/models/instrumented/)\\n + \ - [pydantic\\\\_ai.models.mcp\\\\_sampling](api/models/mcp-sampling/)\\n - [pydantic\\\\_ai.models.mistral](api/models/mistral/)\\n + \ - [pydantic\\\\_ai.models.openai](api/models/openai/)\\n - [pydantic\\\\_ai.models.openrouter](api/models/openrouter/)\\n + \ - [pydantic\\\\_ai.models.outlines](api/models/outlines/)\\n - [pydantic\\\\_ai.models.test](api/models/test/)\\n + \ - [pydantic\\\\_ai.models.wrapper](api/models/wrapper/)\\n - 
[pydantic\\\\_ai.profiles](api/profiles/)\\n - + [pydantic\\\\_ai.providers](api/providers/)\\n - [pydantic\\\\_ai.retries](api/retries/)\\n - [pydantic\\\\_ai.run](api/run/)\\n + \ - [pydantic\\\\_ai.ag\\\\_ui](api/ag_ui/)\\n - [pydantic\\\\_ai.ui](api/ui/base/)\\n - [pydantic\\\\_ai.ui.ag\\\\_ui](api/ui/ag_ui/)\\n + \ - [pydantic\\\\_ai.ui.vercel\\\\_ai](api/ui/vercel_ai/)\\n + pydantic\\\\_evals\\n\\n\\n\\n\\n pydantic\\\\_evals\\n + \ - [pydantic\\\\_evals.dataset](api/pydantic_evals/dataset/)\\n - [pydantic\\\\_evals.evaluators](api/pydantic_evals/evaluators/)\\n + \ - [pydantic\\\\_evals.reporting](api/pydantic_evals/reporting/)\\n - [pydantic\\\\_evals.otel](api/pydantic_evals/otel/)\\n + \ - [pydantic\\\\_evals.generation](api/pydantic_evals/generation/)\\n + pydantic\\\\_graph\\n\\n\\n\\n\\n pydantic\\\\_graph\\n + \ - [pydantic\\\\_graph](api/pydantic_graph/graph/)\\n - [pydantic\\\\_graph.nodes](api/pydantic_graph/nodes/)\\n + \ - [pydantic\\\\_graph.persistence](api/pydantic_graph/persistence/)\\n - [pydantic\\\\_graph.mermaid](api/pydantic_graph/mermaid/)\\n + \ - [pydantic\\\\_graph.exceptions](api/pydantic_graph/exceptions/)\\n - Beta API\\n\\n\\n\\n\\n Beta API\\n + \ * [pydantic\\\\_graph.beta](api/pydantic_graph/beta/)\\n * [pydantic\\\\_graph.beta.graph](api/pydantic_graph/beta_graph/)\\n + \ * [pydantic\\\\_graph.beta.graph\\\\_builder](api/pydantic_graph/beta_graph_builder/)\\n * [pydantic\\\\_graph.beta.step](api/pydantic_graph/beta_step/)\\n + \ * [pydantic\\\\_graph.beta.join](api/pydantic_graph/beta_join/)\\n * [pydantic\\\\_graph.beta.decision](api/pydantic_graph/beta_decision/)\\n + \ * [pydantic\\\\_graph.beta.node](api/pydantic_graph/beta_node/)\\n + fasta2a\\n\\n\\n\\n\\n fasta2a\\n - + [fasta2a](api/fasta2a/)\\n* Project\\n\\n\\n\\n\\n Project\\n + [Contributing](contributing/)\\n + [Upgrade Guide](changelog/)\\n + \ + [Version policy](version-policy/)\\n\\nTable of contents\\n\\n* [Why use Pydantic AI](#why-use-pydantic-ai)\\n* + [Hello World Example](#hello-world-example)\\n* [Tools & Dependency Injection Example](#tools-dependency-injection-example)\\n* + [Instrumentation with Pydantic Logfire](#instrumentation-with-pydantic-logfire)\\n* [llms.txt](#llmstxt)\\n* [Next + Steps](#next-steps)\\n\\n# Pydantic AI\\n\\n![Pydantic AI](./img/pydantic-ai-dark.svg#only-dark)\\n\\n![Pydantic AI](./img/pydantic-ai-light.svg#only-light)\\n\\n*GenAI + Agent Framework, the Pydantic way*\\n\\n[![CI](https://github.com/pydantic/pydantic-ai/actions/workflows/ci.yml/badge.svg?event=push)](https://github.com/pydantic/pydantic-ai/actions/workflows/ci.yml?query=branch%3Amain)\\n[![Coverage](https://coverage-badge.samuelcolvin.workers.dev/pydantic/pydantic-ai.svg)](https://coverage-badge.samuelcolvin.workers.dev/redirect/pydantic/pydantic-ai)\\n[![PyPI](https://img.shields.io/pypi/v/pydantic-ai.svg)](https://pypi.python.org/pypi/pydantic-ai)\\n[![versions](https://img.shields.io/pypi/pyversions/pydantic-ai.svg)](https://github.com/pydantic/pydantic-ai)\\n[![license](https://img.shields.io/github/license/pydantic/pydantic-ai.svg)](https://github.com/pydantic/pydantic-ai/blob/main/LICENSE)\\n[![Join + Slack](https://img.shields.io/badge/Slack-Join%20Slack-4A154B?logo=slack)](https://logfire.pydantic.dev/docs/join-slack/)\\n\\nPydantic + AI is a Python agent framework designed to help you\\nquickly, confidently, and painlessly build production grade + applications and workflows with Generative AI.\\n\\nFastAPI revolutionized web development by offering an innovative + and ergonomic 
design, built on the foundation of [Pydantic Validation](https://docs.pydantic.dev) and modern Python + features like type hints.\\n\\nYet despite virtually every Python agent framework and LLM library using Pydantic Validation, + when we began to use LLMs in [Pydantic Logfire](https://pydantic.dev/logfire), we couldn't find anything that gave + us the same feeling.\\n\\nWe built Pydantic AI with one simple aim: to bring that FastAPI feeling to GenAI app and + agent development.\\n\\n## Why use Pydantic AI\\n\\n1. **Built by the Pydantic Team**:\\n [Pydantic Validation](https://docs.pydantic.dev/latest/) + is the validation layer of the OpenAI SDK, the Google ADK, the Anthropic SDK, LangChain, LlamaIndex, AutoGPT, Transformers, + CrewAI, Instructor and many more. *Why use the derivative when you can go straight to the source?* ![\U0001F603](https://cdn.jsdelivr.net/gh/jdecked/twemoji@15.1.0/assets/svg/1f603.svg + \\\":smiley:\\\")\\n2. **Model-agnostic**:\\n Supports virtually every [model](models/overview/) and provider: OpenAI, + Anthropic, Gemini, DeepSeek, Grok, Cohere, Mistral, and Perplexity; Azure AI Foundry, Amazon Bedrock, Google Vertex + AI, Ollama, LiteLLM, Groq, OpenRouter, Together AI, Fireworks AI, Cerebras, Hugging Face, GitHub, Heroku, Vercel, + Nebius, OVHcloud, and Outlines. If your favorite model or provider is not listed, you can easily implement a [custom + model](models/overview/#custom-models).\\n3. **Seamless Observability**:\\n Tightly [integrates](logfire/) with + [Pydantic Logfire](https://pydantic.dev/logfire), our general-purpose OpenTelemetry observability platform, for real-time + debugging, evals-based performance monitoring, and behavior, tracing, and cost tracking. If you already have an observability + platform that supports OTel, you can [use that too](logfire/#alternative-observability-backends).\\n4. **Fully Type-safe**:\\n + \ Designed to give your IDE or AI coding agent as much context as possible for auto-completion and [type checking](agents/#static-type-checking), + moving entire classes of errors from runtime to write-time for a bit of that Rust \\\"if it compiles, it works\\\" + feel.\\n5. **Powerful Evals**:\\n Enables you to systematically test and [evaluate](evals/) the performance and + accuracy of the agentic systems you build, and monitor the performance over time in Pydantic Logfire.\\n6. **MCP, + A2A, and UI**:\\n Integrates the [Model Context Protocol](mcp/overview/), [Agent2Agent](a2a/), and various [UI event + stream](ui/overview/) standards to give your agent access to external tools and data, let it interoperate with other + agents, and build interactive applications with streaming event-based communication.\\n7. **Human-in-the-Loop Tool + Approval**:\\n Easily lets you flag that certain tool calls [require approval](deferred-tools/#human-in-the-loop-tool-approval) + before they can proceed, possibly depending on tool call arguments, conversation history, or user preferences.\\n8. + **Durable Execution**:\\n Enables you to build [durable agents](durable_execution/overview/) that can preserve their + progress across transient API failures and application errors or restarts, and handle long-running, asynchronous, + and human-in-the-loop workflows with production-grade reliability.\\n9. **Streamed Outputs**:\\n Provides the ability + to [stream](output/#streamed-results) structured output continuously, with immediate validation, ensuring real time + access to generated data.\\n10. 
**Graph Support**:\\n Provides a powerful way to define [graphs](graph/) using + type hints, for use in complex applications where standard control flow can degrade to spaghetti code.\\n\\nRealistically + though, no list is going to be as convincing as [giving it a try](#next-steps) and seeing how it makes you feel!\\n\\n**Sign + up for our newsletter, *The Pydantic Stack*, with updates & tutorials on Pydantic AI, Logfire, and Pydantic:**\\n\\nSubscribe\\n\\n## + Hello World Example\\n\\nHere's a minimal example of Pydantic AI:\\n\\nWith Pydantic AI GatewayDirectly to Provider + API\\n\\n[Learn about Gateway](../gateway) hello\\\\_world.py\\n\\n```\\nfrom pydantic_ai import Agent\\n\\nagent + = Agent( # (1)!\\n 'gateway/anthropic:claude-sonnet-4-0',\\n instructions='Be concise, reply with one sentence.', + \ # (2)!\\n)\\n\\nresult = agent.run_sync('Where does \\\"hello world\\\" come from?') # (3)!\\nprint(result.output)\\n\\\"\\\"\\\"\\nThe + first known use of \\\"hello, world\\\" was in a 1974 textbook about the C programming language.\\n\\\"\\\"\\\"\\n```\\n\\n1. + We configure the agent to use [Anthropic's Claude Sonnet 4.0](api/models/anthropic/) model, but you can also set the + model when running the agent.\\n2. Register static [instructions](agents/#instructions) using a keyword argument to + the agent.\\n3. [Run the agent](agents/#running-agents) synchronously, starting a conversation with the LLM.\\n\\nhello\\\\_world.py\\n\\n```\\nfrom + pydantic_ai import Agent\\n\\nagent = Agent( # (1)!\\n 'anthropic:claude-sonnet-4-0',\\n instructions='Be concise, + reply with one sentence.', # (2)!\\n)\\n\\nresult = agent.run_sync('Where does \\\"hello world\\\" come from?') # + (3)!\\nprint(result.output)\\n\\\"\\\"\\\"\\nThe first known use of \\\"hello, world\\\" was in a 1974 textbook about + the C programming language.\\n\\\"\\\"\\\"\\n```\\n\\n1. We configure the agent to use [Anthropic's Claude Sonnet + 4.0](api/models/anthropic/) model, but you can also set the model when running the agent.\\n2. Register static [instructions](agents/#instructions) + using a keyword argument to the agent.\\n3. 
[Run the agent](agents/#running-agents) synchronously, starting a conversation with the LLM.\\n\\n*(This example is complete; it can be run \\\"as is\\\", assuming you've [installed the `pydantic_ai` package](install/))*\\n\\nThe exchange will be very short: Pydantic AI will send the instructions and the user prompt to the LLM, and the model will return a text response.\\n\\nNot very interesting yet, but we can easily add [tools](tools/), [dynamic instructions](agents/#instructions), and [structured outputs](output/) to build more powerful agents.\\n\\n## Tools & Dependency Injection Example\\n\\nHere is a concise example using Pydantic AI to build a support agent for a bank:\\n\\nWith Pydantic AI Gateway ([learn about Gateway](../gateway)):\\n\\nbank\\\\_support.py\\n\\n```\\nfrom dataclasses import dataclass\\n\\nfrom pydantic import BaseModel, Field\\nfrom pydantic_ai import Agent, RunContext\\n\\nfrom bank_database import DatabaseConn\\n\\n\\n@dataclass\\nclass SupportDependencies:  # (3)!\\n    customer_id: int\\n    db: DatabaseConn  # (12)!\\n\\n\\nclass SupportOutput(BaseModel):  # (13)!\\n    support_advice: str = Field(description='Advice returned to the customer')\\n    block_card: bool = Field(description=\\\"Whether to block the customer's card\\\")\\n    risk: int = Field(description='Risk level of query', ge=0, le=10)\\n\\n\\nsupport_agent = Agent(  # (1)!\\n    'gateway/openai:gpt-5',  # (2)!\\n    deps_type=SupportDependencies,\\n    output_type=SupportOutput,  # (9)!\\n    instructions=(  # (4)!\\n        'You are a support agent in our bank, give the '\\n        'customer support and judge the risk level of their query.'\\n    ),\\n)\\n\\n\\n@support_agent.instructions  # (5)!\\nasync def add_customer_name(ctx: RunContext[SupportDependencies]) -> str:\\n    customer_name = await ctx.deps.db.customer_name(id=ctx.deps.customer_id)\\n    return f\\\"The customer's name is {customer_name!r}\\\"\\n\\n\\n@support_agent.tool  # (6)!\\nasync def customer_balance(\\n    ctx: RunContext[SupportDependencies], include_pending: bool\\n) -> float:\\n    \\\"\\\"\\\"Returns the customer's current account balance.\\\"\\\"\\\"  # (7)!\\n    return await ctx.deps.db.customer_balance(\\n        id=ctx.deps.customer_id,\\n        include_pending=include_pending,\\n    )\\n\\n\\n...  # (11)!\\n\\n\\nasync def main():\\n    deps = SupportDependencies(customer_id=123, db=DatabaseConn())\\n    result = await support_agent.run('What is my balance?', deps=deps)  # (8)!\\n    print(result.output)  # (10)!\\n    \\\"\\\"\\\"\\n    support_advice='Hello John, your current account balance, including pending transactions, is $123.45.' block_card=False risk=1\\n    \\\"\\\"\\\"\\n\\n    result = await support_agent.run('I just lost my card!', deps=deps)\\n    print(result.output)\\n    \\\"\\\"\\\"\\n    support_advice=\\\"I'm sorry to hear that, John. We are temporarily blocking your card to prevent unauthorized transactions.\\\" block_card=True risk=8\\n    \\\"\\\"\\\"\\n```\\n\\n1. This [agent](agents/) will act as first-tier support in a bank. Agents are generic in the type of dependencies they accept and the type of output they return. In this case, the support agent has type `Agent[SupportDependencies, SupportOutput]`.\\n2. Here we configure the agent to use [OpenAI's GPT-5 model](api/models/openai/); you can also set the model when running the agent.\\n3. 
The `SupportDependencies` dataclass is used to pass data, connections, and logic into the model that will be needed when running [instructions](agents/#instructions) and [tool](tools/) functions. Pydantic AI's system of dependency injection provides a [type-safe](agents/#static-type-checking) way to customise the behavior of your agents, and can be especially useful when running [unit tests](testing/) and evals.\\n4. Static [instructions](agents/#instructions) can be registered with the [`instructions` keyword argument](api/agent/#pydantic_ai.agent.Agent.__init__) to the agent.\\n5. Dynamic [instructions](agents/#instructions) can be registered with the [`@agent.instructions`](api/agent/#pydantic_ai.agent.Agent.instructions) decorator, and can make use of dependency injection. Dependencies are carried via the [`RunContext`](api/tools/#pydantic_ai.tools.RunContext) argument, which is parameterized with the `deps_type` from above. If the type annotation here is wrong, static type checkers will catch it.\\n6. The [`@agent.tool`](tools/) decorator lets you register functions which the LLM may call while responding to a user. Again, dependencies are carried via [`RunContext`](api/tools/#pydantic_ai.tools.RunContext); any other arguments become the tool schema passed to the LLM. Pydantic is used to validate these arguments, and errors are passed back to the LLM so it can retry.\\n7. The docstring of a tool is also passed to the LLM as the description of the tool. Parameter descriptions are [extracted](tools/#function-tools-and-schema) from the docstring and added to the parameter schema sent to the LLM.\\n8. [Run the agent](agents/#running-agents) asynchronously, conducting a conversation with the LLM until a final response is reached. Even in this fairly simple case, the agent will exchange multiple messages with the LLM as tools are called to retrieve an output.\\n9. The response from the agent will be guaranteed to be a `SupportOutput`. If validation fails, [reflection](agents/#reflection-and-self-correction) prompts the agent to try again.\\n10. The output will be validated with Pydantic to guarantee it is a `SupportOutput`; since the agent is generic, it'll also be typed as a `SupportOutput` to aid with static type checking.\\n11. In a real use case, you'd add more tools and longer instructions to the agent to extend the context it's equipped with and the support it can provide.\\n12. This is a simple sketch of a database connection, used to keep the example short and readable. In reality, you'd be connecting to an external database (e.g. PostgreSQL) to get information about customers.\\n13. This [Pydantic](https://docs.pydantic.dev) model is used to constrain the structured data returned by the agent. 
From this simple definition, Pydantic builds the JSON Schema that tells the LLM how to return the data, and performs validation to guarantee the data is correct at the end of the run.\\n\\nDirectly to Provider API:\\n\\nbank\\\\_support.py\\n\\n```\\nfrom dataclasses import dataclass\\n\\nfrom pydantic import BaseModel, Field\\nfrom pydantic_ai import Agent, RunContext\\n\\nfrom bank_database import DatabaseConn\\n\\n\\n@dataclass\\nclass SupportDependencies:  # (3)!\\n    customer_id: int\\n    db: DatabaseConn  # (12)!\\n\\n\\nclass SupportOutput(BaseModel):  # (13)!\\n    support_advice: str = Field(description='Advice returned to the customer')\\n    block_card: bool = Field(description=\\\"Whether to block the customer's card\\\")\\n    risk: int = Field(description='Risk level of query', ge=0, le=10)\\n\\n\\nsupport_agent = Agent(  # (1)!\\n    'openai:gpt-5',  # (2)!\\n    deps_type=SupportDependencies,\\n    output_type=SupportOutput,  # (9)!\\n    instructions=(  # (4)!\\n        'You are a support agent in our bank, give the '\\n        'customer support and judge the risk level of their query.'\\n    ),\\n)\\n\\n\\n@support_agent.instructions  # (5)!\\nasync def add_customer_name(ctx: RunContext[SupportDependencies]) -> str:\\n    customer_name = await ctx.deps.db.customer_name(id=ctx.deps.customer_id)\\n    return f\\\"The customer's name is {customer_name!r}\\\"\\n\\n\\n@support_agent.tool  # (6)!\\nasync def customer_balance(\\n    ctx: RunContext[SupportDependencies], include_pending: bool\\n) -> float:\\n    \\\"\\\"\\\"Returns the customer's current account balance.\\\"\\\"\\\"  # (7)!\\n    return await ctx.deps.db.customer_balance(\\n        id=ctx.deps.customer_id,\\n        include_pending=include_pending,\\n    )\\n\\n\\n...  # (11)!\\n\\n\\nasync def main():\\n    deps = SupportDependencies(customer_id=123, db=DatabaseConn())\\n    result = await support_agent.run('What is my balance?', deps=deps)  # (8)!\\n    print(result.output)  # (10)!\\n    \\\"\\\"\\\"\\n    support_advice='Hello John, your current account balance, including pending transactions, is $123.45.' block_card=False risk=1\\n    \\\"\\\"\\\"\\n\\n    result = await support_agent.run('I just lost my card!', deps=deps)\\n    print(result.output)\\n    \\\"\\\"\\\"\\n    support_advice=\\\"I'm sorry to hear that, John. We are temporarily blocking your card to prevent unauthorized transactions.\\\" block_card=True risk=8\\n    \\\"\\\"\\\"\\n```\\n\\n1. This [agent](agents/) will act as first-tier support in a bank. Agents are generic in the type of dependencies they accept and the type of output they return. In this case, the support agent has type `Agent[SupportDependencies, SupportOutput]`.\\n2. Here we configure the agent to use [OpenAI's GPT-5 model](api/models/openai/); you can also set the model when running the agent.\\n3. The `SupportDependencies` dataclass is used to pass data, connections, and logic into the model that will be needed when running [instructions](agents/#instructions) and [tool](tools/) functions. Pydantic AI's system of dependency injection provides a [type-safe](agents/#static-type-checking) way to customise the behavior of your agents, and can be especially useful when running [unit tests](testing/) and evals.\\n4. Static [instructions](agents/#instructions) can be registered with the [`instructions` keyword argument](api/agent/#pydantic_ai.agent.Agent.__init__) to the agent.\\n5. 
Dynamic [instructions](agents/#instructions) can be registered with the [`@agent.instructions`](api/agent/#pydantic_ai.agent.Agent.instructions) decorator, and can make use of dependency injection. Dependencies are carried via the [`RunContext`](api/tools/#pydantic_ai.tools.RunContext) argument, which is parameterized with the `deps_type` from above. If the type annotation here is wrong, static type checkers will catch it.\\n6. The [`@agent.tool`](tools/) decorator lets you register functions which the LLM may call while responding to a user. Again, dependencies are carried via [`RunContext`](api/tools/#pydantic_ai.tools.RunContext); any other arguments become the tool schema passed to the LLM. Pydantic is used to validate these arguments, and errors are passed back to the LLM so it can retry.\\n7. The docstring of a tool is also passed to the LLM as the description of the tool. Parameter descriptions are [extracted](tools/#function-tools-and-schema) from the docstring and added to the parameter schema sent to the LLM.\\n8. [Run the agent](agents/#running-agents) asynchronously, conducting a conversation with the LLM until a final response is reached. Even in this fairly simple case, the agent will exchange multiple messages with the LLM as tools are called to retrieve an output.\\n9. The response from the agent will be guaranteed to be a `SupportOutput`. If validation fails, [reflection](agents/#reflection-and-self-correction) prompts the agent to try again.\\n10. The output will be validated with Pydantic to guarantee it is a `SupportOutput`; since the agent is generic, it'll also be typed as a `SupportOutput` to aid with static type checking.\\n11. In a real use case, you'd add more tools and longer instructions to the agent to extend the context it's equipped with and the support it can provide.\\n12. This is a simple sketch of a database connection, used to keep the example short and readable (a minimal stand-in is sketched just after these notes). In reality, you'd be connecting to an external database (e.g. PostgreSQL) to get information about customers.\\n13. This [Pydantic](https://docs.pydantic.dev) model is used to constrain the structured data returned by the agent. From this simple definition, Pydantic builds the JSON Schema that tells the LLM how to return the data, and performs validation to guarantee the data is correct at the end of the run.
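\\n\\nFor illustration only, here is one minimal shape a `DatabaseConn` stand-in could take, consistent with the calls made above; this is a hypothetical sketch, not the implementation from the linked example:\\n\\n```\\nclass DatabaseConn:\\n    \\\"\\\"\\\"Hypothetical in-memory stand-in for the example's database connection.\\\"\\\"\\\"\\n\\n    async def customer_name(self, *, id: int) -> str:\\n        # A real implementation would query the bank's database here.\\n        return 'John'\\n\\n    async def customer_balance(self, *, id: int, include_pending: bool) -> float:\\n        # Matches the sample output printed in main() above.\\n        return 123.45\\n```\\n\\nBecause the dependency is just an object carried on `RunContext`, swapping in a stub like this is all it takes to exercise the agent in [unit tests](testing/).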
\\n\\nComplete `bank_support.py` example\\n\\nThe code included here is incomplete for the sake of brevity (the definition of `DatabaseConn` is missing); you can find the complete `bank_support.py` example [here](examples/bank-support/).\\n\\n## Instrumentation with Pydantic Logfire\\n\\nEven a simple agent with just a handful of tools can result in a lot of back-and-forth with the LLM, making it nearly impossible to be confident of what's going on just from reading the code.\\nTo understand the flow of the above runs, we can watch the agent in action using Pydantic Logfire.\\n\\nTo do this, we need to [set up Logfire](logfire/#using-logfire), and add the following to our code:\\n\\nWith Pydantic AI Gateway ([learn about Gateway](../gateway)):\\n\\nbank\\\\_support\\\\_with\\\\_logfire.py\\n\\n```\\n...\\nfrom pydantic_ai import Agent, RunContext\\n\\nfrom bank_database import DatabaseConn\\n\\nimport logfire\\n\\nlogfire.configure()  # (1)!\\nlogfire.instrument_pydantic_ai()  # (2)!\\nlogfire.instrument_asyncpg()  # (3)!\\n\\n...\\n\\nsupport_agent = Agent(\\n    'gateway/openai:gpt-5',\\n    deps_type=SupportDependencies,\\n    output_type=SupportOutput,\\n    system_prompt=(\\n        'You are a support agent in our bank, give the '\\n        'customer support and judge the risk level of their query.'\\n    ),\\n)\\n```\\n\\n1. Configure the Logfire SDK; this will fail if a project is not set up.\\n2. This will instrument all Pydantic AI agents used from here on out. If you want to instrument only a specific agent, you can pass the [`instrument=True` keyword argument](api/agent/#pydantic_ai.agent.Agent.__init__) to the agent.\\n3. In our demo, `DatabaseConn` uses `asyncpg` to connect to a PostgreSQL database, so [`logfire.instrument_asyncpg()`](https://magicstack.github.io/asyncpg/current/) is used to log the database queries.\\n\\nDirectly to Provider API:\\n\\nbank\\\\_support\\\\_with\\\\_logfire.py\\n\\n```\\n...\\nfrom pydantic_ai import Agent, RunContext\\n\\nfrom bank_database import DatabaseConn\\n\\nimport logfire\\n\\nlogfire.configure()  # (1)!\\nlogfire.instrument_pydantic_ai()  # (2)!\\nlogfire.instrument_asyncpg()  # (3)!\\n\\n...\\n\\nsupport_agent = Agent(\\n    'openai:gpt-5',\\n    deps_type=SupportDependencies,\\n    output_type=SupportOutput,\\n    system_prompt=(\\n        'You are a support agent in our bank, give the '\\n        'customer support and judge the risk level of their query.'\\n    ),\\n)\\n```\\n\\n1. Configure the Logfire SDK; this will fail if a project is not set up.\\n2. This will instrument all Pydantic AI agents used from here on out. If you want to instrument only a specific agent, you can pass the [`instrument=True` keyword argument](api/agent/#pydantic_ai.agent.Agent.__init__) to the agent (a minimal per-agent sketch follows these notes).\\n3. In our demo, `DatabaseConn` uses `asyncpg` to connect to a PostgreSQL database, so [`logfire.instrument_asyncpg()`](https://magicstack.github.io/asyncpg/current/) is used to log the database queries.
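\\n\\nAs a brief sketch of that per-agent alternative (assuming only this one agent should be instrumented; `instrument=True` is the keyword argument mentioned in note 2 above):\\n\\n```\\nimport logfire\\n\\nfrom pydantic_ai import Agent\\n\\nlogfire.configure()\\n\\nagent = Agent(\\n    'openai:gpt-5',\\n    instrument=True,  # instrument only this agent, rather than all agents globally\\n)\\n```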
\\n\\nThat's enough to get the following view of your agent in action:\\n\\nSee [Monitoring and Performance](logfire/) to learn more.\\n\\n## `llms.txt`\\n\\nThe Pydantic AI documentation is available in the [llms.txt](https://llmstxt.org/) format.\\nThis format is defined in Markdown and is suited to LLMs, AI coding assistants, and agents.\\n\\nTwo formats are available:\\n\\n* [`llms.txt`](https://ai.pydantic.dev/llms.txt): a file containing a brief description\\n of the project, along with links to the different sections of the documentation. The structure\\n of this file is described in detail [here](https://llmstxt.org/#format).\\n* [`llms-full.txt`](https://ai.pydantic.dev/llms-full.txt): similar to the `llms.txt` file,\\n but with the content of every link included. Note that this file may be too large for some LLMs.\\n\\nAs of today, these files are not automatically leveraged by IDEs or coding agents, but they will use them if you provide a link or the full text.\\n\\n## Next Steps\\n\\nTo try Pydantic AI for yourself, [install it](install/) and follow the instructions [in the examples](examples/setup/).\\n\\nRead the [docs](agents/) to learn more about building applications with Pydantic AI.\\n\\nRead the [API Reference](api/agent/) to understand Pydantic AI's interface.\\n\\nJoin [Slack](https://logfire.pydantic.dev/docs/join-slack/) or file an issue on [GitHub](https://github.com/pydantic/pydantic-ai/issues) if you have any questions.\\n\\n\\n\\n© Pydantic Services Inc. 2024 to present\"},\"title\":\"Pydantic AI\"}}} }\n\nevent: content_block_stop\ndata: {\"type\":\"content_block_stop\",\"index\":2 }\n\nevent: content_block_start\ndata: {\"type\":\"content_block_start\",\"index\":3,\"content_block\":{\"type\":\"text\",\"text\":\"\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":3,\"delta\":{\"type\":\"text_delta\",\"text\":\"\\\"\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":3,\"delta\":{\"type\":\"text_delta\",\"text\":\"Gen\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":3,\"delta\":{\"type\":\"text_delta\",\"text\":\"A\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":3,\"delta\":{\"type\":\"text_delta\",\"text\":\"I Agent\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":3,\"delta\":{\"type\":\"text_delta\",\"text\":\" Framework\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":3,\"delta\":{\"type\":\"text_delta\",\"text\":\",\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":3,\"delta\":{\"type\":\"text_delta\",\"text\":\" the\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":3,\"delta\":{\"type\":\"text_delta\",\"text\":\" Pydantic way\"} }\n\nevent: content_block_delta\ndata: {\"type\":\"content_block_delta\",\"index\":3,\"delta\":{\"type\":\"text_delta\",\"text\":\"\\\"\"} }\n\nevent: content_block_stop\ndata: {\"type\":\"content_block_stop\",\"index\":3 }\n\nevent: message_delta\ndata: 
{\"type\":\"message_delta\",\"delta\":{\"stop_reason\":\"end_turn\",\"stop_sequence\":null},\"usage\":{\"input_tokens\":11453,\"cache_creation_input_tokens\":0,\"cache_read_input_tokens\":0,\"output_tokens\":151,\"server_tool_use\":{\"web_search_requests\":0,\"web_fetch_requests\":1}} + \ }\n\nevent: message_stop\ndata: {\"type\":\"message_stop\" }\n\n" headers: cache-control: - no-cache @@ -199,7 +358,7 @@ interactions: content-type: - text/event-stream; charset=utf-8 retry-after: - - '15' + - '46' strict-transport-security: - max-age=31536000; includeSubDomains; preload transfer-encoding: @@ -208,4 +367,3 @@ interactions: code: 200 message: OK version: 1 -... diff --git a/tests/models/cassettes/test_google/test_google_model_web_search_tool.yaml b/tests/models/cassettes/test_google/test_google_model_web_search_tool.yaml index 3da8a73955..929a05e527 100644 --- a/tests/models/cassettes/test_google/test_google_model_web_search_tool.yaml +++ b/tests/models/cassettes/test_google/test_google_model_web_search_tool.yaml @@ -8,7 +8,7 @@ interactions: connection: - keep-alive content-length: - - '247' + - '277' content-type: - application/json host: @@ -19,7 +19,9 @@ interactions: - parts: - text: What is the weather in San Francisco today? role: user - generationConfig: {} + generationConfig: + responseModalities: + - TEXT systemInstruction: parts: - text: You are a helpful chatbot. @@ -32,11 +34,11 @@ interactions: alt-svc: - h3=":443"; ma=2592000,h3-29=":443"; ma=2592000 content-length: - - '9827' + - '11738' content-type: - application/json; charset=UTF-8 server-timing: - - gfet4t7; dur=8115 + - gfet4t7; dur=9106 transfer-encoding: - chunked vary: @@ -48,15 +50,13 @@ interactions: - content: parts: - text: |- - ## Weather in San Francisco is Mild and Partly Cloudy + **San Francisco Experiences a Mostly Cloudy Day with Mild Temperatures** - **San Francisco, CA** - Residents and visitors in San Francisco are experiencing a mild Tuesday, with partly cloudy skies and temperatures hovering around 69°F. There is a very low chance of rain throughout the day. + As of Monday in San Francisco, the weather is predominantly mostly cloudy with a current temperature of 51°F, which feels more like 49°F. Other reports describe the sky as partly cloudy. The forecast for the day indicates that cloudy conditions will persist with a slight 10% chance of rain. - According to the latest weather reports, the forecast for the remainder of the day is expected to be sunny, with highs ranging from the mid-60s to the lower 80s. Winds are predicted to come from the west at 10 to 15 mph. + The high temperature for the day is expected to reach the low to mid-50s, with forecasts predicting a high of 54°F. The low for tonight is anticipated to be in the mid-40s, with some forecasts calling for a low of 45°F. - As the evening approaches, the skies are expected to remain partly cloudy, with temperatures dropping to the upper 50s. There is a slight increase in the chance of rain overnight, but it remains low at 20%. - - Overall, today's weather in San Francisco is pleasant, with a mix of sun and clouds and comfortable temperatures. + Humidity levels are relatively high, reported at 77%. Winds are generally light, coming from the north at 5 to 10 mph. Visibility has been noted as being around 1.5 to 2 miles. There is also a possibility of dense fog in some areas. 
role: model finishReason: STOP groundingMetadata: @@ -65,51 +65,79 @@ interactions: title: Weather information for San Francisco, CA, US uri: https://www.google.com/search?q=weather+in+San Francisco, CA,+US - web: - title: weather.gov - uri: https://vertexaisearch.cloud.google.com/grounding-api-redirect/AUZIYQF_uqo2G5Goeww8iF1L_dYa2sqWGhzu_UnxEZd1gQ7ZNuXEVVVYEEYcx_La3kuODFm0dPUhHeF4qGP1c6kJ86i4SKfvRqFitMCvNiDx07eC5iM7axwepoTv3FeUdIRC-ou1P-6DDykZ4QzcxcrKISa_1Q== + title: cbsnews.com + uri: https://vertexaisearch.cloud.google.com/grounding-api-redirect/AUZIYQHs0KxAufAKly9TnNAnn-Baxlk1USk6vVjzW1FEEUCZKnE5eeatKXcIXJ4HZNDI7ROs1q3IuHTZp5bZwB3hc-u1sXnXI0rosZTNt-t6H9FTF9owH4M5u-54bnuL01OC1C3fEnU7MNRV - web: title: wunderground.com - uri: https://vertexaisearch.cloud.google.com/grounding-api-redirect/AUZIYQFywixFZicmDjijfhfLNw8ya7XdqWR31aJp8CHyULLelG8bujH1TuqeP9RAhK6Pcm1qz11ujm2yM7gM5bJXDFsZwbsubub4cnUp5ixRaloJcjVrHkyd5RHblhkDDxHGiREV9BcuqeJovdr8qhtrCKMcvJk= + uri: https://vertexaisearch.cloud.google.com/grounding-api-redirect/AUZIYQGIi3F3lZlGrWP6vK_zucR90Esg-PCBYRgHOK0gvSIwbHM1jKGKhLwKbv-chvrUhyhc5IZ9XAjo59IBjM6Tk5p2qQK7QGW-WgFi0Nrus7IrBqgNJfWCAMTgqkde8RXWk-T2edNf90TJGVoJIKXhcuWxpuE= + - web: + title: accuweather.com + uri: https://vertexaisearch.cloud.google.com/grounding-api-redirect/AUZIYQFUEG5HLOGJoFbOTpesMFek1T82haMch6RGzVbNaG-m-B7mbwLkfb4pHpCE8CH_RHUMa5GKNPUxev47neFe9YXiKJdXKo4gMABpBHjb3AjAXg5UNoY3hvMfhBVw-mxSLTzHuRzdxvjgMpDbskeuMVt0jM543GJnG06EVVzeYm8UUemWTS2UJyE= + - web: + title: theweathernetwork.com + uri: https://vertexaisearch.cloud.google.com/grounding-api-redirect/AUZIYQHtG8yKh-VGE2kjUi05sHqdu5HUVFr6NUs9F3SdvzlnHjubasE5fLourWIMk6Wmgd6VFmAj8NcY3HNeFosMwnxMc3zyvlZ2V6gNDMFuGgJCofZD1vlE0t2vv4KFC13o1LnElXVvzht7u-6kfwQybN_57kHs63NjwCQLiYECj8Ub7yDRhCYAzCU= + - web: + title: weather.com + uri: https://vertexaisearch.cloud.google.com/grounding-api-redirect/AUZIYQHggnMLBYdYahOGPJ6dykd1mBx7bs82NTc6T-pndOKmIdb8s-3QQ2571SFt8NPG6_UstE9rYG5g2yegUOlsiREqykqesDB7UP58H3ApEe2hDCMTqSyRllMUusJecf2jVHF8kb2Y1rCBNkzaXKuhtxgx6OPvoaYNnYDhIo73 groundingSupports: - groundingChunkIndices: - 0 segment: - endIndex: 216 - startIndex: 55 - text: '**San Francisco, CA** - Residents and visitors in San Francisco are experiencing a mild Tuesday, with - partly cloudy skies and temperatures hovering around 69°F.' + endIndex: 213 + startIndex: 74 + text: As of Monday in San Francisco, the weather is predominantly mostly cloudy with a current temperature of + 51°F, which feels more like 49°F. - groundingChunkIndices: - - 0 + - 1 segment: - endIndex: 271 - startIndex: 217 - text: There is a very low chance of rain throughout the day. + endIndex: 262 + startIndex: 214 + text: Other reports describe the sky as partly cloudy. - groundingChunkIndices: - - 1 + - 0 segment: - endIndex: 434 - startIndex: 273 - text: According to the latest weather reports, the forecast for the remainder of the day is expected to be sunny, - with highs ranging from the mid-60s to the lower 80s. + endIndex: 367 + startIndex: 263 + text: The forecast for the day indicates that cloudy conditions will persist with a slight 10% chance of rain. - groundingChunkIndices: - 2 + - 3 segment: - endIndex: 493 - startIndex: 435 - text: Winds are predicted to come from the west at 10 to 15 mph. + endIndex: 485 + startIndex: 369 + text: The high temperature for the day is expected to reach the low to mid-50s, with forecasts predicting a + high of 54°F. 
- groundingChunkIndices: - - 1 + - 3 segment: - endIndex: 614 - startIndex: 495 - text: As the evening approaches, the skies are expected to remain partly cloudy, with temperatures dropping - to the upper 50s. + endIndex: 590 + startIndex: 486 + text: The low for tonight is anticipated to be in the mid-40s, with some forecasts calling for a low of 45°F. - groundingChunkIndices: - 0 segment: - endIndex: 701 - startIndex: 615 - text: There is a slight increase in the chance of rain overnight, but it remains low at 20%. + endIndex: 645 + startIndex: 592 + text: Humidity levels are relatively high, reported at 77%. + - groundingChunkIndices: + - 2 + segment: + endIndex: 710 + startIndex: 646 + text: Winds are generally light, coming from the north at 5 to 10 mph. + - groundingChunkIndices: + - 4 + - 5 + segment: + endIndex: 768 + startIndex: 711 + text: Visibility has been noted as being around 1.5 to 2 miles. + - groundingChunkIndices: + - 2 + segment: + endIndex: 824 + startIndex: 769 + text: There is also a possibility of dense fog in some areas. searchEntryPoint: renderedContent: |