From 616192ea8b91d8d47b1ed9d17af41906d93d9de9 Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Mon, 19 May 2025 17:45:57 -0700
Subject: [PATCH 01/22] Runner

---
 src/agents/run.py | 294 ++++++++++++++++++++++++----------------------
 1 file changed, 153 insertions(+), 141 deletions(-)

diff --git a/src/agents/run.py b/src/agents/run.py
index 849da7bfc..018200a9a 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -1,5 +1,6 @@
 from __future__ import annotations
 
+import abc
 import asyncio
 import copy
 from dataclasses import dataclass, field
@@ -106,7 +107,48 @@ class RunConfig:
     """
 
 
-class Runner:
+class Runner(abc.ABC):
+    @abc.abstractmethod
+    async def run_impl(
+        self,
+        starting_agent: Agent[TContext],
+        input: str | list[TResponseInputItem],
+        *,
+        context: TContext | None = None,
+        max_turns: int = DEFAULT_MAX_TURNS,
+        hooks: RunHooks[TContext] | None = None,
+        run_config: RunConfig | None = None,
+        previous_response_id: str | None = None,
+    ) -> RunResult:
+        pass
+
+    @abc.abstractmethod
+    def run_sync_impl(
+        self,
+        starting_agent: Agent[TContext],
+        input: str | list[TResponseInputItem],
+        *,
+        context: TContext | None = None,
+        max_turns: int = DEFAULT_MAX_TURNS,
+        hooks: RunHooks[TContext] | None = None,
+        run_config: RunConfig | None = None,
+        previous_response_id: str | None = None,
+    ) -> RunResult:
+        pass
+
+    @abc.abstractmethod
+    def run_streaming_impl(
+        self,
+        starting_agent: Agent[TContext],
+        input: str | list[TResponseInputItem],
+        context: TContext | None = None,
+        max_turns: int = DEFAULT_MAX_TURNS,
+        hooks: RunHooks[TContext] | None = None,
+        run_config: RunConfig | None = None,
+        previous_response_id: str | None = None,
+    ) -> RunResultStreaming:
+        pass
+
     @classmethod
     async def run(
         cls,
@@ -119,36 +161,102 @@ async def run(
         run_config: RunConfig | None = None,
         previous_response_id: str | None = None,
     ) -> RunResult:
-        """Run a workflow starting at the given agent. The agent will run in a loop until a final
-        output is generated. The loop runs like so:
-        1. The agent is invoked with the given input.
-        2. If there is a final output (i.e. the agent produces something of type
-            `agent.output_type`, the loop terminates.
-        3. If there's a handoff, we run the loop again, with the new agent.
-        4. Else, we run tool calls (if any), and re-run the loop.
-
-        In two cases, the agent may raise an exception:
-        1. If the max_turns is exceeded, a MaxTurnsExceeded exception is raised.
-        2. If a guardrail tripwire is triggered, a GuardrailTripwireTriggered exception is raised.
-
-        Note that only the first agent's input guardrails are run.
-
-        Args:
-            starting_agent: The starting agent to run.
-            input: The initial input to the agent. You can pass a single string for a user message,
-                or a list of input items.
-            context: The context to run the agent with.
-            max_turns: The maximum number of turns to run the agent for. A turn is defined as one
-                AI invocation (including any tool calls that might occur).
-            hooks: An object that receives callbacks on various lifecycle events.
-            run_config: Global settings for the entire agent run.
-            previous_response_id: The ID of the previous response, if using OpenAI models via the
-                Responses API, this allows you to skip passing in input from the previous turn.
-
-        Returns:
-            A run result containing all the inputs, guardrail results and the output of the last
-            agent. Agents may perform handoffs, so we don't know the specific type of the output.
-        """
+        return await DefaultRunner().run_impl(
+            starting_agent,
+            input,
+            context=context,
+            max_turns=max_turns,
+            hooks=hooks,
+            run_config=run_config,
+            previous_response_id=previous_response_id,
+        )
+
+    @classmethod
+    def run_sync(
+        cls,
+        starting_agent: Agent[TContext],
+        input: str | list[TResponseInputItem],
+        *,
+        context: TContext | None = None,
+        max_turns: int = DEFAULT_MAX_TURNS,
+        hooks: RunHooks[TContext] | None = None,
+        run_config: RunConfig | None = None,
+        previous_response_id: str | None = None,
+    ) -> RunResult:
+        return DefaultRunner().run_sync_impl(
+            starting_agent,
+            input,
+            context=context,
+            max_turns=max_turns,
+            hooks=hooks,
+            run_config=run_config,
+            previous_response_id=previous_response_id,
+        )
+
+    @classmethod
+    def run_streamed(
+        cls,
+        starting_agent: Agent[TContext],
+        input: str | list[TResponseInputItem],
+        context: TContext | None = None,
+        max_turns: int = DEFAULT_MAX_TURNS,
+        hooks: RunHooks[TContext] | None = None,
+        run_config: RunConfig | None = None,
+        previous_response_id: str | None = None,
+    ) -> RunResultStreaming:
+        return DefaultRunner().run_streaming_impl(
+            starting_agent,
+            input,
+            context=context,
+            max_turns=max_turns,
+            hooks=hooks,
+            run_config=run_config,
+            previous_response_id=previous_response_id,
+        )
+
+    @classmethod
+    def _get_output_schema(cls, agent: Agent[Any]) -> AgentOutputSchemaBase | None:
+        if agent.output_type is None or agent.output_type is str:
+            return None
+        elif isinstance(agent.output_type, AgentOutputSchemaBase):
+            return agent.output_type
+
+        return AgentOutputSchema(agent.output_type)
+
+    @classmethod
+    def _get_handoffs(cls, agent: Agent[Any]) -> list[Handoff]:
+        handoffs = []
+        for handoff_item in agent.handoffs:
+            if isinstance(handoff_item, Handoff):
+                handoffs.append(handoff_item)
+            elif isinstance(handoff_item, Agent):
+                handoffs.append(handoff(handoff_item))
+        return handoffs
+
+    @classmethod
+    def _get_model(cls, agent: Agent[Any], run_config: RunConfig) -> Model:
+        if isinstance(run_config.model, Model):
+            return run_config.model
+        elif isinstance(run_config.model, str):
+            return run_config.model_provider.get_model(run_config.model)
+        elif isinstance(agent.model, Model):
+            return agent.model
+
+        return run_config.model_provider.get_model(agent.model)
+
+
+class DefaultRunner(Runner):
+    async def run_impl(
+        self,
+        starting_agent: Agent[TContext],
+        input: str | list[TResponseInputItem],
+        *,
+        context: TContext | None = None,
+        max_turns: int = DEFAULT_MAX_TURNS,
+        hooks: RunHooks[TContext] | None = None,
+        run_config: RunConfig | None = None,
+        previous_response_id: str | None = None,
+    ) -> RunResult:
         if hooks is None:
             hooks = RunHooks[Any]()
         if run_config is None:
@@ -183,8 +291,8 @@ async def run(
                     # Start an agent span if we don't have one. This span is ended if the current
                     # agent changes, or if the agent loop ends.
                     if current_span is None:
-                        handoff_names = [h.agent_name for h in cls._get_handoffs(current_agent)]
-                        if output_schema := cls._get_output_schema(current_agent):
+                        handoff_names = [h.agent_name for h in self._get_handoffs(current_agent)]
+                        if output_schema := self._get_output_schema(current_agent):
                             output_type_name = output_schema.name()
                         else:
                             output_type_name = "str"
@@ -196,7 +304,7 @@ async def run(
                         )
                         current_span.start(mark_as_current=True)
 
-                        all_tools = await cls._get_all_tools(current_agent)
+                        all_tools = await self._get_all_tools(current_agent)
                         current_span.span_data.tools = [t.name for t in all_tools]
 
                     current_turn += 1
@@ -216,14 +324,14 @@ async def run(
 
                     if current_turn == 1:
                         input_guardrail_results, turn_result = await asyncio.gather(
-                            cls._run_input_guardrails(
+                            self._run_input_guardrails(
                                 starting_agent,
                                 starting_agent.input_guardrails
                                 + (run_config.input_guardrails or []),
                                 copy.deepcopy(input),
                                 context_wrapper,
                             ),
-                            cls._run_single_turn(
+                            self._run_single_turn(
                                 agent=current_agent,
                                 all_tools=all_tools,
                                 original_input=original_input,
@@ -237,7 +345,7 @@ async def run(
                             ),
                         )
                     else:
-                        turn_result = await cls._run_single_turn(
+                        turn_result = await self._run_single_turn(
                             agent=current_agent,
                             all_tools=all_tools,
                             original_input=original_input,
@@ -256,7 +364,7 @@ async def run(
                     generated_items = turn_result.generated_items
 
                     if isinstance(turn_result.next_step, NextStepFinalOutput):
-                        output_guardrail_results = await cls._run_output_guardrails(
+                        output_guardrail_results = await self._run_output_guardrails(
                             current_agent.output_guardrails + (run_config.output_guardrails or []),
                             current_agent,
                             turn_result.next_step.output,
@@ -287,9 +395,8 @@ async def run(
                 if current_span:
                     current_span.finish(reset_current=True)
 
-    @classmethod
-    def run_sync(
-        cls,
+    def run_sync_impl(
+        self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
         *,
@@ -299,42 +406,8 @@ def run_sync(
         run_config: RunConfig | None = None,
         previous_response_id: str | None = None,
     ) -> RunResult:
-        """Run a workflow synchronously, starting at the given agent. Note that this just wraps the
-        `run` method, so it will not work if there's already an event loop (e.g. inside an async
-        function, or in a Jupyter notebook or async context like FastAPI). For those cases, use
-        the `run` method instead.
-
-        The agent will run in a loop until a final output is generated. The loop runs like so:
-        1. The agent is invoked with the given input.
-        2. If there is a final output (i.e. the agent produces something of type
-            `agent.output_type`, the loop terminates.
-        3. If there's a handoff, we run the loop again, with the new agent.
-        4. Else, we run tool calls (if any), and re-run the loop.
-
-        In two cases, the agent may raise an exception:
-        1. If the max_turns is exceeded, a MaxTurnsExceeded exception is raised.
-        2. If a guardrail tripwire is triggered, a GuardrailTripwireTriggered exception is raised.
-
-        Note that only the first agent's input guardrails are run.
-
-        Args:
-            starting_agent: The starting agent to run.
-            input: The initial input to the agent. You can pass a single string for a user message,
-                or a list of input items.
-            context: The context to run the agent with.
-            max_turns: The maximum number of turns to run the agent for. A turn is defined as one
-                AI invocation (including any tool calls that might occur).
-            hooks: An object that receives callbacks on various lifecycle events.
-            run_config: Global settings for the entire agent run.
-            previous_response_id: The ID of the previous response, if using OpenAI models via the
-                Responses API, this allows you to skip passing in input from the previous turn.
-
-        Returns:
-            A run result containing all the inputs, guardrail results and the output of the last
-            agent. Agents may perform handoffs, so we don't know the specific type of the output.
-        """
         return asyncio.get_event_loop().run_until_complete(
-            cls.run(
+            self.run(
                 starting_agent,
                 input,
                 context=context,
@@ -345,9 +418,8 @@ def run_sync(
             )
         )
 
-    @classmethod
-    def run_streamed(
-        cls,
+    def run_streaming_impl(
+        self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
         context: TContext | None = None,
@@ -356,36 +428,6 @@ def run_streamed(
         run_config: RunConfig | None = None,
         previous_response_id: str | None = None,
     ) -> RunResultStreaming:
-        """Run a workflow starting at the given agent in streaming mode. The returned result object
-        contains a method you can use to stream semantic events as they are generated.
-
-        The agent will run in a loop until a final output is generated. The loop runs like so:
-        1. The agent is invoked with the given input.
-        2. If there is a final output (i.e. the agent produces something of type
-            `agent.output_type`, the loop terminates.
-        3. If there's a handoff, we run the loop again, with the new agent.
-        4. Else, we run tool calls (if any), and re-run the loop.
-
-        In two cases, the agent may raise an exception:
-        1. If the max_turns is exceeded, a MaxTurnsExceeded exception is raised.
-        2. If a guardrail tripwire is triggered, a GuardrailTripwireTriggered exception is raised.
-
-        Note that only the first agent's input guardrails are run.
-
-        Args:
-            starting_agent: The starting agent to run.
-            input: The initial input to the agent. You can pass a single string for a user message,
-                or a list of input items.
-            context: The context to run the agent with.
-            max_turns: The maximum number of turns to run the agent for. A turn is defined as one
-                AI invocation (including any tool calls that might occur).
-            hooks: An object that receives callbacks on various lifecycle events.
-            run_config: Global settings for the entire agent run.
-            previous_response_id: The ID of the previous response, if using OpenAI models via the
-                Responses API, this allows you to skip passing in input from the previous turn.
-        Returns:
-            A result object that contains data about the run, as well as a method to stream events.
-        """
         if hooks is None:
             hooks = RunHooks[Any]()
         if run_config is None:
@@ -406,7 +448,7 @@ def run_streamed(
             )
         )
 
-        output_schema = cls._get_output_schema(starting_agent)
+        output_schema = self._get_output_schema(starting_agent)
         context_wrapper: RunContextWrapper[TContext] = RunContextWrapper(
             context=context  # type: ignore
         )
@@ -429,7 +471,7 @@ def run_streamed(
 
         # Kick off the actual agent loop in the background and return the streamed result object.
         streamed_result._run_impl_task = asyncio.create_task(
-            cls._run_streamed_impl(
+            self._run_streamed_impl(
                 starting_input=input,
                 streamed_result=streamed_result,
                 starting_agent=starting_agent,
@@ -933,36 +975,6 @@ async def _get_new_response(
 
         return new_response
 
-    @classmethod
-    def _get_output_schema(cls, agent: Agent[Any]) -> AgentOutputSchemaBase | None:
-        if agent.output_type is None or agent.output_type is str:
-            return None
-        elif isinstance(agent.output_type, AgentOutputSchemaBase):
-            return agent.output_type
-
-        return AgentOutputSchema(agent.output_type)
-
-    @classmethod
-    def _get_handoffs(cls, agent: Agent[Any]) -> list[Handoff]:
-        handoffs = []
-        for handoff_item in agent.handoffs:
-            if isinstance(handoff_item, Handoff):
-                handoffs.append(handoff_item)
-            elif isinstance(handoff_item, Agent):
-                handoffs.append(handoff(handoff_item))
-        return handoffs
-
     @classmethod
     async def _get_all_tools(cls, agent: Agent[Any]) -> list[Tool]:
         return await agent.get_all_tools()
-
-    @classmethod
-    def _get_model(cls, agent: Agent[Any], run_config: RunConfig) -> Model:
-        if isinstance(run_config.model, Model):
-            return run_config.model
-        elif isinstance(run_config.model, str):
-            return run_config.model_provider.get_model(run_config.model)
-        elif isinstance(agent.model, Model):
-            return agent.model
-
-        return run_config.model_provider.get_model(agent.model)

From 046c2874ee8f50934132347a7e6489a6df5600ed Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Mon, 19 May 2025 17:51:18 -0700
Subject: [PATCH 02/22] LLM: run.py: add support for configurable default
 Runner

- Introduce a DEFAULT_RUNNER global and a set_default_runner() function to allow callers to specify a default Runner for agent runs.
- Update Runner.run, run_sync, and run_streamed to use DEFAULT_RUNNER if set, otherwise fall back to DefaultRunner.
- Add detailed docstrings to the run, run_sync, and run_streamed methods for clarity on agent execution flow and exceptions.
---
 src/agents/run.py | 99 +++++++++++++++++++++++++++++++++++++++++++++--
 1 file changed, 96 insertions(+), 3 deletions(-)

diff --git a/src/agents/run.py b/src/agents/run.py
index 018200a9a..6b7a2bd3c 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -46,6 +46,15 @@
 from .util import _coro, _error_tracing
 
 DEFAULT_MAX_TURNS = 10
+DEFAULT_RUNNER: Runner | None = None
+
+
+def set_default_runner(runner: Runner) -> None:
+    """
+    Set the default runner to use for the agent run.
+    """
+    global DEFAULT_RUNNER
+    DEFAULT_RUNNER = runner
 
 
 @dataclass
@@ -161,7 +170,34 @@ async def run(
         run_config: RunConfig | None = None,
         previous_response_id: str | None = None,
     ) -> RunResult:
-        return await DefaultRunner().run_impl(
+        """Run a workflow starting at the given agent. The agent will run in a loop until a final
+        output is generated. The loop runs like so:
+        1. The agent is invoked with the given input.
+        2. If there is a final output (i.e. the agent produces something of type
+            `agent.output_type`, the loop terminates.
+        3. If there's a handoff, we run the loop again, with the new agent.
+        4. Else, we run tool calls (if any), and re-run the loop.
+        In two cases, the agent may raise an exception:
+        1. If the max_turns is exceeded, a MaxTurnsExceeded exception is raised.
+        2. If a guardrail tripwire is triggered, a GuardrailTripwireTriggered exception is raised.
+        Note that only the first agent's input guardrails are run.
+        Args:
+            starting_agent: The starting agent to run.
+            input: The initial input to the agent. You can pass a single string for a user message,
+                or a list of input items.
+            context: The context to run the agent with.
+            max_turns: The maximum number of turns to run the agent for. A turn is defined as one
+                AI invocation (including any tool calls that might occur).
+            hooks: An object that receives callbacks on various lifecycle events.
+            run_config: Global settings for the entire agent run.
+            previous_response_id: The ID of the previous response, if using OpenAI models via the
+                Responses API, this allows you to skip passing in input from the previous turn.
+        Returns:
+            A run result containing all the inputs, guardrail results and the output of the last
+            agent. Agents may perform handoffs, so we don't know the specific type of the output.
+        """
+        runner = DEFAULT_RUNNER or DefaultRunner()
+        return await runner.run_impl(
             starting_agent,
             input,
             context=context,
@@ -183,7 +219,37 @@ def run_sync(
         run_config: RunConfig | None = None,
         previous_response_id: str | None = None,
     ) -> RunResult:
-        return DefaultRunner().run_sync_impl(
+        """Run a workflow synchronously, starting at the given agent. Note that this just wraps the
+        `run` method, so it will not work if there's already an event loop (e.g. inside an async
+        function, or in a Jupyter notebook or async context like FastAPI). For those cases, use
+        the `run` method instead.
+        The agent will run in a loop until a final output is generated. The loop runs like so:
+        1. The agent is invoked with the given input.
+        2. If there is a final output (i.e. the agent produces something of type
+            `agent.output_type`, the loop terminates.
+        3. If there's a handoff, we run the loop again, with the new agent.
+        4. Else, we run tool calls (if any), and re-run the loop.
+        In two cases, the agent may raise an exception:
+        1. If the max_turns is exceeded, a MaxTurnsExceeded exception is raised.
+        2. If a guardrail tripwire is triggered, a GuardrailTripwireTriggered exception is raised.
+        Note that only the first agent's input guardrails are run.
+        Args:
+            starting_agent: The starting agent to run.
+            input: The initial input to the agent. You can pass a single string for a user message,
+                or a list of input items.
+            context: The context to run the agent with.
+            max_turns: The maximum number of turns to run the agent for. A turn is defined as one
+                AI invocation (including any tool calls that might occur).
+            hooks: An object that receives callbacks on various lifecycle events.
+            run_config: Global settings for the entire agent run.
+            previous_response_id: The ID of the previous response, if using OpenAI models via the
+                Responses API, this allows you to skip passing in input from the previous turn.
+        Returns:
+            A run result containing all the inputs, guardrail results and the output of the last
+            agent. Agents may perform handoffs, so we don't know the specific type of the output.
+        """
+        runner = DEFAULT_RUNNER or DefaultRunner()
+        return runner.run_sync_impl(
             starting_agent,
             input,
             context=context,
@@ -204,7 +270,34 @@ def run_streamed(
         run_config: RunConfig | None = None,
         previous_response_id: str | None = None,
     ) -> RunResultStreaming:
-        return DefaultRunner().run_streaming_impl(
+        """Run a workflow starting at the given agent in streaming mode. The returned result object
+        contains a method you can use to stream semantic events as they are generated.
+        The agent will run in a loop until a final output is generated. The loop runs like so:
+        1. The agent is invoked with the given input.
+        2. If there is a final output (i.e. the agent produces something of type
+            `agent.output_type`, the loop terminates.
+        3. If there's a handoff, we run the loop again, with the new agent.
+        4. Else, we run tool calls (if any), and re-run the loop.
+        In two cases, the agent may raise an exception:
+        1. If the max_turns is exceeded, a MaxTurnsExceeded exception is raised.
+        2. If a guardrail tripwire is triggered, a GuardrailTripwireTriggered exception is raised.
+        Note that only the first agent's input guardrails are run.
+        Args:
+            starting_agent: The starting agent to run.
+            input: The initial input to the agent. You can pass a single string for a user message,
+                or a list of input items.
+            context: The context to run the agent with.
+            max_turns: The maximum number of turns to run the agent for. A turn is defined as one
+                AI invocation (including any tool calls that might occur).
+            hooks: An object that receives callbacks on various lifecycle events.
+            run_config: Global settings for the entire agent run.
+            previous_response_id: The ID of the previous response, if using OpenAI models via the
+                Responses API, this allows you to skip passing in input from the previous turn.
+        Returns:
+            A result object that contains data about the run, as well as a method to stream events.
+        """
+        runner = DEFAULT_RUNNER or DefaultRunner()
+        return runner.run_streaming_impl(
             starting_agent,
             input,
             context=context,

From c7b5053e4e6f7542d65e2c22cdd6456a165f12ac Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Mon, 19 May 2025 17:52:14 -0700
Subject: [PATCH 03/22] LLM: agents: export DefaultRunner and
 set_default_runner in __init__

---
 src/agents/__init__.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/src/agents/__init__.py b/src/agents/__init__.py
index 6d7c90b4f..3c9c84657 100644
--- a/src/agents/__init__.py
+++ b/src/agents/__init__.py
@@ -45,7 +45,7 @@
 from .models.openai_provider import OpenAIProvider
 from .models.openai_responses import OpenAIResponsesModel
 from .result import RunResult, RunResultStreaming
-from .run import RunConfig, Runner
+from .run import DefaultRunner, RunConfig, Runner, set_default_runner
 from .run_context import RunContextWrapper, TContext
 from .stream_events import (
     AgentUpdatedStreamEvent,
@@ -150,6 +150,7 @@ def enable_verbose_stdout_logging():
     "ToolsToFinalOutputFunction",
     "ToolsToFinalOutputResult",
     "Runner",
+    "DefaultRunner",
     "Model",
     "ModelProvider",
     "ModelTracing",
@@ -244,6 +245,7 @@ def enable_verbose_stdout_logging():
     "set_default_openai_key",
     "set_default_openai_client",
     "set_default_openai_api",
+    "set_default_runner",
     "set_tracing_export_api_key",
     "enable_verbose_stdout_logging",
     "gen_trace_id",

From a10f9459bf84c1871cb969a902b95a4b354f60a3 Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Mon, 19 May 2025 18:02:40 -0700
Subject: [PATCH 04/22] test

---
 src/agents/run.py |  8 ++++----
 tests/conftest.py |  6 ++++++
 tests/test_run.py | 26 ++++++++++++++++++++++++++
 3 files changed, 36 insertions(+), 4 deletions(-)
 create mode 100644 tests/test_run.py

diff --git a/src/agents/run.py b/src/agents/run.py
index 6b7a2bd3c..6bf1ed16b 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -49,7 +49,7 @@
 DEFAULT_RUNNER: Runner | None = None
 
 
-def set_default_runner(runner: Runner) -> None:
+def set_default_runner(runner: Runner | None) -> None:
     """
     Set the default runner to use for the agent run.
     """
@@ -146,7 +146,7 @@ def run_sync_impl(
         pass
 
     @abc.abstractmethod
-    def run_streaming_impl(
+    def run_streamed_impl(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
@@ -297,7 +297,7 @@ def run_streamed(
             A result object that contains data about the run, as well as a method to stream events.
         """
         runner = DEFAULT_RUNNER or DefaultRunner()
-        return runner.run_streaming_impl(
+        return runner.run_streamed_impl(
             starting_agent,
             input,
             context=context,
@@ -511,7 +511,7 @@ def run_sync_impl(
             )
         )
 
-    def run_streaming_impl(
+    def run_streamed_impl(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
diff --git a/tests/conftest.py b/tests/conftest.py
index ba0d88221..622b61b14 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -5,6 +5,7 @@
 from agents.models import _openai_shared
 from agents.models.openai_chatcompletions import OpenAIChatCompletionsModel
 from agents.models.openai_responses import OpenAIResponsesModel
+from agents.run import set_default_runner
 from agents.tracing import set_trace_processors
 from agents.tracing.setup import GLOBAL_TRACE_PROVIDER
 
@@ -33,6 +34,11 @@ def clear_openai_settings():
     _openai_shared._use_responses_by_default = True
 
 
+@pytest.fixture(autouse=True)
+def clear_default_runner():
+    set_default_runner(None)
+
+
 # This fixture will run after all tests end
 @pytest.fixture(autouse=True, scope="session")
 def shutdown_trace_provider():
diff --git a/tests/test_run.py b/tests/test_run.py
new file mode 100644
index 000000000..b01c8605e
--- /dev/null
+++ b/tests/test_run.py
@@ -0,0 +1,26 @@
+from __future__ import annotations
+
+from unittest import mock
+
+import pytest
+
+from agents import Agent, Runner
+from agents.run import set_default_runner
+
+from .fake_model import FakeModel
+
+
+@pytest.mark.asyncio
+async def test_static_run_methods_call_into_default_runner() -> None:
+    runner = mock.Mock(spec=Runner)
+    set_default_runner(runner)
+
+    agent = Agent(name="test", model=FakeModel())
+    await Runner.run(agent, input="test")
+    runner.run_impl.assert_called_once()
+
+    Runner.run_streamed(agent, input="test")
+    runner.run_streamed_impl.assert_called_once()
+
+    Runner.run_sync(agent, input="test")
+    runner.run_sync_impl.assert_called_once()

From 2002dd9b525a2ab782cb059a1e8a016f0b2cc6ac Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Mon, 19 May 2025 18:05:20 -0700
Subject: [PATCH 05/22] LLM: rename Runner execution methods to use leading
 underscores

This commit renames the abstract and concrete methods run_impl, run_sync_impl, and run_streamed_impl in the Runner and DefaultRunner classes to _run_impl, _run_sync_impl, and _run_streamed_impl (or _start_streaming as appropriate) for improved naming consistency. Updates all method calls and test mocks accordingly. No behavior changes.
---
 src/agents/run.py | 22 +++++++++++-----------
 tests/test_run.py |  6 +++---
 2 files changed, 14 insertions(+), 14 deletions(-)

diff --git a/src/agents/run.py b/src/agents/run.py
index 6bf1ed16b..045f6f0b8 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -118,7 +118,7 @@ class RunConfig:
 
 class Runner(abc.ABC):
     @abc.abstractmethod
-    async def run_impl(
+    async def _run_impl(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
@@ -132,7 +132,7 @@ async def run_impl(
         pass
 
     @abc.abstractmethod
-    def run_sync_impl(
+    def _run_sync_impl(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
@@ -146,7 +146,7 @@ def run_sync_impl(
         pass
 
     @abc.abstractmethod
-    def run_streamed_impl(
+    def _run_streamed_impl(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
@@ -197,7 +197,7 @@ async def run(
             agent. Agents may perform handoffs, so we don't know the specific type of the output.
         """
         runner = DEFAULT_RUNNER or DefaultRunner()
-        return await runner.run_impl(
+        return await runner._run_impl(
             starting_agent,
             input,
             context=context,
@@ -249,7 +249,7 @@ def run_sync(
             agent. Agents may perform handoffs, so we don't know the specific type of the output.
         """
         runner = DEFAULT_RUNNER or DefaultRunner()
-        return runner.run_sync_impl(
+        return runner._run_sync_impl(
             starting_agent,
             input,
             context=context,
@@ -297,7 +297,7 @@ def run_streamed(
             A result object that contains data about the run, as well as a method to stream events.
         """
         runner = DEFAULT_RUNNER or DefaultRunner()
-        return runner.run_streamed_impl(
+        return runner._run_streamed_impl(
             starting_agent,
             input,
             context=context,
@@ -339,7 +339,7 @@ def _get_model(cls, agent: Agent[Any], run_config: RunConfig) -> Model:
 
 
 class DefaultRunner(Runner):
-    async def run_impl(
+    async def _run_impl(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
@@ -488,7 +488,7 @@ async def run_impl(
                 if current_span:
                     current_span.finish(reset_current=True)
 
-    def run_sync_impl(
+    def _run_sync_impl(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
@@ -511,7 +511,7 @@ def run_sync_impl(
             )
         )
 
-    def run_streamed_impl(
+    def _run_streamed_impl(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
@@ -564,7 +564,7 @@ def run_streamed_impl(
 
         # Kick off the actual agent loop in the background and return the streamed result object.
         streamed_result._run_impl_task = asyncio.create_task(
-            self._run_streamed_impl(
+            self._start_streaming(
                 starting_input=input,
                 streamed_result=streamed_result,
                 starting_agent=starting_agent,
@@ -621,7 +621,7 @@ async def _run_input_guardrails_with_queue(
         streamed_result.input_guardrail_results = guardrail_results
 
     @classmethod
-    async def _run_streamed_impl(
+    async def _start_streaming(
         cls,
         starting_input: str | list[TResponseInputItem],
         streamed_result: RunResultStreaming,
diff --git a/tests/test_run.py b/tests/test_run.py
index b01c8605e..57e33d50d 100644
--- a/tests/test_run.py
+++ b/tests/test_run.py
@@ -17,10 +17,10 @@ async def test_static_run_methods_call_into_default_runner() -> None:
 
     agent = Agent(name="test", model=FakeModel())
     await Runner.run(agent, input="test")
-    runner.run_impl.assert_called_once()
+    runner._run_impl.assert_called_once()
 
     Runner.run_streamed(agent, input="test")
-    runner.run_streamed_impl.assert_called_once()
+    runner._run_streamed_impl.assert_called_once()
 
     Runner.run_sync(agent, input="test")
-    runner.run_sync_impl.assert_called_once()
+    runner._run_sync_impl.assert_called_once()

From 40d1b91410f8ea347f074abc5e9bb813629a64d5 Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Wed, 21 May 2025 09:19:06 -0700
Subject: [PATCH 06/22] Add ID generation methods to TraceProvider (#729)

---
 src/agents/__init__.py         |  2 ++
 src/agents/tracing/__init__.py |  3 ++-
 src/agents/tracing/setup.py    | 24 ++++++++++++++++++++++++
 src/agents/tracing/util.py     | 19 +++++++++----------
 4 files changed, 37 insertions(+), 11 deletions(-)

diff --git a/src/agents/__init__.py b/src/agents/__init__.py
index 3c9c84657..65e44244f 100644
--- a/src/agents/__init__.py
+++ b/src/agents/__init__.py
@@ -92,6 +92,7 @@
     handoff_span,
     mcp_tools_span,
     set_trace_processors,
+    set_trace_provider,
     set_tracing_disabled,
     set_tracing_export_api_key,
     speech_group_span,
@@ -221,6 +222,7 @@ def enable_verbose_stdout_logging():
     "guardrail_span",
     "handoff_span",
     "set_trace_processors",
+    "set_trace_provider",
     "set_tracing_disabled",
     "speech_group_span",
     "transcription_span",
diff --git a/src/agents/tracing/__init__.py b/src/agents/tracing/__init__.py
index 9df944263..07d8af6d7 100644
--- a/src/agents/tracing/__init__.py
+++ b/src/agents/tracing/__init__.py
@@ -18,7 +18,7 @@
 )
 from .processor_interface import TracingProcessor
 from .processors import default_exporter, default_processor
-from .setup import GLOBAL_TRACE_PROVIDER
+from .setup import GLOBAL_TRACE_PROVIDER, set_trace_provider
 from .span_data import (
     AgentSpanData,
     CustomSpanData,
@@ -49,6 +49,7 @@
     "handoff_span",
     "response_span",
     "set_trace_processors",
+    "set_trace_provider",
     "set_tracing_disabled",
     "trace",
     "Trace",
diff --git a/src/agents/tracing/setup.py b/src/agents/tracing/setup.py
index 9e27d210b..daa7b86d0 100644
--- a/src/agents/tracing/setup.py
+++ b/src/agents/tracing/setup.py
@@ -2,6 +2,8 @@
 
 import os
 import threading
+import uuid
+from datetime import datetime, timezone
 from typing import Any
 
 from ..logger import logger
@@ -118,6 +120,22 @@ def set_disabled(self, disabled: bool) -> None:
         """
         self._disabled = disabled
 
+    def time_iso(self) -> str:
+        """Return the current time in ISO 8601 format."""
+        return datetime.now(timezone.utc).isoformat()
+
+    def gen_trace_id(self) -> str:
+        """Generate a new trace ID."""
+        return f"trace_{uuid.uuid4().hex}"
+
+    def gen_span_id(self) -> str:
+        """Generate a new span ID."""
+        return f"span_{uuid.uuid4().hex[:24]}"
+
+    def gen_group_id(self) -> str:
+        """Generate a new group ID."""
+        return f"group_{uuid.uuid4().hex[:24]}"
+
     def create_trace(
         self,
         name: str,
@@ -212,3 +230,9 @@ def shutdown(self) -> None:
 
 
 GLOBAL_TRACE_PROVIDER = TraceProvider()
+
+
+def set_trace_provider(provider: TraceProvider) -> None:
+    """Set the global trace provider used by tracing utilities."""
+    global GLOBAL_TRACE_PROVIDER
+    GLOBAL_TRACE_PROVIDER = provider
diff --git a/src/agents/tracing/util.py b/src/agents/tracing/util.py
index f546b4e50..af2f5ff32 100644
--- a/src/agents/tracing/util.py
+++ b/src/agents/tracing/util.py
@@ -1,22 +1,21 @@
-import uuid
-from datetime import datetime, timezone
+from .setup import GLOBAL_TRACE_PROVIDER
 
 
 def time_iso() -> str:
-    """Returns the current time in ISO 8601 format."""
-    return datetime.now(timezone.utc).isoformat()
+    """Return the current time in ISO 8601 format."""
+    return GLOBAL_TRACE_PROVIDER.time_iso()
 
 
 def gen_trace_id() -> str:
-    """Generates a new trace ID."""
-    return f"trace_{uuid.uuid4().hex}"
+    """Generate a new trace ID."""
+    return GLOBAL_TRACE_PROVIDER.gen_trace_id()
 
 
 def gen_span_id() -> str:
-    """Generates a new span ID."""
-    return f"span_{uuid.uuid4().hex[:24]}"
+    """Generate a new span ID."""
+    return GLOBAL_TRACE_PROVIDER.gen_span_id()
 
 
 def gen_group_id() -> str:
-    """Generates a new group ID."""
-    return f"group_{uuid.uuid4().hex[:24]}"
+    """Generate a new group ID."""
+    return GLOBAL_TRACE_PROVIDER.gen_group_id()

From b9145707c6c9361650d093a3f3a8e5d46ae8e52d Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Wed, 21 May 2025 09:34:06 -0700
Subject: [PATCH 07/22] LLM: refactor(tracing): move TraceProvider to separate
 module and replace global with accessor

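- Move TraceProvider and related logic (SynchronousMultiTracingProcessor) from setup.py to new provider.py module
- Replace direct GLOBAL_TRACE_PROVIDER references with get_trace_provider() accessor throughout tracing code; the accessor raises RuntimeError if no provider has been set
- Update init and util imports to use get_trace_provider
- Call set_trace_provider(TraceProvider()) when the agents.tracing package is imported (tracing/__init__.py)
- Remove ID and time generation logic from util, delegate to TraceProvider (create_trace/create_span now call self.gen_trace_id()/self.gen_span_id() instead of the util helpers)
- Update SpanImpl to always use passed-in span_id (TraceProvider.create_span generates one when the caller passes None)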
---
 src/agents/tracing/__init__.py |  13 +-
 src/agents/tracing/create.py   |  32 ++---
 src/agents/tracing/provider.py | 228 +++++++++++++++++++++++++++++++
 src/agents/tracing/setup.py    | 239 ++-------------------------------
 src/agents/tracing/spans.py    |   2 +-
 src/agents/tracing/util.py     |  10 +-
 tests/conftest.py              |   4 +-
 7 files changed, 271 insertions(+), 257 deletions(-)
 create mode 100644 src/agents/tracing/provider.py

diff --git a/src/agents/tracing/__init__.py b/src/agents/tracing/__init__.py
index 07d8af6d7..4281c29ff 100644
--- a/src/agents/tracing/__init__.py
+++ b/src/agents/tracing/__init__.py
@@ -1,5 +1,7 @@
 import atexit
 
+from agents.tracing.provider import TraceProvider
+
 from .create import (
     agent_span,
     custom_span,
@@ -18,7 +20,7 @@
 )
 from .processor_interface import TracingProcessor
 from .processors import default_exporter, default_processor
-from .setup import GLOBAL_TRACE_PROVIDER, set_trace_provider
+from .setup import get_trace_provider, set_trace_provider
 from .span_data import (
     AgentSpanData,
     CustomSpanData,
@@ -81,21 +83,21 @@ def add_trace_processor(span_processor: TracingProcessor) -> None:
     """
     Adds a new trace processor. This processor will receive all traces/spans.
     """
-    GLOBAL_TRACE_PROVIDER.register_processor(span_processor)
+    get_trace_provider().register_processor(span_processor)
 
 
 def set_trace_processors(processors: list[TracingProcessor]) -> None:
     """
     Set the list of trace processors. This will replace the current list of processors.
     """
-    GLOBAL_TRACE_PROVIDER.set_processors(processors)
+    get_trace_provider().set_processors(processors)
 
 
 def set_tracing_disabled(disabled: bool) -> None:
     """
     Set whether tracing is globally disabled.
     """
-    GLOBAL_TRACE_PROVIDER.set_disabled(disabled)
+    get_trace_provider().set_disabled(disabled)
 
 
 def set_tracing_export_api_key(api_key: str) -> None:
@@ -105,10 +107,11 @@ def set_tracing_export_api_key(api_key: str) -> None:
     default_exporter().set_api_key(api_key)
 
 
+set_trace_provider(TraceProvider())
 # Add the default processor, which exports traces and spans to the backend in batches. You can
 # change the default behavior by either:
 # 1. calling add_trace_processor(), which adds additional processors, or
 # 2. calling set_trace_processors(), which replaces the default processor.
 add_trace_processor(default_processor())
 
-atexit.register(GLOBAL_TRACE_PROVIDER.shutdown)
+atexit.register(get_trace_provider().shutdown)
diff --git a/src/agents/tracing/create.py b/src/agents/tracing/create.py
index b6fe46104..ac451abf5 100644
--- a/src/agents/tracing/create.py
+++ b/src/agents/tracing/create.py
@@ -4,7 +4,7 @@
 from typing import TYPE_CHECKING, Any
 
 from ..logger import logger
-from .setup import GLOBAL_TRACE_PROVIDER
+from .setup import get_trace_provider
 from .span_data import (
     AgentSpanData,
     CustomSpanData,
@@ -56,13 +56,13 @@ def trace(
     Returns:
         The newly created trace object.
     """
-    current_trace = GLOBAL_TRACE_PROVIDER.get_current_trace()
+    current_trace = get_trace_provider().get_current_trace()
     if current_trace:
         logger.warning(
             "Trace already exists. Creating a new trace, but this is probably a mistake."
         )
 
-    return GLOBAL_TRACE_PROVIDER.create_trace(
+    return get_trace_provider().create_trace(
         name=workflow_name,
         trace_id=trace_id,
         group_id=group_id,
@@ -73,12 +73,12 @@ def trace(
 
 def get_current_trace() -> Trace | None:
     """Returns the currently active trace, if present."""
-    return GLOBAL_TRACE_PROVIDER.get_current_trace()
+    return get_trace_provider().get_current_trace()
 
 
 def get_current_span() -> Span[Any] | None:
     """Returns the currently active span, if present."""
-    return GLOBAL_TRACE_PROVIDER.get_current_span()
+    return get_trace_provider().get_current_span()
 
 
 def agent_span(
@@ -108,7 +108,7 @@ def agent_span(
     Returns:
         The newly created agent span.
     """
-    return GLOBAL_TRACE_PROVIDER.create_span(
+    return get_trace_provider().create_span(
         span_data=AgentSpanData(name=name, handoffs=handoffs, tools=tools, output_type=output_type),
         span_id=span_id,
         parent=parent,
@@ -141,7 +141,7 @@ def function_span(
     Returns:
         The newly created function span.
     """
-    return GLOBAL_TRACE_PROVIDER.create_span(
+    return get_trace_provider().create_span(
         span_data=FunctionSpanData(name=name, input=input, output=output),
         span_id=span_id,
         parent=parent,
@@ -183,7 +183,7 @@ def generation_span(
     Returns:
         The newly created generation span.
     """
-    return GLOBAL_TRACE_PROVIDER.create_span(
+    return get_trace_provider().create_span(
         span_data=GenerationSpanData(
             input=input,
             output=output,
@@ -215,7 +215,7 @@ def response_span(
             trace/span as the parent.
         disabled: If True, we will return a Span but the Span will not be recorded.
     """
-    return GLOBAL_TRACE_PROVIDER.create_span(
+    return get_trace_provider().create_span(
         span_data=ResponseSpanData(response=response),
         span_id=span_id,
         parent=parent,
@@ -246,7 +246,7 @@ def handoff_span(
     Returns:
         The newly created handoff span.
     """
-    return GLOBAL_TRACE_PROVIDER.create_span(
+    return get_trace_provider().create_span(
         span_data=HandoffSpanData(from_agent=from_agent, to_agent=to_agent),
         span_id=span_id,
         parent=parent,
@@ -278,7 +278,7 @@ def custom_span(
     Returns:
         The newly created custom span.
     """
-    return GLOBAL_TRACE_PROVIDER.create_span(
+    return get_trace_provider().create_span(
         span_data=CustomSpanData(name=name, data=data or {}),
         span_id=span_id,
         parent=parent,
@@ -306,7 +306,7 @@ def guardrail_span(
             trace/span as the parent.
         disabled: If True, we will return a Span but the Span will not be recorded.
     """
-    return GLOBAL_TRACE_PROVIDER.create_span(
+    return get_trace_provider().create_span(
         span_data=GuardrailSpanData(name=name, triggered=triggered),
         span_id=span_id,
         parent=parent,
@@ -344,7 +344,7 @@ def transcription_span(
     Returns:
         The newly created speech-to-text span.
     """
-    return GLOBAL_TRACE_PROVIDER.create_span(
+    return get_trace_provider().create_span(
         span_data=TranscriptionSpanData(
             input=input,
             input_format=input_format,
@@ -386,7 +386,7 @@ def speech_span(
             trace/span as the parent.
         disabled: If True, we will return a Span but the Span will not be recorded.
     """
-    return GLOBAL_TRACE_PROVIDER.create_span(
+    return get_trace_provider().create_span(
         span_data=SpeechSpanData(
             model=model,
             input=input,
@@ -419,7 +419,7 @@ def speech_group_span(
             trace/span as the parent.
         disabled: If True, we will return a Span but the Span will not be recorded.
     """
-    return GLOBAL_TRACE_PROVIDER.create_span(
+    return get_trace_provider().create_span(
         span_data=SpeechGroupSpanData(input=input),
         span_id=span_id,
         parent=parent,
@@ -447,7 +447,7 @@ def mcp_tools_span(
             trace/span as the parent.
         disabled: If True, we will return a Span but the Span will not be recorded.
     """
-    return GLOBAL_TRACE_PROVIDER.create_span(
+    return get_trace_provider().create_span(
         span_data=MCPListToolsSpanData(server=server, result=result),
         span_id=span_id,
         parent=parent,
diff --git a/src/agents/tracing/provider.py b/src/agents/tracing/provider.py
new file mode 100644
index 000000000..b9f4c63e9
--- /dev/null
+++ b/src/agents/tracing/provider.py
@@ -0,0 +1,228 @@
+from __future__ import annotations
+
+import os
+import threading
+import uuid
+from datetime import datetime, timezone
+from typing import Any
+
+from ..logger import logger
+from .processor_interface import TracingProcessor
+from .scope import Scope
+from .spans import NoOpSpan, Span, SpanImpl, TSpanData
+from .traces import NoOpTrace, Trace, TraceImpl
+
+
+class SynchronousMultiTracingProcessor(TracingProcessor):
+    """
+    Forwards all calls to a list of TracingProcessors, in order of registration.
+    """
+
+    def __init__(self):
+        # Using a tuple to avoid race conditions when iterating over processors
+        self._processors: tuple[TracingProcessor, ...] = ()
+        self._lock = threading.Lock()
+
+    def add_tracing_processor(self, tracing_processor: TracingProcessor):
+        """
+        Add a processor to the list of processors. Each processor will receive all traces/spans.
+        """
+        with self._lock:
+            self._processors += (tracing_processor,)
+
+    def set_processors(self, processors: list[TracingProcessor]):
+        """
+        Set the list of processors. This will replace the current list of processors.
+        """
+        with self._lock:
+            self._processors = tuple(processors)
+
+    def on_trace_start(self, trace: Trace) -> None:
+        """
+        Called when a trace is started.
+        """
+        for processor in self._processors:
+            processor.on_trace_start(trace)
+
+    def on_trace_end(self, trace: Trace) -> None:
+        """
+        Called when a trace is finished.
+        """
+        for processor in self._processors:
+            processor.on_trace_end(trace)
+
+    def on_span_start(self, span: Span[Any]) -> None:
+        """
+        Called when a span is started.
+        """
+        for processor in self._processors:
+            processor.on_span_start(span)
+
+    def on_span_end(self, span: Span[Any]) -> None:
+        """
+        Called when a span is finished.
+        """
+        for processor in self._processors:
+            processor.on_span_end(span)
+
+    def shutdown(self) -> None:
+        """
+        Called when the application stops.
+        """
+        for processor in self._processors:
+            logger.debug(f"Shutting down trace processor {processor}")
+            processor.shutdown()
+
+    def force_flush(self):
+        """
+        Force the processors to flush their buffers.
+        """
+        for processor in self._processors:
+            processor.force_flush()
+
+
+class TraceProvider:
+    def __init__(self):
+        self._multi_processor = SynchronousMultiTracingProcessor()
+        self._disabled = os.environ.get("OPENAI_AGENTS_DISABLE_TRACING", "false").lower() in (
+            "true",
+            "1",
+        )
+
+    def register_processor(self, processor: TracingProcessor):
+        """
+        Add a processor to the list of processors. Each processor will receive all traces/spans.
+        """
+        self._multi_processor.add_tracing_processor(processor)
+
+    def set_processors(self, processors: list[TracingProcessor]):
+        """
+        Set the list of processors. This will replace the current list of processors.
+        """
+        self._multi_processor.set_processors(processors)
+
+    def get_current_trace(self) -> Trace | None:
+        """
+        Returns the currently active trace, if any.
+        """
+        return Scope.get_current_trace()
+
+    def get_current_span(self) -> Span[Any] | None:
+        """
+        Returns the currently active span, if any.
+        """
+        return Scope.get_current_span()
+
+    def set_disabled(self, disabled: bool) -> None:
+        """
+        Set whether tracing is disabled.
+        """
+        self._disabled = disabled
+
+    def time_iso(self) -> str:
+        """Return the current time in ISO 8601 format."""
+        return datetime.now(timezone.utc).isoformat()
+
+    def gen_trace_id(self) -> str:
+        """Generate a new trace ID."""
+        return f"trace_{uuid.uuid4().hex}"
+
+    def gen_span_id(self) -> str:
+        """Generate a new span ID."""
+        return f"span_{uuid.uuid4().hex[:24]}"
+
+    def gen_group_id(self) -> str:
+        """Generate a new group ID."""
+        return f"group_{uuid.uuid4().hex[:24]}"
+
+    def create_trace(
+        self,
+        name: str,
+        trace_id: str | None = None,
+        group_id: str | None = None,
+        metadata: dict[str, Any] | None = None,
+        disabled: bool = False,
+    ) -> Trace:
+        """
+        Create a new trace.
+        """
+        if self._disabled or disabled:
+            logger.debug(f"Tracing is disabled. Not creating trace {name}")
+            return NoOpTrace()
+
+        trace_id = trace_id or self.gen_trace_id()
+
+        logger.debug(f"Creating trace {name} with id {trace_id}")
+
+        return TraceImpl(
+            name=name,
+            trace_id=trace_id,
+            group_id=group_id,
+            metadata=metadata,
+            processor=self._multi_processor,
+        )
+
+    def create_span(
+        self,
+        span_data: TSpanData,
+        span_id: str | None = None,
+        parent: Trace | Span[Any] | None = None,
+        disabled: bool = False,
+    ) -> Span[TSpanData]:
+        """
+        Create a span, or a NoOpSpan if tracing is disabled or no recordable parent exists.
+        """
+        if self._disabled or disabled:
+            logger.debug(f"Tracing is disabled. Not creating span {span_data}")
+            return NoOpSpan(span_data)
+
+        if not parent:
+            current_span = Scope.get_current_span()
+            current_trace = Scope.get_current_trace()
+            if current_trace is None:
+                logger.error(
+                    "No active trace. Make sure to start a trace with `trace()` first. "
+                    "Returning NoOpSpan."
+                )
+                return NoOpSpan(span_data)
+            elif isinstance(current_trace, NoOpTrace) or isinstance(current_span, NoOpSpan):
+                logger.debug(
+                    f"Parent {current_span} or {current_trace} is no-op, returning NoOpSpan"
+                )
+                return NoOpSpan(span_data)
+
+            parent_id = current_span.span_id if current_span else None
+            trace_id = current_trace.trace_id
+
+        elif isinstance(parent, Trace):
+            if isinstance(parent, NoOpTrace):
+                logger.debug(f"Parent {parent} is no-op, returning NoOpSpan")
+                return NoOpSpan(span_data)
+            trace_id = parent.trace_id
+            parent_id = None
+        elif isinstance(parent, Span):
+            if isinstance(parent, NoOpSpan):
+                logger.debug(f"Parent {parent} is no-op, returning NoOpSpan")
+                return NoOpSpan(span_data)
+            parent_id = parent.span_id
+            trace_id = parent.trace_id
+        # Resolve the ID before logging so the debug line shows the real span ID, not None.
+        span_id = span_id or self.gen_span_id()
+        logger.debug(f"Creating span {span_data} with id {span_id}")
+        return SpanImpl(
+            trace_id=trace_id,
+            span_id=span_id,
+            parent_id=parent_id,
+            processor=self._multi_processor,
+            span_data=span_data,
+        )
+
+    def shutdown(self) -> None:
+        if self._disabled:
+            return
+
+        try:
+            logger.debug("Shutting down trace provider")
+            self._multi_processor.shutdown()
+        except Exception as e:
+            logger.error(f"Error shutting down trace provider: {e}")
diff --git a/src/agents/tracing/setup.py b/src/agents/tracing/setup.py
index daa7b86d0..3a56b728f 100644
--- a/src/agents/tracing/setup.py
+++ b/src/agents/tracing/setup.py
@@ -1,238 +1,21 @@
 from __future__ import annotations
 
-import os
-import threading
-import uuid
-from datetime import datetime, timezone
-from typing import Any
+from typing import TYPE_CHECKING
 
-from ..logger import logger
-from . import util
-from .processor_interface import TracingProcessor
-from .scope import Scope
-from .spans import NoOpSpan, Span, SpanImpl, TSpanData
-from .traces import NoOpTrace, Trace, TraceImpl
+if TYPE_CHECKING:
+    from .provider import TraceProvider
 
-
-class SynchronousMultiTracingProcessor(TracingProcessor):
-    """
-    Forwards all calls to a list of TracingProcessors, in order of registration.
-    """
-
-    def __init__(self):
-        # Using a tuple to avoid race conditions when iterating over processors
-        self._processors: tuple[TracingProcessor, ...] = ()
-        self._lock = threading.Lock()
-
-    def add_tracing_processor(self, tracing_processor: TracingProcessor):
-        """
-        Add a processor to the list of processors. Each processor will receive all traces/spans.
-        """
-        with self._lock:
-            self._processors += (tracing_processor,)
-
-    def set_processors(self, processors: list[TracingProcessor]):
-        """
-        Set the list of processors. This will replace the current list of processors.
-        """
-        with self._lock:
-            self._processors = tuple(processors)
-
-    def on_trace_start(self, trace: Trace) -> None:
-        """
-        Called when a trace is started.
-        """
-        for processor in self._processors:
-            processor.on_trace_start(trace)
-
-    def on_trace_end(self, trace: Trace) -> None:
-        """
-        Called when a trace is finished.
-        """
-        for processor in self._processors:
-            processor.on_trace_end(trace)
-
-    def on_span_start(self, span: Span[Any]) -> None:
-        """
-        Called when a span is started.
-        """
-        for processor in self._processors:
-            processor.on_span_start(span)
-
-    def on_span_end(self, span: Span[Any]) -> None:
-        """
-        Called when a span is finished.
-        """
-        for processor in self._processors:
-            processor.on_span_end(span)
-
-    def shutdown(self) -> None:
-        """
-        Called when the application stops.
-        """
-        for processor in self._processors:
-            logger.debug(f"Shutting down trace processor {processor}")
-            processor.shutdown()
-
-    def force_flush(self):
-        """
-        Force the processors to flush their buffers.
-        """
-        for processor in self._processors:
-            processor.force_flush()
-
-
-class TraceProvider:
-    def __init__(self):
-        self._multi_processor = SynchronousMultiTracingProcessor()
-        self._disabled = os.environ.get("OPENAI_AGENTS_DISABLE_TRACING", "false").lower() in (
-            "true",
-            "1",
-        )
-
-    def register_processor(self, processor: TracingProcessor):
-        """
-        Add a processor to the list of processors. Each processor will receive all traces/spans.
-        """
-        self._multi_processor.add_tracing_processor(processor)
-
-    def set_processors(self, processors: list[TracingProcessor]):
-        """
-        Set the list of processors. This will replace the current list of processors.
-        """
-        self._multi_processor.set_processors(processors)
-
-    def get_current_trace(self) -> Trace | None:
-        """
-        Returns the currently active trace, if any.
-        """
-        return Scope.get_current_trace()
-
-    def get_current_span(self) -> Span[Any] | None:
-        """
-        Returns the currently active span, if any.
-        """
-        return Scope.get_current_span()
-
-    def set_disabled(self, disabled: bool) -> None:
-        """
-        Set whether tracing is disabled.
-        """
-        self._disabled = disabled
-
-    def time_iso(self) -> str:
-        """Return the current time in ISO 8601 format."""
-        return datetime.now(timezone.utc).isoformat()
-
-    def gen_trace_id(self) -> str:
-        """Generate a new trace ID."""
-        return f"trace_{uuid.uuid4().hex}"
-
-    def gen_span_id(self) -> str:
-        """Generate a new span ID."""
-        return f"span_{uuid.uuid4().hex[:24]}"
-
-    def gen_group_id(self) -> str:
-        """Generate a new group ID."""
-        return f"group_{uuid.uuid4().hex[:24]}"
-
-    def create_trace(
-        self,
-        name: str,
-        trace_id: str | None = None,
-        group_id: str | None = None,
-        metadata: dict[str, Any] | None = None,
-        disabled: bool = False,
-    ) -> Trace:
-        """
-        Create a new trace.
-        """
-        if self._disabled or disabled:
-            logger.debug(f"Tracing is disabled. Not creating trace {name}")
-            return NoOpTrace()
-
-        trace_id = trace_id or util.gen_trace_id()
-
-        logger.debug(f"Creating trace {name} with id {trace_id}")
-
-        return TraceImpl(
-            name=name,
-            trace_id=trace_id,
-            group_id=group_id,
-            metadata=metadata,
-            processor=self._multi_processor,
-        )
-
-    def create_span(
-        self,
-        span_data: TSpanData,
-        span_id: str | None = None,
-        parent: Trace | Span[Any] | None = None,
-        disabled: bool = False,
-    ) -> Span[TSpanData]:
-        """
-        Create a new span.
-        """
-        if self._disabled or disabled:
-            logger.debug(f"Tracing is disabled. Not creating span {span_data}")
-            return NoOpSpan(span_data)
-
-        if not parent:
-            current_span = Scope.get_current_span()
-            current_trace = Scope.get_current_trace()
-            if current_trace is None:
-                logger.error(
-                    "No active trace. Make sure to start a trace with `trace()` first"
-                    "Returning NoOpSpan."
-                )
-                return NoOpSpan(span_data)
-            elif isinstance(current_trace, NoOpTrace) or isinstance(current_span, NoOpSpan):
-                logger.debug(
-                    f"Parent {current_span} or {current_trace} is no-op, returning NoOpSpan"
-                )
-                return NoOpSpan(span_data)
-
-            parent_id = current_span.span_id if current_span else None
-            trace_id = current_trace.trace_id
-
-        elif isinstance(parent, Trace):
-            if isinstance(parent, NoOpTrace):
-                logger.debug(f"Parent {parent} is no-op, returning NoOpSpan")
-                return NoOpSpan(span_data)
-            trace_id = parent.trace_id
-            parent_id = None
-        elif isinstance(parent, Span):
-            if isinstance(parent, NoOpSpan):
-                logger.debug(f"Parent {parent} is no-op, returning NoOpSpan")
-                return NoOpSpan(span_data)
-            parent_id = parent.span_id
-            trace_id = parent.trace_id
-
-        logger.debug(f"Creating span {span_data} with id {span_id}")
-
-        return SpanImpl(
-            trace_id=trace_id,
-            span_id=span_id,
-            parent_id=parent_id,
-            processor=self._multi_processor,
-            span_data=span_data,
-        )
-
-    def shutdown(self) -> None:
-        if self._disabled:
-            return
-
-        try:
-            logger.debug("Shutting down trace provider")
-            self._multi_processor.shutdown()
-        except Exception as e:
-            logger.error(f"Error shutting down trace provider: {e}")
-
-
-GLOBAL_TRACE_PROVIDER = TraceProvider()
+GLOBAL_TRACE_PROVIDER: TraceProvider | None = None
 
 
 def set_trace_provider(provider: TraceProvider) -> None:
     """Set the global trace provider used by tracing utilities."""
     global GLOBAL_TRACE_PROVIDER
     GLOBAL_TRACE_PROVIDER = provider
+
+
+def get_trace_provider() -> TraceProvider:
+    """Get the global trace provider used by tracing utilities."""
+    if GLOBAL_TRACE_PROVIDER is None:
+        raise RuntimeError("Trace provider not set")
+    return GLOBAL_TRACE_PROVIDER
diff --git a/src/agents/tracing/spans.py b/src/agents/tracing/spans.py
index ee933e730..129c468df 100644
--- a/src/agents/tracing/spans.py
+++ b/src/agents/tracing/spans.py
@@ -178,7 +178,7 @@ def __init__(
         span_data: TSpanData,
     ):
         self._trace_id = trace_id
-        self._span_id = span_id or util.gen_span_id()
+        self._span_id = span_id
         self._parent_id = parent_id
         self._started_at: str | None = None
         self._ended_at: str | None = None
diff --git a/src/agents/tracing/util.py b/src/agents/tracing/util.py
index af2f5ff32..7f436d019 100644
--- a/src/agents/tracing/util.py
+++ b/src/agents/tracing/util.py
@@ -1,21 +1,21 @@
-from .setup import GLOBAL_TRACE_PROVIDER
+from .setup import get_trace_provider
 
 
 def time_iso() -> str:
     """Return the current time in ISO 8601 format."""
-    return GLOBAL_TRACE_PROVIDER.time_iso()
+    return get_trace_provider().time_iso()
 
 
 def gen_trace_id() -> str:
     """Generate a new trace ID."""
-    return GLOBAL_TRACE_PROVIDER.gen_trace_id()
+    return get_trace_provider().gen_trace_id()
 
 
 def gen_span_id() -> str:
     """Generate a new span ID."""
-    return GLOBAL_TRACE_PROVIDER.gen_span_id()
+    return get_trace_provider().gen_span_id()
 
 
 def gen_group_id() -> str:
     """Generate a new group ID."""
-    return GLOBAL_TRACE_PROVIDER.gen_group_id()
+    return get_trace_provider().gen_group_id()
diff --git a/tests/conftest.py b/tests/conftest.py
index 622b61b14..f87e85594 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -7,7 +7,7 @@
 from agents.models.openai_responses import OpenAIResponsesModel
 from agents.run import set_default_runner
 from agents.tracing import set_trace_processors
-from agents.tracing.setup import GLOBAL_TRACE_PROVIDER
+from agents.tracing.setup import get_trace_provider
 
 from .testing_processor import SPAN_PROCESSOR_TESTING
 
@@ -43,7 +43,7 @@ def clear_default_runner():
 @pytest.fixture(autouse=True, scope="session")
 def shutdown_trace_provider():
     yield
-    GLOBAL_TRACE_PROVIDER.shutdown()
+    get_trace_provider().shutdown()
 
 
 @pytest.fixture(autouse=True)

From 27646ee1c31dc191f1cf1268563de8ca6c6f111b Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Wed, 21 May 2025 09:54:06 -0700
Subject: [PATCH 08/22] LLM: tracing/spans: generate span_id if not provided in
 SpanImpl constructor

---
 src/agents/tracing/spans.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/agents/tracing/spans.py b/src/agents/tracing/spans.py
index 129c468df..ee933e730 100644
--- a/src/agents/tracing/spans.py
+++ b/src/agents/tracing/spans.py
@@ -178,7 +178,7 @@ def __init__(
         span_data: TSpanData,
     ):
         self._trace_id = trace_id
-        self._span_id = span_id
+        self._span_id = span_id or util.gen_span_id()
         self._parent_id = parent_id
         self._started_at: str | None = None
         self._ended_at: str | None = None

From caf30b9694ac99fd654560229f6c9cdb55ecee13 Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Wed, 11 Jun 2025 10:40:24 -0700
Subject: [PATCH 09/22] tracing: introduce TraceProvider interface and
 DefaultTraceProvider implementation

- Add abstract TraceProvider base class to define tracing API
- Move default tracing logic to DefaultTraceProvider
- Update __init__.py to export both TraceProvider and DefaultTraceProvider, and use DefaultTraceProvider as default
- Aligns span/trace management and enables alternative provider implementations
---
 src/agents/tracing/__init__.py |  5 ++-
 src/agents/tracing/provider.py | 70 +++++++++++++++++++++++++++++++++-
 2 files changed, 71 insertions(+), 4 deletions(-)

diff --git a/src/agents/tracing/__init__.py b/src/agents/tracing/__init__.py
index 4281c29ff..e80aac46d 100644
--- a/src/agents/tracing/__init__.py
+++ b/src/agents/tracing/__init__.py
@@ -1,6 +1,6 @@
 import atexit
 
-from agents.tracing.provider import TraceProvider
+from agents.tracing.provider import DefaultTraceProvider, TraceProvider
 
 from .create import (
     agent_span,
@@ -70,6 +70,7 @@
     "SpeechSpanData",
     "TranscriptionSpanData",
     "TracingProcessor",
+    "TraceProvider",
     "gen_trace_id",
     "gen_span_id",
     "speech_group_span",
@@ -107,7 +108,7 @@ def set_tracing_export_api_key(api_key: str) -> None:
     default_exporter().set_api_key(api_key)
 
 
-set_trace_provider(TraceProvider())
+set_trace_provider(DefaultTraceProvider())
 # Add the default processor, which exports traces and spans to the backend in batches. You can
 # change the default behavior by either:
 # 1. calling add_trace_processor(), which adds additional processors, or
diff --git a/src/agents/tracing/provider.py b/src/agents/tracing/provider.py
index b9f4c63e9..38d3b7ab3 100644
--- a/src/agents/tracing/provider.py
+++ b/src/agents/tracing/provider.py
@@ -3,6 +3,7 @@
 import os
 import threading
 import uuid
+from abc import ABC, abstractmethod
 from datetime import datetime, timezone
 from typing import Any
 
@@ -81,8 +82,73 @@ def force_flush(self):
             processor.force_flush()
 
 
-class TraceProvider:
-    def __init__(self):
+class TraceProvider(ABC):
+    """Interface for creating traces and spans."""
+
+    @abstractmethod
+    def register_processor(self, processor: TracingProcessor) -> None:
+        """Add a processor that will receive all traces and spans."""
+
+    @abstractmethod
+    def set_processors(self, processors: list[TracingProcessor]) -> None:
+        """Replace the list of processors with ``processors``."""
+
+    @abstractmethod
+    def get_current_trace(self) -> Trace | None:
+        """Return the currently active trace, if any."""
+
+    @abstractmethod
+    def get_current_span(self) -> Span[Any] | None:
+        """Return the currently active span, if any."""
+
+    @abstractmethod
+    def set_disabled(self, disabled: bool) -> None:
+        """Enable or disable tracing globally."""
+
+    @abstractmethod
+    def time_iso(self) -> str:
+        """Return the current time in ISO 8601 format."""
+
+    @abstractmethod
+    def gen_trace_id(self) -> str:
+        """Generate a new trace identifier."""
+
+    @abstractmethod
+    def gen_span_id(self) -> str:
+        """Generate a new span identifier."""
+
+    @abstractmethod
+    def gen_group_id(self) -> str:
+        """Generate a new group identifier."""
+
+    @abstractmethod
+    def create_trace(
+        self,
+        name: str,
+        trace_id: str | None = None,
+        group_id: str | None = None,
+        metadata: dict[str, Any] | None = None,
+        disabled: bool = False,
+    ) -> Trace:
+        """Create a new trace."""
+
+    @abstractmethod
+    def create_span(
+        self,
+        span_data: TSpanData,
+        span_id: str | None = None,
+        parent: Trace | Span[Any] | None = None,
+        disabled: bool = False,
+    ) -> Span[TSpanData]:
+        """Create a new span."""
+
+    @abstractmethod
+    def shutdown(self) -> None:
+        """Clean up any resources used by the provider."""
+
+
+class DefaultTraceProvider(TraceProvider):
+    def __init__(self) -> None:
         self._multi_processor = SynchronousMultiTracingProcessor()
         self._disabled = os.environ.get("OPENAI_AGENTS_DISABLE_TRACING", "false").lower() in (
             "true",

From 9538c8166b838b36b624d444c16a9027d4f1e291 Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Wed, 11 Jun 2025 10:46:03 -0700
Subject: [PATCH 10/22] run.py: call _get_all_tools as DefaultRunner class
 method instead of via cls

---
 src/agents/run.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/agents/run.py b/src/agents/run.py
index 1feebbd77..1012792c9 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -382,7 +382,7 @@ async def _run_impl(
 
             try:
                 while True:
-                    all_tools = await cls._get_all_tools(current_agent, context_wrapper)
+                    all_tools = await DefaultRunner._get_all_tools(current_agent, context_wrapper)
 
                     # Start an agent span if we don't have one. This span is ended if the current
                     # agent changes, or if the agent loop ends.

From 9f7934a4ceb3a473fb8945067b7cf74e9ed4b957 Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Wed, 11 Jun 2025 10:59:19 -0700
Subject: [PATCH 11/22] agents: add get_default_runner and ensure
 DEFAULT_RUNNER is always initialized

- Add get_default_runner to retrieve current default runner.
- Always assign DEFAULT_RUNNER to a DefaultRunner at module init.
- Replace fallback logic (`DEFAULT_RUNNER or DefaultRunner()`) with direct use of initialized DEFAULT_RUNNER.
- Update __all__ in __init__.py to export get_default_runner.
- Add get_trace_provider to __all__ in tracing/__init__.py for consistency.
---
 src/agents/__init__.py         |  1 +
 src/agents/run.py              | 20 +++++++++++++++-----
 src/agents/tracing/__init__.py |  1 +
 3 files changed, 17 insertions(+), 5 deletions(-)

diff --git a/src/agents/__init__.py b/src/agents/__init__.py
index 332b97d2b..afa578b5e 100644
--- a/src/agents/__init__.py
+++ b/src/agents/__init__.py
@@ -241,6 +241,7 @@ def enable_verbose_stdout_logging():
     "generation_span",
     "get_current_span",
     "get_current_trace",
+    "get_default_runner",
     "guardrail_span",
     "handoff_span",
     "set_trace_processors",
diff --git a/src/agents/run.py b/src/agents/run.py
index 1012792c9..b44afa12e 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -47,7 +47,8 @@
 from .util import _coro, _error_tracing
 
 DEFAULT_MAX_TURNS = 10
-DEFAULT_RUNNER: Runner | None = None
+DEFAULT_RUNNER: Runner = None # type: ignore
+# assigned at the end of the module initialization
 
 
 def set_default_runner(runner: Runner | None) -> None:
@@ -55,7 +56,14 @@ def set_default_runner(runner: Runner | None) -> None:
     Set the default runner to use for the agent run.
     """
     global DEFAULT_RUNNER
-    DEFAULT_RUNNER = runner
+    DEFAULT_RUNNER = runner or DefaultRunner()
+
+def get_default_runner() -> Runner | None:
+    """
+    Get the default runner to use for the agent run.
+    """
+    global DEFAULT_RUNNER
+    return DEFAULT_RUNNER
 
 
 @dataclass
@@ -197,7 +205,7 @@ async def run(
             A run result containing all the inputs, guardrail results and the output of the last
             agent. Agents may perform handoffs, so we don't know the specific type of the output.
         """
-        runner = DEFAULT_RUNNER or DefaultRunner()
+        runner = DEFAULT_RUNNER
         return await runner._run_impl(
             starting_agent,
             input,
@@ -249,7 +257,7 @@ def run_sync(
             A run result containing all the inputs, guardrail results and the output of the last
             agent. Agents may perform handoffs, so we don't know the specific type of the output.
         """
-        runner = DEFAULT_RUNNER or DefaultRunner()
+        runner = DEFAULT_RUNNER
         return runner._run_sync_impl(
             starting_agent,
             input,
@@ -297,7 +305,7 @@ def run_streamed(
         Returns:
             A result object that contains data about the run, as well as a method to stream events.
         """
-        runner = DEFAULT_RUNNER or DefaultRunner()
+        runner = DEFAULT_RUNNER
         return runner._run_streamed_impl(
             starting_agent,
             input,
@@ -1130,3 +1138,5 @@ def _get_model(cls, agent: Agent[Any], run_config: RunConfig) -> Model:
             return agent.model
 
         return run_config.model_provider.get_model(agent.model)
+
+DEFAULT_RUNNER = DefaultRunner()
diff --git a/src/agents/tracing/__init__.py b/src/agents/tracing/__init__.py
index e80aac46d..64b0bd71f 100644
--- a/src/agents/tracing/__init__.py
+++ b/src/agents/tracing/__init__.py
@@ -47,6 +47,7 @@
     "generation_span",
     "get_current_span",
     "get_current_trace",
+    "get_trace_provider",
     "guardrail_span",
     "handoff_span",
     "response_span",

From b25beb649509f67923b0c099548eea860c0f99ea Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Wed, 11 Jun 2025 11:30:51 -0700
Subject: [PATCH 12/22] runner: remove unused helper methods from Runner class

---
 src/agents/run.py | 33 +--------------------------------
 1 file changed, 1 insertion(+), 32 deletions(-)

diff --git a/src/agents/run.py b/src/agents/run.py
index b44afa12e..6fc3fde69 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -316,37 +316,6 @@ def run_streamed(
             previous_response_id=previous_response_id,
         )
 
-    @classmethod
-    def _get_output_schema(cls, agent: Agent[Any]) -> AgentOutputSchemaBase | None:
-        if agent.output_type is None or agent.output_type is str:
-            return None
-        elif isinstance(agent.output_type, AgentOutputSchemaBase):
-            return agent.output_type
-
-        return AgentOutputSchema(agent.output_type)
-
-    @classmethod
-    def _get_handoffs(cls, agent: Agent[Any]) -> list[Handoff]:
-        handoffs = []
-        for handoff_item in agent.handoffs:
-            if isinstance(handoff_item, Handoff):
-                handoffs.append(handoff_item)
-            elif isinstance(handoff_item, Agent):
-                handoffs.append(handoff(handoff_item))
-        return handoffs
-
-    @classmethod
-    def _get_model(cls, agent: Agent[Any], run_config: RunConfig) -> Model:
-        if isinstance(run_config.model, Model):
-            return run_config.model
-        elif isinstance(run_config.model, str):
-            return run_config.model_provider.get_model(run_config.model)
-        elif isinstance(agent.model, Model):
-            return agent.model
-
-        return run_config.model_provider.get_model(agent.model)
-
-
 class DefaultRunner(Runner):
     async def _run_impl(
         self,
@@ -390,7 +359,7 @@ async def _run_impl(
 
             try:
                 while True:
-                    all_tools = await DefaultRunner._get_all_tools(current_agent, context_wrapper)
+                    all_tools = await self._get_all_tools(current_agent, context_wrapper)
 
                     # Start an agent span if we don't have one. This span is ended if the current
                     # agent changes, or if the agent loop ends.

From 83251c385483cfdf89121ecf313880f6076f8917 Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Wed, 11 Jun 2025 11:34:25 -0700
Subject: [PATCH 13/22] move utility methods (_get_output_schema,
 _get_handoffs, _get_all_tools, _get_model) from DefaultRunner to Runner base
 class

---
 src/agents/run.py | 72 ++++++++++++++++++++++++-----------------------
 1 file changed, 37 insertions(+), 35 deletions(-)

diff --git a/src/agents/run.py b/src/agents/run.py
index 6fc3fde69..1c301cb00 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -316,6 +316,43 @@ def run_streamed(
             previous_response_id=previous_response_id,
         )
 
+
+    @classmethod
+    def _get_output_schema(cls, agent: Agent[Any]) -> AgentOutputSchemaBase | None:
+        if agent.output_type is None or agent.output_type is str:
+            return None
+        elif isinstance(agent.output_type, AgentOutputSchemaBase):
+            return agent.output_type
+
+        return AgentOutputSchema(agent.output_type)
+
+    @classmethod
+    def _get_handoffs(cls, agent: Agent[Any]) -> list[Handoff]:
+        handoffs = []
+        for handoff_item in agent.handoffs:
+            if isinstance(handoff_item, Handoff):
+                handoffs.append(handoff_item)
+            elif isinstance(handoff_item, Agent):
+                handoffs.append(handoff(handoff_item))
+        return handoffs
+
+    @classmethod
+    async def _get_all_tools(
+        cls, agent: Agent[Any], context_wrapper: RunContextWrapper[Any]
+    ) -> list[Tool]:
+        return await agent.get_all_tools(context_wrapper)
+
+    @classmethod
+    def _get_model(cls, agent: Agent[Any], run_config: RunConfig) -> Model:
+        if isinstance(run_config.model, Model):
+            return run_config.model
+        elif isinstance(run_config.model, str):
+            return run_config.model_provider.get_model(run_config.model)
+        elif isinstance(agent.model, Model):
+            return agent.model
+
+        return run_config.model_provider.get_model(agent.model)
+
 class DefaultRunner(Runner):
     async def _run_impl(
         self,
@@ -1072,40 +1109,5 @@ async def _get_new_response(
 
         return new_response
 
-    @classmethod
-    def _get_output_schema(cls, agent: Agent[Any]) -> AgentOutputSchemaBase | None:
-        if agent.output_type is None or agent.output_type is str:
-            return None
-        elif isinstance(agent.output_type, AgentOutputSchemaBase):
-            return agent.output_type
-
-        return AgentOutputSchema(agent.output_type)
-
-    @classmethod
-    def _get_handoffs(cls, agent: Agent[Any]) -> list[Handoff]:
-        handoffs = []
-        for handoff_item in agent.handoffs:
-            if isinstance(handoff_item, Handoff):
-                handoffs.append(handoff_item)
-            elif isinstance(handoff_item, Agent):
-                handoffs.append(handoff(handoff_item))
-        return handoffs
-
-    @classmethod
-    async def _get_all_tools(
-        cls, agent: Agent[Any], context_wrapper: RunContextWrapper[Any]
-    ) -> list[Tool]:
-        return await agent.get_all_tools(context_wrapper)
-
-    @classmethod
-    def _get_model(cls, agent: Agent[Any], run_config: RunConfig) -> Model:
-        if isinstance(run_config.model, Model):
-            return run_config.model
-        elif isinstance(run_config.model, str):
-            return run_config.model_provider.get_model(run_config.model)
-        elif isinstance(agent.model, Model):
-            return agent.model
-
-        return run_config.model_provider.get_model(agent.model)
 
 DEFAULT_RUNNER = DefaultRunner()

From 0ba33c4f8b508dd26ec8e7f966229147cab98ac1 Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Tue, 17 Jun 2025 08:48:51 -0700
Subject: [PATCH 14/22] Introduce AgentRunner class (#886)

## Summary
- rename DefaultRunner to DefaultAgentRunner and extend new AgentRunner
base
- remove `set_default_runner`/`get_default_runner` helpers
- rename abstract methods on AgentRunner (no underscore)
- remove the default-runner test fixture and tests/test_run.py; update imports for new API

## Testing
- `make format`
- `make lint`
- `make mypy`
- `make tests`


------
https://chatgpt.com/codex/tasks/task_i_6851851acce8832099adc70d8197016c
---
 src/agents/__init__.py |   7 +--
 src/agents/run.py      | 131 +++++++++++++++++++----------------------
 tests/conftest.py      |   6 --
 tests/test_run.py      |  26 --------
 4 files changed, 64 insertions(+), 106 deletions(-)
 delete mode 100644 tests/test_run.py

diff --git a/src/agents/__init__.py b/src/agents/__init__.py
index afa578b5e..d2e0857e5 100644
--- a/src/agents/__init__.py
+++ b/src/agents/__init__.py
@@ -47,7 +47,7 @@
 from .models.openai_responses import OpenAIResponsesModel
 from .repl import run_demo_loop
 from .result import RunResult, RunResultStreaming
-from .run import DefaultRunner, RunConfig, Runner, set_default_runner
+from .run import AgentRunner, DefaultAgentRunner, RunConfig, Runner
 from .run_context import RunContextWrapper, TContext
 from .stream_events import (
     AgentUpdatedStreamEvent,
@@ -162,7 +162,8 @@ def enable_verbose_stdout_logging():
     "ToolsToFinalOutputFunction",
     "ToolsToFinalOutputResult",
     "Runner",
-    "DefaultRunner",
+    "AgentRunner",
+    "DefaultAgentRunner",
     "run_demo_loop",
     "Model",
     "ModelProvider",
@@ -241,7 +242,6 @@ def enable_verbose_stdout_logging():
     "generation_span",
     "get_current_span",
     "get_current_trace",
-    "get_default_runner",
     "guardrail_span",
     "handoff_span",
     "set_trace_processors",
@@ -270,7 +270,6 @@ def enable_verbose_stdout_logging():
     "set_default_openai_key",
     "set_default_openai_client",
     "set_default_openai_api",
-    "set_default_runner",
     "set_tracing_export_api_key",
     "enable_verbose_stdout_logging",
     "gen_trace_id",
diff --git a/src/agents/run.py b/src/agents/run.py
index 1c301cb00..ce48d1dc7 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -4,9 +4,10 @@
 import asyncio
 import copy
 from dataclasses import dataclass, field
-from typing import Any, cast
+from typing import Any, Generic, cast
 
 from openai.types.responses import ResponseCompletedEvent
+from typing_extensions import TypedDict, Unpack
 
 from ._run_impl import (
     AgentToolUseTracker,
@@ -47,23 +48,6 @@
 from .util import _coro, _error_tracing
 
 DEFAULT_MAX_TURNS = 10
-DEFAULT_RUNNER: Runner = None # type: ignore
-# assigned at the end of the module initialization
-
-
-def set_default_runner(runner: Runner | None) -> None:
-    """
-    Set the default runner to use for the agent run.
-    """
-    global DEFAULT_RUNNER
-    DEFAULT_RUNNER = runner or DefaultRunner()
-
-def get_default_runner() -> Runner | None:
-    """
-    Get the default runner to use for the agent run.
-    """
-    global DEFAULT_RUNNER
-    return DEFAULT_RUNNER
 
 
 @dataclass
@@ -125,48 +109,57 @@ class RunConfig:
     """
 
 
-class Runner(abc.ABC):
+class AgentRunnerParams(TypedDict, Generic[TContext]):
+    """Arguments for ``AgentRunner`` methods."""
+
+    context: TContext | None
+    """The context for the run."""
+
+    max_turns: int
+    """The maximum number of turns to run for."""
+
+    hooks: RunHooks[TContext] | None
+    """Lifecycle hooks for the run."""
+
+    run_config: RunConfig | None
+    """Run configuration."""
+
+    previous_response_id: str | None
+    """The ID of the previous response, if any."""
+
+
+class AgentRunner(abc.ABC):
     @abc.abstractmethod
-    async def _run_impl(
+    async def run(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
-        *,
-        context: TContext | None = None,
-        max_turns: int = DEFAULT_MAX_TURNS,
-        hooks: RunHooks[TContext] | None = None,
-        run_config: RunConfig | None = None,
-        previous_response_id: str | None = None,
+        **kwargs: Unpack[AgentRunnerParams[TContext]],
     ) -> RunResult:
         pass
 
     @abc.abstractmethod
-    def _run_sync_impl(
+    def run_sync(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
-        *,
-        context: TContext | None = None,
-        max_turns: int = DEFAULT_MAX_TURNS,
-        hooks: RunHooks[TContext] | None = None,
-        run_config: RunConfig | None = None,
-        previous_response_id: str | None = None,
+        **kwargs: Unpack[AgentRunnerParams[TContext]],
     ) -> RunResult:
         pass
 
     @abc.abstractmethod
-    def _run_streamed_impl(
+    def run_streamed(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
-        context: TContext | None = None,
-        max_turns: int = DEFAULT_MAX_TURNS,
-        hooks: RunHooks[TContext] | None = None,
-        run_config: RunConfig | None = None,
-        previous_response_id: str | None = None,
+        **kwargs: Unpack[AgentRunnerParams[TContext]],
     ) -> RunResultStreaming:
         pass
 
+
+class Runner:
+    pass
+
     @classmethod
     async def run(
         cls,
@@ -205,8 +198,8 @@ async def run(
             A run result containing all the inputs, guardrail results and the output of the last
             agent. Agents may perform handoffs, so we don't know the specific type of the output.
         """
-        runner = DEFAULT_RUNNER
-        return await runner._run_impl(
+        runner = DefaultAgentRunner()
+        return await runner.run(
             starting_agent,
             input,
             context=context,
@@ -257,8 +250,8 @@ def run_sync(
             A run result containing all the inputs, guardrail results and the output of the last
             agent. Agents may perform handoffs, so we don't know the specific type of the output.
         """
-        runner = DEFAULT_RUNNER
-        return runner._run_sync_impl(
+        runner = DefaultAgentRunner()
+        return runner.run_sync(
             starting_agent,
             input,
             context=context,
@@ -305,8 +298,8 @@ def run_streamed(
         Returns:
             A result object that contains data about the run, as well as a method to stream events.
         """
-        runner = DEFAULT_RUNNER
-        return runner._run_streamed_impl(
+        runner = DefaultAgentRunner()
+        return runner.run_streamed(
             starting_agent,
             input,
             context=context,
@@ -316,7 +309,6 @@ def run_streamed(
             previous_response_id=previous_response_id,
         )
 
-
     @classmethod
     def _get_output_schema(cls, agent: Agent[Any]) -> AgentOutputSchemaBase | None:
         if agent.output_type is None or agent.output_type is str:
@@ -353,18 +345,19 @@ def _get_model(cls, agent: Agent[Any], run_config: RunConfig) -> Model:
 
         return run_config.model_provider.get_model(agent.model)
 
-class DefaultRunner(Runner):
-    async def _run_impl(
+
+class DefaultAgentRunner(AgentRunner, Runner):
+    async def run(  # type: ignore[override]
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
-        *,
-        context: TContext | None = None,
-        max_turns: int = DEFAULT_MAX_TURNS,
-        hooks: RunHooks[TContext] | None = None,
-        run_config: RunConfig | None = None,
-        previous_response_id: str | None = None,
+        **kwargs: Unpack[AgentRunnerParams[TContext]],
     ) -> RunResult:
+        context = kwargs.get("context")
+        max_turns = kwargs.get("max_turns", DEFAULT_MAX_TURNS)
+        hooks = kwargs.get("hooks")
+        run_config = kwargs.get("run_config")
+        previous_response_id = kwargs.get("previous_response_id")
         if hooks is None:
             hooks = RunHooks[Any]()
         if run_config is None:
@@ -514,17 +507,17 @@ async def _run_impl(
                 if current_span:
                     current_span.finish(reset_current=True)
 
-    def _run_sync_impl(
+    def run_sync(  # type: ignore[override]
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
-        *,
-        context: TContext | None = None,
-        max_turns: int = DEFAULT_MAX_TURNS,
-        hooks: RunHooks[TContext] | None = None,
-        run_config: RunConfig | None = None,
-        previous_response_id: str | None = None,
+        **kwargs: Unpack[AgentRunnerParams[TContext]],
     ) -> RunResult:
+        context = kwargs.get("context")
+        max_turns = kwargs.get("max_turns", DEFAULT_MAX_TURNS)
+        hooks = kwargs.get("hooks")
+        run_config = kwargs.get("run_config")
+        previous_response_id = kwargs.get("previous_response_id")
         return asyncio.get_event_loop().run_until_complete(
             self.run(
                 starting_agent,
@@ -537,16 +530,17 @@ def _run_sync_impl(
             )
         )
 
-    def _run_streamed_impl(
+    def run_streamed(  # type: ignore[override]
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
-        context: TContext | None = None,
-        max_turns: int = DEFAULT_MAX_TURNS,
-        hooks: RunHooks[TContext] | None = None,
-        run_config: RunConfig | None = None,
-        previous_response_id: str | None = None,
+        **kwargs: Unpack[AgentRunnerParams[TContext]],
     ) -> RunResultStreaming:
+        context = kwargs.get("context")
+        max_turns = kwargs.get("max_turns", DEFAULT_MAX_TURNS)
+        hooks = kwargs.get("hooks")
+        run_config = kwargs.get("run_config")
+        previous_response_id = kwargs.get("previous_response_id")
         if hooks is None:
             hooks = RunHooks[Any]()
         if run_config is None:
@@ -1108,6 +1102,3 @@ async def _get_new_response(
         context_wrapper.usage.add(new_response.usage)
 
         return new_response
-
-
-DEFAULT_RUNNER = DefaultRunner()
diff --git a/tests/conftest.py b/tests/conftest.py
index f87e85594..7527e11b8 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -5,7 +5,6 @@
 from agents.models import _openai_shared
 from agents.models.openai_chatcompletions import OpenAIChatCompletionsModel
 from agents.models.openai_responses import OpenAIResponsesModel
-from agents.run import set_default_runner
 from agents.tracing import set_trace_processors
 from agents.tracing.setup import get_trace_provider
 
@@ -34,11 +33,6 @@ def clear_openai_settings():
     _openai_shared._use_responses_by_default = True
 
 
-@pytest.fixture(autouse=True)
-def clear_default_runner():
-    set_default_runner(None)
-
-
 # This fixture will run after all tests end
 @pytest.fixture(autouse=True, scope="session")
 def shutdown_trace_provider():
diff --git a/tests/test_run.py b/tests/test_run.py
deleted file mode 100644
index 57e33d50d..000000000
--- a/tests/test_run.py
+++ /dev/null
@@ -1,26 +0,0 @@
-from __future__ import annotations
-
-from unittest import mock
-
-import pytest
-
-from agents import Agent, Runner
-from agents.run import set_default_runner
-
-from .fake_model import FakeModel
-
-
-@pytest.mark.asyncio
-async def test_static_run_methods_call_into_default_runner() -> None:
-    runner = mock.Mock(spec=Runner)
-    set_default_runner(runner)
-
-    agent = Agent(name="test", model=FakeModel())
-    await Runner.run(agent, input="test")
-    runner._run_impl.assert_called_once()
-
-    Runner.run_streamed(agent, input="test")
-    runner._run_streamed_impl.assert_called_once()
-
-    Runner.run_sync(agent, input="test")
-    runner._run_sync_impl.assert_called_once()

From 1d5537c923e6f694a95786a4a01aab0e4071074d Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Tue, 17 Jun 2025 09:10:35 -0700
Subject: [PATCH 15/22] cleanup

---
 src/agents/run.py                 | 108 +++++++++++++++---------------
 src/agents/tool_context.py        |   1 +
 tests/models/test_map.py          |   9 +--
 tests/test_agent_config.py        |  11 +--
 tests/test_handoff_tool.py        |  10 +--
 tests/test_output_tool.py         |  16 ++---
 tests/test_run_config.py          |   2 +-
 tests/test_run_step_execution.py  |   6 +-
 tests/test_run_step_processing.py |  11 +--
 9 files changed, 90 insertions(+), 84 deletions(-)

diff --git a/src/agents/run.py b/src/agents/run.py
index ce48d1dc7..5c273b8b9 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -109,7 +109,7 @@ class RunConfig:
     """
 
 
-class AgentRunnerParams(TypedDict, Generic[TContext]):
+class RunOptions(TypedDict, Generic[TContext]):
     """Arguments for ``AgentRunner`` methods."""
 
     context: TContext | None
@@ -134,7 +134,7 @@ async def run(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
-        **kwargs: Unpack[AgentRunnerParams[TContext]],
+        **kwargs: Unpack[RunOptions[TContext]],
     ) -> RunResult:
         pass
 
@@ -143,7 +143,7 @@ def run_sync(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
-        **kwargs: Unpack[AgentRunnerParams[TContext]],
+        **kwargs: Unpack[RunOptions[TContext]],
     ) -> RunResult:
         pass
 
@@ -152,14 +152,12 @@ def run_streamed(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
-        **kwargs: Unpack[AgentRunnerParams[TContext]],
+        **kwargs: Unpack[RunOptions[TContext]],
     ) -> RunResultStreaming:
         pass
 
 
 class Runner:
-    pass
-
     @classmethod
     async def run(
         cls,
@@ -309,49 +307,13 @@ def run_streamed(
             previous_response_id=previous_response_id,
         )
 
-    @classmethod
-    def _get_output_schema(cls, agent: Agent[Any]) -> AgentOutputSchemaBase | None:
-        if agent.output_type is None or agent.output_type is str:
-            return None
-        elif isinstance(agent.output_type, AgentOutputSchemaBase):
-            return agent.output_type
-
-        return AgentOutputSchema(agent.output_type)
-
-    @classmethod
-    def _get_handoffs(cls, agent: Agent[Any]) -> list[Handoff]:
-        handoffs = []
-        for handoff_item in agent.handoffs:
-            if isinstance(handoff_item, Handoff):
-                handoffs.append(handoff_item)
-            elif isinstance(handoff_item, Agent):
-                handoffs.append(handoff(handoff_item))
-        return handoffs
 
-    @classmethod
-    async def _get_all_tools(
-        cls, agent: Agent[Any], context_wrapper: RunContextWrapper[Any]
-    ) -> list[Tool]:
-        return await agent.get_all_tools(context_wrapper)
-
-    @classmethod
-    def _get_model(cls, agent: Agent[Any], run_config: RunConfig) -> Model:
-        if isinstance(run_config.model, Model):
-            return run_config.model
-        elif isinstance(run_config.model, str):
-            return run_config.model_provider.get_model(run_config.model)
-        elif isinstance(agent.model, Model):
-            return agent.model
-
-        return run_config.model_provider.get_model(agent.model)
-
-
-class DefaultAgentRunner(AgentRunner, Runner):
-    async def run(  # type: ignore[override]
+class DefaultAgentRunner(AgentRunner):
+    async def run(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
-        **kwargs: Unpack[AgentRunnerParams[TContext]],
+        **kwargs: Unpack[RunOptions[TContext]],
     ) -> RunResult:
         context = kwargs.get("context")
         max_turns = kwargs.get("max_turns", DEFAULT_MAX_TURNS)
@@ -389,13 +351,17 @@ async def run(  # type: ignore[override]
 
             try:
                 while True:
-                    all_tools = await self._get_all_tools(current_agent, context_wrapper)
+                    all_tools = await DefaultAgentRunner._get_all_tools(
+                        current_agent, context_wrapper
+                    )
 
                     # Start an agent span if we don't have one. This span is ended if the current
                     # agent changes, or if the agent loop ends.
                     if current_span is None:
-                        handoff_names = [h.agent_name for h in self._get_handoffs(current_agent)]
-                        if output_schema := self._get_output_schema(current_agent):
+                        handoff_names = [
+                            h.agent_name for h in DefaultAgentRunner._get_handoffs(current_agent)
+                        ]
+                        if output_schema := DefaultAgentRunner._get_output_schema(current_agent):
                             output_type_name = output_schema.name()
                         else:
                             output_type_name = "str"
@@ -507,11 +473,11 @@ async def run(  # type: ignore[override]
                 if current_span:
                     current_span.finish(reset_current=True)
 
-    def run_sync(  # type: ignore[override]
+    def run_sync(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
-        **kwargs: Unpack[AgentRunnerParams[TContext]],
+        **kwargs: Unpack[RunOptions[TContext]],
     ) -> RunResult:
         context = kwargs.get("context")
         max_turns = kwargs.get("max_turns", DEFAULT_MAX_TURNS)
@@ -530,11 +496,11 @@ def run_sync(  # type: ignore[override]
             )
         )
 
-    def run_streamed(  # type: ignore[override]
+    def run_streamed(
         self,
         starting_agent: Agent[TContext],
         input: str | list[TResponseInputItem],
-        **kwargs: Unpack[AgentRunnerParams[TContext]],
+        **kwargs: Unpack[RunOptions[TContext]],
     ) -> RunResultStreaming:
         context = kwargs.get("context")
         max_turns = kwargs.get("max_turns", DEFAULT_MAX_TURNS)
@@ -561,7 +527,7 @@ def run_streamed(  # type: ignore[override]
             )
         )
 
-        output_schema = self._get_output_schema(starting_agent)
+        output_schema = DefaultAgentRunner._get_output_schema(starting_agent)
         context_wrapper: RunContextWrapper[TContext] = RunContextWrapper(
             context=context  # type: ignore
         )
@@ -1102,3 +1068,39 @@ async def _get_new_response(
         context_wrapper.usage.add(new_response.usage)
 
         return new_response
+
+    @classmethod
+    def _get_output_schema(cls, agent: Agent[Any]) -> AgentOutputSchemaBase | None:
+        if agent.output_type is None or agent.output_type is str:
+            return None
+        elif isinstance(agent.output_type, AgentOutputSchemaBase):
+            return agent.output_type
+
+        return AgentOutputSchema(agent.output_type)
+
+    @classmethod
+    def _get_handoffs(cls, agent: Agent[Any]) -> list[Handoff]:
+        handoffs = []
+        for handoff_item in agent.handoffs:
+            if isinstance(handoff_item, Handoff):
+                handoffs.append(handoff_item)
+            elif isinstance(handoff_item, Agent):
+                handoffs.append(handoff(handoff_item))
+        return handoffs
+
+    @classmethod
+    async def _get_all_tools(
+        cls, agent: Agent[Any], context_wrapper: RunContextWrapper[Any]
+    ) -> list[Tool]:
+        return await agent.get_all_tools(context_wrapper)
+
+    @classmethod
+    def _get_model(cls, agent: Agent[Any], run_config: RunConfig) -> Model:
+        if isinstance(run_config.model, Model):
+            return run_config.model
+        elif isinstance(run_config.model, str):
+            return run_config.model_provider.get_model(run_config.model)
+        elif isinstance(agent.model, Model):
+            return agent.model
+
+        return run_config.model_provider.get_model(agent.model)
diff --git a/src/agents/tool_context.py b/src/agents/tool_context.py
index 17b595f06..c4329b8af 100644
--- a/src/agents/tool_context.py
+++ b/src/agents/tool_context.py
@@ -7,6 +7,7 @@
 def _assert_must_pass_tool_call_id() -> str:
     raise ValueError("tool_call_id must be passed to ToolContext")
 
+
 @dataclass
 class ToolContext(RunContextWrapper[TContext]):
     """The context of a tool call."""
diff --git a/tests/models/test_map.py b/tests/models/test_map.py
index 6b65fc094..11df1c0e5 100644
--- a/tests/models/test_map.py
+++ b/tests/models/test_map.py
@@ -1,20 +1,21 @@
-from agents import Agent, OpenAIResponsesModel, RunConfig, Runner
+from agents import Agent, OpenAIResponsesModel, RunConfig
 from agents.extensions.models.litellm_model import LitellmModel
+from agents.run import DefaultAgentRunner
 
 
 def test_no_prefix_is_openai():
     agent = Agent(model="gpt-4o", instructions="", name="test")
-    model = Runner._get_model(agent, RunConfig())
+    model = DefaultAgentRunner._get_model(agent, RunConfig())
     assert isinstance(model, OpenAIResponsesModel)
 
 
 def openai_prefix_is_openai():
     agent = Agent(model="openai/gpt-4o", instructions="", name="test")
-    model = Runner._get_model(agent, RunConfig())
+    model = DefaultAgentRunner._get_model(agent, RunConfig())
     assert isinstance(model, OpenAIResponsesModel)
 
 
 def test_litellm_prefix_is_litellm():
     agent = Agent(model="litellm/foo/bar", instructions="", name="test")
-    model = Runner._get_model(agent, RunConfig())
+    model = DefaultAgentRunner._get_model(agent, RunConfig())
     assert isinstance(model, LitellmModel)
diff --git a/tests/test_agent_config.py b/tests/test_agent_config.py
index f79c0cf8a..3ecce7788 100644
--- a/tests/test_agent_config.py
+++ b/tests/test_agent_config.py
@@ -1,7 +1,8 @@
 import pytest
 from pydantic import BaseModel
 
-from agents import Agent, AgentOutputSchema, Handoff, RunContextWrapper, Runner, handoff
+from agents import Agent, AgentOutputSchema, Handoff, RunContextWrapper, handoff
+from agents.run import DefaultAgentRunner
 
 
 @pytest.mark.asyncio
@@ -42,7 +43,7 @@ async def test_handoff_with_agents():
         handoffs=[agent_1, agent_2],
     )
 
-    handoffs = Runner._get_handoffs(agent_3)
+    handoffs = DefaultAgentRunner._get_handoffs(agent_3)
     assert len(handoffs) == 2
 
     assert handoffs[0].agent_name == "agent_1"
@@ -77,7 +78,7 @@ async def test_handoff_with_handoff_obj():
         ],
     )
 
-    handoffs = Runner._get_handoffs(agent_3)
+    handoffs = DefaultAgentRunner._get_handoffs(agent_3)
     assert len(handoffs) == 2
 
     assert handoffs[0].agent_name == "agent_1"
@@ -111,7 +112,7 @@ async def test_handoff_with_handoff_obj_and_agent():
         handoffs=[handoff(agent_1), agent_2],
     )
 
-    handoffs = Runner._get_handoffs(agent_3)
+    handoffs = DefaultAgentRunner._get_handoffs(agent_3)
     assert len(handoffs) == 2
 
     assert handoffs[0].agent_name == "agent_1"
@@ -159,7 +160,7 @@ async def test_agent_final_output():
         output_type=Foo,
     )
 
-    schema = Runner._get_output_schema(agent)
+    schema = DefaultAgentRunner._get_output_schema(agent)
     assert isinstance(schema, AgentOutputSchema)
     assert schema is not None
     assert schema.output_type == Foo
diff --git a/tests/test_handoff_tool.py b/tests/test_handoff_tool.py
index 0a8f064f1..a33b53965 100644
--- a/tests/test_handoff_tool.py
+++ b/tests/test_handoff_tool.py
@@ -12,10 +12,10 @@
     MessageOutputItem,
     ModelBehaviorError,
     RunContextWrapper,
-    Runner,
     UserError,
     handoff,
 )
+from agents.run import DefaultAgentRunner
 
 
 def message_item(content: str, agent: Agent[Any]) -> MessageOutputItem:
@@ -45,9 +45,9 @@ def test_single_handoff_setup():
     assert not agent_1.handoffs
     assert agent_2.handoffs == [agent_1]
 
-    assert not Runner._get_handoffs(agent_1)
+    assert not DefaultAgentRunner._get_handoffs(agent_1)
 
-    handoff_objects = Runner._get_handoffs(agent_2)
+    handoff_objects = DefaultAgentRunner._get_handoffs(agent_2)
     assert len(handoff_objects) == 1
     obj = handoff_objects[0]
     assert obj.tool_name == Handoff.default_tool_name(agent_1)
@@ -64,7 +64,7 @@ def test_multiple_handoffs_setup():
     assert not agent_1.handoffs
     assert not agent_2.handoffs
 
-    handoff_objects = Runner._get_handoffs(agent_3)
+    handoff_objects = DefaultAgentRunner._get_handoffs(agent_3)
     assert len(handoff_objects) == 2
     assert handoff_objects[0].tool_name == Handoff.default_tool_name(agent_1)
     assert handoff_objects[1].tool_name == Handoff.default_tool_name(agent_2)
@@ -95,7 +95,7 @@ def test_custom_handoff_setup():
     assert not agent_1.handoffs
     assert not agent_2.handoffs
 
-    handoff_objects = Runner._get_handoffs(agent_3)
+    handoff_objects = DefaultAgentRunner._get_handoffs(agent_3)
     assert len(handoff_objects) == 2
 
     first_handoff = handoff_objects[0]
diff --git a/tests/test_output_tool.py b/tests/test_output_tool.py
index 37c1b1b67..786729e13 100644
--- a/tests/test_output_tool.py
+++ b/tests/test_output_tool.py
@@ -10,16 +10,16 @@
     AgentOutputSchema,
     AgentOutputSchemaBase,
     ModelBehaviorError,
-    Runner,
     UserError,
 )
 from agents.agent_output import _WRAPPER_DICT_KEY
+from agents.run import DefaultAgentRunner
 from agents.util import _json
 
 
 def test_plain_text_output():
     agent = Agent(name="test")
-    output_schema = Runner._get_output_schema(agent)
+    output_schema = DefaultAgentRunner._get_output_schema(agent)
     assert not output_schema, "Shouldn't have an output tool config without an output type"
 
     agent = Agent(name="test", output_type=str)
@@ -32,7 +32,7 @@ class Foo(BaseModel):
 
 def test_structured_output_pydantic():
     agent = Agent(name="test", output_type=Foo)
-    output_schema = Runner._get_output_schema(agent)
+    output_schema = DefaultAgentRunner._get_output_schema(agent)
     assert output_schema, "Should have an output tool config with a structured output type"
 
     assert isinstance(output_schema, AgentOutputSchema)
@@ -52,7 +52,7 @@ class Bar(TypedDict):
 
 def test_structured_output_typed_dict():
     agent = Agent(name="test", output_type=Bar)
-    output_schema = Runner._get_output_schema(agent)
+    output_schema = DefaultAgentRunner._get_output_schema(agent)
     assert output_schema, "Should have an output tool config with a structured output type"
     assert isinstance(output_schema, AgentOutputSchema)
     assert output_schema.output_type == Bar, "Should have the correct output type"
@@ -65,7 +65,7 @@ def test_structured_output_typed_dict():
 
 def test_structured_output_list():
     agent = Agent(name="test", output_type=list[str])
-    output_schema = Runner._get_output_schema(agent)
+    output_schema = DefaultAgentRunner._get_output_schema(agent)
     assert output_schema, "Should have an output tool config with a structured output type"
     assert isinstance(output_schema, AgentOutputSchema)
     assert output_schema.output_type == list[str], "Should have the correct output type"
@@ -79,14 +79,14 @@ def test_structured_output_list():
 
 def test_bad_json_raises_error(mocker):
     agent = Agent(name="test", output_type=Foo)
-    output_schema = Runner._get_output_schema(agent)
+    output_schema = DefaultAgentRunner._get_output_schema(agent)
     assert output_schema, "Should have an output tool config with a structured output type"
 
     with pytest.raises(ModelBehaviorError):
         output_schema.validate_json("not valid json")
 
     agent = Agent(name="test", output_type=list[str])
-    output_schema = Runner._get_output_schema(agent)
+    output_schema = DefaultAgentRunner._get_output_schema(agent)
     assert output_schema, "Should have an output tool config with a structured output type"
 
     mock_validate_json = mocker.patch.object(_json, "validate_json")
@@ -155,7 +155,7 @@ def validate_json(self, json_str: str) -> Any:
 def test_custom_output_schema():
     custom_output_schema = CustomOutputSchema()
     agent = Agent(name="test", output_type=custom_output_schema)
-    output_schema = Runner._get_output_schema(agent)
+    output_schema = DefaultAgentRunner._get_output_schema(agent)
 
     assert output_schema, "Should have an output tool config with a structured output type"
     assert isinstance(output_schema, CustomOutputSchema)
diff --git a/tests/test_run_config.py b/tests/test_run_config.py
index 51835ab66..7da7c72d5 100644
--- a/tests/test_run_config.py
+++ b/tests/test_run_config.py
@@ -60,7 +60,7 @@ async def test_run_config_model_name_override_takes_precedence() -> None:
 async def test_run_config_model_override_object_takes_precedence() -> None:
     """
     When a concrete Model instance is set on the RunConfig, then that instance should be
-    returned by Runner._get_model regardless of the agent's model.
+    returned by DefaultAgentRunner._get_model regardless of the agent's model.
     """
     fake_model = FakeModel(initial_output=[get_text_message("override-object")])
     agent = Agent(name="test", model="agent-model")
diff --git a/tests/test_run_step_execution.py b/tests/test_run_step_execution.py
index 6f446649a..680cd4230 100644
--- a/tests/test_run_step_execution.py
+++ b/tests/test_run_step_execution.py
@@ -14,7 +14,6 @@
     RunContextWrapper,
     RunHooks,
     RunItem,
-    Runner,
     ToolCallItem,
     ToolCallOutputItem,
     TResponseInputItem,
@@ -27,6 +26,7 @@
     RunImpl,
     SingleStepResult,
 )
+from agents.run import DefaultAgentRunner
 from agents.tool import function_tool
 from agents.tool_context import ToolContext
 
@@ -324,8 +324,8 @@ async def get_execute_result(
     context_wrapper: RunContextWrapper[Any] | None = None,
     run_config: RunConfig | None = None,
 ) -> SingleStepResult:
-    output_schema = Runner._get_output_schema(agent)
-    handoffs = Runner._get_handoffs(agent)
+    output_schema = DefaultAgentRunner._get_output_schema(agent)
+    handoffs = DefaultAgentRunner._get_handoffs(agent)
 
     processed_response = RunImpl.process_model_response(
         agent=agent,
diff --git a/tests/test_run_step_processing.py b/tests/test_run_step_processing.py
index 3cc1231c1..e8f5c03c2 100644
--- a/tests/test_run_step_processing.py
+++ b/tests/test_run_step_processing.py
@@ -24,6 +24,7 @@
     Usage,
 )
 from agents._run_impl import RunImpl
+from agents.run import DefaultAgentRunner
 
 from .test_responses import (
     get_final_output_message,
@@ -186,7 +187,7 @@ async def test_handoffs_parsed_correctly():
         agent=agent_3,
         response=response,
         output_schema=None,
-        handoffs=Runner._get_handoffs(agent_3),
+        handoffs=DefaultAgentRunner._get_handoffs(agent_3),
         all_tools=await agent_3.get_all_tools(_dummy_ctx()),
     )
     assert len(result.handoffs) == 1, "Should have a handoff here"
@@ -216,7 +217,7 @@ async def test_missing_handoff_fails():
             agent=agent_3,
             response=response,
             output_schema=None,
-            handoffs=Runner._get_handoffs(agent_3),
+            handoffs=DefaultAgentRunner._get_handoffs(agent_3),
             all_tools=await agent_3.get_all_tools(_dummy_ctx()),
         )
 
@@ -239,7 +240,7 @@ async def test_multiple_handoffs_doesnt_error():
         agent=agent_3,
         response=response,
         output_schema=None,
-        handoffs=Runner._get_handoffs(agent_3),
+        handoffs=DefaultAgentRunner._get_handoffs(agent_3),
         all_tools=await agent_3.get_all_tools(_dummy_ctx()),
     )
     assert len(result.handoffs) == 2, "Should have multiple handoffs here"
@@ -264,7 +265,7 @@ async def test_final_output_parsed_correctly():
     RunImpl.process_model_response(
         agent=agent,
         response=response,
-        output_schema=Runner._get_output_schema(agent),
+        output_schema=DefaultAgentRunner._get_output_schema(agent),
         handoffs=[],
         all_tools=await agent.get_all_tools(_dummy_ctx()),
     )
@@ -471,7 +472,7 @@ async def test_tool_and_handoff_parsed_correctly():
         agent=agent_3,
         response=response,
         output_schema=None,
-        handoffs=Runner._get_handoffs(agent_3),
+        handoffs=DefaultAgentRunner._get_handoffs(agent_3),
         all_tools=await agent_3.get_all_tools(_dummy_ctx()),
     )
     assert result.functions and len(result.functions) == 1

From aeede3c6021fbd2a9b83335bc3399e6a128ade34 Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Tue, 17 Jun 2025 09:15:08 -0700
Subject: [PATCH 16/22] agents/__init__.py: remove unused AgentRunner and
 DefaultAgentRunner imports and __all__ entries

---
 src/agents/__init__.py | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/src/agents/__init__.py b/src/agents/__init__.py
index d2e0857e5..7464498f1 100644
--- a/src/agents/__init__.py
+++ b/src/agents/__init__.py
@@ -47,7 +47,7 @@
 from .models.openai_responses import OpenAIResponsesModel
 from .repl import run_demo_loop
 from .result import RunResult, RunResultStreaming
-from .run import AgentRunner, DefaultAgentRunner, RunConfig, Runner
+from .run import RunConfig, Runner
 from .run_context import RunContextWrapper, TContext
 from .stream_events import (
     AgentUpdatedStreamEvent,
@@ -162,8 +162,6 @@ def enable_verbose_stdout_logging():
     "ToolsToFinalOutputFunction",
     "ToolsToFinalOutputResult",
     "Runner",
-    "AgentRunner",
-    "DefaultAgentRunner",
     "run_demo_loop",
     "Model",
     "ModelProvider",

From 27c63c60e0515f2986d6404a22d6002e9bc91dc9 Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Tue, 17 Jun 2025 09:19:51 -0700
Subject: [PATCH 17/22] tests: clean unused import in test_run_step_processing
 & fix import order in voice workflow tests

---
 tests/test_run_step_processing.py | 1 -
 tests/voice/test_workflow.py      | 5 +++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/tests/test_run_step_processing.py b/tests/test_run_step_processing.py
index e8f5c03c2..bb66fd524 100644
--- a/tests/test_run_step_processing.py
+++ b/tests/test_run_step_processing.py
@@ -19,7 +19,6 @@
     ModelResponse,
     ReasoningItem,
     RunContextWrapper,
-    Runner,
     ToolCallItem,
     Usage,
 )
diff --git a/tests/voice/test_workflow.py b/tests/voice/test_workflow.py
index 035a05d56..13d1fa9f4 100644
--- a/tests/voice/test_workflow.py
+++ b/tests/voice/test_workflow.py
@@ -18,11 +18,12 @@
     TResponseStreamEvent,
 )
 
+from ..fake_model import get_response_obj
+from ..test_responses import get_function_tool, get_function_tool_call, get_text_message
+
 try:
     from agents.voice import SingleAgentVoiceWorkflow
 
-    from ..fake_model import get_response_obj
-    from ..test_responses import get_function_tool, get_function_tool_call, get_text_message
 except ImportError:
     pass
 

From 43be4779d9f91eddc11012c1adef82af23669c7a Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Tue, 17 Jun 2025 10:48:32 -0700
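Subject: [PATCH 18/22] fb: drop abstract AgentRunner base, rename
 DefaultAgentRunner to AgentRunner, make RunOptions keys NotRequired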

---
 src/agents/run.py                 | 58 ++++++++-----------------------
 tests/models/test_map.py          |  8 ++---
 tests/test_agent_config.py        | 10 +++---
 tests/test_handoff_tool.py        | 10 +++---
 tests/test_output_tool.py         | 16 ++++-----
 tests/test_run_config.py          |  2 +-
 tests/test_run_step_execution.py  |  6 ++--
 tests/test_run_step_processing.py | 12 +++----
 8 files changed, 46 insertions(+), 76 deletions(-)

diff --git a/src/agents/run.py b/src/agents/run.py
index 5c273b8b9..898f29396 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -1,10 +1,10 @@
 from __future__ import annotations
 
-import abc
 import asyncio
 import copy
 from dataclasses import dataclass, field
 from typing import Any, Generic, cast
 
 from openai.types.responses import ResponseCompletedEvent
+from typing_extensions import NotRequired
 from typing_extensions import TypedDict, Unpack
@@ -112,51 +111,22 @@ class RunConfig:
 class RunOptions(TypedDict, Generic[TContext]):
     """Arguments for ``AgentRunner`` methods."""
 
-    context: TContext | None
+    context: NotRequired[TContext | None]
     """The context for the run."""
 
-    max_turns: int
+    max_turns: NotRequired[int]
     """The maximum number of turns to run for."""
 
-    hooks: RunHooks[TContext] | None
+    hooks: NotRequired[RunHooks[TContext] | None]
     """Lifecycle hooks for the run."""
 
-    run_config: RunConfig | None
+    run_config: NotRequired[RunConfig | None]
     """Run configuration."""
 
-    previous_response_id: str | None
+    previous_response_id: NotRequired[str | None]
     """The ID of the previous response, if any."""
 
 
-class AgentRunner(abc.ABC):
-    @abc.abstractmethod
-    async def run(
-        self,
-        starting_agent: Agent[TContext],
-        input: str | list[TResponseInputItem],
-        **kwargs: Unpack[RunOptions[TContext]],
-    ) -> RunResult:
-        pass
-
-    @abc.abstractmethod
-    def run_sync(
-        self,
-        starting_agent: Agent[TContext],
-        input: str | list[TResponseInputItem],
-        **kwargs: Unpack[RunOptions[TContext]],
-    ) -> RunResult:
-        pass
-
-    @abc.abstractmethod
-    def run_streamed(
-        self,
-        starting_agent: Agent[TContext],
-        input: str | list[TResponseInputItem],
-        **kwargs: Unpack[RunOptions[TContext]],
-    ) -> RunResultStreaming:
-        pass
-
-
 class Runner:
     @classmethod
     async def run(
@@ -196,7 +166,7 @@ async def run(
             A run result containing all the inputs, guardrail results and the output of the last
             agent. Agents may perform handoffs, so we don't know the specific type of the output.
         """
-        runner = DefaultAgentRunner()
+        runner = AgentRunner()
         return await runner.run(
             starting_agent,
             input,
@@ -248,7 +218,7 @@ def run_sync(
             A run result containing all the inputs, guardrail results and the output of the last
             agent. Agents may perform handoffs, so we don't know the specific type of the output.
         """
-        runner = DefaultAgentRunner()
+        runner = AgentRunner()
         return runner.run_sync(
             starting_agent,
             input,
@@ -296,7 +266,7 @@ def run_streamed(
         Returns:
             A result object that contains data about the run, as well as a method to stream events.
         """
-        runner = DefaultAgentRunner()
+        runner = AgentRunner()
         return runner.run_streamed(
             starting_agent,
             input,
@@ -308,7 +278,7 @@ def run_streamed(
         )
 
 
-class DefaultAgentRunner(AgentRunner):
+class AgentRunner:
     async def run(
         self,
         starting_agent: Agent[TContext],
@@ -351,7 +321,7 @@ async def run(
 
             try:
                 while True:
-                    all_tools = await DefaultAgentRunner._get_all_tools(
+                    all_tools = await AgentRunner._get_all_tools(
                         current_agent, context_wrapper
                     )
 
@@ -359,9 +329,9 @@ async def run(
                     # agent changes, or if the agent loop ends.
                     if current_span is None:
                         handoff_names = [
-                            h.agent_name for h in DefaultAgentRunner._get_handoffs(current_agent)
+                            h.agent_name for h in AgentRunner._get_handoffs(current_agent)
                         ]
-                        if output_schema := DefaultAgentRunner._get_output_schema(current_agent):
+                        if output_schema := AgentRunner._get_output_schema(current_agent):
                             output_type_name = output_schema.name()
                         else:
                             output_type_name = "str"
@@ -527,7 +497,7 @@ def run_streamed(
             )
         )
 
-        output_schema = DefaultAgentRunner._get_output_schema(starting_agent)
+        output_schema = AgentRunner._get_output_schema(starting_agent)
         context_wrapper: RunContextWrapper[TContext] = RunContextWrapper(
             context=context  # type: ignore
         )
diff --git a/tests/models/test_map.py b/tests/models/test_map.py
index 11df1c0e5..b1a129667 100644
--- a/tests/models/test_map.py
+++ b/tests/models/test_map.py
@@ -1,21 +1,21 @@
 from agents import Agent, OpenAIResponsesModel, RunConfig
 from agents.extensions.models.litellm_model import LitellmModel
-from agents.run import DefaultAgentRunner
+from agents.run import AgentRunner
 
 
 def test_no_prefix_is_openai():
     agent = Agent(model="gpt-4o", instructions="", name="test")
-    model = DefaultAgentRunner._get_model(agent, RunConfig())
+    model = AgentRunner._get_model(agent, RunConfig())
     assert isinstance(model, OpenAIResponsesModel)
 
 
-def openai_prefix_is_openai():
+def test_openai_prefix_is_openai():
     agent = Agent(model="openai/gpt-4o", instructions="", name="test")
-    model = DefaultAgentRunner._get_model(agent, RunConfig())
+    model = AgentRunner._get_model(agent, RunConfig())
     assert isinstance(model, OpenAIResponsesModel)
 
 
 def test_litellm_prefix_is_litellm():
     agent = Agent(model="litellm/foo/bar", instructions="", name="test")
-    model = DefaultAgentRunner._get_model(agent, RunConfig())
+    model = AgentRunner._get_model(agent, RunConfig())
     assert isinstance(model, LitellmModel)
diff --git a/tests/test_agent_config.py b/tests/test_agent_config.py
index 3ecce7788..f9423619d 100644
--- a/tests/test_agent_config.py
+++ b/tests/test_agent_config.py
@@ -2,7 +2,7 @@
 from pydantic import BaseModel
 
 from agents import Agent, AgentOutputSchema, Handoff, RunContextWrapper, handoff
-from agents.run import DefaultAgentRunner
+from agents.run import AgentRunner
 
 
 @pytest.mark.asyncio
@@ -43,7 +43,7 @@ async def test_handoff_with_agents():
         handoffs=[agent_1, agent_2],
     )
 
-    handoffs = DefaultAgentRunner._get_handoffs(agent_3)
+    handoffs = AgentRunner._get_handoffs(agent_3)
     assert len(handoffs) == 2
 
     assert handoffs[0].agent_name == "agent_1"
@@ -78,7 +78,7 @@ async def test_handoff_with_handoff_obj():
         ],
     )
 
-    handoffs = DefaultAgentRunner._get_handoffs(agent_3)
+    handoffs = AgentRunner._get_handoffs(agent_3)
     assert len(handoffs) == 2
 
     assert handoffs[0].agent_name == "agent_1"
@@ -112,7 +112,7 @@ async def test_handoff_with_handoff_obj_and_agent():
         handoffs=[handoff(agent_1), agent_2],
     )
 
-    handoffs = DefaultAgentRunner._get_handoffs(agent_3)
+    handoffs = AgentRunner._get_handoffs(agent_3)
     assert len(handoffs) == 2
 
     assert handoffs[0].agent_name == "agent_1"
@@ -160,7 +160,7 @@ async def test_agent_final_output():
         output_type=Foo,
     )
 
-    schema = DefaultAgentRunner._get_output_schema(agent)
+    schema = AgentRunner._get_output_schema(agent)
     assert isinstance(schema, AgentOutputSchema)
     assert schema is not None
     assert schema.output_type == Foo
diff --git a/tests/test_handoff_tool.py b/tests/test_handoff_tool.py
index a33b53965..a1b5b80ba 100644
--- a/tests/test_handoff_tool.py
+++ b/tests/test_handoff_tool.py
@@ -15,7 +15,7 @@
     UserError,
     handoff,
 )
-from agents.run import DefaultAgentRunner
+from agents.run import AgentRunner
 
 
 def message_item(content: str, agent: Agent[Any]) -> MessageOutputItem:
@@ -45,9 +45,9 @@ def test_single_handoff_setup():
     assert not agent_1.handoffs
     assert agent_2.handoffs == [agent_1]
 
-    assert not DefaultAgentRunner._get_handoffs(agent_1)
+    assert not AgentRunner._get_handoffs(agent_1)
 
-    handoff_objects = DefaultAgentRunner._get_handoffs(agent_2)
+    handoff_objects = AgentRunner._get_handoffs(agent_2)
     assert len(handoff_objects) == 1
     obj = handoff_objects[0]
     assert obj.tool_name == Handoff.default_tool_name(agent_1)
@@ -64,7 +64,7 @@ def test_multiple_handoffs_setup():
     assert not agent_1.handoffs
     assert not agent_2.handoffs
 
-    handoff_objects = DefaultAgentRunner._get_handoffs(agent_3)
+    handoff_objects = AgentRunner._get_handoffs(agent_3)
     assert len(handoff_objects) == 2
     assert handoff_objects[0].tool_name == Handoff.default_tool_name(agent_1)
     assert handoff_objects[1].tool_name == Handoff.default_tool_name(agent_2)
@@ -95,7 +95,7 @@ def test_custom_handoff_setup():
     assert not agent_1.handoffs
     assert not agent_2.handoffs
 
-    handoff_objects = DefaultAgentRunner._get_handoffs(agent_3)
+    handoff_objects = AgentRunner._get_handoffs(agent_3)
     assert len(handoff_objects) == 2
 
     first_handoff = handoff_objects[0]
diff --git a/tests/test_output_tool.py b/tests/test_output_tool.py
index 786729e13..e98fd3c55 100644
--- a/tests/test_output_tool.py
+++ b/tests/test_output_tool.py
@@ -13,13 +13,13 @@
     UserError,
 )
 from agents.agent_output import _WRAPPER_DICT_KEY
-from agents.run import DefaultAgentRunner
+from agents.run import AgentRunner
 from agents.util import _json
 
 
 def test_plain_text_output():
     agent = Agent(name="test")
-    output_schema = DefaultAgentRunner._get_output_schema(agent)
+    output_schema = AgentRunner._get_output_schema(agent)
     assert not output_schema, "Shouldn't have an output tool config without an output type"
 
     agent = Agent(name="test", output_type=str)
@@ -32,7 +32,7 @@ class Foo(BaseModel):
 
 def test_structured_output_pydantic():
     agent = Agent(name="test", output_type=Foo)
-    output_schema = DefaultAgentRunner._get_output_schema(agent)
+    output_schema = AgentRunner._get_output_schema(agent)
     assert output_schema, "Should have an output tool config with a structured output type"
 
     assert isinstance(output_schema, AgentOutputSchema)
@@ -52,7 +52,7 @@ class Bar(TypedDict):
 
 def test_structured_output_typed_dict():
     agent = Agent(name="test", output_type=Bar)
-    output_schema = DefaultAgentRunner._get_output_schema(agent)
+    output_schema = AgentRunner._get_output_schema(agent)
     assert output_schema, "Should have an output tool config with a structured output type"
     assert isinstance(output_schema, AgentOutputSchema)
     assert output_schema.output_type == Bar, "Should have the correct output type"
@@ -65,7 +65,7 @@ def test_structured_output_typed_dict():
 
 def test_structured_output_list():
     agent = Agent(name="test", output_type=list[str])
-    output_schema = DefaultAgentRunner._get_output_schema(agent)
+    output_schema = AgentRunner._get_output_schema(agent)
     assert output_schema, "Should have an output tool config with a structured output type"
     assert isinstance(output_schema, AgentOutputSchema)
     assert output_schema.output_type == list[str], "Should have the correct output type"
@@ -79,14 +79,14 @@ def test_structured_output_list():
 
 def test_bad_json_raises_error(mocker):
     agent = Agent(name="test", output_type=Foo)
-    output_schema = DefaultAgentRunner._get_output_schema(agent)
+    output_schema = AgentRunner._get_output_schema(agent)
     assert output_schema, "Should have an output tool config with a structured output type"
 
     with pytest.raises(ModelBehaviorError):
         output_schema.validate_json("not valid json")
 
     agent = Agent(name="test", output_type=list[str])
-    output_schema = DefaultAgentRunner._get_output_schema(agent)
+    output_schema = AgentRunner._get_output_schema(agent)
     assert output_schema, "Should have an output tool config with a structured output type"
 
     mock_validate_json = mocker.patch.object(_json, "validate_json")
@@ -155,7 +155,7 @@ def validate_json(self, json_str: str) -> Any:
 def test_custom_output_schema():
     custom_output_schema = CustomOutputSchema()
     agent = Agent(name="test", output_type=custom_output_schema)
-    output_schema = DefaultAgentRunner._get_output_schema(agent)
+    output_schema = AgentRunner._get_output_schema(agent)
 
     assert output_schema, "Should have an output tool config with a structured output type"
     assert isinstance(output_schema, CustomOutputSchema)
diff --git a/tests/test_run_config.py b/tests/test_run_config.py
index 7da7c72d5..e19899006 100644
--- a/tests/test_run_config.py
+++ b/tests/test_run_config.py
@@ -60,7 +60,7 @@ async def test_run_config_model_name_override_takes_precedence() -> None:
 async def test_run_config_model_override_object_takes_precedence() -> None:
     """
     When a concrete Model instance is set on the RunConfig, then that instance should be
-    returned by DefaultAgentRunner._get_model regardless of the agent's model.
+    returned by AgentRunner._get_model regardless of the agent's model.
     """
     fake_model = FakeModel(initial_output=[get_text_message("override-object")])
     agent = Agent(name="test", model="agent-model")
diff --git a/tests/test_run_step_execution.py b/tests/test_run_step_execution.py
index 680cd4230..2454a4462 100644
--- a/tests/test_run_step_execution.py
+++ b/tests/test_run_step_execution.py
@@ -26,7 +26,7 @@
     RunImpl,
     SingleStepResult,
 )
-from agents.run import DefaultAgentRunner
+from agents.run import AgentRunner
 from agents.tool import function_tool
 from agents.tool_context import ToolContext
 
@@ -324,8 +324,8 @@ async def get_execute_result(
     context_wrapper: RunContextWrapper[Any] | None = None,
     run_config: RunConfig | None = None,
 ) -> SingleStepResult:
-    output_schema = DefaultAgentRunner._get_output_schema(agent)
-    handoffs = DefaultAgentRunner._get_handoffs(agent)
+    output_schema = AgentRunner._get_output_schema(agent)
+    handoffs = AgentRunner._get_handoffs(agent)
 
     processed_response = RunImpl.process_model_response(
         agent=agent,
diff --git a/tests/test_run_step_processing.py b/tests/test_run_step_processing.py
index bb66fd524..5a75ec837 100644
--- a/tests/test_run_step_processing.py
+++ b/tests/test_run_step_processing.py
@@ -23,7 +23,7 @@
     Usage,
 )
 from agents._run_impl import RunImpl
-from agents.run import DefaultAgentRunner
+from agents.run import AgentRunner
 
 from .test_responses import (
     get_final_output_message,
@@ -186,7 +186,7 @@ async def test_handoffs_parsed_correctly():
         agent=agent_3,
         response=response,
         output_schema=None,
-        handoffs=DefaultAgentRunner._get_handoffs(agent_3),
+        handoffs=AgentRunner._get_handoffs(agent_3),
         all_tools=await agent_3.get_all_tools(_dummy_ctx()),
     )
     assert len(result.handoffs) == 1, "Should have a handoff here"
@@ -216,7 +216,7 @@ async def test_missing_handoff_fails():
             agent=agent_3,
             response=response,
             output_schema=None,
-            handoffs=DefaultAgentRunner._get_handoffs(agent_3),
+            handoffs=AgentRunner._get_handoffs(agent_3),
             all_tools=await agent_3.get_all_tools(_dummy_ctx()),
         )
 
@@ -239,7 +239,7 @@ async def test_multiple_handoffs_doesnt_error():
         agent=agent_3,
         response=response,
         output_schema=None,
-        handoffs=DefaultAgentRunner._get_handoffs(agent_3),
+        handoffs=AgentRunner._get_handoffs(agent_3),
         all_tools=await agent_3.get_all_tools(_dummy_ctx()),
     )
     assert len(result.handoffs) == 2, "Should have multiple handoffs here"
@@ -264,7 +264,7 @@ async def test_final_output_parsed_correctly():
     RunImpl.process_model_response(
         agent=agent,
         response=response,
-        output_schema=DefaultAgentRunner._get_output_schema(agent),
+        output_schema=AgentRunner._get_output_schema(agent),
         handoffs=[],
         all_tools=await agent.get_all_tools(_dummy_ctx()),
     )
@@ -471,7 +471,7 @@ async def test_tool_and_handoff_parsed_correctly():
         agent=agent_3,
         response=response,
         output_schema=None,
-        handoffs=DefaultAgentRunner._get_handoffs(agent_3),
+        handoffs=AgentRunner._get_handoffs(agent_3),
         all_tools=await agent_3.get_all_tools(_dummy_ctx()),
     )
     assert result.functions and len(result.functions) == 1

From d30a5129b8aabfee3a0c54ec283c8b1ab7551aed Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Tue, 17 Jun 2025 10:57:27 -0700
Subject: [PATCH 19/22] AgentRunner: add docstring warning that class is not
 public API

---
 src/agents/run.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/src/agents/run.py b/src/agents/run.py
index 898f29396..faae37faf 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -279,6 +279,10 @@ def run_streamed(
 
 
 class AgentRunner:
+    """
+    ATTENTION: this class is not part of the public API and should not be used directly or subclassed.
+    """
+
     async def run(
         self,
         starting_agent: Agent[TContext],

From ec1caeec75315963a6755c5d0f102c18cfb4dab7 Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Tue, 17 Jun 2025 11:10:46 -0700
Subject: [PATCH 20/22] run.py: import NotRequired from typing_extensions
 instead of typing; reorder imports

---
 src/agents/run.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/agents/run.py b/src/agents/run.py
index 79af4c00a..dae97265f 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -3,13 +3,13 @@
 import asyncio
 import copy
 from dataclasses import dataclass, field
-from typing import Any, Generic, NotRequired, cast
+from typing import Any, Generic, cast
 
 from openai.types.responses import ResponseCompletedEvent
 from openai.types.responses.response_prompt_param import (
     ResponsePromptParam,
 )
-from typing_extensions import TypedDict, Unpack
+from typing_extensions import NotRequired, TypedDict, Unpack
 
 from ._run_impl import (
     AgentToolUseTracker,

From 28ff992d6e5e993f1871c910e320e116fc81fe4c Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Tue, 17 Jun 2025 13:38:20 -0700
Subject: [PATCH 21/22] run.py: add settable default AgentRunner for Runner

---
 src/agents/run.py | 34 +++++++++++++++++++++++++++++-----
 tests/test_run.py | 26 ++++++++++++++++++++++++++
 2 files changed, 55 insertions(+), 5 deletions(-)
 create mode 100644 tests/test_run.py

diff --git a/src/agents/run.py b/src/agents/run.py
index dae97265f..f8bbb3114 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -56,6 +56,27 @@
 
 DEFAULT_MAX_TURNS = 10
 
+DEFAULT_AGENT_RUNNER: AgentRunner = None  # type: ignore
+# the value is set at the end of the module
+
+
+def set_default_agent_runner(runner: AgentRunner) -> None:
+    """
+    WARNING: this class is experimental and not part of the public API
+    It should not be used directly.
+    """
+    global DEFAULT_AGENT_RUNNER
+    DEFAULT_AGENT_RUNNER = runner
+
+
+def get_default_agent_runner() -> AgentRunner:
+    """
+    WARNING: this function is experimental and not part of the public API.
+    It should not be used directly.
+    """
+    global DEFAULT_AGENT_RUNNER
+    return DEFAULT_AGENT_RUNNER
+
 
 @dataclass
 class RunConfig:
@@ -174,7 +195,7 @@ async def run(
             A run result containing all the inputs, guardrail results and the output of the last
             agent. Agents may perform handoffs, so we don't know the specific type of the output.
         """
-        runner = AgentRunner()
+        runner = DEFAULT_AGENT_RUNNER
         return await runner.run(
             starting_agent,
             input,
@@ -226,7 +247,7 @@ def run_sync(
             A run result containing all the inputs, guardrail results and the output of the last
             agent. Agents may perform handoffs, so we don't know the specific type of the output.
         """
-        runner = AgentRunner()
+        runner = DEFAULT_AGENT_RUNNER
         return runner.run_sync(
             starting_agent,
             input,
@@ -274,7 +295,7 @@ def run_streamed(
         Returns:
             A result object that contains data about the run, as well as a method to stream events.
         """
-        runner = AgentRunner()
+        runner = DEFAULT_AGENT_RUNNER
         return runner.run_streamed(
             starting_agent,
             input,
@@ -288,8 +309,8 @@ def run_streamed(
 
 class AgentRunner:
     """
-    ATTENTION: this class is not part of the public API and
-    should not be used directly or subclassed.
+    WARNING: this class is experimental and not part of the public API
+    It should not be used directly or subclassed.
     """
 
     async def run(
@@ -1095,3 +1116,6 @@ def _get_model(cls, agent: Agent[Any], run_config: RunConfig) -> Model:
             return agent.model
 
         return run_config.model_provider.get_model(agent.model)
+
+
+DEFAULT_AGENT_RUNNER = AgentRunner()
diff --git a/tests/test_run.py b/tests/test_run.py
new file mode 100644
index 000000000..66cfee1f1
--- /dev/null
+++ b/tests/test_run.py
@@ -0,0 +1,26 @@
+from __future__ import annotations
+
+from unittest import mock
+
+import pytest
+
+from agents import Agent, Runner
+from agents.run import AgentRunner, set_default_agent_runner
+
+from .fake_model import FakeModel
+
+
+@pytest.mark.asyncio
+async def test_static_run_methods_call_into_default_runner() -> None:
+    runner = mock.Mock(spec=AgentRunner)
+    set_default_agent_runner(runner)
+
+    agent = Agent(name="test", model=FakeModel())
+    await Runner.run(agent, input="test")
+    runner.run.assert_called_once()
+
+    Runner.run_streamed(agent, input="test")
+    runner.run_streamed.assert_called_once()
+
+    Runner.run_sync(agent, input="test")
+    runner.run_sync.assert_called_once()

From 5eb048686f7093ff55d896cbe79b9f65d8757e8d Mon Sep 17 00:00:00 2001
From: pakrym-oai <pakrym@openai.com>
Date: Tue, 17 Jun 2025 13:44:31 -0700
Subject: [PATCH 22/22] run.py: set_default_agent_runner accepts None, which
 resets DEFAULT_AGENT_RUNNER to a new AgentRunner; conftest.py: add autouse
 fixture to reset DEFAULT_AGENT_RUNNER before each test

---
 src/agents/run.py | 4 ++--
 tests/conftest.py | 6 ++++++
 2 files changed, 8 insertions(+), 2 deletions(-)

diff --git a/src/agents/run.py b/src/agents/run.py
index f8bbb3114..8a44a0e54 100644
--- a/src/agents/run.py
+++ b/src/agents/run.py
@@ -60,13 +60,13 @@
 # the value is set at the end of the module
 
 
-def set_default_agent_runner(runner: AgentRunner) -> None:
+def set_default_agent_runner(runner: AgentRunner | None) -> None:
     """
     WARNING: this class is experimental and not part of the public API
     It should not be used directly.
     """
     global DEFAULT_AGENT_RUNNER
-    DEFAULT_AGENT_RUNNER = runner
+    DEFAULT_AGENT_RUNNER = runner or AgentRunner()
 
 
 def get_default_agent_runner() -> AgentRunner:
diff --git a/tests/conftest.py b/tests/conftest.py
index 7527e11b8..b73d734d1 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -5,6 +5,7 @@
 from agents.models import _openai_shared
 from agents.models.openai_chatcompletions import OpenAIChatCompletionsModel
 from agents.models.openai_responses import OpenAIResponsesModel
+from agents.run import set_default_agent_runner
 from agents.tracing import set_trace_processors
 from agents.tracing.setup import get_trace_provider
 
@@ -33,6 +34,11 @@ def clear_openai_settings():
     _openai_shared._use_responses_by_default = True
 
 
+@pytest.fixture(autouse=True)
+def clear_default_runner():
+    set_default_agent_runner(None)
+
+
 # This fixture will run after all tests end
 @pytest.fixture(autouse=True, scope="session")
 def shutdown_trace_provider():