`Runner`

运行器

Source code in src/agents/run.py

class Runner:
    @classmethod
    async def run(
        cls,
        starting_agent: Agent[TContext],
        input: str | list[TResponseInputItem],
        *,
        context: TContext | None = None,
        max_turns: int = DEFAULT_MAX_TURNS,
        hooks: RunHooks[TContext] | None = None,
        run_config: RunConfig | None = None,
    ) -> RunResult:
        """Run a workflow starting at the given agent. The agent will run in a loop until a final
        output is generated. The loop runs like so:
        1. The agent is invoked with the given input.
        2. If there is a final output (i.e. the agent produces something of type
            `agent.output_type`, the loop terminates.
        3. If there's a handoff, we run the loop again, with the new agent.
        4. Else, we run tool calls (if any), and re-run the loop.

        In two cases, the agent may raise an exception:
        1. If the max_turns is exceeded, a MaxTurnsExceeded exception is raised.
        2. If a guardrail tripwire is triggered, a GuardrailTripwireTriggered exception is raised.

        Note that only the first agent's input guardrails are run.

        Args:
            starting_agent: The starting agent to run.
            input: The initial input to the agent. You can pass a single string for a user message,
                or a list of input items.
            context: The context to run the agent with.
            max_turns: The maximum number of turns to run the agent for. A turn is defined as one
                AI invocation (including any tool calls that might occur).
            hooks: An object that receives callbacks on various lifecycle events.
            run_config: Global settings for the entire agent run.

        Returns:
            A run result containing all the inputs, guardrail results and the output of the last
            agent. Agents may perform handoffs, so we don't know the specific type of the output.
        """
        if hooks is None:
            hooks = RunHooks[Any]()
        if run_config is None:
            run_config = RunConfig()

        tool_use_tracker = AgentToolUseTracker()

        with TraceCtxManager(
            workflow_name=run_config.workflow_name,
            trace_id=run_config.trace_id,
            group_id=run_config.group_id,
            metadata=run_config.trace_metadata,
            disabled=run_config.tracing_disabled,
        ):
            current_turn = 0
            original_input: str | list[TResponseInputItem] = copy.deepcopy(input)
            generated_items: list[RunItem] = []
            model_responses: list[ModelResponse] = []

            context_wrapper: RunContextWrapper[TContext] = RunContextWrapper(
                context=context,  # type: ignore
            )

            input_guardrail_results: list[InputGuardrailResult] = []

            current_span: Span[AgentSpanData] | None = None
            current_agent = starting_agent
            should_run_agent_start_hooks = True

            try:
                while True:
                    # Start an agent span if we don't have one. This span is ended if the current
                    # agent changes, or if the agent loop ends.
                    if current_span is None:
                        handoff_names = [h.agent_name for h in cls._get_handoffs(current_agent)]
                        if output_schema := cls._get_output_schema(current_agent):
                            output_type_name = output_schema.output_type_name()
                        else:
                            output_type_name = "str"

                        current_span = agent_span(
                            name=current_agent.name,
                            handoffs=handoff_names,
                            output_type=output_type_name,
                        )
                        current_span.start(mark_as_current=True)

                        all_tools = await cls._get_all_tools(current_agent)
                        current_span.span_data.tools = [t.name for t in all_tools]

                    current_turn += 1
                    if current_turn > max_turns:
                        _error_tracing.attach_error_to_span(
                            current_span,
                            SpanError(
                                message="Max turns exceeded",
                                data={"max_turns": max_turns},
                            ),
                        )
                        raise MaxTurnsExceeded(f"Max turns ({max_turns}) exceeded")

                    logger.debug(
                        f"Running agent {current_agent.name} (turn {current_turn})",
                    )

                    if current_turn == 1:
                        input_guardrail_results, turn_result = await asyncio.gather(
                            cls._run_input_guardrails(
                                starting_agent,
                                starting_agent.input_guardrails
                                + (run_config.input_guardrails or []),
                                copy.deepcopy(input),
                                context_wrapper,
                            ),
                            cls._run_single_turn(
                                agent=current_agent,
                                all_tools=all_tools,
                                original_input=original_input,
                                generated_items=generated_items,
                                hooks=hooks,
                                context_wrapper=context_wrapper,
                                run_config=run_config,
                                should_run_agent_start_hooks=should_run_agent_start_hooks,
                                tool_use_tracker=tool_use_tracker,
                            ),
                        )
                    else:
                        turn_result = await cls._run_single_turn(
                            agent=current_agent,
                            all_tools=all_tools,
                            original_input=original_input,
                            generated_items=generated_items,
                            hooks=hooks,
                            context_wrapper=context_wrapper,
                            run_config=run_config,
                            should_run_agent_start_hooks=should_run_agent_start_hooks,
                            tool_use_tracker=tool_use_tracker,
                        )
                    should_run_agent_start_hooks = False

                    model_responses.append(turn_result.model_response)
                    original_input = turn_result.original_input
                    generated_items = turn_result.generated_items

                    if isinstance(turn_result.next_step, NextStepFinalOutput):
                        output_guardrail_results = await cls._run_output_guardrails(
                            current_agent.output_guardrails + (run_config.output_guardrails or []),
                            current_agent,
                            turn_result.next_step.output,
                            context_wrapper,
                        )
                        return RunResult(
                            input=original_input,
                            new_items=generated_items,
                            raw_responses=model_responses,
                            final_output=turn_result.next_step.output,
                            _last_agent=current_agent,
                            input_guardrail_results=input_guardrail_results,
                            output_guardrail_results=output_guardrail_results,
                        )
                    elif isinstance(turn_result.next_step, NextStepHandoff):
                        current_agent = cast(Agent[TContext], turn_result.next_step.new_agent)
                        current_span.finish(reset_current=True)
                        current_span = None
                        should_run_agent_start_hooks = True
                    elif isinstance(turn_result.next_step, NextStepRunAgain):
                        pass
                    else:
                        raise AgentsException(
                            f"Unknown next step type: {type(turn_result.next_step)}"
                        )
            finally:
                if current_span:
                    current_span.finish(reset_current=True)

    @classmethod
    def run_sync(
        cls,
        starting_agent: Agent[TContext],
        input: str | list[TResponseInputItem],
        *,
        context: TContext | None = None,
        max_turns: int = DEFAULT_MAX_TURNS,
        hooks: RunHooks[TContext] | None = None,
        run_config: RunConfig | None = None,
    ) -> RunResult:
        """Run a workflow synchronously, starting at the given agent. Note that this just wraps the
        `run` method, so it will not work if there's already an event loop (e.g. inside an async
        function, or in a Jupyter notebook or async context like FastAPI). For those cases, use
        the `run` method instead.

        The agent will run in a loop until a final output is generated. The loop runs like so:
        1. The agent is invoked with the given input.
        2. If there is a final output (i.e. the agent produces something of type
            `agent.output_type`, the loop terminates.
        3. If there's a handoff, we run the loop again, with the new agent.
        4. Else, we run tool calls (if any), and re-run the loop.

        In two cases, the agent may raise an exception:
        1. If the max_turns is exceeded, a MaxTurnsExceeded exception is raised.
        2. If a guardrail tripwire is triggered, a GuardrailTripwireTriggered exception is raised.

        Note that only the first agent's input guardrails are run.

        Args:
            starting_agent: The starting agent to run.
            input: The initial input to the agent. You can pass a single string for a user message,
                or a list of input items.
            context: The context to run the agent with.
            max_turns: The maximum number of turns to run the agent for. A turn is defined as one
                AI invocation (including any tool calls that might occur).
            hooks: An object that receives callbacks on various lifecycle events.
            run_config: Global settings for the entire agent run.

        Returns:
            A run result containing all the inputs, guardrail results and the output of the last
            agent. Agents may perform handoffs, so we don't know the specific type of the output.
        """
        return asyncio.get_event_loop().run_until_complete(
            cls.run(
                starting_agent,
                input,
                context=context,
                max_turns=max_turns,
                hooks=hooks,
                run_config=run_config,
            )
        )

    @classmethod
    def run_streamed(
        cls,
        starting_agent: Agent[TContext],
        input: str | list[TResponseInputItem],
        context: TContext | None = None,
        max_turns: int = DEFAULT_MAX_TURNS,
        hooks: RunHooks[TContext] | None = None,
        run_config: RunConfig | None = None,
    ) -> RunResultStreaming:
        """Run a workflow starting at the given agent in streaming mode. The returned result object
        contains a method you can use to stream semantic events as they are generated.

        The agent will run in a loop until a final output is generated. The loop runs like so:
        1. The agent is invoked with the given input.
        2. If there is a final output (i.e. the agent produces something of type
            `agent.output_type`, the loop terminates.
        3. If there's a handoff, we run the loop again, with the new agent.
        4. Else, we run tool calls (if any), and re-run the loop.

        In two cases, the agent may raise an exception:
        1. If the max_turns is exceeded, a MaxTurnsExceeded exception is raised.
        2. If a guardrail tripwire is triggered, a GuardrailTripwireTriggered exception is raised.

        Note that only the first agent's input guardrails are run.

        Args:
            starting_agent: The starting agent to run.
            input: The initial input to the agent. You can pass a single string for a user message,
                or a list of input items.
            context: The context to run the agent with.
            max_turns: The maximum number of turns to run the agent for. A turn is defined as one
                AI invocation (including any tool calls that might occur).
            hooks: An object that receives callbacks on various lifecycle events.
            run_config: Global settings for the entire agent run.

        Returns:
            A result object that contains data about the run, as well as a method to stream events.
        """
        if hooks is None:
            hooks = RunHooks[Any]()
        if run_config is None:
            run_config = RunConfig()

        # If there's already a trace, we don't create a new one. In addition, we can't end the
        # trace here, because the actual work is done in `stream_events` and this method ends
        # before that.
        new_trace = (
            None
            if get_current_trace()
            else trace(
                workflow_name=run_config.workflow_name,
                trace_id=run_config.trace_id,
                group_id=run_config.group_id,
                metadata=run_config.trace_metadata,
                disabled=run_config.tracing_disabled,
            )
        )
        # Need to start the trace here, because the current trace contextvar is captured at
        # asyncio.create_task time
        if new_trace:
            new_trace.start(mark_as_current=True)

        output_schema = cls._get_output_schema(starting_agent)
        context_wrapper: RunContextWrapper[TContext] = RunContextWrapper(
            context=context  # type: ignore
        )

        streamed_result = RunResultStreaming(
            input=copy.deepcopy(input),
            new_items=[],
            current_agent=starting_agent,
            raw_responses=[],
            final_output=None,
            is_complete=False,
            current_turn=0,
            max_turns=max_turns,
            input_guardrail_results=[],
            output_guardrail_results=[],
            _current_agent_output_schema=output_schema,
            _trace=new_trace,
        )

        # Kick off the actual agent loop in the background and return the streamed result object.
        streamed_result._run_impl_task = asyncio.create_task(
            cls._run_streamed_impl(
                starting_input=input,
                streamed_result=streamed_result,
                starting_agent=starting_agent,
                max_turns=max_turns,
                hooks=hooks,
                context_wrapper=context_wrapper,
                run_config=run_config,
            )
        )
        return streamed_result

    @classmethod
    async def _run_input_guardrails_with_queue(
        cls,
        agent: Agent[Any],
        guardrails: list[InputGuardrail[TContext]],
        input: str | list[TResponseInputItem],
        context: RunContextWrapper[TContext],
        streamed_result: RunResultStreaming,
        parent_span: Span[Any],
    ):
        queue = streamed_result._input_guardrail_queue

        # We'll run the guardrails and push them onto the queue as they complete
        guardrail_tasks = [
            asyncio.create_task(
                RunImpl.run_single_input_guardrail(agent, guardrail, input, context)
            )
            for guardrail in guardrails
        ]
        guardrail_results = []
        try:
            for done in asyncio.as_completed(guardrail_tasks):
                result = await done
                if result.output.tripwire_triggered:
                    _error_tracing.attach_error_to_span(
                        parent_span,
                        SpanError(
                            message="Guardrail tripwire triggered",
                            data={
                                "guardrail": result.guardrail.get_name(),
                                "type": "input_guardrail",
                            },
                        ),
                    )
                queue.put_nowait(result)
                guardrail_results.append(result)
        except Exception:
            for t in guardrail_tasks:
                t.cancel()
            raise

        streamed_result.input_guardrail_results = guardrail_results

    @classmethod
    async def _run_streamed_impl(
        cls,
        starting_input: str | list[TResponseInputItem],
        streamed_result: RunResultStreaming,
        starting_agent: Agent[TContext],
        max_turns: int,
        hooks: RunHooks[TContext],
        context_wrapper: RunContextWrapper[TContext],
        run_config: RunConfig,
    ):
        current_span: Span[AgentSpanData] | None = None
        current_agent = starting_agent
        current_turn = 0
        should_run_agent_start_hooks = True
        tool_use_tracker = AgentToolUseTracker()

        streamed_result._event_queue.put_nowait(AgentUpdatedStreamEvent(new_agent=current_agent))

        try:
            while True:
                if streamed_result.is_complete:
                    break

                # Start an agent span if we don't have one. This span is ended if the current
                # agent changes, or if the agent loop ends.
                if current_span is None:
                    handoff_names = [h.agent_name for h in cls._get_handoffs(current_agent)]
                    if output_schema := cls._get_output_schema(current_agent):
                        output_type_name = output_schema.output_type_name()
                    else:
                        output_type_name = "str"

                    current_span = agent_span(
                        name=current_agent.name,
                        handoffs=handoff_names,
                        output_type=output_type_name,
                    )
                    current_span.start(mark_as_current=True)

                    all_tools = await cls._get_all_tools(current_agent)
                    tool_names = [t.name for t in all_tools]
                    current_span.span_data.tools = tool_names
                current_turn += 1
                streamed_result.current_turn = current_turn

                if current_turn > max_turns:
                    _error_tracing.attach_error_to_span(
                        current_span,
                        SpanError(
                            message="Max turns exceeded",
                            data={"max_turns": max_turns},
                        ),
                    )
                    streamed_result._event_queue.put_nowait(QueueCompleteSentinel())
                    break

                if current_turn == 1:
                    # Run the input guardrails in the background and put the results on the queue
                    streamed_result._input_guardrails_task = asyncio.create_task(
                        cls._run_input_guardrails_with_queue(
                            starting_agent,
                            starting_agent.input_guardrails + (run_config.input_guardrails or []),
                            copy.deepcopy(ItemHelpers.input_to_new_input_list(starting_input)),
                            context_wrapper,
                            streamed_result,
                            current_span,
                        )
                    )
                try:
                    turn_result = await cls._run_single_turn_streamed(
                        streamed_result,
                        current_agent,
                        hooks,
                        context_wrapper,
                        run_config,
                        should_run_agent_start_hooks,
                        tool_use_tracker,
                        all_tools,
                    )
                    should_run_agent_start_hooks = False

                    streamed_result.raw_responses = streamed_result.raw_responses + [
                        turn_result.model_response
                    ]
                    streamed_result.input = turn_result.original_input
                    streamed_result.new_items = turn_result.generated_items

                    if isinstance(turn_result.next_step, NextStepHandoff):
                        current_agent = turn_result.next_step.new_agent
                        current_span.finish(reset_current=True)
                        current_span = None
                        should_run_agent_start_hooks = True
                        streamed_result._event_queue.put_nowait(
                            AgentUpdatedStreamEvent(new_agent=current_agent)
                        )
                    elif isinstance(turn_result.next_step, NextStepFinalOutput):
                        streamed_result._output_guardrails_task = asyncio.create_task(
                            cls._run_output_guardrails(
                                current_agent.output_guardrails
                                + (run_config.output_guardrails or []),
                                current_agent,
                                turn_result.next_step.output,
                                context_wrapper,
                            )
                        )

                        try:
                            output_guardrail_results = await streamed_result._output_guardrails_task
                        except Exception:
                            # Exceptions will be checked in the stream_events loop
                            output_guardrail_results = []

                        streamed_result.output_guardrail_results = output_guardrail_results
                        streamed_result.final_output = turn_result.next_step.output
                        streamed_result.is_complete = True
                        streamed_result._event_queue.put_nowait(QueueCompleteSentinel())
                    elif isinstance(turn_result.next_step, NextStepRunAgain):
                        pass
                except Exception as e:
                    if current_span:
                        _error_tracing.attach_error_to_span(
                            current_span,
                            SpanError(
                                message="Error in agent run",
                                data={"error": str(e)},
                            ),
                        )
                    streamed_result.is_complete = True
                    streamed_result._event_queue.put_nowait(QueueCompleteSentinel())
                    raise

            streamed_result.is_complete = True
        finally:
            if current_span:
                current_span.finish(reset_current=True)

    @classmethod
    async def _run_single_turn_streamed(
        cls,
        streamed_result: RunResultStreaming,
        agent: Agent[TContext],
        hooks: RunHooks[TContext],
        context_wrapper: RunContextWrapper[TContext],
        run_config: RunConfig,
        should_run_agent_start_hooks: bool,
        tool_use_tracker: AgentToolUseTracker,
        all_tools: list[Tool],
    ) -> SingleStepResult:
        if should_run_agent_start_hooks:
            await asyncio.gather(
                hooks.on_agent_start(context_wrapper, agent),
                (
                    agent.hooks.on_start(context_wrapper, agent)
                    if agent.hooks
                    else _coro.noop_coroutine()
                ),
            )

        output_schema = cls._get_output_schema(agent)

        streamed_result.current_agent = agent
        streamed_result._current_agent_output_schema = output_schema

        system_prompt = await agent.get_system_prompt(context_wrapper)

        handoffs = cls._get_handoffs(agent)
        model = cls._get_model(agent, run_config)
        model_settings = agent.model_settings.resolve(run_config.model_settings)
        model_settings = RunImpl.maybe_reset_tool_choice(agent, tool_use_tracker, model_settings)

        final_response: ModelResponse | None = None

        input = ItemHelpers.input_to_new_input_list(streamed_result.input)
        input.extend([item.to_input_item() for item in streamed_result.new_items])

        # 1. Stream the output events
        async for event in model.stream_response(
            system_prompt,
            input,
            model_settings,
            all_tools,
            output_schema,
            handoffs,
            get_model_tracing_impl(
                run_config.tracing_disabled, run_config.trace_include_sensitive_data
            ),
        ):
            if isinstance(event, ResponseCompletedEvent):
                usage = (
                    Usage(
                        requests=1,
                        input_tokens=event.response.usage.input_tokens,
                        output_tokens=event.response.usage.output_tokens,
                        total_tokens=event.response.usage.total_tokens,
                    )
                    if event.response.usage
                    else Usage()
                )
                final_response = ModelResponse(
                    output=event.response.output,
                    usage=usage,
                    referenceable_id=event.response.id,
                )

            streamed_result._event_queue.put_nowait(RawResponsesStreamEvent(data=event))

        # 2. At this point, the streaming is complete for this turn of the agent loop.
        if not final_response:
            raise ModelBehaviorError("Model did not produce a final response!")

        # 3. Now, we can process the turn as we do in the non-streaming case
        single_step_result = await cls._get_single_step_result_from_response(
            agent=agent,
            original_input=streamed_result.input,
            pre_step_items=streamed_result.new_items,
            new_response=final_response,
            output_schema=output_schema,
            all_tools=all_tools,
            handoffs=handoffs,
            hooks=hooks,
            context_wrapper=context_wrapper,
            run_config=run_config,
            tool_use_tracker=tool_use_tracker,
        )

        RunImpl.stream_step_result_to_queue(single_step_result, streamed_result._event_queue)
        return single_step_result

    @classmethod
    async def _run_single_turn(
        cls,
        *,
        agent: Agent[TContext],
        all_tools: list[Tool],
        original_input: str | list[TResponseInputItem],
        generated_items: list[RunItem],
        hooks: RunHooks[TContext],
        context_wrapper: RunContextWrapper[TContext],
        run_config: RunConfig,
        should_run_agent_start_hooks: bool,
        tool_use_tracker: AgentToolUseTracker,
    ) -> SingleStepResult:
        # Ensure we run the hooks before anything else
        if should_run_agent_start_hooks:
            await asyncio.gather(
                hooks.on_agent_start(context_wrapper, agent),
                (
                    agent.hooks.on_start(context_wrapper, agent)
                    if agent.hooks
                    else _coro.noop_coroutine()
                ),
            )

        system_prompt = await agent.get_system_prompt(context_wrapper)

        output_schema = cls._get_output_schema(agent)
        handoffs = cls._get_handoffs(agent)
        input = ItemHelpers.input_to_new_input_list(original_input)
        input.extend([generated_item.to_input_item() for generated_item in generated_items])

        new_response = await cls._get_new_response(
            agent,
            system_prompt,
            input,
            output_schema,
            all_tools,
            handoffs,
            context_wrapper,
            run_config,
            tool_use_tracker,
        )

        return await cls._get_single_step_result_from_response(
            agent=agent,
            original_input=original_input,
            pre_step_items=generated_items,
            new_response=new_response,
            output_schema=output_schema,
            all_tools=all_tools,
            handoffs=handoffs,
            hooks=hooks,
            context_wrapper=context_wrapper,
            run_config=run_config,
            tool_use_tracker=tool_use_tracker,
        )

    @classmethod
    async def _get_single_step_result_from_response(
        cls,
        *,
        agent: Agent[TContext],
        all_tools: list[Tool],
        original_input: str | list[TResponseInputItem],
        pre_step_items: list[RunItem],
        new_response: ModelResponse,
        output_schema: AgentOutputSchema | None,
        handoffs: list[Handoff],
        hooks: RunHooks[TContext],
        context_wrapper: RunContextWrapper[TContext],
        run_config: RunConfig,
        tool_use_tracker: AgentToolUseTracker,
    ) -> SingleStepResult:
        processed_response = RunImpl.process_model_response(
            agent=agent,
            all_tools=all_tools,
            response=new_response,
            output_schema=output_schema,
            handoffs=handoffs,
        )

        tool_use_tracker.add_tool_use(agent, processed_response.tools_used)

        return await RunImpl.execute_tools_and_side_effects(
            agent=agent,
            original_input=original_input,
            pre_step_items=pre_step_items,
            new_response=new_response,
            processed_response=processed_response,
            output_schema=output_schema,
            hooks=hooks,
            context_wrapper=context_wrapper,
            run_config=run_config,
        )

    @classmethod
    async def _run_input_guardrails(
        cls,
        agent: Agent[Any],
        guardrails: list[InputGuardrail[TContext]],
        input: str | list[TResponseInputItem],
        context: RunContextWrapper[TContext],
    ) -> list[InputGuardrailResult]:
        if not guardrails:
            return []

        guardrail_tasks = [
            asyncio.create_task(
                RunImpl.run_single_input_guardrail(agent, guardrail, input, context)
            )
            for guardrail in guardrails
        ]

        guardrail_results = []

        for done in asyncio.as_completed(guardrail_tasks):
            result = await done
            if result.output.tripwire_triggered:
                # Cancel all guardrail tasks if a tripwire is triggered.
                for t in guardrail_tasks:
                    t.cancel()
                _error_tracing.attach_error_to_current_span(
                    SpanError(
                        message="Guardrail tripwire triggered",
                        data={"guardrail": result.guardrail.get_name()},
                    )
                )
                raise InputGuardrailTripwireTriggered(result)
            else:
                guardrail_results.append(result)

        return guardrail_results

    @classmethod
    async def _run_output_guardrails(
        cls,
        guardrails: list[OutputGuardrail[TContext]],
        agent: Agent[TContext],
        agent_output: Any,
        context: RunContextWrapper[TContext],
    ) -> list[OutputGuardrailResult]:
        if not guardrails:
            return []

        guardrail_tasks = [
            asyncio.create_task(
                RunImpl.run_single_output_guardrail(guardrail, agent, agent_output, context)
            )
            for guardrail in guardrails
        ]

        guardrail_results = []

        for done in asyncio.as_completed(guardrail_tasks):
            result = await done
            if result.output.tripwire_triggered:
                # Cancel all guardrail tasks if a tripwire is triggered.
                for t in guardrail_tasks:
                    t.cancel()
                _error_tracing.attach_error_to_current_span(
                    SpanError(
                        message="Guardrail tripwire triggered",
                        data={"guardrail": result.guardrail.get_name()},
                    )
                )
                raise OutputGuardrailTripwireTriggered(result)
            else:
                guardrail_results.append(result)

        return guardrail_results

    @classmethod
    async def _get_new_response(
        cls,
        agent: Agent[TContext],
        system_prompt: str | None,
        input: list[TResponseInputItem],
        output_schema: AgentOutputSchema | None,
        all_tools: list[Tool],
        handoffs: list[Handoff],
        context_wrapper: RunContextWrapper[TContext],
        run_config: RunConfig,
        tool_use_tracker: AgentToolUseTracker,
    ) -> ModelResponse:
        model = cls._get_model(agent, run_config)
        model_settings = agent.model_settings.resolve(run_config.model_settings)
        model_settings = RunImpl.maybe_reset_tool_choice(agent, tool_use_tracker, model_settings)

        new_response = await model.get_response(
            system_instructions=system_prompt,
            input=input,
            model_settings=model_settings,
            tools=all_tools,
            output_schema=output_schema,
            handoffs=handoffs,
            tracing=get_model_tracing_impl(
                run_config.tracing_disabled, run_config.trace_include_sensitive_data
            ),
        )

        context_wrapper.usage.add(new_response.usage)

        return new_response

    @classmethod
    def _get_output_schema(cls, agent: Agent[Any]) -> AgentOutputSchema | None:
        if agent.output_type is None or agent.output_type is str:
            return None

        return AgentOutputSchema(agent.output_type)

    @classmethod
    def _get_handoffs(cls, agent: Agent[Any]) -> list[Handoff]:
        handoffs = []
        for handoff_item in agent.handoffs:
            if isinstance(handoff_item, Handoff):
                handoffs.append(handoff_item)
            elif isinstance(handoff_item, Agent):
                handoffs.append(handoff(handoff_item))
        return handoffs

    @classmethod
    async def _get_all_tools(cls, agent: Agent[Any]) -> list[Tool]:
        return await agent.get_all_tools()

    @classmethod
    def _get_model(cls, agent: Agent[Any], run_config: RunConfig) -> Model:
        if isinstance(run_config.model, Model):
            return run_config.model
        elif isinstance(run_config.model, str):
            return run_config.model_provider.get_model(run_config.model)
        elif isinstance(agent.model, Model):
            return agent.model

        return run_config.model_provider.get_model(agent.model)

运行 `async` `classmethod`

run(
    starting_agent: Agent[TContext],
    input: str | list[TResponseInputItem],
    *,
    context: TContext | None = None,
    max_turns: int = DEFAULT_MAX_TURNS,
    hooks: RunHooks[TContext] | None = None,
    run_config: RunConfig | None = None,
) -> RunResult

从给定的代理开始运行工作流。该代理将循环运行，直到生成最终输出。循环运行流程如下： 1. 使用给定输入调用代理。 2. 如果存在最终输出（即代理生成类型为agent.output_type的内容），则循环终止。 3. 如果存在交接，我们将使用新代理再次运行循环。 4. 否则，我们将运行工具调用（如果有），并重新运行循环。

在两种情况下，代理可能会抛出异常： 1. 如果超过max_turns限制，会抛出MaxTurnsExceeded异常。 2. 如果触发防护栏机制，会抛出GuardrailTripwireTriggered异常。

请注意，仅会运行第一个代理的输入防护机制。

参数:

名称	类型	描述	默认值
`starting_agent`	`Agent[TContext]`	要运行的起始代理。	required
`input`	`str \| list[TResponseInputItem]`	代理的初始输入。您可以传递单个字符串作为用户消息，或者传递一个输入项列表。	required
`context`	`TContext \| None`	运行代理程序的上下文环境。	`None`
`max_turns`	`int`	运行代理的最大轮次数。一轮定义为一次AI调用（包括可能发生的任何工具调用）。	`DEFAULT_MAX_TURNS`
`hooks`	`RunHooks[TContext] \| None`	一个接收各种生命周期事件回调的对象。	`None`
`run_config`	`RunConfig \| None`	整个代理运行的全局设置。	`None`

返回值：

类型	描述
`RunResult`	一个运行结果，包含所有输入、防护栏结果和最后一个的输出
`RunResult`	代理。代理可能会执行交接，因此我们不知道输出的具体类型。

Source code in src/agents/run.py

@classmethod
async def run(
    cls,
    starting_agent: Agent[TContext],
    input: str | list[TResponseInputItem],
    *,
    context: TContext | None = None,
    max_turns: int = DEFAULT_MAX_TURNS,
    hooks: RunHooks[TContext] | None = None,
    run_config: RunConfig | None = None,
) -> RunResult:
    """Run a workflow starting at the given agent. The agent will run in a loop until a final
    output is generated. The loop runs like so:
    1. The agent is invoked with the given input.
    2. If there is a final output (i.e. the agent produces something of type
        `agent.output_type`, the loop terminates.
    3. If there's a handoff, we run the loop again, with the new agent.
    4. Else, we run tool calls (if any), and re-run the loop.

    In two cases, the agent may raise an exception:
    1. If the max_turns is exceeded, a MaxTurnsExceeded exception is raised.
    2. If a guardrail tripwire is triggered, a GuardrailTripwireTriggered exception is raised.

    Note that only the first agent's input guardrails are run.

    Args:
        starting_agent: The starting agent to run.
        input: The initial input to the agent. You can pass a single string for a user message,
            or a list of input items.
        context: The context to run the agent with.
        max_turns: The maximum number of turns to run the agent for. A turn is defined as one
            AI invocation (including any tool calls that might occur).
        hooks: An object that receives callbacks on various lifecycle events.
        run_config: Global settings for the entire agent run.

    Returns:
        A run result containing all the inputs, guardrail results and the output of the last
        agent. Agents may perform handoffs, so we don't know the specific type of the output.
    """
    if hooks is None:
        hooks = RunHooks[Any]()
    if run_config is None:
        run_config = RunConfig()

    tool_use_tracker = AgentToolUseTracker()

    with TraceCtxManager(
        workflow_name=run_config.workflow_name,
        trace_id=run_config.trace_id,
        group_id=run_config.group_id,
        metadata=run_config.trace_metadata,
        disabled=run_config.tracing_disabled,
    ):
        current_turn = 0
        original_input: str | list[TResponseInputItem] = copy.deepcopy(input)
        generated_items: list[RunItem] = []
        model_responses: list[ModelResponse] = []

        context_wrapper: RunContextWrapper[TContext] = RunContextWrapper(
            context=context,  # type: ignore
        )

        input_guardrail_results: list[InputGuardrailResult] = []

        current_span: Span[AgentSpanData] | None = None
        current_agent = starting_agent
        should_run_agent_start_hooks = True

        try:
            while True:
                # Start an agent span if we don't have one. This span is ended if the current
                # agent changes, or if the agent loop ends.
                if current_span is None:
                    handoff_names = [h.agent_name for h in cls._get_handoffs(current_agent)]
                    if output_schema := cls._get_output_schema(current_agent):
                        output_type_name = output_schema.output_type_name()
                    else:
                        output_type_name = "str"

                    current_span = agent_span(
                        name=current_agent.name,
                        handoffs=handoff_names,
                        output_type=output_type_name,
                    )
                    current_span.start(mark_as_current=True)

                    all_tools = await cls._get_all_tools(current_agent)
                    current_span.span_data.tools = [t.name for t in all_tools]

                current_turn += 1
                if current_turn > max_turns:
                    _error_tracing.attach_error_to_span(
                        current_span,
                        SpanError(
                            message="Max turns exceeded",
                            data={"max_turns": max_turns},
                        ),
                    )
                    raise MaxTurnsExceeded(f"Max turns ({max_turns}) exceeded")

                logger.debug(
                    f"Running agent {current_agent.name} (turn {current_turn})",
                )

                if current_turn == 1:
                    input_guardrail_results, turn_result = await asyncio.gather(
                        cls._run_input_guardrails(
                            starting_agent,
                            starting_agent.input_guardrails
                            + (run_config.input_guardrails or []),
                            copy.deepcopy(input),
                            context_wrapper,
                        ),
                        cls._run_single_turn(
                            agent=current_agent,
                            all_tools=all_tools,
                            original_input=original_input,
                            generated_items=generated_items,
                            hooks=hooks,
                            context_wrapper=context_wrapper,
                            run_config=run_config,
                            should_run_agent_start_hooks=should_run_agent_start_hooks,
                            tool_use_tracker=tool_use_tracker,
                        ),
                    )
                else:
                    turn_result = await cls._run_single_turn(
                        agent=current_agent,
                        all_tools=all_tools,
                        original_input=original_input,
                        generated_items=generated_items,
                        hooks=hooks,
                        context_wrapper=context_wrapper,
                        run_config=run_config,
                        should_run_agent_start_hooks=should_run_agent_start_hooks,
                        tool_use_tracker=tool_use_tracker,
                    )
                should_run_agent_start_hooks = False

                model_responses.append(turn_result.model_response)
                original_input = turn_result.original_input
                generated_items = turn_result.generated_items

                if isinstance(turn_result.next_step, NextStepFinalOutput):
                    output_guardrail_results = await cls._run_output_guardrails(
                        current_agent.output_guardrails + (run_config.output_guardrails or []),
                        current_agent,
                        turn_result.next_step.output,
                        context_wrapper,
                    )
                    return RunResult(
                        input=original_input,
                        new_items=generated_items,
                        raw_responses=model_responses,
                        final_output=turn_result.next_step.output,
                        _last_agent=current_agent,
                        input_guardrail_results=input_guardrail_results,
                        output_guardrail_results=output_guardrail_results,
                    )
                elif isinstance(turn_result.next_step, NextStepHandoff):
                    current_agent = cast(Agent[TContext], turn_result.next_step.new_agent)
                    current_span.finish(reset_current=True)
                    current_span = None
                    should_run_agent_start_hooks = True
                elif isinstance(turn_result.next_step, NextStepRunAgain):
                    pass
                else:
                    raise AgentsException(
                        f"Unknown next step type: {type(turn_result.next_step)}"
                    )
        finally:
            if current_span:
                current_span.finish(reset_current=True)

run_sync `classmethod`

run_sync(
    starting_agent: Agent[TContext],
    input: str | list[TResponseInputItem],
    *,
    context: TContext | None = None,
    max_turns: int = DEFAULT_MAX_TURNS,
    hooks: RunHooks[TContext] | None = None,
    run_config: RunConfig | None = None,
) -> RunResult

同步运行一个工作流，从给定的代理开始。请注意，这只是对run方法的封装，因此如果已经存在事件循环（例如在异步函数内部、Jupyter笔记本或FastAPI等异步上下文中），它将无法工作。对于这些情况，请改用run方法。

代理将在一个循环中运行，直到生成最终输出。循环的运行流程如下： 1. 使用给定的输入调用代理。 2. 如果有最终输出（即代理生成了类型为agent.output_type的内容），循环终止。 3. 如果有交接，我们将使用新的代理再次运行循环。 4. 否则，我们将运行工具调用（如果有的话），并重新运行循环。

在两种情况下，代理可能会抛出异常： 1. 如果超过max_turns限制，会抛出MaxTurnsExceeded异常。 2. 如果触发防护栏机制，会抛出GuardrailTripwireTriggered异常。

请注意，仅会运行第一个代理的输入防护机制。

参数:

名称	类型	描述	默认值
`starting_agent`	`Agent[TContext]`	要运行的起始代理。	required
`input`	`str \| list[TResponseInputItem]`	代理的初始输入。您可以传递单个字符串作为用户消息，或者传递一个输入项列表。	required
`context`	`TContext \| None`	运行代理程序的上下文环境。	`None`
`max_turns`	`int`	运行代理的最大轮次数。一轮定义为一次AI调用（包括可能发生的任何工具调用）。	`DEFAULT_MAX_TURNS`
`hooks`	`RunHooks[TContext] \| None`	一个接收各种生命周期事件回调的对象。	`None`
`run_config`	`RunConfig \| None`	整个代理运行的全局设置。	`None`

返回值：

类型	描述
`RunResult`	一个运行结果，包含所有输入、防护栏结果和最后一个的输出
`RunResult`	代理。代理可能会执行交接，因此我们不知道输出的具体类型。

Source code in src/agents/run.py

@classmethod
def run_sync(
    cls,
    starting_agent: Agent[TContext],
    input: str | list[TResponseInputItem],
    *,
    context: TContext | None = None,
    max_turns: int = DEFAULT_MAX_TURNS,
    hooks: RunHooks[TContext] | None = None,
    run_config: RunConfig | None = None,
) -> RunResult:
    """Run a workflow synchronously, starting at the given agent. Note that this just wraps the
    `run` method, so it will not work if there's already an event loop (e.g. inside an async
    function, or in a Jupyter notebook or async context like FastAPI). For those cases, use
    the `run` method instead.

    The agent will run in a loop until a final output is generated. The loop runs like so:
    1. The agent is invoked with the given input.
    2. If there is a final output (i.e. the agent produces something of type
        `agent.output_type`, the loop terminates.
    3. If there's a handoff, we run the loop again, with the new agent.
    4. Else, we run tool calls (if any), and re-run the loop.

    In two cases, the agent may raise an exception:
    1. If the max_turns is exceeded, a MaxTurnsExceeded exception is raised.
    2. If a guardrail tripwire is triggered, a GuardrailTripwireTriggered exception is raised.

    Note that only the first agent's input guardrails are run.

    Args:
        starting_agent: The starting agent to run.
        input: The initial input to the agent. You can pass a single string for a user message,
            or a list of input items.
        context: The context to run the agent with.
        max_turns: The maximum number of turns to run the agent for. A turn is defined as one
            AI invocation (including any tool calls that might occur).
        hooks: An object that receives callbacks on various lifecycle events.
        run_config: Global settings for the entire agent run.

    Returns:
        A run result containing all the inputs, guardrail results and the output of the last
        agent. Agents may perform handoffs, so we don't know the specific type of the output.
    """
    return asyncio.get_event_loop().run_until_complete(
        cls.run(
            starting_agent,
            input,
            context=context,
            max_turns=max_turns,
            hooks=hooks,
            run_config=run_config,
        )
    )

run_streamed `classmethod`

run_streamed(
    starting_agent: Agent[TContext],
    input: str | list[TResponseInputItem],
    context: TContext | None = None,
    max_turns: int = DEFAULT_MAX_TURNS,
    hooks: RunHooks[TContext] | None = None,
    run_config: RunConfig | None = None,
) -> RunResultStreaming

以流式模式从指定代理开始运行工作流。返回的结果对象包含一个方法，可用于在语义事件生成时进行流式传输。

代理将循环运行直到生成最终输出。循环流程如下： 1. 使用给定输入调用代理。 2. 如果存在最终输出（即代理产生了agent.output_type类型的结果），则循环终止。 3. 如果存在交接，我们将使用新代理再次运行循环。 4. 否则，我们将运行工具调用（如果有），并重新运行循环。

在两种情况下，代理可能会抛出异常： 1. 如果超过max_turns限制，会抛出MaxTurnsExceeded异常。 2. 如果触发防护栏机制，会抛出GuardrailTripwireTriggered异常。

请注意，仅会运行第一个代理的输入防护机制。

参数:

名称	类型	描述	默认值
`starting_agent`	`Agent[TContext]`	要运行的起始代理。	required
`input`	`str \| list[TResponseInputItem]`	代理的初始输入。您可以传递单个字符串作为用户消息，或者传递一个输入项列表。	required
`context`	`TContext \| None`	运行代理程序的上下文环境。	`None`
`max_turns`	`int`	运行代理的最大轮次数。一轮定义为一次AI调用（包括可能发生的任何工具调用）。	`DEFAULT_MAX_TURNS`
`hooks`	`RunHooks[TContext] \| None`	一个接收各种生命周期事件回调的对象。	`None`
`run_config`	`RunConfig \| None`	整个代理运行的全局设置。	`None`

返回值：

类型	描述
`RunResultStreaming`	一个包含运行数据的结果对象，以及一个用于流式传输事件的方法。

Source code in src/agents/run.py

@classmethod
def run_streamed(
    cls,
    starting_agent: Agent[TContext],
    input: str | list[TResponseInputItem],
    context: TContext | None = None,
    max_turns: int = DEFAULT_MAX_TURNS,
    hooks: RunHooks[TContext] | None = None,
    run_config: RunConfig | None = None,
) -> RunResultStreaming:
    """Run a workflow starting at the given agent in streaming mode. The returned result object
    contains a method you can use to stream semantic events as they are generated.

    The agent will run in a loop until a final output is generated. The loop runs like so:
    1. The agent is invoked with the given input.
    2. If there is a final output (i.e. the agent produces something of type
        `agent.output_type`, the loop terminates.
    3. If there's a handoff, we run the loop again, with the new agent.
    4. Else, we run tool calls (if any), and re-run the loop.

    In two cases, the agent may raise an exception:
    1. If the max_turns is exceeded, a MaxTurnsExceeded exception is raised.
    2. If a guardrail tripwire is triggered, a GuardrailTripwireTriggered exception is raised.

    Note that only the first agent's input guardrails are run.

    Args:
        starting_agent: The starting agent to run.
        input: The initial input to the agent. You can pass a single string for a user message,
            or a list of input items.
        context: The context to run the agent with.
        max_turns: The maximum number of turns to run the agent for. A turn is defined as one
            AI invocation (including any tool calls that might occur).
        hooks: An object that receives callbacks on various lifecycle events.
        run_config: Global settings for the entire agent run.

    Returns:
        A result object that contains data about the run, as well as a method to stream events.
    """
    if hooks is None:
        hooks = RunHooks[Any]()
    if run_config is None:
        run_config = RunConfig()

    # If there's already a trace, we don't create a new one. In addition, we can't end the
    # trace here, because the actual work is done in `stream_events` and this method ends
    # before that.
    new_trace = (
        None
        if get_current_trace()
        else trace(
            workflow_name=run_config.workflow_name,
            trace_id=run_config.trace_id,
            group_id=run_config.group_id,
            metadata=run_config.trace_metadata,
            disabled=run_config.tracing_disabled,
        )
    )
    # Need to start the trace here, because the current trace contextvar is captured at
    # asyncio.create_task time
    if new_trace:
        new_trace.start(mark_as_current=True)

    output_schema = cls._get_output_schema(starting_agent)
    context_wrapper: RunContextWrapper[TContext] = RunContextWrapper(
        context=context  # type: ignore
    )

    streamed_result = RunResultStreaming(
        input=copy.deepcopy(input),
        new_items=[],
        current_agent=starting_agent,
        raw_responses=[],
        final_output=None,
        is_complete=False,
        current_turn=0,
        max_turns=max_turns,
        input_guardrail_results=[],
        output_guardrail_results=[],
        _current_agent_output_schema=output_schema,
        _trace=new_trace,
    )

    # Kick off the actual agent loop in the background and return the streamed result object.
    streamed_result._run_impl_task = asyncio.create_task(
        cls._run_streamed_impl(
            starting_input=input,
            streamed_result=streamed_result,
            starting_agent=starting_agent,
            max_turns=max_turns,
            hooks=hooks,
            context_wrapper=context_wrapper,
            run_config=run_config,
        )
    )
    return streamed_result

运行配置 `dataclass`

配置整个代理运行的设置。

Source code in src/agents/run.py

@dataclass
class RunConfig:
    """Configures settings for the entire agent run."""

    model: str | Model | None = None
    """The model to use for the entire agent run. If set, will override the model set on every
    agent. The model_provider passed in below must be able to resolve this model name.
    """

    model_provider: ModelProvider = field(default_factory=OpenAIProvider)
    """The model provider to use when looking up string model names. Defaults to OpenAI."""

    model_settings: ModelSettings | None = None
    """Configure global model settings. Any non-null values will override the agent-specific model
    settings.
    """

    handoff_input_filter: HandoffInputFilter | None = None
    """A global input filter to apply to all handoffs. If `Handoff.input_filter` is set, then that
    will take precedence. The input filter allows you to edit the inputs that are sent to the new
    agent. See the documentation in `Handoff.input_filter` for more details.
    """

    input_guardrails: list[InputGuardrail[Any]] | None = None
    """A list of input guardrails to run on the initial run input."""

    output_guardrails: list[OutputGuardrail[Any]] | None = None
    """A list of output guardrails to run on the final output of the run."""

    tracing_disabled: bool = False
    """Whether tracing is disabled for the agent run. If disabled, we will not trace the agent run.
    """

    trace_include_sensitive_data: bool = True
    """Whether we include potentially sensitive data (for example: inputs/outputs of tool calls or
    LLM generations) in traces. If False, we'll still create spans for these events, but the
    sensitive data will not be included.
    """

    workflow_name: str = "Agent workflow"
    """The name of the run, used for tracing. Should be a logical name for the run, like
    "Code generation workflow" or "Customer support agent".
    """

    trace_id: str | None = None
    """A custom trace ID to use for tracing. If not provided, we will generate a new trace ID."""

    group_id: str | None = None
    """
    A grouping identifier to use for tracing, to link multiple traces from the same conversation
    or process. For example, you might use a chat thread ID.
    """

    trace_metadata: dict[str, Any] | None = None
    """
    An optional dictionary of additional metadata to include with the trace.
    """

模型 `class-attribute` `instance-attribute`

model: str | Model | None = None

用于整个代理运行的模型。如果设置，将覆盖每个代理上设置的模型。下面传入的model_provider必须能够解析此模型名称。

model_provider `class-attribute` `instance-attribute`

model_provider: ModelProvider = field(
    default_factory=OpenAIProvider
)

在查找字符串模型名称时使用的模型提供者。默认为OpenAI。

模型设置 `class-attribute` `instance-attribute`

model_settings: ModelSettings | None = None

配置全局模型设置。任何非空值将覆盖特定于代理的模型设置。

handoff_input_filter `class-attribute` `instance-attribute`

handoff_input_filter: HandoffInputFilter | None = None

一个应用于所有交接的全局输入过滤器。如果设置了Handoff.input_filter，则该设置将优先生效。输入过滤器允许您编辑发送给新代理的输入内容。更多详情请参阅Handoff.input_filter中的文档。

输入防护栏 `class-attribute` `instance-attribute`

input_guardrails: list[InputGuardrail[Any]] | None = None

在初始运行输入上运行的输入防护栏列表。

输出防护栏 `class-attribute` `instance-attribute`

output_guardrails: list[OutputGuardrail[Any]] | None = None

在运行最终输出上要执行的一系列输出防护措施列表。

tracing_disabled `class-attribute` `instance-attribute`

tracing_disabled: bool = False

是否禁用代理运行的追踪。如果禁用，我们将不会追踪代理运行。

trace_include_sensitive_data `class-attribute` `instance-attribute`

trace_include_sensitive_data: bool = True

是否在跟踪记录中包含可能敏感的数据（例如：工具调用的输入/输出或LLM生成的内容）。如果设为False，我们仍会为这些事件创建跨度，但敏感数据将不会被包含在内。

工作流名称 `class-attribute` `instance-attribute`

workflow_name: str = 'Agent workflow'

运行的名称，用于追踪。应该是一个逻辑上的运行名称，例如"代码生成工作流"或"客户支持代理"。

追踪ID `class-attribute` `instance-attribute`

trace_id: str | None = None

用于追踪的自定义跟踪ID。如果未提供，我们将生成一个新的跟踪ID。

群组ID `class-attribute` `instance-attribute`

group_id: str | None = None

用于追踪的分组标识符，可以将同一对话或进程中的多个追踪记录关联起来。例如，您可以使用聊天线程ID作为分组标识。

trace_metadata `class-attribute` `instance-attribute`

trace_metadata: dict[str, Any] | None = None

一个可选的字典，包含要随跟踪一起包含的额外元数据。

Runner

运行器

运行 async classmethod

run_sync classmethod

run_streamed classmethod

运行配置 dataclass

模型 class-attribute instance-attribute

model_provider class-attribute instance-attribute

模型设置 class-attribute instance-attribute

handoff_input_filter class-attribute instance-attribute

输入防护栏 class-attribute instance-attribute

输出防护栏 class-attribute instance-attribute

tracing_disabled class-attribute instance-attribute

trace_include_sensitive_data class-attribute instance-attribute

工作流名称 class-attribute instance-attribute

追踪ID class-attribute instance-attribute

群组ID class-attribute instance-attribute

trace_metadata class-attribute instance-attribute

`Runner`

运行 `async` `classmethod`

run_sync `classmethod`

run_streamed `classmethod`

运行配置 `dataclass`

模型 `class-attribute` `instance-attribute`

model_provider `class-attribute` `instance-attribute`

模型设置 `class-attribute` `instance-attribute`

handoff_input_filter `class-attribute` `instance-attribute`

输入防护栏 `class-attribute` `instance-attribute`

输出防护栏 `class-attribute` `instance-attribute`

tracing_disabled `class-attribute` `instance-attribute`

trace_include_sensitive_data `class-attribute` `instance-attribute`

工作流名称 `class-attribute` `instance-attribute`

追踪ID `class-attribute` `instance-attribute`

群组ID `class-attribute` `instance-attribute`

trace_metadata `class-attribute` `instance-attribute`