Source code for agent_inspect.metrics.adapters.tau2bench_adapter

from typing import List, Dict, Any, Optional, Tuple

from agent_inspect.metrics.adapters.base_adapter import BaseAdapter
from agent_inspect.models.metrics.agent_trace import AgentDialogueTrace, TurnTrace, Step, AgentResponse
from agent_inspect.models.metrics.agent_data_sample import ToolInputParameter



[docs]
class Tau2BenchAdapter(BaseAdapter):
    """
    Adapter for converting tau2bench conversation format to AgentDialogueTrace format.

    The input is a list of turns, each turn being a list of message dicts. Messages are
    dispatched on their ``"role"`` value: ``"user"`` supplies the turn input, ``"agent"``
    supplies the response text (``"content"``) and any ``"tool_calls"``, and ``"tool"``
    supplies tool outputs that are matched to calls through ``"tool_id"``. Turns for which
    no user input is found are omitted from the resulting trace.
    """


[docs]
    def convert_to_agent_trace(self, conversation_data: List[Dict[str, Any]]) -> AgentDialogueTrace:
        """
        Build an AgentDialogueTrace from a tau2bench conversation.

        Each entry of ``conversation_data`` is passed to ``_process_turn`` together with its
        position in the list. Entries for which that call yields a falsy result are left out;
        the remaining turns keep the index-based IDs of their original positions.

        :param conversation_data: List of conversation turns, each containing role-based messages.
        :return: Agent trace holding the converted turns in their original order.
        """
        candidates = (
            self._process_turn(messages, position)
            for position, messages in enumerate(conversation_data)
        )
        # Falsy results mean the turn had no user input, so it is dropped.
        kept_turns = [trace for trace in candidates if trace]
        return AgentDialogueTrace(turns=kept_turns)


    def _process_turn(self, turn_messages: List[Dict[str, Any]], turn_idx: int) -> Optional[TurnTrace]:
        """
        Process a single conversation turn into a TurnTrace.

        :param turn_messages: List of messages in this turn
        :param turn_idx: Index of this turn
        :return: TurnTrace object or None if no user input found
        """
        user_input = self._extract_user_input(turn_messages)
        if user_input is None:
            return None

        agent_response, steps = self._process_agent_messages(turn_messages, turn_idx)

        return TurnTrace(
            id=f"turn_{turn_idx}",
            agent_input=user_input,
            agent_response=agent_response,
            from_id=f"turn_{turn_idx - 1}" if turn_idx > 0 else None,
            steps=steps,
            latency_in_ms=None
        )

    def _extract_user_input(self, turn_messages: List[Dict[str, Any]]) -> Optional[str]:
        """
        Extract user input from turn messages.

        :param turn_messages: List of messages in the turn
        :return: User input content or None
        """
        for message in turn_messages:
            if message.get("role") == "user":
                return message.get("content")
        return None

    def _process_agent_messages(self, turn_messages: List[Dict[str, Any]], turn_idx: int) -> Tuple[
        Optional[AgentResponse], List[Step]]:
        """
        Process agent messages to extract response and tool steps.

        :param turn_messages: List of messages in the turn
        :param turn_idx: Index of this turn
        :return: Tuple of (agent_response, steps)
        """
        agent_response = None
        steps = []

        for message in turn_messages:
            if message.get("role") == "agent":
                # Process tool calls first
                tool_calls = message.get("tool_calls", [])
                if tool_calls:
                    new_steps = self._process_tool_calls(tool_calls, turn_messages, turn_idx, len(steps))
                    steps.extend(new_steps)

                # Process agent response content
                content = message.get("content")
                if content:
                    agent_response = AgentResponse(response=content, status_code="200")

        return agent_response, steps

    def _process_tool_calls(self, tool_calls: List[Dict[str, Any]], turn_messages: List[Dict[str, Any]],
                            turn_idx: int, step_offset: int) -> List[Step]:
        """
        Process tool calls into Step objects.

        :param tool_calls: List of tool call dictionaries
        :param turn_messages: All messages in the turn (to find tool responses)
        :param turn_idx: Index of the current turn
        :param step_offset: Current number of steps (for sequential numbering)
        :return: List of Step objects
        """
        steps = []

        for step_idx, tool_call in enumerate(tool_calls):
            tool_input_args = self._parse_tool_arguments(tool_call.get("arguments", {}))
            tool_output = self._find_tool_output(tool_call.get("id"), turn_messages)
            parent_ids = self._get_parent_ids(step_offset + step_idx, turn_idx, step_offset)

            step = Step(
                id=f"turn_{turn_idx}_step_{step_offset + step_idx}",
                parent_ids=parent_ids,
                tool=tool_call.get("name"),
                tool_input_args=tool_input_args,
                tool_output=tool_output,
                agent_thought=None,
                input_token_consumption=None,
                output_token_consumption=None,
                reasoning_token_consumption=None
            )
            steps.append(step)

        return steps

    def _parse_tool_arguments(self, arguments: Dict[str, Any]) -> List[ToolInputParameter]:
        """
        Parse tool call arguments into ToolInputParameter objects.

        :param arguments: Dictionary of tool arguments
        :return: List of ToolInputParameter objects
        """
        tool_input_args = []
        for key, value in arguments.items():
            tool_input_args.append(ToolInputParameter(name=key, value=value))
        return tool_input_args

    def _find_tool_output(self, tool_call_id: str, turn_messages: List[Dict[str, Any]]) -> Optional[str]:
        """
        Find the tool output for a given tool call ID.

        :param tool_call_id: ID of the tool call
        :param turn_messages: All messages in the turn
        :return: Tool output content or None
        """
        for message in turn_messages:
            if (message.get("role") == "tool" and
                    message.get("tool_id") == tool_call_id):
                return message.get("content")
        return None

    def _get_parent_ids(self, current_step_idx: int, turn_idx: int, step_offset: int) -> List[str]:
        """
        Get parent IDs for the current step.

        :param current_step_idx: Index of current step within the turn
        :param turn_idx: Index of the current turn
        :param step_offset: Offset for step numbering
        :return: List of parent step IDs
        """
        if current_step_idx > 0:
            return [f"turn_{turn_idx}_step_{step_offset + current_step_idx - 1}"]
        return []