Source code for agent_inspect.models.tools.analysis_models

from dataclasses import dataclass

from agent_inspect.models.metrics.validation_result import SubGoalValidationResult
from typing import List, Dict, Optional


[docs]
@dataclass
class ErrorAnalysisDataSample:
    """
    One data sample, bundled with the subgoal validations recorded for it,
    used as an input record for error analysis.
    """

    data_sample_id: int
    """Unique id of this data sample; the final error-analysis results refer back to it."""

    subgoal_validations: List[SubGoalValidationResult]
    """Ordered subgoal validation results on which error analysis is performed."""

    agent_run_id: Optional[int] = None
    """Unique id of the agent run associated with this data sample (defaults to ``None``)."""

    

[docs]
@dataclass
class StatisticAnalysisResult:
    """
    Statistical analysis outcome for one data sample.
    """

    data_sample_id: int
    """Unique id of the data sample this statistic analysis result corresponds to."""

    subgoal_validations: List[SubGoalValidationResult]
    """Subgoal validation results of the data sample that this result covers."""

    judge_expectation: Optional[float] = None
    """Expectation (mean) of the judge scores over all subgoals of the data sample, once computed."""

    judge_std: Optional[float] = None
    """Standard deviation of the judge scores over all subgoals of the data sample, once computed."""

    agent_run_id: Optional[int] = None
    """Unique id of the agent run associated with this data sample (defaults to ``None``)."""



[docs]
@dataclass
class AnalyzedSubgoalValidation:
    """
    Error analysis result for a single subgoal validation within a data sample.
    """

    subgoal_validation: SubGoalValidationResult
    """
    The subgoal validation result being analyzed.
    """
    data_sample_id: int
    """
    The unique identifier of the data sample that this result's subgoal validation originates from.
    """
    # Defaults to None like every other Optional field in this module, so an
    # entry without an identified error can be built without passing it explicitly.
    base_error: Optional[str] = None
    """
    A description of the identified error in the subgoal validation.
    ``None`` (the default) when no error description is attached.
    """
    agent_run_id: Optional[int] = None
    """
    Unique identifier for the agent run associated with this data sample.
    """

    

[docs]
@dataclass
class ErrorAnalysisResult:
    """
    Aggregate error analysis outcome over a set of data samples.
    """

    analyzed_validations_clustered_by_errors: Dict[
        str, List[AnalyzedSubgoalValidation]
    ]
    """Maps each generalized error to the analyzed subgoal validations that exhibit it."""

    completed_subgoal_validations: List[AnalyzedSubgoalValidation]
    """Analyzed subgoal validations that were marked completed and so have no associated errors."""