From acc14047f0aa723a3d0b74b93ee74190f5b6b6c4 Mon Sep 17 00:00:00 2001 From: Corby Rosset Date: Thu, 23 Apr 2026 01:38:28 -0400 Subject: [PATCH] Remove TrajectoryDiagnosticsResult class Removed the TrajectoryDiagnosticsResult class and its attributes from data_point.py. --- .../src/webeval/rubric_agent/data_point.py | 27 ------------------- 1 file changed, 27 deletions(-) diff --git a/webeval/src/webeval/rubric_agent/data_point.py b/webeval/src/webeval/rubric_agent/data_point.py index 4cbe0d4..19f69a9 100644 --- a/webeval/src/webeval/rubric_agent/data_point.py +++ b/webeval/src/webeval/rubric_agent/data_point.py @@ -531,33 +531,6 @@ class MMRubricOutcomeResult(VerificationResult): primary_intent: str = "" -class TrajectoryDiagnosticsResult(VerificationResult): - """Structured result from trajectory diagnostics verification.""" - - result_type: Literal["trajectory_diagnostics"] = "trajectory_diagnostics" - # Efficiency - loops: List[Dict[str, Any]] = Field(default_factory=list) - unnecessary_actions: List[Dict[str, Any]] = Field(default_factory=list) - efficiency_rating: Optional[int] = None - efficiency_reasoning: str = "" - # Success - solver_self_judgement_of_success: Optional[bool] = None - solver_self_judgement_reasoning: str = "" - proxy_verifier_judgement_of_success: Optional[bool] = None - proxy_verifier_judgement_reasoning: str = "" - # Optimal plan - optimal_plan: List[str] = Field(default_factory=list) - optimal_plan_reasoning: str = "" - # Critical point (via CriticalPointComplianceAgent) - task_has_critical_point: Optional[bool] = None - critical_point_type: Optional[str] = None - critical_point_classification_reasoning: str = "" - critical_point_expected_behavior: List[str] = Field(default_factory=list) - agent_navigated_successfully: Optional[bool] = None - critical_point_reasoning: str = "" - # Critical point (via direct LLM call — backup) - critical_point_llm: Dict[str, Any] = Field(default_factory=dict) - class TaskAgentResult(VerificationResult): """Result from the unified task verification classification (Step 10).