pub type TestCaseResult = EvaluationResult;

Result for a single test case (alias for backward compatibility).
Aliased Type
pub struct TestCaseResult {
pub eval_id: String,
pub passed: bool,
pub scores: HashMap<String, f64>,
pub failures: Vec<Failure>,
pub duration: Duration,
pub turn_results: Vec<TurnResult>,
}

Fields
eval_id: String — Test case identifier
passed: bool — Whether the test passed all criteria
scores: HashMap<String, f64> — Scores for each criterion
failures: Vec<Failure> — Failures (criteria that didn’t meet threshold)
duration: Duration — Execution duration
turn_results: Vec<TurnResult> — Detailed turn results