ras-judge 4.2.0

Judge eval for agent traces
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
use serde::{Deserialize, Serialize};

/// Outcome category attached to a [`JudgementResult`].
///
/// The `rename_all = "snake_case"` attribute makes serde read and write each
/// variant under its snake_case name: `success`, `partial_success`,
/// `failure`, and `inconclusive`.
///
/// NOTE(review): the criteria that separate one variant from another are not
/// defined in this file; the per-variant notes below are inferred from the
/// names alone and should be confirmed against the judging logic.
#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum Verdict {
    /// Serialized as `success`. Presumably a fully met objective; confirm.
    Success,
    /// Serialized as `partial_success`. Presumably an objective met only in
    /// part; confirm.
    PartialSuccess,
    /// Serialized as `failure`. Presumably an objective that was not met;
    /// confirm.
    Failure,
    /// Serialized as `inconclusive`. Presumably used when no other verdict
    /// could be determined; confirm.
    Inconclusive,
}

/// A [`Verdict`] bundled with the details recorded alongside it.
///
/// The type derives serde's `Serialize` and `Deserialize` with no rename
/// attributes, so every field is (de)serialized under its Rust field name.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct JudgementResult {
    /// The outcome category for this judgement.
    pub verdict: Verdict,
    /// Free-form text accompanying the verdict; presumably the judge's
    /// explanation of it (format and length are not constrained here).
    pub reasoning: String,
    /// Confidence score for the verdict.
    ///
    /// NOTE(review): the valid range is not enforced or stated in this file;
    /// presumably 0.0..=1.0. Confirm with the producer of this value.
    pub confidence: f32,
    /// Numeric step identifiers singled out by the judgement.
    ///
    /// NOTE(review): presumably indices into the judged trace; whether they
    /// are zero- or one-based, sorted, or de-duplicated is not visible here.
    pub flagged_steps: Vec<u32>,
}