atomr-agents-eval 0.11.0

Eval suites + regression detection + deterministic event-stream replay.
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
//! Eval suites + replay-based regression detection.
//!
//! The submodules declared in this file are private; the items intended for
//! callers are re-exported below, so they can be imported directly from this
//! module without naming the submodule they are defined in.

// Implementation submodules. None of them is declared `pub`; what they expose
// to callers is limited to the names listed in the `pub use` lines below.
mod annotation;
mod judge;
mod pairwise;
mod regression;
mod scorer;
mod suite;

// Public re-exports: one `pub use` per submodule, in the same order as the
// `mod` declarations above.
// NOTE(review): the definitions of these items are not visible in this file;
// see each submodule for what the individual types and traits do.
pub use annotation::{AnnotationItem, AnnotationQueue, InMemoryAnnotationQueue, Verdict};
pub use judge::{JudgeModel, LlmJudgeScorer, RubricCriterion, RubricScorer};
pub use pairwise::{PairwiseChoice, PairwiseScorer};
pub use regression::{RegressionGate, RegressionResult};
pub use scorer::{AsyncScorer, Scorer, ScorerOutcome};
pub use suite::{EvalCase, EvalResult, EvalRun, EvalSuite};