1pub mod criteria;
50pub mod error;
51pub mod evaluator;
52pub mod llm_judge;
53pub mod report;
54pub mod schema;
55pub mod scoring;
56
57#[cfg(feature = "personas")]
58pub mod personas;
59
60pub mod optimizer;
61
62pub mod annotation;
64pub mod baseline;
65pub mod conversation_scorer;
66pub mod cost_tracker;
67pub mod pricing;
68pub mod structured_judge;
69pub mod test_generator;
70pub mod trace_analyzer;
71
72#[cfg(feature = "embedding")]
74pub mod embedding_scorer;
75
76#[cfg(feature = "ci-helpers")]
77pub mod junit_reporter;
78
79#[cfg(feature = "statistics")]
80pub mod ab_comparator;
81
82pub use criteria::{
84 EvaluationCriteria, ResponseMatchConfig, Rubric, RubricConfig, ToolTrajectoryConfig,
85};
86pub use error::{EvalError, Result};
87pub use evaluator::{EvaluationConfig, Evaluator};
88pub use llm_judge::{
89 LlmJudge, LlmJudgeConfig, RubricEvaluationResult, RubricScore, SemanticMatchResult,
90};
91pub use report::{EvaluationReport, EvaluationResult, Failure, TestCaseResult};
92pub use schema::{EvalCase, EvalSet, IntermediateData, SessionInput, TestFile, ToolUse, Turn};
93pub use scoring::{ResponseScorer, ToolTrajectoryScorer};
94
95pub use optimizer::{OptimizationResult, OptimizerConfig, PromptOptimizer};
97
98pub use annotation::{AnnotationRecord, AnnotationStore, HumanVerdict};
100pub use baseline::{Baseline, BaselineStore, Regression};
101pub use conversation_scorer::{ConversationMetrics, ConversationScorer, ConversationScorerConfig};
102pub use cost_tracker::{CostMetrics, CostTracker};
103pub use pricing::ModelPricing;
104pub use structured_judge::{
105 JudgeRubric, ScalePoint, StructuredJudge, StructuredJudgeConfig, StructuredVerdict, Verdict,
106};
107pub use test_generator::{EvalCaseMetadata, GeneratorConfig, TestGenerator};
108pub use trace_analyzer::{
109 ToolCallRecord, TraceAnalysis, TraceAnalyzer, TraceDiagnostic, TracePattern,
110};
111
112#[cfg(feature = "embedding")]
113pub use embedding_scorer::EmbeddingScorer;
114
115#[cfg(feature = "ci-helpers")]
116pub use junit_reporter::JunitReporter;
117
118#[cfg(feature = "statistics")]
119pub use ab_comparator::AbComparator;
120
121pub mod prelude {
123 pub use crate::criteria::{
124 EvaluationCriteria, ResponseMatchConfig, Rubric, RubricConfig, ToolTrajectoryConfig,
125 };
126 pub use crate::error::{EvalError, Result};
127 pub use crate::evaluator::{EvaluationConfig, Evaluator};
128 pub use crate::llm_judge::{
129 LlmJudge, LlmJudgeConfig, RubricEvaluationResult, SemanticMatchResult,
130 };
131 pub use crate::report::{EvaluationReport, EvaluationResult, Failure, TestCaseResult};
132 pub use crate::schema::{EvalCase, EvalSet, TestFile, ToolUse, Turn};
133}