pub struct Evaluator { /* private fields */ }
Expand description
The main evaluator struct
Implementations§
Source§impl Evaluator
impl Evaluator
Source
pub fn new(config: EvaluationConfig) -> Self
pub fn new(config: EvaluationConfig) -> Self
Create a new evaluator with the given configuration
Source
pub fn with_llm_judge(
config: EvaluationConfig,
judge_model: Arc<dyn Llm>,
) -> Self
pub fn with_llm_judge( config: EvaluationConfig, judge_model: Arc<dyn Llm>, ) -> Self
Create an evaluator with an LLM judge for semantic matching and rubric evaluation
Source
pub fn set_llm_judge(&mut self, judge_model: Arc<dyn Llm>)
pub fn set_llm_judge(&mut self, judge_model: Arc<dyn Llm>)
Set the LLM judge model
Source
pub fn has_llm_judge(&self) -> bool
pub fn has_llm_judge(&self) -> bool
Check if LLM judge is available
Source
pub async fn evaluate_file(
&self,
agent: Arc<dyn Agent>,
path: impl AsRef<Path>,
) -> Result<EvaluationReport>
pub async fn evaluate_file( &self, agent: Arc<dyn Agent>, path: impl AsRef<Path>, ) -> Result<EvaluationReport>
Evaluate a test file against an agent
Source
pub async fn evaluate_test_file(
&self,
agent: Arc<dyn Agent>,
test_file: &TestFile,
) -> Result<EvaluationReport>
pub async fn evaluate_test_file( &self, agent: Arc<dyn Agent>, test_file: &TestFile, ) -> Result<EvaluationReport>
Evaluate a TestFile struct
Source
pub async fn evaluate_case(
&self,
agent: Arc<dyn Agent>,
eval_case: &EvalCase,
) -> Result<EvaluationResult>
pub async fn evaluate_case( &self, agent: Arc<dyn Agent>, eval_case: &EvalCase, ) -> Result<EvaluationResult>
Evaluate a single test case
Source
pub async fn evaluate_cases_parallel(
&self,
agent: Arc<dyn Agent>,
cases: &[EvalCase],
concurrency: usize,
) -> Vec<Result<EvaluationResult>> ⓘ
pub async fn evaluate_cases_parallel( &self, agent: Arc<dyn Agent>, cases: &[EvalCase], concurrency: usize, ) -> Vec<Result<EvaluationResult>> ⓘ
Evaluate multiple test cases in parallel
Source
pub async fn evaluate_directory(
&self,
agent: Arc<dyn Agent>,
dir: impl AsRef<Path>,
) -> Result<Vec<EvaluationReport>>
pub async fn evaluate_directory( &self, agent: Arc<dyn Agent>, dir: impl AsRef<Path>, ) -> Result<Vec<EvaluationReport>>
Evaluate a directory of test files
Trait Implementations§
Auto Trait Implementations§
impl Freeze for Evaluator
impl !RefUnwindSafe for Evaluator
impl Send for Evaluator
impl Sync for Evaluator
impl Unpin for Evaluator
impl UnsafeUnpin for Evaluator
impl !UnwindSafe for Evaluator
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more