pub trait Benchmark: Send + Sync {
// Required methods
fn name(&self) -> &str;
fn generate_test_data(&self) -> RragResult<EvaluationData>;
fn evaluate_benchmark(
&self,
system_responses: &[SystemResponse],
) -> RragResult<BenchmarkResult>;
fn get_config(&self) -> BenchmarkConfig;
}
Trait for evaluation benchmarks
Required Methods
fn generate_test_data(&self) -> RragResult<EvaluationData>
Generate test queries and ground truth
fn evaluate_benchmark(&self, system_responses: &[SystemResponse]) -> RragResult<BenchmarkResult>
Evaluate system against this benchmark
fn get_config(&self) -> BenchmarkConfig
Get benchmark configuration