pub struct ReasoningEvalSummary {
pub num_benchmarks: usize,
pub accuracy: HashMap<String, f64>,
pub improvement: HashMap<String, f64>,
pub self_consistency: f64,
pub calibration_ece: f64,
pub thinktool_scores: HashMap<String, f64>,
/* private fields */
}
Expand description
Summary of reasoning evaluation
Fields§
num_benchmarks: usize
accuracy: HashMap<String, f64> — Accuracy per benchmark
improvement: HashMap<String, f64> — Improvement over baseline per benchmark
self_consistency: f64 — Self-consistency rate
calibration_ece: f64 — Expected Calibration Error
thinktool_scores: HashMap<String, f64> — ThinkTool effectiveness scores
Implementations§
Source§impl ReasoningEvalSummary
impl ReasoningEvalSummary
pub fn new(benchmarks: &[String]) -> Self
Source§pub fn check_targets(&self, targets: &ReasoningTargets) -> TargetResult
pub fn check_targets(&self, targets: &ReasoningTargets) -> TargetResult
Check if reasoning targets are met
Trait Implementations§
Source§impl Clone for ReasoningEvalSummary
impl Clone for ReasoningEvalSummary
Source§fn clone(&self) -> ReasoningEvalSummary
fn clone(&self) -> ReasoningEvalSummary
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from `source`. Read more
Auto Trait Implementations§
impl Freeze for ReasoningEvalSummary
impl RefUnwindSafe for ReasoningEvalSummary
impl Send for ReasoningEvalSummary
impl Sync for ReasoningEvalSummary
impl Unpin for ReasoningEvalSummary
impl UnwindSafe for ReasoningEvalSummary
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
    T: ?Sized,
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for T
where
    T: Clone,
impl<T> CloneToUninit for T
where
    T: Clone,
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts `self` into a `Left` variant of `Either<Self, Self>` if `into_left` is `true`.
Converts `self` into a `Right` variant of `Either<Self, Self>` otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts `self` into a `Left` variant of `Either<Self, Self>` if `into_left(&self)` returns `true`.
Converts `self` into a `Right` variant of `Either<Self, Self>` otherwise. Read more