Struct BenchmarkScore

Source

/// A score on a public benchmark from a published source (model card, paper,
/// leaderboard).
///
/// Benchmark names are free-form strings rather than an enum, so new
/// benchmarks can be recorded without a code change. Scores are stored on a
/// 0.0–1.0 scale (e.g. 73.5% accuracy is stored as 0.735).
pub struct BenchmarkScore {
    /// Benchmark name as published (e.g. "MMLU-Pro", "GPQA-Diamond").
    pub name: String,
    /// Score on a 0.0–1.0 scale.
    pub score: f64,
    /// Evaluation harness or setup label (e.g. "5-shot", "0-shot CoT",
    /// "agentic", "pass@1"). Optional but strongly recommended: the same
    /// benchmark name can mean different things under different harnesses.
    pub harness: Option<String>,
    /// Where the score came from (model card URL, paper, leaderboard
    /// snapshot). Optional.
    pub source_url: Option<String>,
    /// ISO 8601 date of the score snapshot (e.g. "2025-08-12"), so downstream
    /// code can judge how stale a number is. Optional.
    pub measured_at: Option<String>,
}

Expand description

A score on a public benchmark from a published source (model card, paper, leaderboard). The schema is deliberately permissive — no enum of benchmark names — so the catalog can carry whichever benchmarks the upstream provider chose to publish, and new ones can be added without a code change. Scores are stored on a 0.0–1.0 scale (e.g. 73.5% accuracy → 0.735) so they compare cleanly across benchmarks and so routing_ext::apply_benchmark_priors can consume them directly when wired in later.

Fields§

§name: String

Benchmark name as published (e.g., “MMLU-Pro”, “GPQA-Diamond”, “SWE-bench-Verified”, “HumanEval”, “MATH”).

§score: f64

Score on a 0.0–1.0 scale.

§harness: Option<String>

Evaluation harness or setup label (e.g., “5-shot”, “0-shot CoT”, “agentic”, “pass@1”). Optional but strongly recommended — the same benchmark name can mean different things under different harnesses.

§source_url: Option<String>

Where the score came from (model card URL, paper, leaderboard snapshot). `None` when the source is the upstream provider’s announcement and a stable URL is not yet known.

§measured_at: Option<String>

ISO 8601 date of the score snapshot (e.g., “2025-08-12”). Lets downstream code judge how stale a number is.

BenchmarkScore

Struct BenchmarkScore Copy item path

Fields§

Trait Implementations§

impl Clone for BenchmarkScore

fn clone(&self) -> BenchmarkScore

fn clone_from(&mut self, source: &Self)

impl Debug for BenchmarkScore

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl<'de> Deserialize<'de> for BenchmarkScore

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where __D: Deserializer<'de>,

impl Serialize for BenchmarkScore

fn serialize<__S>(&self, __serializer: __S) -> Result<__S::Ok, __S::Error> where __S: Serializer,

Auto Trait Implementations§

impl Freeze for BenchmarkScore

impl RefUnwindSafe for BenchmarkScore

impl Send for BenchmarkScore

impl Sync for BenchmarkScore

impl Unpin for BenchmarkScore

impl UnsafeUnpin for BenchmarkScore

impl UnwindSafe for BenchmarkScore

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> PolicyExt for T where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P> where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P> where T: Policy<B, E>, P: Policy<B, E>,

impl<T> Same for T

type Output = T

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

impl<T> DeserializeOwned for T where T: for<'de> Deserialize<'de>,

impl<T> ErasedDestructor for T where T: 'static,

Struct BenchmarkScore

fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where D: Deserializer<'de>,

fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
where S: Serializer,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

impl<T> DeserializeOwned for T
where T: for<'de> Deserialize<'de>,

impl<T> ErasedDestructor for T
where T: 'static,