Enum CrossEncoder

Source

pub enum CrossEncoder {
    Lexical {
        degraded: bool,
    },
    Neural {
        model: Arc<BertModel>,
        tokenizer: Arc<Tokenizer>,
        classifier_weight: Tensor,
        classifier_bias: Tensor,
        device: Device,
    },
}

Expand description

Cross-encoder for (query, document) relevance scoring.

Variants§

§

Lexical

Lightweight lexical cross-encoder using term overlap signals.

`degraded` is `true` when this variant exists because a configured neural cross-encoder failed to initialise (HF Hub unreachable, model checksum mismatch, etc.) and the runtime fell back to lexical scoring. It is `false` when lexical is the originally configured tier (the operator opted in to the keyword tier, or to the smart tier without cross-encoder reranking).

v0.7.0 R3-S2 — the distinction surfaces in the recall response’s `meta.reranker_used` field as "degraded_lexical" vs "lexical", giving clients (MCP + HTTP) an in-band signal when their reranker has been downgraded. The original G8 fix only emitted a `tracing::warn!`; closing G8 per the playbook required an in-response field, so the prior implementation's closure claim was overstated.

Fields

§degraded: bool

§

Neural

Neural BERT-based cross-encoder (ms-marco-MiniLM-L-6-v2).

v0.7.0 #1084 — model is Arc<BertModel> (no mutex), same pattern as Embedder::Local. The pre-#1084 design held an Arc<Mutex<BertModel>> and locked across the full neural rerank forward pass, serialising every rerank-tier recall on a single global mutex. Candle’s BertModel::forward takes &self (inference-only; weights are read-only) so the mutex was unnecessary.

Fields

§model: Arc<BertModel>

§tokenizer: Arc<Tokenizer>

§classifier_weight: Tensor

§classifier_bias: Tensor

§device: Device

Enum CrossEncoder

Variants§

Lexical

Fields

Neural

Fields

Implementations§

impl CrossEncoder

pub fn new() -> Self

pub fn new_neural() -> Self

pub fn score(&self, query: &str, title: &str, content: &str) -> f32

pub fn is_neural(&self) -> bool

pub fn is_degraded_lexical(&self) -> bool

pub fn rerank(&self, query: &str, candidates: Vec<(Memory, f64)>) -> Vec<(Memory, f64)>

pub fn rerank_with_reflection_boost(&self, query: &str, candidates: Vec<(Memory, f64)>, boost_config: &ReflectionBoostConfig) -> Vec<(Memory, f64)>

pub fn rerank_batch(&self, queries: Vec<(String, Vec<(Memory, f64)>)>) -> Vec<Vec<(Memory, f64)>>

pub fn rerank_batch_with_reflection_boost(&self, queries: Vec<(String, Vec<(Memory, f64)>)>, boost_config: &ReflectionBoostConfig) -> Vec<Vec<(Memory, f64)>>

Trait Implementations§

impl Default for CrossEncoder

fn default() -> Self

Auto Trait Implementations§

impl !RefUnwindSafe for CrossEncoder

impl !UnwindSafe for CrossEncoder

impl Freeze for CrossEncoder

impl Send for CrossEncoder

impl Sync for CrossEncoder

impl Unpin for CrossEncoder

impl UnsafeUnpin for CrossEncoder

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> ErasedDestructor for T where T: 'static,

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> PolicyExt for T where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P> where T: Sized + Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P> where T: Sized + Policy<B, E>, P: Policy<B, E>,

impl<T> Same for T

type Output = T

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Enum CrossEncoder

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> ErasedDestructor for T
where T: 'static,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,