Struct FidelityConfig

Source

pub struct FidelityConfig {
    pub enabled: bool,
    pub w_semantic: f32,
    pub w_temporal: f32,
    pub w_importance: f32,
    pub w_plan: f32,
    pub full_threshold: f32,
    pub compressed_threshold: f32,
    pub compressed_max_tokens: usize,
    pub regrade_threshold: f32,
    pub min_query_length: usize,
    pub max_scored_messages: usize,
    pub exempt_tail_messages: usize,
    pub compress_provider: Option<ProviderName>,
    pub semantic_scoring_provider: Option<ProviderName>,
    pub lookahead_depth: u8,
    pub embed_concurrency: usize,
    pub max_embed_input_tokens: Option<usize>,
    pub max_compress_input_tokens: Option<usize>,
    pub embed_timeout_secs: u64,
    pub compress_timeout_secs: u64,
}

Expand description

Configuration for the heuristic fidelity scorer (CAM §8.1).

All weight fields must be positive. Weights are normalised at runtime by the sum of active weights (INV-05).

§Examples

use zeph_config::fidelity::FidelityConfig;

let cfg = FidelityConfig::default();
assert!(!cfg.enabled, "fidelity scoring is off by default");
assert!((cfg.w_semantic - 0.3).abs() < f32::EPSILON);

Fields§

§enabled: bool

Master switch. When false, no fidelity scoring occurs.

§w_semantic: f32

Cosine/keyword semantic relevance weight.

Previously named w_keyword in config — that name is still accepted for compatibility.

§w_temporal: f32

Recency weight.

§w_importance: f32

Role-based importance weight.

§w_plan: f32

Plan-hint relevance weight (active only when planned_tools is non-empty).

§full_threshold: f32

Score threshold above which a message retains Full fidelity.

§compressed_threshold: f32

Score threshold above which a message is Compressed (not Placeholder).

§compressed_max_tokens: usize

Maximum tokens kept when rendering a Compressed message.

§regrade_threshold: f32

Budget ratio at which AgeMem triggers a proactive regrade.

§min_query_length: usize

Minimum query length for semantic signal to be active.

§max_scored_messages: usize

Maximum number of messages scored per turn (performance cap).

§exempt_tail_messages: usize

Number of the newest messages exempt from scoring when the window exceeds max_scored_messages. These messages default to Full fidelity.

A value of 0 (the default) means no tail exemption beyond the hard max_scored_messages cap.

§compress_provider: Option<ProviderName>

LLM provider name (from [[llm.providers]]) used to summarize messages during Compressed rendering. When None, truncation is used instead.

§semantic_scoring_provider: Option<ProviderName>

Embedding provider name (from [[llm.providers]]) used for semantic similarity scoring. When None, keyword overlap is used instead.

§lookahead_depth: u8

Maximum BFS depth for PAACE lookahead hints derived from the orchestration DAG.

Controls how many steps ahead in the active task graph are converted to PlannedToolHint values and passed to FidelityScorer. 0 disables lookahead (returns an empty hint slice). Valid range: 0..=5.

§embed_concurrency: usize

Maximum number of concurrent provider.embed() calls during the cold-start pre-pass.

Controls the buffer_unordered(N) bound. Higher values reduce latency on cold starts at the cost of more concurrent API requests. Default is 32.

§max_embed_input_tokens: Option<usize>

Hard cap on message content length (in approximate tokens) fed to provider.embed().

When Some(n), message content is truncated to approximately n * 4 characters (at a valid UTF-8 char boundary) before the embed call. None means no cap.

§max_compress_input_tokens: Option<usize>

Hard cap on message content length (in approximate tokens) fed to the LLM compress call.

When Some(n), the input is truncated to approximately n * 4 characters before the compress call. None means no cap. Independent of the existing 2× cost guard.

§embed_timeout_secs: u64

Timeout in seconds for embed calls in fidelity scoring (default: 30).

Applies to both the query embed and each per-message embed in the pre-pass. Timed-out calls are skipped with a warn-level log; scoring falls back to keyword overlap.

§compress_timeout_secs: u64

Timeout in seconds for the LLM compress call in fidelity scoring (default: 30).

When the LLM compress call exceeds this limit it is cancelled and truncation is used as a fallback. Set higher if your compress provider has high cold-start latency.

Struct FidelityConfig

§Examples

Fields§

Implementations§

impl FidelityConfig

pub fn default_lookahead_depth() -> u8

pub fn validate(&self) -> Result<(), String>

§Errors

§Examples

Trait Implementations§

impl Clone for FidelityConfig

fn clone(&self) -> FidelityConfig

fn clone_from(&mut self, source: &Self)

impl Debug for FidelityConfig

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl Default for FidelityConfig

fn default() -> Self

impl<'de> Deserialize<'de> for FidelityConfig where FidelityConfig: Default,

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where __D: Deserializer<'de>,

impl Serialize for FidelityConfig

fn serialize<__S>(&self, __serializer: __S) -> Result<__S::Ok, __S::Error> where __S: Serializer,

Auto Trait Implementations§

impl Freeze for FidelityConfig

impl RefUnwindSafe for FidelityConfig

impl Send for FidelityConfig

impl Sync for FidelityConfig

impl Unpin for FidelityConfig

impl UnsafeUnpin for FidelityConfig

impl UnwindSafe for FidelityConfig

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> DeserializeOwned for T where T: for<'de> Deserialize<'de>,

impl<T> DynClone for T where T: Clone,

fn __clone_box(&self, _: Private) -> *mut ()

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct FidelityConfig

impl<'de> Deserialize<'de> for FidelityConfig
where FidelityConfig: Default,

fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where D: Deserializer<'de>,

fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
where S: Serializer,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T> DeserializeOwned for T
where T: for<'de> Deserialize<'de>,

impl<T> DynClone for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,