Struct MemoryConfig

Source

pub struct MemoryConfig { // 66 fields
    pub compression_guidelines: CompressionGuidelinesConfig,
    pub sqlite_path: String,
    pub history_limit: u32,
    pub qdrant_url: String,
    pub qdrant_api_key: Option<Secret>,
    pub semantic: SemanticConfig,
    pub summarization_threshold: usize,
    pub summarization_llm_timeout_secs: u64,
    pub context_budget_tokens: usize,
    pub soft_compaction_threshold: f32,
    pub hard_compaction_threshold: f32,
    pub compaction_preserve_tail: usize,
    pub compaction_cooldown_turns: u8,
    pub auto_budget: bool,
    pub prune_protect_tokens: usize,
    pub cross_session_score_threshold: f32,
    pub vector_backend: VectorBackend,
    pub token_safety_margin: f32,
    pub redact_credentials: bool,
    pub autosave_assistant: bool,
    pub autosave_min_length: usize,
    pub tool_call_cutoff: usize,
    pub sqlite_pool_size: u32,
    pub sessions: SessionsConfig,
    pub documents: DocumentConfig,
    pub eviction: EvictionConfig,
    pub compression: CompressionConfig,
    pub sidequest: SidequestConfig,
    pub graph: GraphConfig,
    pub shutdown_summary: bool,
    pub shutdown_summary_min_messages: usize,
    pub shutdown_summary_max_messages: usize,
    pub shutdown_summary_timeout_secs: u64,
    pub shutdown_summary_provider: ProviderName,
    pub compaction_provider: ProviderName,
    pub structured_summaries: bool,
    pub tiers: TierConfig,
    pub admission: AdmissionConfig,
    pub digest: DigestConfig,
    pub context_strategy: ContextStrategy,
    pub crossover_turn_threshold: u32,
    pub consolidation: ConsolidationConfig,
    pub forgetting: ForgettingConfig,
    pub database_url: Option<String>,
    pub store_routing: StoreRoutingConfig,
    pub persona: PersonaConfig,
    pub trajectory: TrajectoryConfig,
    pub category: CategoryConfig,
    pub tree: TreeConfig,
    pub microcompact: MicrocompactConfig,
    pub autodream: AutoDreamConfig,
    pub key_facts_dedup_threshold: f32,
    pub compression_spectrum: CompressionSpectrumConfig,
    pub retrieval: RetrievalConfig,
    pub reasoning: ReasoningConfig,
    pub hebbian: HebbianConfig,
    pub memcot: MemCotConfig,
    pub retrieval_failures: RetrievalFailuresConfig,
    pub quality_gate: WriteQualityGateConfig,
    pub tiered_retrieval: TieredRetrievalConfig,
    pub optical_forgetting: OpticalForgettingConfig,
    pub em_graph: EmGraphConfig,
    pub episodic_consolidation: EpisodicConsolidationConfig,
    pub shadow_memory: TrajectoryRiskAccumulatorConfig,
    pub five_signal: FiveSignalConfig,
    pub fidelity: Option<FidelityConfig>,
}

Expand description

Memory subsystem configuration, nested under [memory] in TOML.

Controls SQLite and Qdrant storage, semantic recall, context compaction, multi-tier promotion, and all memory-related background tasks.

§Example (TOML)

[memory]
sqlite_path = "~/.local/share/zeph/data/zeph.db"
qdrant_url = "http://localhost:6334"
history_limit = 50
summarization_threshold = 50
auto_budget = true

Fields§

§compression_guidelines: CompressionGuidelinesConfig

§sqlite_path: String

§history_limit: u32

§qdrant_url: String

§qdrant_api_key: Option<Secret>

Optional API key for authenticating to a remote or managed Qdrant cluster.

Required when qdrant_url points to a non-localhost host (e.g. Qdrant Cloud). Leave None for local dev instances. The actual key is resolved from the vault: zeph vault set ZEPH_QDRANT_API_KEY "<key>".

The value is wrapped in Secret to prevent accidental logging. skip_serializing prevents the key from being written back to TOML on config save.

§semantic: SemanticConfig

§summarization_threshold: usize

§summarization_llm_timeout_secs: u64

LLM call timeout for summarization, in seconds. Default: 60.

§context_budget_tokens: usize

§soft_compaction_threshold: f32

§hard_compaction_threshold: f32

§compaction_preserve_tail: usize

§compaction_cooldown_turns: u8

§auto_budget: bool

§prune_protect_tokens: usize

§cross_session_score_threshold: f32

§vector_backend: VectorBackend

§token_safety_margin: f32

§redact_credentials: bool

§autosave_assistant: bool

§autosave_min_length: usize

§tool_call_cutoff: usize

§sqlite_pool_size: u32

§sessions: SessionsConfig

§documents: DocumentConfig

§eviction: EvictionConfig

§compression: CompressionConfig

§sidequest: SidequestConfig

§graph: GraphConfig

§shutdown_summary: bool

Store a lightweight session summary to the vector store on shutdown when no session summary exists yet for this conversation. Enables cross-session recall for short or interrupted sessions that never triggered hard compaction. Default: true.

§shutdown_summary_min_messages: usize

Minimum number of user-turn messages required before a shutdown summary is generated. Sessions below this threshold are considered trivial and skipped. Default: 4.

§shutdown_summary_max_messages: usize

Maximum number of recent messages (user + assistant) sent to the LLM for shutdown summarization. Caps token cost for long sessions that never triggered hard compaction. Default: 20.

§shutdown_summary_timeout_secs: u64

Per-attempt timeout in seconds for each LLM call during shutdown summarization. Applies independently to the structured call and to the plain-text fallback. Default: 10.

§shutdown_summary_provider: ProviderName

LLM provider used for shutdown summarization calls.

Accepts a provider name from [[llm.providers]]. When empty, falls back to the primary provider. Use a fast, cost-efficient model (e.g. "fast") to minimise shutdown latency.

Example:

[memory]
shutdown_summary_provider = "fast"

§compaction_provider: ProviderName

LLM provider used for deferred tool-pair summarization (context compaction).

Accepts a provider name from [[llm.providers]]. When empty, falls back to the primary provider. A mid-tier model is usually sufficient for compaction summaries.

Example:

[memory]
compaction_provider = "fast"

§structured_summaries: bool

Use structured anchored summaries for context compaction.

When enabled, hard compaction requests a JSON schema from the LLM instead of free-form prose. Falls back to prose if the LLM fails to produce valid JSON. Default: false.

§tiers: TierConfig

AOI three-layer memory tier promotion system.

When tiers.enabled = true, a background sweep promotes frequently-accessed episodic messages to a semantic tier by clustering near-duplicates and distilling via LLM.

§admission: AdmissionConfig

A-MAC adaptive memory admission control.

When admission.enabled = true, each message is evaluated before saving and rejected if its composite admission score falls below the configured threshold.

§digest: DigestConfig

Session digest generation at session end. Default: disabled.

§context_strategy: ContextStrategy

Context assembly strategy. Default: full_history (current behavior).

§crossover_turn_threshold: u32

Number of turns at which Adaptive strategy switches to MemoryFirst. Default: 20.

§consolidation: ConsolidationConfig

All-Mem lifelong memory consolidation sweep.

When consolidation.enabled = true, a background loop clusters semantically similar messages and merges them into consolidated entries via LLM.

§forgetting: ForgettingConfig

SleepGate forgetting sweep (#2397).

When forgetting.enabled = true, a background loop periodically decays importance scores and prunes memories below the forgetting floor.

§database_url: Option<String>

PostgreSQL connection URL.

Used when the binary is compiled with --features postgres. Can be overridden by the vault key ZEPH_DATABASE_URL. Example: `postgres://user:pass@localhost:5432/zeph`. Default: None (uses sqlite_path instead).

§store_routing: StoreRoutingConfig

Cost-sensitive store routing (#2444).

When store_routing.enabled = true, query intent is classified and routed to the cheapest sufficient backend instead of querying all stores on every turn.

§persona: PersonaConfig

Persona memory layer (#2461).

When persona.enabled = true, user preferences and domain knowledge are extracted from conversation history and injected into context after the system prompt.

§trajectory: TrajectoryConfig

Trajectory-informed memory (#2498).

§category: CategoryConfig

Category-aware memory (#2428).

§tree: TreeConfig

TiMem temporal-hierarchical memory tree (#2262).

§microcompact: MicrocompactConfig

Time-based microcompact (#2699).

When microcompact.enabled = true, stale low-value tool outputs are cleared from context when the session has been idle longer than gap_threshold_minutes.

§autodream: AutoDreamConfig

autoDream background memory consolidation (#2697).

When autodream.enabled = true, a constrained consolidation subagent runs after a session ends if both min_sessions and min_hours gates pass.

§key_facts_dedup_threshold: f32

Cosine similarity threshold for deduplicating key facts in zeph_key_facts (#2717).

Before inserting a new key fact, its nearest neighbour is looked up in the zeph_key_facts collection. If the best score is ≥ this threshold the fact is considered a near-duplicate and skipped. Set to a value greater than 1.0 (e.g. 2.0) to disable dedup entirely. Default: 0.95.

§compression_spectrum: CompressionSpectrumConfig

Experience compression spectrum (#3305).

Controls three-tier retrieval policy and background skill-promotion engine.

§retrieval: RetrievalConfig

MemMachine-inspired retrieval-stage tuning (#3340).

Controls ANN candidate depth, search-prompt formatting, and the shape of memory snippets injected into agent context. Separate from SemanticConfig because these knobs apply uniformly across graph, hybrid, and vector-only recall paths.

§Example (TOML)

[memory.retrieval]
depth = 40
search_prompt_template = ""
context_format = "structured"

§reasoning: ReasoningConfig

ReasoningBank: distilled reasoning strategy memory (#3342).

When reasoning.enabled = true, each completed agent turn is evaluated by a self-judge LLM call; successful and failed reasoning chains are compressed into short, generalizable strategy summaries stored in reasoning_strategies (SQLite) and a matching Qdrant collection. Top-k strategies are retrieved by embedding similarity at context-build time and injected before the LLM call.

§hebbian: HebbianConfig

Hebbian edge-weight reinforcement configuration (HL-F1/F2, #3344).

When hebbian.enabled = true, the weight of each graph_edges row is incremented by hebbian_lr every time that edge is traversed during a recall. Default: disabled.

§Example (TOML)

[memory.hebbian]
enabled = true
hebbian_lr = 0.1

§memcot: MemCotConfig

MemCoT rolling semantic state configuration (#3574).

When memcot.enabled = true, each completed assistant turn spawns a background distillation task that compresses the response into a short semantic state buffer. The buffer is prepended to graph recall queries so retrieval stays contextually relevant across long multi-turn sessions.

§Example (TOML)

[memory.memcot]
enabled = true
distill_provider = "fast"
min_assistant_chars = 200
max_distills_per_session = 50

§retrieval_failures: RetrievalFailuresConfig

OmniMem retrieval failure tracking (issue #3576).

When retrieval_failures.enabled = true, no-hit and low-confidence recall events are logged asynchronously to memory_retrieval_failures for closed-loop parameter tuning.

§Example (TOML)

[memory.retrieval_failures]
enabled = true
low_confidence_threshold = 0.3
retention_days = 90

§quality_gate: WriteQualityGateConfig

Write quality gate (#3629).

When quality_gate.enabled = true, each remember() call is scored and low-quality writes are rejected before persistence. Evaluated after A-MAC admission control.

§tiered_retrieval: TieredRetrievalConfig

MemFlow tiered intent-driven retrieval (issue #3712).

When tiered_retrieval.enabled = true, recall queries are classified by intent and dispatched to the cheapest sufficient tier (ProfileLookup → TargetedRetrieval → DeepReasoning) with optional validation and tier escalation.

§optical_forgetting: OpticalForgettingConfig

ScrapMem optical forgetting (issue #3713).

When optical_forgetting.enabled = true, a background sweep progressively compresses old messages: Full → Compressed → SummaryOnly, saving token budget in context assembly.

§em_graph: EmGraphConfig

EM-Graph episodic event extraction and causal linking (issue #3713).

When em_graph.enabled = true, episodic events are extracted from conversation turns and linked via causal relationships, enabling causal-chain retrieval.

§episodic_consolidation: EpisodicConsolidationConfig

Episodic-to-semantic consolidation daemon (issue #3799).

When episodic_consolidation.enabled = true, a background loop periodically sweeps mature episodic_events, extracts durable facts via LLM, deduplicates against existing key facts, and promotes them to the semantic tier in zeph_key_facts.

§shadow_memory: TrajectoryRiskAccumulatorConfig

MAGE shadow memory trajectory risk accumulator (spec 004-16).

Maintains a per-session rolling risk score fed by sanitizer audit signals. When shadow_memory.enabled = true, tool execution is gated if cumulative trajectory risk exceeds risk_threshold. When false, all code paths are zero-cost no-ops.

§Example (TOML)

[memory.shadow_memory]
enabled = true
risk_threshold = 0.75
risk_halflife_turns = 10

§five_signal: FiveSignalConfig

Five-signal SYNAPSE retrieval (issue #4374).

When five_signal.enabled = true, SYNAPSE recall weights five signals: recency, relevance, access frequency, causal distance, and novelty. All new signals default to weight 0.0, preserving exact backward compatibility.

§fidelity: Option<FidelityConfig>

Context-Adaptive Memory fidelity scoring (CAM Phase 1, #4547).

When fidelity.enabled = true, the heuristic fidelity scorer runs after each apply_prepared_context() call and assigns Full / Compressed / Placeholder levels to historical messages. Default: disabled.

§Example (TOML)

[memory.fidelity]
enabled = false
w_semantic = 0.3
w_temporal = 0.3
w_importance = 0.2
w_plan = 0.2
full_threshold = 0.7
compressed_threshold = 0.3
compressed_max_tokens = 50
regrade_threshold = 0.6
min_query_length = 8
max_scored_messages = 500

Struct MemoryConfig Copy item path

§Example (TOML)

Fields§

§Example (TOML)

§Example (TOML)

§Example (TOML)

§Example (TOML)

§Example (TOML)

§Example (TOML)

Trait Implementations§

impl Debug for MemoryConfig

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl<'de> Deserialize<'de> for MemoryConfig

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where __D: Deserializer<'de>,

impl Serialize for MemoryConfig

fn serialize<__S>(&self, __serializer: __S) -> Result<__S::Ok, __S::Error> where __S: Serializer,

Auto Trait Implementations§

impl Freeze for MemoryConfig

impl RefUnwindSafe for MemoryConfig

impl Send for MemoryConfig

impl Sync for MemoryConfig

impl Unpin for MemoryConfig

impl UnsafeUnpin for MemoryConfig

impl UnwindSafe for MemoryConfig

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> DeserializeOwned for T where T: for<'de> Deserialize<'de>,

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct MemoryConfig

fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where D: Deserializer<'de>,

fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
where S: Serializer,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> DeserializeOwned for T
where T: for<'de> Deserialize<'de>,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,