Skip to main content

zeph_memory/
lib.rs

1// SPDX-FileCopyrightText: 2026 Andrei G <bug-ops>
2// SPDX-License-Identifier: MIT OR Apache-2.0
3
4//! Semantic memory layer for the Zeph agent.
5//!
6//! `zeph-memory` implements a two-backend hybrid memory system:
7//!
8//! - **[`store::DbStore`]** (`SqliteStore`) — relational persistence for messages, summaries,
9//!   persona facts, trajectory entries, and session metadata.
10//! - **[`embedding_store::EmbeddingStore`]** — Qdrant-backed vector index for semantic recall.
11//!   Falls back gracefully to [`db_vector_store::DbVectorStore`] when Qdrant is unavailable.
12//!
13//! The high-level entry point is [`semantic::SemanticMemory`], which combines both backends
14//! and exposes `remember` / `recall` / `summarize` operations consumed by `zeph-core`.
15//!
16//! # Architecture overview
17//!
18//! ```text
19//! SemanticMemory
20//! ├── SqliteStore  ── messages, summaries, corrections, persona, trajectory …
21//! └── EmbeddingStore ── Qdrant (primary) / DbVectorStore (fallback)
22//!         └── QdrantOps  ── thin gRPC wrapper over qdrant-client
23//! ```
24//!
25//! # Memory tiers
26//!
27//! Messages are classified into four tiers (see [`types::MemoryTier`]):
28//!
29//! | Tier | Description |
30//! |------|-------------|
31//! | `Working` | Current context window; never persisted. |
32//! | `Episodic` | Per-session messages stored in `SQLite`. |
33//! | `Semantic` | Cross-session distilled facts promoted from episodic. |
34//! | `Persona` | Long-lived user attributes (preferences, domain knowledge). |
35//!
36//! # Admission control
37//!
38//! Each `remember()` call is gated by [`admission::AdmissionControl`] (A-MAC, #2317), which
39//! evaluates five factors (future utility, factual confidence, semantic novelty, temporal
40//! recency, content-type prior) and rejects low-value messages before they reach the DB.
41//!
42//! # Memory routing
43//!
44//! [`router::HybridRouter`] classifies each recall query and dispatches to the appropriate
45//! backend: keyword (`SQLite` FTS5), semantic (Qdrant), graph (BFS traversal), episodic
46//! (timestamp-filtered FTS5), or hybrid (reciprocal-rank fusion of keyword + semantic).
47//!
48//! # Background loops
49//!
50//! Several background tasks maintain memory health:
51//!
52//! - [`eviction::start_eviction_loop`] — Ebbinghaus-curve eviction.
53//! - [`forgetting::start_forgetting_loop`] — `SleepGate` importance downscaling.
54//! - [`consolidation::start_consolidation_loop`] — cross-session fact merging.
55//! - [`tiers::start_tier_promotion_loop`] — Episodic → Semantic promotion.
56//! - [`semantic::start_tree_consolidation_loop`] — hierarchical note consolidation.
57//!
58//! # Feature flags
59//!
60//! | Feature | Description |
61//! |---------|-------------|
62//! | `sqlite` (default) | Enable `SQLite` persistence via `zeph-db`. |
63//! | `pdf` | Enable `PdfLoader` for PDF ingestion. |
64//! | `postgres` | Enable `PostgreSQL` support via `zeph-db`. |
65
66pub mod admission;
67pub mod admission_rl;
68pub mod anchored_summary;
69pub mod compaction_probe;
70pub mod compression_guidelines;
71pub mod compression_predictor;
72pub mod consolidation;
73pub mod document;
74pub mod facade;
75pub mod forgetting;
76pub mod scenes;
77pub mod tiers;
78
79pub mod db_vector_store;
80pub mod embedding_registry;
81pub mod embedding_store;
82pub mod error;
83pub mod eviction;
84pub mod graph;
85pub mod in_memory_store;
86pub mod qdrant_ops;
87pub mod response_cache;
88pub mod router;
89pub mod semantic;
90pub mod snapshot;
91pub mod store;
92pub mod testing;
93pub mod token_counter;
94pub mod types;
95pub mod vector_store;
96
97pub use admission::{
98    AdmissionControl, AdmissionDecision, AdmissionFactors, AdmissionRejected, AdmissionWeights,
99    GoalGateConfig, compute_content_type_prior, compute_factual_confidence, log_admission_decision,
100};
101pub use anchored_summary::AnchoredSummary;
102pub use compaction_probe::{
103    CategoryScore, CompactionProbeConfig, CompactionProbeResult, ProbeCategory, ProbeQuestion,
104    ProbeVerdict, answer_probe_questions, generate_probe_questions, score_answers,
105    validate_compaction,
106};
107pub use compression_guidelines::CompressionGuidelinesConfig;
108pub use compression_guidelines::{
109    build_guidelines_update_prompt, sanitize_guidelines, start_guidelines_updater,
110    truncate_to_token_budget, update_guidelines_once,
111};
112pub use compression_predictor::{
113    CompressionFeatures, CompressionModelWeights, CompressionPredictor,
114};
115pub use consolidation::{
116    ConsolidationConfig, ConsolidationResult, TopologyOp, run_consolidation_sweep,
117    start_consolidation_loop,
118};
119#[cfg(feature = "pdf")]
120pub use document::PdfLoader;
121pub use document::{
122    Chunk, Document, DocumentError, DocumentLoader, DocumentMetadata, IngestionPipeline,
123    SplitterConfig, TextLoader, TextSplitter,
124};
125pub use embedding_registry::{
126    EmbedFuture, Embeddable, EmbeddingRegistry, EmbeddingRegistryError, SyncStats,
127};
128pub use embedding_store::ensure_qdrant_collection;
129pub use error::MemoryError;
130pub use eviction::{EbbinghausPolicy, EvictionConfig, EvictionPolicy, start_eviction_loop};
131pub use facade::{
132    CompactionContext, CompactionResult, InMemoryFacade, MemoryEntry, MemoryFacade, MemoryMatch,
133    MemorySource,
134};
135pub use forgetting::{ForgettingConfig, ForgettingResult, start_forgetting_loop};
136pub use graph::EntityLockManager;
137pub use graph::{
138    BeliefRevisionConfig, Community, Edge, EdgeType, Entity, EntityType, GraphFact, GraphStore,
139    RpeRouter, RpeSignal, extract_candidate_entities,
140};
141pub use qdrant_ops::QdrantOps;
142pub use response_cache::ResponseCache;
143pub use router::{
144    AsyncMemoryRouter, HeuristicRouter, HybridRouter, LlmRouter, MemoryRoute, MemoryRouter,
145    RoutingDecision, TemporalRange, classify_graph_subgraph, parse_route_str,
146    strip_temporal_keywords,
147};
148pub use scenes::{
149    MemScene, SceneConfig, consolidate_scenes, list_scenes, start_scene_consolidation_loop,
150};
151pub use semantic::{
152    BufferedWrite, EmbedContext, ExtractionResult, ExtractionStats, GraphExtractionConfig,
153    LinkingStats, NoteLinkingConfig, PersonaExtractionConfig, StructuredSummary, TrajectoryEntry,
154    TrajectoryExtractionConfig, TreeConsolidationConfig, TreeConsolidationResult, WriteBuffer,
155    build_summarization_prompt, contains_self_referential_language, extract_and_store,
156    extract_persona_facts, extract_trajectory_entries, link_memory_notes,
157    run_tree_consolidation_sweep, start_tree_consolidation_loop,
158};
159pub use snapshot::{ImportStats, MemorySnapshot, export_snapshot, import_snapshot};
160pub use store::compression_guidelines::CompressionFailurePair;
161pub use store::corrections::UserCorrectionRow;
162pub use store::experiments::{ExperimentResultRow, NewExperimentResult, SessionSummaryRow};
163pub use store::memory_tree::MemoryTreeRow;
164pub use store::persona::PersonaFactRow;
165pub use store::session_digest::SessionDigest;
166pub use store::trajectory::{NewTrajectoryEntry, TrajectoryEntryRow};
167pub use tiers::{TierPromotionConfig, start_tier_promotion_loop};
168pub use token_counter::TokenCounter;
169pub use tokio_util::sync::CancellationToken;
170pub use types::{ConversationId, MemSceneId, MemoryTier, MessageId};
171pub use vector_store::{
172    FieldCondition, FieldValue, ScoredVectorPoint, VectorFilter, VectorPoint, VectorStore,
173    VectorStoreError,
174};