Struct SemanticMemory

Source

pub struct SemanticMemory {
    pub token_counter: Arc<TokenCounter>,
    pub graph_store: Option<Arc<GraphStore>>,
    /* private fields */
}

Fields§

§token_counter: Arc<TokenCounter>

§graph_store: Option<Arc<GraphStore>>

Implementations§

Source §

impl SemanticMemory

Source

pub async fn store_correction_embedding( &self, correction_id: i64, correction_text: &str, ) -> Result<(), MemoryError>

Store an embedding for a user correction in the vector store.

Silently skips if no vector store is configured or embeddings are unsupported.

§Errors

Returns an error if embedding generation or vector store write fails.

Source

pub async fn retrieve_similar_corrections( &self, query: &str, limit: usize, min_score: f32, ) -> Result<Vec<UserCorrectionRow>, MemoryError>

Retrieve corrections semantically similar to query.

Returns up to limit corrections scoring above min_score. Returns an empty vec if no vector store is configured.

§Errors

Returns an error if embedding generation or vector search fails.

Source §

impl SemanticMemory

Source

pub async fn has_session_summary( &self, conversation_id: ConversationId, ) -> Result<bool, MemoryError>

Check whether a session summary already exists for the given conversation.

Returns true if at least one session summary is stored in SQLite for this conversation. Used as the primary guard in the shutdown summary path to handle cases where hard compaction fired but its Qdrant write failed (the SQLite record is the authoritative source).

§Errors

Returns an error if the database query fails.

Source

pub async fn store_shutdown_summary( &self, conversation_id: ConversationId, summary_text: &str, key_facts: &[String], ) -> Result<(), MemoryError>

Store a shutdown session summary: persists to SQLite, embeds into the zeph_session_summaries Qdrant collection (so cross-session search can find it), and stores key facts into the key-facts collection.

Unlike the hard-compaction path, first_message_id and last_message_id are None because the shutdown hook does not track exact message boundaries.

§Errors

Returns an error if the SQLite insert fails. Qdrant errors are logged as warnings and do not propagate — the SQLite record is the authoritative summary store.

Source

pub async fn store_session_summary( &self, conversation_id: ConversationId, summary_text: &str, ) -> Result<(), MemoryError>

Store a session summary into the dedicated zeph_session_summaries Qdrant collection.

§Errors

Returns an error if embedding or Qdrant storage fails.

Source

pub async fn search_session_summaries( &self, query: &str, limit: usize, exclude_conversation_id: Option<ConversationId>, ) -> Result<Vec<SessionSummaryResult>, MemoryError>

Search session summaries from other conversations.

§Errors

Returns an error if embedding or Qdrant search fails.

Source §

impl SemanticMemory

Source

pub fn spawn_graph_extraction( &self, content: String, context_messages: Vec<String>, config: GraphExtractionConfig, post_extract_validator: PostExtractValidator, ) -> JoinHandle<()>

Spawn background graph extraction for a message. Fire-and-forget — never blocks.

Extraction runs in a separate tokio task with a timeout. Any error or timeout is logged and the task exits silently; the agent response is never blocked.

The optional post_extract_validator is called after extraction, before upsert. It is a generic predicate opaque to zeph-memory (design decision D1).

When config.note_linking.enabled is true and an embedding store is available, link_memory_notes runs after successful extraction inside the same task, bounded by config.note_linking.timeout_secs.

Source §

impl SemanticMemory

Source

pub async fn remember( &self, conversation_id: ConversationId, role: &str, content: &str, ) -> Result<MessageId, MemoryError>

Save a message to SQLite and optionally embed and store in Qdrant.

Returns the message ID assigned by SQLite.

§Errors

Returns an error if the SQLite save fails. Embedding failures are logged but not propagated.

Source

pub async fn remember_with_parts( &self, conversation_id: ConversationId, role: &str, content: &str, parts_json: &str, ) -> Result<(MessageId, bool), MemoryError>

Save a message with pre-serialized parts JSON to SQLite and optionally embed in Qdrant.

Returns (message_id, embedding_stored) tuple where embedding_stored is true if an embedding was successfully generated and stored in Qdrant.

§Errors

Returns an error if the SQLite save fails.

Source

pub async fn save_only( &self, conversation_id: ConversationId, role: &str, content: &str, parts_json: &str, ) -> Result<MessageId, MemoryError>

Save a message to SQLite without generating an embedding.

Use this when embedding is intentionally skipped (e.g. autosave disabled for assistant).

§Errors

Returns an error if the SQLite save fails.

Source

pub async fn recall( &self, query: &str, limit: usize, filter: Option<SearchFilter>, ) -> Result<Vec<RecalledMessage>, MemoryError>

Recall relevant messages using hybrid search (vector + FTS5 keyword).

When Qdrant is available, runs both vector and keyword searches, then merges results using weighted scoring. When Qdrant is unavailable, falls back to FTS5-only keyword search.

§Errors

Returns an error if embedding generation, Qdrant search, or FTS5 query fails.

Source

pub async fn recall_routed( &self, query: &str, limit: usize, filter: Option<SearchFilter>, router: &dyn MemoryRouter, ) -> Result<Vec<RecalledMessage>, MemoryError>

Recall messages using query-aware routing.

Delegates to FTS5-only, vector-only, or hybrid search based on the router decision, then runs the shared merge and ranking pipeline.

§Errors

Returns an error if any underlying search or database operation fails.

Source

pub async fn recall_graph( &self, query: &str, limit: usize, max_hops: u32, at_timestamp: Option<&str>, temporal_decay_rate: f64, edge_types: &[EdgeType], ) -> Result<Vec<GraphFact>, MemoryError>

Retrieve graph facts relevant to query via BFS traversal.

Returns an empty Vec if no graph_store is configured.

§Parameters

at_timestamp: when Some, only edges valid at that SQLite datetime string are returned. When None, only currently active edges are used.
temporal_decay_rate: non-negative decay rate (1/day). 0.0 preserves original ordering.

§Errors

Returns an error if the underlying graph query fails.

Source

pub async fn recall_graph_activated( &self, query: &str, limit: usize, params: SpreadingActivationParams, edge_types: &[EdgeType], ) -> Result<Vec<ActivatedFact>, MemoryError>

Retrieve graph facts via SYNAPSE spreading activation.

Delegates to crate::graph::retrieval::graph_recall_activated. Used in place of recall_graph when spreading_activation.enabled = true.

§Errors

Returns an error if the underlying graph query fails.

Source

pub async fn has_embedding( &self, message_id: MessageId, ) -> Result<bool, MemoryError>

Check whether an embedding exists for a given message ID.

§Errors

Returns an error if the SQLite query fails.

Source

pub async fn embed_missing(&self) -> Result<usize, MemoryError>

Embed all messages that do not yet have embeddings.

Returns the count of successfully embedded messages.

§Errors

Returns an error if collection initialization or database query fails. Individual embedding failures are logged but do not stop processing.

Source §

impl SemanticMemory

Source

pub async fn load_summaries( &self, conversation_id: ConversationId, ) -> Result<Vec<Summary>, MemoryError>

Load all summaries for a conversation.

§Errors

Returns an error if the query fails.

Source

pub async fn summarize( &self, conversation_id: ConversationId, message_count: usize, ) -> Result<Option<i64>, MemoryError>

Generate a summary of the oldest unsummarized messages.

Returns Ok(None) if there are not enough messages to summarize.

§Errors

Returns an error if LLM call or database operation fails.

Source

pub async fn search_key_facts( &self, query: &str, limit: usize, ) -> Result<Vec<String>, MemoryError>

Search key facts extracted from conversation summaries.

§Errors

Returns an error if embedding or Qdrant search fails.

Source

pub async fn search_document_collection( &self, collection: &str, query: &str, limit: usize, ) -> Result<Vec<ScoredVectorPoint>, MemoryError>

Search a named document collection by semantic similarity.

Returns up to limit scored vector points whose payloads contain ingested document chunks. Returns an empty vec when Qdrant is unavailable, the collection does not exist, or the provider does not support embeddings.

§Errors

Returns an error if embedding generation or Qdrant search fails.

Source §

impl SemanticMemory

Source

pub async fn new( sqlite_path: &str, qdrant_url: &str, provider: AnyProvider, embedding_model: &str, ) -> Result<Self, MemoryError>

Create a new SemanticMemory instance with default hybrid search weights (0.7/0.3).

Qdrant connection is best-effort: if unavailable, semantic search is disabled.

For AppBuilder bootstrap, prefer SemanticMemory::with_qdrant_ops to share a single gRPC channel across all subsystems.

§Errors

Returns an error if SQLite cannot be initialized.

Source

pub async fn with_weights( sqlite_path: &str, qdrant_url: &str, provider: AnyProvider, embedding_model: &str, vector_weight: f64, keyword_weight: f64, ) -> Result<Self, MemoryError>

Create a new SemanticMemory with custom vector/keyword weights for hybrid search.

For AppBuilder bootstrap, prefer SemanticMemory::with_qdrant_ops to share a single gRPC channel across all subsystems.

§Errors

Returns an error if SQLite cannot be initialized.

Source

pub async fn with_weights_and_pool_size( sqlite_path: &str, qdrant_url: &str, provider: AnyProvider, embedding_model: &str, vector_weight: f64, keyword_weight: f64, pool_size: u32, ) -> Result<Self, MemoryError>

Create a new SemanticMemory with custom weights and configurable pool size.

For AppBuilder bootstrap, prefer SemanticMemory::with_qdrant_ops to share a single gRPC channel across all subsystems.

§Errors

Returns an error if SQLite cannot be initialized.

Source

pub async fn with_qdrant_ops( sqlite_path: &str, ops: QdrantOps, provider: AnyProvider, embedding_model: &str, vector_weight: f64, keyword_weight: f64, pool_size: u32, ) -> Result<Self, MemoryError>

Create a SemanticMemory from a pre-built QdrantOps instance.

Use this at bootstrap to share one QdrantOps (and thus one gRPC channel) across all subsystems. The ops is consumed and wrapped inside EmbeddingStore.

§Errors

Returns an error if SQLite cannot be initialized.

Source

pub fn with_graph_store(self, store: Arc<GraphStore>) -> Self

Attach a GraphStore for graph-aware retrieval.

When set, recall_graph traverses the graph starting from entities matched by the query.

Source

pub fn community_detection_failures(&self) -> u64

Returns the cumulative count of community detection failures since startup.

Source

pub fn graph_extraction_count(&self) -> u64

Returns the cumulative count of successful graph extractions since startup.

Source

pub fn graph_extraction_failures(&self) -> u64

Returns the cumulative count of failed graph extractions since startup.

Source

pub fn with_ranking_options( self, temporal_decay_enabled: bool, temporal_decay_half_life_days: u32, mmr_enabled: bool, mmr_lambda: f32, ) -> Self

Configure temporal decay and MMR re-ranking options.

Source

pub fn with_importance_options(self, enabled: bool, weight: f64) -> Self

Configure write-time importance scoring for memory retrieval.

Source

pub fn from_parts( sqlite: SqliteStore, qdrant: Option<Arc<EmbeddingStore>>, provider: AnyProvider, embedding_model: impl Into<String>, vector_weight: f64, keyword_weight: f64, token_counter: Arc<TokenCounter>, ) -> Self

Construct a SemanticMemory from pre-built parts.

Intended for tests that need full control over the backing stores.

Source

pub async fn with_sqlite_backend( sqlite_path: &str, provider: AnyProvider, embedding_model: &str, vector_weight: f64, keyword_weight: f64, ) -> Result<Self, MemoryError>

Create a SemanticMemory using the SQLite-embedded vector backend.

§Errors

Returns an error if SQLite cannot be initialized.

Source

pub async fn with_sqlite_backend_and_pool_size( sqlite_path: &str, provider: AnyProvider, embedding_model: &str, vector_weight: f64, keyword_weight: f64, pool_size: u32, ) -> Result<Self, MemoryError>

Create a SemanticMemory using the SQLite-embedded vector backend with configurable pool size.

§Errors

Returns an error if SQLite cannot be initialized.

Source

pub fn sqlite(&self) -> &SqliteStore

Access the underlying SqliteStore for operations that don’t involve semantics.

Source

pub async fn is_vector_store_connected(&self) -> bool

Check if the vector store backend is reachable.

Performs a real health check (Qdrant gRPC ping or SQLite query) instead of just checking whether the client was created.

Source

pub fn has_vector_store(&self) -> bool

Check if a vector store client is configured (may not be connected).

Source

pub fn embedding_store(&self) -> Option<&Arc<EmbeddingStore>>

Return a reference to the embedding store, if configured.

Source

pub async fn message_count( &self, conversation_id: ConversationId, ) -> Result<i64, MemoryError>

Count messages in a conversation.

§Errors

Returns an error if the query fails.

Source

pub async fn unsummarized_message_count( &self, conversation_id: ConversationId, ) -> Result<i64, MemoryError>

Count messages not yet covered by any summary.

§Errors

Returns an error if the query fails.

Auto Trait Implementations§

§

impl !UnwindSafe for SemanticMemory

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T> Instrument for T

Source §

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more

Source §

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> IntoEither for T

Source §

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

impl<T> IntoRequest<T> for T

Source §

fn into_request(self) -> Request<T>

Wrap the input message T in a tonic::Request

Source §

impl<T> PolicyExt for T
where T: ?Sized,

Source §

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow only if self and other return Action::Follow. Read more

Source §

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow if either self or other returns Action::Follow. Read more

Source §

impl<T> Same for T

Source §

type Output = T

Should always be Self

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Source §

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source §

fn vzip(self) -> V

Source §

impl<T> WithSubscriber for T

Source §

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more

Source §

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more

SemanticMemory

Struct SemanticMemory Copy item path

Fields§

Implementations§

impl SemanticMemory

pub async fn store_correction_embedding( &self, correction_id: i64, correction_text: &str, ) -> Result<(), MemoryError>

§Errors

pub async fn retrieve_similar_corrections( &self, query: &str, limit: usize, min_score: f32, ) -> Result<Vec<UserCorrectionRow>, MemoryError>

§Errors

impl SemanticMemory

pub async fn has_session_summary( &self, conversation_id: ConversationId, ) -> Result<bool, MemoryError>

§Errors

pub async fn store_shutdown_summary( &self, conversation_id: ConversationId, summary_text: &str, key_facts: &[String], ) -> Result<(), MemoryError>

§Errors

pub async fn store_session_summary( &self, conversation_id: ConversationId, summary_text: &str, ) -> Result<(), MemoryError>

§Errors

pub async fn search_session_summaries( &self, query: &str, limit: usize, exclude_conversation_id: Option<ConversationId>, ) -> Result<Vec<SessionSummaryResult>, MemoryError>

§Errors

impl SemanticMemory

pub fn spawn_graph_extraction( &self, content: String, context_messages: Vec<String>, config: GraphExtractionConfig, post_extract_validator: PostExtractValidator, ) -> JoinHandle<()>

impl SemanticMemory

pub async fn remember( &self, conversation_id: ConversationId, role: &str, content: &str, ) -> Result<MessageId, MemoryError>

§Errors

pub async fn remember_with_parts( &self, conversation_id: ConversationId, role: &str, content: &str, parts_json: &str, ) -> Result<(MessageId, bool), MemoryError>

§Errors

pub async fn save_only( &self, conversation_id: ConversationId, role: &str, content: &str, parts_json: &str, ) -> Result<MessageId, MemoryError>

§Errors

pub async fn recall( &self, query: &str, limit: usize, filter: Option<SearchFilter>, ) -> Result<Vec<RecalledMessage>, MemoryError>

§Errors

pub async fn recall_routed( &self, query: &str, limit: usize, filter: Option<SearchFilter>, router: &dyn MemoryRouter, ) -> Result<Vec<RecalledMessage>, MemoryError>

§Errors

pub async fn recall_graph( &self, query: &str, limit: usize, max_hops: u32, at_timestamp: Option<&str>, temporal_decay_rate: f64, edge_types: &[EdgeType], ) -> Result<Vec<GraphFact>, MemoryError>

§Parameters

§Errors

pub async fn recall_graph_activated( &self, query: &str, limit: usize, params: SpreadingActivationParams, edge_types: &[EdgeType], ) -> Result<Vec<ActivatedFact>, MemoryError>

§Errors

pub async fn has_embedding( &self, message_id: MessageId, ) -> Result<bool, MemoryError>

§Errors

pub async fn embed_missing(&self) -> Result<usize, MemoryError>

§Errors

impl SemanticMemory

pub async fn load_summaries( &self, conversation_id: ConversationId, ) -> Result<Vec<Summary>, MemoryError>

§Errors

pub async fn summarize( &self, conversation_id: ConversationId, message_count: usize, ) -> Result<Option<i64>, MemoryError>

§Errors

pub async fn search_key_facts( &self, query: &str, limit: usize, ) -> Result<Vec<String>, MemoryError>

§Errors

pub async fn search_document_collection( &self, collection: &str, query: &str, limit: usize, ) -> Result<Vec<ScoredVectorPoint>, MemoryError>

§Errors

impl SemanticMemory

pub async fn new( sqlite_path: &str, qdrant_url: &str, provider: AnyProvider, embedding_model: &str, ) -> Result<Self, MemoryError>

§Errors

pub async fn with_weights( sqlite_path: &str, qdrant_url: &str, provider: AnyProvider, embedding_model: &str, vector_weight: f64, keyword_weight: f64, ) -> Result<Self, MemoryError>

§Errors

pub async fn with_weights_and_pool_size( sqlite_path: &str, qdrant_url: &str, provider: AnyProvider, embedding_model: &str, vector_weight: f64, keyword_weight: f64, pool_size: u32, ) -> Result<Self, MemoryError>

§Errors

pub async fn with_qdrant_ops( sqlite_path: &str, ops: QdrantOps, provider: AnyProvider, embedding_model: &str, vector_weight: f64, keyword_weight: f64, pool_size: u32, ) -> Result<Self, MemoryError>

§Errors

pub fn with_graph_store(self, store: Arc<GraphStore>) -> Self

pub fn community_detection_failures(&self) -> u64

pub fn graph_extraction_count(&self) -> u64

pub fn graph_extraction_failures(&self) -> u64

pub fn with_ranking_options( self, temporal_decay_enabled: bool, temporal_decay_half_life_days: u32, mmr_enabled: bool, mmr_lambda: f32, ) -> Self

pub fn with_importance_options(self, enabled: bool, weight: f64) -> Self

pub fn from_parts( sqlite: SqliteStore, qdrant: Option<Arc<EmbeddingStore>>, provider: AnyProvider, embedding_model: impl Into<String>, vector_weight: f64, keyword_weight: f64, token_counter: Arc<TokenCounter>, ) -> Self

pub async fn with_sqlite_backend( sqlite_path: &str, provider: AnyProvider, embedding_model: &str, vector_weight: f64, keyword_weight: f64, ) -> Result<Self, MemoryError>

§Errors

pub async fn with_sqlite_backend_and_pool_size( sqlite_path: &str, provider: AnyProvider, embedding_model: &str, vector_weight: f64, keyword_weight: f64, pool_size: u32, ) -> Result<Self, MemoryError>

§Errors

pub fn sqlite(&self) -> &SqliteStore

pub async fn is_vector_store_connected(&self) -> bool

pub fn has_vector_store(&self) -> bool

pub fn embedding_store(&self) -> Option<&Arc<EmbeddingStore>>

pub async fn message_count( &self, conversation_id: ConversationId, ) -> Result<i64, MemoryError>

§Errors

pub async fn unsummarized_message_count( &self, conversation_id: ConversationId, ) -> Result<i64, MemoryError>

§Errors

Auto Trait Implementations§

impl !Freeze for SemanticMemory

impl !RefUnwindSafe for SemanticMemory

Struct SemanticMemory

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,