mod adapter;
mod bench;
mod error;
mod eval;
pub mod grpc;
mod ha;
mod ingest;
mod mcp;
mod migrate;
mod ops;
mod reindex;
mod sdk_runtime;
mod security;
mod server;
mod sql_semantics;
mod vector_index;
pub use adapter::{SqlRiteToolAdapter, ToolRequest, ToolResponse, ToolSpec};
pub use bench::{
BenchmarkConfig, BenchmarkFilterMode, BenchmarkLatency, BenchmarkReport, run_benchmark,
};
pub use error::{Result, SqlRiteError};
pub use eval::{
EvalDataset, EvalMetricsAtK, EvalQuery, EvalReport, EvalSummary, QueryEvalResult,
evaluate_dataset,
};
pub use grpc::{GrpcServerConfig, grpc_json_payload_or_error, run_grpc_server};
pub use ha::{
FailoverMode, HaRuntimeProfile, HaRuntimeState, RecoveryConfig, ReplicationConfig,
ReplicationLog, ReplicationLogEntry, ServerRole,
};
pub use ingest::{
ChunkingStrategy, CustomHttpEmbeddingProvider, DeterministicEmbeddingProvider,
EmbeddingProvider, EmbeddingRetryPolicy, IngestionBatchTuning, IngestionCheckpoint,
IngestionReport, IngestionRequest, IngestionSource, IngestionWorker,
OpenAiCompatibleEmbeddingProvider,
};
pub use mcp::{McpServerConfig, mcp_tools_manifest_document, run_stdio_mcp_server};
pub use migrate::{
ApiFirstSourceKind, ApiJsonlMigrationConfig, MigrationEmbeddingFormat, MigrationReport,
PgvectorJsonlMigrationConfig, SqliteMigrationConfig, migrate_api_jsonl, migrate_pgvector_jsonl,
migrate_sqlite,
};
pub use ops::{
BackupPruneReport, BackupSnapshotRecord, HealthReport, backup_file, build_health_report,
create_backup_snapshot, list_backup_snapshots, prune_backup_snapshots, restore_backup_file,
restore_backup_file_verified, select_backup_snapshot_for_time, verify_backup_file,
};
pub use reindex::{ReindexCheckpoint, ReindexOptions, ReindexReport, reindex_embeddings};
pub use sdk_runtime::{
SdkRuntimeError, execute_query as execute_sdk_query, execute_sql as execute_sdk_sql,
};
pub use security::{
AccessContext, AccessOperation, AccessPolicy, AllowAllPolicy, AuditEvent, AuditExportFormat,
AuditExportReport, AuditLogger, AuditQuery, InMemoryTenantKeyRegistry, JsonlAuditLogger,
KeyRotationReport, RbacPolicy, RbacPolicyConfig, SecureSqlRite, TenantKey, TenantKeyRegistry,
export_audit_events, inspect_tenant_key_rotation, read_audit_events,
rotate_tenant_encryption_key, rotate_tenant_encryption_key_with_report,
};
pub use server::{ServerConfig, ServerSecurityConfig, serve_health_endpoints};
pub use sql_semantics::{execute_sql_statement_json, prepare_sql_connection};
pub use vector_index::{
AnnTuningConfig, BruteForceVectorIndex, LshAnnVectorIndex, VectorCandidate, VectorIndex,
VectorIndexMode, VectorIndexOptions, VectorStorageKind,
};
use std::cell::RefCell;
use std::collections::{HashMap, HashSet};
use std::fs::{self, File};
use std::io::{Read, Write};
use std::path::{Path, PathBuf};
use std::time::{Duration, Instant};

use half::f16;
use roaring::RoaringTreemap;
use rusqlite::types::Value as SqlValue;
use rusqlite::{Connection, params, params_from_iter};
use serde::{Deserialize, Serialize};
use serde_json::Value;

use crate::ingest::chunk_text_for_ingest;
use crate::vector_index::{BuiltinVectorIndex, ChunkKey, VectorEntryRecord};
const LATEST_SCHEMA_VERSION: i64 = 4;
const HYBRID_FTS_SCORE_LOOKUP_SKIP_CANDIDATE_LIMIT: usize = 512;
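// `QueryProfile` resolution knobs: the latency profile caps the candidate
// pool at `top_k * 8` (never below 32), while the recall profile floors it at
// `top_k * 32` (never below 200). See `SearchRequest::resolve_query_profile`.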
const QUERY_PROFILE_LATENCY_MIN_CANDIDATE_LIMIT: usize = 32;
const QUERY_PROFILE_LATENCY_TOP_K_MULTIPLIER: usize = 8;
const QUERY_PROFILE_RECALL_MIN_CANDIDATE_LIMIT: usize = 200;
const QUERY_PROFILE_RECALL_TOP_K_MULTIPLIER: usize = 32;
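// Idempotent upserts: re-ingesting a chunk id replaces the row wholesale,
// while a document row only takes a new `source` when one is provided
// (NULL keeps the existing value, per the COALESCE).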
const DOC_UPSERT_SQL: &str = "
INSERT INTO documents (id, source, metadata) VALUES (?1, ?2, '{}')
ON CONFLICT(id) DO UPDATE SET source = COALESCE(excluded.source, documents.source)
";
const CHUNK_UPSERT_SQL: &str = "
INSERT INTO chunks (id, doc_id, content, metadata, embedding, embedding_dim)
VALUES (?1, ?2, ?3, ?4, ?5, ?6)
ON CONFLICT(id) DO UPDATE SET
doc_id = excluded.doc_id,
content = excluded.content,
metadata = excluded.metadata,
embedding = excluded.embedding,
embedding_dim = excluded.embedding_dim
";
struct Migration {
version: i64,
name: &'static str,
sql: &'static str,
}
const MIGRATIONS: &[Migration] = &[
Migration {
version: 1,
name: "baseline_schema",
sql: "
CREATE TABLE IF NOT EXISTS documents (
id TEXT PRIMARY KEY,
source TEXT,
metadata TEXT NOT NULL DEFAULT '{}',
created_at TEXT NOT NULL DEFAULT (datetime('now'))
);
CREATE TABLE IF NOT EXISTS chunks (
rowid INTEGER PRIMARY KEY AUTOINCREMENT,
id TEXT NOT NULL UNIQUE,
doc_id TEXT NOT NULL,
content TEXT NOT NULL,
metadata TEXT NOT NULL DEFAULT '{}',
embedding BLOB NOT NULL,
                embedding_dim INTEGER NOT NULL CHECK (embedding_dim > 0),
created_at TEXT NOT NULL DEFAULT (datetime('now')),
FOREIGN KEY (doc_id) REFERENCES documents(id) ON DELETE CASCADE
);
",
},
Migration {
version: 2,
name: "chunk_indexes",
sql: "
CREATE INDEX IF NOT EXISTS idx_chunks_doc_id ON chunks(doc_id);
CREATE INDEX IF NOT EXISTS idx_chunks_created_at ON chunks(created_at DESC, rowid DESC);
CREATE INDEX IF NOT EXISTS idx_documents_created_at ON documents(created_at DESC);
",
},
Migration {
version: 3,
name: "retrieval_index_catalog",
sql: "
CREATE TABLE IF NOT EXISTS retrieval_indexes (
name TEXT PRIMARY KEY,
index_kind TEXT NOT NULL CHECK (index_kind IN ('vector', 'text')),
table_name TEXT NOT NULL,
column_name TEXT NOT NULL,
using_engine TEXT NOT NULL,
options_json TEXT NOT NULL DEFAULT '{}',
status TEXT NOT NULL DEFAULT 'active',
created_at TEXT NOT NULL DEFAULT (datetime('now'))
);
CREATE INDEX IF NOT EXISTS idx_retrieval_indexes_kind_table
ON retrieval_indexes(index_kind, table_name, status);
CREATE VIEW IF NOT EXISTS retrieval_index_catalog AS
SELECT
name,
index_kind,
table_name,
column_name,
using_engine,
options_json,
status,
created_at
FROM retrieval_indexes;
",
},
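    // SQLite cannot alter a CHECK constraint in place, so v4 rebuilds the
    // chunks table (preserving rowids) to relax `embedding_dim > 0` into
    // `embedding_dim >= 0`, which lets text-only chunks store an empty
    // embedding blob.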
Migration {
version: 4,
name: "allow_text_only_chunks",
sql: "
ALTER TABLE chunks RENAME TO chunks_legacy_v3;
CREATE TABLE chunks (
rowid INTEGER PRIMARY KEY AUTOINCREMENT,
id TEXT NOT NULL UNIQUE,
doc_id TEXT NOT NULL,
content TEXT NOT NULL,
metadata TEXT NOT NULL DEFAULT '{}',
embedding BLOB NOT NULL,
embedding_dim INTEGER NOT NULL CHECK (embedding_dim >= 0),
created_at TEXT NOT NULL DEFAULT (datetime('now')),
FOREIGN KEY (doc_id) REFERENCES documents(id) ON DELETE CASCADE
);
INSERT INTO chunks (rowid, id, doc_id, content, metadata, embedding, embedding_dim, created_at)
SELECT rowid, id, doc_id, content, metadata, embedding, embedding_dim, created_at
FROM chunks_legacy_v3;
DROP TABLE chunks_legacy_v3;
CREATE INDEX IF NOT EXISTS idx_chunks_doc_id ON chunks(doc_id);
CREATE INDEX IF NOT EXISTS idx_chunks_created_at ON chunks(created_at DESC, rowid DESC);
",
},
];
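/// A pre-embedded chunk ready for ingestion. `metadata` defaults to an empty
/// JSON object and `source` to `None`; both can be filled in with the
/// builder-style helpers below.
///
/// A minimal construction sketch, marked `ignore` because the crate name
/// `sqlrite` and the toy embedding are assumptions:
///
/// ```ignore
/// use sqlrite::ChunkInput;
///
/// let chunk = ChunkInput::new("doc-1:chunk-0", "doc-1", "hello world", vec![0.1, 0.2, 0.3])
///     .with_metadata(serde_json::json!({ "tenant": "acme" }))
///     .with_source("notes/hello.md");
/// ```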
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct ChunkInput {
pub id: String,
pub doc_id: String,
pub content: String,
pub embedding: Vec<f32>,
pub metadata: Value,
pub source: Option<String>,
}
impl ChunkInput {
pub fn new(
id: impl Into<String>,
doc_id: impl Into<String>,
content: impl Into<String>,
embedding: Vec<f32>,
) -> Self {
Self {
id: id.into(),
doc_id: doc_id.into(),
content: content.into(),
embedding,
metadata: Value::Object(serde_json::Map::new()),
source: None,
}
}
pub fn with_metadata(mut self, metadata: Value) -> Self {
self.metadata = metadata;
self
}
pub fn with_source(mut self, source: impl Into<String>) -> Self {
self.source = Some(source.into());
self
}
}
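/// Like [`ChunkInput`], but without an embedding: the chunk is stored with an
/// empty embedding blob (`embedding_dim = 0`) and participates in text search
/// only, until `update_chunk_embedding` backfills a vector.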
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct TextChunkInput {
pub id: String,
pub doc_id: String,
pub content: String,
pub metadata: Value,
pub source: Option<String>,
}
impl TextChunkInput {
pub fn new(
id: impl Into<String>,
doc_id: impl Into<String>,
content: impl Into<String>,
) -> Self {
Self {
id: id.into(),
doc_id: doc_id.into(),
content: content.into(),
metadata: Value::Object(serde_json::Map::new()),
source: None,
}
}
pub fn with_metadata(mut self, metadata: Value) -> Self {
self.metadata = metadata;
self
}
pub fn with_source(mut self, source: impl Into<String>) -> Self {
self.source = Some(source.into());
self
}
}
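/// Options for `ingest_document_text`: how to split the document, plus the
/// metadata and source applied to every produced chunk. Chunk ids are
/// `"{prefix}-{idx}"`, where the prefix defaults to `"{doc_id}:chunk"`.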
#[derive(Debug, Clone)]
pub struct DocumentIngestOptions {
pub chunking: ChunkingStrategy,
pub metadata: Value,
pub source: Option<String>,
pub chunk_id_prefix: Option<String>,
}
impl Default for DocumentIngestOptions {
fn default() -> Self {
Self {
chunking: ChunkingStrategy::default(),
metadata: Value::Object(serde_json::Map::new()),
source: None,
chunk_id_prefix: None,
}
}
}
impl DocumentIngestOptions {
pub fn with_chunking(mut self, chunking: ChunkingStrategy) -> Self {
self.chunking = chunking;
self
}
pub fn with_metadata(mut self, metadata: Value) -> Self {
self.metadata = metadata;
self
}
pub fn with_source(mut self, source: impl Into<String>) -> Self {
self.source = Some(source.into());
self
}
pub fn with_chunk_id_prefix(mut self, prefix: impl Into<String>) -> Self {
self.chunk_id_prefix = Some(prefix.into());
self
}
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct DocumentIngestReport {
pub doc_id: String,
pub chunk_ids: Vec<String>,
pub chunk_count: usize,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct StoredChunk {
pub id: String,
pub doc_id: String,
pub content: String,
pub metadata: Value,
pub source: Option<String>,
}
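/// A vector, text, or hybrid search. At least one of `query_text` and
/// `query_embedding` must be set; `alpha` (validated to `0.0..=1.0`) balances
/// vector against text scores under weighted fusion, and `candidate_limit`
/// bounds how many chunks are scored before the final `top_k` cut.
///
/// A text-only sketch (`ignore`d: the crate name `sqlrite` is assumed):
///
/// ```ignore
/// use sqlrite::SearchRequest;
///
/// let request = SearchRequest::text("rust sqlite hybrid search", 5);
/// ```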
#[derive(Debug, Clone)]
pub struct SearchRequest {
pub query_text: Option<String>,
pub query_embedding: Option<Vec<f32>>,
pub top_k: usize,
pub alpha: f32,
pub candidate_limit: usize,
pub include_payloads: bool,
pub metadata_filters: HashMap<String, String>,
pub doc_id: Option<String>,
pub fusion_strategy: FusionStrategy,
pub query_profile: QueryProfile,
}
impl Default for SearchRequest {
fn default() -> Self {
Self {
query_text: None,
query_embedding: None,
top_k: 5,
alpha: 0.65,
candidate_limit: 1000,
include_payloads: true,
metadata_filters: HashMap::new(),
doc_id: None,
fusion_strategy: FusionStrategy::default(),
query_profile: QueryProfile::default(),
}
}
}
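/// How vector and text scores are fused: `Weighted` blends the two scores
/// using the request's `alpha`, while `ReciprocalRankFusion` combines ranks
/// rather than raw scores, controlled by `rank_constant` (validated to be
/// positive).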
#[derive(Debug, Clone, Copy, PartialEq, Serialize, Deserialize, Default)]
pub enum FusionStrategy {
#[default]
Weighted,
ReciprocalRankFusion {
rank_constant: f32,
},
}
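/// Trades candidate-pool size for speed: `Latency` caps `candidate_limit`,
/// `Recall` raises its floor, and `Balanced` leaves the request untouched.
/// See [`SearchRequest::resolve_query_profile`].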
#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, Default)]
#[serde(rename_all = "snake_case")]
pub enum QueryProfile {
Latency,
#[default]
Balanced,
Recall,
}
impl SearchRequest {
pub fn text(query_text: impl Into<String>, top_k: usize) -> Self {
Self {
query_text: Some(query_text.into()),
top_k,
..Self::default()
}
}
pub fn text_only(query_text: impl Into<String>, top_k: usize) -> Self {
Self::text(query_text, top_k)
}
pub fn vector(query_embedding: Vec<f32>, top_k: usize) -> Self {
Self {
query_embedding: Some(query_embedding),
top_k,
..Self::default()
}
}
pub fn vector_only(query_embedding: Vec<f32>, top_k: usize) -> Self {
Self::vector(query_embedding, top_k)
}
pub fn hybrid(query_text: impl Into<String>, query_embedding: Vec<f32>, top_k: usize) -> Self {
Self {
query_text: Some(query_text.into()),
query_embedding: Some(query_embedding),
top_k,
..Self::default()
}
}
pub fn builder() -> SearchRequestBuilder {
SearchRequestBuilder::default()
}
pub fn resolve_query_profile(&self) -> Self {
let mut resolved = self.clone();
match resolved.query_profile {
QueryProfile::Latency => {
let cap = resolved
.top_k
.saturating_mul(QUERY_PROFILE_LATENCY_TOP_K_MULTIPLIER)
.max(QUERY_PROFILE_LATENCY_MIN_CANDIDATE_LIMIT);
resolved.candidate_limit = resolved.candidate_limit.min(cap).max(resolved.top_k);
}
QueryProfile::Balanced => {}
QueryProfile::Recall => {
let floor = resolved
.top_k
.saturating_mul(QUERY_PROFILE_RECALL_TOP_K_MULTIPLIER)
.max(QUERY_PROFILE_RECALL_MIN_CANDIDATE_LIMIT);
resolved.candidate_limit = resolved.candidate_limit.max(floor);
}
}
resolved
}
pub fn validate(&self) -> Result<()> {
if self.query_text.is_none() && self.query_embedding.is_none() {
return Err(SqlRiteError::MissingQuery);
}
if self.top_k == 0 {
return Err(SqlRiteError::InvalidTopK);
}
if self.candidate_limit == 0 {
return Err(SqlRiteError::InvalidCandidateLimit);
}
if self.candidate_limit < self.top_k {
return Err(SqlRiteError::CandidateLimitTooSmall);
}
if !(0.0..=1.0).contains(&self.alpha) {
return Err(SqlRiteError::InvalidAlpha);
}
if let FusionStrategy::ReciprocalRankFusion { rank_constant } = self.fusion_strategy
&& rank_constant <= 0.0
{
return Err(SqlRiteError::InvalidRrfRankConstant);
}
Ok(())
}
}
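/// Fluent construction for [`SearchRequest`]; `build` runs the same checks as
/// [`SearchRequest::validate`].
///
/// A hybrid-query sketch, `ignore`d because the crate name and the zeroed
/// 384-dim embedding are placeholders:
///
/// ```ignore
/// use sqlrite::SearchRequest;
///
/// let request = SearchRequest::builder()
///     .query_text("error handling")
///     .query_embedding(vec![0.0; 384])
///     .top_k(10)
///     .metadata_filter("tenant", "acme")
///     .reciprocal_rank_fusion(60.0)
///     .build()?;
/// # Ok::<(), sqlrite::SqlRiteError>(())
/// ```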
#[derive(Debug, Default, Clone)]
pub struct SearchRequestBuilder {
inner: SearchRequest,
}
impl SearchRequestBuilder {
pub fn new() -> Self {
Self::default()
}
pub fn query_text(mut self, value: impl Into<String>) -> Self {
self.inner.query_text = Some(value.into());
self
}
pub fn query_embedding(mut self, value: Vec<f32>) -> Self {
self.inner.query_embedding = Some(value);
self
}
pub fn top_k(mut self, value: usize) -> Self {
self.inner.top_k = value;
self
}
pub fn alpha(mut self, value: f32) -> Self {
self.inner.alpha = value;
self
}
pub fn candidate_limit(mut self, value: usize) -> Self {
self.inner.candidate_limit = value;
self
}
pub fn include_payloads(mut self, value: bool) -> Self {
self.inner.include_payloads = value;
self
}
pub fn metadata_filter(mut self, key: impl Into<String>, value: impl Into<String>) -> Self {
self.inner.metadata_filters.insert(key.into(), value.into());
self
}
pub fn doc_id(mut self, value: impl Into<String>) -> Self {
self.inner.doc_id = Some(value.into());
self
}
pub fn fusion_strategy(mut self, value: FusionStrategy) -> Self {
self.inner.fusion_strategy = value;
self
}
pub fn query_profile(mut self, value: QueryProfile) -> Self {
self.inner.query_profile = value;
self
}
pub fn reciprocal_rank_fusion(mut self, rank_constant: f32) -> Self {
self.inner.fusion_strategy = FusionStrategy::ReciprocalRankFusion { rank_constant };
self
}
pub fn build(self) -> Result<SearchRequest> {
self.inner.validate()?;
Ok(self.inner)
}
}
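/// Maps directly onto SQLite's `synchronous` pragma: `Balanced` is NORMAL,
/// `Durable` is FULL, and `FastUnsafe` is OFF (fastest, at the cost of
/// durability on power loss).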
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub enum DurabilityProfile {
Balanced,
Durable,
FastUnsafe,
}
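/// Connection-level tuning applied when a database is opened: durability,
/// WAL, SQLite mmap/cache sizing, and which in-memory vector index to build.
///
/// A sketch of a durable setup (`ignore`d: the crate name is assumed):
///
/// ```ignore
/// use sqlrite::{RuntimeConfig, SqlRite, VectorIndexMode};
///
/// let config = RuntimeConfig::durable()
///     .with_vector_index_mode(VectorIndexMode::BruteForce)
///     .with_sqlite_cache_size_kib(131_072);
/// let db = SqlRite::open_with_config("index.db", config)?;
/// # Ok::<(), sqlrite::SqlRiteError>(())
/// ```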
#[derive(Debug, Clone)]
pub struct RuntimeConfig {
pub durability_profile: DurabilityProfile,
pub busy_timeout_ms: u64,
pub enable_wal: bool,
pub temp_store_memory: bool,
pub vector_index_mode: VectorIndexMode,
pub vector_storage_kind: VectorStorageKind,
pub ann_tuning: AnnTuningConfig,
pub enable_ann_persistence: bool,
pub sqlite_mmap_size_bytes: i64,
pub sqlite_cache_size_kib: i64,
}
impl Default for RuntimeConfig {
fn default() -> Self {
Self {
durability_profile: DurabilityProfile::Balanced,
busy_timeout_ms: 5_000,
enable_wal: true,
temp_store_memory: true,
vector_index_mode: VectorIndexMode::BruteForce,
vector_storage_kind: VectorStorageKind::F32,
ann_tuning: AnnTuningConfig::default(),
enable_ann_persistence: true,
sqlite_mmap_size_bytes: 268_435_456,
sqlite_cache_size_kib: 65_536,
}
}
}
impl RuntimeConfig {
pub fn durable() -> Self {
Self {
durability_profile: DurabilityProfile::Durable,
..Self::default()
}
}
pub fn fast_unsafe() -> Self {
Self {
durability_profile: DurabilityProfile::FastUnsafe,
..Self::default()
}
}
pub fn with_vector_index_mode(mut self, mode: VectorIndexMode) -> Self {
self.vector_index_mode = mode;
self
}
pub fn with_vector_storage_kind(mut self, kind: VectorStorageKind) -> Self {
self.vector_storage_kind = kind;
self
}
pub fn with_ann_tuning(mut self, tuning: AnnTuningConfig) -> Self {
self.ann_tuning = tuning;
self
}
pub fn with_ann_persistence(mut self, enabled: bool) -> Self {
self.enable_ann_persistence = enabled;
self
}
pub fn with_sqlite_mmap_size(mut self, bytes: i64) -> Self {
self.sqlite_mmap_size_bytes = bytes.max(0);
self
}
pub fn with_sqlite_cache_size_kib(mut self, kib: i64) -> Self {
self.sqlite_cache_size_kib = kib.max(0);
self
}
fn synchronous_sql(&self) -> &'static str {
match self.durability_profile {
DurabilityProfile::Balanced => "NORMAL",
DurabilityProfile::Durable => "FULL",
DurabilityProfile::FastUnsafe => "OFF",
}
}
}
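/// One ranked hit. `vector_score` and `text_score` are the per-signal inputs
/// behind `hybrid_score`; `doc_id`, `content`, and `metadata` are only
/// hydrated when the request sets `include_payloads`.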
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct SearchResult {
pub chunk_id: String,
pub doc_id: String,
pub content: String,
pub metadata: Value,
pub vector_score: f32,
pub text_score: f32,
pub hybrid_score: f32,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct VectorIndexStats {
pub mode: String,
pub storage_kind: String,
pub dimension: Option<usize>,
pub entries: usize,
pub estimated_memory_bytes: usize,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct SqlRiteDiagnostics {
pub chunk_count: usize,
pub document_count: usize,
pub integrity_check_ok: bool,
pub schema_version: i64,
pub vector_index: Option<VectorIndexStats>,
pub fts_enabled: bool,
}
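/// Selects which maintenance actions [`SqlRite::compact`] runs; at least one
/// flag must be enabled, and the default enables all of them.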
#[derive(Debug, Clone, Copy, Serialize, Deserialize)]
pub struct CompactionOptions {
pub dedupe_by_content_hash: bool,
pub prune_orphan_documents: bool,
pub wal_checkpoint_truncate: bool,
pub analyze: bool,
pub vacuum: bool,
}
impl Default for CompactionOptions {
fn default() -> Self {
Self {
dedupe_by_content_hash: true,
prune_orphan_documents: true,
wal_checkpoint_truncate: true,
analyze: true,
vacuum: true,
}
}
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct CompactionReport {
pub before_chunks: usize,
pub after_chunks: usize,
pub removed_chunks: usize,
pub deduplicated_chunks: usize,
pub before_documents: usize,
pub after_documents: usize,
pub orphan_documents_removed: usize,
pub wal_checkpoint_applied: bool,
pub analyze_applied: bool,
pub vacuum_applied: bool,
pub vector_index_rebuilt: bool,
pub database_size_before_bytes: Option<u64>,
pub database_size_after_bytes: Option<u64>,
pub reclaimed_bytes: Option<u64>,
pub duration_ms: f64,
}
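/// A single open connection plus its in-memory vector and filter indexes.
/// Interior mutability (`RefCell`) keeps the public API `&self`, so a value
/// serves one thread; use [`SqlRiteHandle`] to reach the same file from
/// several places.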
#[derive(Debug)]
pub struct SqlRite {
conn: Connection,
fts_enabled: bool,
runtime_config: RuntimeConfig,
schema_version: i64,
vector_index: Option<RefCell<BuiltinVectorIndex>>,
filter_index: RefCell<ChunkFilterIndex>,
db_path: Option<PathBuf>,
}
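/// A cheap, cloneable pointer to a database file: every operation opens a
/// fresh [`SqlRite`] connection using the stored [`RuntimeConfig`].
///
/// A usage sketch (`ignore`d: crate name assumed):
///
/// ```ignore
/// use sqlrite::{SearchRequest, SqlRiteHandle};
///
/// let handle = SqlRiteHandle::open("index.db")?;
/// let hits = handle.search(SearchRequest::text("wal checkpoint", 3))?;
/// # Ok::<(), sqlrite::SqlRiteError>(())
/// ```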
#[derive(Debug, Clone)]
pub struct SqlRiteHandle {
db_path: PathBuf,
runtime_config: RuntimeConfig,
}
#[derive(Debug)]
struct CandidateChunkRecord {
id: String,
doc_id: String,
metadata: Value,
}
#[derive(Debug, Clone)]
struct ChunkFilterIndexEntry {
chunk_id: String,
doc_id: String,
metadata_pairs: Vec<(String, String)>,
}
#[derive(Debug, Default)]
struct ChunkFilterIndex {
by_doc_id: HashMap<String, RoaringTreemap>,
by_metadata: HashMap<(String, String), RoaringTreemap>,
by_chunk_key: HashMap<ChunkKey, ChunkFilterIndexEntry>,
chunk_key_by_id: HashMap<String, ChunkKey>,
}
#[derive(Debug)]
struct ScoredChunk {
chunk_id: String,
vector_score: f32,
text_score: f32,
}
#[derive(Debug, Default)]
struct FtsCandidates {
ordered_chunk_ids: Vec<String>,
scores: HashMap<String, f32>,
}
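/// Which signal drives candidate generation for a hybrid query: the vector
/// pool first, the text pool first, or both merged evenly.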
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
enum HybridPlannerMode {
VectorFirst,
TextFirst,
BalancedHybrid,
}
impl ChunkFilterIndex {
fn from_connection(conn: &Connection) -> Result<Self> {
let mut stmt = conn.prepare("SELECT rowid, id, doc_id, metadata FROM chunks")?;
let rows = stmt.query_map([], |row| {
let chunk_key: i64 = row.get(0)?;
let chunk_id: String = row.get(1)?;
let doc_id: String = row.get(2)?;
let metadata_text: String = row.get(3)?;
let metadata = serde_json::from_str::<Value>(&metadata_text).map_err(|e| {
rusqlite::Error::FromSqlConversionFailure(
3,
rusqlite::types::Type::Text,
Box::new(e),
)
})?;
Ok((chunk_key as ChunkKey, chunk_id, doc_id, metadata))
})?;
let mut index = Self::default();
for row in rows {
let (chunk_key, chunk_id, doc_id, metadata) = row?;
index.upsert_chunk(chunk_key, &chunk_id, &doc_id, &metadata);
}
Ok(index)
}
fn upsert_chunk(
&mut self,
chunk_key: ChunkKey,
chunk_id: &str,
doc_id: &str,
metadata: &Value,
) {
self.remove_chunk_by_id(chunk_id);
self.by_doc_id
.entry(doc_id.to_string())
.or_default()
.insert(chunk_key);
let metadata_pairs = extract_filterable_metadata_pairs(metadata);
for (key, value) in &metadata_pairs {
self.by_metadata
.entry((key.clone(), value.clone()))
.or_default()
.insert(chunk_key);
}
self.by_chunk_key.insert(
chunk_key,
ChunkFilterIndexEntry {
chunk_id: chunk_id.to_string(),
doc_id: doc_id.to_string(),
metadata_pairs,
},
);
self.chunk_key_by_id.insert(chunk_id.to_string(), chunk_key);
}
fn remove_chunk_by_id(&mut self, chunk_id: &str) {
let Some(chunk_key) = self.chunk_key_by_id.remove(chunk_id) else {
return;
};
self.remove_chunk_key(chunk_key);
}
fn remove_chunk_key(&mut self, chunk_key: ChunkKey) {
let Some(existing) = self.by_chunk_key.remove(&chunk_key) else {
return;
};
self.chunk_key_by_id.remove(&existing.chunk_id);
if let Some(ids) = self.by_doc_id.get_mut(&existing.doc_id) {
ids.remove(chunk_key);
if ids.is_empty() {
self.by_doc_id.remove(&existing.doc_id);
}
}
for (key, value) in existing.metadata_pairs {
let map_key = (key, value);
if let Some(ids) = self.by_metadata.get_mut(&map_key) {
ids.remove(chunk_key);
if ids.is_empty() {
self.by_metadata.remove(&map_key);
}
}
}
}
fn filtered_chunk_keys(&self, request: &SearchRequest) -> Option<RoaringTreemap> {
if request.doc_id.is_none() && request.metadata_filters.is_empty() {
return None;
}
let mut working_set: Option<RoaringTreemap> = None;
if let Some(doc_id) = &request.doc_id {
let ids = self.by_doc_id.get(doc_id)?;
working_set = Some(ids.clone());
}
for (key, value) in &request.metadata_filters {
let ids = self.by_metadata.get(&(key.clone(), value.clone()))?;
if let Some(current) = &mut working_set {
*current &= ids.clone();
if current.is_empty() {
return Some(RoaringTreemap::new());
}
} else {
working_set = Some(ids.clone());
}
}
working_set
}
}
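/// Flattens top-level scalar metadata (strings, numbers, booleans) into the
/// `(key, value)` string pairs the filter index matches on; everything else
/// (nulls, arrays, nested objects) is skipped.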
fn extract_filterable_metadata_pairs(metadata: &Value) -> Vec<(String, String)> {
let Some(object) = metadata.as_object() else {
return Vec::new();
};
object
.iter()
.filter_map(|(key, value)| {
let normalized = match value {
Value::String(text) => Some(text.clone()),
Value::Number(number) => Some(number.to_string()),
Value::Bool(flag) => Some(flag.to_string()),
_ => None,
}?;
Some((key.clone(), normalized))
})
.collect()
}
impl SqlRiteHandle {
pub fn open(path: impl AsRef<Path>) -> Result<Self> {
Self::open_with_config(path, RuntimeConfig::default())
}
pub fn open_with_config(path: impl AsRef<Path>, runtime_config: RuntimeConfig) -> Result<Self> {
let path = path.as_ref().to_path_buf();
let _ = SqlRite::open_with_config(&path, runtime_config.clone())?;
Ok(Self {
db_path: path,
runtime_config,
})
}
pub fn db_path(&self) -> &Path {
&self.db_path
}
pub fn runtime_config(&self) -> &RuntimeConfig {
&self.runtime_config
}
pub fn connect(&self) -> Result<SqlRite> {
SqlRite::open_with_config(&self.db_path, self.runtime_config.clone())
}
pub fn with_db<T>(&self, f: impl FnOnce(&SqlRite) -> Result<T>) -> Result<T> {
let db = self.connect()?;
f(&db)
}
pub fn search(&self, request: SearchRequest) -> Result<Vec<SearchResult>> {
self.with_db(|db| db.search(request))
}
pub fn chunk_count(&self) -> Result<usize> {
self.with_db(SqlRite::chunk_count)
}
pub fn document_count(&self) -> Result<usize> {
self.with_db(SqlRite::document_count)
}
pub fn diagnostics(&self) -> Result<SqlRiteDiagnostics> {
self.with_db(SqlRite::diagnostics)
}
pub fn ingest_chunk(&self, chunk: &ChunkInput) -> Result<()> {
self.with_db(|db| db.ingest_chunk(chunk))
}
pub fn ingest_chunks(&self, chunks: &[ChunkInput]) -> Result<()> {
self.with_db(|db| db.ingest_chunks(chunks))
}
pub fn ingest_text_chunk(&self, chunk: &TextChunkInput) -> Result<()> {
self.with_db(|db| db.ingest_text_chunk(chunk))
}
pub fn ingest_text_chunks(&self, chunks: &[TextChunkInput]) -> Result<()> {
self.with_db(|db| db.ingest_text_chunks(chunks))
}
pub fn ingest_document_text(
&self,
doc_id: impl Into<String>,
content: impl AsRef<str>,
options: DocumentIngestOptions,
) -> Result<DocumentIngestReport> {
let doc_id = doc_id.into();
let content = content.as_ref().to_string();
self.with_db(|db| db.ingest_document_text(doc_id, &content, options))
}
pub fn update_chunk_embedding(&self, chunk_id: &str, embedding: Vec<f32>) -> Result<()> {
self.with_db(|db| db.update_chunk_embedding(chunk_id, embedding))
}
pub fn delete_by_doc_id(&self, doc_id: &str) -> Result<usize> {
self.with_db(|db| db.delete_by_doc_id(doc_id))
}
pub fn compact(&self, options: CompactionOptions) -> Result<CompactionReport> {
self.with_db(|db| db.compact(options))
}
}
impl SqlRite {
pub fn open(path: impl AsRef<Path>) -> Result<Self> {
let path = path.as_ref();
let conn = Connection::open(path)?;
Self::from_connection_with_config(conn, RuntimeConfig::default(), Some(path.to_path_buf()))
}
pub fn open_with_config(path: impl AsRef<Path>, config: RuntimeConfig) -> Result<Self> {
let path = path.as_ref();
let conn = Connection::open(path)?;
Self::from_connection_with_config(conn, config, Some(path.to_path_buf()))
}
pub fn open_in_memory() -> Result<Self> {
let conn = Connection::open_in_memory()?;
Self::from_connection_with_config(conn, RuntimeConfig::default(), None)
}
pub fn open_in_memory_with_config(config: RuntimeConfig) -> Result<Self> {
let conn = Connection::open_in_memory()?;
Self::from_connection_with_config(conn, config, None)
}
pub fn chunk_count(&self) -> Result<usize> {
let count = self
.conn
.query_row("SELECT COUNT(*) FROM chunks", [], |row| {
row.get::<_, i64>(0)
})?;
Ok(count as usize)
}
pub fn document_count(&self) -> Result<usize> {
let count = self
.conn
.query_row("SELECT COUNT(*) FROM documents", [], |row| {
row.get::<_, i64>(0)
})?;
Ok(count as usize)
}
pub fn integrity_check_ok(&self) -> Result<bool> {
let result: String = self
.conn
.query_row("PRAGMA integrity_check;", [], |row| row.get(0))?;
Ok(result.eq_ignore_ascii_case("ok"))
}
pub fn diagnostics(&self) -> Result<SqlRiteDiagnostics> {
Ok(SqlRiteDiagnostics {
chunk_count: self.chunk_count()?,
document_count: self.document_count()?,
integrity_check_ok: self.integrity_check_ok()?,
schema_version: self.schema_version(),
vector_index: self.vector_index_stats(),
fts_enabled: self.fts_enabled,
})
}
pub fn compact(&self, options: CompactionOptions) -> Result<CompactionReport> {
if !options.dedupe_by_content_hash
&& !options.prune_orphan_documents
&& !options.wal_checkpoint_truncate
&& !options.analyze
&& !options.vacuum
{
return Err(SqlRiteError::InvalidCompactionConfig(
"at least one compaction action must be enabled".to_string(),
));
}
let started = Instant::now();
let before_chunks = self.chunk_count()?;
let before_documents = self.document_count()?;
let database_size_before_bytes = self.database_file_size_bytes();
let deduplicated_chunks = if options.dedupe_by_content_hash {
self.delete_content_hash_duplicates()?
} else {
0
};
let orphan_documents_removed = if options.prune_orphan_documents {
self.conn.execute(
"DELETE FROM documents
WHERE NOT EXISTS (
SELECT 1 FROM chunks
WHERE chunks.doc_id = documents.id
)",
[],
)?
} else {
0
};
let mut vector_index_rebuilt = false;
if deduplicated_chunks > 0 {
self.rebuild_vector_index()?;
self.rebuild_filter_index()?;
self.persist_vector_index_artifacts_if_enabled()?;
vector_index_rebuilt = true;
}
let wal_checkpoint_applied = options.wal_checkpoint_truncate;
if wal_checkpoint_applied {
self.conn
.execute_batch("PRAGMA wal_checkpoint(TRUNCATE);")?;
}
let analyze_applied = options.analyze;
if analyze_applied {
self.conn.execute_batch("ANALYZE;")?;
}
let vacuum_applied = options.vacuum && self.db_path.is_some();
if vacuum_applied {
self.conn.execute_batch("VACUUM;")?;
}
let after_chunks = self.chunk_count()?;
let after_documents = self.document_count()?;
let database_size_after_bytes = self.database_file_size_bytes();
let reclaimed_bytes = match (database_size_before_bytes, database_size_after_bytes) {
(Some(before), Some(after)) if before >= after => Some(before - after),
_ => None,
};
Ok(CompactionReport {
before_chunks,
after_chunks,
removed_chunks: before_chunks.saturating_sub(after_chunks),
deduplicated_chunks,
before_documents,
after_documents,
orphan_documents_removed,
wal_checkpoint_applied,
analyze_applied,
vacuum_applied,
vector_index_rebuilt,
database_size_before_bytes,
database_size_after_bytes,
reclaimed_bytes,
duration_ms: started.elapsed().as_secs_f64() * 1000.0,
})
}
pub fn delete_chunks_by_metadata(&self, key: &str, value: &str) -> Result<usize> {
let safe_key = sanitize_metadata_key(key)?;
let sql = format!(
"DELETE FROM chunks WHERE json_extract(metadata, '$.{}') = ?",
safe_key
);
let deleted = self.conn.execute(&sql, params![value])?;
if deleted > 0 {
self.rebuild_vector_index()?;
self.rebuild_filter_index()?;
self.persist_vector_index_artifacts_if_enabled()?;
}
Ok(deleted)
}
pub fn delete_by_doc_id(&self, doc_id: &str) -> Result<usize> {
let deleted = self
.conn
.execute("DELETE FROM chunks WHERE doc_id = ?1", params![doc_id])?;
self.conn.execute(
"DELETE FROM documents
WHERE id = ?1
AND NOT EXISTS (SELECT 1 FROM chunks WHERE chunks.doc_id = documents.id)",
params![doc_id],
)?;
if deleted > 0 {
self.rebuild_vector_index()?;
self.rebuild_filter_index()?;
self.persist_vector_index_artifacts_if_enabled()?;
}
Ok(deleted)
}
pub fn list_chunks_page(
&self,
offset: usize,
limit: usize,
tenant_id: Option<&str>,
) -> Result<Vec<StoredChunk>> {
if limit == 0 {
return Ok(Vec::new());
}
let mut sql = String::from(
"
SELECT c.id, c.doc_id, c.content, c.metadata, d.source
FROM chunks AS c
LEFT JOIN documents AS d ON d.id = c.doc_id
",
);
let mut params = Vec::new();
if let Some(tenant_id) = tenant_id {
sql.push_str(" WHERE json_extract(c.metadata, '$.tenant') = ?");
params.push(SqlValue::from(tenant_id.to_string()));
}
sql.push_str(" ORDER BY c.rowid ASC LIMIT ? OFFSET ?");
params.push(SqlValue::Integer(limit as i64));
params.push(SqlValue::Integer(offset as i64));
let mut stmt = self.conn.prepare(&sql)?;
let rows = stmt.query_map(params_from_iter(params), |row| {
let metadata_text: String = row.get(3)?;
let metadata = serde_json::from_str::<Value>(&metadata_text).map_err(|e| {
rusqlite::Error::FromSqlConversionFailure(
3,
rusqlite::types::Type::Text,
Box::new(e),
)
})?;
Ok(StoredChunk {
id: row.get(0)?,
doc_id: row.get(1)?,
content: row.get(2)?,
metadata,
source: row.get(4)?,
})
})?;
let mut out = Vec::new();
for row in rows {
out.push(row?);
}
Ok(out)
}
pub fn update_chunk_metadata(&self, chunk_id: &str, metadata: &Value) -> Result<()> {
let metadata_json = serde_json::to_string(metadata)?;
self.conn.execute(
"UPDATE chunks SET metadata = ?1 WHERE id = ?2",
params![metadata_json, chunk_id],
)?;
if let Ok((chunk_key, doc_id)) = self.conn.query_row(
"SELECT rowid, doc_id FROM chunks WHERE id = ?1",
params![chunk_id],
|row| Ok((row.get::<_, i64>(0)? as ChunkKey, row.get::<_, String>(1)?)),
) {
self.filter_index
.borrow_mut()
.upsert_chunk(chunk_key, chunk_id, &doc_id, metadata);
}
Ok(())
}
pub fn schema_version(&self) -> i64 {
self.schema_version
}
pub fn runtime_config(&self) -> &RuntimeConfig {
&self.runtime_config
}
pub fn vector_index_stats(&self) -> Option<VectorIndexStats> {
let index = self.vector_index.as_ref()?;
let index = index.borrow();
Some(VectorIndexStats {
mode: index.name().to_string(),
storage_kind: index.storage_kind().as_str().to_string(),
dimension: index.dimension(),
entries: index.len(),
estimated_memory_bytes: index.estimated_memory_bytes(),
})
}
pub fn ingest_chunk(&self, chunk: &ChunkInput) -> Result<()> {
self.ingest_chunks(std::slice::from_ref(chunk))
}
pub fn chunk_text(content: &str, strategy: &ChunkingStrategy) -> Vec<String> {
chunk_text_for_ingest(content, strategy)
}
pub fn ingest_text_chunk(&self, chunk: &TextChunkInput) -> Result<()> {
self.ingest_text_chunks(std::slice::from_ref(chunk))
}
pub fn ingest_chunks(&self, chunks: &[ChunkInput]) -> Result<()> {
if chunks.is_empty() {
return Ok(());
}
self.validate_ingest_chunks(chunks)?;
let tx = self.conn.unchecked_transaction()?;
{
let mut doc_stmt = tx.prepare(DOC_UPSERT_SQL)?;
let mut chunk_stmt = tx.prepare(CHUNK_UPSERT_SQL)?;
for chunk in chunks {
let metadata_json = serde_json::to_string(&chunk.metadata)?;
let embedding_dim = chunk.embedding.len() as i64;
let embedding_blob = encode_embedding(&chunk.embedding);
doc_stmt.execute(params![chunk.doc_id, chunk.source.as_deref()])?;
chunk_stmt.execute(params![
chunk.id,
chunk.doc_id,
chunk.content,
metadata_json,
embedding_blob,
embedding_dim
])?;
}
}
tx.commit()?;
let chunk_keys = self.fetch_chunk_keys_by_ids(
&chunks
.iter()
.map(|chunk| chunk.id.clone())
.collect::<Vec<_>>(),
)?;
if let Some(index) = &self.vector_index {
let mut index = index.borrow_mut();
let upserts: Vec<VectorEntryRecord> = chunks
.iter()
.filter_map(|chunk| {
chunk_keys
.get(&chunk.id)
.copied()
.map(|chunk_key| VectorEntryRecord {
chunk_key,
chunk_id: chunk.id.clone(),
embedding: chunk.embedding.clone(),
})
})
.collect();
index.upsert_records(&upserts)?;
}
{
let mut filter_index = self.filter_index.borrow_mut();
for chunk in chunks {
if let Some(chunk_key) = chunk_keys.get(&chunk.id).copied() {
filter_index.upsert_chunk(chunk_key, &chunk.id, &chunk.doc_id, &chunk.metadata);
}
}
}
self.persist_vector_index_artifacts_if_enabled()?;
Ok(())
}
pub fn ingest_text_chunks(&self, chunks: &[TextChunkInput]) -> Result<()> {
if chunks.is_empty() {
return Ok(());
}
let tx = self.conn.unchecked_transaction()?;
{
let mut doc_stmt = tx.prepare(DOC_UPSERT_SQL)?;
let mut chunk_stmt = tx.prepare(CHUNK_UPSERT_SQL)?;
for chunk in chunks {
let metadata_json = serde_json::to_string(&chunk.metadata)?;
doc_stmt.execute(params![chunk.doc_id, chunk.source.as_deref()])?;
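                // Text-only chunks persist an empty embedding blob with
                // dim 0, which schema v4 permits.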
chunk_stmt.execute(params![
chunk.id,
chunk.doc_id,
chunk.content,
metadata_json,
Vec::<u8>::new(),
0i64
])?;
}
}
tx.commit()?;
let chunk_keys = self.fetch_chunk_keys_by_ids(
&chunks
.iter()
.map(|chunk| chunk.id.clone())
.collect::<Vec<_>>(),
)?;
{
let mut filter_index = self.filter_index.borrow_mut();
for chunk in chunks {
if let Some(chunk_key) = chunk_keys.get(&chunk.id).copied() {
filter_index.upsert_chunk(chunk_key, &chunk.id, &chunk.doc_id, &chunk.metadata);
}
}
}
Ok(())
}
pub fn ingest_document_text(
&self,
doc_id: impl Into<String>,
content: impl AsRef<str>,
options: DocumentIngestOptions,
) -> Result<DocumentIngestReport> {
let doc_id = doc_id.into();
let DocumentIngestOptions {
chunking,
metadata,
source,
chunk_id_prefix,
} = options;
let chunk_bodies = chunk_text_for_ingest(content.as_ref(), &chunking);
if chunk_bodies.is_empty() {
return Ok(DocumentIngestReport {
doc_id,
chunk_ids: Vec::new(),
chunk_count: 0,
});
}
let chunk_prefix = chunk_id_prefix.unwrap_or_else(|| format!("{doc_id}:chunk"));
let chunks = chunk_bodies
.into_iter()
.enumerate()
.map(|(idx, body)| {
let mut chunk = TextChunkInput::new(format!("{chunk_prefix}-{idx}"), &doc_id, body)
.with_metadata(metadata.clone());
if let Some(source) = &source {
chunk = chunk.with_source(source.clone());
}
chunk
})
.collect::<Vec<_>>();
let chunk_ids = chunks
.iter()
.map(|chunk| chunk.id.clone())
.collect::<Vec<_>>();
self.ingest_text_chunks(&chunks)?;
Ok(DocumentIngestReport {
doc_id,
chunk_count: chunk_ids.len(),
chunk_ids,
})
}
pub fn update_chunk_embedding(&self, chunk_id: &str, embedding: Vec<f32>) -> Result<()> {
if embedding.is_empty() {
return Err(SqlRiteError::EmptyEmbedding);
}
let chunk_key = self.conn.query_row(
"SELECT rowid FROM chunks WHERE id = ?1",
params![chunk_id],
|row| row.get::<_, i64>(0),
)? as ChunkKey;
let embedding_dim = embedding.len() as i64;
let embedding_blob = encode_embedding(&embedding);
self.conn.execute(
"UPDATE chunks SET embedding = ?1, embedding_dim = ?2 WHERE id = ?3",
params![embedding_blob, embedding_dim, chunk_id],
)?;
if let Some(index) = &self.vector_index {
index.borrow_mut().upsert_records(&[VectorEntryRecord {
chunk_key,
chunk_id: chunk_id.to_string(),
embedding,
}])?;
self.persist_vector_index_artifacts_if_enabled()?;
}
Ok(())
}
pub fn search(&self, request: SearchRequest) -> Result<Vec<SearchResult>> {
let request = request.resolve_query_profile();
request.validate()?;
let query_embedding = request.query_embedding.as_ref();
let normalized_query_embedding =
query_embedding.map(|query| normalize_embedding_for_search(query));
let query_text = request.query_text.as_deref();
let query_tokens = query_text.map(tokenize);
let use_vector = query_embedding.is_some();
let use_text = query_text.is_some();
let hybrid_planner_mode =
select_hybrid_planner_mode(&request, self.fts_enabled, self.vector_index.is_some());
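        // Fast path: a pure vector query needs no fusion, so fetch exactly
        // `top_k` candidates from the index and return them directly.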
if let Some(query_vector) = query_embedding
&& !use_text
{
let mut vector_request = request.clone();
vector_request.candidate_limit = request.top_k;
let vector_candidates = self.vector_candidates(query_vector, &vector_request)?;
return self.build_vector_only_results(vector_candidates, &request);
}
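        // Hybrid path: build vector and text candidate pools in the order the
        // planner mode dictates, then merge, rerank, score, and hydrate.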
        let mut vector_score_lookup = HashMap::new();
        let mut vector_candidate_ids = Vec::new();
        let mut text_scores = HashMap::new();
        let mut text_candidate_ids = Vec::new();
if let Some(query_vector) = query_embedding
&& !matches!(hybrid_planner_mode, Some(HybridPlannerMode::TextFirst))
{
let mut vector_request = request.clone();
if let Some(mode) = hybrid_planner_mode {
vector_request.candidate_limit = hybrid_primary_candidate_limit(&request, mode);
}
let vector_candidates = self.vector_candidates(query_vector, &vector_request)?;
vector_score_lookup = vector_candidates
.iter()
.map(|candidate| (candidate.chunk_id.clone(), candidate.score))
.collect();
vector_candidate_ids = vector_candidates
.iter()
.map(|candidate| candidate.chunk_id.clone())
.collect();
}
if let Some(text) = query_text
&& self.fts_enabled
{
let need_text_candidates = match hybrid_planner_mode {
Some(HybridPlannerMode::VectorFirst) => vector_candidate_ids.len() < request.top_k,
Some(HybridPlannerMode::TextFirst) => true,
Some(HybridPlannerMode::BalancedHybrid) | None => {
!use_vector || vector_candidate_ids.len() < request.candidate_limit
}
};
if need_text_candidates {
let text_limit = match hybrid_planner_mode {
Some(mode) => hybrid_primary_candidate_limit(&request, mode),
None if use_vector => match request.query_profile {
QueryProfile::Latency => request.candidate_limit,
QueryProfile::Balanced => request.candidate_limit.saturating_mul(2),
QueryProfile::Recall => request.candidate_limit.saturating_mul(4),
},
None => request.candidate_limit,
};
let fts_candidates = self
.fts_text_candidates(text, &request, text_limit)
.unwrap_or_default();
text_candidate_ids = fts_candidates.ordered_chunk_ids;
if !use_vector || matches!(hybrid_planner_mode, Some(HybridPlannerMode::TextFirst))
{
text_scores = fts_candidates.scores;
}
}
}
if let Some(query_vector) = query_embedding
&& matches!(hybrid_planner_mode, Some(HybridPlannerMode::TextFirst))
&& vector_candidate_ids.len() < request.top_k
{
let mut vector_request = request.clone();
vector_request.candidate_limit =
hybrid_secondary_candidate_limit(&request, HybridPlannerMode::TextFirst);
let vector_candidates = self.vector_candidates(query_vector, &vector_request)?;
vector_score_lookup = vector_candidates
.iter()
.map(|candidate| (candidate.chunk_id.clone(), candidate.score))
.collect();
vector_candidate_ids = vector_candidates
.iter()
.map(|candidate| candidate.chunk_id.clone())
.collect();
}
        let fetch_ids = match hybrid_planner_mode {
            Some(HybridPlannerMode::VectorFirst) => merge_ranked_candidate_ids(
                &vector_candidate_ids,
                &text_candidate_ids,
                request.candidate_limit,
            ),
            Some(HybridPlannerMode::TextFirst) => merge_ranked_candidate_ids(
                &text_candidate_ids,
                &vector_candidate_ids,
                request.candidate_limit,
            ),
            Some(HybridPlannerMode::BalancedHybrid) | None => merge_candidate_ids(
                &vector_candidate_ids,
                &text_candidate_ids,
                request.candidate_limit,
                use_vector,
                use_text,
            ),
        };
let candidate_ids = if fetch_ids.is_empty() {
self.fetch_candidate_chunk_ids(&request)?
} else {
let mut items = fetch_ids;
let allow_sql_backfill = matches!(
hybrid_planner_mode,
None | Some(HybridPlannerMode::BalancedHybrid)
);
            if allow_sql_backfill && items.len() < request.candidate_limit {
let fallback = self.fetch_candidate_chunk_ids(&request)?;
let mut seen_ids: HashSet<String> = items.iter().cloned().collect();
for chunk_id in fallback {
if seen_ids.insert(chunk_id.clone()) {
items.push(chunk_id);
if items.len() >= request.candidate_limit {
break;
}
}
}
}
items.truncate(request.candidate_limit);
items
};
        let candidate_ids = if use_vector && use_text {
select_hybrid_rerank_ids(
candidate_ids,
&vector_score_lookup,
&text_scores,
&request,
hybrid_planner_mode,
)
} else {
candidate_ids
};
if let Some(text) = query_text
&& self.fts_enabled
&& candidate_ids
.iter()
.any(|chunk_id| !text_scores.contains_key(chunk_id))
&& !should_skip_fts_score_lookup(
use_vector,
self.fts_enabled,
vector_candidate_ids.len(),
request.candidate_limit,
)
{
let missing_text_ids: Vec<String> = candidate_ids
.iter()
.filter(|chunk_id| !text_scores.contains_key(*chunk_id))
.cloned()
.collect();
if !missing_text_ids.is_empty() {
text_scores.extend(
self.fts_text_scores_for_ids(text, &missing_text_ids)
.unwrap_or_default(),
);
}
}
let mut scored = Vec::with_capacity(candidate_ids.len());
let mut content_cache = HashMap::new();
let mut embedding_cache = HashMap::new();
let missing_text_ids = if use_text {
candidate_ids
.iter()
.filter(|chunk_id| text_scores.get(*chunk_id).copied().unwrap_or(0.0) <= 0.0)
.cloned()
.collect::<Vec<_>>()
} else {
Vec::new()
};
if !missing_text_ids.is_empty() {
content_cache = self.fetch_chunk_contents_by_ids(&missing_text_ids)?;
}
if use_vector {
let missing_vector_ids: Vec<String> = candidate_ids
.iter()
.filter(|chunk_id| !vector_score_lookup.contains_key(*chunk_id))
.cloned()
.collect();
if !missing_vector_ids.is_empty() {
embedding_cache = self.fetch_chunk_embeddings_by_ids(&missing_vector_ids)?;
}
}
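        // Score each candidate: vector scores come from the index when
        // available, otherwise from the freshly fetched embeddings; text
        // scores prefer FTS bm25 and fall back to lexical token overlap.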
for chunk_id in candidate_ids {
let vector_score = if let Some(query_vector) = query_embedding {
if let Some(score) = vector_score_lookup.get(&chunk_id).copied() {
score
} else if let Some(chunk_embedding) = embedding_cache.get(&chunk_id) {
if query_vector.len() != chunk_embedding.len() {
if !use_text {
continue;
}
0.0
} else {
cosine_similarity_with_normalized_query(
normalized_query_embedding
.as_deref()
.expect("normalized query exists"),
chunk_embedding,
)
}
} else if !use_text {
continue;
} else {
0.0
}
} else {
0.0
};
let text_score = if let Some(text) = query_text {
let fts_score = text_scores.get(&chunk_id).copied().unwrap_or(0.0);
if self.fts_enabled && fts_score > 0.0 {
fts_score
} else {
lexical_overlap_score(
query_tokens.as_ref().expect("tokens exist"),
text,
content_cache
.get(&chunk_id)
.map(String::as_str)
.unwrap_or_default(),
)
}
} else {
0.0
};
scored.push(ScoredChunk {
chunk_id,
vector_score,
text_score,
});
}
let hybrid_scores = compute_hybrid_scores(
&scored,
use_vector,
use_text,
request.alpha,
request.fusion_strategy,
);
let mut results = Vec::with_capacity(scored.len());
for entry in scored {
let hybrid_score = hybrid_scores.get(&entry.chunk_id).copied().unwrap_or(0.0);
results.push(SearchResult {
chunk_id: entry.chunk_id,
doc_id: String::new(),
content: String::new(),
metadata: Value::Null,
vector_score: entry.vector_score,
text_score: entry.text_score,
hybrid_score,
});
}
results.sort_by(|left, right| {
right
.hybrid_score
.total_cmp(&left.hybrid_score)
.then_with(|| right.vector_score.total_cmp(&left.vector_score))
.then_with(|| right.text_score.total_cmp(&left.text_score))
.then_with(|| left.chunk_id.cmp(&right.chunk_id))
});
results.truncate(request.top_k);
if request.include_payloads {
self.hydrate_search_result_payloads(&mut results, &mut content_cache)?;
}
Ok(results)
}
fn build_vector_only_results(
&self,
candidates: Vec<VectorCandidate>,
request: &SearchRequest,
) -> Result<Vec<SearchResult>> {
if candidates.is_empty() {
return Ok(Vec::new());
}
let mut results: Vec<SearchResult> = candidates
.into_iter()
.take(request.top_k)
.map(|candidate| SearchResult {
chunk_id: candidate.chunk_id,
doc_id: String::new(),
content: String::new(),
metadata: Value::Null,
vector_score: candidate.score,
text_score: 0.0,
hybrid_score: candidate.score,
})
.collect();
if request.include_payloads {
let mut content_cache = HashMap::new();
self.hydrate_search_result_payloads(&mut results, &mut content_cache)?;
}
Ok(results)
}
fn hydrate_search_result_payloads(
&self,
results: &mut Vec<SearchResult>,
content_cache: &mut HashMap<String, String>,
) -> Result<()> {
let final_ids: Vec<String> = results
.iter()
.map(|result| result.chunk_id.clone())
.collect();
if !final_ids.is_empty() {
let final_chunks = self.fetch_chunks_by_ids(&final_ids)?;
let final_chunk_lookup: HashMap<String, CandidateChunkRecord> = final_chunks
.into_iter()
.map(|chunk| (chunk.id.clone(), chunk))
.collect();
results.retain(|result| final_chunk_lookup.contains_key(&result.chunk_id));
for result in results.iter_mut() {
if let Some(chunk) = final_chunk_lookup.get(&result.chunk_id) {
result.doc_id = chunk.doc_id.clone();
result.metadata = chunk.metadata.clone();
}
}
}
let missing_content_ids: Vec<String> = results
.iter()
.filter(|result| !content_cache.contains_key(&result.chunk_id))
.map(|result| result.chunk_id.clone())
.collect();
if !missing_content_ids.is_empty() {
content_cache.extend(self.fetch_chunk_contents_by_ids(&missing_content_ids)?);
}
for result in results.iter_mut() {
if let Some(content) = content_cache.get(&result.chunk_id) {
result.content = content.clone();
}
}
Ok(())
}
fn from_connection_with_config(
mut conn: Connection,
runtime_config: RuntimeConfig,
db_path: Option<PathBuf>,
) -> Result<Self> {
apply_runtime_config(&conn, &runtime_config)?;
let schema_version = run_migrations(&mut conn)?;
let fts_enabled = initialize_fts(&conn);
let vector_index =
load_vector_index(&conn, &runtime_config, db_path.as_deref())?.map(RefCell::new);
let filter_index = RefCell::new(ChunkFilterIndex::from_connection(&conn)?);
Ok(Self {
conn,
fts_enabled,
runtime_config,
schema_version,
vector_index,
filter_index,
db_path,
})
}
fn rebuild_filter_index(&self) -> Result<()> {
*self.filter_index.borrow_mut() = ChunkFilterIndex::from_connection(&self.conn)?;
Ok(())
}
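    /// Writes sidecar snapshots of the vector index next to the database file
    /// so it can be reloaded without a full rebuild; a no-op for in-memory
    /// databases or when ANN persistence is disabled.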
fn persist_vector_index_artifacts_if_enabled(&self) -> Result<()> {
if !self.runtime_config.enable_ann_persistence {
return Ok(());
}
let Some(db_path) = self.db_path.as_deref() else {
return Ok(());
};
let Some(index) = self.vector_index.as_ref() else {
return Ok(());
};
let index = index.borrow();
let entries = index.export_records();
if self.runtime_config.vector_index_mode.is_ann() {
let Some(entry_sidecar_path) = ann_entry_sidecar_path(
db_path,
self.runtime_config.vector_index_mode,
self.runtime_config.vector_storage_kind,
) else {
return Ok(());
};
let Some(snapshot_path) = ann_snapshot_path(
db_path,
self.runtime_config.vector_index_mode,
self.runtime_config.vector_storage_kind,
) else {
return Ok(());
};
save_ann_entry_sidecar(
&entry_sidecar_path,
self.runtime_config.vector_storage_kind,
&entries,
)?;
save_ann_snapshot(
&snapshot_path,
self.runtime_config.vector_index_mode,
self.runtime_config.vector_storage_kind,
&entries,
)?;
if self.runtime_config.vector_index_mode == VectorIndexMode::HnswBaseline
&& let Some(graph_paths) = ann_graph_dump_paths(
db_path,
self.runtime_config.vector_index_mode,
self.runtime_config.vector_storage_kind,
)
&& let BuiltinVectorIndex::HnswBaseline(hnsw) = &*index
{
hnsw.dump_graph_snapshot(&graph_paths.directory, &graph_paths.basename)?;
}
}
if self.runtime_config.vector_index_mode == VectorIndexMode::BruteForce
&& let Some(segment_path) =
exact_segment_path(db_path, self.runtime_config.vector_storage_kind)
{
save_exact_segment_snapshot(
&segment_path,
self.runtime_config.vector_storage_kind,
&entries,
)?;
}
Ok(())
}
fn fetch_candidate_chunk_ids(&self, request: &SearchRequest) -> Result<Vec<String>> {
let mut sql = String::from("SELECT id FROM chunks");
let mut clauses = Vec::new();
let mut params = Vec::new();
if let Some(doc_id) = &request.doc_id {
clauses.push("doc_id = ?".to_string());
params.push(SqlValue::from(doc_id.clone()));
}
for (key, value) in &request.metadata_filters {
let safe_key = sanitize_metadata_key(key)?;
clauses.push(format!("json_extract(metadata, '$.{}') = ?", safe_key));
params.push(SqlValue::from(value.clone()));
}
if !clauses.is_empty() {
sql.push_str(" WHERE ");
sql.push_str(&clauses.join(" AND "));
}
sql.push_str(" ORDER BY created_at DESC, rowid DESC LIMIT ?");
params.push(SqlValue::Integer(request.candidate_limit as i64));
let mut stmt = self.conn.prepare(&sql)?;
let rows = stmt.query_map(params_from_iter(params), |row| row.get::<_, String>(0))?;
let mut items = Vec::new();
for row in rows {
items.push(row?);
}
Ok(items)
}
fn fetch_chunks_by_ids(&self, ids: &[String]) -> Result<Vec<CandidateChunkRecord>> {
if ids.is_empty() {
return Ok(Vec::new());
}
let mut by_id: HashMap<String, CandidateChunkRecord> = HashMap::new();
for chunk_ids in ids.chunks(900) {
let placeholders = std::iter::repeat_n("?", chunk_ids.len())
.collect::<Vec<_>>()
.join(", ");
let sql = format!(
"SELECT id, doc_id, metadata
FROM chunks
WHERE id IN ({})",
placeholders
);
let params: Vec<SqlValue> = chunk_ids
.iter()
.map(|id| SqlValue::from(id.clone()))
.collect();
let mut stmt = self.conn.prepare(&sql)?;
let rows = stmt.query_map(params_from_iter(params), map_candidate_chunk_row)?;
for row in rows {
let record = row?;
by_id.insert(record.id.clone(), record);
}
}
let mut ordered = Vec::with_capacity(ids.len());
for id in ids {
if let Some(record) = by_id.remove(id) {
ordered.push(record);
}
}
Ok(ordered)
}
fn fetch_chunk_embeddings_by_ids(&self, ids: &[String]) -> Result<HashMap<String, Vec<f32>>> {
if ids.is_empty() {
return Ok(HashMap::new());
}
let mut embeddings = HashMap::new();
for chunk_ids in ids.chunks(900) {
let placeholders = std::iter::repeat_n("?", chunk_ids.len())
.collect::<Vec<_>>()
.join(", ");
let sql = format!(
"SELECT id, embedding, embedding_dim
FROM chunks
WHERE id IN ({})",
placeholders
);
let params: Vec<SqlValue> = chunk_ids
.iter()
.map(|id| SqlValue::from(id.clone()))
.collect();
let mut stmt = self.conn.prepare(&sql)?;
let rows = stmt.query_map(params_from_iter(params), |row| {
let chunk_id: String = row.get(0)?;
let embedding_blob: Vec<u8> = row.get(1)?;
let embedding_dim: i64 = row.get(2)?;
if embedding_dim <= 0 || embedding_blob.is_empty() {
return Ok((chunk_id, Vec::new()));
}
let embedding =
decode_embedding(&embedding_blob, embedding_dim as usize).map_err(|e| {
rusqlite::Error::FromSqlConversionFailure(
1,
rusqlite::types::Type::Blob,
Box::new(std::io::Error::new(std::io::ErrorKind::InvalidData, e)),
)
})?;
Ok((chunk_id, embedding))
})?;
for row in rows {
let (chunk_id, embedding) = row?;
embeddings.insert(chunk_id, embedding);
}
}
Ok(embeddings)
}
fn fetch_chunk_contents_by_ids(&self, ids: &[String]) -> Result<HashMap<String, String>> {
if ids.is_empty() {
return Ok(HashMap::new());
}
let mut by_id = HashMap::with_capacity(ids.len());
for chunk_ids in ids.chunks(900) {
let placeholders = std::iter::repeat_n("?", chunk_ids.len())
.collect::<Vec<_>>()
.join(", ");
let sql = format!(
"SELECT id, content
FROM chunks
WHERE id IN ({})",
placeholders
);
let params: Vec<SqlValue> = chunk_ids
.iter()
.map(|id| SqlValue::from(id.clone()))
.collect();
let mut stmt = self.conn.prepare(&sql)?;
let rows = stmt.query_map(params_from_iter(params), |row| {
let id: String = row.get(0)?;
let content: String = row.get(1)?;
Ok((id, content))
})?;
for row in rows {
let (id, content) = row?;
by_id.insert(id, content);
}
}
Ok(by_id)
}
fn fetch_chunk_keys_by_ids(&self, ids: &[String]) -> Result<HashMap<String, ChunkKey>> {
fetch_chunk_keys_by_ids_from_connection(&self.conn, ids)
}
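    /// Prefers the in-memory vector index (applying doc/metadata filters via
    /// the filter index); falls back to a brute-force SQL scan when the index
    /// is absent, holds a different dimension, or unexpectedly returns
    /// nothing while non-empty.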
fn vector_candidates(
&self,
query_embedding: &[f32],
request: &SearchRequest,
) -> Result<Vec<VectorCandidate>> {
let indexed_candidates = if let Some(index) = &self.vector_index {
let index = index.borrow();
if index.dimension() != Some(query_embedding.len()) {
None
} else {
let filtered_query =
request.doc_id.is_some() || !request.metadata_filters.is_empty();
let query_result = if filtered_query {
let allowed_keys = self.filtered_chunk_keys(request)?;
if allowed_keys.is_empty() {
return Ok(Vec::new());
}
let allowed_positions = index.allowed_positions_for_keys(&allowed_keys);
if allowed_positions.is_empty() {
return Ok(Vec::new());
}
index.query_filtered_positions(
query_embedding,
request.candidate_limit,
&allowed_positions,
)
} else {
index.query(query_embedding, request.candidate_limit)
};
match query_result {
Ok(candidates) if !candidates.is_empty() || index.len() == 0 => {
Some(candidates)
}
Ok(_) | Err(_) => None,
}
}
} else {
None
};
if let Some(candidates) = indexed_candidates {
return Ok(candidates);
}
self.brute_force_vector_candidates(query_embedding, request)
}
fn filtered_chunk_keys(&self, request: &SearchRequest) -> Result<Vec<ChunkKey>> {
if let Some(ids) = self.filter_index.borrow().filtered_chunk_keys(request) {
return Ok(ids.iter().collect());
}
let mut sql = String::from("SELECT rowid FROM chunks");
let mut clauses = Vec::new();
let mut params = Vec::new();
if let Some(doc_id) = &request.doc_id {
clauses.push("doc_id = ?".to_string());
params.push(SqlValue::from(doc_id.clone()));
}
for (key, value) in &request.metadata_filters {
let safe_key = sanitize_metadata_key(key)?;
clauses.push(format!("json_extract(metadata, '$.{}') = ?", safe_key));
params.push(SqlValue::from(value.clone()));
}
if !clauses.is_empty() {
sql.push_str(" WHERE ");
sql.push_str(&clauses.join(" AND "));
}
let mut stmt = self.conn.prepare(&sql)?;
let rows = stmt.query_map(params_from_iter(params), |row| row.get::<_, i64>(0))?;
let mut ids = Vec::new();
for row in rows {
ids.push(row? as ChunkKey);
}
Ok(ids)
}
fn brute_force_vector_candidates(
&self,
query_embedding: &[f32],
request: &SearchRequest,
) -> Result<Vec<VectorCandidate>> {
let query_normalized = normalize_embedding_for_search(query_embedding);
let mut sql = String::from("SELECT id, embedding, embedding_dim FROM chunks");
let mut clauses = Vec::new();
let mut params = Vec::new();
if let Some(doc_id) = &request.doc_id {
clauses.push("doc_id = ?".to_string());
params.push(SqlValue::from(doc_id.clone()));
}
for (key, value) in &request.metadata_filters {
let safe_key = sanitize_metadata_key(key)?;
clauses.push(format!("json_extract(metadata, '$.{}') = ?", safe_key));
params.push(SqlValue::from(value.clone()));
}
if !clauses.is_empty() {
sql.push_str(" WHERE ");
sql.push_str(&clauses.join(" AND "));
}
let mut stmt = self.conn.prepare(&sql)?;
let rows = stmt.query_map(params_from_iter(params), |row| {
let chunk_id: String = row.get(0)?;
let embedding_blob: Vec<u8> = row.get(1)?;
let embedding_dim: i64 = row.get(2)?;
Ok((chunk_id, embedding_blob, embedding_dim))
})?;
let mut candidates = Vec::new();
for row in rows {
let (chunk_id, embedding_blob, embedding_dim) = row?;
if embedding_dim <= 0 || embedding_dim as usize != query_embedding.len() {
continue;
}
let embedding = decode_embedding(&embedding_blob, embedding_dim as usize)?;
let score = cosine_similarity_with_normalized_query(&query_normalized, &embedding);
candidates.push(VectorCandidate { chunk_id, score });
}
candidates.sort_by(|left, right| {
right
.score
.total_cmp(&left.score)
.then_with(|| left.chunk_id.cmp(&right.chunk_id))
});
candidates.truncate(request.candidate_limit);
Ok(candidates)
}
fn fts_text_candidates(
&self,
query_text: &str,
request: &SearchRequest,
limit: usize,
) -> Result<FtsCandidates> {
if limit == 0 {
return Ok(FtsCandidates::default());
}
let Some(match_query) = build_fts_match_query(query_text) else {
return Ok(FtsCandidates::default());
};
let mut sql;
let mut params = vec![SqlValue::from(match_query)];
if request.metadata_filters.is_empty() {
sql = String::from(
"SELECT chunk_id, bm25(chunks_fts) AS rank
FROM chunks_fts
WHERE chunks_fts MATCH ?",
);
if let Some(doc_id) = &request.doc_id {
sql.push_str(" AND doc_id = ?");
params.push(SqlValue::from(doc_id.clone()));
}
sql.push_str(" ORDER BY rank ASC, chunk_id ASC LIMIT ?");
params.push(SqlValue::Integer(limit as i64));
} else {
sql = String::from(
"SELECT f.chunk_id, bm25(chunks_fts) AS rank
FROM chunks_fts AS f
INNER JOIN chunks AS c ON c.id = f.chunk_id
WHERE chunks_fts MATCH ?",
);
if let Some(doc_id) = &request.doc_id {
sql.push_str(" AND c.doc_id = ?");
params.push(SqlValue::from(doc_id.clone()));
}
for (key, value) in &request.metadata_filters {
let safe_key = sanitize_metadata_key(key)?;
sql.push_str(&format!(
" AND json_extract(c.metadata, '$.{}') = ?",
safe_key
));
params.push(SqlValue::from(value.clone()));
}
sql.push_str(" ORDER BY rank ASC, f.chunk_id ASC LIMIT ?");
params.push(SqlValue::Integer(limit as i64));
}
let mut stmt = self.conn.prepare(&sql)?;
let rows = stmt.query_map(params_from_iter(params), |row| {
let chunk_id: String = row.get(0)?;
let rank: f64 = row.get(1)?;
Ok((chunk_id, rank))
})?;
let mut ranked = Vec::new();
for row in rows {
ranked.push(row?);
}
if ranked.is_empty() {
return Ok(FtsCandidates::default());
}
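        // SQLite's bm25() is lower-is-better (more negative means a stronger
        // match), so anchor on the best rank and squash into (0, 1], giving
        // the top hit a normalized score of exactly 1.0.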
let min_rank = ranked
.iter()
.map(|(_, rank)| *rank)
.fold(f64::INFINITY, f64::min);
let mut scores = HashMap::with_capacity(ranked.len());
let mut ordered_chunk_ids = Vec::with_capacity(ranked.len());
for (chunk_id, rank) in ranked {
let normalized = 1.0 / (1.0 + (rank - min_rank).max(0.0) as f32);
scores.insert(chunk_id.clone(), normalized);
ordered_chunk_ids.push(chunk_id);
}
Ok(FtsCandidates {
ordered_chunk_ids,
scores,
})
}
fn fts_text_scores_for_ids(
&self,
query_text: &str,
candidate_ids: &[String],
) -> Result<HashMap<String, f32>> {
if candidate_ids.is_empty() {
return Ok(HashMap::new());
}
let Some(match_query) = build_fts_match_query(query_text) else {
return Ok(HashMap::new());
};
let mut ranked = Vec::new();
for ids in candidate_ids.chunks(900) {
let placeholders = std::iter::repeat_n("?", ids.len())
.collect::<Vec<_>>()
.join(", ");
let sql = format!(
"SELECT chunk_id, bm25(chunks_fts) AS rank
FROM chunks_fts
WHERE chunks_fts MATCH ? AND chunk_id IN ({})",
placeholders
);
let mut params = Vec::with_capacity(ids.len() + 1);
params.push(SqlValue::from(match_query.clone()));
for id in ids {
params.push(SqlValue::from(id.clone()));
}
let mut stmt = self.conn.prepare(&sql)?;
let rows = stmt.query_map(params_from_iter(params), |row| {
let chunk_id: String = row.get(0)?;
let rank: f64 = row.get(1)?;
Ok((chunk_id, rank))
})?;
for row in rows {
ranked.push(row?);
}
}
if ranked.is_empty() {
return Ok(HashMap::new());
}
let min_rank = ranked
.iter()
.map(|(_, rank)| *rank)
.fold(f64::INFINITY, f64::min);
let mut scores = HashMap::with_capacity(ranked.len());
for (chunk_id, rank) in ranked {
let normalized = 1.0 / (1.0 + (rank - min_rank).max(0.0) as f32);
scores
.entry(chunk_id)
.and_modify(|existing| {
if normalized > *existing {
*existing = normalized;
}
})
.or_insert(normalized);
}
Ok(scores)
}
fn database_file_size_bytes(&self) -> Option<u64> {
self.db_path
.as_ref()
.and_then(|path| fs::metadata(path).ok())
.map(|meta| meta.len())
}
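/// Deletes chunks that duplicate another row's (doc_id, tenant, content_hash)
/// triple, keeping the copy with the highest rowid. Returns the number of
/// rows removed.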
fn delete_content_hash_duplicates(&self) -> Result<usize> {
let deleted = self.conn.execute(
"
DELETE FROM chunks
WHERE rowid IN (
SELECT c.rowid
FROM chunks AS c
JOIN (
SELECT
doc_id,
COALESCE(json_extract(metadata, '$.tenant'), '') AS tenant,
json_extract(metadata, '$.content_hash') AS content_hash,
MAX(rowid) AS keep_rowid
FROM chunks
WHERE json_extract(metadata, '$.content_hash') IS NOT NULL
GROUP BY
doc_id,
COALESCE(json_extract(metadata, '$.tenant'), ''),
json_extract(metadata, '$.content_hash')
HAVING COUNT(*) > 1
) AS dup
ON c.doc_id = dup.doc_id
AND COALESCE(json_extract(c.metadata, '$.tenant'), '') = dup.tenant
AND json_extract(c.metadata, '$.content_hash') = dup.content_hash
WHERE c.rowid <> dup.keep_rowid
)
",
[],
)?;
Ok(deleted)
}
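/// Rejects empty embeddings and, when a vector index is configured, enforces
/// one embedding dimension across the batch (seeded from the index's current
/// dimension, or from the first chunk when the index is still empty).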
fn validate_ingest_chunks(&self, chunks: &[ChunkInput]) -> Result<()> {
let enforce_dimension = self.vector_index.is_some();
let mut expected_dimension = self
.vector_index
.as_ref()
.and_then(|index| index.borrow().dimension());
for chunk in chunks {
if chunk.embedding.is_empty() {
return Err(SqlRiteError::EmptyEmbedding);
}
if let Some(expected) = expected_dimension {
if expected != chunk.embedding.len() {
return Err(SqlRiteError::EmbeddingDimensionMismatch {
expected,
found: chunk.embedding.len(),
});
}
} else if enforce_dimension {
expected_dimension = Some(chunk.embedding.len());
}
}
Ok(())
}
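/// Rebuilds the vector index from the `chunks` table, streaming rows in rowid
/// order and upserting in batches of 1024. Rows with no stored embedding are
/// skipped; undecodable embedding blobs abort the rebuild.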
fn rebuild_vector_index(&self) -> Result<()> {
let Some(index) = &self.vector_index else {
return Ok(());
};
let mut index = index.borrow_mut();
index.reset()?;
let mut stmt = self.conn.prepare(
"SELECT rowid, id, embedding, embedding_dim
FROM chunks
ORDER BY rowid ASC",
)?;
let rows = stmt.query_map([], |row| {
let chunk_key: i64 = row.get(0)?;
let id: String = row.get(1)?;
let embedding_blob: Vec<u8> = row.get(2)?;
let embedding_dim: i64 = row.get(3)?;
if embedding_dim <= 0 || embedding_blob.is_empty() {
return Ok(None);
}
let embedding =
decode_embedding(&embedding_blob, embedding_dim as usize).map_err(|e| {
rusqlite::Error::FromSqlConversionFailure(
2,
rusqlite::types::Type::Blob,
Box::new(std::io::Error::new(std::io::ErrorKind::InvalidData, e)),
)
})?;
Ok(Some(VectorEntryRecord {
chunk_key: chunk_key as ChunkKey,
chunk_id: id,
embedding,
}))
})?;
let mut batch: Vec<VectorEntryRecord> = Vec::with_capacity(1024);
for row in rows {
if let Some(record) = row? {
batch.push(record);
}
if batch.len() >= 1024 {
index.upsert_records(&batch)?;
batch.clear();
}
}
if !batch.is_empty() {
index.upsert_records(&batch)?;
}
Ok(())
}
}
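/// Maps an (id, doc_id, metadata) row into a CandidateChunkRecord, surfacing
/// malformed metadata JSON as a column conversion error.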
fn map_candidate_chunk_row(row: &rusqlite::Row<'_>) -> rusqlite::Result<CandidateChunkRecord> {
let metadata_text: String = row.get(2)?;
let metadata = serde_json::from_str::<Value>(&metadata_text).map_err(|e| {
rusqlite::Error::FromSqlConversionFailure(2, rusqlite::types::Type::Text, Box::new(e))
})?;
Ok(CandidateChunkRecord {
id: row.get(0)?,
doc_id: row.get(1)?,
metadata,
})
}
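/// Merges vector then text candidate ids in order, deduplicating and stopping
/// once `limit` ids are collected; either source can be switched off via the
/// `use_*` flags.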
fn merge_candidate_ids(
vector_ids: &[String],
text_ids: &[String],
limit: usize,
use_vector: bool,
use_text: bool,
) -> Vec<String> {
if limit == 0 {
return Vec::new();
}
let mut merged = Vec::with_capacity(limit);
let mut seen = HashSet::with_capacity(limit.saturating_mul(2));
if use_vector {
for id in vector_ids {
if seen.insert(id.clone()) {
merged.push(id.clone());
if merged.len() >= limit {
return merged;
}
}
}
}
if use_text {
for id in text_ids {
if seen.insert(id.clone()) {
merged.push(id.clone());
if merged.len() >= limit {
break;
}
}
}
}
merged
}
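/// Order-preserving dedup-merge of the primary then secondary id lists,
/// capped at `limit`.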
fn merge_ranked_candidate_ids(
primary_ids: &[String],
secondary_ids: &[String],
limit: usize,
) -> Vec<String> {
if limit == 0 {
return Vec::new();
}
let mut merged = Vec::with_capacity(limit);
let mut seen = HashSet::with_capacity(limit.saturating_mul(2));
for id in primary_ids {
if seen.insert(id.clone()) {
merged.push(id.clone());
if merged.len() >= limit {
return merged;
}
}
}
for id in secondary_ids {
if seen.insert(id.clone()) {
merged.push(id.clone());
if merged.len() >= limit {
break;
}
}
}
merged
}
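/// Chooses a planner mode for dual-signal requests (None unless both query
/// text and embedding are present): vector-first when FTS is unavailable,
/// alpha >= 0.6, or the latency profile is set; text-first when no vector
/// index is available or alpha <= 0.35; balanced otherwise.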
fn select_hybrid_planner_mode(
request: &SearchRequest,
fts_enabled: bool,
vector_index_available: bool,
) -> Option<HybridPlannerMode> {
if request.query_text.is_none() || request.query_embedding.is_none() {
return None;
}
if !fts_enabled {
return Some(HybridPlannerMode::VectorFirst);
}
if !vector_index_available {
return Some(HybridPlannerMode::TextFirst);
}
if request.alpha >= 0.6 || request.query_profile == QueryProfile::Latency {
return Some(HybridPlannerMode::VectorFirst);
}
if request.alpha <= 0.35 {
return Some(HybridPlannerMode::TextFirst);
}
Some(HybridPlannerMode::BalancedHybrid)
}
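/// Primary fetch budget: `top_k` times a profile multiplier (4/8/12 for
/// latency/balanced/recall), floored at 32, clamped to the candidate limit,
/// and never below `top_k`. Balanced mode fetches the full candidate limit.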
fn hybrid_primary_candidate_limit(request: &SearchRequest, mode: HybridPlannerMode) -> usize {
let multiplier = match (mode, request.query_profile) {
(HybridPlannerMode::VectorFirst, QueryProfile::Latency) => 4,
(HybridPlannerMode::VectorFirst, QueryProfile::Balanced) => 8,
(HybridPlannerMode::VectorFirst, QueryProfile::Recall) => 12,
(HybridPlannerMode::TextFirst, QueryProfile::Latency) => 4,
(HybridPlannerMode::TextFirst, QueryProfile::Balanced) => 8,
(HybridPlannerMode::TextFirst, QueryProfile::Recall) => 12,
(HybridPlannerMode::BalancedHybrid, _) => return request.candidate_limit,
};
request
.top_k
.saturating_mul(multiplier)
.max(32)
.min(request.candidate_limit)
.max(request.top_k)
}
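/// Secondary fetch budget for the non-primary signal: `top_k` times 2/4/6 by
/// profile, floored at 16, with the same clamping as the primary budget.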
fn hybrid_secondary_candidate_limit(request: &SearchRequest, mode: HybridPlannerMode) -> usize {
let multiplier = match (mode, request.query_profile) {
(HybridPlannerMode::VectorFirst, QueryProfile::Latency) => 2,
(HybridPlannerMode::VectorFirst, QueryProfile::Balanced) => 4,
(HybridPlannerMode::VectorFirst, QueryProfile::Recall) => 6,
(HybridPlannerMode::TextFirst, QueryProfile::Latency) => 2,
(HybridPlannerMode::TextFirst, QueryProfile::Balanced) => 4,
(HybridPlannerMode::TextFirst, QueryProfile::Recall) => 6,
(HybridPlannerMode::BalancedHybrid, _) => return request.candidate_limit,
};
request
.top_k
.saturating_mul(multiplier)
.max(16)
.min(request.candidate_limit)
.max(request.top_k)
}
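/// Rerank budget for the merged candidate list, scaled by planner mode and
/// query profile and kept between `top_k` and the candidate limit.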
fn hybrid_rerank_candidate_limit(
request: &SearchRequest,
mode: Option<HybridPlannerMode>,
) -> usize {
let multiplier = match (
mode.unwrap_or(HybridPlannerMode::BalancedHybrid),
request.query_profile,
) {
(HybridPlannerMode::VectorFirst, QueryProfile::Latency) => 2,
(HybridPlannerMode::VectorFirst, QueryProfile::Balanced) => 4,
(HybridPlannerMode::VectorFirst, QueryProfile::Recall) => 8,
(HybridPlannerMode::TextFirst, QueryProfile::Latency) => 2,
(HybridPlannerMode::TextFirst, QueryProfile::Balanced) => 4,
(HybridPlannerMode::TextFirst, QueryProfile::Recall) => 8,
(HybridPlannerMode::BalancedHybrid, QueryProfile::Latency) => 4,
(HybridPlannerMode::BalancedHybrid, QueryProfile::Balanced) => 6,
(HybridPlannerMode::BalancedHybrid, QueryProfile::Recall) => 10,
};
request
.top_k
.saturating_mul(multiplier)
.max(request.top_k)
.min(request.candidate_limit)
}
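/// Trims merged candidates to the rerank budget by ranking them on
/// provisional hybrid scores, breaking ties on vector score, text score, and
/// finally chunk id so the cut is deterministic.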
fn select_hybrid_rerank_ids(
candidate_ids: Vec<String>,
vector_score_lookup: &HashMap<String, f32>,
text_scores: &HashMap<String, f32>,
request: &SearchRequest,
mode: Option<HybridPlannerMode>,
) -> Vec<String> {
let rerank_limit = hybrid_rerank_candidate_limit(request, mode);
if candidate_ids.len() <= rerank_limit {
return candidate_ids;
}
let provisional = candidate_ids
.iter()
.map(|chunk_id| ScoredChunk {
chunk_id: chunk_id.clone(),
vector_score: vector_score_lookup.get(chunk_id).copied().unwrap_or(0.0),
text_score: text_scores.get(chunk_id).copied().unwrap_or(0.0),
})
.collect::<Vec<_>>();
let provisional_scores = compute_hybrid_scores(
&provisional,
true,
true,
request.alpha,
request.fusion_strategy,
);
let mut ranked = provisional
.into_iter()
.map(|entry| {
(
entry.chunk_id.clone(),
provisional_scores
.get(&entry.chunk_id)
.copied()
.unwrap_or(0.0),
entry.vector_score,
entry.text_score,
)
})
.collect::<Vec<_>>();
ranked.sort_by(|left, right| {
right
.1
.total_cmp(&left.1)
.then_with(|| right.2.total_cmp(&left.2))
.then_with(|| right.3.total_cmp(&left.3))
.then_with(|| left.0.cmp(&right.0))
});
ranked.truncate(rerank_limit);
ranked
.into_iter()
.map(|(chunk_id, _, _, _)| chunk_id)
.collect()
}
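/// Hybrid search may skip the per-id FTS score lookup when both signals are
/// active and the vector side has already saturated a candidate limit of at
/// least HYBRID_FTS_SCORE_LOOKUP_SKIP_CANDIDATE_LIMIT.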
fn should_skip_fts_score_lookup(
use_vector: bool,
fts_enabled: bool,
vector_candidate_count: usize,
candidate_limit: usize,
) -> bool {
if !use_vector || !fts_enabled {
return false;
}
candidate_limit >= HYBRID_FTS_SCORE_LOOKUP_SKIP_CANDIDATE_LIMIT
&& vector_candidate_count >= candidate_limit
}
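/// JSON snapshot of the vector index. Entry chunk keys are optional with a
/// serde default so snapshots written before the keyed format still load.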
#[derive(Debug, Clone, Serialize, Deserialize)]
struct AnnSnapshotFile {
version: u32,
mode: String,
storage_kind: String,
entries: Vec<AnnSnapshotEntry>,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
struct AnnSnapshotEntry {
#[serde(default)]
chunk_key: Option<ChunkKey>,
chunk_id: String,
vector: AnnSnapshotVector,
}
#[derive(Debug, Clone)]
struct AnnGraphDumpPaths {
directory: PathBuf,
basename: String,
graph_path: PathBuf,
data_path: PathBuf,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
#[serde(tag = "encoding", rename_all = "snake_case")]
enum AnnSnapshotVector {
F32 { values: Vec<f32> },
F16 { values: Vec<u16> },
Int8 { values: Vec<i8>, scale: f32 },
}
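/// Builds the vector index at open time, preferring persisted artifacts that
/// are at least as fresh as the database file: an mmap-able f32 exact segment
/// for brute-force mode, then the binary ANN entry sidecar (plus the HNSW
/// graph dump when present), then the JSON snapshot. When nothing usable
/// exists, the index is rebuilt from the `chunks` table and the artifacts are
/// re-saved on a best-effort basis.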
fn load_vector_index(
conn: &Connection,
runtime_config: &RuntimeConfig,
db_path: Option<&Path>,
) -> Result<Option<BuiltinVectorIndex>> {
let options = VectorIndexOptions {
storage_kind: runtime_config.vector_storage_kind,
ann_tuning: runtime_config.ann_tuning,
};
let Some(mut index) = BuiltinVectorIndex::from_mode(runtime_config.vector_index_mode, options)
else {
return Ok(None);
};
let exact_segment_snapshot_path = if runtime_config.enable_ann_persistence
&& runtime_config.vector_index_mode == VectorIndexMode::BruteForce
{
db_path.and_then(|path| exact_segment_path(path, runtime_config.vector_storage_kind))
} else {
None
};
if let (Some(path), Some(db_file)) = (exact_segment_snapshot_path.as_ref(), db_path)
&& artifact_is_fresh(path, db_file)
{
if runtime_config.vector_storage_kind == VectorStorageKind::F32
&& let BuiltinVectorIndex::BruteForce(_) = &index
&& let Ok(mapped_index) = BruteForceVectorIndex::load_mmap_f32_sidecar(path)
{
return Ok(Some(BuiltinVectorIndex::BruteForce(mapped_index)));
}
if let Ok(entries) = load_exact_segment_snapshot(path, runtime_config.vector_storage_kind)
&& index.import_records(&entries).is_ok()
{
return Ok(Some(index));
}
}
let snapshot_path =
if runtime_config.enable_ann_persistence && runtime_config.vector_index_mode.is_ann() {
db_path.and_then(|path| {
ann_snapshot_path(
path,
runtime_config.vector_index_mode,
runtime_config.vector_storage_kind,
)
})
} else {
None
};
let ann_entry_path =
if runtime_config.enable_ann_persistence && runtime_config.vector_index_mode.is_ann() {
db_path.and_then(|path| {
ann_entry_sidecar_path(
path,
runtime_config.vector_index_mode,
runtime_config.vector_storage_kind,
)
})
} else {
None
};
let ann_graph_paths = if runtime_config.enable_ann_persistence
&& runtime_config.vector_index_mode == VectorIndexMode::HnswBaseline
{
db_path.and_then(|path| {
ann_graph_dump_paths(
path,
runtime_config.vector_index_mode,
runtime_config.vector_storage_kind,
)
})
} else {
None
};
if let (Some(path), Some(db_file)) = (ann_entry_path.as_ref(), db_path)
&& artifact_is_fresh(path, db_file)
&& let Ok(entries) = load_ann_entry_sidecar(path, runtime_config.vector_storage_kind)
&& index.import_records(&entries).is_ok()
{
if let (Some(graph_paths), BuiltinVectorIndex::HnswBaseline(hnsw)) =
(ann_graph_paths.as_ref(), &index)
&& graph_artifacts_are_fresh(graph_paths, db_file)
&& hnsw
.load_graph_snapshot(&graph_paths.directory, &graph_paths.basename)
.is_ok()
{
return Ok(Some(index));
}
return Ok(Some(index));
}
if let (Some(path), Some(db_file)) = (snapshot_path.as_ref(), db_path)
&& artifact_is_fresh(path, db_file)
&& let Ok(snapshot) = load_ann_snapshot(path)
&& snapshot.mode == runtime_config.vector_index_mode.as_str()
&& snapshot.storage_kind == runtime_config.vector_storage_kind.as_str()
{
let mut entries = snapshot
.entries
.into_iter()
.map(|entry| VectorEntryRecord {
chunk_key: entry.chunk_key.unwrap_or_default(),
chunk_id: entry.chunk_id,
embedding: decode_snapshot_vector(entry.vector),
})
.collect::<Vec<_>>();
if entries.iter().any(|entry| entry.chunk_key == 0) {
backfill_vector_entry_keys(conn, &mut entries)?;
}
if index.import_records(&entries).is_ok() {
return Ok(Some(index));
}
}
let mut stmt = conn.prepare(
"SELECT rowid, id, embedding, embedding_dim
FROM chunks
ORDER BY rowid ASC",
)?;
let rows = stmt.query_map([], |row| {
let chunk_key: i64 = row.get(0)?;
let id: String = row.get(1)?;
let embedding_blob: Vec<u8> = row.get(2)?;
let embedding_dim: i64 = row.get(3)?;
if embedding_dim <= 0 || embedding_blob.is_empty() {
return Ok(None);
}
let embedding = decode_embedding(&embedding_blob, embedding_dim as usize).map_err(|e| {
rusqlite::Error::FromSqlConversionFailure(
2,
rusqlite::types::Type::Blob,
Box::new(std::io::Error::new(std::io::ErrorKind::InvalidData, e)),
)
})?;
Ok(Some(VectorEntryRecord {
chunk_key: chunk_key as ChunkKey,
chunk_id: id,
embedding,
}))
})?;
let mut batch: Vec<VectorEntryRecord> = Vec::with_capacity(1024);
for row in rows {
if let Some(record) = row? {
batch.push(record);
}
if batch.len() >= 1024 {
index.upsert_records(&batch)?;
batch.clear();
}
}
if !batch.is_empty() {
index.upsert_records(&batch)?;
}
let entries = index.export_records();
if let Some(path) = exact_segment_snapshot_path.as_ref() {
let _ = save_exact_segment_snapshot(path, runtime_config.vector_storage_kind, &entries);
}
if let Some(path) = ann_entry_path.as_ref() {
let _ = save_ann_entry_sidecar(path, runtime_config.vector_storage_kind, &entries);
}
if let Some(path) = snapshot_path.as_ref() {
let _ = save_ann_snapshot(
path,
runtime_config.vector_index_mode,
runtime_config.vector_storage_kind,
&entries,
);
}
if let (Some(graph_paths), BuiltinVectorIndex::HnswBaseline(hnsw)) =
(ann_graph_paths.as_ref(), &index)
{
let _ = hnsw.dump_graph_snapshot(&graph_paths.directory, &graph_paths.basename);
}
Ok(Some(index))
}
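/// Fills in missing chunk keys for snapshot entries; 0 is the "unknown"
/// sentinel since auto-assigned SQLite rowids start at 1.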
fn backfill_vector_entry_keys(conn: &Connection, entries: &mut [VectorEntryRecord]) -> Result<()> {
let chunk_ids = entries
.iter()
.filter(|entry| entry.chunk_key == 0)
.map(|entry| entry.chunk_id.clone())
.collect::<Vec<_>>();
if chunk_ids.is_empty() {
return Ok(());
}
let chunk_key_lookup = fetch_chunk_keys_by_ids_from_connection(conn, &chunk_ids)?;
for entry in entries.iter_mut() {
if entry.chunk_key == 0
&& let Some(chunk_key) = chunk_key_lookup.get(&entry.chunk_id).copied()
{
entry.chunk_key = chunk_key;
}
}
Ok(())
}
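/// Looks up rowids for the given chunk ids, batching the `IN` list in groups
/// of 900.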
fn fetch_chunk_keys_by_ids_from_connection(
conn: &Connection,
ids: &[String],
) -> Result<HashMap<String, ChunkKey>> {
if ids.is_empty() {
return Ok(HashMap::new());
}
let mut by_id = HashMap::with_capacity(ids.len());
for chunk_ids in ids.chunks(900) {
let placeholders = std::iter::repeat_n("?", chunk_ids.len())
.collect::<Vec<_>>()
.join(", ");
let sql = format!(
"SELECT id, rowid
FROM chunks
WHERE id IN ({})",
placeholders
);
let params: Vec<SqlValue> = chunk_ids
.iter()
.map(|id| SqlValue::from(id.clone()))
.collect();
let mut stmt = conn.prepare(&sql)?;
let rows = stmt.query_map(params_from_iter(params), |row| {
let id: String = row.get(0)?;
let chunk_key: i64 = row.get(1)?;
Ok((id, chunk_key as ChunkKey))
})?;
for row in rows {
let (id, chunk_key) = row?;
by_id.insert(id, chunk_key);
}
}
Ok(by_id)
}
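/// Persistence artifacts are hidden sidecar files beside the database, named
/// after it (e.g. `.<dbfile>.ann.<mode>.<storage>.json`); the helpers below
/// follow the same convention for the binary sidecar, HNSW graph dump, and
/// brute-force exact segment.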
fn ann_snapshot_path(
db_path: &Path,
mode: VectorIndexMode,
storage_kind: VectorStorageKind,
) -> Option<PathBuf> {
let parent = db_path.parent().unwrap_or_else(|| Path::new("."));
let file_stem = db_path
.file_name()
.and_then(|value| value.to_str())
.unwrap_or("sqlrite");
Some(parent.join(format!(
".{file_stem}.ann.{}.{}.json",
mode.as_str(),
storage_kind.as_str()
)))
}
fn ann_entry_sidecar_path(
db_path: &Path,
mode: VectorIndexMode,
storage_kind: VectorStorageKind,
) -> Option<PathBuf> {
let parent = db_path.parent().unwrap_or_else(|| Path::new("."));
let file_stem = db_path
.file_name()
.and_then(|value| value.to_str())
.unwrap_or("sqlrite");
Some(parent.join(format!(
".{file_stem}.ann.{}.{}.bin",
mode.as_str(),
storage_kind.as_str()
)))
}
fn ann_graph_dump_paths(
db_path: &Path,
mode: VectorIndexMode,
storage_kind: VectorStorageKind,
) -> Option<AnnGraphDumpPaths> {
let directory = db_path
.parent()
.unwrap_or_else(|| Path::new("."))
.to_path_buf();
let file_stem = db_path
.file_name()
.and_then(|value| value.to_str())
.unwrap_or("sqlrite");
let basename = format!(
".{file_stem}.ann_graph.{}.{}",
mode.as_str(),
storage_kind.as_str()
);
let graph_path = directory.join(format!("{basename}.hnsw.graph"));
let data_path = directory.join(format!("{basename}.hnsw.data"));
Some(AnnGraphDumpPaths {
directory,
basename,
graph_path,
data_path,
})
}
fn exact_segment_path(db_path: &Path, storage_kind: VectorStorageKind) -> Option<PathBuf> {
let parent = db_path.parent().unwrap_or_else(|| Path::new("."));
let file_stem = db_path
.file_name()
.and_then(|value| value.to_str())
.unwrap_or("sqlrite");
Some(parent.join(format!(
".{file_stem}.segment.bruteforce.{}.bin",
storage_kind.as_str()
)))
}
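/// An artifact is fresh when its mtime is at least the database file's;
/// missing metadata on either side counts as stale.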
fn artifact_is_fresh(artifact_path: &Path, db_path: &Path) -> bool {
let snapshot_meta = fs::metadata(artifact_path).ok();
let db_meta = fs::metadata(db_path).ok();
let Some(snapshot_mtime) = snapshot_meta.and_then(|meta| meta.modified().ok()) else {
return false;
};
let Some(db_mtime) = db_meta.and_then(|meta| meta.modified().ok()) else {
return false;
};
snapshot_mtime >= db_mtime
}
fn graph_artifacts_are_fresh(paths: &AnnGraphDumpPaths, db_path: &Path) -> bool {
artifact_is_fresh(&paths.graph_path, db_path) && artifact_is_fresh(&paths.data_path, db_path)
}
const EXACT_SEGMENT_MAGIC: &[u8; 8] = b"SQLRSEG1";
const EXACT_SEGMENT_VERSION: u32 = 2;
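/// Writes the exact-segment snapshot: magic, u32 version, one-byte storage
/// kind, and u32 entry count, then per entry the u64 chunk key, a
/// length-prefixed chunk id, the u32 dimension, and the vector payload
/// (f32 words, f16 bits, or a per-entry f32 scale followed by i8 values).
/// All integers are little-endian.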
fn save_exact_segment_snapshot(
path: &Path,
storage_kind: VectorStorageKind,
entries: &[VectorEntryRecord],
) -> Result<()> {
let mut file = File::create(path)?;
file.write_all(EXACT_SEGMENT_MAGIC)?;
file.write_all(&EXACT_SEGMENT_VERSION.to_le_bytes())?;
file.write_all(&[storage_kind_code(storage_kind)])?;
file.write_all(&(entries.len() as u32).to_le_bytes())?;
for entry in entries {
let chunk_id_bytes = entry.chunk_id.as_bytes();
file.write_all(&entry.chunk_key.to_le_bytes())?;
file.write_all(&(chunk_id_bytes.len() as u32).to_le_bytes())?;
file.write_all(chunk_id_bytes)?;
file.write_all(&(entry.embedding.len() as u32).to_le_bytes())?;
match storage_kind {
VectorStorageKind::F32 => {
for value in &entry.embedding {
file.write_all(&value.to_le_bytes())?;
}
}
VectorStorageKind::F16 => {
for value in &entry.embedding {
file.write_all(&f16::from_f32(*value).to_bits().to_le_bytes())?;
}
}
VectorStorageKind::Int8 => {
let max_abs = entry
.embedding
.iter()
.fold(0.0f32, |acc, value| acc.max(value.abs()));
let scale = if max_abs == 0.0 { 1.0 } else { max_abs / 127.0 };
file.write_all(&scale.to_le_bytes())?;
for value in &entry.embedding {
let quantized = (value / scale).round().clamp(-127.0, 127.0) as i8;
file.write_all(&(quantized as u8).to_le_bytes())?;
}
}
}
}
Ok(())
}
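/// The ANN entry sidecar reuses the exact-segment binary format.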
fn save_ann_entry_sidecar(
path: &Path,
storage_kind: VectorStorageKind,
entries: &[VectorEntryRecord],
) -> Result<()> {
save_exact_segment_snapshot(path, storage_kind, entries)
}
fn load_exact_segment_snapshot(
path: &Path,
storage_kind: VectorStorageKind,
) -> Result<Vec<VectorEntryRecord>> {
let mut file = File::open(path)?;
let mut magic = [0u8; 8];
file.read_exact(&mut magic)?;
if &magic != EXACT_SEGMENT_MAGIC {
return Err(SqlRiteError::Io(std::io::Error::new(
std::io::ErrorKind::InvalidData,
"invalid exact segment snapshot magic",
)));
}
let version = read_u32_le(&mut file)?;
if version != EXACT_SEGMENT_VERSION {
return Err(SqlRiteError::Io(std::io::Error::new(
std::io::ErrorKind::InvalidData,
format!("unsupported exact segment snapshot version {version}"),
)));
}
let stored_kind = read_u8(&mut file)?;
if stored_kind != storage_kind_code(storage_kind) {
return Err(SqlRiteError::Io(std::io::Error::new(
std::io::ErrorKind::InvalidData,
"exact segment snapshot storage kind mismatch",
)));
}
let entry_count = read_u32_le(&mut file)? as usize;
let mut entries = Vec::with_capacity(entry_count);
for _ in 0..entry_count {
let chunk_key = read_u64_le(&mut file)?;
let chunk_id_len = read_u32_le(&mut file)? as usize;
let mut chunk_id_bytes = vec![0u8; chunk_id_len];
file.read_exact(&mut chunk_id_bytes)?;
let chunk_id = String::from_utf8(chunk_id_bytes).map_err(|error| {
SqlRiteError::Io(std::io::Error::new(
std::io::ErrorKind::InvalidData,
error.to_string(),
))
})?;
let dimension = read_u32_le(&mut file)? as usize;
let embedding = match storage_kind {
VectorStorageKind::F32 => {
let mut values = Vec::with_capacity(dimension);
for _ in 0..dimension {
values.push(read_f32_le(&mut file)?);
}
values
}
VectorStorageKind::F16 => {
let mut values = Vec::with_capacity(dimension);
for _ in 0..dimension {
let bits = read_u16_le(&mut file)?;
values.push(f16::from_bits(bits).to_f32());
}
values
}
VectorStorageKind::Int8 => {
let scale = read_f32_le(&mut file)?;
let mut values = Vec::with_capacity(dimension);
for _ in 0..dimension {
let value = read_u8(&mut file)? as i8;
values.push(value as f32 * scale);
}
values
}
};
entries.push(VectorEntryRecord {
chunk_key,
chunk_id,
embedding,
});
}
Ok(entries)
}
fn load_ann_entry_sidecar(
path: &Path,
storage_kind: VectorStorageKind,
) -> Result<Vec<VectorEntryRecord>> {
load_exact_segment_snapshot(path, storage_kind)
}
fn storage_kind_code(storage_kind: VectorStorageKind) -> u8 {
match storage_kind {
VectorStorageKind::F32 => 1,
VectorStorageKind::F16 => 2,
VectorStorageKind::Int8 => 3,
}
}
fn read_u8(reader: &mut impl Read) -> Result<u8> {
let mut value = [0u8; 1];
reader.read_exact(&mut value)?;
Ok(value[0])
}
fn read_u16_le(reader: &mut impl Read) -> Result<u16> {
let mut value = [0u8; 2];
reader.read_exact(&mut value)?;
Ok(u16::from_le_bytes(value))
}
fn read_u32_le(reader: &mut impl Read) -> Result<u32> {
let mut value = [0u8; 4];
reader.read_exact(&mut value)?;
Ok(u32::from_le_bytes(value))
}
fn read_u64_le(reader: &mut impl Read) -> Result<u64> {
let mut value = [0u8; 8];
reader.read_exact(&mut value)?;
Ok(u64::from_le_bytes(value))
}
fn read_f32_le(reader: &mut impl Read) -> Result<f32> {
let mut value = [0u8; 4];
reader.read_exact(&mut value)?;
Ok(f32::from_le_bytes(value))
}
fn load_ann_snapshot(path: &Path) -> Result<AnnSnapshotFile> {
let raw = fs::read_to_string(path)?;
let snapshot: AnnSnapshotFile = serde_json::from_str(&raw)?;
Ok(snapshot)
}
fn save_ann_snapshot(
path: &Path,
mode: VectorIndexMode,
storage_kind: VectorStorageKind,
entries: &[VectorEntryRecord],
) -> Result<()> {
let payload = AnnSnapshotFile {
version: 1,
mode: mode.as_str().to_string(),
storage_kind: storage_kind.as_str().to_string(),
entries: entries
.iter()
.map(|entry| AnnSnapshotEntry {
chunk_key: Some(entry.chunk_key),
chunk_id: entry.chunk_id.clone(),
vector: encode_snapshot_vector(&entry.embedding, storage_kind),
})
.collect(),
};
let raw = serde_json::to_string_pretty(&payload)?;
fs::write(path, raw)?;
Ok(())
}
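/// Encodes a vector for the JSON snapshot. Int8 uses symmetric quantization:
/// scale = max(|v|) / 127 with a 1e-6 floor on max(|v|), each component
/// stored as round(v / scale) clamped to [-127, 127].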
fn encode_snapshot_vector(embedding: &[f32], storage_kind: VectorStorageKind) -> AnnSnapshotVector {
match storage_kind {
VectorStorageKind::F32 => AnnSnapshotVector::F32 {
values: embedding.to_vec(),
},
VectorStorageKind::F16 => AnnSnapshotVector::F16 {
values: embedding
.iter()
.map(|value| f16::from_f32(*value).to_bits())
.collect(),
},
VectorStorageKind::Int8 => {
let max_abs = embedding
.iter()
.fold(0.0f32, |acc, value| acc.max(value.abs()))
.max(1e-6);
let scale = max_abs / 127.0;
let values = embedding
.iter()
.map(|value| ((*value / scale).round().clamp(-127.0, 127.0)) as i8)
.collect::<Vec<_>>();
AnnSnapshotVector::Int8 { values, scale }
}
}
}
fn decode_snapshot_vector(vector: AnnSnapshotVector) -> Vec<f32> {
match vector {
AnnSnapshotVector::F32 { values } => values,
AnnSnapshotVector::F16 { values } => values
.into_iter()
.map(|bits| f16::from_bits(bits).to_f32())
.collect(),
AnnSnapshotVector::Int8 { values, scale } => values
.into_iter()
.map(|value| value as f32 * scale)
.collect(),
}
}
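/// Fuses per-chunk scores. Weighted fusion computes
/// `alpha * vector + (1 - alpha) * text`; reciprocal rank fusion sums
/// `1 / (rank_constant + rank)` over both signals using 1-based ranks.
/// Single-signal requests pass the available score through unchanged.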
fn compute_hybrid_scores(
scored: &[ScoredChunk],
use_vector: bool,
use_text: bool,
alpha: f32,
fusion_strategy: FusionStrategy,
) -> HashMap<String, f32> {
if scored.is_empty() {
return HashMap::new();
}
match (use_vector, use_text, fusion_strategy) {
(true, true, FusionStrategy::Weighted) => scored
.iter()
.map(|entry| {
(
entry.chunk_id.clone(),
alpha * entry.vector_score + (1.0 - alpha) * entry.text_score,
)
})
.collect(),
(true, true, FusionStrategy::ReciprocalRankFusion { rank_constant }) => {
let vector_ranks = rank_lookup(
scored
.iter()
.map(|entry| (&entry.chunk_id, entry.vector_score)),
);
let text_ranks = rank_lookup(
scored
.iter()
.map(|entry| (&entry.chunk_id, entry.text_score)),
);
scored
.iter()
.map(|entry| {
let vector_term = vector_ranks
.get(&entry.chunk_id)
.copied()
.map(|rank| 1.0 / (rank_constant + rank as f32))
.unwrap_or(0.0);
let text_term = text_ranks
.get(&entry.chunk_id)
.copied()
.map(|rank| 1.0 / (rank_constant + rank as f32))
.unwrap_or(0.0);
(entry.chunk_id.clone(), vector_term + text_term)
})
.collect()
}
(true, false, _) => scored
.iter()
.map(|entry| (entry.chunk_id.clone(), entry.vector_score))
.collect(),
(false, true, _) => scored
.iter()
.map(|entry| (entry.chunk_id.clone(), entry.text_score))
.collect(),
(false, false, _) => scored
.iter()
.map(|entry| (entry.chunk_id.clone(), 0.0))
.collect(),
}
}
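/// Assigns 1-based ranks by descending score, breaking ties on chunk id for
/// deterministic ordering.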
fn rank_lookup<'a>(items: impl Iterator<Item = (&'a String, f32)>) -> HashMap<String, usize> {
let mut ranked: Vec<(String, f32)> = items.map(|(id, score)| (id.clone(), score)).collect();
ranked.sort_by(|left, right| {
right
.1
.total_cmp(&left.1)
.then_with(|| left.0.cmp(&right.0))
});
ranked
.into_iter()
.enumerate()
.map(|(idx, (id, _))| (id, idx + 1))
.collect()
}
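/// Applies connection-level pragmas from the runtime config: busy timeout,
/// foreign keys, synchronous level, WAL or DELETE journaling, and optional
/// temp-store, cache-size, and mmap tuning.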
fn apply_runtime_config(conn: &Connection, config: &RuntimeConfig) -> Result<()> {
conn.busy_timeout(Duration::from_millis(config.busy_timeout_ms))?;
conn.pragma_update(None, "foreign_keys", true)?;
conn.pragma_update(None, "synchronous", config.synchronous_sql())?;
if config.enable_wal {
let _: String = conn.query_row("PRAGMA journal_mode = WAL;", [], |row| row.get(0))?;
} else {
let _: String = conn.query_row("PRAGMA journal_mode = DELETE;", [], |row| row.get(0))?;
}
if config.temp_store_memory {
conn.pragma_update(None, "temp_store", "MEMORY")?;
}
if config.sqlite_cache_size_kib > 0 {
// SQLite treats a negative cache_size as a budget in KiB rather than pages.
let negative_cache_size_kib = -config.sqlite_cache_size_kib;
conn.pragma_update(None, "cache_size", negative_cache_size_kib)?;
}
if config.sqlite_mmap_size_bytes > 0 {
conn.pragma_update(None, "mmap_size", config.sqlite_mmap_size_bytes)?;
}
Ok(())
}
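/// Applies any pending MIGRATIONS, each in its own transaction recorded in
/// `schema_migrations`, and returns the resulting schema version capped at
/// LATEST_SCHEMA_VERSION.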
fn run_migrations(conn: &mut Connection) -> Result<i64> {
conn.execute_batch(
"
CREATE TABLE IF NOT EXISTS schema_migrations (
version INTEGER PRIMARY KEY,
name TEXT NOT NULL,
applied_at TEXT NOT NULL DEFAULT (datetime('now'))
);
",
)?;
let mut applied = HashSet::new();
{
let mut applied_stmt = conn.prepare("SELECT version FROM schema_migrations")?;
let applied_rows = applied_stmt.query_map([], |row| row.get::<_, i64>(0))?;
for row in applied_rows {
applied.insert(row?);
}
}
for migration in MIGRATIONS {
if applied.contains(&migration.version) {
continue;
}
let tx = conn.transaction()?;
tx.execute_batch(migration.sql)?;
tx.execute(
"INSERT OR IGNORE INTO schema_migrations (version, name) VALUES (?1, ?2)",
params![migration.version, migration.name],
)?;
tx.commit()?;
}
let schema_version = conn.query_row(
"SELECT COALESCE(MAX(version), 0) FROM schema_migrations",
[],
|row| row.get::<_, i64>(0),
)?;
Ok(schema_version.min(LATEST_SCHEMA_VERSION))
}
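/// Creates the `chunks_fts` FTS5 table plus triggers that keep it in sync
/// with `chunks`, then backfills rows missing from the index. Returns false
/// when the SQLite build lacks FTS5; trigger and backfill errors are ignored.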
fn initialize_fts(conn: &Connection) -> bool {
let enabled = conn
.execute_batch(
"
CREATE VIRTUAL TABLE IF NOT EXISTS chunks_fts USING fts5(
content,
chunk_id UNINDEXED,
doc_id UNINDEXED
);
",
)
.is_ok();
if !enabled {
return false;
}
let _ = conn.execute_batch(
"
CREATE TRIGGER IF NOT EXISTS chunks_fts_after_insert
AFTER INSERT ON chunks
BEGIN
INSERT INTO chunks_fts (content, chunk_id, doc_id)
VALUES (new.content, new.id, new.doc_id);
END;
CREATE TRIGGER IF NOT EXISTS chunks_fts_after_update
AFTER UPDATE ON chunks
BEGIN
DELETE FROM chunks_fts WHERE chunk_id = old.id;
INSERT INTO chunks_fts (content, chunk_id, doc_id)
VALUES (new.content, new.id, new.doc_id);
END;
CREATE TRIGGER IF NOT EXISTS chunks_fts_after_delete
AFTER DELETE ON chunks
BEGIN
DELETE FROM chunks_fts WHERE chunk_id = old.id;
END;
",
);
let _ = conn.execute(
"
INSERT INTO chunks_fts (content, chunk_id, doc_id)
SELECT c.content, c.id, c.doc_id
FROM chunks AS c
WHERE NOT EXISTS (
SELECT 1
FROM chunks_fts AS f
WHERE f.chunk_id = c.id
)
",
[],
);
true
}
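/// Filter keys are interpolated into json_extract paths, so only ASCII
/// alphanumerics and underscores are accepted; anything else is rejected to
/// keep filter keys injection-safe.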
fn sanitize_metadata_key(key: &str) -> Result<&str> {
if !key.is_empty()
&& key
.chars()
.all(|ch| ch.is_ascii_alphanumeric() || ch == '_')
{
Ok(key)
} else {
Err(SqlRiteError::InvalidFilterKey(key.to_string()))
}
}
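/// Lowercases the query, splits it on non-alphanumeric characters, sorts and
/// dedupes the terms, and joins them with OR so any matching term qualifies a
/// chunk; returns None when no usable terms remain.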
fn build_fts_match_query(query_text: &str) -> Option<String> {
let mut terms: Vec<String> = query_text
.split(|ch: char| !ch.is_ascii_alphanumeric())
.filter(|token| !token.is_empty())
.map(|token| token.to_lowercase())
.collect();
if terms.is_empty() {
return None;
}
terms.sort();
terms.dedup();
Some(terms.join(" OR "))
}
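/// Embeddings are persisted as packed little-endian f32 bytes;
/// `decode_embedding` validates the blob length against the stored dimension.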
fn encode_embedding(vector: &[f32]) -> Vec<u8> {
let mut bytes = Vec::with_capacity(vector.len() * 4);
for value in vector {
bytes.extend_from_slice(&value.to_le_bytes());
}
bytes
}
fn decode_embedding(bytes: &[u8], dim: usize) -> std::result::Result<Vec<f32>, SqlRiteError> {
let expected = dim * 4;
if bytes.len() != expected {
return Err(SqlRiteError::InvalidEmbeddingBytes {
expected_bytes: expected,
found_bytes: bytes.len(),
});
}
let mut out = Vec::with_capacity(dim);
for chunk in bytes.chunks_exact(4) {
let arr = [chunk[0], chunk[1], chunk[2], chunk[3]];
out.push(f32::from_le_bytes(arr));
}
Ok(out)
}
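/// Cosine similarity against a pre-normalized query, so only the candidate's
/// norm is computed per comparison; zero-norm candidates score 0.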
fn cosine_similarity_with_normalized_query(query_normalized: &[f32], right: &[f32]) -> f32 {
let right_norm = l2_norm_unrolled(right);
if right_norm == 0.0 {
return 0.0;
}
dot_product_unrolled(query_normalized, right) / right_norm
}
fn normalize_embedding_for_search(values: &[f32]) -> Vec<f32> {
let norm = l2_norm_unrolled(values);
if norm == 0.0 {
return values.to_vec();
}
values.iter().map(|value| value / norm).collect()
}
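/// Dot product with runtime AVX2 dispatch on x86/x86_64 and a four-way
/// unrolled scalar fallback elsewhere.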
fn dot_product_unrolled(left: &[f32], right: &[f32]) -> f32 {
#[cfg(any(target_arch = "x86", target_arch = "x86_64"))]
{
if std::arch::is_x86_feature_detected!("avx2") {
return unsafe { dot_product_avx2(left, right) };
}
}
dot_product_scalar(left, right)
}
fn dot_product_scalar(left: &[f32], right: &[f32]) -> f32 {
let len = left.len().min(right.len());
let mut acc0 = 0.0f32;
let mut acc1 = 0.0f32;
let mut acc2 = 0.0f32;
let mut acc3 = 0.0f32;
let mut i = 0usize;
while i + 4 <= len {
acc0 += left[i] * right[i];
acc1 += left[i + 1] * right[i + 1];
acc2 += left[i + 2] * right[i + 2];
acc3 += left[i + 3] * right[i + 3];
i += 4;
}
let mut tail = 0.0f32;
while i < len {
tail += left[i] * right[i];
i += 1;
}
acc0 + acc1 + acc2 + acc3 + tail
}
fn l2_norm_unrolled(values: &[f32]) -> f32 {
#[cfg(any(target_arch = "x86", target_arch = "x86_64"))]
{
if std::arch::is_x86_feature_detected!("avx2") {
return unsafe { l2_norm_avx2(values) };
}
}
l2_norm_scalar(values)
}
fn l2_norm_scalar(values: &[f32]) -> f32 {
let mut acc0 = 0.0f32;
let mut acc1 = 0.0f32;
let mut acc2 = 0.0f32;
let mut acc3 = 0.0f32;
let mut i = 0usize;
while i + 4 <= values.len() {
acc0 += values[i] * values[i];
acc1 += values[i + 1] * values[i + 1];
acc2 += values[i + 2] * values[i + 2];
acc3 += values[i + 3] * values[i + 3];
i += 4;
}
let mut tail = 0.0f32;
while i < values.len() {
tail += values[i] * values[i];
i += 1;
}
(acc0 + acc1 + acc2 + acc3 + tail).sqrt()
}
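/// # Safety
/// Callers must ensure AVX2 is available; the safe wrappers check this with
/// `is_x86_feature_detected!` before dispatching here.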
#[cfg(any(target_arch = "x86", target_arch = "x86_64"))]
#[target_feature(enable = "avx2")]
unsafe fn dot_product_avx2(left: &[f32], right: &[f32]) -> f32 {
#[cfg(target_arch = "x86")]
use std::arch::x86::{
__m256, _mm256_add_ps, _mm256_loadu_ps, _mm256_mul_ps, _mm256_setzero_ps, _mm256_storeu_ps,
};
#[cfg(target_arch = "x86_64")]
use std::arch::x86_64::{
__m256, _mm256_add_ps, _mm256_loadu_ps, _mm256_mul_ps, _mm256_setzero_ps, _mm256_storeu_ps,
};
let len = left.len().min(right.len());
let mut i = 0usize;
let mut acc: __m256 = _mm256_setzero_ps();
while i + 8 <= len {
let (left_vec, right_vec) = unsafe {
(
_mm256_loadu_ps(left.as_ptr().add(i)),
_mm256_loadu_ps(right.as_ptr().add(i)),
)
};
acc = _mm256_add_ps(acc, _mm256_mul_ps(left_vec, right_vec));
i += 8;
}
let mut lanes = [0.0f32; 8];
unsafe {
_mm256_storeu_ps(lanes.as_mut_ptr(), acc);
}
let mut total = lanes.iter().sum::<f32>();
while i < len {
total += left[i] * right[i];
i += 1;
}
total
}
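/// # Safety
/// Same contract as `dot_product_avx2`: only call after an AVX2 runtime
/// check.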
#[cfg(any(target_arch = "x86", target_arch = "x86_64"))]
#[target_feature(enable = "avx2")]
unsafe fn l2_norm_avx2(values: &[f32]) -> f32 {
#[cfg(target_arch = "x86")]
use std::arch::x86::{
__m256, _mm256_add_ps, _mm256_loadu_ps, _mm256_mul_ps, _mm256_setzero_ps, _mm256_storeu_ps,
};
#[cfg(target_arch = "x86_64")]
use std::arch::x86_64::{
__m256, _mm256_add_ps, _mm256_loadu_ps, _mm256_mul_ps, _mm256_setzero_ps, _mm256_storeu_ps,
};
let mut i = 0usize;
let mut acc: __m256 = _mm256_setzero_ps();
while i + 8 <= values.len() {
let vec = unsafe { _mm256_loadu_ps(values.as_ptr().add(i)) };
acc = _mm256_add_ps(acc, _mm256_mul_ps(vec, vec));
i += 8;
}
let mut lanes = [0.0f32; 8];
unsafe {
_mm256_storeu_ps(lanes.as_mut_ptr(), acc);
}
let mut total = lanes.iter().sum::<f32>();
while i < values.len() {
total += values[i] * values[i];
i += 1;
}
total.sqrt()
}
fn tokenize(text: &str) -> HashSet<String> {
text.to_lowercase()
.split(|ch: char| !ch.is_ascii_alphanumeric())
.filter(|token| !token.is_empty())
.map(ToOwned::to_owned)
.collect()
}
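/// Scores a chunk by the fraction of query tokens it contains, with a 0.15
/// bonus (capped at 1.0) when the chunk contains the full query text
/// verbatim, case-insensitively.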
fn lexical_overlap_score(query_tokens: &HashSet<String>, query_text: &str, content: &str) -> f32 {
if query_tokens.is_empty() {
return 0.0;
}
let content_tokens = tokenize(content);
let overlap = query_tokens.intersection(&content_tokens).count() as f32;
let base = overlap / query_tokens.len() as f32;
if content.to_lowercase().contains(&query_text.to_lowercase()) {
(base + 0.15).min(1.0)
} else {
base
}
}
#[cfg(test)]
mod tests {
use super::*;
use serde_json::json;
use tempfile::tempdir;
fn seed(db: &SqlRite) -> Result<()> {
db.ingest_chunks(&[
ChunkInput {
id: "c1".to_string(),
doc_id: "d1".to_string(),
content: "Rust powers AI agents with safe systems code.".to_string(),
embedding: vec![1.0, 0.0, 0.0],
metadata: json!({"tenant": "acme", "topic": "rust"}),
source: Some("docs/rust.txt".to_string()),
},
ChunkInput {
id: "c2".to_string(),
doc_id: "d2".to_string(),
content: "PostgreSQL handles relational workloads at scale.".to_string(),
embedding: vec![0.0, 1.0, 0.0],
metadata: json!({"tenant": "acme", "topic": "postgres"}),
source: Some("docs/postgres.txt".to_string()),
},
ChunkInput {
id: "c3".to_string(),
doc_id: "d1".to_string(),
content: "SQLite is excellent for local-first RAG memory.".to_string(),
embedding: vec![0.8, 0.2, 0.0],
metadata: json!({"tenant": "beta", "topic": "sqlite"}),
source: Some("docs/sqlite.txt".to_string()),
},
])?;
Ok(())
}
#[test]
fn vector_search_ranks_by_similarity() -> Result<()> {
let db = SqlRite::open_in_memory()?;
seed(&db)?;
let results = db.search(SearchRequest {
query_embedding: Some(vec![0.95, 0.05, 0.0]),
top_k: 2,
..Default::default()
})?;
assert_eq!(results.len(), 2);
assert_eq!(results[0].chunk_id, "c1");
Ok(())
}
#[test]
fn hybrid_search_matches_text_and_vector() -> Result<()> {
let db = SqlRite::open_in_memory()?;
seed(&db)?;
let results = db.search(SearchRequest {
query_text: Some("local rag memory sqlite".to_string()),
query_embedding: Some(vec![0.7, 0.3, 0.0]),
alpha: 0.5,
top_k: 1,
..Default::default()
})?;
assert_eq!(results.len(), 1);
assert_eq!(results[0].chunk_id, "c3");
Ok(())
}
#[test]
fn metadata_filter_restricts_results() -> Result<()> {
let db = SqlRite::open_in_memory()?;
seed(&db)?;
let mut filters = HashMap::new();
filters.insert("tenant".to_string(), "acme".to_string());
let results = db.search(SearchRequest {
query_text: Some("ai systems".to_string()),
metadata_filters: filters,
top_k: 10,
..Default::default()
})?;
assert!(results.iter().all(|r| r.metadata["tenant"] == "acme"));
Ok(())
}
#[test]
fn schema_migrations_are_applied() -> Result<()> {
let db = SqlRite::open_in_memory()?;
assert_eq!(db.schema_version(), LATEST_SCHEMA_VERSION);
let migration_count =
db.conn
.query_row("SELECT COUNT(*) FROM schema_migrations", [], |row| {
row.get::<_, i64>(0)
})?;
assert_eq!(migration_count, MIGRATIONS.len() as i64);
Ok(())
}
#[test]
fn retrieval_index_catalog_migration_objects_exist() -> Result<()> {
let db = SqlRite::open_in_memory()?;
let table_exists: i64 = db.conn.query_row(
"SELECT COUNT(*) FROM sqlite_master WHERE type = 'table' AND name = 'retrieval_indexes'",
[],
|row| row.get(0),
)?;
assert_eq!(table_exists, 1);
let view_exists: i64 = db.conn.query_row(
"SELECT COUNT(*) FROM sqlite_master WHERE type = 'view' AND name = 'retrieval_index_catalog'",
[],
|row| row.get(0),
)?;
assert_eq!(view_exists, 1);
Ok(())
}
#[test]
fn builder_validates_parameters() {
let err = SearchRequest::builder()
.query_text("agents")
.top_k(0)
.build()
.expect_err("invalid top_k should fail");
assert!(matches!(err, SqlRiteError::InvalidTopK));
let err = SearchRequest::builder()
.query_text("agents")
.reciprocal_rank_fusion(0.0)
.build()
.expect_err("invalid rrf constant should fail");
assert!(matches!(err, SqlRiteError::InvalidRrfRankConstant));
}
#[test]
fn convenience_constructors_work() -> Result<()> {
let chunk = ChunkInput::new("c1", "d1", "content", vec![1.0, 0.0])
.with_metadata(json!({"tenant": "acme"}))
.with_source("docs/c1.md");
assert_eq!(chunk.id, "c1");
assert_eq!(chunk.source.as_deref(), Some("docs/c1.md"));
let req = SearchRequest::hybrid("hello", vec![1.0, 0.0], 3);
assert_eq!(req.top_k, 3);
assert_eq!(req.query_text.as_deref(), Some("hello"));
assert!(req.query_embedding.is_some());
Ok(())
}
#[test]
fn query_profile_latency_clamps_candidate_limit() -> Result<()> {
let request = SearchRequest::builder()
.query_text("agents")
.top_k(4)
.candidate_limit(500)
.query_profile(QueryProfile::Latency)
.build()?;
let resolved = request.resolve_query_profile();
assert_eq!(resolved.candidate_limit, 32);
Ok(())
}
#[test]
fn query_profile_recall_expands_candidate_limit() -> Result<()> {
let request = SearchRequest::builder()
.query_text("agents")
.top_k(5)
.candidate_limit(20)
.query_profile(QueryProfile::Recall)
.build()?;
let resolved = request.resolve_query_profile();
assert_eq!(resolved.candidate_limit, 200);
Ok(())
}
#[test]
fn runtime_config_applies_synchronous_profile() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(RuntimeConfig::durable())?;
let synchronous = db
.conn
.query_row("PRAGMA synchronous;", [], |row| row.get::<_, i64>(0))?;
assert_eq!(synchronous, 2);
Ok(())
}
#[test]
fn deterministic_tie_break_uses_chunk_id() -> Result<()> {
let db = SqlRite::open_in_memory()?;
db.ingest_chunks(&[
ChunkInput {
id: "z-chunk".to_string(),
doc_id: "doc-1".to_string(),
content: "same content".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({}),
source: None,
},
ChunkInput {
id: "a-chunk".to_string(),
doc_id: "doc-2".to_string(),
content: "same content".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({}),
source: None,
},
])?;
let results = db.search(SearchRequest {
query_embedding: Some(vec![1.0, 0.0]),
top_k: 2,
..Default::default()
})?;
assert_eq!(results.len(), 2);
assert_eq!(results[0].chunk_id, "a-chunk");
Ok(())
}
#[test]
fn deterministic_order_is_stable_across_repeated_runs() -> Result<()> {
let db = SqlRite::open_in_memory()?;
db.ingest_chunks(&[
ChunkInput {
id: "a-chunk".to_string(),
doc_id: "d1".to_string(),
content: "same".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({}),
source: None,
},
ChunkInput {
id: "b-chunk".to_string(),
doc_id: "d2".to_string(),
content: "same".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({}),
source: None,
},
])?;
let request = SearchRequest::builder()
.query_text("same")
.query_embedding(vec![1.0, 0.0])
.alpha(0.5)
.top_k(2)
.candidate_limit(2)
.build()?;
for _ in 0..5 {
let results = db.search(request.clone())?;
let ids: Vec<&str> = results.iter().map(|item| item.chunk_id.as_str()).collect();
assert_eq!(ids, vec!["a-chunk", "b-chunk"]);
}
Ok(())
}
#[test]
fn index_mode_rejects_mixed_embedding_dimensions() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(
RuntimeConfig::default().with_vector_index_mode(VectorIndexMode::BruteForce),
)?;
db.ingest_chunk(&ChunkInput {
id: "c1".to_string(),
doc_id: "d1".to_string(),
content: "alpha".to_string(),
embedding: vec![1.0, 0.0, 0.0],
metadata: json!({}),
source: None,
})?;
let err = db
.ingest_chunk(&ChunkInput {
id: "c2".to_string(),
doc_id: "d2".to_string(),
content: "beta".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({}),
source: None,
})
.expect_err("mixed dimensions should fail in indexed mode");
assert!(matches!(
err,
SqlRiteError::EmbeddingDimensionMismatch { .. }
));
Ok(())
}
#[test]
fn disabled_index_allows_mixed_embedding_dimensions() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(
RuntimeConfig::default().with_vector_index_mode(VectorIndexMode::Disabled),
)?;
db.ingest_chunk(&ChunkInput {
id: "c1".to_string(),
doc_id: "d1".to_string(),
content: "alpha".to_string(),
embedding: vec![1.0, 0.0, 0.0],
metadata: json!({}),
source: None,
})?;
db.ingest_chunk(&ChunkInput {
id: "c2".to_string(),
doc_id: "d2".to_string(),
content: "beta".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({}),
source: None,
})?;
assert_eq!(db.chunk_count()?, 2);
Ok(())
}
#[test]
fn lsh_ann_mode_rejects_mixed_embedding_dimensions() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(
RuntimeConfig::default().with_vector_index_mode(VectorIndexMode::LshAnn),
)?;
db.ingest_chunk(&ChunkInput {
id: "c1".to_string(),
doc_id: "d1".to_string(),
content: "alpha".to_string(),
embedding: vec![1.0, 0.0, 0.0],
metadata: json!({}),
source: None,
})?;
let err = db
.ingest_chunk(&ChunkInput {
id: "c2".to_string(),
doc_id: "d2".to_string(),
content: "beta".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({}),
source: None,
})
.expect_err("mixed dimensions should fail in lsh_ann mode");
assert!(matches!(
err,
SqlRiteError::EmbeddingDimensionMismatch { .. }
));
Ok(())
}
#[test]
fn hnsw_baseline_mode_rejects_mixed_embedding_dimensions() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(
RuntimeConfig::default().with_vector_index_mode(VectorIndexMode::HnswBaseline),
)?;
db.ingest_chunk(&ChunkInput {
id: "c1".to_string(),
doc_id: "d1".to_string(),
content: "alpha".to_string(),
embedding: vec![1.0, 0.0, 0.0],
metadata: json!({}),
source: None,
})?;
let err = db
.ingest_chunk(&ChunkInput {
id: "c2".to_string(),
doc_id: "d2".to_string(),
content: "beta".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({}),
source: None,
})
.expect_err("mixed dimensions should fail in hnsw_baseline mode");
assert!(matches!(
err,
SqlRiteError::EmbeddingDimensionMismatch { .. }
));
Ok(())
}
#[test]
fn ann_snapshot_round_trip_f16_precision() {
let original = vec![0.12345, -0.34567, 0.99991, -0.00123, 0.5, -0.5];
let encoded = encode_snapshot_vector(&original, VectorStorageKind::F16);
let decoded = decode_snapshot_vector(encoded);
assert_eq!(decoded.len(), original.len());
for (left, right) in decoded.iter().zip(original.iter()) {
assert!(
(left - right).abs() < 0.001,
"f16 round-trip drift too high"
);
}
}
#[test]
fn ann_snapshot_round_trip_int8_precision() {
let original = vec![1.0, -1.0, 0.75, -0.5, 0.1, -0.05, 0.0];
let encoded = encode_snapshot_vector(&original, VectorStorageKind::Int8);
let decoded = decode_snapshot_vector(encoded);
assert_eq!(decoded.len(), original.len());
for (left, right) in decoded.iter().zip(original.iter()) {
assert!(
(left - right).abs() < 0.02,
"int8 round-trip drift too high"
);
}
}
#[test]
fn ann_snapshot_persists_for_file_backed_ann_index() -> Result<()> {
let dir = tempdir()?;
let db_path = dir.path().join("ann_snapshot_test.db");
let runtime = RuntimeConfig::default()
.with_vector_index_mode(VectorIndexMode::HnswBaseline)
.with_vector_storage_kind(VectorStorageKind::Int8)
.with_ann_persistence(true);
{
let db = SqlRite::open_with_config(&db_path, runtime)?;
db.ingest_chunks(&[
ChunkInput {
id: "c1".to_string(),
doc_id: "d1".to_string(),
content: "alpha".to_string(),
embedding: vec![1.0, 0.0, 0.0],
metadata: json!({}),
source: None,
},
ChunkInput {
id: "c2".to_string(),
doc_id: "d2".to_string(),
content: "beta".to_string(),
embedding: vec![0.8, 0.2, 0.0],
metadata: json!({}),
source: None,
},
])?;
}
let snapshot_path = ann_snapshot_path(
&db_path,
VectorIndexMode::HnswBaseline,
VectorStorageKind::Int8,
)
.expect("expected snapshot path");
let graph_paths = ann_graph_dump_paths(
&db_path,
VectorIndexMode::HnswBaseline,
VectorStorageKind::Int8,
)
.expect("expected ann graph paths");
let entry_sidecar_path = ann_entry_sidecar_path(
&db_path,
VectorIndexMode::HnswBaseline,
VectorStorageKind::Int8,
)
.expect("expected ann entry sidecar path");
assert!(snapshot_path.exists(), "snapshot file should be created");
assert!(
entry_sidecar_path.exists(),
"ann entry sidecar should be created"
);
assert!(
graph_paths.graph_path.exists(),
"ann graph file should be created"
);
assert!(
graph_paths.data_path.exists(),
"ann data file should be created"
);
let snapshot = load_ann_snapshot(&snapshot_path)?;
assert_eq!(snapshot.version, 1);
assert_eq!(snapshot.mode, "hnsw_baseline");
assert_eq!(snapshot.storage_kind, "int8");
assert_eq!(snapshot.entries.len(), 2);
assert!(
snapshot
.entries
.iter()
.all(|entry| matches!(entry.vector, AnnSnapshotVector::Int8 { .. })),
"expected int8 encoded vectors"
);
let sidecar_entries = load_ann_entry_sidecar(&entry_sidecar_path, VectorStorageKind::Int8)?;
assert_eq!(sidecar_entries.len(), 2);
assert_eq!(sidecar_entries[0].chunk_id, "c1");
assert_eq!(sidecar_entries[1].chunk_id, "c2");
Ok(())
}
#[test]
fn file_backed_ann_reopen_prefers_binary_entry_sidecar() -> Result<()> {
let dir = tempdir()?;
let db_path = dir.path().join("ann_entry_sidecar_reopen_test.db");
let runtime = RuntimeConfig::default()
.with_vector_index_mode(VectorIndexMode::HnswBaseline)
.with_vector_storage_kind(VectorStorageKind::F32)
.with_ann_persistence(true);
{
let db = SqlRite::open_with_config(&db_path, runtime.clone())?;
db.ingest_chunks(&[
ChunkInput {
id: "c1".to_string(),
doc_id: "d1".to_string(),
content: "alpha".to_string(),
embedding: vec![1.0, 0.0, 0.0],
metadata: json!({}),
source: None,
},
ChunkInput {
id: "c2".to_string(),
doc_id: "d2".to_string(),
content: "beta".to_string(),
embedding: vec![0.0, 1.0, 0.0],
metadata: json!({}),
source: None,
},
])?;
}
let entry_sidecar_path = ann_entry_sidecar_path(
&db_path,
VectorIndexMode::HnswBaseline,
VectorStorageKind::F32,
)
.expect("expected ann entry sidecar path");
let snapshot_path = ann_snapshot_path(
&db_path,
VectorIndexMode::HnswBaseline,
VectorStorageKind::F32,
)
.expect("expected snapshot path");
let graph_paths = ann_graph_dump_paths(
&db_path,
VectorIndexMode::HnswBaseline,
VectorStorageKind::F32,
)
.expect("expected ann graph paths");
assert!(entry_sidecar_path.exists(), "ann sidecar should be created");
assert!(snapshot_path.exists(), "json snapshot should be created");
assert!(
graph_paths.graph_path.exists(),
"graph dump should be created"
);
assert!(
graph_paths.data_path.exists(),
"data dump should be created"
);
let conn = Connection::open(&db_path)?;
conn.execute(
"UPDATE chunks SET embedding = zeroblob(1), embedding_dim = 3",
[],
)?;
drop(conn);
fs::remove_file(&snapshot_path)?;
save_ann_entry_sidecar(
&entry_sidecar_path,
VectorStorageKind::F32,
&[
VectorEntryRecord {
chunk_key: 1,
chunk_id: "c1".to_string(),
embedding: vec![1.0, 0.0, 0.0],
},
VectorEntryRecord {
chunk_key: 2,
chunk_id: "c2".to_string(),
embedding: vec![0.0, 1.0, 0.0],
},
],
)?;
let graph_bytes = fs::read(&graph_paths.graph_path)?;
fs::write(&graph_paths.graph_path, graph_bytes)?;
let data_bytes = fs::read(&graph_paths.data_path)?;
fs::write(&graph_paths.data_path, data_bytes)?;
let reopened = SqlRite::open_with_config(&db_path, runtime)?;
let index = reopened
.vector_index
.as_ref()
.expect("expected vector index")
.borrow();
assert!(
index.graph_ready(),
"reopen should load the HNSW graph snapshot eagerly"
);
drop(index);
let results = reopened.search(SearchRequest {
query_embedding: Some(vec![1.0, 0.0, 0.0]),
top_k: 1,
candidate_limit: 5,
..Default::default()
})?;
assert_eq!(results.len(), 1);
assert_eq!(results[0].chunk_id, "c1");
Ok(())
}
#[test]
fn exact_segment_snapshot_round_trip_int8_precision() -> Result<()> {
let dir = tempdir()?;
let path = dir.path().join("exact_segment_round_trip.bin");
let original = vec![
VectorEntryRecord {
chunk_key: 1,
chunk_id: "c1".to_string(),
embedding: vec![1.0, -1.0, 0.25, -0.125],
},
VectorEntryRecord {
chunk_key: 2,
chunk_id: "c2".to_string(),
embedding: vec![0.0, 0.5, -0.75, 0.9],
},
];
save_exact_segment_snapshot(&path, VectorStorageKind::Int8, &original)?;
let decoded = load_exact_segment_snapshot(&path, VectorStorageKind::Int8)?;
assert_eq!(decoded.len(), original.len());
for (expected, actual) in original.iter().zip(decoded.iter()) {
assert_eq!(actual.chunk_key, expected.chunk_key);
assert_eq!(actual.chunk_id, expected.chunk_id);
assert_eq!(actual.embedding.len(), expected.embedding.len());
for (left, right) in actual.embedding.iter().zip(expected.embedding.iter()) {
assert!(
(left - right).abs() < 0.02,
"exact segment int8 round-trip drift too high"
);
}
}
Ok(())
}
#[test]
fn exact_segment_persists_for_file_backed_bruteforce_index() -> Result<()> {
let dir = tempdir()?;
let db_path = dir.path().join("exact_segment_test.db");
let runtime = RuntimeConfig::default()
.with_vector_index_mode(VectorIndexMode::BruteForce)
.with_vector_storage_kind(VectorStorageKind::Int8)
.with_ann_persistence(true);
{
let db = SqlRite::open_with_config(&db_path, runtime)?;
db.ingest_chunks(&[
ChunkInput {
id: "c1".to_string(),
doc_id: "d1".to_string(),
content: "alpha".to_string(),
embedding: vec![1.0, 0.0, 0.0],
metadata: json!({}),
source: None,
},
ChunkInput {
id: "c2".to_string(),
doc_id: "d2".to_string(),
content: "beta".to_string(),
embedding: vec![0.8, 0.2, 0.0],
metadata: json!({}),
source: None,
},
])?;
}
let segment_path = exact_segment_path(&db_path, VectorStorageKind::Int8)
.expect("expected exact segment path");
assert!(
segment_path.exists(),
"exact segment file should be created"
);
let entries = load_exact_segment_snapshot(&segment_path, VectorStorageKind::Int8)?;
assert_eq!(entries.len(), 2);
assert_eq!(entries[0].chunk_id, "c1");
assert_eq!(entries[1].chunk_id, "c2");
Ok(())
}
#[test]
fn file_backed_bruteforce_reopen_prefers_exact_segment_sidecar() -> Result<()> {
let dir = tempdir()?;
let db_path = dir.path().join("exact_segment_reopen_test.db");
let runtime = RuntimeConfig::default()
.with_vector_index_mode(VectorIndexMode::BruteForce)
.with_vector_storage_kind(VectorStorageKind::F32)
.with_ann_persistence(true);
{
let db = SqlRite::open_with_config(&db_path, runtime.clone())?;
db.ingest_chunks(&[
ChunkInput {
id: "c1".to_string(),
doc_id: "d1".to_string(),
content: "alpha".to_string(),
embedding: vec![1.0, 0.0, 0.0],
metadata: json!({}),
source: None,
},
ChunkInput {
id: "c2".to_string(),
doc_id: "d2".to_string(),
content: "beta".to_string(),
embedding: vec![0.0, 1.0, 0.0],
metadata: json!({}),
source: None,
},
])?;
}
let segment_path = exact_segment_path(&db_path, VectorStorageKind::F32)
.expect("expected exact segment path");
assert!(
segment_path.exists(),
"exact segment file should be created"
);
let conn = Connection::open(&db_path)?;
conn.execute(
"UPDATE chunks SET embedding = zeroblob(1), embedding_dim = 3",
[],
)?;
drop(conn);
save_exact_segment_snapshot(
&segment_path,
VectorStorageKind::F32,
&[
VectorEntryRecord {
chunk_key: 1,
chunk_id: "c1".to_string(),
embedding: vec![1.0, 0.0, 0.0],
},
VectorEntryRecord {
chunk_key: 2,
chunk_id: "c2".to_string(),
embedding: vec![0.0, 1.0, 0.0],
},
],
)?;
let reopened = SqlRite::open_with_config(&db_path, runtime)?;
let results = reopened.search(SearchRequest {
query_embedding: Some(vec![1.0, 0.0, 0.0]),
top_k: 1,
candidate_limit: 5,
..Default::default()
})?;
assert_eq!(results.len(), 1);
assert_eq!(results[0].chunk_id, "c1");
Ok(())
}
#[test]
fn compaction_deduplicates_chunks_and_rebuilds_index() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(
RuntimeConfig::default().with_vector_index_mode(VectorIndexMode::BruteForce),
)?;
db.ingest_chunks(&[
ChunkInput {
id: "c1".to_string(),
doc_id: "d1".to_string(),
content: "same-content-a".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({"tenant": "acme", "content_hash": "hash-1"}),
source: None,
},
ChunkInput {
id: "c2".to_string(),
doc_id: "d1".to_string(),
content: "same-content-b".to_string(),
embedding: vec![0.9, 0.1],
metadata: json!({"tenant": "acme", "content_hash": "hash-1"}),
source: None,
},
ChunkInput {
id: "c3".to_string(),
doc_id: "d1".to_string(),
content: "different-content".to_string(),
embedding: vec![0.0, 1.0],
metadata: json!({"tenant": "acme", "content_hash": "hash-2"}),
source: None,
},
])?;
let report = db.compact(CompactionOptions {
dedupe_by_content_hash: true,
prune_orphan_documents: false,
wal_checkpoint_truncate: false,
analyze: false,
vacuum: false,
})?;
assert_eq!(report.before_chunks, 3);
assert_eq!(report.after_chunks, 2);
assert_eq!(report.removed_chunks, 1);
assert_eq!(report.deduplicated_chunks, 1);
assert!(report.vector_index_rebuilt);
assert_eq!(
db.vector_index_stats()
.map(|stats| stats.entries)
.unwrap_or(0),
2
);
Ok(())
}
#[test]
fn compaction_prunes_orphan_documents() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(RuntimeConfig::default())?;
db.ingest_chunk(&ChunkInput {
id: "c1".to_string(),
doc_id: "d1".to_string(),
content: "active".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({"tenant": "acme", "content_hash": "hash-1"}),
source: None,
})?;
db.conn.execute(
"INSERT INTO documents (id, source, metadata) VALUES (?1, ?2, '{}')",
params!["orphan-doc", Option::<String>::None],
)?;
let report = db.compact(CompactionOptions {
dedupe_by_content_hash: false,
prune_orphan_documents: true,
wal_checkpoint_truncate: false,
analyze: false,
vacuum: false,
})?;
assert_eq!(report.before_documents, 2);
assert_eq!(report.after_documents, 1);
assert_eq!(report.orphan_documents_removed, 1);
Ok(())
}
#[test]
fn vector_search_falls_back_to_bruteforce_when_index_absent() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(
RuntimeConfig::default().with_vector_index_mode(VectorIndexMode::Disabled),
)?;
db.ingest_chunk(&ChunkInput {
id: "best".to_string(),
doc_id: "d1".to_string(),
content: "best".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({}),
source: None,
})?;
db.ingest_chunk(&ChunkInput {
id: "recent-noise".to_string(),
doc_id: "d2".to_string(),
content: "noise".to_string(),
embedding: vec![0.0, 1.0],
metadata: json!({}),
source: None,
})?;
let results = db.search(
SearchRequest::builder()
.query_embedding(vec![1.0, 0.0])
.candidate_limit(1)
.top_k(1)
.build()?,
)?;
assert_eq!(results.len(), 1);
assert_eq!(results[0].chunk_id, "best");
Ok(())
}
#[test]
fn vector_search_falls_back_to_bruteforce_on_index_dimension_mismatch() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(
RuntimeConfig::default().with_vector_index_mode(VectorIndexMode::BruteForce),
)?;
db.ingest_chunk(&ChunkInput {
id: "indexed-3d".to_string(),
doc_id: "d-indexed".to_string(),
content: "indexed".to_string(),
embedding: vec![1.0, 0.0, 0.0],
metadata: json!({}),
source: None,
})?;
db.conn.execute(
"INSERT INTO documents (id, source, metadata) VALUES (?1, ?2, '{}')
ON CONFLICT(id) DO UPDATE SET source = excluded.source",
params!["d-raw-1", Option::<String>::None],
)?;
db.conn.execute(
"INSERT INTO chunks (id, doc_id, content, metadata, embedding, embedding_dim)
VALUES (?1, ?2, ?3, '{}', ?4, ?5)",
params![
"target-2d",
"d-raw-1",
"target",
encode_embedding(&[1.0, 0.0]),
2
],
)?;
db.conn.execute(
"INSERT INTO documents (id, source, metadata) VALUES (?1, ?2, '{}')
ON CONFLICT(id) DO UPDATE SET source = excluded.source",
params!["d-raw-2", Option::<String>::None],
)?;
db.conn.execute(
"INSERT INTO chunks (id, doc_id, content, metadata, embedding, embedding_dim)
VALUES (?1, ?2, ?3, '{}', ?4, ?5)",
params![
"recent-noise-2d",
"d-raw-2",
"noise",
encode_embedding(&[0.0, 1.0]),
2
],
)?;
let results = db.search(
SearchRequest::builder()
.query_embedding(vec![1.0, 0.0])
.candidate_limit(1)
.top_k(1)
.build()?,
)?;
assert_eq!(results.len(), 1);
assert_eq!(results[0].chunk_id, "target-2d");
Ok(())
}
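// A batch mixing embedding dimensions fails as a whole with
// EmbeddingDimensionMismatch, leaving zero chunks behind.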
#[test]
fn ingest_chunks_is_atomic_on_dimension_validation_error() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(
RuntimeConfig::default().with_vector_index_mode(VectorIndexMode::BruteForce),
)?;
let err = db
.ingest_chunks(&[
ChunkInput {
id: "ok".to_string(),
doc_id: "d1".to_string(),
content: "first".to_string(),
embedding: vec![1.0, 0.0, 0.0],
metadata: json!({}),
source: None,
},
ChunkInput {
id: "bad".to_string(),
doc_id: "d2".to_string(),
content: "second".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({}),
source: None,
},
])
.expect_err("mixed dimensions in one batch should fail");
assert!(matches!(
err,
SqlRiteError::EmbeddingDimensionMismatch { .. }
));
assert_eq!(db.chunk_count()?, 0);
Ok(())
}
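// FTS candidate selection must surface a lexical match buried behind many
// newer chunks, even with a small candidate_limit.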
#[test]
fn text_search_uses_fts_candidates_not_recent_window() -> Result<()> {
let db = SqlRite::open_in_memory()?;
if !db.fts_enabled {
return Ok(());
}
db.ingest_chunk(&ChunkInput {
id: "target".to_string(),
doc_id: "doc-target".to_string(),
content: "ultrauniqueterm retrieval anchor".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({"tenant": "acme"}),
source: None,
})?;
for idx in 0..20 {
db.ingest_chunk(&ChunkInput {
id: format!("noise-{idx}"),
doc_id: format!("doc-noise-{idx}"),
content: format!("background chunk {idx} with no lexical match"),
embedding: vec![0.0, 1.0],
metadata: json!({"tenant": "acme"}),
source: None,
})?;
}
let results = db.search(
SearchRequest::builder()
.query_text("ultrauniqueterm")
.top_k(1)
.candidate_limit(5)
.build()?,
)?;
assert_eq!(results.len(), 1);
assert_eq!(results[0].chunk_id, "target");
Ok(())
}
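// Metadata filters apply during FTS candidate gathering, so candidate_limit = 1
// still yields the chunk from the requested tenant.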
#[test]
fn text_search_applies_filters_during_fts_candidate_selection() -> Result<()> {
let db = SqlRite::open_in_memory()?;
if !db.fts_enabled {
return Ok(());
}
db.ingest_chunk(&ChunkInput {
id: "beta-hit".to_string(),
doc_id: "doc-beta".to_string(),
content: "tenantscopedtoken appears here".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({"tenant": "beta"}),
source: None,
})?;
db.ingest_chunk(&ChunkInput {
id: "acme-hit".to_string(),
doc_id: "doc-acme".to_string(),
content: "tenantscopedtoken appears here".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({"tenant": "acme"}),
source: None,
})?;
let results = db.search(
SearchRequest::builder()
.query_text("tenantscopedtoken")
.metadata_filter("tenant", "beta")
.top_k(1)
.candidate_limit(1)
.build()?,
)?;
assert_eq!(results.len(), 1);
assert_eq!(results[0].chunk_id, "beta-hit");
Ok(())
}
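// HNSW-backed vector search honors metadata filters: the best hit within the
// filtered tenant wins over the global nearest neighbor.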
#[test]
fn hnsw_vector_search_applies_metadata_filter() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(
RuntimeConfig::default().with_vector_index_mode(VectorIndexMode::HnswBaseline),
)?;
db.ingest_chunk(&ChunkInput {
id: "acme-top".to_string(),
doc_id: "doc-acme".to_string(),
content: "acme vector".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({"tenant": "acme"}),
source: None,
})?;
db.ingest_chunk(&ChunkInput {
id: "beta-top".to_string(),
doc_id: "doc-beta".to_string(),
content: "beta vector".to_string(),
embedding: vec![0.99, 0.01],
metadata: json!({"tenant": "beta"}),
source: None,
})?;
db.ingest_chunk(&ChunkInput {
id: "beta-second".to_string(),
doc_id: "doc-beta-2".to_string(),
content: "beta vector second".to_string(),
embedding: vec![0.95, 0.05],
metadata: json!({"tenant": "beta"}),
source: None,
})?;
let results = db.search(
SearchRequest::builder()
.query_embedding(vec![1.0, 0.0])
.metadata_filter("tenant", "beta")
.candidate_limit(2)
.top_k(1)
.build()?,
)?;
assert_eq!(results.len(), 1);
assert_eq!(results[0].chunk_id, "beta-top");
assert_eq!(results[0].metadata["tenant"], "beta");
Ok(())
}
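// include_payloads(false) returns hits without materializing doc_id, content,
// or metadata.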
#[test]
fn filtered_vector_search_can_skip_payload_materialization() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(
RuntimeConfig::default().with_vector_index_mode(VectorIndexMode::HnswBaseline),
)?;
db.ingest_chunk(&ChunkInput {
id: "beta-top".to_string(),
doc_id: "doc-beta".to_string(),
content: "beta vector".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({"tenant": "beta"}),
source: None,
})?;
let results = db.search(
SearchRequest::builder()
.query_embedding(vec![1.0, 0.0])
.metadata_filter("tenant", "beta")
.candidate_limit(64)
.top_k(1)
.include_payloads(false)
.build()?,
)?;
assert_eq!(results.len(), 1);
assert_eq!(results[0].chunk_id, "beta-top");
assert_eq!(results[0].doc_id, "");
assert_eq!(results[0].content, "");
assert_eq!(results[0].metadata, Value::Null);
Ok(())
}
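// With alpha = 1.0, weighted fusion ranks purely by vector score; reciprocal
// rank fusion also credits the lexical ranking and promotes a different chunk.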
#[test]
fn rrf_changes_hybrid_ordering() -> Result<()> {
let db = SqlRite::open_in_memory()?;
db.ingest_chunks(&[
ChunkInput {
id: "z".to_string(),
doc_id: "d1".to_string(),
content: "noise".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({}),
source: None,
},
ChunkInput {
id: "b".to_string(),
doc_id: "d2".to_string(),
content: "target".to_string(),
embedding: vec![0.97, 0.03],
metadata: json!({}),
source: None,
},
ChunkInput {
id: "c".to_string(),
doc_id: "d3".to_string(),
content: "target".to_string(),
embedding: vec![0.94, 0.06],
metadata: json!({}),
source: None,
},
])?;
let weighted = db.search(
SearchRequest::builder()
.query_text("target")
.query_embedding(vec![1.0, 0.0])
.alpha(1.0)
.top_k(3)
.fusion_strategy(FusionStrategy::Weighted)
.build()?,
)?;
assert_eq!(weighted[0].chunk_id, "z");
let rrf = db.search(
SearchRequest::builder()
.query_text("target")
.query_embedding(vec![1.0, 0.0])
.alpha(1.0)
.top_k(3)
.reciprocal_rank_fusion(1.0)
.build()?,
)?;
assert_eq!(rrf[0].chunk_id, "b");
Ok(())
}
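// The per-hit FTS score lookup is skipped only for hybrid queries whose
// candidate counts reach HYBRID_FTS_SCORE_LOOKUP_SKIP_CANDIDATE_LIMIT.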
#[test]
fn skip_fts_score_lookup_for_large_vector_hybrid_candidates() {
assert!(should_skip_fts_score_lookup(
true,
true,
HYBRID_FTS_SCORE_LOOKUP_SKIP_CANDIDATE_LIMIT,
HYBRID_FTS_SCORE_LOOKUP_SKIP_CANDIDATE_LIMIT
));
assert!(should_skip_fts_score_lookup(
true,
true,
2000,
HYBRID_FTS_SCORE_LOOKUP_SKIP_CANDIDATE_LIMIT
));
}
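// Queries below the skip threshold, or missing a leg of the hybrid pair, keep
// the FTS score lookup.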
#[test]
fn keep_fts_score_lookup_for_small_or_non_vector_queries() {
assert!(!should_skip_fts_score_lookup(true, true, 50, 50));
assert!(!should_skip_fts_score_lookup(false, true, 1000, 1000));
assert!(!should_skip_fts_score_lookup(true, false, 1000, 1000));
assert!(!should_skip_fts_score_lookup(true, true, 100, 1000));
}
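// Latency-profile and high-alpha (vector-weighted) hybrid queries plan
// vector-first.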
#[test]
fn hybrid_planner_selects_vector_first_for_latency_or_high_alpha() {
let latency_request = SearchRequest {
query_text: Some("agent memory".to_string()),
query_embedding: Some(vec![1.0, 0.0]),
query_profile: QueryProfile::Latency,
..Default::default()
};
assert_eq!(
select_hybrid_planner_mode(&latency_request, true, true),
Some(HybridPlannerMode::VectorFirst)
);
let high_alpha_request = SearchRequest {
query_text: Some("agent memory".to_string()),
query_embedding: Some(vec![1.0, 0.0]),
alpha: 0.8,
..Default::default()
};
assert_eq!(
select_hybrid_planner_mode(&high_alpha_request, true, true),
Some(HybridPlannerMode::VectorFirst)
);
}
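// Low-alpha hybrid queries plan text-first; so does a hybrid query whose
// vector index is unavailable.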
#[test]
fn hybrid_planner_selects_text_first_for_low_alpha_or_missing_index() {
let low_alpha_request = SearchRequest {
query_text: Some("agent memory".to_string()),
query_embedding: Some(vec![1.0, 0.0]),
alpha: 0.2,
..Default::default()
};
assert_eq!(
select_hybrid_planner_mode(&low_alpha_request, true, true),
Some(HybridPlannerMode::TextFirst)
);
assert_eq!(
select_hybrid_planner_mode(&low_alpha_request, true, false),
Some(HybridPlannerMode::TextFirst)
);
}
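// Mid-alpha hybrid queries with both legs available take the balanced plan.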
#[test]
fn hybrid_planner_selects_balanced_for_mid_alpha_hybrid_queries() {
let balanced_request = SearchRequest {
query_text: Some("agent memory".to_string()),
query_embedding: Some(vec![1.0, 0.0]),
alpha: 0.5,
..Default::default()
};
assert_eq!(
select_hybrid_planner_mode(&balanced_request, true, true),
Some(HybridPlannerMode::BalancedHybrid)
);
}
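// The rerank window stays well below the 200-row candidate window: 40 for the
// single-leg plans and 60 for the balanced plan at top_k = 10.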
#[test]
fn hybrid_rerank_limit_stays_smaller_than_candidate_window() {
let request = SearchRequest {
query_text: Some("agent memory".to_string()),
query_embedding: Some(vec![1.0, 0.0]),
top_k: 10,
candidate_limit: 200,
query_profile: QueryProfile::Balanced,
..Default::default()
};
assert_eq!(
hybrid_rerank_candidate_limit(&request, Some(HybridPlannerMode::VectorFirst)),
40
);
assert_eq!(
hybrid_rerank_candidate_limit(&request, Some(HybridPlannerMode::TextFirst)),
40
);
assert_eq!(
hybrid_rerank_candidate_limit(&request, Some(HybridPlannerMode::BalancedHybrid)),
60
);
}
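// filtered_chunk_keys resolves doc_id and metadata filters through the
// in-memory filter index, returning chunk rowids as ChunkKey values.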
#[test]
fn filtered_chunk_keys_uses_in_memory_doc_and_metadata_index() -> Result<()> {
let db = SqlRite::open_in_memory()?;
db.ingest_chunks(&[
ChunkInput {
id: "chunk-a".to_string(),
doc_id: "doc-a".to_string(),
content: "tenant a memory".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({"tenant": "alpha", "topic": "memory"}),
source: None,
},
ChunkInput {
id: "chunk-b".to_string(),
doc_id: "doc-b".to_string(),
content: "tenant b ops".to_string(),
embedding: vec![0.0, 1.0],
metadata: json!({"tenant": "beta", "topic": "ops"}),
source: None,
},
])?;
let request = SearchRequest {
doc_id: Some("doc-a".to_string()),
metadata_filters: HashMap::from([("tenant".to_string(), "alpha".to_string())]),
..Default::default()
};
let filtered = db.filtered_chunk_keys(&request)?;
assert_eq!(filtered.len(), 1);
let chunk_key =
db.conn
.query_row("SELECT rowid FROM chunks WHERE id = 'chunk-a'", [], |row| {
row.get::<_, i64>(0)
})? as ChunkKey;
assert!(filtered.contains(&chunk_key));
Ok(())
}
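// update_chunk_metadata must refresh the filter index: the old tenant filter
// stops matching and the new one starts.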
#[test]
fn update_chunk_metadata_refreshes_filter_index() -> Result<()> {
let db = SqlRite::open_in_memory()?;
db.ingest_chunk(&ChunkInput {
id: "chunk-a".to_string(),
doc_id: "doc-a".to_string(),
content: "tenant alpha memory".to_string(),
embedding: vec![1.0, 0.0],
metadata: json!({"tenant": "alpha"}),
source: None,
})?;
db.update_chunk_metadata("chunk-a", &json!({"tenant": "beta"}))?;
let alpha_request = SearchRequest {
metadata_filters: HashMap::from([("tenant".to_string(), "alpha".to_string())]),
..Default::default()
};
assert!(db.filtered_chunk_keys(&alpha_request)?.is_empty());
let beta_request = SearchRequest {
metadata_filters: HashMap::from([("tenant".to_string(), "beta".to_string())]),
..Default::default()
};
let filtered = db.filtered_chunk_keys(&beta_request)?;
assert_eq!(filtered.len(), 1);
let chunk_key =
db.conn
.query_row("SELECT rowid FROM chunks WHERE id = 'chunk-a'", [], |row| {
row.get::<_, i64>(0)
})? as ChunkKey;
assert!(filtered.contains(&chunk_key));
Ok(())
}
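// Compile-time assertion that SqlRiteHandle is Send + Sync.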
#[test]
fn sqlrite_handle_is_send_sync() {
fn assert_send_sync<T: Send + Sync>() {}
assert_send_sync::<SqlRiteHandle>();
}
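// Text-only ingestion (no embeddings yet) still supports text search, counts,
// and the diagnostics report.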
#[test]
fn text_only_ingest_supports_text_search_and_diagnostics() -> Result<()> {
let db = SqlRite::open_in_memory()?;
db.ingest_text_chunks(&[
TextChunkInput::new("chunk-1", "doc-1", "local agent memory for retrieval")
.with_metadata(json!({"tenant": "acme"}))
.with_source("notes.md"),
TextChunkInput::new("chunk-2", "doc-1", "secondary note").with_source("notes.md"),
])?;
let results = db.search(SearchRequest::text_only("agent memory", 2))?;
assert_eq!(results.len(), 2);
assert_eq!(results[0].chunk_id, "chunk-1");
assert_eq!(db.chunk_count()?, 2);
assert_eq!(db.document_count()?, 1);
let diagnostics = db.diagnostics()?;
assert_eq!(diagnostics.chunk_count, 2);
assert_eq!(diagnostics.document_count, 1);
assert!(diagnostics.integrity_check_ok);
assert_eq!(diagnostics.schema_version, LATEST_SCHEMA_VERSION);
Ok(())
}
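// ingest_document_text applies the configured chunking strategy and reports
// one chunk id per stored chunk.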
#[test]
fn ingest_document_text_applies_builtin_chunking() -> Result<()> {
let db = SqlRite::open_in_memory()?;
let report = db.ingest_document_text(
"doc-chunked",
"abcdefghijABCDEFGHIJ1234567890",
DocumentIngestOptions::default().with_chunking(ChunkingStrategy::Fixed {
max_chars: 8,
overlap_chars: 2,
}),
)?;
assert!(report.chunk_count > 1);
assert_eq!(report.chunk_count, report.chunk_ids.len());
assert_eq!(db.document_count()?, 1);
assert_eq!(db.chunk_count()?, report.chunk_count);
Ok(())
}
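// Backfilling an embedding onto a text-only chunk makes it reachable through
// vector-only search.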
#[test]
fn update_chunk_embedding_backfills_vector_search_for_text_only_chunk() -> Result<()> {
let db = SqlRite::open_in_memory_with_config(
RuntimeConfig::default().with_vector_index_mode(VectorIndexMode::BruteForce),
)?;
db.ingest_text_chunk(&TextChunkInput::new(
"chunk-1",
"doc-1",
"text only until embeddings arrive",
))?;
db.update_chunk_embedding("chunk-1", vec![1.0, 0.0])?;
let results = db.search(SearchRequest::vector_only(vec![1.0, 0.0], 1))?;
assert_eq!(results.len(), 1);
assert_eq!(results[0].chunk_id, "chunk-1");
Ok(())
}
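// delete_by_doc_id removes the document's chunks and the document row itself.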
#[test]
fn delete_by_doc_id_removes_chunks_and_document() -> Result<()> {
let db = SqlRite::open_in_memory()?;
db.ingest_text_chunks(&[
TextChunkInput::new("chunk-1", "doc-1", "alpha"),
TextChunkInput::new("chunk-2", "doc-1", "beta"),
])?;
let deleted = db.delete_by_doc_id("doc-1")?;
assert_eq!(deleted, 2);
assert_eq!(db.chunk_count()?, 0);
assert_eq!(db.document_count()?, 0);
Ok(())
}
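// SqlRiteHandle supports the open/ingest/search/count pattern a multi-threaded
// gateway would use against a file-backed store.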
#[test]
fn sqlrite_handle_supports_concurrent_friendly_access_pattern() -> Result<()> {
let temp = tempfile::tempdir()?;
let path = temp.path().join("handle.db");
let handle = SqlRiteHandle::open(&path)?;
handle.ingest_text_chunk(&TextChunkInput::new(
"chunk-1",
"doc-1",
"gateway request handlers need shared access",
))?;
let results = handle.search(SearchRequest::text_only("shared access", 1))?;
assert_eq!(results.len(), 1);
assert_eq!(handle.document_count()?, 1);
Ok(())
}
}