bookforge-store 1.5.0

use std::{
    cell::RefCell,
    collections::HashMap,
    fs,
    path::{Path, PathBuf},
    time::{Duration, SystemTime, UNIX_EPOCH},
};

use bookforge_core::{
    Result as CoreResult,
    entity::EntityGender,
    glossary::{GlossaryCategory, GlossaryScopeKind, GlossaryStatus, GlossaryTerm},
    ir::BlockId,
    run_snapshot::RunConfigSnapshot,
    segment::{BlockTranslation, Segment},
};
use rusqlite::{Connection, OptionalExtension, params, types::Type};
use sha2::{Digest, Sha256};
use std::str::FromStr;

pub type Result<T> = std::result::Result<T, StoreError>;

#[derive(Debug, thiserror::Error)]
pub enum StoreError {
    #[error("I/O error: {0}")]
    Io(#[from] std::io::Error),

    #[error("SQLite error: {0}")]
    Sqlite(#[from] rusqlite::Error),

    #[error("core error: {0}")]
    Core(#[from] bookforge_core::BookforgeError),

    #[error("serialization error: {0}")]
    Serialization(String),
}

pub struct JobStore {
    conn: RefCell<Connection>,
    path: PathBuf,
}

#[derive(Debug, Clone)]
pub struct JobRecord {
    pub id: String,
    pub input_path: PathBuf,
    pub input_snapshot_path: Option<PathBuf>,
    pub input_sha256: Option<String>,
    pub output_path: PathBuf,
    pub input_hash: String,
    pub source_lang: Option<String>,
    pub target_lang: String,
    pub provider: String,
    pub model: String,
    pub base_url: Option<String>,
    pub api_key_env: Option<String>,
    pub status: String,
    pub events_path: Option<PathBuf>,
    pub report_json_path: Option<PathBuf>,
    pub report_markdown_path: Option<PathBuf>,
    pub book_id: Option<String>,
    pub series_id: Option<String>,
}

#[derive(Debug, Clone, Default)]
pub struct JobSummary {
    pub id: String,
    pub status: String,
    pub total_segments: usize,
    pub succeeded: usize,
    pub failed: usize,
    pub needs_review: usize,
    pub retry_pending: usize,
    pub cached: usize,
    pub retried: usize,
    pub input_tokens: u64,
    pub input_cached_tokens: u64,
    pub output_tokens: u64,
}

#[derive(Debug, Clone, Copy)]
pub struct CreateJob<'a> {
    pub input: &'a Path,
    pub output: &'a Path,
    pub source_lang: Option<&'a str>,
    pub target_lang: &'a str,
    pub provider: &'a str,
    pub model: &'a str,
    pub base_url: Option<&'a str>,
    pub api_key_env: Option<&'a str>,
    pub book_id: Option<&'a str>,
    pub series_id: Option<&'a str>,
}

#[derive(Debug, Clone)]
pub struct SegmentRecord {
    pub id: String,
    pub status: String,
    pub attempts: usize,
    pub error: Option<String>,
    pub input_tokens: Option<u64>,
    pub input_cached_tokens: Option<u64>,
    pub output_tokens: Option<u64>,
    pub tokens_estimated: bool,
}

#[derive(Debug, Clone, PartialEq, Eq)]
pub struct StoredBlockTranslation {
    pub segment_id: String,
    pub block_id: String,
    pub text: String,
}

#[derive(Debug, Clone, PartialEq, Eq)]
pub struct StoredSegmentTranslation {
    pub segment_id: String,
    pub ordinal: usize,
    pub status: String,
    pub error: Option<String>,
    pub translated_text: String,
    pub blocks: Vec<BlockTranslation>,
}

#[derive(Debug, Clone, PartialEq, Eq)]
pub struct CachedTranslation {
    pub translated_text: String,
    pub blocks: Vec<BlockTranslation>,
}

#[derive(Debug, Clone, Copy)]
pub struct SaveTranslation<'a> {
    pub job_id: &'a str,
    pub segment_id: &'a str,
    pub translated_text: &'a str,
    pub blocks: &'a [BlockTranslation],
    pub provider: &'a str,
    pub model: &'a str,
    pub prompt_version: &'a str,
    pub input_tokens: Option<u64>,
    pub input_cached_tokens: Option<u64>,
    pub output_tokens: Option<u64>,
    pub tokens_estimated: bool,
}

#[derive(Debug, Clone, Copy)]
pub struct SaveNeedsReview<'a> {
    pub job_id: &'a str,
    pub segment_id: &'a str,
    pub preserved_text: &'a str,
    pub blocks: &'a [BlockTranslation],
    pub provider: &'a str,
    pub model: &'a str,
    pub prompt_version: &'a str,
    pub error: &'a str,
    pub input_tokens: Option<u64>,
    pub input_cached_tokens: Option<u64>,
    pub output_tokens: Option<u64>,
    pub tokens_estimated: bool,
}

#[derive(Debug, Clone, Copy)]
pub struct SaveCachedTranslation<'a> {
    pub job_id: &'a str,
    pub segment_id: &'a str,
    pub translated_text: &'a str,
    pub blocks: &'a [BlockTranslation],
    pub provider: &'a str,
    pub model: &'a str,
    pub prompt_version: &'a str,
}

#[derive(Debug, Clone, Copy)]
pub struct CacheLookupRequest<'a> {
    pub prompt_version: &'a str,
    pub provider: &'a str,
    pub model: &'a str,
    pub source_lang: Option<&'a str>,
    pub target_lang: &'a str,
    pub cache_namespace: &'a str,
}

#[derive(Debug, Clone, Copy)]
pub struct NewSegmentFlag<'a> {
    pub job_id: &'a str,
    pub segment_id: &'a str,
    pub kind: &'a str,
    pub note: Option<&'a str>,
    pub suggested_source: Option<&'a str>,
    pub suggested_target: Option<&'a str>,
    pub consumed: bool,
}

#[derive(Debug, Clone, Copy, Default)]
pub struct GlossaryFilter<'a> {
    pub scope_kind: Option<GlossaryScopeKind>,
    pub scope_id: Option<&'a str>,
    pub source_language: Option<&'a str>,
    pub target_language: Option<&'a str>,
    pub active_only: bool,
}

#[derive(Debug, Clone, Copy)]
pub struct NewGlossaryCandidate<'a> {
    pub source_text: &'a str,
    pub category: GlossaryCategory,
    pub source_count: usize,
}

#[derive(Debug, Clone, Copy, Default, PartialEq, Eq)]
pub struct GlossaryCandidateUpsertResult {
    pub inserted: usize,
    pub updated: usize,
    pub skipped: usize,
}

#[derive(Debug, Clone, PartialEq, Eq)]
pub struct StoredGlossaryCandidate {
    pub id: i64,
    pub source_text: String,
    pub target_text: Option<String>,
    pub category: GlossaryCategory,
    pub notes: Option<String>,
    pub case_sensitive: bool,
    pub always_active: bool,
    pub status: GlossaryStatus,
    pub source_language: String,
    pub target_language: String,
    pub source_count: usize,
}

#[derive(Debug, Clone, Copy)]
pub struct NewStyleSheet<'a> {
    pub scope_kind: GlossaryScopeKind,
    pub scope_id: Option<&'a str>,
    pub target_language: &'a str,
    pub content_toml: &'a str,
    pub fingerprint: &'a str,
}

#[derive(Debug, Clone, PartialEq, Eq)]
pub struct StoredStyleSheet {
    pub id: i64,
    pub scope_kind: GlossaryScopeKind,
    pub scope_id: Option<String>,
    pub target_language: String,
    pub content_toml: String,
    pub fingerprint: String,
}

#[derive(Debug, Clone, Copy)]
pub struct NewEntity<'a> {
    pub scope_kind: GlossaryScopeKind,
    pub scope_id: Option<&'a str>,
    pub source_name: &'a str,
    pub target_name: &'a str,
    pub gender_target: Option<EntityGender>,
    pub role: Option<&'a str>,
    pub notes: Option<&'a str>,
    pub source_language: &'a str,
    pub target_language: &'a str,
}

#[derive(Debug, Clone, PartialEq, Eq)]
pub struct StoredEntity {
    pub id: i64,
    pub scope_kind: GlossaryScopeKind,
    pub scope_id: Option<String>,
    pub source_name: String,
    pub target_name: String,
    pub gender_target: Option<EntityGender>,
    pub role: Option<String>,
    pub notes: Option<String>,
    pub source_language: String,
    pub target_language: String,
}

#[derive(Debug, Clone)]
pub struct StorageDoctor {
    pub database_path: PathBuf,
    pub database_exists: bool,
    pub wal_present: bool,
    pub shm_present: bool,
    pub journal_mode: String,
    pub integrity_check: String,
    pub wal_sidecars_normal: bool,
    pub note: String,
}

pub fn run_doctor(db_path: Option<PathBuf>) -> Result<StorageDoctor> {
    let path = db_path.unwrap_or_else(|| PathBuf::from(".bookforge/jobs.sqlite"));
    let database_exists = path.exists();
    let wal_path = path.with_extension("sqlite-wal");
    let shm_path = path.with_extension("sqlite-shm");
    let wal_present = wal_path.exists();
    let shm_present = shm_path.exists();

    let (journal_mode, integrity_check, wal_sidecars_normal, note) = if database_exists {
        let conn = Connection::open(&path)?;
        let journal_mode: String = conn
            .pragma_query_value(None, "journal_mode", |row| row.get(0))
            .unwrap_or_else(|_| "unknown".to_string());
        let integrity_check: String = conn
            .pragma_query_value(None, "integrity_check", |row| row.get(0))
            .unwrap_or_else(|_| "error".to_string());
        let _ = conn.execute_batch("PRAGMA wal_checkpoint(PASSIVE);");

        let wal_sidecars_normal = if wal_present || shm_present {
            integrity_check == "ok"
        } else {
            true
        };

        let note = if wal_present || shm_present {
            "WAL sidecar files are normal. SQLite will recover them automatically. \
             Do not delete them manually while BookForge is running."
                .to_string()
        } else {
            String::new()
        };

        (journal_mode, integrity_check, wal_sidecars_normal, note)
    } else {
        ("unknown".to_string(), String::new(), true, String::new())
    };

    Ok(StorageDoctor {
        database_path: path,
        database_exists,
        wal_present,
        shm_present,
        journal_mode,
        integrity_check,
        wal_sidecars_normal,
        note,
    })
}

impl JobStore {
    pub fn open_default() -> Result<Self> {
        Self::open(".bookforge/jobs.sqlite")
    }

    pub fn open(path: impl Into<PathBuf>) -> Result<Self> {
        let path = path.into();
        if let Some(parent) = path.parent() {
            fs::create_dir_all(parent)?;
        }
        let conn = Connection::open(&path)?;

        conn.busy_timeout(Duration::from_secs(5))?;
        conn.pragma_update(None, "journal_mode", "WAL")?;
        conn.pragma_update(None, "synchronous", "NORMAL")?;
        conn.pragma_update(None, "foreign_keys", "ON")?;

        let store = Self {
            conn: RefCell::new(conn),
            path,
        };
        store.migrate()?;
        Ok(store)
    }

    pub fn path(&self) -> &Path {
        &self.path
    }

    pub fn create_job(&self, request: CreateJob<'_>) -> Result<JobRecord> {
        let input_hash = file_hash(request.input)?;
        let id = format!("job_{}_{}", unix_timestamp_nanos(), &input_hash[..12]);
        let now = timestamp_string();
        let input_path = request.input.to_path_buf();
        let output_path = request.output.to_path_buf();
        let conn = self.conn.borrow();
        conn.execute(
            "INSERT INTO jobs
             (id, input_path, output_path, input_hash, source_lang, target_lang, provider, model, base_url, api_key_env, book_id, series_id, status, created_at, updated_at)
             VALUES (?1, ?2, ?3, ?4, ?5, ?6, ?7, ?8, ?9, ?10, ?11, ?12, 'running', ?13, ?13)",
            params![
                id,
                input_path.to_string_lossy(),
                output_path.to_string_lossy(),
                input_hash,
                request.source_lang,
                request.target_lang,
                request.provider,
                request.model,
                request.base_url,
                request.api_key_env,
                request.book_id,
                request.series_id,
                now,
            ],
        )?;

        Ok(JobRecord {
            id,
            input_path,
            input_snapshot_path: None,
            input_sha256: None,
            output_path,
            input_hash,
            source_lang: request.source_lang.map(ToOwned::to_owned),
            target_lang: request.target_lang.to_string(),
            provider: request.provider.to_string(),
            model: request.model.to_string(),
            base_url: request.base_url.map(ToOwned::to_owned),
            api_key_env: request.api_key_env.map(ToOwned::to_owned),
            status: "running".to_string(),
            events_path: None,
            report_json_path: None,
            report_markdown_path: None,
            book_id: request.book_id.map(ToOwned::to_owned),
            series_id: request.series_id.map(ToOwned::to_owned),
        })
    }

    pub fn update_job_config_snapshot(
        &self,
        job_id: &str,
        snapshot: &RunConfigSnapshot,
    ) -> Result<()> {
        let json = serde_json::to_string(snapshot)
            .map_err(|e| StoreError::Serialization(e.to_string()))?;
        let conn = self.conn.borrow();
        conn.execute(
            "UPDATE jobs
             SET config_json = ?1,
                 events_path = ?2,
                 report_json_path = ?3,
                 report_markdown_path = ?4,
                 input_snapshot_path = ?5,
                 input_sha256 = ?6,
                 updated_at = ?7
             WHERE id = ?8",
            params![
                json,
                snapshot
                    .events_path
                    .as_ref()
                    .map(|path| path.to_string_lossy().to_string()),
                snapshot
                    .report_json_path
                    .as_ref()
                    .map(|path| path.to_string_lossy().to_string()),
                snapshot
                    .report_markdown_path
                    .as_ref()
                    .map(|path| path.to_string_lossy().to_string()),
                snapshot
                    .input_snapshot_path
                    .as_ref()
                    .map(|path| path.to_string_lossy().to_string()),
                snapshot.input_sha256.as_deref(),
                timestamp_string(),
                job_id,
            ],
        )?;
        Ok(())
    }

    pub fn update_job_input_snapshot(
        &self,
        job_id: &str,
        snapshot_path: &Path,
        input_sha256: &str,
    ) -> Result<()> {
        let conn = self.conn.borrow();
        conn.execute(
            "UPDATE jobs
             SET input_snapshot_path = ?1,
                 input_sha256 = ?2,
                 updated_at = ?3
             WHERE id = ?4",
            params![
                snapshot_path.to_string_lossy(),
                input_sha256,
                timestamp_string(),
                job_id
            ],
        )?;
        Ok(())
    }

    pub fn load_job_config_snapshot(&self, job_id: &str) -> Result<Option<RunConfigSnapshot>> {
        let conn = self.conn.borrow();
        let Some(json) = conn
            .query_row(
                "SELECT config_json FROM jobs WHERE id = ?1",
                params![job_id],
                |row| row.get::<_, Option<String>>(0),
            )
            .optional()?
            .flatten()
        else {
            return Ok(None);
        };

        serde_json::from_str(&json)
            .map(Some)
            .map_err(|e| StoreError::Serialization(e.to_string()))
    }

    pub fn update_job_event_path(&self, job_id: &str, path: &Path) -> Result<()> {
        let conn = self.conn.borrow();
        conn.execute(
            "UPDATE jobs SET events_path = ?1, updated_at = ?2 WHERE id = ?3",
            params![path.to_string_lossy(), timestamp_string(), job_id],
        )?;
        Ok(())
    }

    pub fn update_job_report_paths(
        &self,
        job_id: &str,
        json_path: &Path,
        markdown_path: &Path,
    ) -> Result<()> {
        let conn = self.conn.borrow();
        conn.execute(
            "UPDATE jobs
             SET report_json_path = ?1, report_markdown_path = ?2, updated_at = ?3
             WHERE id = ?4",
            params![
                json_path.to_string_lossy(),
                markdown_path.to_string_lossy(),
                timestamp_string(),
                job_id
            ],
        )?;
        Ok(())
    }

    pub fn update_job_output_path(&self, job_id: &str, path: &Path) -> Result<()> {
        let conn = self.conn.borrow();
        conn.execute(
            "UPDATE jobs SET output_path = ?1, updated_at = ?2 WHERE id = ?3",
            params![path.to_string_lossy(), timestamp_string(), job_id],
        )?;
        Ok(())
    }

    pub fn insert_segments(
        &self,
        job_id: &str,
        segments: &[Segment],
        prompt_version: &str,
        provider: &str,
        model: &str,
        cache_namespace: &str,
    ) -> Result<()> {
        let mut conn = self.conn.borrow_mut();
        let tx = conn.transaction()?;
        for segment in segments {
            tx.execute(
                "INSERT OR IGNORE INTO segments
                 (id, job_id, section_id, ordinal, source_hash, prompt_version, provider, model, status, attempts, cache_namespace)
                 VALUES (?1, ?2, ?3, ?4, ?5, ?6, ?7, ?8, 'queued', 0, ?9)",
                params![
                    segment.id.0,
                    job_id,
                    segment.section_id.0,
                    segment.ordinal as i64,
                    segment.checksum,
                    prompt_version,
                    provider,
                    model,
                    cache_namespace,
                ],
            )?;
        }
        tx.commit()?;
        Ok(())
    }

    pub fn save_translation(&self, request: SaveTranslation<'_>) -> Result<()> {
        let now = timestamp_string();
        let translated_hash = stable_hash(request.translated_text);
        {
            let conn = self.conn.borrow();
            conn.execute(
                "INSERT OR REPLACE INTO translations
                 (segment_id, job_id, translated_text, provider, model, prompt_version, created_at)
                 VALUES (?1, ?2, ?3, ?4, ?5, ?6, ?7)",
                params![
                    request.segment_id,
                    request.job_id,
                    request.translated_text,
                    request.provider,
                    request.model,
                    request.prompt_version,
                    now
                ],
            )?;
            replace_block_translations(&conn, request.job_id, request.segment_id, request.blocks)?;
            conn.execute(
                "UPDATE segments
                 SET status = 'succeeded',
                     attempts = attempts + 1,
                     tokens_input = ?1,
                     tokens_input_cached = ?2,
                     tokens_output = ?3,
                     tokens_estimated = ?4,
                     translated_hash = ?5,
                     error = NULL
                 WHERE job_id = ?6 AND id = ?7",
                params![
                    request.input_tokens.map(|value| value as i64),
                    request.input_cached_tokens.map(|value| value as i64),
                    request.output_tokens.map(|value| value as i64),
                    if request.tokens_estimated {
                        1_i64
                    } else {
                        0_i64
                    },
                    translated_hash,
                    request.job_id,
                    request.segment_id,
                ],
            )?;
        }
        self.touch_job(request.job_id, "running")?;
        Ok(())
    }

    pub fn save_needs_review(&self, request: SaveNeedsReview<'_>) -> Result<()> {
        let now = timestamp_string();
        let translated_hash = stable_hash(request.preserved_text);
        {
            let conn = self.conn.borrow();
            conn.execute(
                "INSERT OR REPLACE INTO translations
                 (segment_id, job_id, translated_text, provider, model, prompt_version, created_at)
                 VALUES (?1, ?2, ?3, ?4, ?5, ?6, ?7)",
                params![
                    request.segment_id,
                    request.job_id,
                    request.preserved_text,
                    request.provider,
                    request.model,
                    request.prompt_version,
                    now
                ],
            )?;
            replace_block_translations(&conn, request.job_id, request.segment_id, request.blocks)?;
            conn.execute(
                "UPDATE segments
                 SET status = 'needs_review',
                     attempts = attempts + 1,
                     tokens_input = ?1,
                     tokens_input_cached = ?2,
                     tokens_output = ?3,
                     tokens_estimated = ?4,
                     translated_hash = ?5,
                     error = ?6
                 WHERE job_id = ?7 AND id = ?8",
                params![
                    request.input_tokens.map(|value| value as i64),
                    request.input_cached_tokens.map(|value| value as i64),
                    request.output_tokens.map(|value| value as i64),
                    if request.tokens_estimated {
                        1_i64
                    } else {
                        0_i64
                    },
                    translated_hash,
                    request.error,
                    request.job_id,
                    request.segment_id
                ],
            )?;
        }
        self.touch_job(request.job_id, "needs_review")?;
        Ok(())
    }

    pub fn save_cached_translation(&self, request: SaveCachedTranslation<'_>) -> Result<()> {
        let now = timestamp_string();
        let translated_hash = stable_hash(request.translated_text);
        {
            let conn = self.conn.borrow();
            conn.execute(
                "INSERT OR REPLACE INTO translations
                 (segment_id, job_id, translated_text, provider, model, prompt_version, created_at)
                 VALUES (?1, ?2, ?3, ?4, ?5, ?6, ?7)",
                params![
                    request.segment_id,
                    request.job_id,
                    request.translated_text,
                    request.provider,
                    request.model,
                    request.prompt_version,
                    now
                ],
            )?;
            replace_block_translations(&conn, request.job_id, request.segment_id, request.blocks)?;
            conn.execute(
                "UPDATE segments
                 SET status = 'skipped_cached',
                     tokens_input = NULL,
                     tokens_input_cached = NULL,
                     tokens_output = NULL,
                     tokens_estimated = 0,
                     translated_hash = ?1,
                     error = NULL
                 WHERE job_id = ?2 AND id = ?3",
                params![translated_hash, request.job_id, request.segment_id],
            )?;
        }
        self.touch_job(request.job_id, "running")?;
        Ok(())
    }

    pub fn mark_job_complete(&self, job_id: &str) -> Result<()> {
        self.touch_job(job_id, "succeeded")
    }

    pub fn mark_job_running(&self, job_id: &str) -> Result<()> {
        self.touch_job(job_id, "running")
    }

    pub fn mark_job_succeeded(&self, job_id: &str) -> Result<()> {
        self.mark_job_complete(job_id)
    }

    pub fn mark_job_needs_review(&self, job_id: &str) -> Result<()> {
        self.touch_job(job_id, "needs_review")
    }

    pub fn mark_job_interrupted(&self, job_id: &str) -> Result<()> {
        self.touch_job(job_id, "interrupted")
    }

    pub fn mark_job_failed(&self, job_id: &str) -> Result<()> {
        self.touch_job(job_id, "failed")
    }

    pub fn mark_segment_failed(&self, job_id: &str, segment_id: &str, error: &str) -> Result<()> {
        {
            let conn = self.conn.borrow();
            conn.execute(
                "UPDATE segments SET status = 'failed', attempts = attempts + 1, error = ?1 WHERE job_id = ?2 AND id = ?3",
                params![error, job_id, segment_id],
            )?;
        }
        self.touch_job(job_id, "failed")?;
        Ok(())
    }

    pub fn mark_segment_failed_if_unfinished(
        &self,
        job_id: &str,
        segment_id: &str,
        error: &str,
    ) -> Result<()> {
        {
            let conn = self.conn.borrow();
            conn.execute(
                "UPDATE segments
                 SET status = 'failed', attempts = attempts + 1, error = ?1
                 WHERE job_id = ?2
                   AND id = ?3
                   AND status NOT IN ('succeeded', 'skipped_cached', 'needs_review')",
                params![error, job_id, segment_id],
            )?;
        }
        self.touch_job(job_id, "failed")?;
        Ok(())
    }

    pub fn mark_unfinished_segments_failed(
        &self,
        job_id: &str,
        candidate_segment_ids: &[String],
        error: &str,
    ) -> Result<usize> {
        const SQLITE_IN_CHUNK_SIZE: usize = 900;
        let mut updated = 0;

        for chunk in candidate_segment_ids.chunks(SQLITE_IN_CHUNK_SIZE) {
            if chunk.is_empty() {
                continue;
            }

            let placeholders = std::iter::repeat_n("?", chunk.len())
                .collect::<Vec<_>>()
                .join(", ");
            let sql = format!(
                "UPDATE segments
                 SET status = 'failed', attempts = attempts + 1, error = ?
                 WHERE job_id = ?
                   AND id IN ({placeholders})
                   AND status NOT IN ('succeeded', 'skipped_cached', 'needs_review')"
            );

            let conn = self.conn.borrow();
            let mut params: Vec<&dyn rusqlite::types::ToSql> = Vec::with_capacity(chunk.len() + 2);
            params.push(&error);
            params.push(&job_id);
            for id in chunk {
                params.push(id);
            }
            updated += conn.execute(&sql, params.as_slice())?;
        }

        if updated > 0 {
            self.touch_job(job_id, "failed")?;
        }
        Ok(updated)
    }

    pub fn get_job(&self, job_id: &str) -> Result<Option<JobRecord>> {
        let conn = self.conn.borrow();
        conn.query_row(
            "SELECT id, input_path, input_snapshot_path, input_sha256, output_path, input_hash, source_lang, target_lang, provider, model, base_url, api_key_env, status,
                    events_path, report_json_path, report_markdown_path, book_id, series_id
             FROM jobs WHERE id = ?1",
            params![job_id],
            |row| {
                Ok(JobRecord {
                    id: row.get(0)?,
                    input_path: PathBuf::from(row.get::<_, String>(1)?),
                    input_snapshot_path: row.get::<_, Option<String>>(2)?.map(PathBuf::from),
                    input_sha256: row.get(3)?,
                    output_path: PathBuf::from(row.get::<_, String>(4)?),
                    input_hash: row.get(5)?,
                    source_lang: row.get(6)?,
                    target_lang: row.get(7)?,
                    provider: row.get(8)?,
                    model: row.get(9)?,
                    base_url: row.get(10)?,
                    api_key_env: row.get(11)?,
                    status: row.get(12)?,
                    events_path: row.get::<_, Option<String>>(13)?.map(PathBuf::from),
                    report_json_path: row.get::<_, Option<String>>(14)?.map(PathBuf::from),
                    report_markdown_path: row.get::<_, Option<String>>(15)?.map(PathBuf::from),
                    book_id: row.get(16)?,
                    series_id: row.get(17)?,
                })
            },
        )
        .optional()
        .map_err(StoreError::from)
    }

    pub fn summary(&self, job_id: &str) -> Result<Option<JobSummary>> {
        let Some(job) = self.get_job(job_id)? else {
            return Ok(None);
        };
        let conn = self.conn.borrow();
        let mut summary = JobSummary {
            id: job.id,
            status: job.status,
            ..JobSummary::default()
        };

        let mut stmt = conn.prepare(
            "SELECT status,
                    COUNT(*),
                    COALESCE(SUM(COALESCE(tokens_input, input_tokens)), 0),
                    COALESCE(SUM(tokens_input_cached), 0),
                    COALESCE(SUM(COALESCE(tokens_output, output_tokens)), 0)
             FROM segments WHERE job_id = ?1 GROUP BY status",
        )?;
        let rows = stmt.query_map(params![job_id], |row| {
            Ok((
                row.get::<_, String>(0)?,
                row.get::<_, i64>(1)?,
                row.get::<_, i64>(2)?,
                row.get::<_, i64>(3)?,
                row.get::<_, i64>(4)?,
            ))
        })?;

        for row in rows {
            let (status, count, input_tokens, input_cached_tokens, output_tokens) = row?;
            let count = count as usize;
            summary.total_segments += count;
            summary.input_tokens += input_tokens as u64;
            summary.input_cached_tokens += input_cached_tokens as u64;
            summary.output_tokens += output_tokens as u64;
            match status.as_str() {
                "succeeded" => summary.succeeded += count,
                "failed" => summary.failed += count,
                "needs_review" => summary.needs_review += count,
                "retry_pending" => summary.retry_pending += count,
                "skipped_cached" => summary.cached += count,
                _ => {}
            }
        }

        summary.retried = conn.query_row(
            "SELECT COUNT(*) FROM segments WHERE job_id = ?1 AND attempts > 1",
            params![job_id],
            |row| row.get::<_, i64>(0),
        )? as usize;

        Ok(Some(summary))
    }

    pub fn retry_segments(&self, job_id: &str, scope: RetryScope) -> Result<usize> {
        let where_status = match scope {
            RetryScope::Failed => "status = 'failed'",
            RetryScope::NeedsReview => "status = 'needs_review'",
            RetryScope::All => "status IN ('failed', 'needs_review')",
        };
        let sql = format!(
            "UPDATE segments SET status = 'retry_pending', error = NULL WHERE job_id = ?1 AND {where_status}"
        );
        let count = {
            let conn = self.conn.borrow();
            conn.execute(&sql, params![job_id])?
        };
        self.touch_job(job_id, "retry_pending")?;
        Ok(count)
    }

    pub fn insert_segment_flags(&self, flags: &[NewSegmentFlag<'_>]) -> Result<usize> {
        let mut conn = self.conn.borrow_mut();
        let tx = conn.transaction()?;
        let ingested_at = timestamp_string();
        let mut inserted = 0usize;
        for flag in flags {
            inserted += tx.execute(
                "INSERT INTO segment_flags
                 (job_id, segment_id, kind, note, suggested_source, suggested_target, ingested_at, consumed)
                 VALUES (?1, ?2, ?3, ?4, ?5, ?6, ?7, ?8)",
                params![
                    flag.job_id,
                    flag.segment_id,
                    flag.kind,
                    flag.note,
                    flag.suggested_source,
                    flag.suggested_target,
                    ingested_at,
                    if flag.consumed { 1_i64 } else { 0_i64 },
                ],
            )?;
        }
        tx.commit()?;
        Ok(inserted)
    }

    pub fn mark_segments_needs_review(
        &self,
        job_id: &str,
        segment_ids: &[String],
        reason: &str,
    ) -> Result<usize> {
        const SQLITE_IN_CHUNK_SIZE: usize = 900;
        let mut updated = 0usize;
        for chunk in segment_ids.chunks(SQLITE_IN_CHUNK_SIZE) {
            if chunk.is_empty() {
                continue;
            }
            let placeholders = std::iter::repeat_n("?", chunk.len())
                .collect::<Vec<_>>()
                .join(", ");
            let sql = format!(
                "UPDATE segments
                 SET status = 'needs_review',
                     error = ?
                 WHERE job_id = ?
                   AND id IN ({placeholders})"
            );
            let conn = self.conn.borrow();
            let mut params: Vec<&dyn rusqlite::types::ToSql> = Vec::with_capacity(chunk.len() + 2);
            params.push(&reason);
            params.push(&job_id);
            for id in chunk {
                params.push(id);
            }
            updated += conn.execute(&sql, params.as_slice())?;
        }
        if updated > 0 {
            self.touch_job(job_id, "needs_review")?;
        }
        Ok(updated)
    }

    pub fn segment_flag_count(&self, job_id: &str) -> Result<usize> {
        let conn = self.conn.borrow();
        let count = conn.query_row(
            "SELECT COUNT(*) FROM segment_flags WHERE job_id = ?1",
            params![job_id],
            |row| row.get::<_, i64>(0),
        )?;
        Ok(count as usize)
    }

    pub fn upsert_glossary_terms(&self, terms: &[GlossaryTerm]) -> Result<usize> {
        let mut conn = self.conn.borrow_mut();
        let tx = conn.transaction()?;
        let now = timestamp_string();
        let mut changed = 0usize;
        for term in terms {
            let existing_id = tx
                .query_row(
                    "SELECT id FROM glossary_terms
                     WHERE scope_kind = ?1
                       AND ((?2 IS NULL AND scope_id IS NULL) OR scope_id = ?2)
                       AND source_text = ?3
                       AND source_language = ?4
                       AND target_language = ?5",
                    params![
                        term.scope_kind.as_str(),
                        term.scope_id.as_deref(),
                        term.source_text,
                        term.source_language,
                        term.target_language,
                    ],
                    |row| row.get::<_, i64>(0),
                )
                .optional()?;
            if let Some(id) = existing_id {
                changed += tx.execute(
                    "UPDATE glossary_terms
                     SET target_text = ?1,
                         category = ?2,
                         notes = ?3,
                         case_sensitive = ?4,
                         always_active = ?5,
                         status = ?6,
                         source_count = ?7,
                         updated_at = ?8
                     WHERE id = ?9",
                    params![
                        term.target_text,
                        term.category.as_str(),
                        term.notes.as_deref(),
                        if term.case_sensitive { 1_i64 } else { 0_i64 },
                        if term.always_active { 1_i64 } else { 0_i64 },
                        term.status.as_str(),
                        term.source_count as i64,
                        now,
                        id,
                    ],
                )?;
            } else {
                changed += tx.execute(
                    "INSERT INTO glossary_terms
                     (scope_kind, scope_id, source_text, target_text, category, notes,
                      case_sensitive, always_active, status, source_language, target_language,
                      source_count, created_at, updated_at)
                     VALUES (?1, ?2, ?3, ?4, ?5, ?6, ?7, ?8, ?9, ?10, ?11, ?12, ?13, ?13)",
                    params![
                        term.scope_kind.as_str(),
                        term.scope_id.as_deref(),
                        term.source_text,
                        term.target_text,
                        term.category.as_str(),
                        term.notes.as_deref(),
                        if term.case_sensitive { 1_i64 } else { 0_i64 },
                        if term.always_active { 1_i64 } else { 0_i64 },
                        term.status.as_str(),
                        term.source_language,
                        term.target_language,
                        term.source_count as i64,
                        now,
                    ],
                )?;
            }
        }
        tx.commit()?;
        Ok(changed)
    }

    pub fn add_glossary_term(&self, term: &GlossaryTerm) -> Result<i64> {
        self.upsert_glossary_terms(std::slice::from_ref(term))?;
        let conn = self.conn.borrow();
        let id = conn.query_row(
            "SELECT id FROM glossary_terms
             WHERE scope_kind = ?1
               AND ((?2 IS NULL AND scope_id IS NULL) OR scope_id = ?2)
               AND source_text = ?3
               AND source_language = ?4
               AND target_language = ?5",
            params![
                term.scope_kind.as_str(),
                term.scope_id.as_deref(),
                term.source_text,
                term.source_language,
                term.target_language,
            ],
            |row| row.get::<_, i64>(0),
        )?;
        Ok(id)
    }

    pub fn upsert_glossary_candidates(
        &self,
        book_id: &str,
        source_language: &str,
        target_language: &str,
        candidates: &[NewGlossaryCandidate<'_>],
    ) -> Result<GlossaryCandidateUpsertResult> {
        let mut conn = self.conn.borrow_mut();
        let tx = conn.transaction()?;
        let now = timestamp_string();
        let mut result = GlossaryCandidateUpsertResult::default();

        for candidate in candidates {
            let existing = tx
                .query_row(
                    "SELECT id, status FROM glossary_terms
                     WHERE scope_kind = 'book'
                       AND scope_id = ?1
                       AND source_text = ?2
                       AND source_language = ?3
                       AND target_language = ?4",
                    params![
                        book_id,
                        candidate.source_text,
                        source_language,
                        target_language
                    ],
                    |row| Ok((row.get::<_, i64>(0)?, row.get::<_, String>(1)?)),
                )
                .optional()?;

            match existing {
                Some((id, status)) if status == GlossaryStatus::AutoCandidate.as_str() => {
                    tx.execute(
                        "UPDATE glossary_terms
                         SET category = ?1,
                             source_count = ?2,
                             updated_at = ?3
                         WHERE id = ?4",
                        params![
                            candidate.category.as_str(),
                            candidate.source_count as i64,
                            now,
                            id,
                        ],
                    )?;
                    result.updated += 1;
                }
                Some(_) => {
                    result.skipped += 1;
                }
                None => {
                    tx.execute(
                        "INSERT INTO glossary_terms
                         (scope_kind, scope_id, source_text, target_text, category, notes,
                          case_sensitive, always_active, status, source_language, target_language,
                          source_count, created_at, updated_at)
                         VALUES ('book', ?1, ?2, NULL, ?3, NULL, 1, 0, 'auto_candidate',
                                 ?4, ?5, ?6, ?7, ?7)",
                        params![
                            book_id,
                            candidate.source_text,
                            candidate.category.as_str(),
                            source_language,
                            target_language,
                            candidate.source_count as i64,
                            now,
                        ],
                    )?;
                    result.inserted += 1;
                }
            }
        }

        tx.commit()?;
        Ok(result)
    }

    pub fn list_glossary_candidate_language_pairs(
        &self,
        book_id: &str,
    ) -> Result<Vec<(String, String)>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT DISTINCT source_language, target_language
             FROM glossary_terms
             WHERE scope_kind = 'book'
               AND scope_id = ?1
               AND status = 'auto_candidate'
             ORDER BY source_language, target_language",
        )?;
        let rows = stmt.query_map(params![book_id], |row| {
            Ok((row.get::<_, String>(0)?, row.get::<_, String>(1)?))
        })?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    pub fn list_glossary_candidates(
        &self,
        book_id: &str,
        source_language: &str,
        target_language: &str,
    ) -> Result<Vec<StoredGlossaryCandidate>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT id, source_text, target_text, category, notes, case_sensitive,
                    always_active, status, source_language, target_language, source_count
             FROM glossary_terms
             WHERE scope_kind = 'book'
               AND scope_id = ?1
               AND source_language = ?2
               AND target_language = ?3
               AND status = 'auto_candidate'
             ORDER BY source_count DESC, source_text",
        )?;
        let rows = stmt.query_map(
            params![book_id, source_language, target_language],
            glossary_candidate_from_row,
        )?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    pub fn accept_glossary_candidate(&self, id: i64, target_text: Option<&str>) -> Result<bool> {
        let conn = self.conn.borrow();
        let Some((source_text, existing_target)) = conn
            .query_row(
                "SELECT source_text, target_text
                 FROM glossary_terms
                 WHERE id = ?1 AND status = 'auto_candidate'",
                params![id],
                |row| Ok((row.get::<_, String>(0)?, row.get::<_, Option<String>>(1)?)),
            )
            .optional()?
        else {
            return Ok(false);
        };
        let target = target_text
            .filter(|value| !value.trim().is_empty())
            .map(ToOwned::to_owned)
            .or_else(|| existing_target.filter(|value| !value.trim().is_empty()))
            .unwrap_or(source_text);
        let updated = conn.execute(
            "UPDATE glossary_terms
             SET target_text = ?1,
                 status = 'accepted',
                 updated_at = ?2
             WHERE id = ?3 AND status = 'auto_candidate'",
            params![target, timestamp_string(), id],
        )?;
        Ok(updated > 0)
    }

    pub fn reject_glossary_candidate(&self, id: i64) -> Result<bool> {
        let conn = self.conn.borrow();
        let updated = conn.execute(
            "UPDATE glossary_terms
             SET status = 'rejected',
                 updated_at = ?1
             WHERE id = ?2 AND status = 'auto_candidate'",
            params![timestamp_string(), id],
        )?;
        Ok(updated > 0)
    }

    pub fn list_glossary_terms(&self, filter: GlossaryFilter<'_>) -> Result<Vec<GlossaryTerm>> {
        let conn = self.conn.borrow();
        let mut sql = String::from(
            "SELECT id, scope_kind, scope_id, source_text, COALESCE(target_text, ''), category, notes,
                    case_sensitive, always_active, status, source_language, target_language,
                    source_count
             FROM glossary_terms
             WHERE 1 = 1",
        );
        let mut values: Vec<Box<dyn rusqlite::types::ToSql>> = Vec::new();
        if let Some(scope_kind) = filter.scope_kind {
            sql.push_str(" AND scope_kind = ?");
            values.push(Box::new(scope_kind.as_str().to_string()));
        }
        if let Some(scope_id) = filter.scope_id {
            sql.push_str(" AND scope_id = ?");
            values.push(Box::new(scope_id.to_string()));
        }
        if let Some(source_language) = filter.source_language {
            sql.push_str(" AND source_language = ?");
            values.push(Box::new(source_language.to_string()));
        }
        if let Some(target_language) = filter.target_language {
            sql.push_str(" AND target_language = ?");
            values.push(Box::new(target_language.to_string()));
        }
        if filter.active_only {
            sql.push_str(" AND status IN ('user_seeded', 'accepted')");
        }
        sql.push_str(
            " ORDER BY source_language, target_language, scope_kind, scope_id, source_text",
        );
        let param_refs = values
            .iter()
            .map(|value| value.as_ref())
            .collect::<Vec<&dyn rusqlite::types::ToSql>>();
        let mut stmt = conn.prepare(&sql)?;
        let rows = stmt.query_map(param_refs.as_slice(), glossary_term_from_row)?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    pub fn load_active_glossary_terms(
        &self,
        source_language: &str,
        target_language: &str,
        book_id: Option<&str>,
        series_id: Option<&str>,
    ) -> Result<Vec<GlossaryTerm>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT id, scope_kind, scope_id, source_text, COALESCE(target_text, ''), category, notes,
                    case_sensitive, always_active, status, source_language, target_language,
                    source_count
             FROM glossary_terms
             WHERE source_language = ?1
               AND target_language = ?2
               AND status IN ('user_seeded', 'accepted')
               AND (
                    scope_kind = 'global'
                    OR (scope_kind = 'series' AND scope_id = ?3)
                    OR (scope_kind = 'book' AND scope_id = ?4)
               )
             ORDER BY scope_kind, scope_id, source_text",
        )?;
        let rows = stmt.query_map(
            params![source_language, target_language, series_id, book_id],
            glossary_term_from_row,
        )?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    pub fn load_active_glossary_terms_for_target(
        &self,
        target_language: &str,
        book_id: Option<&str>,
        series_id: Option<&str>,
    ) -> Result<Vec<GlossaryTerm>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT id, scope_kind, scope_id, source_text, COALESCE(target_text, ''), category, notes,
                    case_sensitive, always_active, status, source_language, target_language,
                    source_count
             FROM glossary_terms
             WHERE target_language = ?1
               AND status IN ('user_seeded', 'accepted')
               AND (
                    scope_kind = 'global'
                    OR (scope_kind = 'series' AND scope_id = ?2)
                    OR (scope_kind = 'book' AND scope_id = ?3)
               )
             ORDER BY scope_kind, scope_id, source_language, source_text",
        )?;
        let rows = stmt.query_map(
            params![target_language, series_id, book_id],
            glossary_term_from_row,
        )?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    pub fn remove_glossary_term(&self, id: i64) -> Result<usize> {
        let conn = self.conn.borrow();
        conn.execute("DELETE FROM glossary_terms WHERE id = ?1", params![id])
            .map_err(StoreError::from)
    }

    pub fn clear_glossary_scope(
        &self,
        scope_kind: GlossaryScopeKind,
        scope_id: Option<&str>,
    ) -> Result<usize> {
        let conn = self.conn.borrow();
        let count = if scope_kind == GlossaryScopeKind::Global {
            conn.execute("DELETE FROM glossary_terms WHERE scope_kind = 'global'", [])?
        } else {
            conn.execute(
                "DELETE FROM glossary_terms WHERE scope_kind = ?1 AND scope_id = ?2",
                params![scope_kind.as_str(), scope_id],
            )?
        };
        Ok(count)
    }

    /// Upsert a style sheet for a (scope, target_language) tuple. Returns
    /// the row id of the inserted/updated row.
    pub fn upsert_style_sheet(&self, record: &NewStyleSheet<'_>) -> Result<i64> {
        let conn = self.conn.borrow();
        let now = timestamp_string();
        conn.execute(
            "INSERT INTO style_sheets
                (scope_kind, scope_id, target_language, content_toml, fingerprint, created_at, updated_at)
             VALUES (?1, ?2, ?3, ?4, ?5, ?6, ?6)
             ON CONFLICT(scope_kind, scope_id, target_language) DO UPDATE SET
                content_toml = excluded.content_toml,
                fingerprint = excluded.fingerprint,
                updated_at = excluded.updated_at",
            params![
                record.scope_kind.as_str(),
                record.scope_id,
                record.target_language,
                record.content_toml,
                record.fingerprint,
                now,
            ],
        )?;
        let id: i64 = conn.query_row(
            "SELECT id FROM style_sheets
                WHERE scope_kind = ?1 AND IFNULL(scope_id, '') = IFNULL(?2, '')
                  AND target_language = ?3",
            params![
                record.scope_kind.as_str(),
                record.scope_id,
                record.target_language
            ],
            |row| row.get(0),
        )?;
        Ok(id)
    }

    /// Load all style sheets that apply for a given language pair and
    /// optional book/series scopes. Caller is responsible for merging via
    /// [`bookforge_core::style::merge_style_sheets`].
    pub fn load_active_style_sheets(
        &self,
        target_language: &str,
        book_id: Option<&str>,
        series_id: Option<&str>,
    ) -> Result<Vec<StoredStyleSheet>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT id, scope_kind, scope_id, target_language, content_toml, fingerprint
             FROM style_sheets
             WHERE target_language = ?1
               AND ( (scope_kind = 'global')
                  OR (scope_kind = 'series' AND scope_id = ?2)
                  OR (scope_kind = 'book' AND scope_id = ?3) )",
        )?;
        let rows = stmt.query_map(params![target_language, series_id, book_id], |row| {
            Ok(StoredStyleSheet {
                id: row.get(0)?,
                scope_kind: parse_row_enum(&row.get::<_, String>(1)?, 1)?,
                scope_id: row.get(2)?,
                target_language: row.get(3)?,
                content_toml: row.get(4)?,
                fingerprint: row.get(5)?,
            })
        })?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    pub fn list_style_sheets(
        &self,
        target_language: Option<&str>,
        scope_kind: Option<GlossaryScopeKind>,
        scope_id: Option<&str>,
    ) -> Result<Vec<StoredStyleSheet>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT id, scope_kind, scope_id, target_language, content_toml, fingerprint
             FROM style_sheets
             WHERE (?1 IS NULL OR target_language = ?1)
               AND (?2 IS NULL OR scope_kind = ?2)
               AND (?3 IS NULL OR scope_id = ?3)
             ORDER BY scope_kind, scope_id",
        )?;
        let scope_text = scope_kind.map(|s| s.as_str().to_string());
        let rows = stmt.query_map(params![target_language, scope_text, scope_id], |row| {
            Ok(StoredStyleSheet {
                id: row.get(0)?,
                scope_kind: parse_row_enum(&row.get::<_, String>(1)?, 1)?,
                scope_id: row.get(2)?,
                target_language: row.get(3)?,
                content_toml: row.get(4)?,
                fingerprint: row.get(5)?,
            })
        })?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    pub fn clear_style_scope(
        &self,
        scope_kind: GlossaryScopeKind,
        scope_id: Option<&str>,
    ) -> Result<usize> {
        let conn = self.conn.borrow();
        let count = if scope_kind == GlossaryScopeKind::Global {
            conn.execute("DELETE FROM style_sheets WHERE scope_kind = 'global'", [])?
        } else {
            conn.execute(
                "DELETE FROM style_sheets WHERE scope_kind = ?1 AND scope_id = ?2",
                params![scope_kind.as_str(), scope_id],
            )?
        };
        Ok(count)
    }

    pub fn upsert_entities(&self, entities: &[NewEntity<'_>]) -> Result<usize> {
        if entities.is_empty() {
            return Ok(0);
        }
        let conn = self.conn.borrow();
        let now = timestamp_string();
        let mut changed = 0usize;
        for entity in entities {
            conn.execute(
                "INSERT INTO entities
                    (scope_kind, scope_id, source_name, target_name, gender_target,
                     role, notes, source_language, target_language, created_at, updated_at)
                 VALUES (?1, ?2, ?3, ?4, ?5, ?6, ?7, ?8, ?9, ?10, ?10)
                 ON CONFLICT(scope_kind, scope_id, source_name, source_language, target_language)
                 DO UPDATE SET
                    target_name = excluded.target_name,
                    gender_target = excluded.gender_target,
                    role = excluded.role,
                    notes = excluded.notes,
                    updated_at = excluded.updated_at",
                params![
                    entity.scope_kind.as_str(),
                    entity.scope_id,
                    entity.source_name,
                    entity.target_name,
                    entity.gender_target.map(|g| g.as_short()),
                    entity.role,
                    entity.notes,
                    entity.source_language,
                    entity.target_language,
                    now,
                ],
            )?;
            changed += 1;
        }
        Ok(changed)
    }

    /// Load all entities that apply for a language pair and optional
    /// book/series scopes. Caller is responsible for merging via
    /// [`bookforge_core::entity::merge_scope_entities`].
    pub fn load_active_entities(
        &self,
        source_language: &str,
        target_language: &str,
        book_id: Option<&str>,
        series_id: Option<&str>,
    ) -> Result<Vec<StoredEntity>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT id, scope_kind, scope_id, source_name, target_name, gender_target,
                    role, notes, source_language, target_language
             FROM entities
             WHERE source_language = ?1
               AND target_language = ?2
               AND ( (scope_kind = 'global')
                  OR (scope_kind = 'series' AND scope_id = ?3)
                  OR (scope_kind = 'book' AND scope_id = ?4) )",
        )?;
        let rows = stmt.query_map(
            params![source_language, target_language, series_id, book_id],
            |row| {
                let gender: Option<String> = row.get(5)?;
                Ok(StoredEntity {
                    id: row.get(0)?,
                    scope_kind: parse_row_enum(&row.get::<_, String>(1)?, 1)?,
                    scope_id: row.get(2)?,
                    source_name: row.get(3)?,
                    target_name: row.get(4)?,
                    gender_target: gender.and_then(|g| parse_gender_short(&g)),
                    role: row.get(6)?,
                    notes: row.get(7)?,
                    source_language: row.get(8)?,
                    target_language: row.get(9)?,
                })
            },
        )?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    pub fn list_entities(
        &self,
        source_language: Option<&str>,
        target_language: Option<&str>,
        scope_kind: Option<GlossaryScopeKind>,
        scope_id: Option<&str>,
    ) -> Result<Vec<StoredEntity>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT id, scope_kind, scope_id, source_name, target_name, gender_target,
                    role, notes, source_language, target_language
             FROM entities
             WHERE (?1 IS NULL OR source_language = ?1)
               AND (?2 IS NULL OR target_language = ?2)
               AND (?3 IS NULL OR scope_kind = ?3)
               AND (?4 IS NULL OR scope_id = ?4)
             ORDER BY scope_kind, scope_id, source_name",
        )?;
        let scope_text = scope_kind.map(|s| s.as_str().to_string());
        let rows = stmt.query_map(
            params![source_language, target_language, scope_text, scope_id],
            |row| {
                let gender: Option<String> = row.get(5)?;
                Ok(StoredEntity {
                    id: row.get(0)?,
                    scope_kind: parse_row_enum(&row.get::<_, String>(1)?, 1)?,
                    scope_id: row.get(2)?,
                    source_name: row.get(3)?,
                    target_name: row.get(4)?,
                    gender_target: gender.and_then(|g| parse_gender_short(&g)),
                    role: row.get(6)?,
                    notes: row.get(7)?,
                    source_language: row.get(8)?,
                    target_language: row.get(9)?,
                })
            },
        )?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    pub fn clear_entities_scope(
        &self,
        scope_kind: GlossaryScopeKind,
        scope_id: Option<&str>,
    ) -> Result<usize> {
        let conn = self.conn.borrow();
        let count = if scope_kind == GlossaryScopeKind::Global {
            conn.execute("DELETE FROM entities WHERE scope_kind = 'global'", [])?
        } else {
            conn.execute(
                "DELETE FROM entities WHERE scope_kind = ?1 AND scope_id = ?2",
                params![scope_kind.as_str(), scope_id],
            )?
        };
        Ok(count)
    }

    pub fn pending_segment_ids(&self, job_id: &str) -> Result<Vec<String>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT id FROM segments
             WHERE job_id = ?1 AND status IN ('queued', 'retry_pending')
             ORDER BY ordinal",
        )?;
        let rows = stmt.query_map(params![job_id], |row| row.get::<_, String>(0))?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    pub fn segment_records(&self, job_id: &str) -> Result<Vec<SegmentRecord>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT id,
                    status,
                    attempts,
                    error,
                    COALESCE(tokens_input, input_tokens),
                    tokens_input_cached,
                    COALESCE(tokens_output, output_tokens),
                    tokens_estimated
             FROM segments WHERE job_id = ?1 ORDER BY ordinal",
        )?;
        let rows = stmt.query_map(params![job_id], |row| {
            Ok(SegmentRecord {
                id: row.get(0)?,
                status: row.get(1)?,
                attempts: row.get::<_, i64>(2)? as usize,
                error: row.get(3)?,
                input_tokens: row.get::<_, Option<i64>>(4)?.map(|value| value as u64),
                input_cached_tokens: row.get::<_, Option<i64>>(5)?.map(|value| value as u64),
                output_tokens: row.get::<_, Option<i64>>(6)?.map(|value| value as u64),
                tokens_estimated: row.get::<_, i64>(7)? != 0,
            })
        })?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    pub fn load_block_translations(&self, job_id: &str) -> Result<Vec<StoredBlockTranslation>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT segment_id, block_id, translated_text
             FROM translation_blocks WHERE job_id = ?1 ORDER BY segment_id, block_id",
        )?;
        let rows = stmt.query_map(params![job_id], |row| {
            Ok(StoredBlockTranslation {
                segment_id: row.get(0)?,
                block_id: row.get(1)?,
                text: row.get(2)?,
            })
        })?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    pub fn load_terminal_segment_translations(
        &self,
        job_id: &str,
    ) -> Result<Vec<StoredSegmentTranslation>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT s.id, s.ordinal, s.status, s.error, t.translated_text
             FROM segments s
             JOIN translations t ON t.job_id = s.job_id AND t.segment_id = s.id
             WHERE s.job_id = ?1 AND s.status IN ('succeeded', 'skipped_cached', 'needs_review')
             ORDER BY s.ordinal",
        )?;
        let rows = stmt.query_map(params![job_id], |row| {
            Ok((
                row.get::<_, String>(0)?,
                row.get::<_, i64>(1)?,
                row.get::<_, String>(2)?,
                row.get::<_, Option<String>>(3)?,
                row.get::<_, String>(4)?,
            ))
        })?;

        let mut records = Vec::new();
        for row in rows {
            let (segment_id, ordinal, status, error, translated_text) = row?;
            let mut block_stmt = conn.prepare(
                "SELECT block_id, translated_text
                 FROM translation_blocks
                 WHERE job_id = ?1 AND segment_id = ?2
                 ORDER BY block_id",
            )?;
            let blocks = block_stmt
                .query_map(params![job_id, segment_id.as_str()], |row| {
                    Ok(BlockTranslation {
                        block_id: BlockId(row.get::<_, String>(0)?),
                        text: row.get(1)?,
                    })
                })?
                .collect::<std::result::Result<Vec<_>, _>>()?;
            records.push(StoredSegmentTranslation {
                segment_id,
                ordinal: ordinal as usize,
                status,
                error,
                translated_text,
                blocks,
            });
        }

        Ok(records)
    }

    pub fn resumable_segment_ids(&self, job_id: &str) -> Result<Vec<String>> {
        let conn = self.conn.borrow();
        let mut stmt = conn.prepare(
            "SELECT id FROM segments
             WHERE job_id = ?1 AND status IN ('queued', 'retry_pending', 'failed')
             ORDER BY ordinal",
        )?;
        let rows = stmt.query_map(params![job_id], |row| row.get::<_, String>(0))?;
        rows.collect::<std::result::Result<Vec<_>, _>>()
            .map_err(StoreError::from)
    }

    #[allow(clippy::too_many_arguments)]
    pub fn find_cached_translation(
        &self,
        segment: &Segment,
        prompt_version: &str,
        provider: &str,
        model: &str,
        source_lang: Option<&str>,
        target_lang: &str,
        cache_namespace: &str,
    ) -> Result<Option<CachedTranslation>> {
        let conn = self.conn.borrow();
        let cached = conn
            .query_row(
                "SELECT t.job_id, t.segment_id, t.translated_text
                 FROM translations t
                 JOIN segments s ON s.job_id = t.job_id AND s.id = t.segment_id
                 JOIN jobs j ON j.id = t.job_id
                 WHERE s.source_hash = ?1
                   AND s.prompt_version = ?2
                   AND s.provider = ?3
                   AND s.model = ?4
                   AND ((?5 IS NULL AND j.source_lang IS NULL) OR j.source_lang = ?5)
                   AND j.target_lang = ?6
                   AND s.cache_namespace = ?7
                   AND s.status IN ('succeeded', 'skipped_cached')
                 ORDER BY CASE s.status WHEN 'succeeded' THEN 0 ELSE 1 END,
                          CAST(t.created_at AS INTEGER) DESC,
                          t.rowid DESC
                 LIMIT 1",
                params![
                    segment.checksum,
                    prompt_version,
                    provider,
                    model,
                    source_lang,
                    target_lang,
                    cache_namespace,
                ],
                |row| {
                    Ok((
                        row.get::<_, String>(0)?,
                        row.get::<_, String>(1)?,
                        row.get::<_, String>(2)?,
                    ))
                },
            )
            .optional()?;

        let Some((job_id, segment_id, translated_text)) = cached else {
            return Ok(None);
        };

        let mut stmt = conn.prepare(
            "SELECT block_id, translated_text
             FROM translation_blocks
             WHERE job_id = ?1 AND segment_id = ?2
             ORDER BY block_id",
        )?;
        let rows = stmt.query_map(params![job_id, segment_id], |row| {
            Ok(BlockTranslation {
                block_id: BlockId(row.get::<_, String>(0)?),
                text: row.get(1)?,
            })
        })?;
        let blocks = rows.collect::<std::result::Result<Vec<_>, _>>()?;

        let mut by_id = blocks
            .into_iter()
            .map(|block| (block.block_id.0.clone(), block))
            .collect::<HashMap<_, _>>();

        let mut ordered = Vec::with_capacity(segment.block_ids.len());
        for id in &segment.block_ids {
            let Some(block) = by_id.remove(&id.0) else {
                return Ok(None);
            };
            ordered.push(block);
        }
        if !by_id.is_empty() {
            return Ok(None);
        }

        Ok(Some(CachedTranslation {
            translated_text,
            blocks: ordered,
        }))
    }

    pub fn find_cached_translations_batch(
        &self,
        segments: &[Segment],
        request: CacheLookupRequest<'_>,
    ) -> Result<HashMap<String, CachedTranslation>> {
        let mut results = HashMap::new();
        if segments.is_empty() {
            return Ok(results);
        }

        const SQLITE_IN_CHUNK_SIZE: usize = 900;

        for chunk in segments.chunks(SQLITE_IN_CHUNK_SIZE) {
            let hashes: Vec<&str> = chunk.iter().map(|s| s.checksum.as_str()).collect();
            let placeholders: Vec<String> =
                (0..hashes.len()).map(|i| format!("?{}", i + 1)).collect();
            let placeholders_sql = placeholders.join(", ");

            let sql = format!(
                "SELECT t.job_id, t.segment_id, t.translated_text, s.source_hash
                 FROM translations t
                 JOIN segments s ON s.job_id = t.job_id AND s.id = t.segment_id
                 JOIN jobs j ON j.id = t.job_id
                 WHERE s.source_hash IN ({placeholders_sql})
                   AND s.prompt_version = ?{}
                   AND s.provider = ?{}
                   AND s.model = ?{}
                   AND ((?{} IS NULL AND j.source_lang IS NULL) OR j.source_lang = ?{})
                   AND j.target_lang = ?{}
                   AND s.cache_namespace = ?{}
                   AND s.status IN ('succeeded', 'skipped_cached')
                 ORDER BY CASE s.status WHEN 'succeeded' THEN 0 ELSE 1 END,
                          CAST(t.created_at AS INTEGER) DESC,
                          t.rowid DESC",
                hashes.len() + 1,
                hashes.len() + 2,
                hashes.len() + 3,
                hashes.len() + 4,
                hashes.len() + 5,
                hashes.len() + 6,
                hashes.len() + 7,
            );

            let mut params: Vec<Box<dyn rusqlite::types::ToSql>> = Vec::new();
            for hash in &hashes {
                params.push(Box::new(hash.to_string()));
            }
            params.push(Box::new(request.prompt_version.to_string()));
            params.push(Box::new(request.provider.to_string()));
            params.push(Box::new(request.model.to_string()));
            params.push(Box::new(request.source_lang.map(|s| s.to_string())));
            params.push(Box::new(request.source_lang.map(|s| s.to_string())));
            params.push(Box::new(request.target_lang.to_string()));
            params.push(Box::new(request.cache_namespace.to_string()));

            let conn = self.conn.borrow();
            let mut stmt = conn.prepare(&sql)?;
            let param_refs: Vec<&dyn rusqlite::types::ToSql> =
                params.iter().map(|p| p.as_ref()).collect();

            let rows = stmt.query_map(param_refs.as_slice(), |row| {
                Ok((
                    row.get::<_, String>(0)?,
                    row.get::<_, String>(1)?,
                    row.get::<_, String>(2)?,
                    row.get::<_, String>(3)?,
                ))
            })?;

            let mut hash_to_hit: HashMap<String, (String, String, String)> = HashMap::new();
            for row in rows {
                let (job_id, segment_id, translated_text, source_hash) = row?;
                hash_to_hit
                    .entry(source_hash)
                    .or_insert((job_id, segment_id, translated_text));
            }

            for segment in chunk {
                if let Some((job_id, segment_id, translated_text)) =
                    hash_to_hit.get(&segment.checksum)
                {
                    let mut block_stmt = conn.prepare(
                        "SELECT block_id, translated_text
                         FROM translation_blocks
                         WHERE job_id = ?1 AND segment_id = ?2
                         ORDER BY block_id",
                    )?;
                    let block_rows = block_stmt.query_map(params![job_id, segment_id], |row| {
                        Ok(BlockTranslation {
                            block_id: BlockId(row.get::<_, String>(0)?),
                            text: row.get(1)?,
                        })
                    })?;
                    let blocks = block_rows.collect::<std::result::Result<Vec<_>, _>>()?;

                    let mut by_id = blocks
                        .into_iter()
                        .map(|block| (block.block_id.0.clone(), block))
                        .collect::<HashMap<_, _>>();

                    let mut ordered = Vec::with_capacity(segment.block_ids.len());
                    let mut valid = true;
                    for id in &segment.block_ids {
                        let Some(block) = by_id.remove(&id.0) else {
                            valid = false;
                            break;
                        };
                        ordered.push(block);
                    }
                    if !valid || !by_id.is_empty() {
                        continue;
                    }

                    results.insert(
                        segment.id.0.clone(),
                        CachedTranslation {
                            translated_text: translated_text.clone(),
                            blocks: ordered,
                        },
                    );
                }
            }
        }

        Ok(results)
    }

    fn migrate(&self) -> Result<()> {
        let conn = self.conn.borrow();
        if table_exists(&conn, "translations")?
            && !table_has_column(&conn, "translations", "job_id")?
        {
            let suffix = unix_timestamp_nanos();
            rename_table_if_exists(&conn, "qa_findings", suffix)?;
            rename_table_if_exists(&conn, "translation_blocks", suffix)?;
            rename_table_if_exists(&conn, "translations", suffix)?;
            rename_table_if_exists(&conn, "segments", suffix)?;
            rename_table_if_exists(&conn, "jobs", suffix)?;
        }
        conn.execute_batch(
            "
            PRAGMA foreign_keys = ON;
            CREATE TABLE IF NOT EXISTS _migrations (
              version INTEGER PRIMARY KEY,
              name TEXT NOT NULL,
              applied_at TEXT NOT NULL
            );

            CREATE TABLE IF NOT EXISTS jobs (
              id TEXT PRIMARY KEY,
              input_path TEXT NOT NULL DEFAULT '',
              input_snapshot_path TEXT,
              input_sha256 TEXT,
              output_path TEXT NOT NULL DEFAULT '',
              input_hash TEXT NOT NULL,
              source_lang TEXT,
              target_lang TEXT NOT NULL,
              provider TEXT NOT NULL,
              model TEXT NOT NULL,
              base_url TEXT,
              api_key_env TEXT,
              status TEXT NOT NULL,
              config_json TEXT,
              events_path TEXT,
              report_json_path TEXT,
              report_markdown_path TEXT,
              book_id TEXT,
              series_id TEXT,
              created_at TEXT NOT NULL,
              updated_at TEXT NOT NULL
            );

            CREATE TABLE IF NOT EXISTS segments (
              id TEXT NOT NULL,
              job_id TEXT NOT NULL,
              section_id TEXT NOT NULL,
              ordinal INTEGER NOT NULL,
              source_hash TEXT NOT NULL,
              prompt_version TEXT NOT NULL,
              provider TEXT NOT NULL,
              model TEXT NOT NULL,
              status TEXT NOT NULL,
              attempts INTEGER NOT NULL DEFAULT 0,
              input_tokens INTEGER,
              output_tokens INTEGER,
              tokens_input INTEGER,
              tokens_input_cached INTEGER,
              tokens_output INTEGER,
              tokens_estimated INTEGER NOT NULL DEFAULT 0,
              cost_estimate REAL,
              error TEXT,
              translated_hash TEXT,
              PRIMARY KEY (job_id, id),
              FOREIGN KEY(job_id) REFERENCES jobs(id)
            );

            CREATE TABLE IF NOT EXISTS translations (
              segment_id TEXT NOT NULL,
              job_id TEXT NOT NULL,
              translated_text TEXT NOT NULL,
              provider TEXT NOT NULL,
              model TEXT NOT NULL,
              prompt_version TEXT NOT NULL,
              created_at TEXT NOT NULL,
              PRIMARY KEY (job_id, segment_id),
              FOREIGN KEY(job_id, segment_id) REFERENCES segments(job_id, id)
            );

            CREATE TABLE IF NOT EXISTS translation_blocks (
              segment_id TEXT NOT NULL,
              job_id TEXT NOT NULL,
              block_id TEXT NOT NULL,
              translated_text TEXT NOT NULL,
              PRIMARY KEY (job_id, segment_id, block_id),
              FOREIGN KEY(job_id, segment_id) REFERENCES segments(job_id, id)
            );

            CREATE TABLE IF NOT EXISTS qa_findings (
              id TEXT PRIMARY KEY,
              segment_id TEXT NOT NULL,
              job_id TEXT NOT NULL,
              severity TEXT NOT NULL,
              kind TEXT NOT NULL,
              message TEXT NOT NULL,
              FOREIGN KEY(job_id, segment_id) REFERENCES segments(job_id, id)
            );

            CREATE TABLE IF NOT EXISTS segment_flags (
              id INTEGER PRIMARY KEY,
              job_id TEXT NOT NULL,
              segment_id TEXT NOT NULL,
              kind TEXT NOT NULL,
              note TEXT,
              suggested_source TEXT,
              suggested_target TEXT,
              ingested_at TEXT NOT NULL,
              consumed INTEGER NOT NULL DEFAULT 0,
              FOREIGN KEY(job_id) REFERENCES jobs(id) ON DELETE CASCADE
            );

            CREATE TABLE IF NOT EXISTS glossary_terms (
              id INTEGER PRIMARY KEY,
              scope_kind TEXT NOT NULL CHECK(scope_kind IN ('global', 'series', 'book')),
              scope_id TEXT,
              source_text TEXT NOT NULL,
              target_text TEXT,
              category TEXT NOT NULL CHECK(category IN
                ('person', 'place', 'object', 'invented', 'style', 'phrase', 'other')),
              notes TEXT,
              case_sensitive INTEGER NOT NULL DEFAULT 0,
              always_active INTEGER NOT NULL DEFAULT 0,
              status TEXT NOT NULL CHECK(status IN
                ('user_seeded', 'auto_candidate', 'accepted', 'rejected'))
                DEFAULT 'user_seeded',
              source_language TEXT NOT NULL,
              target_language TEXT NOT NULL,
              source_count INTEGER DEFAULT 0,
              created_at TEXT NOT NULL,
              updated_at TEXT NOT NULL,
              UNIQUE(scope_kind, scope_id, source_text, source_language, target_language)
            );

            CREATE TABLE IF NOT EXISTS style_sheets (
              id INTEGER PRIMARY KEY,
              scope_kind TEXT NOT NULL CHECK(scope_kind IN ('global', 'series', 'book')),
              scope_id TEXT,
              target_language TEXT NOT NULL,
              content_toml TEXT NOT NULL,
              fingerprint TEXT NOT NULL,
              created_at TEXT NOT NULL,
              updated_at TEXT NOT NULL,
              UNIQUE(scope_kind, scope_id, target_language)
            );

            CREATE TABLE IF NOT EXISTS entities (
              id INTEGER PRIMARY KEY,
              scope_kind TEXT NOT NULL CHECK(scope_kind IN ('global', 'series', 'book')),
              scope_id TEXT,
              source_name TEXT NOT NULL,
              target_name TEXT NOT NULL,
              gender_target TEXT
                CHECK(gender_target IS NULL OR gender_target IN ('m', 'f', 'n')),
              role TEXT,
              notes TEXT,
              source_language TEXT NOT NULL,
              target_language TEXT NOT NULL,
              created_at TEXT NOT NULL,
              updated_at TEXT NOT NULL,
              UNIQUE(scope_kind, scope_id, source_name, source_language, target_language)
            );
            ",
        )?;
        ensure_glossary_target_nullable(&conn)?;
        ensure_column(&conn, "jobs", "input_path", "TEXT NOT NULL DEFAULT ''")?;
        ensure_column(&conn, "jobs", "input_snapshot_path", "TEXT")?;
        ensure_column(&conn, "jobs", "input_sha256", "TEXT")?;
        ensure_column(&conn, "jobs", "output_path", "TEXT NOT NULL DEFAULT ''")?;
        ensure_column(&conn, "jobs", "base_url", "TEXT")?;
        ensure_column(&conn, "jobs", "api_key_env", "TEXT")?;
        ensure_column(&conn, "jobs", "config_json", "TEXT")?;
        ensure_column(&conn, "jobs", "events_path", "TEXT")?;
        ensure_column(&conn, "jobs", "report_json_path", "TEXT")?;
        ensure_column(&conn, "jobs", "report_markdown_path", "TEXT")?;
        ensure_column(&conn, "jobs", "book_id", "TEXT")?;
        ensure_column(&conn, "jobs", "series_id", "TEXT")?;
        ensure_column(
            &conn,
            "segments",
            "cache_namespace",
            "TEXT NOT NULL DEFAULT ''",
        )?;
        ensure_column(&conn, "segments", "tokens_input", "INTEGER")?;
        ensure_column(&conn, "segments", "tokens_input_cached", "INTEGER")?;
        ensure_column(&conn, "segments", "tokens_output", "INTEGER")?;
        ensure_column(
            &conn,
            "segments",
            "tokens_estimated",
            "INTEGER NOT NULL DEFAULT 0",
        )?;
        conn.execute_batch(
            "CREATE INDEX IF NOT EXISTS idx_segments_cache_lookup
             ON segments(source_hash, cache_namespace, prompt_version, provider, model, status);
             CREATE INDEX IF NOT EXISTS idx_segment_flags_job
             ON segment_flags(job_id, consumed);
             CREATE INDEX IF NOT EXISTS idx_glossary_lookup
             ON glossary_terms(source_language, target_language, scope_kind, scope_id, status);
             CREATE INDEX IF NOT EXISTS idx_style_lookup
             ON style_sheets(target_language, scope_kind, scope_id);
             CREATE INDEX IF NOT EXISTS idx_entity_lookup
             ON entities(source_language, target_language, scope_kind, scope_id);",
        )?;
        record_migration(&conn, 1, "initial")?;
        record_migration(&conn, 2, "v1_0_1_input_snapshot")?;
        record_migration(&conn, 3, "v1_1_segment_flags")?;
        record_migration(&conn, 4, "v1_2_glossary_terms")?;
        record_migration(&conn, 5, "v1_2_1_nullable_glossary_candidate_targets")?;
        record_migration(&conn, 6, "v1_3_context_styles_entities")?;
        Ok(())
    }

    fn touch_job(&self, job_id: &str, status: &str) -> Result<()> {
        let conn = self.conn.borrow();
        conn.execute(
            "UPDATE jobs SET status = ?1, updated_at = ?2 WHERE id = ?3",
            params![status, timestamp_string(), job_id],
        )?;
        Ok(())
    }
}

fn table_exists(conn: &Connection, table: &str) -> rusqlite::Result<bool> {
    conn.query_row(
        "SELECT EXISTS(SELECT 1 FROM sqlite_master WHERE type = 'table' AND name = ?1)",
        params![table],
        |row| row.get::<_, bool>(0),
    )
}

fn table_has_column(conn: &Connection, table: &str, column: &str) -> rusqlite::Result<bool> {
    let mut stmt = conn.prepare(&format!("PRAGMA table_info({table})"))?;
    let rows = stmt.query_map([], |row| row.get::<_, String>(1))?;
    for row in rows {
        if row? == column {
            return Ok(true);
        }
    }
    Ok(false)
}

fn rename_table_if_exists(conn: &Connection, table: &str, suffix: u128) -> rusqlite::Result<()> {
    if table_exists(conn, table)? {
        conn.execute(
            &format!("ALTER TABLE {table} RENAME TO {table}_legacy_{suffix}"),
            [],
        )?;
    }
    Ok(())
}

fn ensure_column(
    conn: &Connection,
    table: &str,
    column: &str,
    definition: &str,
) -> rusqlite::Result<()> {
    if !table_has_column(conn, table, column)? {
        conn.execute(
            &format!("ALTER TABLE {table} ADD COLUMN {column} {definition}"),
            [],
        )?;
    }
    Ok(())
}

fn ensure_glossary_target_nullable(conn: &Connection) -> rusqlite::Result<()> {
    if !table_exists(conn, "glossary_terms")?
        || !table_column_is_not_null(conn, "glossary_terms", "target_text")?
    {
        return Ok(());
    }

    let legacy_table = format!("glossary_terms_v1_2_0_{}", unix_timestamp_nanos());
    conn.execute_batch(&format!(
        "
        DROP INDEX IF EXISTS idx_glossary_lookup;
        ALTER TABLE glossary_terms RENAME TO {legacy_table};
        CREATE TABLE glossary_terms (
          id INTEGER PRIMARY KEY,
          scope_kind TEXT NOT NULL CHECK(scope_kind IN ('global', 'series', 'book')),
          scope_id TEXT,
          source_text TEXT NOT NULL,
          target_text TEXT,
          category TEXT NOT NULL CHECK(category IN
            ('person', 'place', 'object', 'invented', 'style', 'phrase', 'other')),
          notes TEXT,
          case_sensitive INTEGER NOT NULL DEFAULT 0,
          always_active INTEGER NOT NULL DEFAULT 0,
          status TEXT NOT NULL CHECK(status IN
            ('user_seeded', 'auto_candidate', 'accepted', 'rejected'))
            DEFAULT 'user_seeded',
          source_language TEXT NOT NULL,
          target_language TEXT NOT NULL,
          source_count INTEGER DEFAULT 0,
          created_at TEXT NOT NULL,
          updated_at TEXT NOT NULL,
          UNIQUE(scope_kind, scope_id, source_text, source_language, target_language)
        );
        INSERT INTO glossary_terms
          (id, scope_kind, scope_id, source_text, target_text, category, notes,
           case_sensitive, always_active, status, source_language, target_language,
           source_count, created_at, updated_at)
        SELECT id, scope_kind, scope_id, source_text, target_text, category, notes,
               case_sensitive, always_active, status, source_language, target_language,
               source_count, created_at, updated_at
        FROM {legacy_table};
        DROP TABLE {legacy_table};
        ",
    ))?;
    Ok(())
}

fn table_column_is_not_null(
    conn: &Connection,
    table: &str,
    column: &str,
) -> rusqlite::Result<bool> {
    let mut stmt = conn.prepare(&format!("PRAGMA table_info({table})"))?;
    let mut rows = stmt.query([])?;
    while let Some(row) = rows.next()? {
        let name: String = row.get(1)?;
        if name == column {
            let not_null: i64 = row.get(3)?;
            return Ok(not_null != 0);
        }
    }
    Ok(false)
}

fn record_migration(conn: &Connection, version: i64, name: &str) -> rusqlite::Result<()> {
    conn.execute(
        "INSERT OR IGNORE INTO _migrations (version, name, applied_at)
         VALUES (?1, ?2, ?3)",
        params![version, name, timestamp_string()],
    )?;
    Ok(())
}

fn glossary_term_from_row(row: &rusqlite::Row<'_>) -> rusqlite::Result<GlossaryTerm> {
    let scope_kind_text: String = row.get(1)?;
    let category_text: String = row.get(5)?;
    let status_text: String = row.get(9)?;
    Ok(GlossaryTerm {
        id: Some(row.get(0)?),
        scope_kind: parse_row_enum(&scope_kind_text, 1)?,
        scope_id: row.get(2)?,
        source_text: row.get(3)?,
        target_text: row.get(4)?,
        category: parse_row_enum(&category_text, 5)?,
        notes: row.get(6)?,
        case_sensitive: row.get::<_, i64>(7)? != 0,
        always_active: row.get::<_, i64>(8)? != 0,
        status: parse_row_enum(&status_text, 9)?,
        source_language: row.get(10)?,
        target_language: row.get(11)?,
        source_count: row.get::<_, Option<i64>>(12)?.unwrap_or(0).max(0) as usize,
    })
}

fn glossary_candidate_from_row(
    row: &rusqlite::Row<'_>,
) -> rusqlite::Result<StoredGlossaryCandidate> {
    let category_text: String = row.get(3)?;
    let status_text: String = row.get(7)?;
    Ok(StoredGlossaryCandidate {
        id: row.get(0)?,
        source_text: row.get(1)?,
        target_text: row.get(2)?,
        category: parse_row_enum(&category_text, 3)?,
        notes: row.get(4)?,
        case_sensitive: row.get::<_, i64>(5)? != 0,
        always_active: row.get::<_, i64>(6)? != 0,
        status: parse_row_enum(&status_text, 7)?,
        source_language: row.get(8)?,
        target_language: row.get(9)?,
        source_count: row.get::<_, Option<i64>>(10)?.unwrap_or(0).max(0) as usize,
    })
}

fn parse_gender_short(value: &str) -> Option<EntityGender> {
    match value {
        "m" => Some(EntityGender::Masculine),
        "f" => Some(EntityGender::Feminine),
        "n" => Some(EntityGender::Neuter),
        _ => None,
    }
}

fn parse_row_enum<T>(value: &str, column: usize) -> rusqlite::Result<T>
where
    T: FromStr<Err = String>,
{
    value.parse::<T>().map_err(|err| {
        rusqlite::Error::FromSqlConversionFailure(column, Type::Text, Box::new(RowEnumError(err)))
    })
}

#[derive(Debug)]
struct RowEnumError(String);

impl std::fmt::Display for RowEnumError {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        f.write_str(&self.0)
    }
}

impl std::error::Error for RowEnumError {}

fn replace_block_translations(
    conn: &Connection,
    job_id: &str,
    segment_id: &str,
    blocks: &[BlockTranslation],
) -> rusqlite::Result<()> {
    conn.execute(
        "DELETE FROM translation_blocks WHERE job_id = ?1 AND segment_id = ?2",
        params![job_id, segment_id],
    )?;
    for block in blocks {
        conn.execute(
            "INSERT INTO translation_blocks (segment_id, job_id, block_id, translated_text)
             VALUES (?1, ?2, ?3, ?4)",
            params![
                segment_id,
                job_id,
                block.block_id.0.as_str(),
                block.text.as_str()
            ],
        )?;
    }
    Ok(())
}

#[derive(Debug, Clone, Copy)]
pub enum RetryScope {
    Failed,
    NeedsReview,
    All,
}

fn file_hash(path: &Path) -> CoreResult<String> {
    let bytes = fs::read(path)?;
    Ok(stable_hash_bytes(&bytes))
}

fn stable_hash(text: &str) -> String {
    stable_hash_bytes(text.as_bytes())
}

fn stable_hash_bytes(bytes: &[u8]) -> String {
    let digest = Sha256::digest(bytes);
    let mut output = String::with_capacity(digest.len() * 2);
    for byte in digest {
        use std::fmt::Write as _;
        write!(&mut output, "{byte:02x}").expect("writing to string should not fail");
    }
    output
}

fn unix_timestamp() -> u64 {
    SystemTime::now()
        .duration_since(UNIX_EPOCH)
        .unwrap_or_default()
        .as_secs()
}

fn unix_timestamp_nanos() -> u128 {
    SystemTime::now()
        .duration_since(UNIX_EPOCH)
        .unwrap_or_default()
        .as_nanos()
}

fn timestamp_string() -> String {
    unix_timestamp().to_string()
}

#[cfg(test)]
mod tests {
    use super::*;
    use bookforge_core::{
        ir::{BlockId, SectionId},
        segment::{
            Segment, SegmentBlock, SegmentConstraints, SegmentContext, SegmentId, SegmentMetadata,
            SegmentSource, SegmentTextRun,
        },
    };

    #[test]
    fn store_reuses_connection_across_job_operations() {
        let db_path = temp_path("jobs.sqlite");
        let input_path = temp_path("input.epub");
        fs::write(&input_path, b"epub bytes").expect("input fixture should be writable");

        let store = JobStore::open(&db_path).expect("store should open");
        let job = store
            .create_job(CreateJob {
                input: &input_path,
                output: &temp_path("output.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "mock",
                model: "mock-prefix",
                base_url: None,
                api_key_env: None,
                book_id: None,
                series_id: None,
            })
            .expect("job should be created");
        let segments = vec![segment("seg_a", 0), segment("seg_b", 1)];
        store
            .insert_segments(&job.id, &segments, "v1", "mock", "mock-prefix", "test_ns")
            .expect("segments should insert");

        store
            .save_translation(SaveTranslation {
                job_id: &job.id,
                segment_id: "seg_a",
                translated_text: "Tradotto",
                blocks: &[BlockTranslation {
                    block_id: BlockId("b_000000".to_string()),
                    text: "Tradotto".to_string(),
                }],
                provider: "mock",
                model: "mock-prefix",
                prompt_version: "v1",
                input_tokens: Some(11),
                input_cached_tokens: Some(0),
                output_tokens: Some(7),
                tokens_estimated: false,
            })
            .expect("translation should save");
        store
            .mark_segment_failed(&job.id, "seg_b", "provider unavailable")
            .expect("segment should be marked failed");

        let summary = store
            .summary(&job.id)
            .expect("summary should load")
            .expect("job should exist");
        assert_eq!(summary.total_segments, 2);
        assert_eq!(summary.succeeded, 1);
        assert_eq!(summary.failed, 1);
        assert_eq!(summary.input_tokens, 11);
        assert_eq!(summary.output_tokens, 7);
        let blocks = store
            .load_block_translations(&job.id)
            .expect("block translations should load");
        assert_eq!(blocks.len(), 1);
        assert_eq!(blocks[0].text, "Tradotto");

        let _ = fs::remove_file(db_path);
        let _ = fs::remove_file(input_path);
    }

    fn segment(id: &str, ordinal: usize) -> Segment {
        let block_id = BlockId(format!("b_{ordinal:06}"));
        Segment {
            id: SegmentId(id.to_string()),
            section_id: SectionId("sec_000000".to_string()),
            ordinal,
            block_ids: vec![block_id.clone()],
            source: SegmentSource {
                text: format!("Source {ordinal}"),
                blocks: vec![SegmentBlock {
                    block_id,
                    kind: "paragraph".to_string(),
                    text: format!("Source {ordinal}"),
                    text_runs: vec![SegmentTextRun {
                        id: format!("r{ordinal}"),
                        text: format!("Source {ordinal}"),
                    }],
                    protected_spans: Vec::new(),
                }],
                token_estimate: 2,
            },
            context: SegmentContext::default(),
            metadata: SegmentMetadata::default(),
            constraints: SegmentConstraints::default(),
            checksum: format!("checksum_{ordinal}"),
        }
    }

    fn temp_path(name: &str) -> PathBuf {
        std::env::temp_dir().join(format!(
            "bookforge-store-test-{}-{}-{name}",
            std::process::id(),
            unix_timestamp_nanos()
        ))
    }

    fn build_seeded_store_with_translation(
        db_path: &PathBuf,
        cache_namespace: &str,
        block_ids: &[&str],
    ) -> (JobStore, JobRecord, Segment) {
        let input_path = temp_path("input.epub");
        fs::write(&input_path, b"epub bytes").expect("input fixture should be writable");

        let store = JobStore::open(db_path).expect("store should open");
        let job = store
            .create_job(CreateJob {
                input: &input_path,
                output: &temp_path("output.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "mock",
                model: "mock-prefix",
                base_url: None,
                api_key_env: None,
                book_id: None,
                series_id: None,
            })
            .expect("job should be created");

        let mut seg = segment("seg_a", 0);
        let blocks: Vec<BlockTranslation> = block_ids
            .iter()
            .map(|id| BlockTranslation {
                block_id: BlockId(id.to_string()),
                text: format!("Tradotto {id}"),
            })
            .collect();
        seg.block_ids = block_ids.iter().map(|id| BlockId(id.to_string())).collect();

        store
            .insert_segments(
                &job.id,
                std::slice::from_ref(&seg),
                "v1",
                "mock",
                "mock-prefix",
                cache_namespace,
            )
            .expect("segments should insert");
        store
            .save_translation(SaveTranslation {
                job_id: &job.id,
                segment_id: "seg_a",
                translated_text: "Tradotto",
                blocks: &blocks,
                provider: "mock",
                model: "mock-prefix",
                prompt_version: "v1",
                input_tokens: Some(11),
                input_cached_tokens: Some(0),
                output_tokens: Some(7),
                tokens_estimated: false,
            })
            .expect("translation should save");

        let _ = fs::remove_file(input_path);
        (store, job, seg)
    }

    #[test]
    fn job_config_snapshot_round_trips_through_store() {
        let db_path = temp_path("snapshot.sqlite");
        let input_path = temp_path("input.epub");
        fs::write(&input_path, b"epub bytes").expect("input fixture should be writable");
        let store = JobStore::open(&db_path).expect("store should open");
        let job = store
            .create_job(CreateJob {
                input: &input_path,
                output: &temp_path("output.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "openrouter",
                model: "model",
                base_url: Some("https://example.test/v1"),
                api_key_env: Some("OPENROUTER_API_KEY"),
                book_id: None,
                series_id: None,
            })
            .expect("job should be created");
        let settings = bookforge_core::TranslationProfile::Balanced.resolve();
        let snapshot = RunConfigSnapshot {
            input_path: input_path.clone(),
            input_snapshot_path: Some(temp_path("input-snapshot.epub")),
            input_sha256: Some("abc123".to_string()),
            output_path: temp_path("translated.epub"),
            events_path: Some(temp_path("events.jsonl")),
            report_json_path: Some(temp_path("report.json")),
            report_markdown_path: Some(temp_path("report.md")),
            source_language: Some("English".to_string()),
            target_language: "Italian".to_string(),
            provider: "openrouter".to_string(),
            model: "model".to_string(),
            base_url: Some("https://example.test/v1".to_string()),
            api_key_env: Some("OPENROUTER_API_KEY".to_string()),
            profile: settings.profile,
            provider_preset: None,
            prompt_version: "batch_v1".to_string(),
            cache_namespace: "cache_ns".to_string(),
            book_id: None,
            series_id: None,
            glossary_budget_tokens: 800,
            glossary_format: bookforge_core::GlossaryFormat::Json,
            prompt_extra: None,
            glossary_fingerprint: String::new(),
            glossary_terms: Vec::new(),
            context_window: 0,
            context_budget_tokens: 1200,
            context_scope: bookforge_core::config::ContextScope::Chapter,
            style_fingerprint: String::new(),
            style_rendered_block: String::new(),
            entities_fingerprint: String::new(),
            entities_rendered_block: String::new(),
            settings: bookforge_core::ResolvedRunSettingsSnapshot::from_settings(&settings),
        };

        store
            .update_job_config_snapshot(&job.id, &snapshot)
            .expect("snapshot should persist");
        let loaded = store
            .load_job_config_snapshot(&job.id)
            .expect("snapshot should load")
            .expect("snapshot should exist");
        assert_eq!(loaded, snapshot);

        let reloaded_job = store
            .get_job(&job.id)
            .expect("job should load")
            .expect("job should exist");
        assert_eq!(reloaded_job.events_path, snapshot.events_path);
        assert_eq!(reloaded_job.report_json_path, snapshot.report_json_path);
        assert_eq!(
            reloaded_job.report_markdown_path,
            snapshot.report_markdown_path
        );

        let _ = fs::remove_file(db_path);
        let _ = fs::remove_file(input_path);
    }

    #[test]
    fn job_config_snapshot_does_not_store_api_key_value() {
        let db_path = temp_path("snapshot_secret.sqlite");
        let input_path = temp_path("input.epub");
        fs::write(&input_path, b"epub bytes").expect("input fixture should be writable");
        let api_key_env = "BOOKFORGE_TEST_API_KEY_VALUE_NOT_STORED";
        let api_key_value = "sk-live-secret-that-must-not-be-persisted";
        // This test uses a unique process-local env var and verifies snapshot
        // serialization never reads the value.
        unsafe {
            std::env::set_var(api_key_env, api_key_value);
        }

        let store = JobStore::open(&db_path).expect("store should open");
        let job = store
            .create_job(CreateJob {
                input: &input_path,
                output: &temp_path("output.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "openrouter",
                model: "model",
                base_url: Some("https://example.test/v1"),
                api_key_env: Some(api_key_env),
                book_id: None,
                series_id: None,
            })
            .expect("job should be created");
        let settings = bookforge_core::TranslationProfile::Balanced.resolve();
        let snapshot = RunConfigSnapshot {
            input_path: input_path.clone(),
            input_snapshot_path: None,
            input_sha256: None,
            output_path: temp_path("translated.epub"),
            events_path: Some(temp_path("events.jsonl")),
            report_json_path: Some(temp_path("report.json")),
            report_markdown_path: Some(temp_path("report.md")),
            source_language: Some("English".to_string()),
            target_language: "Italian".to_string(),
            provider: "openrouter".to_string(),
            model: "model".to_string(),
            base_url: Some("https://example.test/v1".to_string()),
            api_key_env: Some(api_key_env.to_string()),
            profile: settings.profile,
            provider_preset: None,
            prompt_version: "batch_v1".to_string(),
            cache_namespace: "cache_ns".to_string(),
            book_id: None,
            series_id: None,
            glossary_budget_tokens: 800,
            glossary_format: bookforge_core::GlossaryFormat::Json,
            prompt_extra: None,
            glossary_fingerprint: String::new(),
            glossary_terms: Vec::new(),
            context_window: 0,
            context_budget_tokens: 1200,
            context_scope: bookforge_core::config::ContextScope::Chapter,
            style_fingerprint: String::new(),
            style_rendered_block: String::new(),
            entities_fingerprint: String::new(),
            entities_rendered_block: String::new(),
            settings: bookforge_core::ResolvedRunSettingsSnapshot::from_settings(&settings),
        };

        store
            .update_job_config_snapshot(&job.id, &snapshot)
            .expect("snapshot should persist");
        let raw_json = {
            let conn = store.conn.borrow();
            conn.query_row(
                "SELECT config_json FROM jobs WHERE id = ?1",
                params![job.id],
                |row| row.get::<_, String>(0),
            )
            .expect("raw snapshot JSON should load")
        };

        assert!(raw_json.contains(api_key_env));
        assert!(!raw_json.contains(api_key_value));

        unsafe {
            std::env::remove_var(api_key_env);
        }
        let _ = fs::remove_file(db_path);
        let _ = fs::remove_file(input_path);
    }

    #[test]
    fn terminal_loading_and_resumable_ids_preserve_lifecycle_boundaries() {
        let db_path = temp_path("terminal_resume.sqlite");
        let input_path = temp_path("input.epub");
        fs::write(&input_path, b"epub bytes").expect("input fixture should be writable");
        let store = JobStore::open(&db_path).expect("store should open");
        let job = store
            .create_job(CreateJob {
                input: &input_path,
                output: &temp_path("output.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "mock",
                model: "mock-prefix",
                base_url: None,
                api_key_env: None,
                book_id: None,
                series_id: None,
            })
            .expect("job should be created");
        let segments = vec![
            segment("seg_done", 0),
            segment("seg_cached", 1),
            segment("seg_review", 2),
            segment("seg_failed", 3),
            segment("seg_queued", 4),
        ];
        store
            .insert_segments(&job.id, &segments, "v1", "mock", "mock-prefix", "ns")
            .expect("segments should insert");
        store
            .save_translation(SaveTranslation {
                job_id: &job.id,
                segment_id: "seg_done",
                translated_text: "Done",
                blocks: &[BlockTranslation {
                    block_id: BlockId("b_000000".to_string()),
                    text: "Done".to_string(),
                }],
                provider: "mock",
                model: "mock-prefix",
                prompt_version: "v1",
                input_tokens: None,
                input_cached_tokens: None,
                output_tokens: None,
                tokens_estimated: false,
            })
            .expect("done should save");
        store
            .save_cached_translation(SaveCachedTranslation {
                job_id: &job.id,
                segment_id: "seg_cached",
                translated_text: "Cached",
                blocks: &[BlockTranslation {
                    block_id: BlockId("b_000001".to_string()),
                    text: "Cached".to_string(),
                }],
                provider: "mock",
                model: "mock-prefix",
                prompt_version: "v1",
            })
            .expect("cached should save");
        store
            .save_needs_review(SaveNeedsReview {
                job_id: &job.id,
                segment_id: "seg_review",
                preserved_text: "Review",
                blocks: &[BlockTranslation {
                    block_id: BlockId("b_000002".to_string()),
                    text: "Review".to_string(),
                }],
                provider: "mock",
                model: "mock-prefix",
                prompt_version: "v1",
                error: "needs eyes",
                input_tokens: None,
                input_cached_tokens: None,
                output_tokens: None,
                tokens_estimated: false,
            })
            .expect("review should save");
        store
            .mark_segment_failed(&job.id, "seg_failed", "failed")
            .expect("failed should mark");

        let terminal = store
            .load_terminal_segment_translations(&job.id)
            .expect("terminal records should load");
        let ids = terminal
            .iter()
            .map(|record| record.segment_id.as_str())
            .collect::<Vec<_>>();
        assert_eq!(ids, vec!["seg_done", "seg_cached", "seg_review"]);
        assert_eq!(terminal[0].blocks[0].block_id.0, "b_000000");
        assert_eq!(terminal[2].status, "needs_review");

        let resumable = store
            .resumable_segment_ids(&job.id)
            .expect("resumable ids should load");
        assert_eq!(resumable, vec!["seg_failed", "seg_queued"]);

        let _ = fs::remove_file(db_path);
        let _ = fs::remove_file(input_path);
    }

    #[test]
    fn mark_unfinished_segments_failed_preserves_terminal_segments() {
        let db_path = temp_path("unfinished_preserve.sqlite");
        let input_path = temp_path("input.epub");
        fs::write(&input_path, b"epub bytes").expect("input fixture should be writable");
        let store = JobStore::open(&db_path).expect("store should open");
        let job = store
            .create_job(CreateJob {
                input: &input_path,
                output: &temp_path("output.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "mock",
                model: "mock-prefix",
                base_url: None,
                api_key_env: None,
                book_id: None,
                series_id: None,
            })
            .expect("job should be created");
        let segments = vec![
            segment("seg_succeeded", 0),
            segment("seg_cached", 1),
            segment("seg_review", 2),
            segment("seg_queued", 3),
            segment("seg_retry", 4),
        ];
        store
            .insert_segments(&job.id, &segments, "v1", "mock", "mock-prefix", "test_ns")
            .expect("segments should insert");
        store
            .save_translation(SaveTranslation {
                job_id: &job.id,
                segment_id: "seg_succeeded",
                translated_text: "Done",
                blocks: &[BlockTranslation {
                    block_id: BlockId("b_000000".to_string()),
                    text: "Done".to_string(),
                }],
                provider: "mock",
                model: "mock-prefix",
                prompt_version: "v1",
                input_tokens: None,
                input_cached_tokens: None,
                output_tokens: None,
                tokens_estimated: false,
            })
            .expect("succeeded segment should save");
        store
            .save_cached_translation(SaveCachedTranslation {
                job_id: &job.id,
                segment_id: "seg_cached",
                translated_text: "Cached",
                blocks: &[BlockTranslation {
                    block_id: BlockId("b_000001".to_string()),
                    text: "Cached".to_string(),
                }],
                provider: "mock",
                model: "mock-prefix",
                prompt_version: "v1",
            })
            .expect("cached segment should save");
        store
            .save_needs_review(SaveNeedsReview {
                job_id: &job.id,
                segment_id: "seg_review",
                preserved_text: "Needs review",
                blocks: &[BlockTranslation {
                    block_id: BlockId("b_000002".to_string()),
                    text: "Needs review".to_string(),
                }],
                provider: "mock",
                model: "mock-prefix",
                prompt_version: "v1",
                error: "qa issue",
                input_tokens: None,
                input_cached_tokens: None,
                output_tokens: None,
                tokens_estimated: false,
            })
            .expect("needs-review segment should save");
        store
            .retry_segments(&job.id, RetryScope::Failed)
            .expect("retry with no failed segments should be harmless");
        {
            let conn = store.conn.borrow();
            conn.execute(
                "UPDATE segments SET status = 'retry_pending' WHERE job_id = ?1 AND id = 'seg_retry'",
                params![job.id],
            )
            .expect("test status update should work");
        }

        let candidate_ids = segments
            .iter()
            .map(|segment| segment.id.0.clone())
            .collect::<Vec<_>>();
        let changed = store
            .mark_unfinished_segments_failed(&job.id, &candidate_ids, "run failed")
            .expect("unfinished segments should be marked failed");
        assert_eq!(changed, 2);

        let records = store.segment_records(&job.id).expect("records should load");
        let statuses = records
            .into_iter()
            .map(|record| (record.id, record.status))
            .collect::<HashMap<_, _>>();
        assert_eq!(statuses["seg_succeeded"], "succeeded");
        assert_eq!(statuses["seg_cached"], "skipped_cached");
        assert_eq!(statuses["seg_review"], "needs_review");
        assert_eq!(statuses["seg_queued"], "failed");
        assert_eq!(statuses["seg_retry"], "failed");

        let _ = fs::remove_file(db_path);
        let _ = fs::remove_file(input_path);
    }

    #[test]
    fn mark_unfinished_segments_failed_marks_only_resumable_segments() {
        let db_path = temp_path("unfinished_resumable_only.sqlite");
        let input_path = temp_path("input.epub");
        fs::write(&input_path, b"epub bytes").expect("input fixture should be writable");
        let store = JobStore::open(&db_path).expect("store should open");
        let job = store
            .create_job(CreateJob {
                input: &input_path,
                output: &temp_path("output.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "mock",
                model: "mock-prefix",
                base_url: None,
                api_key_env: None,
                book_id: None,
                series_id: None,
            })
            .expect("job should be created");
        let segments = vec![
            segment("seg_succeeded", 0),
            segment("seg_cached", 1),
            segment("seg_review", 2),
            segment("seg_failed", 3),
            segment("seg_retry", 4),
            segment("seg_queued", 5),
        ];
        store
            .insert_segments(&job.id, &segments, "v1", "mock", "mock-prefix", "test_ns")
            .expect("segments should insert");
        {
            let conn = store.conn.borrow();
            for (id, status) in [
                ("seg_succeeded", "succeeded"),
                ("seg_cached", "skipped_cached"),
                ("seg_review", "needs_review"),
                ("seg_failed", "failed"),
                ("seg_retry", "retry_pending"),
                ("seg_queued", "queued"),
            ] {
                conn.execute(
                    "UPDATE segments SET status = ?1 WHERE job_id = ?2 AND id = ?3",
                    params![status, job.id, id],
                )
                .expect("status should update");
            }
        }

        let candidate_ids = segments
            .iter()
            .map(|segment| segment.id.0.clone())
            .collect::<Vec<_>>();
        let changed = store
            .mark_unfinished_segments_failed(&job.id, &candidate_ids, "run failed")
            .expect("unfinished segments should be marked failed");

        assert_eq!(changed, 3);
        let records = store.segment_records(&job.id).expect("records should load");
        let statuses = records
            .into_iter()
            .map(|record| (record.id, record.status))
            .collect::<HashMap<_, _>>();
        assert_eq!(statuses["seg_succeeded"], "succeeded");
        assert_eq!(statuses["seg_cached"], "skipped_cached");
        assert_eq!(statuses["seg_review"], "needs_review");
        assert_eq!(statuses["seg_failed"], "failed");
        assert_eq!(statuses["seg_retry"], "failed");
        assert_eq!(statuses["seg_queued"], "failed");

        let _ = fs::remove_file(db_path);
        let _ = fs::remove_file(input_path);
    }

    #[test]
    fn resumable_segment_ids_excludes_succeeded_cached_and_needs_review() {
        let db_path = temp_path("resumable_excludes.sqlite");
        let input_path = temp_path("input.epub");
        fs::write(&input_path, b"epub bytes").expect("input fixture should be writable");
        let store = JobStore::open(&db_path).expect("store should open");
        let job = store
            .create_job(CreateJob {
                input: &input_path,
                output: &temp_path("output.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "mock",
                model: "mock-prefix",
                base_url: None,
                api_key_env: None,
                book_id: None,
                series_id: None,
            })
            .expect("job should be created");
        let segments = vec![
            segment("seg_succeeded", 0),
            segment("seg_cached", 1),
            segment("seg_review", 2),
        ];
        store
            .insert_segments(&job.id, &segments, "v1", "mock", "mock-prefix", "test_ns")
            .expect("segments should insert");
        {
            let conn = store.conn.borrow();
            for (id, status) in [
                ("seg_succeeded", "succeeded"),
                ("seg_cached", "skipped_cached"),
                ("seg_review", "needs_review"),
            ] {
                conn.execute(
                    "UPDATE segments SET status = ?1 WHERE job_id = ?2 AND id = ?3",
                    params![status, job.id, id],
                )
                .expect("status should update");
            }
        }

        let ids = store
            .resumable_segment_ids(&job.id)
            .expect("resumable ids should load");

        assert!(ids.is_empty());
        let _ = fs::remove_file(db_path);
        let _ = fs::remove_file(input_path);
    }

    #[test]
    fn resumable_segment_ids_includes_failed_retry_pending_and_pending() {
        let db_path = temp_path("resumable_includes.sqlite");
        let input_path = temp_path("input.epub");
        fs::write(&input_path, b"epub bytes").expect("input fixture should be writable");
        let store = JobStore::open(&db_path).expect("store should open");
        let job = store
            .create_job(CreateJob {
                input: &input_path,
                output: &temp_path("output.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "mock",
                model: "mock-prefix",
                base_url: None,
                api_key_env: None,
                book_id: None,
                series_id: None,
            })
            .expect("job should be created");
        let segments = vec![
            segment("seg_failed", 0),
            segment("seg_retry", 1),
            segment("seg_queued", 2),
        ];
        store
            .insert_segments(&job.id, &segments, "v1", "mock", "mock-prefix", "test_ns")
            .expect("segments should insert");
        {
            let conn = store.conn.borrow();
            for (id, status) in [
                ("seg_failed", "failed"),
                ("seg_retry", "retry_pending"),
                ("seg_queued", "queued"),
            ] {
                conn.execute(
                    "UPDATE segments SET status = ?1 WHERE job_id = ?2 AND id = ?3",
                    params![status, job.id, id],
                )
                .expect("status should update");
            }
        }

        let ids = store
            .resumable_segment_ids(&job.id)
            .expect("resumable ids should load");

        assert_eq!(ids, vec!["seg_failed", "seg_retry", "seg_queued"]);
        let _ = fs::remove_file(db_path);
        let _ = fs::remove_file(input_path);
    }

    #[test]
    fn cached_translation_requires_matching_cache_namespace() {
        let db_path = temp_path("ns_match.sqlite");
        let (store, _job, seg) =
            build_seeded_store_with_translation(&db_path, "ns_one", &["b_000000"]);

        let hit = store
            .find_cached_translation(
                &seg,
                "v1",
                "mock",
                "mock-prefix",
                Some("English"),
                "Italian",
                "ns_one",
            )
            .expect("query ok");
        assert!(hit.is_some(), "matching namespace should hit");

        let miss = store
            .find_cached_translation(
                &seg,
                "v1",
                "mock",
                "mock-prefix",
                Some("English"),
                "Italian",
                "ns_two",
            )
            .expect("query ok");
        assert!(miss.is_none(), "different namespace must not hit");

        let _ = fs::remove_file(db_path);
    }

    #[test]
    fn cached_translation_rejects_mismatched_block_ids() {
        let db_path = temp_path("blockid_match.sqlite");
        let (store, _job, mut seg) =
            build_seeded_store_with_translation(&db_path, "ns_x", &["b_000000"]);

        // Caller's segment now expects different block IDs than what was stored.
        seg.block_ids = vec![BlockId("b_999999".to_string())];

        let miss = store
            .find_cached_translation(
                &seg,
                "v1",
                "mock",
                "mock-prefix",
                Some("English"),
                "Italian",
                "ns_x",
            )
            .expect("query ok");
        assert!(
            miss.is_none(),
            "mismatched block_ids must reject the cached row"
        );

        let _ = fs::remove_file(db_path);
    }

    #[test]
    fn cached_translation_prefers_repaired_succeeded_rows_over_cached_clones() {
        let db_path = temp_path("cache_prefers_repaired.sqlite");
        let (store, _stale_job, seg) =
            build_seeded_store_with_translation(&db_path, "cache_ns", &["b_000000"]);
        let cached_input = temp_path("cached-input.epub");
        let repaired_input = temp_path("repaired-input.epub");
        fs::write(&cached_input, b"cached input").expect("cached input should be writable");
        fs::write(&repaired_input, b"repaired input").expect("repaired input should be writable");

        let cached_job = store
            .create_job(CreateJob {
                input: &cached_input,
                output: &temp_path("cached-output.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "mock",
                model: "mock-prefix",
                base_url: None,
                api_key_env: None,
                book_id: None,
                series_id: None,
            })
            .expect("cached job should be created");
        store
            .insert_segments(
                &cached_job.id,
                std::slice::from_ref(&seg),
                "v1",
                "mock",
                "mock-prefix",
                "cache_ns",
            )
            .expect("cached job segment should insert");
        store
            .save_cached_translation(SaveCachedTranslation {
                job_id: &cached_job.id,
                segment_id: "seg_a",
                translated_text: "stale cached clone",
                blocks: &[BlockTranslation {
                    block_id: BlockId("b_000000".to_string()),
                    text: "stale cached clone".to_string(),
                }],
                provider: "mock",
                model: "mock-prefix",
                prompt_version: "v1",
            })
            .expect("cached clone should save");

        let repaired_job = store
            .create_job(CreateJob {
                input: &repaired_input,
                output: &temp_path("repaired-output.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "mock",
                model: "mock-prefix",
                base_url: None,
                api_key_env: None,
                book_id: None,
                series_id: None,
            })
            .expect("repaired job should be created");
        store
            .insert_segments(
                &repaired_job.id,
                std::slice::from_ref(&seg),
                "v1",
                "mock",
                "mock-prefix",
                "cache_ns",
            )
            .expect("repaired job segment should insert");
        store
            .save_translation(SaveTranslation {
                job_id: &repaired_job.id,
                segment_id: "seg_a",
                translated_text: "repaired translation",
                blocks: &[BlockTranslation {
                    block_id: BlockId("b_000000".to_string()),
                    text: "repaired translation".to_string(),
                }],
                provider: "mock",
                model: "mock-prefix",
                prompt_version: "v1",
                input_tokens: Some(12),
                input_cached_tokens: Some(0),
                output_tokens: Some(8),
                tokens_estimated: false,
            })
            .expect("repaired translation should save");

        let request = CacheLookupRequest {
            prompt_version: "v1",
            provider: "mock",
            model: "mock-prefix",
            source_lang: Some("English"),
            target_lang: "Italian",
            cache_namespace: "cache_ns",
        };
        let single_hit = store
            .find_cached_translation(
                &seg,
                request.prompt_version,
                request.provider,
                request.model,
                request.source_lang,
                request.target_lang,
                request.cache_namespace,
            )
            .expect("single lookup should succeed")
            .expect("single lookup should hit");
        let batch_hit = store
            .find_cached_translations_batch(std::slice::from_ref(&seg), request)
            .expect("batch lookup should succeed")
            .remove(&seg.id.0)
            .expect("batch lookup should hit");

        assert_eq!(single_hit.translated_text, "repaired translation");
        assert_eq!(single_hit.blocks[0].text, "repaired translation");
        assert_eq!(batch_hit.translated_text, "repaired translation");
        assert_eq!(batch_hit.blocks[0].text, "repaired translation");

        let _ = fs::remove_file(db_path);
        let _ = fs::remove_file(cached_input);
        let _ = fs::remove_file(repaired_input);
    }

    #[test]
    fn old_empty_cache_namespace_rows_do_not_match_new_runs() {
        let db_path = temp_path("legacy_ns.sqlite");
        // Simulate a row migrated from an older schema with the default empty namespace.
        let (store, _job, seg) = build_seeded_store_with_translation(&db_path, "", &["b_000000"]);

        let miss = store
            .find_cached_translation(
                &seg,
                "v1",
                "mock",
                "mock-prefix",
                Some("English"),
                "Italian",
                "real_ns",
            )
            .expect("query ok");
        assert!(
            miss.is_none(),
            "legacy empty-namespace row must not satisfy a real namespace lookup"
        );

        let _ = fs::remove_file(db_path);
    }

    #[test]
    fn job_store_enables_wal_and_busy_timeout() {
        let db_path = temp_path("wal_busy.sqlite");
        let store = JobStore::open(&db_path).expect("store should open");

        let conn = store.conn.borrow();
        let journal_mode: String = conn
            .pragma_query_value(None, "journal_mode", |row| row.get(0))
            .expect("pragma journal_mode should succeed");
        assert_eq!(
            journal_mode.to_lowercase(),
            "wal",
            "WAL journal mode must be enabled"
        );

        let busy_timeout: i64 = conn
            .pragma_query_value(None, "busy_timeout", |row| row.get(0))
            .expect("pragma busy_timeout should succeed");
        assert!(
            busy_timeout >= 5000,
            "busy_timeout should be at least 5000ms, got {busy_timeout}"
        );

        let wal_path = db_path.with_extension("sqlite-wal");
        let shm_path = db_path.with_extension("sqlite-shm");
        // WAL/shm may or may not exist depending on transactions, but the
        // journal_mode query confirms WAL is active.

        let _ = fs::remove_file(db_path);
        let _ = fs::remove_file(wal_path);
        let _ = fs::remove_file(shm_path);
    }

    #[test]
    fn job_store_enables_foreign_keys_on_every_connection() {
        let db_path = temp_path("fk.sqlite");
        let store = JobStore::open(&db_path).expect("store should open");

        let conn = store.conn.borrow();
        let fk_enabled: i64 = conn
            .pragma_query_value(None, "foreign_keys", |row| row.get(0))
            .expect("pragma foreign_keys should succeed");
        assert_eq!(
            fk_enabled, 1,
            "foreign_keys pragma must be ON on every connection"
        );

        let _ = fs::remove_file(db_path);
    }

    #[test]
    fn doctor_reports_wal_sidecars_as_normal_when_integrity_check_passes() {
        let db_path = temp_path("doctor.sqlite");
        let store = JobStore::open(&db_path).expect("store should open");

        // Perform a write to trigger WAL sidecar creation.
        let input_path = temp_path("input_doctor.epub");
        fs::write(&input_path, b"epub bytes").expect("test epub");
        let _job = store
            .create_job(CreateJob {
                input: &input_path,
                output: &temp_path("out_doctor.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "mock",
                model: "mock-prefix",
                base_url: None,
                api_key_env: None,
                book_id: None,
                series_id: None,
            })
            .expect("job created");
        drop(store);

        let doctor = run_doctor(Some(db_path.clone())).expect("doctor should run");
        assert!(doctor.database_exists, "database should exist");
        assert_eq!(
            doctor.journal_mode.to_lowercase(),
            "wal",
            "journal mode should be wal"
        );
        assert_eq!(doctor.integrity_check, "ok", "integrity check should pass");
        assert!(
            doctor.wal_sidecars_normal,
            "wal sidecars should be reported as normal"
        );

        if doctor.wal_present || doctor.shm_present {
            assert!(
                !doctor.note.is_empty(),
                "doctor must explain WAL sidecars when they are present"
            );
        }

        let wal_path = db_path.with_extension("sqlite-wal");
        let shm_path = db_path.with_extension("sqlite-shm");
        let _ = fs::remove_file(&db_path);
        let _ = fs::remove_file(input_path);
        let _ = fs::remove_file(wal_path);
        let _ = fs::remove_file(shm_path);
    }

    #[test]
    fn checkpoint_writer_and_reader_do_not_immediately_busy_fail() {
        let db_path = temp_path("concurrent.sqlite");
        let input_path = temp_path("input_conc.epub");
        fs::write(&input_path, b"epub bytes").expect("test epub");

        // Open writer store first and create a job.
        let store_w = JobStore::open(&db_path).expect("store_w open");
        let job = store_w
            .create_job(CreateJob {
                input: &input_path,
                output: &temp_path("out_conc.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "mock",
                model: "mock-prefix",
                base_url: None,
                api_key_env: None,
                book_id: None,
                series_id: None,
            })
            .expect("job created");
        store_w
            .insert_segments(
                &job.id,
                &[segment("seg_conc", 0)],
                "v1",
                "mock",
                "mock-prefix",
                "ns",
            )
            .expect("segments inserted");

        // Open a second reader store while the first is still active.
        let store_r = JobStore::open(&db_path).expect("store_r open");
        let summary = store_r
            .summary(&job.id)
            .expect("summary should load")
            .expect("job should exist");
        assert_eq!(summary.total_segments, 1);

        let wal_path = db_path.with_extension("sqlite-wal");
        let shm_path = db_path.with_extension("sqlite-shm");
        let _ = fs::remove_file(&db_path);
        let _ = fs::remove_file(input_path);
        let _ = fs::remove_file(wal_path);
        let _ = fs::remove_file(shm_path);
    }

    #[test]
    fn migrate_creates_glossary_terms_table() {
        let db_path = temp_path("glossary_migrate.sqlite");
        let store = JobStore::open(&db_path).expect("store opens");
        let conn = store.conn.borrow();
        let table: String = conn
            .query_row(
                "SELECT name FROM sqlite_master WHERE type = 'table' AND name = 'glossary_terms'",
                [],
                |row| row.get(0),
            )
            .expect("glossary_terms table exists");
        assert_eq!(table, "glossary_terms");
        let index: String = conn
            .query_row(
                "SELECT name FROM sqlite_master WHERE type = 'index' AND name = 'idx_glossary_lookup'",
                [],
                |row| row.get(0),
            )
            .expect("idx_glossary_lookup exists");
        assert_eq!(index, "idx_glossary_lookup");
        let version: i64 = conn
            .query_row(
                "SELECT version FROM _migrations WHERE name = 'v1_2_glossary_terms'",
                [],
                |row| row.get(0),
            )
            .expect("v1_2 migration recorded");
        assert_eq!(version, 4);
        drop(conn);
        let _ = fs::remove_file(&db_path);
    }

    #[test]
    fn migrate_is_idempotent_v1_2() {
        let db_path = temp_path("glossary_idem.sqlite");
        // Open twice; second open re-runs migrate() and must not error.
        {
            let _store = JobStore::open(&db_path).expect("first open");
        }
        {
            let _store = JobStore::open(&db_path).expect("second open");
        }
        let _ = fs::remove_file(&db_path);
    }

    #[test]
    fn migrate_rebuilds_glossary_terms_with_nullable_target_text() {
        let db_path = temp_path("glossary_nullable_target.sqlite");
        {
            let conn = Connection::open(&db_path).expect("legacy db opens");
            conn.execute_batch(
                "
                CREATE TABLE _migrations (
                  version INTEGER PRIMARY KEY,
                  name TEXT NOT NULL,
                  applied_at TEXT NOT NULL
                );
                CREATE TABLE glossary_terms (
                  id INTEGER PRIMARY KEY,
                  scope_kind TEXT NOT NULL CHECK(scope_kind IN ('global', 'series', 'book')),
                  scope_id TEXT,
                  source_text TEXT NOT NULL,
                  target_text TEXT NOT NULL,
                  category TEXT NOT NULL CHECK(category IN
                    ('person', 'place', 'object', 'invented', 'style', 'phrase', 'other')),
                  notes TEXT,
                  case_sensitive INTEGER NOT NULL DEFAULT 0,
                  always_active INTEGER NOT NULL DEFAULT 0,
                  status TEXT NOT NULL CHECK(status IN
                    ('user_seeded', 'auto_candidate', 'accepted', 'rejected'))
                    DEFAULT 'user_seeded',
                  source_language TEXT NOT NULL,
                  target_language TEXT NOT NULL,
                  source_count INTEGER DEFAULT 0,
                  created_at TEXT NOT NULL,
                  updated_at TEXT NOT NULL,
                  UNIQUE(scope_kind, scope_id, source_text, source_language, target_language)
                );
                CREATE INDEX idx_glossary_lookup
                  ON glossary_terms(source_language, target_language, scope_kind, scope_id, status);
                INSERT INTO glossary_terms
                  (id, scope_kind, scope_id, source_text, target_text, category, notes,
                   case_sensitive, always_active, status, source_language, target_language,
                   source_count, created_at, updated_at)
                VALUES
                  (42, 'book', 'ivan', 'Ivan Ilych', 'Ivan Il''ich', 'person', 'legacy',
                   1, 0, 'user_seeded', 'English', 'Italian', 9, 'created', 'updated');
                ",
            )
            .expect("legacy schema should initialize");
        }

        let store = JobStore::open(&db_path).expect("store opens and migrates");
        let conn = store.conn.borrow();
        assert!(
            !table_column_is_not_null(&conn, "glossary_terms", "target_text")
                .expect("table info should load")
        );
        let row = conn
            .query_row(
                "SELECT id, target_text, created_at, updated_at FROM glossary_terms WHERE id = 42",
                [],
                |row| {
                    Ok((
                        row.get::<_, i64>(0)?,
                        row.get::<_, String>(1)?,
                        row.get::<_, String>(2)?,
                        row.get::<_, String>(3)?,
                    ))
                },
            )
            .expect("legacy glossary row should survive");
        assert_eq!(row.0, 42);
        assert_eq!(row.1, "Ivan Il'ich");
        assert_eq!(row.2, "created");
        assert_eq!(row.3, "updated");
        let version: i64 = conn
            .query_row(
                "SELECT version FROM _migrations WHERE name = 'v1_2_1_nullable_glossary_candidate_targets'",
                [],
                |row| row.get(0),
            )
            .expect("v1.2.1 migration recorded");
        assert_eq!(version, 5);
        let index: String = conn
            .query_row(
                "SELECT name FROM sqlite_master WHERE type = 'index' AND name = 'idx_glossary_lookup'",
                [],
                |row| row.get(0),
            )
            .expect("idx_glossary_lookup should be recreated");
        assert_eq!(index, "idx_glossary_lookup");
        let duplicate = conn.execute(
            "INSERT INTO glossary_terms
              (scope_kind, scope_id, source_text, target_text, category, notes,
               case_sensitive, always_active, status, source_language, target_language,
               source_count, created_at, updated_at)
             VALUES
              ('book', 'ivan', 'Ivan Ilych', 'duplicate', 'person', NULL,
               1, 0, 'user_seeded', 'English', 'Italian', 1, 'now', 'now')",
            [],
        );
        assert!(
            duplicate.is_err(),
            "unique constraint should survive the rebuild"
        );
        drop(conn);
        let _ = fs::remove_file(&db_path);
    }

    #[test]
    fn glossary_candidate_upsert_updates_auto_and_skips_rejected() {
        let db_path = temp_path("glossary_candidates.sqlite");
        let store = JobStore::open(&db_path).expect("store opens");
        let first = store
            .upsert_glossary_candidates(
                "ivan",
                "English",
                "Italian",
                &[NewGlossaryCandidate {
                    source_text: "Ivan Ilych",
                    category: GlossaryCategory::Other,
                    source_count: 4,
                }],
            )
            .expect("candidate inserts");
        assert_eq!(first.inserted, 1);

        let candidates = store
            .list_glossary_candidates("ivan", "English", "Italian")
            .expect("candidates should list");
        assert_eq!(candidates.len(), 1);
        assert_eq!(candidates[0].target_text, None);
        assert_eq!(candidates[0].source_count, 4);

        let second = store
            .upsert_glossary_candidates(
                "ivan",
                "English",
                "Italian",
                &[NewGlossaryCandidate {
                    source_text: "Ivan Ilych",
                    category: GlossaryCategory::Other,
                    source_count: 7,
                }],
            )
            .expect("candidate updates");
        assert_eq!(second.updated, 1);
        assert_eq!(
            store
                .list_glossary_candidates("ivan", "English", "Italian")
                .expect("candidates should list")[0]
                .source_count,
            7
        );

        assert!(
            store
                .reject_glossary_candidate(candidates[0].id)
                .expect("candidate rejects")
        );
        let third = store
            .upsert_glossary_candidates(
                "ivan",
                "English",
                "Italian",
                &[NewGlossaryCandidate {
                    source_text: "Ivan Ilych",
                    category: GlossaryCategory::Other,
                    source_count: 9,
                }],
            )
            .expect("rejected candidate is skipped");
        assert_eq!(third.skipped, 1);
        assert!(
            store
                .list_glossary_candidates("ivan", "English", "Italian")
                .expect("rejected candidates are not pending")
                .is_empty()
        );

        let all = store
            .list_glossary_terms(GlossaryFilter {
                scope_kind: Some(GlossaryScopeKind::Book),
                scope_id: Some("ivan"),
                source_language: Some("English"),
                target_language: Some("Italian"),
                active_only: false,
            })
            .expect("terms should list");
        assert_eq!(all.len(), 1);
        assert_eq!(all[0].status, GlossaryStatus::Rejected);
        assert_eq!(all[0].source_count, 7);

        let seeded = glossary_term(
            bookforge_core::GlossaryScopeKind::Book,
            Some("ivan"),
            "Aragorn",
            "Aragorn",
        );
        let mut accepted = glossary_term(
            bookforge_core::GlossaryScopeKind::Book,
            Some("ivan"),
            "Mount Doom",
            "Monte Fato",
        );
        accepted.status = GlossaryStatus::Accepted;
        store
            .upsert_glossary_terms(&[seeded, accepted])
            .expect("active terms should insert");
        let fourth = store
            .upsert_glossary_candidates(
                "ivan",
                "English",
                "Italian",
                &[
                    NewGlossaryCandidate {
                        source_text: "Aragorn",
                        category: GlossaryCategory::Other,
                        source_count: 12,
                    },
                    NewGlossaryCandidate {
                        source_text: "Mount Doom",
                        category: GlossaryCategory::Other,
                        source_count: 11,
                    },
                ],
            )
            .expect("active terms are skipped");
        assert_eq!(fourth.skipped, 2);

        let _ = fs::remove_file(&db_path);
    }

    #[test]
    fn glossary_terms_upsert_list_and_active_lookup() {
        let db_path = temp_path("glossary_terms.sqlite");
        let store = JobStore::open(&db_path).expect("store opens");
        let mut global = glossary_term(
            bookforge_core::GlossaryScopeKind::Global,
            None,
            "Aragorn",
            "Aragorn",
        );
        let book = glossary_term(
            bookforge_core::GlossaryScopeKind::Book,
            Some("fellowship"),
            "Aragorn",
            "Granpasso",
        );

        assert_eq!(
            store
                .upsert_glossary_terms(&[global.clone(), book.clone()])
                .expect("terms upsert"),
            2
        );
        global.target_text = "Aragorn II".to_string();
        store
            .upsert_glossary_terms(&[global.clone()])
            .expect("global term updates instead of duplicating");

        let all = store
            .list_glossary_terms(GlossaryFilter::default())
            .expect("terms list");
        assert_eq!(all.len(), 2);

        let active = store
            .load_active_glossary_terms("English", "Italian", Some("fellowship"), Some("lotr"))
            .expect("active terms");
        assert_eq!(active.len(), 2);
        assert!(active.iter().any(|term| term.target_text == "Granpasso"));
        let active_by_target = store
            .load_active_glossary_terms_for_target("Italian", Some("fellowship"), Some("lotr"))
            .expect("target-only active terms");
        assert_eq!(active_by_target.len(), 2);
        assert!(
            active_by_target
                .iter()
                .any(|term| term.source_language == "English" && term.target_text == "Granpasso")
        );

        let removed = store
            .clear_glossary_scope(bookforge_core::GlossaryScopeKind::Global, None)
            .expect("global clear");
        assert_eq!(removed, 1);

        let _ = fs::remove_file(&db_path);
    }

    #[test]
    fn create_job_persists_book_and_series_ids() {
        let db_path = temp_path("glossary_jobids.sqlite");
        let input_path = temp_path("input_jobids.epub");
        fs::write(&input_path, b"epub bytes").expect("input fixture");
        let store = JobStore::open(&db_path).expect("store opens");
        let job = store
            .create_job(CreateJob {
                input: &input_path,
                output: &temp_path("out_jobids.epub"),
                source_lang: Some("English"),
                target_lang: "Italian",
                provider: "mock",
                model: "mock",
                base_url: None,
                api_key_env: None,
                book_id: Some("fellowship"),
                series_id: Some("lord-of-the-rings"),
            })
            .expect("job created");
        assert_eq!(job.book_id.as_deref(), Some("fellowship"));
        assert_eq!(job.series_id.as_deref(), Some("lord-of-the-rings"));
        let loaded = store
            .get_job(&job.id)
            .expect("get_job ok")
            .expect("job present");
        assert_eq!(loaded.book_id.as_deref(), Some("fellowship"));
        assert_eq!(loaded.series_id.as_deref(), Some("lord-of-the-rings"));
        let _ = fs::remove_file(&db_path);
        let _ = fs::remove_file(input_path);
    }

    fn glossary_term(
        scope_kind: bookforge_core::GlossaryScopeKind,
        scope_id: Option<&str>,
        source: &str,
        target: &str,
    ) -> bookforge_core::GlossaryTerm {
        bookforge_core::GlossaryTerm {
            id: None,
            scope_kind,
            scope_id: scope_id.map(ToOwned::to_owned),
            source_text: source.to_string(),
            target_text: target.to_string(),
            category: bookforge_core::GlossaryCategory::Person,
            notes: None,
            case_sensitive: true,
            always_active: false,
            status: bookforge_core::GlossaryStatus::UserSeeded,
            source_language: "English".to_string(),
            target_language: "Italian".to_string(),
            source_count: 0,
        }
    }
}