Skip to main content

sqlite_graphrag/commands/
edit.rs

1//! Handler for the `edit` CLI subcommand.
2
3use crate::errors::AppError;
4use crate::i18n::errors_msg;
5use crate::output;
6use crate::paths::AppPaths;
7use crate::storage::connection::open_rw;
8use crate::storage::{memories, versions};
9use serde::Serialize;
10
// Command-line arguments accepted by the `edit` subcommand.
//
// NOTE: the `///` doc comments on the fields below are consumed by clap's
// derive macro as help text, so maintainer-only notes in this struct are
// written as plain `//` comments to keep the generated `--help` unchanged.
#[derive(clap::Args)]
#[command(after_long_help = "EXAMPLES:\n  \
    # Edit body inline\n  \
    sqlite-graphrag edit onboarding --body \"updated content\"\n\n  \
    # Edit body from a file\n  \
    sqlite-graphrag edit onboarding --body-file ./updated.md\n\n  \
    # Edit body from stdin (pipe)\n  \
    cat updated.md | sqlite-graphrag edit onboarding --body-stdin\n\n  \
    # Update only the description\n  \
    sqlite-graphrag edit onboarding --description \"new short description\"")]
pub struct EditArgs {
    /// Memory name as a positional argument. Alternative to `--name`.
    // Declared as conflicting with `--name`, so at most one of the two name
    // sources can be supplied; `run` rejects the case where neither is given.
    #[arg(
        value_name = "NAME",
        conflicts_with = "name",
        help = "Memory name to edit; alternative to --name"
    )]
    pub name_positional: Option<String>,
    /// Memory name to edit. Soft-deleted memories are not editable; use `restore` first.
    #[arg(long)]
    pub name: Option<String>,
    /// New inline body content. Mutually exclusive with --body-file and --body-stdin.
    #[arg(long, conflicts_with_all = ["body_file", "body_stdin"])]
    pub body: Option<String>,
    /// Read new body from a file. Mutually exclusive with --body and --body-stdin.
    #[arg(long, conflicts_with_all = ["body", "body_stdin"])]
    pub body_file: Option<std::path::PathBuf>,
    /// Read new body from stdin until EOF. Mutually exclusive with --body and --body-file.
    #[arg(long, conflicts_with_all = ["body", "body_file"])]
    pub body_stdin: bool,
    /// New description (≤500 chars) replacing the existing one.
    // NOTE(review): `run` compares `desc.len()` (a byte count) against
    // MAX_MEMORY_DESCRIPTION_LEN, so the effective limit is in bytes rather
    // than characters for non-ASCII text — confirm which one is intended.
    #[arg(long)]
    pub description: Option<String>,
    /// Change the memory type (e.g. note, skill, decision).
    // `--type` is exposed as a visible alias of `--memory-type`.
    #[arg(long, value_enum, visible_alias = "type", help = "Change memory type")]
    pub memory_type: Option<crate::cli::MemoryType>,
    // Optimistic-lock token. The raw CLI string is converted to an `i64` by
    // `crate::parsers::parse_expected_updated_at`; `run` compares it against
    // the stored `updated_at` and also adds it to the UPDATE's WHERE clause.
    #[arg(
        long,
        value_name = "EPOCH_OR_RFC3339",
        value_parser = crate::parsers::parse_expected_updated_at,
        long_help = "Optimistic lock: reject if updated_at does not match. \
Accepts Unix epoch (e.g. 1700000000) or RFC 3339 (e.g. 2026-04-19T12:00:00Z)."
    )]
    pub expected_updated_at: Option<i64>,
    // Optional namespace override; `run` passes it to
    // `crate::namespace::resolve_namespace`, which decides the fallback.
    #[arg(
        long,
        help = "Namespace (env: SQLITE_GRAPHRAG_NAMESPACE, default: global)"
    )]
    pub namespace: Option<String>,
    // Hidden flag that is accepted but never read by `run`.
    #[arg(long, hide = true, help = "No-op; JSON is always emitted on stdout")]
    pub json: bool,
    // Database location override, also settable through the
    // SQLITE_GRAPHRAG_DB_PATH environment variable; forwarded to
    // `AppPaths::resolve`.
    #[arg(long, env = "SQLITE_GRAPHRAG_DB_PATH")]
    pub db: Option<String>,
    /// G42/S9 (v1.0.79): regenerate the embedding even when the body is
    /// unchanged. This is the supported way to re-embed a memory (the
    /// pre-v1.0.79 docs suggested `edit --description "<same>"`, which
    /// is a no-op and never re-embeds).
    #[arg(
        long,
        default_value_t = false,
        help = "Regenerate the embedding even when the body is unchanged (G42/S9)"
    )]
    pub force_reembed: bool,
    /// G42/S3 (v1.0.79): maximum simultaneous LLM embedding subprocesses.
    /// Only relevant for future multi-item edit paths; a single-body edit
    /// performs one LLM call regardless.
    // NOTE(review): the help text says "clamp", but the parser is a ranged
    // value parser over 1..=32, which presumably rejects out-of-range input
    // with a parse error instead of clamping it — confirm and align wording.
    // This field is not read anywhere in `run`.
    #[arg(long, default_value_t = 4, value_name = "N",
          value_parser = clap::value_parser!(u64).range(1..=32),
          help = "Maximum simultaneous LLM embedding subprocesses (default: 4, clamp [1,32])")]
    pub llm_parallelism: u64,
}
82
/// JSON envelope that `run` passes to `output::emit_json` after a successful edit.
#[derive(Serialize)]
struct EditResponse {
    /// Identifier of the edited memory row.
    memory_id: i64,
    /// Name of the edited memory, as resolved from the CLI arguments.
    name: String,
    /// Outcome label; `run` always sets this to `"updated"`.
    action: String,
    /// Version number assigned to the snapshot recorded for this edit.
    version: i64,
    /// Total execution time in milliseconds from handler start to serialisation.
    elapsed_ms: u64,
    /// v1.0.84 (ADR-0042): discriminator of the LLM backend that actually
    /// performed the re-embedding of the edited body. `"claude" | "codex" | "none"`.
    /// Absent on the wire when `None` (kept for happy-path envelope cleanliness,
    /// or when the body did not change and re-embedding was not invoked).
    #[serde(skip_serializing_if = "Option::is_none")]
    backend_invoked: Option<&'static str>,
}
98
99pub fn run(args: EditArgs, llm_backend: crate::cli::LlmBackendChoice) -> Result<(), AppError> {
100    use crate::constants::*;
101
102    let inicio = std::time::Instant::now();
103    tracing::debug!(target: "edit", name = ?args.name_positional.as_deref().or(args.name.as_deref()), "updating memory");
104    // Resolve name from positional or --name flag; both are optional, at least one is required.
105    let name = args.name_positional.or(args.name).ok_or_else(|| {
106        AppError::Validation("name required: pass as positional argument or via --name".to_string())
107    })?;
108    let namespace = crate::namespace::resolve_namespace(args.namespace.as_deref())?;
109
110    let paths = AppPaths::resolve(args.db.as_deref())?;
111    crate::storage::connection::ensure_db_ready(&paths)?;
112    let mut conn = open_rw(&paths.db)?;
113
114    let (memory_id, current_updated_at, _current_version) =
115        memories::find_by_name(&conn, &namespace, &name)?
116            .ok_or_else(|| AppError::NotFound(errors_msg::memory_not_found(&name, &namespace)))?;
117
118    if let Some(expected) = args.expected_updated_at {
119        if expected != current_updated_at {
120            return Err(AppError::Conflict(errors_msg::optimistic_lock_conflict(
121                expected,
122                current_updated_at,
123            )));
124        }
125    }
126
127    let mut raw_body: Option<String> = None;
128    if args.body.is_some() || args.body_file.is_some() || args.body_stdin {
129        let b = if let Some(b) = args.body {
130            b
131        } else if let Some(path) = &args.body_file {
132            let file_size = std::fs::metadata(path).map_err(AppError::Io)?.len();
133            if file_size > MAX_MEMORY_BODY_LEN as u64 {
134                return Err(AppError::LimitExceeded(
135                    crate::i18n::validation::body_exceeds(MAX_MEMORY_BODY_LEN),
136                ));
137            }
138            std::fs::read_to_string(path).map_err(AppError::Io)?
139        } else {
140            crate::stdin_helper::read_stdin_with_timeout(60)?
141        };
142        if b.len() > MAX_MEMORY_BODY_LEN {
143            return Err(AppError::LimitExceeded(
144                crate::i18n::validation::body_exceeds(MAX_MEMORY_BODY_LEN),
145            ));
146        }
147        raw_body = Some(b);
148    }
149
150    if let Some(ref desc) = args.description {
151        if desc.len() > MAX_MEMORY_DESCRIPTION_LEN {
152            return Err(AppError::Validation(
153                crate::i18n::validation::description_exceeds(MAX_MEMORY_DESCRIPTION_LEN),
154            ));
155        }
156    }
157
158    let row = memories::read_by_name(&conn, &namespace, &name)?
159        .ok_or_else(|| AppError::Internal(anyhow::anyhow!("memory row not found after check")))?;
160
161    let body_changed = raw_body.is_some();
162    let new_body = raw_body.unwrap_or(row.body.clone());
163    let new_description = args.description.unwrap_or(row.description.clone());
164    let new_hash = blake3::hash(new_body.as_bytes()).to_hex().to_string();
165    // Skip re-embedding when body content is identical to the stored version.
166    let body_changed = body_changed && new_hash != row.body_hash;
167    let memory_type = args
168        .memory_type
169        .map(|t| t.as_str().to_string())
170        .unwrap_or_else(|| row.memory_type.clone());
171    let type_changed = memory_type != row.memory_type;
172    let metadata = row.metadata.clone();
173
174    let tx = conn.transaction_with_behavior(rusqlite::TransactionBehavior::Immediate)?;
175
176    let affected = if let Some(ts) = args.expected_updated_at {
177        tx.execute(
178            "UPDATE memories SET description=?2, body=?3, body_hash=?4, type=?5
179             WHERE id=?1 AND updated_at=?6 AND deleted_at IS NULL",
180            rusqlite::params![
181                memory_id,
182                new_description,
183                new_body,
184                new_hash,
185                memory_type,
186                ts
187            ],
188        )?
189    } else {
190        tx.execute(
191            "UPDATE memories SET description=?2, body=?3, body_hash=?4, type=?5
192             WHERE id=?1 AND deleted_at IS NULL",
193            rusqlite::params![memory_id, new_description, new_body, new_hash, memory_type],
194        )?
195    };
196
197    if affected == 0 {
198        return Err(AppError::Conflict(
199            "optimistic lock conflict: memory was modified by another process".to_string(),
200        ));
201    }
202
203    // v1.0.84 (ADR-0042): backend discriminator for the JSON envelope.
204    // Populated only when re-embedding actually ran; stays None for
205    // description-only or metadata-only edits.
206    let mut backend_invoked: Option<&'static str> = None;
207
208    if body_changed || type_changed || args.force_reembed {
209        output::emit_progress_i18n(
210            "Re-computing embedding for edited body...",
211            crate::i18n::validation::runtime_pt::edit_recomputing_embedding(),
212        );
213        // v1.0.82 (GAP-003): forward --llm-backend to embed_with_fallback.
214        // v1.0.84 (ADR-0042): tuple (Vec<f32>, LlmBackendKind) — extrai o
215        // backend que efetivamente rodou para popular `backend_invoked`.
216        let skip_embed = crate::embedder::should_skip_embedding_on_failure();
217        let embedding: Option<(Vec<f32>, &'static str)> = match crate::embedder::embed_passage_with_choice(
218            &paths.models,
219            &new_body,
220            Some(llm_backend),
221        ) {
222            Ok((emb, kind)) => Some((emb, kind.as_str())),
223            Err(AppError::Validation(msg)) => return Err(AppError::Validation(msg)),
224            Err(e) if skip_embed => {
225                tracing::warn!(error = %e, "edit: embedding failed; --skip-embedding-on-failure active, persisting without embedding");
226                None
227            }
228            Err(e) => return Err(e),
229        };
230        if let Some((ref emb, kind)) = embedding {
231            backend_invoked = Some(kind);
232            let snippet: String = new_body.chars().take(300).collect();
233            memories::upsert_vec(
234                &tx,
235                memory_id,
236                &namespace,
237                &memory_type,
238                emb,
239                &name,
240                &snippet,
241            )?;
242        }
243    }
244
245    let next_v = versions::next_version(&tx, memory_id)?;
246
247    versions::insert_version(
248        &tx,
249        memory_id,
250        next_v,
251        &name,
252        &memory_type,
253        &new_description,
254        &new_body,
255        &metadata,
256        None,
257        "edit",
258    )?;
259
260    memories::sync_fts_after_update(
261        &tx,
262        memory_id,
263        &row.name,
264        &row.description,
265        &row.body,
266        &row.name,
267        &new_description,
268        &new_body,
269    )?;
270
271    tx.commit()?;
272
273    conn.execute_batch("PRAGMA wal_checkpoint(TRUNCATE);")?;
274
275    output::emit_json(&EditResponse {
276        memory_id,
277        name,
278        action: "updated".to_string(),
279        version: next_v,
280        elapsed_ms: inicio.elapsed().as_millis() as u64,
281        backend_invoked,
282    })?;
283
284    Ok(())
285}
286
#[cfg(test)]
mod tests {
    use super::*;

    /// Minimal parser wrapper so `EditArgs` can be exercised through clap
    /// without the rest of the CLI.
    #[derive(clap::Parser)]
    struct TestCli {
        #[command(flatten)]
        args: EditArgs,
    }

    #[test]
    fn type_flag_is_a_visible_alias_of_memory_type() {
        // G47: COOKBOOK, README and llms.txt promise `edit --type`; the flag
        // was only reachable as --memory-type, breaking the documented CLI.
        use clap::Parser;
        let cli = TestCli::try_parse_from(["edit", "--name", "m", "--type", "decision"])
            .expect("--type must parse as an alias of --memory-type");
        assert!(cli.args.memory_type.is_some());
        let cli = TestCli::try_parse_from(["edit", "--name", "m", "--memory-type", "decision"])
            .expect("--memory-type must keep working");
        assert!(cli.args.memory_type.is_some());
    }

    #[test]
    fn body_sources_are_mutually_exclusive() {
        // Each pair of body sources is declared with `conflicts_with_all`.
        use clap::Parser;
        assert!(TestCli::try_parse_from([
            "edit", "--name", "m", "--body", "x", "--body-file", "f.md"
        ])
        .is_err());
        assert!(
            TestCli::try_parse_from(["edit", "--name", "m", "--body", "x", "--body-stdin"])
                .is_err()
        );
        assert!(TestCli::try_parse_from([
            "edit", "--name", "m", "--body-file", "f.md", "--body-stdin"
        ])
        .is_err());
    }

    #[test]
    fn positional_name_parses_and_conflicts_with_name_flag() {
        use clap::Parser;
        let cli = TestCli::try_parse_from(["edit", "m"]).expect("positional name must parse");
        assert_eq!(cli.args.name_positional.as_deref(), Some("m"));
        assert!(cli.args.name.is_none());
        assert!(
            TestCli::try_parse_from(["edit", "m", "--name", "n"]).is_err(),
            "positional name and --name must not be combined"
        );
    }

    #[test]
    fn llm_parallelism_defaults_to_four_and_rejects_out_of_range() {
        use clap::Parser;
        let cli = TestCli::try_parse_from(["edit", "--name", "m"]).expect("defaults must parse");
        assert_eq!(cli.args.llm_parallelism, 4);
        assert!(
            TestCli::try_parse_from(["edit", "--name", "m", "--llm-parallelism", "0"]).is_err()
        );
        assert!(
            TestCli::try_parse_from(["edit", "--name", "m", "--llm-parallelism", "33"]).is_err()
        );
    }

    #[test]
    fn edit_response_serializes_all_fields() {
        let resp = EditResponse {
            memory_id: 42,
            name: "my-memory".to_string(),
            action: "updated".to_string(),
            version: 3,
            elapsed_ms: 7,
            backend_invoked: None,
        };
        let json = serde_json::to_value(&resp).expect("serialization failed");
        assert_eq!(json["memory_id"], 42i64);
        assert_eq!(json["name"], "my-memory");
        assert_eq!(json["action"], "updated");
        assert_eq!(json["version"], 3i64);
        assert!(json["elapsed_ms"].is_number());
        // `skip_serializing_if` must drop the key entirely rather than emit null.
        assert!(
            json.get("backend_invoked").is_none(),
            "backend_invoked must be absent when no backend ran"
        );
    }

    #[test]
    fn edit_response_includes_backend_when_invoked() {
        let resp = EditResponse {
            memory_id: 1,
            name: "n".to_string(),
            action: "updated".to_string(),
            version: 2,
            elapsed_ms: 0,
            backend_invoked: Some("claude"),
        };
        let json = serde_json::to_value(&resp).expect("serialization failed");
        assert_eq!(json["backend_invoked"], "claude");
    }

    #[test]
    fn edit_response_action_contains_updated() {
        let resp = EditResponse {
            memory_id: 1,
            name: "n".to_string(),
            action: "updated".to_string(),
            version: 1,
            elapsed_ms: 0,
            backend_invoked: None,
        };
        assert_eq!(
            resp.action, "updated",
            "action must be 'updated' for successful edits"
        );
    }

    // NOTE(review): the two tests below only check that a string built to be
    // one byte over the limit is over the limit; they never call `run`, so
    // they do not verify that an error is returned. Covering that path needs
    // a database-backed test.
    #[test]
    fn edit_body_exceeds_limit_returns_error() {
        let limit = crate::constants::MAX_MEMORY_BODY_LEN;
        let large_body: String = "a".repeat(limit + 1);
        assert!(
            large_body.len() > limit,
            "body above limit must have length > MAX_MEMORY_BODY_LEN"
        );
    }

    #[test]
    fn edit_description_exceeds_limit_returns_error() {
        let limit = crate::constants::MAX_MEMORY_DESCRIPTION_LEN;
        let large_desc: String = "d".repeat(limit + 1);
        assert!(
            large_desc.len() > limit,
            "description above limit must have length > MAX_MEMORY_DESCRIPTION_LEN"
        );
    }
}
363}