1use anyhow::Context;
2use rusqlite::Connection;
3use std::collections::HashSet;
4use std::path::Path;
5
/// A single schema migration step.
///
/// `apply_migrations` runs `sql` when `version` is not yet present in the
/// `schema_migrations` table and records `version` there afterwards.
struct Migration {
    /// Value stored in `schema_migrations.version` once the step has run.
    version: i64,
    /// SQL batch handed to `execute_batch` for this step.
    sql: &'static str,
}
13
/// Schema migration v1: the base tables (`tasks`, `events_index`,
/// `decisions`, `evidence`, `task_pack_cache`), two lookup indexes, and the
/// `search_fts` FTS5 virtual table.
///
/// Every statement is guarded by `IF NOT EXISTS`.
const MIGRATION_001: &str = r#"
CREATE TABLE IF NOT EXISTS tasks (
    task_id TEXT PRIMARY KEY,
    title TEXT NOT NULL,
    status TEXT NOT NULL,
    project_hash TEXT NOT NULL,
    opened_at TEXT NOT NULL,
    closed_at TEXT,
    last_event_at TEXT NOT NULL
);
CREATE INDEX IF NOT EXISTS idx_tasks_project ON tasks(project_hash, last_event_at DESC);

CREATE TABLE IF NOT EXISTS events_index (
    event_id TEXT PRIMARY KEY,
    task_id TEXT NOT NULL,
    type TEXT NOT NULL,
    timestamp TEXT NOT NULL,
    confidence REAL,
    status TEXT NOT NULL
);
CREATE INDEX IF NOT EXISTS idx_events_task_time ON events_index(task_id, timestamp DESC);

CREATE TABLE IF NOT EXISTS decisions (
    decision_id TEXT PRIMARY KEY,
    task_id TEXT NOT NULL,
    text TEXT NOT NULL,
    status TEXT NOT NULL,
    superseded_by TEXT
);

CREATE TABLE IF NOT EXISTS evidence (
    evidence_id TEXT PRIMARY KEY,
    task_id TEXT NOT NULL,
    text TEXT NOT NULL,
    strength TEXT NOT NULL,
    refers_to_decision_id TEXT
);

CREATE TABLE IF NOT EXISTS task_pack_cache (
    task_id TEXT NOT NULL,
    mode TEXT NOT NULL,
    text TEXT NOT NULL,
    generated_at TEXT NOT NULL,
    source_event_count INTEGER NOT NULL,
    PRIMARY KEY (task_id, mode)
);

CREATE VIRTUAL TABLE IF NOT EXISTS search_fts USING fts5(
    task_id UNINDEXED,
    event_id UNINDEXED,
    text,
    type
);
"#;
68
/// Schema migration v2: the `index_state` table, which stores one
/// `last_indexed_event_id` per `project_hash`.
const MIGRATION_002: &str = r#"
CREATE TABLE IF NOT EXISTS index_state (
    project_hash TEXT PRIMARY KEY,
    last_indexed_event_id TEXT NOT NULL,
    updated_at TEXT NOT NULL
);
"#;
80
81const MIGRATIONS: &[Migration] = &[
84 Migration {
85 version: 1,
86 sql: MIGRATION_001,
87 },
88 Migration {
89 version: 2,
90 sql: MIGRATION_002,
91 },
92];
93
94fn apply_migrations(conn: &Connection) -> anyhow::Result<()> {
95 conn.execute_batch(
96 "CREATE TABLE IF NOT EXISTS schema_migrations (
97 version INTEGER PRIMARY KEY,
98 applied_at TEXT NOT NULL
99 )",
100 )
101 .context("create schema_migrations table")?;
102
103 let applied: HashSet<i64> = {
104 let mut stmt = conn
105 .prepare("SELECT version FROM schema_migrations")
106 .context("select applied versions")?;
107 let rows = stmt
108 .query_map([], |r| r.get::<_, i64>(0))
109 .context("iterate schema_migrations")?;
110 rows.collect::<rusqlite::Result<HashSet<_>>>()
111 .context("collect applied versions")?
112 };
113
114 for migration in MIGRATIONS {
115 if applied.contains(&migration.version) {
116 continue;
117 }
118 conn.execute_batch(migration.sql)
119 .with_context(|| format!("apply schema migration v{:03}", migration.version))?;
120 conn.execute(
121 "INSERT INTO schema_migrations(version, applied_at) VALUES (?1, ?2)",
122 rusqlite::params![
123 migration.version,
124 chrono::Utc::now().to_rfc3339_opts(chrono::SecondsFormat::Millis, true)
125 ],
126 )
127 .with_context(|| {
128 format!(
129 "record schema migration v{:03} as applied",
130 migration.version
131 )
132 })?;
133 }
134 Ok(())
135}
136
137use crate::event::{Event, EventType};
138
139pub fn upsert_task_from_event(
140 conn: &Connection,
141 event: &Event,
142 project_hash: &str,
143) -> anyhow::Result<()> {
144 match event.event_type {
145 EventType::Open => {
146 let title = event
147 .meta
148 .get("title")
149 .and_then(|v| v.as_str())
150 .unwrap_or(&event.text)
151 .to_string();
152 conn.execute(
153 "INSERT INTO tasks(task_id, title, status, project_hash, opened_at, last_event_at)
154 VALUES (?1, ?2, 'open', ?3, ?4, ?4)
155 ON CONFLICT(task_id) DO UPDATE SET last_event_at = ?4",
156 rusqlite::params![event.task_id, title, project_hash, event.timestamp],
157 )?;
158 }
159 EventType::Close => {
160 conn.execute(
161 "UPDATE tasks SET status='closed', closed_at=?2, last_event_at=?2 WHERE task_id=?1",
162 rusqlite::params![event.task_id, event.timestamp],
163 )?;
164 }
165 EventType::Reopen => {
166 conn.execute(
167 "UPDATE tasks SET status='open', closed_at=NULL, last_event_at=?2 WHERE task_id=?1",
168 rusqlite::params![event.task_id, event.timestamp],
169 )?;
170 }
171 _ => {
172 conn.execute(
173 "UPDATE tasks SET last_event_at=?2 WHERE task_id=?1",
174 rusqlite::params![event.task_id, event.timestamp],
175 )?;
176 }
177 }
178 Ok(())
179}
180
181use std::io::BufRead;
182
183pub fn list_all_projects(state_dir: impl AsRef<Path>) -> anyhow::Result<Vec<String>> {
184 let dir = state_dir.as_ref();
185 if !dir.exists() {
186 return Ok(vec![]);
187 }
188 let mut out = Vec::new();
189 for entry in std::fs::read_dir(dir)? {
190 let entry = entry?;
191 let path = entry.path();
192 if path.extension().and_then(|e| e.to_str()) == Some("sqlite") {
193 if let Some(stem) = path.file_stem().and_then(|s| s.to_str()) {
194 out.push(stem.to_string());
195 }
196 }
197 }
198 Ok(out)
199}
200
201pub fn rebuild_state(
202 conn: &Connection,
203 jsonl_path: impl AsRef<Path>,
204 project_hash: &str,
205) -> anyhow::Result<usize> {
206 let f = std::fs::File::open(&jsonl_path)
207 .with_context(|| format!("open {:?}", jsonl_path.as_ref()))?;
208 let reader = std::io::BufReader::new(f);
209
210 let tx = conn.unchecked_transaction()?;
211 let mut count = 0;
212 let mut last_event_id: Option<String> = None;
213 for (i, line) in reader.lines().enumerate() {
214 let line = line.with_context(|| format!("read line {i}"))?;
215 if line.trim().is_empty() {
216 continue;
217 }
218 let event: Event = match serde_json::from_str(&line) {
222 Ok(e) => e,
223 Err(err) => {
224 tracing::warn!(
225 line_number = i + 1,
226 error = %err,
227 "skipping malformed JSONL line in rebuild_state"
228 );
229 continue;
230 }
231 };
232 upsert_task_from_event(&tx, &event, project_hash)?;
233 index_event(&tx, &event)?;
234 last_event_id = Some(event.event_id.clone());
235 count += 1;
236 }
237 if let Some(eid) = last_event_id.as_deref() {
238 record_last_indexed(&tx, project_hash, eid)?;
239 }
240 tx.commit()?;
241 Ok(count)
242}
243
244pub fn task_exists(conn: &Connection, task_id: &str) -> anyhow::Result<bool> {
249 let count: i64 = conn.query_row(
250 "SELECT COUNT(*) FROM tasks WHERE task_id = ?1",
251 rusqlite::params![task_id],
252 |r| r.get(0),
253 )?;
254 Ok(count > 0)
255}
256
257fn last_indexed_event_id(conn: &Connection, project_hash: &str) -> anyhow::Result<Option<String>> {
261 let mut stmt =
262 conn.prepare("SELECT last_indexed_event_id FROM index_state WHERE project_hash = ?1")?;
263 let mut rows = stmt.query(rusqlite::params![project_hash])?;
264 if let Some(row) = rows.next()? {
265 Ok(Some(row.get::<_, String>(0)?))
266 } else {
267 Ok(None)
268 }
269}
270
271fn record_last_indexed(
272 conn: &Connection,
273 project_hash: &str,
274 event_id: &str,
275) -> anyhow::Result<()> {
276 conn.execute(
277 "INSERT INTO index_state(project_hash, last_indexed_event_id, updated_at)
278 VALUES (?1, ?2, ?3)
279 ON CONFLICT(project_hash) DO UPDATE SET
280 last_indexed_event_id = excluded.last_indexed_event_id,
281 updated_at = excluded.updated_at",
282 rusqlite::params![
283 project_hash,
284 event_id,
285 chrono::Utc::now().to_rfc3339_opts(chrono::SecondsFormat::Millis, true)
286 ],
287 )?;
288 Ok(())
289}
290
291pub fn ingest_new_events(
301 conn: &Connection,
302 jsonl_path: impl AsRef<Path>,
303 project_hash: &str,
304) -> anyhow::Result<usize> {
305 let marker = match last_indexed_event_id(conn, project_hash)? {
306 Some(id) => id,
307 None => return rebuild_state(conn, jsonl_path, project_hash),
308 };
309
310 let f = std::fs::File::open(&jsonl_path)
311 .with_context(|| format!("open {:?}", jsonl_path.as_ref()))?;
312 let reader = std::io::BufReader::new(f);
313
314 let tx = conn.unchecked_transaction()?;
318 let mut found_marker = false;
319 let mut count = 0;
320 let mut last_event_id: Option<String> = None;
321 for (i, line) in reader.lines().enumerate() {
322 let line = line.with_context(|| format!("read line {i}"))?;
323 if line.trim().is_empty() {
324 continue;
325 }
326 let event: Event = match serde_json::from_str(&line) {
327 Ok(e) => e,
328 Err(err) => {
329 tracing::warn!(
330 line_number = i + 1,
331 error = %err,
332 "skipping malformed JSONL line in ingest_new_events"
333 );
334 continue;
335 }
336 };
337 if !found_marker {
338 if event.event_id == marker {
339 found_marker = true;
340 }
341 continue;
342 }
343 upsert_task_from_event(&tx, &event, project_hash)?;
344 index_event(&tx, &event)?;
345 last_event_id = Some(event.event_id.clone());
346 count += 1;
347 }
348
349 if !found_marker {
350 drop(tx);
352 tracing::warn!(
353 project_hash = project_hash,
354 marker = marker.as_str(),
355 "last_indexed_event_id not found in JSONL — falling back to full rebuild"
356 );
357 return rebuild_state(conn, jsonl_path, project_hash);
358 }
359
360 if let Some(eid) = last_event_id.as_deref() {
361 record_last_indexed(&tx, project_hash, eid)?;
362 }
363 tx.commit()?;
364 Ok(count)
365}
366
367pub fn index_event(conn: &Connection, event: &Event) -> anyhow::Result<()> {
368 let type_str = serde_json::to_value(event.event_type)?
369 .as_str()
370 .unwrap()
371 .to_string();
372 let status_str = serde_json::to_value(event.status)?
373 .as_str()
374 .unwrap()
375 .to_string();
376 conn.execute(
377 "INSERT OR REPLACE INTO events_index(event_id, task_id, type, timestamp, confidence, status)
378 VALUES (?1, ?2, ?3, ?4, ?5, ?6)",
379 rusqlite::params![
380 event.event_id, event.task_id, type_str,
381 event.timestamp, event.confidence, status_str
382 ],
383 )?;
384 conn.execute(
386 "DELETE FROM search_fts WHERE event_id=?1",
387 rusqlite::params![event.event_id],
388 )?;
389 conn.execute(
390 "INSERT INTO search_fts(task_id, event_id, text, type) VALUES (?1, ?2, ?3, ?4)",
391 rusqlite::params![event.task_id, event.event_id, event.text, type_str],
392 )?;
393
394 if event.event_type == EventType::Decision {
395 conn.execute(
396 "INSERT OR REPLACE INTO decisions(decision_id, task_id, text, status)
397 VALUES (?1, ?2, ?3, 'active')",
398 rusqlite::params![event.event_id, event.task_id, event.text],
399 )?;
400 }
401
402 if event.event_type == EventType::Supersede {
403 if let Some(target) = &event.supersedes {
404 conn.execute(
405 "UPDATE decisions SET status='superseded', superseded_by=?1 WHERE decision_id=?2",
406 rusqlite::params![event.event_id, target],
407 )?;
408 }
409 }
410
411 if event.event_type == EventType::Evidence {
412 let strength_str = event
413 .evidence_strength
414 .map(|s| {
415 serde_json::to_value(s)
416 .unwrap()
417 .as_str()
418 .unwrap()
419 .to_string()
420 })
421 .unwrap_or_else(|| "medium".into());
422 conn.execute(
423 "INSERT OR REPLACE INTO evidence(evidence_id, task_id, text, strength)
424 VALUES (?1, ?2, ?3, ?4)",
425 rusqlite::params![event.event_id, event.task_id, event.text, strength_str],
426 )?;
427 }
428
429 conn.execute(
431 "DELETE FROM task_pack_cache WHERE task_id=?1",
432 rusqlite::params![event.task_id],
433 )?;
434
435 Ok(())
436}
437
438pub fn open(path: impl AsRef<Path>) -> anyhow::Result<Connection> {
439 if let Some(parent) = path.as_ref().parent() {
440 std::fs::create_dir_all(parent).with_context(|| format!("create dir {parent:?}"))?;
441 }
442 let conn =
443 Connection::open(&path).with_context(|| format!("open SQLite at {:?}", path.as_ref()))?;
444 conn.execute_batch("PRAGMA journal_mode=WAL; PRAGMA foreign_keys=ON;")?;
445 apply_migrations(&conn).context("apply schema migrations")?;
446 Ok(conn)
447}
448
/// One task as returned by `list_tasks_by_project`.
#[derive(Debug, Clone)]
pub struct TaskRow {
    /// Value of `tasks.task_id`.
    pub task_id: String,
    /// Value of `tasks.title`.
    pub title: String,
    /// Value of `tasks.status`.
    pub status: String,
    /// Value of `tasks.last_event_at`.
    pub last_event_at: String,
    /// Number of `events_index` rows for this task (0 when there are none).
    pub event_count: usize,
}
460
461pub fn list_tasks_by_project(
465 conn: &Connection,
466 project_hash: &str,
467) -> anyhow::Result<Vec<TaskRow>> {
468 let mut stmt = conn.prepare(
469 "SELECT t.task_id, t.title, t.status, t.last_event_at,
470 COALESCE(c.cnt, 0) AS event_count
471 FROM tasks t
472 LEFT JOIN (
473 SELECT task_id, COUNT(*) AS cnt FROM events_index GROUP BY task_id
474 ) c ON c.task_id = t.task_id
475 WHERE t.project_hash = ?1
476 ORDER BY (t.status = 'open') DESC, t.last_event_at DESC",
477 )?;
478 let rows = stmt
479 .query_map(rusqlite::params![project_hash], |r| {
480 Ok(TaskRow {
481 task_id: r.get::<_, String>(0)?,
482 title: r.get::<_, String>(1)?,
483 status: r.get::<_, String>(2)?,
484 last_event_at: r.get::<_, String>(3)?,
485 event_count: r.get::<_, i64>(4)? as usize,
486 })
487 })?
488 .collect::<Result<Vec<_>, _>>()?;
489 Ok(rows)
490}
491
#[cfg(test)]
mod tests {
    use super::*;
    use crate::event::{Author, Event, EventType, EvidenceStrength, Source};
    use tempfile::TempDir;

    /// Opens a fresh database in its own temporary directory.
    ///
    /// The `TempDir` is returned so the directory outlives the connection.
    fn fresh_db() -> (TempDir, Connection) {
        let dir = TempDir::new().unwrap();
        let conn = open(dir.path().join("s.sqlite")).unwrap();
        (dir, conn)
    }

    /// Builds a user-authored `Open` event whose `meta.title` is `title`.
    fn make_open_event(task_id: &str, title: &str) -> Event {
        let mut e = Event::new(
            task_id,
            EventType::Open,
            Author::User,
            Source::Cli,
            "x".into(),
        );
        e.meta = serde_json::json!({ "title": title });
        e
    }

    /// Builds an agent-authored chat event of the given type.
    fn make_agent_event(task_id: &str, event_type: EventType, text: &str) -> Event {
        Event::new(task_id, event_type, Author::Agent, Source::Chat, text.into())
    }

    /// Applies `event` to both the task table and the index tables.
    fn store(conn: &Connection, event: &Event, project_hash: &str) {
        upsert_task_from_event(conn, event, project_hash).unwrap();
        index_event(conn, event).unwrap();
    }

    /// Writes each event as one JSON line to `f`.
    fn write_events<'a>(f: &mut std::fs::File, events: impl IntoIterator<Item = &'a Event>) {
        use std::io::Write;
        for e in events {
            writeln!(f, "{}", serde_json::to_string(e).unwrap()).unwrap();
        }
    }

    /// Runs a parameterless query that yields a single integer.
    fn count(conn: &Connection, sql: &str) -> i64 {
        conn.query_row(sql, [], |r| r.get(0)).unwrap()
    }

    /// Reads the stored marker for `project_hash` from `index_state`.
    fn stored_marker(conn: &Connection, project_hash: &str) -> String {
        conn.query_row(
            "SELECT last_indexed_event_id FROM index_state WHERE project_hash=?1",
            rusqlite::params![project_hash],
            |r| r.get(0),
        )
        .unwrap()
    }

    #[test]
    fn task_exists_returns_true_for_known_id_false_otherwise() {
        let (_dir, conn) = fresh_db();

        assert!(!task_exists(&conn, "tj-nope").unwrap());

        store(&conn, &make_open_event("tj-yes", "Hello"), "feedfacefeedface");

        assert!(task_exists(&conn, "tj-yes").unwrap());
        assert!(!task_exists(&conn, "tj-nope").unwrap());
    }

    #[test]
    fn fresh_db_runs_all_migrations() {
        let (_dir, conn) = fresh_db();

        let applied: Vec<i64> = conn
            .prepare("SELECT version FROM schema_migrations ORDER BY version")
            .unwrap()
            .query_map([], |r| r.get::<_, i64>(0))
            .unwrap()
            .collect::<Result<_, _>>()
            .unwrap();
        assert_eq!(
            applied,
            (1..=MIGRATIONS.len() as i64).collect::<Vec<_>>(),
            "every declared migration must be recorded"
        );
    }

    #[test]
    fn apply_migrations_is_idempotent_across_reopens() {
        let d = TempDir::new().unwrap();
        let p = d.path().join("state.sqlite");
        let _ = open(&p).unwrap();
        let _ = open(&p).unwrap();

        let conn = open(&p).unwrap();
        assert_eq!(
            count(&conn, "SELECT COUNT(*) FROM schema_migrations"),
            MIGRATIONS.len() as i64,
            "schema_migrations must contain exactly one row per declared migration after repeated opens"
        );
    }

    #[test]
    fn open_creates_all_tables() {
        let (_dir, conn) = fresh_db();

        // Virtual tables are listed in sqlite_master with type 'table'.
        let names: Vec<String> = conn
            .prepare("SELECT name FROM sqlite_master WHERE type='table' ORDER BY name")
            .unwrap()
            .query_map([], |r| r.get::<_, String>(0))
            .unwrap()
            .collect::<Result<_, _>>()
            .unwrap();

        for required in [
            "decisions",
            "events_index",
            "evidence",
            "index_state",
            "schema_migrations",
            "search_fts",
            "task_pack_cache",
            "tasks",
        ] {
            assert!(
                names.iter().any(|n| n == required),
                "missing table {required}, have {names:?}"
            );
        }
    }

    #[test]
    fn open_is_idempotent() {
        let d = TempDir::new().unwrap();
        let p = d.path().join("state.sqlite");
        let _ = open(&p).unwrap();
        let _ = open(&p).unwrap();
    }

    #[test]
    fn index_event_projects_evidence() {
        let (_dir, conn) = fresh_db();
        store(&conn, &make_open_event("tj-e", "T"), "feedface");

        let mut ev = make_agent_event(
            "tj-e",
            EventType::Evidence,
            "Hook startup measured at 12ms",
        );
        ev.evidence_strength = Some(EvidenceStrength::Strong);
        store(&conn, &ev, "feedface");

        let (text, strength): (String, String) = conn
            .query_row(
                "SELECT text, strength FROM evidence WHERE task_id=?1",
                rusqlite::params!["tj-e"],
                |r| Ok((r.get(0)?, r.get(1)?)),
            )
            .unwrap();
        assert!(text.contains("12ms"));
        assert_eq!(strength, "strong");
    }

    #[test]
    fn supersede_event_marks_decision_superseded() {
        let (_dir, conn) = fresh_db();
        store(&conn, &make_open_event("tj-s", "T"), "feedface");

        let dec = make_agent_event("tj-s", EventType::Decision, "Use TS");
        store(&conn, &dec, "feedface");

        let mut sup = make_agent_event(
            "tj-s",
            EventType::Supersede,
            "Replaced by Rust decision",
        );
        sup.supersedes = Some(dec.event_id.clone());
        store(&conn, &sup, "feedface");

        let (status, by): (String, Option<String>) = conn
            .query_row(
                "SELECT status, superseded_by FROM decisions WHERE decision_id=?1",
                rusqlite::params![dec.event_id],
                |r| Ok((r.get(0)?, r.get(1)?)),
            )
            .unwrap();
        assert_eq!(status, "superseded");
        assert_eq!(by.as_deref(), Some(sup.event_id.as_str()));
    }

    #[test]
    fn index_event_projects_decision_to_decisions_table() {
        let (_dir, conn) = fresh_db();
        store(&conn, &make_open_event("tj-d", "T"), "feedface");

        let dec = make_agent_event("tj-d", EventType::Decision, "Adopt Rust");
        store(&conn, &dec, "feedface");

        let (id, text, status): (String, String, String) = conn
            .query_row(
                "SELECT decision_id, text, status FROM decisions WHERE task_id=?1",
                rusqlite::params!["tj-d"],
                |r| Ok((r.get(0)?, r.get(1)?, r.get(2)?)),
            )
            .unwrap();
        assert_eq!(id, dec.event_id);
        assert_eq!(text, "Adopt Rust");
        assert_eq!(status, "active");
    }

    #[test]
    fn index_event_is_idempotent_no_search_fts_duplicates() {
        let (_dir, conn) = fresh_db();
        let open_e = make_open_event("tj-id", "Idempotent");
        upsert_task_from_event(&conn, &open_e, "feedface").unwrap();

        for _ in 0..3 {
            index_event(&conn, &open_e).unwrap();
        }

        let n: i64 = conn
            .query_row(
                "SELECT COUNT(*) FROM search_fts WHERE event_id=?1",
                rusqlite::params![open_e.event_id],
                |r| r.get(0),
            )
            .unwrap();
        assert_eq!(n, 1, "search_fts must hold exactly one row per event_id");
    }

    #[test]
    fn list_all_projects_returns_hashes_from_state_dir() {
        use std::fs::File;
        let d = TempDir::new().unwrap();
        let state_dir = d.path().join("state");
        std::fs::create_dir_all(&state_dir).unwrap();
        File::create(state_dir.join("aaaa1111aaaa1111.sqlite")).unwrap();
        File::create(state_dir.join("bbbb2222bbbb2222.sqlite")).unwrap();
        File::create(state_dir.join("not-a-project.txt")).unwrap();

        let mut hashes = list_all_projects(&state_dir).unwrap();
        hashes.sort();
        assert_eq!(hashes, vec!["aaaa1111aaaa1111", "bbbb2222bbbb2222"]);
    }

    #[test]
    fn ingest_new_events_picks_up_only_new_lines() {
        let d = TempDir::new().unwrap();
        let jsonl = d.path().join("events.jsonl");
        let db = d.path().join("s.sqlite");
        let project = "deadbeefdeadbeef";

        let e1 = make_open_event("tj-i1", "first");
        let e2 = make_open_event("tj-i2", "second");
        let e3 = make_open_event("tj-i3", "third");

        let mut f = std::fs::File::create(&jsonl).unwrap();
        write_events(&mut f, [&e1, &e2, &e3]);
        drop(f);

        let conn = open(&db).unwrap();
        // No marker yet, so the first call indexes the whole file.
        let n_first = ingest_new_events(&conn, &jsonl, project).unwrap();
        assert_eq!(n_first, 3);

        let e4 = make_open_event("tj-i4", "fourth");
        let e5 = make_open_event("tj-i5", "fifth");
        let mut f = std::fs::OpenOptions::new()
            .append(true)
            .open(&jsonl)
            .unwrap();
        write_events(&mut f, [&e4, &e5]);
        drop(f);

        let n_second = ingest_new_events(&conn, &jsonl, project).unwrap();
        assert_eq!(n_second, 2, "incremental ingest must read only the tail");

        assert_eq!(count(&conn, "SELECT COUNT(*) FROM events_index"), 5);
        assert_eq!(stored_marker(&conn, project), e5.event_id);
    }

    #[test]
    fn ingest_new_events_falls_back_to_full_rebuild_when_marker_vanishes() {
        let d = TempDir::new().unwrap();
        let jsonl = d.path().join("events.jsonl");
        let db = d.path().join("s.sqlite");
        let project = "feedfacefeedface";

        let e1 = make_open_event("tj-r1", "first");
        let mut f = std::fs::File::create(&jsonl).unwrap();
        write_events(&mut f, [&e1]);
        drop(f);

        let conn = open(&db).unwrap();
        ingest_new_events(&conn, &jsonl, project).unwrap();

        // Truncate and rewrite the log so the stored marker no longer appears.
        let e2 = make_open_event("tj-r2", "after-corruption");
        let e3 = make_open_event("tj-r3", "after-corruption-2");
        let mut f = std::fs::File::create(&jsonl).unwrap();
        write_events(&mut f, [&e2, &e3]);
        drop(f);

        let n = ingest_new_events(&conn, &jsonl, project).unwrap();
        assert_eq!(n, 2, "missing marker must trigger full rebuild");
        assert_eq!(
            stored_marker(&conn, project),
            e3.event_id,
            "full rebuild must re-record the marker"
        );
    }

    #[test]
    fn rebuild_state_and_ingest_new_events_produce_same_state() {
        let d = TempDir::new().unwrap();
        let jsonl_a = d.path().join("a.jsonl");
        let jsonl_b = d.path().join("b.jsonl");
        let db_a = d.path().join("a.sqlite");
        let db_b = d.path().join("b.sqlite");

        let events: Vec<_> = (0..5)
            .map(|i| make_open_event(&format!("tj-eq{i}"), &format!("title {i}")))
            .collect();
        for path in [&jsonl_a, &jsonl_b] {
            let mut f = std::fs::File::create(path).unwrap();
            write_events(&mut f, &events);
        }

        let conn_a = open(&db_a).unwrap();
        let n_a = rebuild_state(&conn_a, &jsonl_a, "abcd1234abcd1234").unwrap();

        let conn_b = open(&db_b).unwrap();
        let n_b = ingest_new_events(&conn_b, &jsonl_b, "abcd1234abcd1234").unwrap();

        assert_eq!(n_a, n_b);
        assert_eq!(n_a, 5);

        for table in ["tasks", "events_index"] {
            let q = format!("SELECT COUNT(*) FROM {table}");
            assert_eq!(
                count(&conn_a, &q),
                count(&conn_b, &q),
                "row count mismatch in {table}"
            );
        }
    }

    #[test]
    fn rebuild_state_skips_malformed_jsonl_lines() {
        use std::io::Write;
        let d = TempDir::new().unwrap();
        let events_path = d.path().join("events.jsonl");
        let db_path = d.path().join("s.sqlite");

        let e1 = make_open_event("tj-skip", "Skip test");
        let e3 = make_agent_event("tj-skip", EventType::Decision, "Adopt Rust");

        let mut f = std::fs::File::create(&events_path).unwrap();
        write_events(&mut f, [&e1]);
        // Not JSON at all.
        writeln!(f, "this is not a json event line").unwrap();
        // Valid JSON, but not an event.
        writeln!(f, "{{\"foo\": 1}}").unwrap();
        write_events(&mut f, [&e3]);
        drop(f);

        let conn = open(&db_path).unwrap();
        let n = rebuild_state(&conn, &events_path, "deadbeefdeadbeef")
            .expect("rebuild_state must succeed despite malformed lines");
        assert_eq!(
            n, 2,
            "expected 2 valid events indexed (2 malformed skipped)"
        );

        assert_eq!(count(&conn, "SELECT COUNT(*) FROM events_index"), 2);
    }

    #[test]
    fn rebuild_state_reads_jsonl_and_populates_db() {
        let d = TempDir::new().unwrap();
        let events_path = d.path().join("events.jsonl");
        let db_path = d.path().join("s.sqlite");

        let e1 = make_open_event("tj-9", "Nine");
        let e2 = make_agent_event("tj-9", EventType::Decision, "Adopt Rust");
        let mut f = std::fs::File::create(&events_path).unwrap();
        write_events(&mut f, [&e1, &e2]);
        drop(f);

        let conn = open(&db_path).unwrap();
        let n = rebuild_state(&conn, &events_path, "deadbeefdeadbeef").unwrap();
        assert_eq!(n, 2);

        assert_eq!(count(&conn, "SELECT COUNT(*) FROM tasks"), 1);
        assert_eq!(count(&conn, "SELECT COUNT(*) FROM events_index"), 2);
    }

    #[test]
    fn index_event_writes_index_and_fts() {
        let (_dir, conn) = fresh_db();
        store(&conn, &make_open_event("tj-1", "Title"), "deadbeefdeadbeef");

        let mut decision = make_agent_event("tj-1", EventType::Decision, "Adopt Rust");
        decision.confidence = Some(0.92);
        store(&conn, &decision, "deadbeefdeadbeef");

        let indexed: i64 = conn
            .query_row(
                "SELECT COUNT(*) FROM events_index WHERE task_id=?1",
                rusqlite::params!["tj-1"],
                |r| r.get(0),
            )
            .unwrap();
        assert_eq!(indexed, 2);

        let mut stmt = conn
            .prepare("SELECT event_id FROM search_fts WHERE search_fts MATCH ?1")
            .unwrap();
        let hits: Vec<String> = stmt
            .query_map(rusqlite::params!["Rust"], |r| r.get::<_, String>(0))
            .unwrap()
            .collect::<Result<Vec<_>, _>>()
            .unwrap();
        assert_eq!(hits.len(), 1);
        assert_eq!(hits[0], decision.event_id);
    }

    #[test]
    fn upsert_task_from_open_event_inserts_row() {
        let (_dir, conn) = fresh_db();

        let e = make_open_event("tj-7f3a", "Add OAuth login");
        upsert_task_from_event(&conn, &e, "abcd1234abcd1234").unwrap();

        let (id, title, status): (String, String, String) = conn
            .query_row(
                "SELECT task_id, title, status FROM tasks WHERE task_id = ?1",
                ["tj-7f3a"],
                |r| Ok((r.get(0)?, r.get(1)?, r.get(2)?)),
            )
            .unwrap();

        assert_eq!(id, "tj-7f3a");
        assert_eq!(title, "Add OAuth login");
        assert_eq!(status, "open");
    }
}