Skip to main content

allsource_core/infrastructure/web/
api.rs

1use crate::{
2    application::{
3        dto::{
4            DetectDuplicatesRequest, DetectDuplicatesResponse, DuplicateGroup, EntitySummary,
5            EventDto, IngestEventRequest, IngestEventResponse, IngestEventsBatchRequest,
6            IngestEventsBatchResponse, ListEntitiesRequest, ListEntitiesResponse,
7            QueryEventsRequest, QueryEventsResponse,
8        },
9        services::{
10            analytics::{
11                AnalyticsEngine, CorrelationRequest, CorrelationResponse, EventFrequencyRequest,
12                EventFrequencyResponse, StatsSummaryRequest, StatsSummaryResponse,
13            },
14            pipeline::{PipelineConfig, PipelineStats},
15            replay::{ReplayProgress, StartReplayRequest, StartReplayResponse},
16            schema::{
17                CompatibilityMode, RegisterSchemaRequest, RegisterSchemaResponse,
18                ValidateEventRequest, ValidateEventResponse,
19            },
20            webhook::{RegisterWebhookRequest, UpdateWebhookRequest},
21        },
22    },
23    domain::entities::Event,
24    error::Result,
25    infrastructure::{
26        persistence::{
27            compaction::CompactionResult,
28            snapshot::{
29                CreateSnapshotRequest, CreateSnapshotResponse, ListSnapshotsRequest,
30                ListSnapshotsResponse, SnapshotInfo,
31            },
32        },
33        query::{
34            eventql::EventQLRequest,
35            geospatial::GeoQueryRequest,
36            graphql::{GraphQLError, GraphQLRequest, GraphQLResponse},
37        },
38        replication::ReplicationMode,
39        web::api_v1::AppState,
40    },
41    store::{EventStore, EventTypeInfo, StreamInfo},
42};
43use axum::{
44    Json, Router,
45    extract::{Path, Query, State, WebSocketUpgrade},
46    response::{IntoResponse, Response},
47    routing::{get, post, put},
48};
49use serde::Deserialize;
50use std::sync::Arc;
51use tower_http::{
52    cors::{Any, CorsLayer},
53    trace::TraceLayer,
54};
55
56type SharedStore = Arc<EventStore>;
57
58/// Wait for follower ACK(s) in semi-sync/sync replication modes.
59///
60/// In async mode (default), returns immediately. In semi-sync mode, waits for
61/// at least 1 follower to ACK the current WAL offset. In sync mode, waits for
62/// all followers. If the timeout expires, logs a warning and continues (degraded mode).
63async fn await_replication_ack(state: &AppState) {
64    let shipper_guard = state.wal_shipper.read().await;
65    if let Some(ref shipper) = *shipper_guard {
66        let mode = shipper.replication_mode();
67        if mode == ReplicationMode::Async {
68            return;
69        }
70
71        let target_offset = shipper.current_leader_offset();
72        if target_offset == 0 {
73            return;
74        }
75
76        let shipper = Arc::clone(shipper);
77        // Drop the read guard before the async wait to avoid holding it across await
78        drop(shipper_guard);
79
80        let timer = state
81            .store
82            .metrics()
83            .replication_ack_wait_seconds
84            .start_timer();
85        let acked = shipper.wait_for_ack(target_offset).await;
86        timer.observe_duration();
87
88        if !acked {
89            tracing::warn!(
90                "Replication ACK timeout in {} mode (offset {}). \
91                 Write succeeded locally but follower confirmation pending.",
92                mode,
93                target_offset,
94            );
95        }
96    }
97}
98
99pub async fn serve(store: SharedStore, addr: &str) -> anyhow::Result<()> {
100    let app = Router::new()
101        .route("/health", get(health))
102        .route("/metrics", get(prometheus_metrics)) // v0.6: Prometheus metrics endpoint
103        .route("/api/v1/events", post(ingest_event))
104        .route("/api/v1/events/batch", post(ingest_events_batch))
105        .route("/api/v1/events/query", get(query_events))
106        .route("/api/v1/events/{event_id}", get(get_event_by_id))
107        .route("/api/v1/events/stream", get(events_websocket)) // v0.2: WebSocket streaming
108        // v0.10: Stream and event type discovery endpoints
109        .route("/api/v1/streams", get(list_streams))
110        .route("/api/v1/event-types", get(list_event_types))
111        .route("/api/v1/entities/duplicates", get(detect_duplicates))
112        .route("/api/v1/entities/{entity_id}/state", get(get_entity_state))
113        .route(
114            "/api/v1/entities/{entity_id}/snapshot",
115            get(get_entity_snapshot),
116        )
117        .route("/api/v1/stats", get(get_stats))
118        // v0.2: Advanced analytics endpoints
119        .route("/api/v1/analytics/frequency", get(analytics_frequency))
120        .route("/api/v1/analytics/summary", get(analytics_summary))
121        .route("/api/v1/analytics/correlation", get(analytics_correlation))
122        // v0.2: Snapshot management endpoints
123        .route("/api/v1/snapshots", post(create_snapshot))
124        .route("/api/v1/snapshots", get(list_snapshots))
125        .route(
126            "/api/v1/snapshots/{entity_id}/latest",
127            get(get_latest_snapshot),
128        )
129        // v0.2: Compaction endpoints
130        .route("/api/v1/compaction/trigger", post(trigger_compaction))
131        .route("/api/v1/compaction/stats", get(compaction_stats))
132        // v0.5: Schema registry endpoints
133        .route("/api/v1/schemas", post(register_schema))
134        .route("/api/v1/schemas", get(list_subjects))
135        .route("/api/v1/schemas/{subject}", get(get_schema))
136        .route(
137            "/api/v1/schemas/{subject}/versions",
138            get(list_schema_versions),
139        )
140        .route("/api/v1/schemas/validate", post(validate_event_schema))
141        .route(
142            "/api/v1/schemas/{subject}/compatibility",
143            put(set_compatibility_mode),
144        )
145        // v0.5: Replay and projection rebuild endpoints
146        .route("/api/v1/replay", post(start_replay))
147        .route("/api/v1/replay", get(list_replays))
148        .route("/api/v1/replay/{replay_id}", get(get_replay_progress))
149        .route("/api/v1/replay/{replay_id}/cancel", post(cancel_replay))
150        .route(
151            "/api/v1/replay/{replay_id}",
152            axum::routing::delete(delete_replay),
153        )
154        // v0.5: Stream processing pipeline endpoints
155        .route("/api/v1/pipelines", post(register_pipeline))
156        .route("/api/v1/pipelines", get(list_pipelines))
157        .route("/api/v1/pipelines/stats", get(all_pipeline_stats))
158        .route("/api/v1/pipelines/{pipeline_id}", get(get_pipeline))
159        .route(
160            "/api/v1/pipelines/{pipeline_id}",
161            axum::routing::delete(remove_pipeline),
162        )
163        .route(
164            "/api/v1/pipelines/{pipeline_id}/stats",
165            get(get_pipeline_stats),
166        )
167        .route("/api/v1/pipelines/{pipeline_id}/reset", put(reset_pipeline))
168        // v0.7: Projection State API for Query Service integration
169        .route("/api/v1/projections", get(list_projections))
170        .route("/api/v1/projections/{name}", get(get_projection))
171        .route(
172            "/api/v1/projections/{name}",
173            axum::routing::delete(delete_projection),
174        )
175        .route(
176            "/api/v1/projections/{name}/state",
177            get(get_projection_state_summary),
178        )
179        .route("/api/v1/projections/{name}/reset", post(reset_projection))
180        .route(
181            "/api/v1/projections/{name}/{entity_id}/state",
182            get(get_projection_state),
183        )
184        .route(
185            "/api/v1/projections/{name}/{entity_id}/state",
186            post(save_projection_state),
187        )
188        .route(
189            "/api/v1/projections/{name}/{entity_id}/state",
190            put(save_projection_state),
191        )
192        .route(
193            "/api/v1/projections/{name}/bulk",
194            post(bulk_get_projection_states),
195        )
196        .route(
197            "/api/v1/projections/{name}/bulk/save",
198            post(bulk_save_projection_states),
199        )
200        // v0.11: Webhook management endpoints
201        .route("/api/v1/webhooks", post(register_webhook))
202        .route("/api/v1/webhooks", get(list_webhooks))
203        .route("/api/v1/webhooks/{webhook_id}", get(get_webhook))
204        .route("/api/v1/webhooks/{webhook_id}", put(update_webhook))
205        .route(
206            "/api/v1/webhooks/{webhook_id}",
207            axum::routing::delete(delete_webhook),
208        )
209        .route(
210            "/api/v1/webhooks/{webhook_id}/deliveries",
211            get(list_webhook_deliveries),
212        )
213        // v2.0: Advanced query features
214        .route("/api/v1/eventql", post(eventql_query))
215        .route("/api/v1/graphql", post(graphql_query))
216        .route("/api/v1/geospatial/query", post(geo_query))
217        .route("/api/v1/geospatial/stats", get(geo_stats))
218        .route("/api/v1/exactly-once/stats", get(exactly_once_stats))
219        .route(
220            "/api/v1/schema-evolution/history/{event_type}",
221            get(schema_evolution_history),
222        )
223        .route(
224            "/api/v1/schema-evolution/schema/{event_type}",
225            get(schema_evolution_schema),
226        )
227        .route(
228            "/api/v1/schema-evolution/stats",
229            get(schema_evolution_stats),
230        )
231        .layer(
232            CorsLayer::new()
233                .allow_origin(Any)
234                .allow_methods(Any)
235                .allow_headers(Any),
236        )
237        .layer(TraceLayer::new_for_http())
238        .with_state(store);
239
240    let listener = tokio::net::TcpListener::bind(addr).await?;
241    axum::serve(listener, app).await?;
242
243    Ok(())
244}
245
246pub async fn health() -> impl IntoResponse {
247    Json(serde_json::json!({
248        "status": "healthy",
249        "service": "allsource-core",
250        "version": env!("CARGO_PKG_VERSION")
251    }))
252}
253
254// v0.6: Prometheus metrics endpoint
255pub async fn prometheus_metrics(State(store): State<SharedStore>) -> impl IntoResponse {
256    let metrics = store.metrics();
257
258    match metrics.encode() {
259        Ok(encoded) => Response::builder()
260            .status(200)
261            .header("Content-Type", "text/plain; version=0.0.4")
262            .body(encoded)
263            .unwrap()
264            .into_response(),
265        Err(e) => Response::builder()
266            .status(500)
267            .body(format!("Error encoding metrics: {e}"))
268            .unwrap()
269            .into_response(),
270    }
271}
272
273pub async fn ingest_event(
274    State(store): State<SharedStore>,
275    Json(req): Json<IngestEventRequest>,
276) -> Result<Json<IngestEventResponse>> {
277    // Create event using from_strings with default tenant
278    let event = Event::from_strings(
279        req.event_type,
280        req.entity_id,
281        "default".to_string(),
282        req.payload,
283        req.metadata,
284    )?;
285
286    let event_id = event.id;
287    let timestamp = event.timestamp;
288
289    store.ingest(event)?;
290
291    tracing::info!("Event ingested: {}", event_id);
292
293    Ok(Json(IngestEventResponse {
294        event_id,
295        timestamp,
296    }))
297}
298
299/// Ingest a single event with semi-sync/sync replication ACK waiting.
300///
301/// Used by the v1 API (with auth and replication support).
302pub async fn ingest_event_v1(
303    State(state): State<AppState>,
304    Json(req): Json<IngestEventRequest>,
305) -> Result<Json<IngestEventResponse>> {
306    let event = Event::from_strings(
307        req.event_type,
308        req.entity_id,
309        "default".to_string(),
310        req.payload,
311        req.metadata,
312    )?;
313
314    let event_id = event.id;
315    let timestamp = event.timestamp;
316
317    state.store.ingest(event)?;
318
319    // Semi-sync/sync: wait for follower ACK(s) before returning
320    await_replication_ack(&state).await;
321
322    tracing::info!("Event ingested: {}", event_id);
323
324    Ok(Json(IngestEventResponse {
325        event_id,
326        timestamp,
327    }))
328}
329
330/// Batch ingest multiple events in a single request
331///
332/// This endpoint allows ingesting multiple events atomically, which is more
333/// efficient than making individual requests for each event.
334pub async fn ingest_events_batch(
335    State(store): State<SharedStore>,
336    Json(req): Json<IngestEventsBatchRequest>,
337) -> Result<Json<IngestEventsBatchResponse>> {
338    let total = req.events.len();
339    let mut ingested_events = Vec::with_capacity(total);
340
341    for event_req in req.events {
342        let tenant_id = event_req.tenant_id.unwrap_or_else(|| "default".to_string());
343
344        let event = Event::from_strings(
345            event_req.event_type,
346            event_req.entity_id,
347            tenant_id,
348            event_req.payload,
349            event_req.metadata,
350        )?;
351
352        let event_id = event.id;
353        let timestamp = event.timestamp;
354
355        store.ingest(event)?;
356
357        ingested_events.push(IngestEventResponse {
358            event_id,
359            timestamp,
360        });
361    }
362
363    let ingested = ingested_events.len();
364    tracing::info!("Batch ingested {} events", ingested);
365
366    Ok(Json(IngestEventsBatchResponse {
367        total,
368        ingested,
369        events: ingested_events,
370    }))
371}
372
373/// Batch ingest with semi-sync/sync replication ACK waiting.
374///
375/// Used by the v1 API (with auth and replication support).
376pub async fn ingest_events_batch_v1(
377    State(state): State<AppState>,
378    Json(req): Json<IngestEventsBatchRequest>,
379) -> Result<Json<IngestEventsBatchResponse>> {
380    let total = req.events.len();
381    let mut ingested_events = Vec::with_capacity(total);
382
383    for event_req in req.events {
384        let tenant_id = event_req.tenant_id.unwrap_or_else(|| "default".to_string());
385
386        let event = Event::from_strings(
387            event_req.event_type,
388            event_req.entity_id,
389            tenant_id,
390            event_req.payload,
391            event_req.metadata,
392        )?;
393
394        let event_id = event.id;
395        let timestamp = event.timestamp;
396
397        state.store.ingest(event)?;
398
399        ingested_events.push(IngestEventResponse {
400            event_id,
401            timestamp,
402        });
403    }
404
405    // Semi-sync/sync: wait for follower ACK(s) after all events are ingested
406    await_replication_ack(&state).await;
407
408    let ingested = ingested_events.len();
409    tracing::info!("Batch ingested {} events", ingested);
410
411    Ok(Json(IngestEventsBatchResponse {
412        total,
413        ingested,
414        events: ingested_events,
415    }))
416}
417
418pub async fn query_events(
419    State(store): State<SharedStore>,
420    Query(req): Query<QueryEventsRequest>,
421) -> Result<Json<QueryEventsResponse>> {
422    let requested_limit = req.limit;
423
424    // Query without limit to get total count
425    let unlimited_req = QueryEventsRequest {
426        entity_id: req.entity_id,
427        event_type: req.event_type,
428        tenant_id: req.tenant_id,
429        as_of: req.as_of,
430        since: req.since,
431        until: req.until,
432        limit: None,
433        event_type_prefix: req.event_type_prefix,
434        payload_filter: req.payload_filter,
435    };
436    let all_events = store.query(unlimited_req)?;
437    let total_count = all_events.len();
438
439    // Apply limit
440    let limited_events: Vec<Event> = if let Some(limit) = requested_limit {
441        all_events.into_iter().take(limit).collect()
442    } else {
443        all_events
444    };
445
446    let count = limited_events.len();
447    let has_more = count < total_count;
448    let events: Vec<EventDto> = limited_events.iter().map(EventDto::from).collect();
449
450    tracing::debug!("Query returned {} events (total: {})", count, total_count);
451
452    Ok(Json(QueryEventsResponse {
453        events,
454        count,
455        total_count,
456        has_more,
457    }))
458}
459
460pub async fn list_entities(
461    State(store): State<SharedStore>,
462    Query(req): Query<ListEntitiesRequest>,
463) -> Result<Json<ListEntitiesResponse>> {
464    use std::collections::HashMap;
465
466    // Get all events matching the filters
467    let query_req = QueryEventsRequest {
468        entity_id: None,
469        event_type: None,
470        tenant_id: None,
471        as_of: None,
472        since: None,
473        until: None,
474        limit: None,
475        event_type_prefix: req.event_type_prefix,
476        payload_filter: req.payload_filter,
477    };
478    let events = store.query(query_req)?;
479
480    // Group by entity_id
481    let mut entity_map: HashMap<String, Vec<&Event>> = HashMap::new();
482    for event in &events {
483        entity_map
484            .entry(event.entity_id().to_string())
485            .or_default()
486            .push(event);
487    }
488
489    // Build entity summaries sorted by last event time (descending)
490    let mut summaries: Vec<EntitySummary> = entity_map
491        .into_iter()
492        .map(|(entity_id, events)| {
493            let last = events.iter().max_by_key(|e| e.timestamp()).unwrap();
494            EntitySummary {
495                entity_id,
496                event_count: events.len(),
497                last_event_type: last.event_type_str().to_string(),
498                last_event_at: last.timestamp(),
499            }
500        })
501        .collect();
502    summaries.sort_by(|a, b| b.last_event_at.cmp(&a.last_event_at));
503
504    let total = summaries.len();
505
506    // Apply offset and limit
507    let offset = req.offset.unwrap_or(0);
508    let summaries: Vec<EntitySummary> = summaries.into_iter().skip(offset).collect::<Vec<_>>();
509    let summaries = if let Some(limit) = req.limit {
510        let has_more = summaries.len() > limit;
511        let truncated: Vec<EntitySummary> = summaries.into_iter().take(limit).collect();
512        return Ok(Json(ListEntitiesResponse {
513            entities: truncated,
514            total,
515            has_more,
516        }));
517    } else {
518        summaries
519    };
520
521    Ok(Json(ListEntitiesResponse {
522        entities: summaries,
523        total,
524        has_more: false,
525    }))
526}
527
528pub async fn detect_duplicates(
529    State(store): State<SharedStore>,
530    Query(req): Query<DetectDuplicatesRequest>,
531) -> Result<Json<DetectDuplicatesResponse>> {
532    use std::collections::HashMap;
533
534    let group_by_fields: Vec<&str> = req.group_by.split(',').map(|s| s.trim()).collect();
535
536    // Query events scoped by the required prefix
537    let query_req = QueryEventsRequest {
538        entity_id: None,
539        event_type: None,
540        tenant_id: None,
541        as_of: None,
542        since: None,
543        until: None,
544        limit: None,
545        event_type_prefix: Some(req.event_type_prefix),
546        payload_filter: None,
547    };
548    let events = store.query(query_req)?;
549
550    // For each entity, extract the latest event's payload fields specified by group_by
551    // Then group entities by those field values
552    let mut entity_latest: HashMap<String, &Event> = HashMap::new();
553    for event in &events {
554        let eid = event.entity_id().to_string();
555        entity_latest
556            .entry(eid)
557            .and_modify(|existing| {
558                if event.timestamp() > existing.timestamp() {
559                    *existing = event;
560                }
561            })
562            .or_insert(event);
563    }
564
565    // Group entities by their payload field values
566    let mut groups: HashMap<String, Vec<String>> = HashMap::new();
567    for (entity_id, event) in &entity_latest {
568        let payload = event.payload();
569        let mut key_parts = serde_json::Map::new();
570        for field in &group_by_fields {
571            let value = payload
572                .get(*field)
573                .cloned()
574                .unwrap_or(serde_json::Value::Null);
575            key_parts.insert(field.to_string(), value);
576        }
577        let key_str = serde_json::to_string(&key_parts).unwrap_or_default();
578        groups.entry(key_str).or_default().push(entity_id.clone());
579    }
580
581    // Filter to groups with count > 1 (actual duplicates)
582    let mut duplicate_groups: Vec<DuplicateGroup> = groups
583        .into_iter()
584        .filter(|(_, ids)| ids.len() > 1)
585        .map(|(key_str, mut ids)| {
586            ids.sort();
587            let key: serde_json::Value =
588                serde_json::from_str(&key_str).unwrap_or(serde_json::Value::Null);
589            let count = ids.len();
590            DuplicateGroup {
591                key,
592                entity_ids: ids,
593                count,
594            }
595        })
596        .collect();
597
598    // Sort by count descending for consistent output
599    duplicate_groups.sort_by(|a, b| b.count.cmp(&a.count));
600
601    let total = duplicate_groups.len();
602
603    // Apply offset and limit
604    let offset = req.offset.unwrap_or(0);
605    let duplicate_groups: Vec<DuplicateGroup> = duplicate_groups.into_iter().skip(offset).collect();
606
607    if let Some(limit) = req.limit {
608        let has_more = duplicate_groups.len() > limit;
609        let truncated: Vec<DuplicateGroup> = duplicate_groups.into_iter().take(limit).collect();
610        return Ok(Json(DetectDuplicatesResponse {
611            duplicates: truncated,
612            total,
613            has_more,
614        }));
615    }
616
617    Ok(Json(DetectDuplicatesResponse {
618        duplicates: duplicate_groups,
619        total,
620        has_more: false,
621    }))
622}
623
624#[derive(Deserialize)]
625pub struct EntityStateParams {
626    as_of: Option<chrono::DateTime<chrono::Utc>>,
627}
628
629pub async fn get_entity_state(
630    State(store): State<SharedStore>,
631    Path(entity_id): Path<String>,
632    Query(params): Query<EntityStateParams>,
633) -> Result<Json<serde_json::Value>> {
634    let state = store.reconstruct_state(&entity_id, params.as_of)?;
635
636    tracing::info!("State reconstructed for entity: {}", entity_id);
637
638    Ok(Json(state))
639}
640
641pub async fn get_entity_snapshot(
642    State(store): State<SharedStore>,
643    Path(entity_id): Path<String>,
644) -> Result<Json<serde_json::Value>> {
645    let snapshot = store.get_snapshot(&entity_id)?;
646
647    tracing::debug!("Snapshot retrieved for entity: {}", entity_id);
648
649    Ok(Json(snapshot))
650}
651
652pub async fn get_stats(State(store): State<SharedStore>) -> impl IntoResponse {
653    let stats = store.stats();
654    Json(stats)
655}
656
657// v0.10: List all streams (entity_ids) in the event store
658/// Query parameters for listing streams
659#[derive(Debug, Deserialize)]
660pub struct ListStreamsParams {
661    /// Optional limit on number of streams to return
662    pub limit: Option<usize>,
663    /// Optional offset for pagination
664    pub offset: Option<usize>,
665}
666
667/// Response for listing streams
668#[derive(Debug, serde::Serialize)]
669pub struct ListStreamsResponse {
670    pub streams: Vec<StreamInfo>,
671    pub total: usize,
672}
673
674pub async fn list_streams(
675    State(store): State<SharedStore>,
676    Query(params): Query<ListStreamsParams>,
677) -> Json<ListStreamsResponse> {
678    let mut streams = store.list_streams();
679    let total = streams.len();
680
681    // Sort by last_event_at descending (most recent first)
682    streams.sort_by(|a, b| b.last_event_at.cmp(&a.last_event_at));
683
684    // Apply pagination
685    if let Some(offset) = params.offset {
686        if offset < streams.len() {
687            streams = streams[offset..].to_vec();
688        } else {
689            streams = vec![];
690        }
691    }
692
693    if let Some(limit) = params.limit {
694        streams.truncate(limit);
695    }
696
697    tracing::debug!("Listed {} streams (total: {})", streams.len(), total);
698
699    Json(ListStreamsResponse { streams, total })
700}
701
702// v0.10: List all event types in the event store
703/// Query parameters for listing event types
704#[derive(Debug, Deserialize)]
705pub struct ListEventTypesParams {
706    /// Optional limit on number of event types to return
707    pub limit: Option<usize>,
708    /// Optional offset for pagination
709    pub offset: Option<usize>,
710}
711
712/// Response for listing event types
713#[derive(Debug, serde::Serialize)]
714pub struct ListEventTypesResponse {
715    pub event_types: Vec<EventTypeInfo>,
716    pub total: usize,
717}
718
719pub async fn list_event_types(
720    State(store): State<SharedStore>,
721    Query(params): Query<ListEventTypesParams>,
722) -> Json<ListEventTypesResponse> {
723    let mut event_types = store.list_event_types();
724    let total = event_types.len();
725
726    // Sort by event_count descending (most used first)
727    event_types.sort_by(|a, b| b.event_count.cmp(&a.event_count));
728
729    // Apply pagination
730    if let Some(offset) = params.offset {
731        if offset < event_types.len() {
732            event_types = event_types[offset..].to_vec();
733        } else {
734            event_types = vec![];
735        }
736    }
737
738    if let Some(limit) = params.limit {
739        event_types.truncate(limit);
740    }
741
742    tracing::debug!(
743        "Listed {} event types (total: {})",
744        event_types.len(),
745        total
746    );
747
748    Json(ListEventTypesResponse { event_types, total })
749}
750
751// v0.2: WebSocket endpoint for real-time event streaming
752pub async fn events_websocket(ws: WebSocketUpgrade, State(store): State<SharedStore>) -> Response {
753    let websocket_manager = store.websocket_manager();
754
755    ws.on_upgrade(move |socket| async move {
756        websocket_manager.handle_socket(socket).await;
757    })
758}
759
760// v0.2: Event frequency analytics endpoint
761pub async fn analytics_frequency(
762    State(store): State<SharedStore>,
763    Query(req): Query<EventFrequencyRequest>,
764) -> Result<Json<EventFrequencyResponse>> {
765    let response = AnalyticsEngine::event_frequency(&store, req)?;
766
767    tracing::debug!(
768        "Frequency analysis returned {} buckets",
769        response.buckets.len()
770    );
771
772    Ok(Json(response))
773}
774
775// v0.2: Statistical summary endpoint
776pub async fn analytics_summary(
777    State(store): State<SharedStore>,
778    Query(req): Query<StatsSummaryRequest>,
779) -> Result<Json<StatsSummaryResponse>> {
780    let response = AnalyticsEngine::stats_summary(&store, req)?;
781
782    tracing::debug!(
783        "Stats summary: {} events across {} entities",
784        response.total_events,
785        response.unique_entities
786    );
787
788    Ok(Json(response))
789}
790
791// v0.2: Event correlation analysis endpoint
792pub async fn analytics_correlation(
793    State(store): State<SharedStore>,
794    Query(req): Query<CorrelationRequest>,
795) -> Result<Json<CorrelationResponse>> {
796    let response = AnalyticsEngine::analyze_correlation(&store, req)?;
797
798    tracing::debug!(
799        "Correlation analysis: {}/{} correlated pairs ({:.2}%)",
800        response.correlated_pairs,
801        response.total_a,
802        response.correlation_percentage
803    );
804
805    Ok(Json(response))
806}
807
808// v0.2: Create a snapshot for an entity
809pub async fn create_snapshot(
810    State(store): State<SharedStore>,
811    Json(req): Json<CreateSnapshotRequest>,
812) -> Result<Json<CreateSnapshotResponse>> {
813    store.create_snapshot(&req.entity_id)?;
814
815    let snapshot_manager = store.snapshot_manager();
816    let snapshot = snapshot_manager
817        .get_latest_snapshot(&req.entity_id)
818        .ok_or_else(|| crate::error::AllSourceError::EntityNotFound(req.entity_id.clone()))?;
819
820    tracing::info!("📸 Created snapshot for entity: {}", req.entity_id);
821
822    Ok(Json(CreateSnapshotResponse {
823        snapshot_id: snapshot.id,
824        entity_id: snapshot.entity_id,
825        created_at: snapshot.created_at,
826        event_count: snapshot.event_count,
827        size_bytes: snapshot.metadata.size_bytes,
828    }))
829}
830
831// v0.2: List snapshots
832pub async fn list_snapshots(
833    State(store): State<SharedStore>,
834    Query(req): Query<ListSnapshotsRequest>,
835) -> Result<Json<ListSnapshotsResponse>> {
836    let snapshot_manager = store.snapshot_manager();
837
838    let snapshots: Vec<SnapshotInfo> = if let Some(entity_id) = req.entity_id {
839        snapshot_manager
840            .get_all_snapshots(&entity_id)
841            .into_iter()
842            .map(SnapshotInfo::from)
843            .collect()
844    } else {
845        // List all entities with snapshots
846        let entities = snapshot_manager.list_entities();
847        entities
848            .iter()
849            .flat_map(|entity_id| {
850                snapshot_manager
851                    .get_all_snapshots(entity_id)
852                    .into_iter()
853                    .map(SnapshotInfo::from)
854            })
855            .collect()
856    };
857
858    let total = snapshots.len();
859
860    tracing::debug!("Listed {} snapshots", total);
861
862    Ok(Json(ListSnapshotsResponse { snapshots, total }))
863}
864
865// v0.2: Get latest snapshot for an entity
866pub async fn get_latest_snapshot(
867    State(store): State<SharedStore>,
868    Path(entity_id): Path<String>,
869) -> Result<Json<serde_json::Value>> {
870    let snapshot_manager = store.snapshot_manager();
871
872    let snapshot = snapshot_manager
873        .get_latest_snapshot(&entity_id)
874        .ok_or_else(|| crate::error::AllSourceError::EntityNotFound(entity_id.clone()))?;
875
876    tracing::debug!("Retrieved latest snapshot for entity: {}", entity_id);
877
878    Ok(Json(serde_json::json!({
879        "snapshot_id": snapshot.id,
880        "entity_id": snapshot.entity_id,
881        "created_at": snapshot.created_at,
882        "as_of": snapshot.as_of,
883        "event_count": snapshot.event_count,
884        "size_bytes": snapshot.metadata.size_bytes,
885        "snapshot_type": snapshot.metadata.snapshot_type,
886        "state": snapshot.state
887    })))
888}
889
890// v0.2: Trigger manual compaction
891pub async fn trigger_compaction(
892    State(store): State<SharedStore>,
893) -> Result<Json<CompactionResult>> {
894    let compaction_manager = store.compaction_manager().ok_or_else(|| {
895        crate::error::AllSourceError::InternalError(
896            "Compaction not enabled (no Parquet storage)".to_string(),
897        )
898    })?;
899
900    tracing::info!("📦 Manual compaction triggered via API");
901
902    let result = compaction_manager.compact_now()?;
903
904    Ok(Json(result))
905}
906
907// v0.2: Get compaction statistics
908pub async fn compaction_stats(State(store): State<SharedStore>) -> Result<Json<serde_json::Value>> {
909    let compaction_manager = store.compaction_manager().ok_or_else(|| {
910        crate::error::AllSourceError::InternalError(
911            "Compaction not enabled (no Parquet storage)".to_string(),
912        )
913    })?;
914
915    let stats = compaction_manager.stats();
916    let config = compaction_manager.config();
917
918    Ok(Json(serde_json::json!({
919        "stats": stats,
920        "config": {
921            "min_files_to_compact": config.min_files_to_compact,
922            "target_file_size": config.target_file_size,
923            "max_file_size": config.max_file_size,
924            "small_file_threshold": config.small_file_threshold,
925            "compaction_interval_seconds": config.compaction_interval_seconds,
926            "auto_compact": config.auto_compact,
927            "strategy": config.strategy
928        }
929    })))
930}
931
932// v0.5: Register a new schema
933pub async fn register_schema(
934    State(store): State<SharedStore>,
935    Json(req): Json<RegisterSchemaRequest>,
936) -> Result<Json<RegisterSchemaResponse>> {
937    let schema_registry = store.schema_registry();
938
939    let response =
940        schema_registry.register_schema(req.subject, req.schema, req.description, req.tags)?;
941
942    tracing::info!(
943        "📋 Schema registered: v{} for '{}'",
944        response.version,
945        response.subject
946    );
947
948    Ok(Json(response))
949}
950
951// v0.5: Get a schema by subject and optional version
952#[derive(Deserialize)]
953pub struct GetSchemaParams {
954    version: Option<u32>,
955}
956
957pub async fn get_schema(
958    State(store): State<SharedStore>,
959    Path(subject): Path<String>,
960    Query(params): Query<GetSchemaParams>,
961) -> Result<Json<serde_json::Value>> {
962    let schema_registry = store.schema_registry();
963
964    let schema = schema_registry.get_schema(&subject, params.version)?;
965
966    tracing::debug!("Retrieved schema v{} for '{}'", schema.version, subject);
967
968    Ok(Json(serde_json::json!({
969        "id": schema.id,
970        "subject": schema.subject,
971        "version": schema.version,
972        "schema": schema.schema,
973        "created_at": schema.created_at,
974        "description": schema.description,
975        "tags": schema.tags
976    })))
977}
978
979// v0.5: List all versions of a schema subject
980pub async fn list_schema_versions(
981    State(store): State<SharedStore>,
982    Path(subject): Path<String>,
983) -> Result<Json<serde_json::Value>> {
984    let schema_registry = store.schema_registry();
985
986    let versions = schema_registry.list_versions(&subject)?;
987
988    Ok(Json(serde_json::json!({
989        "subject": subject,
990        "versions": versions
991    })))
992}
993
994// v0.5: List all schema subjects
995pub async fn list_subjects(State(store): State<SharedStore>) -> Json<serde_json::Value> {
996    let schema_registry = store.schema_registry();
997
998    let subjects = schema_registry.list_subjects();
999
1000    Json(serde_json::json!({
1001        "subjects": subjects,
1002        "total": subjects.len()
1003    }))
1004}
1005
1006// v0.5: Validate an event against a schema
1007pub async fn validate_event_schema(
1008    State(store): State<SharedStore>,
1009    Json(req): Json<ValidateEventRequest>,
1010) -> Result<Json<ValidateEventResponse>> {
1011    let schema_registry = store.schema_registry();
1012
1013    let response = schema_registry.validate(&req.subject, req.version, &req.payload)?;
1014
1015    if response.valid {
1016        tracing::debug!(
1017            "✅ Event validated against schema '{}' v{}",
1018            req.subject,
1019            response.schema_version
1020        );
1021    } else {
1022        tracing::warn!(
1023            "❌ Event validation failed for '{}': {:?}",
1024            req.subject,
1025            response.errors
1026        );
1027    }
1028
1029    Ok(Json(response))
1030}
1031
1032// v0.5: Set compatibility mode for a subject
1033#[derive(Deserialize)]
1034pub struct SetCompatibilityRequest {
1035    compatibility: CompatibilityMode,
1036}
1037
1038pub async fn set_compatibility_mode(
1039    State(store): State<SharedStore>,
1040    Path(subject): Path<String>,
1041    Json(req): Json<SetCompatibilityRequest>,
1042) -> Json<serde_json::Value> {
1043    let schema_registry = store.schema_registry();
1044
1045    schema_registry.set_compatibility_mode(subject.clone(), req.compatibility);
1046
1047    tracing::info!(
1048        "🔧 Set compatibility mode for '{}' to {:?}",
1049        subject,
1050        req.compatibility
1051    );
1052
1053    Json(serde_json::json!({
1054        "subject": subject,
1055        "compatibility": req.compatibility
1056    }))
1057}
1058
1059// v0.5: Start a replay operation
1060pub async fn start_replay(
1061    State(store): State<SharedStore>,
1062    Json(req): Json<StartReplayRequest>,
1063) -> Result<Json<StartReplayResponse>> {
1064    let replay_manager = store.replay_manager();
1065
1066    let response = replay_manager.start_replay(store, req)?;
1067
1068    tracing::info!(
1069        "🔄 Started replay {} with {} events",
1070        response.replay_id,
1071        response.total_events
1072    );
1073
1074    Ok(Json(response))
1075}
1076
1077// v0.5: Get replay progress
1078pub async fn get_replay_progress(
1079    State(store): State<SharedStore>,
1080    Path(replay_id): Path<uuid::Uuid>,
1081) -> Result<Json<ReplayProgress>> {
1082    let replay_manager = store.replay_manager();
1083
1084    let progress = replay_manager.get_progress(replay_id)?;
1085
1086    Ok(Json(progress))
1087}
1088
1089// v0.5: List all replay operations
1090pub async fn list_replays(State(store): State<SharedStore>) -> Json<serde_json::Value> {
1091    let replay_manager = store.replay_manager();
1092
1093    let replays = replay_manager.list_replays();
1094
1095    Json(serde_json::json!({
1096        "replays": replays,
1097        "total": replays.len()
1098    }))
1099}
1100
1101// v0.5: Cancel a running replay
1102pub async fn cancel_replay(
1103    State(store): State<SharedStore>,
1104    Path(replay_id): Path<uuid::Uuid>,
1105) -> Result<Json<serde_json::Value>> {
1106    let replay_manager = store.replay_manager();
1107
1108    replay_manager.cancel_replay(replay_id)?;
1109
1110    tracing::info!("🛑 Cancelled replay {}", replay_id);
1111
1112    Ok(Json(serde_json::json!({
1113        "replay_id": replay_id,
1114        "status": "cancelled"
1115    })))
1116}
1117
1118// v0.5: Delete a completed replay
1119pub async fn delete_replay(
1120    State(store): State<SharedStore>,
1121    Path(replay_id): Path<uuid::Uuid>,
1122) -> Result<Json<serde_json::Value>> {
1123    let replay_manager = store.replay_manager();
1124
1125    let deleted = replay_manager.delete_replay(replay_id)?;
1126
1127    if deleted {
1128        tracing::info!("🗑️  Deleted replay {}", replay_id);
1129    }
1130
1131    Ok(Json(serde_json::json!({
1132        "replay_id": replay_id,
1133        "deleted": deleted
1134    })))
1135}
1136
1137// v0.5: Register a new pipeline
1138pub async fn register_pipeline(
1139    State(store): State<SharedStore>,
1140    Json(config): Json<PipelineConfig>,
1141) -> Result<Json<serde_json::Value>> {
1142    let pipeline_manager = store.pipeline_manager();
1143
1144    let pipeline_id = pipeline_manager.register(config.clone());
1145
1146    tracing::info!(
1147        "🔀 Pipeline registered: {} (name: {})",
1148        pipeline_id,
1149        config.name
1150    );
1151
1152    Ok(Json(serde_json::json!({
1153        "pipeline_id": pipeline_id,
1154        "name": config.name,
1155        "enabled": config.enabled
1156    })))
1157}
1158
1159// v0.5: List all pipelines
1160pub async fn list_pipelines(State(store): State<SharedStore>) -> Json<serde_json::Value> {
1161    let pipeline_manager = store.pipeline_manager();
1162
1163    let pipelines = pipeline_manager.list();
1164
1165    tracing::debug!("Listed {} pipelines", pipelines.len());
1166
1167    Json(serde_json::json!({
1168        "pipelines": pipelines,
1169        "total": pipelines.len()
1170    }))
1171}
1172
1173// v0.5: Get a specific pipeline
1174pub async fn get_pipeline(
1175    State(store): State<SharedStore>,
1176    Path(pipeline_id): Path<uuid::Uuid>,
1177) -> Result<Json<PipelineConfig>> {
1178    let pipeline_manager = store.pipeline_manager();
1179
1180    let pipeline = pipeline_manager.get(pipeline_id).ok_or_else(|| {
1181        crate::error::AllSourceError::ValidationError(format!(
1182            "Pipeline not found: {}",
1183            pipeline_id
1184        ))
1185    })?;
1186
1187    Ok(Json(pipeline.config().clone()))
1188}
1189
1190// v0.5: Remove a pipeline
1191pub async fn remove_pipeline(
1192    State(store): State<SharedStore>,
1193    Path(pipeline_id): Path<uuid::Uuid>,
1194) -> Result<Json<serde_json::Value>> {
1195    let pipeline_manager = store.pipeline_manager();
1196
1197    let removed = pipeline_manager.remove(pipeline_id);
1198
1199    if removed {
1200        tracing::info!("🗑️  Removed pipeline {}", pipeline_id);
1201    }
1202
1203    Ok(Json(serde_json::json!({
1204        "pipeline_id": pipeline_id,
1205        "removed": removed
1206    })))
1207}
1208
1209// v0.5: Get statistics for all pipelines
1210pub async fn all_pipeline_stats(State(store): State<SharedStore>) -> Json<serde_json::Value> {
1211    let pipeline_manager = store.pipeline_manager();
1212
1213    let stats = pipeline_manager.all_stats();
1214
1215    Json(serde_json::json!({
1216        "stats": stats,
1217        "total": stats.len()
1218    }))
1219}
1220
1221// v0.5: Get statistics for a specific pipeline
1222pub async fn get_pipeline_stats(
1223    State(store): State<SharedStore>,
1224    Path(pipeline_id): Path<uuid::Uuid>,
1225) -> Result<Json<PipelineStats>> {
1226    let pipeline_manager = store.pipeline_manager();
1227
1228    let pipeline = pipeline_manager.get(pipeline_id).ok_or_else(|| {
1229        crate::error::AllSourceError::ValidationError(format!(
1230            "Pipeline not found: {}",
1231            pipeline_id
1232        ))
1233    })?;
1234
1235    Ok(Json(pipeline.stats()))
1236}
1237
1238// v0.5: Reset a pipeline's state
1239pub async fn reset_pipeline(
1240    State(store): State<SharedStore>,
1241    Path(pipeline_id): Path<uuid::Uuid>,
1242) -> Result<Json<serde_json::Value>> {
1243    let pipeline_manager = store.pipeline_manager();
1244
1245    let pipeline = pipeline_manager.get(pipeline_id).ok_or_else(|| {
1246        crate::error::AllSourceError::ValidationError(format!(
1247            "Pipeline not found: {}",
1248            pipeline_id
1249        ))
1250    })?;
1251
1252    pipeline.reset();
1253
1254    tracing::info!("🔄 Reset pipeline {}", pipeline_id);
1255
1256    Ok(Json(serde_json::json!({
1257        "pipeline_id": pipeline_id,
1258        "reset": true
1259    })))
1260}
1261
1262// =============================================================================
1263// v0.11: Single Event Lookup by ID
1264// =============================================================================
1265
1266/// Get a single event by UUID
1267pub async fn get_event_by_id(
1268    State(store): State<SharedStore>,
1269    Path(event_id): Path<uuid::Uuid>,
1270) -> Result<Json<serde_json::Value>> {
1271    let event = store.get_event_by_id(&event_id)?.ok_or_else(|| {
1272        crate::error::AllSourceError::EntityNotFound(format!("Event '{}' not found", event_id))
1273    })?;
1274
1275    let dto = EventDto::from(&event);
1276
1277    tracing::debug!("Event retrieved by ID: {}", event_id);
1278
1279    Ok(Json(serde_json::json!({
1280        "event": dto,
1281        "found": true
1282    })))
1283}
1284
1285// =============================================================================
1286// v0.7: Projection State API for Query Service Integration
1287// =============================================================================
1288
1289/// List all registered projections
1290pub async fn list_projections(State(store): State<SharedStore>) -> Json<serde_json::Value> {
1291    let projection_manager = store.projection_manager();
1292
1293    let projections: Vec<serde_json::Value> = projection_manager
1294        .list_projections()
1295        .iter()
1296        .map(|(name, projection)| {
1297            serde_json::json!({
1298                "name": name,
1299                "type": format!("{:?}", projection.name()),
1300            })
1301        })
1302        .collect();
1303
1304    tracing::debug!("Listed {} projections", projections.len());
1305
1306    Json(serde_json::json!({
1307        "projections": projections,
1308        "total": projections.len()
1309    }))
1310}
1311
1312/// Get projection metadata by name
1313pub async fn get_projection(
1314    State(store): State<SharedStore>,
1315    Path(name): Path<String>,
1316) -> Result<Json<serde_json::Value>> {
1317    let projection_manager = store.projection_manager();
1318
1319    let projection = projection_manager.get_projection(&name).ok_or_else(|| {
1320        crate::error::AllSourceError::EntityNotFound(format!("Projection '{name}' not found"))
1321    })?;
1322
1323    Ok(Json(serde_json::json!({
1324        "name": projection.name(),
1325        "found": true
1326    })))
1327}
1328
1329/// Get projection state for a specific entity
1330///
1331/// This endpoint allows the Elixir Query Service to fetch projection state
1332/// from the Rust Core for synchronization.
1333pub async fn get_projection_state(
1334    State(store): State<SharedStore>,
1335    Path((name, entity_id)): Path<(String, String)>,
1336) -> Result<Json<serde_json::Value>> {
1337    let projection_manager = store.projection_manager();
1338
1339    let projection = projection_manager.get_projection(&name).ok_or_else(|| {
1340        crate::error::AllSourceError::EntityNotFound(format!("Projection '{name}' not found"))
1341    })?;
1342
1343    let state = projection.get_state(&entity_id);
1344
1345    tracing::debug!("Projection state retrieved: {} / {}", name, entity_id);
1346
1347    Ok(Json(serde_json::json!({
1348        "projection": name,
1349        "entity_id": entity_id,
1350        "state": state,
1351        "found": state.is_some()
1352    })))
1353}
1354
1355/// Delete (clear) a projection by name
1356///
1357/// Removes all state from the projection. The projection definition remains
1358/// registered but its accumulated state is cleared.
1359pub async fn delete_projection(
1360    State(store): State<SharedStore>,
1361    Path(name): Path<String>,
1362) -> Result<Json<serde_json::Value>> {
1363    let projection_manager = store.projection_manager();
1364
1365    let projection = projection_manager.get_projection(&name).ok_or_else(|| {
1366        crate::error::AllSourceError::EntityNotFound(format!("Projection '{name}' not found"))
1367    })?;
1368
1369    projection.clear();
1370
1371    // Also clear any cached state for this projection
1372    let cache = store.projection_state_cache();
1373    let prefix = format!("{name}:");
1374    let keys_to_remove: Vec<String> = cache
1375        .iter()
1376        .filter(|entry| entry.key().starts_with(&prefix))
1377        .map(|entry| entry.key().clone())
1378        .collect();
1379    for key in keys_to_remove {
1380        cache.remove(&key);
1381    }
1382
1383    tracing::info!("Projection deleted (cleared): {}", name);
1384
1385    Ok(Json(serde_json::json!({
1386        "projection": name,
1387        "deleted": true
1388    })))
1389}
1390
1391/// Get aggregate projection state (all entities)
1392///
1393/// Returns summary information about a projection's state across all entities.
1394pub async fn get_projection_state_summary(
1395    State(store): State<SharedStore>,
1396    Path(name): Path<String>,
1397) -> Result<Json<serde_json::Value>> {
1398    let projection_manager = store.projection_manager();
1399
1400    let _projection = projection_manager.get_projection(&name).ok_or_else(|| {
1401        crate::error::AllSourceError::EntityNotFound(format!("Projection '{name}' not found"))
1402    })?;
1403
1404    // Collect cached states for this projection
1405    let cache = store.projection_state_cache();
1406    let prefix = format!("{name}:");
1407    let states: Vec<serde_json::Value> = cache
1408        .iter()
1409        .filter(|entry| entry.key().starts_with(&prefix))
1410        .map(|entry| {
1411            let entity_id = entry.key().strip_prefix(&prefix).unwrap_or(entry.key());
1412            serde_json::json!({
1413                "entity_id": entity_id,
1414                "state": entry.value().clone()
1415            })
1416        })
1417        .collect();
1418
1419    let total = states.len();
1420
1421    tracing::debug!("Projection state summary: {} ({} entities)", name, total);
1422
1423    Ok(Json(serde_json::json!({
1424        "projection": name,
1425        "states": states,
1426        "total": total
1427    })))
1428}
1429
1430/// Reset a projection to its initial state
1431///
1432/// Clears all accumulated state and reprocesses events from the beginning.
1433pub async fn reset_projection(
1434    State(store): State<SharedStore>,
1435    Path(name): Path<String>,
1436) -> Result<Json<serde_json::Value>> {
1437    let reprocessed = store.reset_projection(&name)?;
1438
1439    tracing::info!(
1440        "Projection reset: {} ({} events reprocessed)",
1441        name,
1442        reprocessed
1443    );
1444
1445    Ok(Json(serde_json::json!({
1446        "projection": name,
1447        "reset": true,
1448        "events_reprocessed": reprocessed
1449    })))
1450}
1451
1452/// Request body for saving projection state
1453#[derive(Debug, Deserialize)]
1454pub struct SaveProjectionStateRequest {
1455    pub state: serde_json::Value,
1456}
1457
1458/// Save/update projection state for an entity
1459///
1460/// This endpoint allows external services (like Elixir Query Service) to
1461/// store computed projection state back to the Core for persistence.
1462pub async fn save_projection_state(
1463    State(store): State<SharedStore>,
1464    Path((name, entity_id)): Path<(String, String)>,
1465    Json(req): Json<SaveProjectionStateRequest>,
1466) -> Result<Json<serde_json::Value>> {
1467    let projection_cache = store.projection_state_cache();
1468
1469    // Store in the projection state cache
1470    projection_cache.insert(format!("{name}:{entity_id}"), req.state.clone());
1471
1472    tracing::info!("Projection state saved: {} / {}", name, entity_id);
1473
1474    Ok(Json(serde_json::json!({
1475        "projection": name,
1476        "entity_id": entity_id,
1477        "saved": true
1478    })))
1479}
1480
1481/// Bulk get projection states for multiple entities
1482///
1483/// Efficient endpoint for fetching multiple entity states in a single request.
1484#[derive(Debug, Deserialize)]
1485pub struct BulkGetStateRequest {
1486    pub entity_ids: Vec<String>,
1487}
1488
1489/// Bulk save projection states for multiple entities
1490///
1491/// Efficient endpoint for saving multiple entity states in a single request.
1492#[derive(Debug, Deserialize)]
1493pub struct BulkSaveStateRequest {
1494    pub states: Vec<BulkSaveStateItem>,
1495}
1496
1497#[derive(Debug, Deserialize)]
1498pub struct BulkSaveStateItem {
1499    pub entity_id: String,
1500    pub state: serde_json::Value,
1501}
1502
1503pub async fn bulk_get_projection_states(
1504    State(store): State<SharedStore>,
1505    Path(name): Path<String>,
1506    Json(req): Json<BulkGetStateRequest>,
1507) -> Result<Json<serde_json::Value>> {
1508    let projection_manager = store.projection_manager();
1509
1510    let projection = projection_manager.get_projection(&name).ok_or_else(|| {
1511        crate::error::AllSourceError::EntityNotFound(format!("Projection '{name}' not found"))
1512    })?;
1513
1514    let states: Vec<serde_json::Value> = req
1515        .entity_ids
1516        .iter()
1517        .map(|entity_id| {
1518            let state = projection.get_state(entity_id);
1519            serde_json::json!({
1520                "entity_id": entity_id,
1521                "state": state,
1522                "found": state.is_some()
1523            })
1524        })
1525        .collect();
1526
1527    tracing::debug!(
1528        "Bulk projection state retrieved: {} entities from {}",
1529        states.len(),
1530        name
1531    );
1532
1533    Ok(Json(serde_json::json!({
1534        "projection": name,
1535        "states": states,
1536        "total": states.len()
1537    })))
1538}
1539
1540/// Bulk save projection states for multiple entities
1541///
1542/// This endpoint allows efficient batch saving of projection states,
1543/// critical for high-throughput event processing pipelines.
1544pub async fn bulk_save_projection_states(
1545    State(store): State<SharedStore>,
1546    Path(name): Path<String>,
1547    Json(req): Json<BulkSaveStateRequest>,
1548) -> Result<Json<serde_json::Value>> {
1549    let projection_cache = store.projection_state_cache();
1550
1551    let mut saved_count = 0;
1552    for item in &req.states {
1553        projection_cache.insert(format!("{name}:{}", item.entity_id), item.state.clone());
1554        saved_count += 1;
1555    }
1556
1557    tracing::info!(
1558        "Bulk projection state saved: {} entities for {}",
1559        saved_count,
1560        name
1561    );
1562
1563    Ok(Json(serde_json::json!({
1564        "projection": name,
1565        "saved": saved_count,
1566        "total": req.states.len()
1567    })))
1568}
1569
1570// =============================================================================
1571// v0.11: Webhook Management API
1572// =============================================================================
1573
1574/// Query parameters for listing webhooks
1575#[derive(Debug, Deserialize)]
1576pub struct ListWebhooksParams {
1577    pub tenant_id: Option<String>,
1578}
1579
1580/// Register a new webhook subscription
1581pub async fn register_webhook(
1582    State(store): State<SharedStore>,
1583    Json(req): Json<RegisterWebhookRequest>,
1584) -> Json<serde_json::Value> {
1585    let registry = store.webhook_registry();
1586    let webhook = registry.register(req);
1587
1588    tracing::info!("Webhook registered: {} -> {}", webhook.id, webhook.url);
1589
1590    Json(serde_json::json!({
1591        "webhook": webhook,
1592        "created": true
1593    }))
1594}
1595
1596/// List webhooks, optionally filtered by tenant_id
1597pub async fn list_webhooks(
1598    State(store): State<SharedStore>,
1599    Query(params): Query<ListWebhooksParams>,
1600) -> Json<serde_json::Value> {
1601    let registry = store.webhook_registry();
1602
1603    let webhooks = if let Some(tenant_id) = params.tenant_id {
1604        registry.list_by_tenant(&tenant_id)
1605    } else {
1606        // Without tenant filter, return empty (tenants should always filter)
1607        vec![]
1608    };
1609
1610    let total = webhooks.len();
1611
1612    Json(serde_json::json!({
1613        "webhooks": webhooks,
1614        "total": total
1615    }))
1616}
1617
1618/// Get a specific webhook by ID
1619pub async fn get_webhook(
1620    State(store): State<SharedStore>,
1621    Path(webhook_id): Path<uuid::Uuid>,
1622) -> Result<Json<serde_json::Value>> {
1623    let registry = store.webhook_registry();
1624
1625    let webhook = registry.get(webhook_id).ok_or_else(|| {
1626        crate::error::AllSourceError::EntityNotFound(format!("Webhook '{}' not found", webhook_id))
1627    })?;
1628
1629    Ok(Json(serde_json::json!({
1630        "webhook": webhook,
1631        "found": true
1632    })))
1633}
1634
1635/// Update a webhook subscription
1636pub async fn update_webhook(
1637    State(store): State<SharedStore>,
1638    Path(webhook_id): Path<uuid::Uuid>,
1639    Json(req): Json<UpdateWebhookRequest>,
1640) -> Result<Json<serde_json::Value>> {
1641    let registry = store.webhook_registry();
1642
1643    let webhook = registry.update(webhook_id, req).ok_or_else(|| {
1644        crate::error::AllSourceError::EntityNotFound(format!("Webhook '{}' not found", webhook_id))
1645    })?;
1646
1647    tracing::info!("Webhook updated: {}", webhook_id);
1648
1649    Ok(Json(serde_json::json!({
1650        "webhook": webhook,
1651        "updated": true
1652    })))
1653}
1654
1655/// Delete a webhook subscription
1656pub async fn delete_webhook(
1657    State(store): State<SharedStore>,
1658    Path(webhook_id): Path<uuid::Uuid>,
1659) -> Result<Json<serde_json::Value>> {
1660    let registry = store.webhook_registry();
1661
1662    let webhook = registry.delete(webhook_id).ok_or_else(|| {
1663        crate::error::AllSourceError::EntityNotFound(format!("Webhook '{}' not found", webhook_id))
1664    })?;
1665
1666    tracing::info!("Webhook deleted: {} ({})", webhook_id, webhook.url);
1667
1668    Ok(Json(serde_json::json!({
1669        "webhook_id": webhook_id,
1670        "deleted": true
1671    })))
1672}
1673
1674/// Query parameters for listing webhook deliveries
1675#[derive(Debug, Deserialize)]
1676pub struct ListDeliveriesParams {
1677    pub limit: Option<usize>,
1678}
1679
1680/// List delivery history for a webhook
1681pub async fn list_webhook_deliveries(
1682    State(store): State<SharedStore>,
1683    Path(webhook_id): Path<uuid::Uuid>,
1684    Query(params): Query<ListDeliveriesParams>,
1685) -> Result<Json<serde_json::Value>> {
1686    let registry = store.webhook_registry();
1687
1688    // Verify webhook exists
1689    registry.get(webhook_id).ok_or_else(|| {
1690        crate::error::AllSourceError::EntityNotFound(format!("Webhook '{}' not found", webhook_id))
1691    })?;
1692
1693    let limit = params.limit.unwrap_or(50);
1694    let deliveries = registry.get_deliveries(webhook_id, limit);
1695    let total = deliveries.len();
1696
1697    Ok(Json(serde_json::json!({
1698        "webhook_id": webhook_id,
1699        "deliveries": deliveries,
1700        "total": total
1701    })))
1702}
1703
1704// =============================================================================
1705// v2.0: Advanced Query Features
1706// =============================================================================
1707
1708/// EventQL: Execute SQL queries over events using DataFusion
1709pub async fn eventql_query(
1710    State(store): State<SharedStore>,
1711    Json(req): Json<EventQLRequest>,
1712) -> Result<Json<serde_json::Value>> {
1713    let events = store.snapshot_events();
1714    match crate::infrastructure::query::eventql::execute_eventql(&events, &req).await {
1715        Ok(response) => Ok(Json(serde_json::json!({
1716            "columns": response.columns,
1717            "rows": response.rows,
1718            "row_count": response.row_count,
1719        }))),
1720        Err(e) => Err(crate::error::AllSourceError::InvalidQuery(e)),
1721    }
1722}
1723
1724/// GraphQL: Execute GraphQL queries
1725pub async fn graphql_query(
1726    State(store): State<SharedStore>,
1727    Json(req): Json<GraphQLRequest>,
1728) -> Json<serde_json::Value> {
1729    let fields = match crate::infrastructure::query::graphql::parse_query(&req.query) {
1730        Ok(f) => f,
1731        Err(e) => {
1732            return Json(
1733                serde_json::to_value(GraphQLResponse {
1734                    data: None,
1735                    errors: vec![GraphQLError { message: e }],
1736                })
1737                .unwrap(),
1738            );
1739        }
1740    };
1741
1742    let mut data = serde_json::Map::new();
1743    let mut errors = Vec::new();
1744
1745    for field in &fields {
1746        match field.name.as_str() {
1747            "events" => {
1748                let request = crate::application::dto::QueryEventsRequest {
1749                    entity_id: field.arguments.get("entity_id").cloned(),
1750                    event_type: field.arguments.get("event_type").cloned(),
1751                    tenant_id: field.arguments.get("tenant_id").cloned(),
1752                    limit: field.arguments.get("limit").and_then(|l| l.parse().ok()),
1753                    as_of: None,
1754                    since: None,
1755                    until: None,
1756                    event_type_prefix: None,
1757                    payload_filter: None,
1758                };
1759                match store.query(request) {
1760                    Ok(events) => {
1761                        let json_events: Vec<serde_json::Value> = events
1762                            .iter()
1763                            .map(|e| {
1764                                crate::infrastructure::query::graphql::event_to_json(
1765                                    e,
1766                                    &field.fields,
1767                                )
1768                            })
1769                            .collect();
1770                        data.insert("events".to_string(), serde_json::Value::Array(json_events));
1771                    }
1772                    Err(e) => errors.push(GraphQLError {
1773                        message: format!("events query failed: {e}"),
1774                    }),
1775                }
1776            }
1777            "event" => {
1778                if let Some(id_str) = field.arguments.get("id") {
1779                    if let Ok(id) = uuid::Uuid::parse_str(id_str) {
1780                        match store.get_event_by_id(&id) {
1781                            Ok(Some(event)) => {
1782                                data.insert(
1783                                    "event".to_string(),
1784                                    crate::infrastructure::query::graphql::event_to_json(
1785                                        &event,
1786                                        &field.fields,
1787                                    ),
1788                                );
1789                            }
1790                            Ok(None) => {
1791                                data.insert("event".to_string(), serde_json::Value::Null);
1792                            }
1793                            Err(e) => errors.push(GraphQLError {
1794                                message: format!("event lookup failed: {e}"),
1795                            }),
1796                        }
1797                    } else {
1798                        errors.push(GraphQLError {
1799                            message: format!("Invalid UUID: {id_str}"),
1800                        });
1801                    }
1802                } else {
1803                    errors.push(GraphQLError {
1804                        message: "event query requires 'id' argument".to_string(),
1805                    });
1806                }
1807            }
1808            "projections" => {
1809                let pm = store.projection_manager();
1810                let names: Vec<serde_json::Value> = pm
1811                    .list_projections()
1812                    .iter()
1813                    .map(|(name, _)| serde_json::Value::String(name.clone()))
1814                    .collect();
1815                data.insert("projections".to_string(), serde_json::Value::Array(names));
1816            }
1817            "stats" => {
1818                let stats = store.stats();
1819                data.insert(
1820                    "stats".to_string(),
1821                    serde_json::json!({
1822                        "total_events": stats.total_events,
1823                        "total_entities": stats.total_entities,
1824                        "total_event_types": stats.total_event_types,
1825                    }),
1826                );
1827            }
1828            "__schema" => {
1829                data.insert(
1830                    "__schema".to_string(),
1831                    crate::infrastructure::query::graphql::introspection_schema(),
1832                );
1833            }
1834            other => {
1835                errors.push(GraphQLError {
1836                    message: format!("Unknown field: {other}"),
1837                });
1838            }
1839        }
1840    }
1841
1842    Json(
1843        serde_json::to_value(GraphQLResponse {
1844            data: Some(serde_json::Value::Object(data)),
1845            errors,
1846        })
1847        .unwrap(),
1848    )
1849}
1850
1851/// Geospatial: Query events by location
1852pub async fn geo_query(
1853    State(store): State<SharedStore>,
1854    Json(req): Json<GeoQueryRequest>,
1855) -> Json<serde_json::Value> {
1856    let events = store.snapshot_events();
1857    let geo_index = store.geo_index();
1858    let results =
1859        crate::infrastructure::query::geospatial::execute_geo_query(&events, &geo_index, &req);
1860    let total = results.len();
1861    Json(serde_json::json!({
1862        "results": results,
1863        "total": total,
1864    }))
1865}
1866
1867/// Geospatial index stats
1868pub async fn geo_stats(State(store): State<SharedStore>) -> Json<serde_json::Value> {
1869    let stats = store.geo_index().stats();
1870    Json(serde_json::json!(stats))
1871}
1872
1873/// Exactly-once processing stats
1874pub async fn exactly_once_stats(State(store): State<SharedStore>) -> Json<serde_json::Value> {
1875    let stats = store.exactly_once().stats();
1876    Json(serde_json::json!(stats))
1877}
1878
1879/// Schema evolution history for an event type
1880pub async fn schema_evolution_history(
1881    State(store): State<SharedStore>,
1882    Path(event_type): Path<String>,
1883) -> Json<serde_json::Value> {
1884    let mgr = store.schema_evolution();
1885    let history = mgr.get_history(&event_type);
1886    let version = mgr.get_version(&event_type);
1887    Json(serde_json::json!({
1888        "event_type": event_type,
1889        "current_version": version,
1890        "history": history,
1891    }))
1892}
1893
1894/// Current inferred schema for an event type
1895pub async fn schema_evolution_schema(
1896    State(store): State<SharedStore>,
1897    Path(event_type): Path<String>,
1898) -> Json<serde_json::Value> {
1899    let mgr = store.schema_evolution();
1900    if let Some(schema) = mgr.get_schema(&event_type) {
1901        let json_schema = crate::application::services::schema_evolution::to_json_schema(&schema);
1902        Json(serde_json::json!({
1903            "event_type": event_type,
1904            "version": mgr.get_version(&event_type),
1905            "inferred_schema": schema,
1906            "json_schema": json_schema,
1907        }))
1908    } else {
1909        Json(serde_json::json!({
1910            "event_type": event_type,
1911            "error": "No schema inferred for this event type"
1912        }))
1913    }
1914}
1915
1916/// Schema evolution stats
1917pub async fn schema_evolution_stats(State(store): State<SharedStore>) -> Json<serde_json::Value> {
1918    let stats = store.schema_evolution().stats();
1919    let event_types = store.schema_evolution().list_event_types();
1920    Json(serde_json::json!({
1921        "stats": stats,
1922        "tracked_event_types": event_types,
1923    }))
1924}
1925
1926#[cfg(test)]
1927mod tests {
1928    use super::*;
1929    use crate::{domain::entities::Event, store::EventStore};
1930
1931    fn create_test_store() -> Arc<EventStore> {
1932        Arc::new(EventStore::new())
1933    }
1934
1935    fn create_test_event(entity_id: &str, event_type: &str) -> Event {
1936        Event::from_strings(
1937            event_type.to_string(),
1938            entity_id.to_string(),
1939            "test-stream".to_string(),
1940            serde_json::json!({
1941                "name": "Test",
1942                "value": 42
1943            }),
1944            None,
1945        )
1946        .unwrap()
1947    }
1948
1949    #[tokio::test]
1950    async fn test_query_events_has_more_and_total_count() {
1951        let store = create_test_store();
1952
1953        // Ingest 50 events
1954        for i in 0..50 {
1955            store
1956                .ingest(create_test_event(&format!("entity-{}", i), "user.created"))
1957                .unwrap();
1958        }
1959
1960        // Query with limit=10 — should get has_more=true, total_count=50
1961        let req = QueryEventsRequest {
1962            entity_id: None,
1963            event_type: None,
1964            tenant_id: None,
1965            as_of: None,
1966            since: None,
1967            until: None,
1968            limit: Some(10),
1969            event_type_prefix: None,
1970            payload_filter: None,
1971        };
1972
1973        let requested_limit = req.limit;
1974        let unlimited_req = QueryEventsRequest {
1975            limit: None,
1976            ..QueryEventsRequest {
1977                entity_id: req.entity_id,
1978                event_type: req.event_type,
1979                tenant_id: req.tenant_id,
1980                as_of: req.as_of,
1981                since: req.since,
1982                until: req.until,
1983                limit: None,
1984                event_type_prefix: req.event_type_prefix,
1985                payload_filter: req.payload_filter,
1986            }
1987        };
1988        let all_events = store.query(unlimited_req).unwrap();
1989        let total_count = all_events.len();
1990        let limited_events: Vec<Event> = if let Some(limit) = requested_limit {
1991            all_events.into_iter().take(limit).collect()
1992        } else {
1993            all_events
1994        };
1995        let count = limited_events.len();
1996        let has_more = count < total_count;
1997
1998        assert_eq!(count, 10);
1999        assert_eq!(total_count, 50);
2000        assert!(has_more);
2001    }
2002
2003    #[tokio::test]
2004    async fn test_query_events_no_more_results() {
2005        let store = create_test_store();
2006
2007        // Ingest 5 events
2008        for i in 0..5 {
2009            store
2010                .ingest(create_test_event(&format!("entity-{}", i), "user.created"))
2011                .unwrap();
2012        }
2013
2014        // Query with limit=100 — should get has_more=false, total_count=5
2015        let all_events = store
2016            .query(QueryEventsRequest {
2017                entity_id: None,
2018                event_type: None,
2019                tenant_id: None,
2020                as_of: None,
2021                since: None,
2022                until: None,
2023                limit: None,
2024                event_type_prefix: None,
2025                payload_filter: None,
2026            })
2027            .unwrap();
2028        let total_count = all_events.len();
2029        let limited_events: Vec<Event> = all_events.into_iter().take(100).collect();
2030        let count = limited_events.len();
2031        let has_more = count < total_count;
2032
2033        assert_eq!(count, 5);
2034        assert_eq!(total_count, 5);
2035        assert!(!has_more);
2036    }
2037
2038    #[tokio::test]
2039    async fn test_list_entities_by_type_prefix() {
2040        let store = create_test_store();
2041
2042        // 3 index entities
2043        store
2044            .ingest(create_test_event("idx-1", "index.created"))
2045            .unwrap();
2046        store
2047            .ingest(create_test_event("idx-1", "index.updated"))
2048            .unwrap();
2049        store
2050            .ingest(create_test_event("idx-2", "index.created"))
2051            .unwrap();
2052        store
2053            .ingest(create_test_event("idx-3", "index.created"))
2054            .unwrap();
2055        // 2 trade entities
2056        store
2057            .ingest(create_test_event("trade-1", "trade.created"))
2058            .unwrap();
2059        store
2060            .ingest(create_test_event("trade-2", "trade.created"))
2061            .unwrap();
2062
2063        // List entities for index.*
2064        let req = ListEntitiesRequest {
2065            event_type_prefix: Some("index.".to_string()),
2066            payload_filter: None,
2067            limit: None,
2068            offset: None,
2069        };
2070        let query_req = QueryEventsRequest {
2071            entity_id: None,
2072            event_type: None,
2073            tenant_id: None,
2074            as_of: None,
2075            since: None,
2076            until: None,
2077            limit: None,
2078            event_type_prefix: req.event_type_prefix,
2079            payload_filter: req.payload_filter,
2080        };
2081        let events = store.query(query_req).unwrap();
2082
2083        // Group and verify
2084        let mut entity_map: std::collections::HashMap<String, Vec<&Event>> =
2085            std::collections::HashMap::new();
2086        for event in &events {
2087            entity_map
2088                .entry(event.entity_id().to_string())
2089                .or_default()
2090                .push(event);
2091        }
2092
2093        assert_eq!(entity_map.len(), 3); // idx-1, idx-2, idx-3
2094        assert_eq!(entity_map["idx-1"].len(), 2); // 2 events for idx-1
2095        assert_eq!(entity_map["idx-2"].len(), 1);
2096        assert_eq!(entity_map["idx-3"].len(), 1);
2097    }
2098
2099    fn create_test_event_with_payload(
2100        entity_id: &str,
2101        event_type: &str,
2102        payload: serde_json::Value,
2103    ) -> Event {
2104        Event::from_strings(
2105            event_type.to_string(),
2106            entity_id.to_string(),
2107            "test-stream".to_string(),
2108            payload,
2109            None,
2110        )
2111        .unwrap()
2112    }
2113
2114    #[tokio::test]
2115    async fn test_detect_duplicates_by_payload_fields() {
2116        let store = create_test_store();
2117
2118        // Create entities with duplicate "name" field values
2119        store
2120            .ingest(create_test_event_with_payload(
2121                "idx-1",
2122                "index.created",
2123                serde_json::json!({"name": "S&P 500", "user_id": "alice"}),
2124            ))
2125            .unwrap();
2126        store
2127            .ingest(create_test_event_with_payload(
2128                "idx-2",
2129                "index.created",
2130                serde_json::json!({"name": "S&P 500", "user_id": "bob"}),
2131            ))
2132            .unwrap();
2133        store
2134            .ingest(create_test_event_with_payload(
2135                "idx-3",
2136                "index.created",
2137                serde_json::json!({"name": "NASDAQ", "user_id": "alice"}),
2138            ))
2139            .unwrap();
2140        store
2141            .ingest(create_test_event_with_payload(
2142                "idx-4",
2143                "index.created",
2144                serde_json::json!({"name": "NASDAQ", "user_id": "carol"}),
2145            ))
2146            .unwrap();
2147        store
2148            .ingest(create_test_event_with_payload(
2149                "idx-5",
2150                "index.created",
2151                serde_json::json!({"name": "DAX", "user_id": "dave"}),
2152            ))
2153            .unwrap();
2154
2155        // Group by name — should find 2 groups: "S&P 500" (idx-1, idx-2) and "NASDAQ" (idx-3, idx-4)
2156        let query_req = QueryEventsRequest {
2157            entity_id: None,
2158            event_type: None,
2159            tenant_id: None,
2160            as_of: None,
2161            since: None,
2162            until: None,
2163            limit: None,
2164            event_type_prefix: Some("index.".to_string()),
2165            payload_filter: None,
2166        };
2167        let events = store.query(query_req).unwrap();
2168
2169        // Manually replicate the handler logic for testing
2170        let group_by_fields = vec!["name"];
2171        let mut entity_latest: std::collections::HashMap<String, &Event> =
2172            std::collections::HashMap::new();
2173        for event in &events {
2174            let eid = event.entity_id().to_string();
2175            entity_latest
2176                .entry(eid)
2177                .and_modify(|existing| {
2178                    if event.timestamp() > existing.timestamp() {
2179                        *existing = event;
2180                    }
2181                })
2182                .or_insert(event);
2183        }
2184
2185        let mut groups: std::collections::HashMap<String, Vec<String>> =
2186            std::collections::HashMap::new();
2187        for (entity_id, event) in &entity_latest {
2188            let payload = event.payload();
2189            let mut key_parts = serde_json::Map::new();
2190            for field in &group_by_fields {
2191                let value = payload
2192                    .get(*field)
2193                    .cloned()
2194                    .unwrap_or(serde_json::Value::Null);
2195                key_parts.insert(field.to_string(), value);
2196            }
2197            let key_str = serde_json::to_string(&key_parts).unwrap_or_default();
2198            groups.entry(key_str).or_default().push(entity_id.clone());
2199        }
2200
2201        let duplicate_groups: Vec<_> = groups
2202            .into_iter()
2203            .filter(|(_, ids)| ids.len() > 1)
2204            .collect();
2205
2206        assert_eq!(duplicate_groups.len(), 2); // S&P 500 and NASDAQ groups
2207        for (_, ids) in &duplicate_groups {
2208            assert_eq!(ids.len(), 2);
2209        }
2210    }
2211
2212    #[tokio::test]
2213    async fn test_detect_duplicates_no_duplicates() {
2214        let store = create_test_store();
2215
2216        // All unique names
2217        store
2218            .ingest(create_test_event_with_payload(
2219                "idx-1",
2220                "index.created",
2221                serde_json::json!({"name": "A"}),
2222            ))
2223            .unwrap();
2224        store
2225            .ingest(create_test_event_with_payload(
2226                "idx-2",
2227                "index.created",
2228                serde_json::json!({"name": "B"}),
2229            ))
2230            .unwrap();
2231
2232        let query_req = QueryEventsRequest {
2233            entity_id: None,
2234            event_type: None,
2235            tenant_id: None,
2236            as_of: None,
2237            since: None,
2238            until: None,
2239            limit: None,
2240            event_type_prefix: Some("index.".to_string()),
2241            payload_filter: None,
2242        };
2243        let events = store.query(query_req).unwrap();
2244
2245        let mut entity_latest: std::collections::HashMap<String, &Event> =
2246            std::collections::HashMap::new();
2247        for event in &events {
2248            entity_latest
2249                .entry(event.entity_id().to_string())
2250                .or_insert(event);
2251        }
2252
2253        let mut groups: std::collections::HashMap<String, Vec<String>> =
2254            std::collections::HashMap::new();
2255        for (entity_id, event) in &entity_latest {
2256            let key_str =
2257                serde_json::to_string(&serde_json::json!({"name": event.payload().get("name")}))
2258                    .unwrap();
2259            groups.entry(key_str).or_default().push(entity_id.clone());
2260        }
2261
2262        let duplicate_groups: Vec<_> = groups
2263            .into_iter()
2264            .filter(|(_, ids)| ids.len() > 1)
2265            .collect();
2266
2267        assert_eq!(duplicate_groups.len(), 0); // No duplicates
2268    }
2269
2270    #[tokio::test]
2271    async fn test_detect_duplicates_multi_field_group_by() {
2272        let store = create_test_store();
2273
2274        // Two entities with same name AND user_id = true duplicate
2275        store
2276            .ingest(create_test_event_with_payload(
2277                "idx-1",
2278                "index.created",
2279                serde_json::json!({"name": "S&P 500", "user_id": "alice"}),
2280            ))
2281            .unwrap();
2282        store
2283            .ingest(create_test_event_with_payload(
2284                "idx-2",
2285                "index.created",
2286                serde_json::json!({"name": "S&P 500", "user_id": "alice"}),
2287            ))
2288            .unwrap();
2289        // Same name but different user_id = NOT a duplicate in multi-field group
2290        store
2291            .ingest(create_test_event_with_payload(
2292                "idx-3",
2293                "index.created",
2294                serde_json::json!({"name": "S&P 500", "user_id": "bob"}),
2295            ))
2296            .unwrap();
2297
2298        let query_req = QueryEventsRequest {
2299            entity_id: None,
2300            event_type: None,
2301            tenant_id: None,
2302            as_of: None,
2303            since: None,
2304            until: None,
2305            limit: None,
2306            event_type_prefix: Some("index.".to_string()),
2307            payload_filter: None,
2308        };
2309        let events = store.query(query_req).unwrap();
2310
2311        let group_by_fields = vec!["name", "user_id"];
2312        let mut entity_latest: std::collections::HashMap<String, &Event> =
2313            std::collections::HashMap::new();
2314        for event in &events {
2315            entity_latest
2316                .entry(event.entity_id().to_string())
2317                .and_modify(|existing| {
2318                    if event.timestamp() > existing.timestamp() {
2319                        *existing = event;
2320                    }
2321                })
2322                .or_insert(event);
2323        }
2324
2325        let mut groups: std::collections::HashMap<String, Vec<String>> =
2326            std::collections::HashMap::new();
2327        for (entity_id, event) in &entity_latest {
2328            let payload = event.payload();
2329            let mut key_parts = serde_json::Map::new();
2330            for field in &group_by_fields {
2331                let value = payload
2332                    .get(*field)
2333                    .cloned()
2334                    .unwrap_or(serde_json::Value::Null);
2335                key_parts.insert(field.to_string(), value);
2336            }
2337            let key_str = serde_json::to_string(&key_parts).unwrap_or_default();
2338            groups.entry(key_str).or_default().push(entity_id.clone());
2339        }
2340
2341        let duplicate_groups: Vec<_> = groups
2342            .into_iter()
2343            .filter(|(_, ids)| ids.len() > 1)
2344            .collect();
2345
2346        // Only 1 duplicate group: name=S&P 500, user_id=alice (idx-1, idx-2)
2347        assert_eq!(duplicate_groups.len(), 1);
2348        let (_, ref ids) = duplicate_groups[0];
2349        assert_eq!(ids.len(), 2);
2350        let mut sorted_ids = ids.clone();
2351        sorted_ids.sort();
2352        assert_eq!(sorted_ids, vec!["idx-1", "idx-2"]);
2353    }
2354
2355    #[tokio::test]
2356    async fn test_projection_state_cache() {
2357        let store = create_test_store();
2358
2359        // Test cache insertion
2360        let cache = store.projection_state_cache();
2361        cache.insert(
2362            "entity_snapshots:user-123".to_string(),
2363            serde_json::json!({"name": "Test User", "age": 30}),
2364        );
2365
2366        // Test cache retrieval
2367        let state = cache.get("entity_snapshots:user-123");
2368        assert!(state.is_some());
2369        let state = state.unwrap();
2370        assert_eq!(state["name"], "Test User");
2371        assert_eq!(state["age"], 30);
2372    }
2373
2374    #[tokio::test]
2375    async fn test_projection_manager_list_projections() {
2376        let store = create_test_store();
2377
2378        // List projections (built-in projections should be available)
2379        let projection_manager = store.projection_manager();
2380        let projections = projection_manager.list_projections();
2381
2382        // Should have entity_snapshots and event_counters
2383        assert!(projections.len() >= 2);
2384
2385        let names: Vec<&str> = projections.iter().map(|(name, _)| name.as_str()).collect();
2386        assert!(names.contains(&"entity_snapshots"));
2387        assert!(names.contains(&"event_counters"));
2388    }
2389
2390    #[tokio::test]
2391    async fn test_projection_state_after_event_ingestion() {
2392        let store = create_test_store();
2393
2394        // Ingest an event
2395        let event = create_test_event("user-456", "user.created");
2396        store.ingest(event).unwrap();
2397
2398        // Get projection state
2399        let projection_manager = store.projection_manager();
2400        let snapshot_projection = projection_manager
2401            .get_projection("entity_snapshots")
2402            .unwrap();
2403
2404        let state = snapshot_projection.get_state("user-456");
2405        assert!(state.is_some());
2406        let state = state.unwrap();
2407        assert_eq!(state["name"], "Test");
2408        assert_eq!(state["value"], 42);
2409    }
2410
2411    #[tokio::test]
2412    async fn test_projection_state_cache_multiple_entities() {
2413        let store = create_test_store();
2414        let cache = store.projection_state_cache();
2415
2416        // Insert multiple entities
2417        for i in 0..10 {
2418            cache.insert(
2419                format!("entity_snapshots:entity-{}", i),
2420                serde_json::json!({"id": i, "status": "active"}),
2421            );
2422        }
2423
2424        // Verify all insertions
2425        assert_eq!(cache.len(), 10);
2426
2427        // Verify each entity
2428        for i in 0..10 {
2429            let key = format!("entity_snapshots:entity-{}", i);
2430            let state = cache.get(&key);
2431            assert!(state.is_some());
2432            assert_eq!(state.unwrap()["id"], i);
2433        }
2434    }
2435
2436    #[tokio::test]
2437    async fn test_projection_state_update() {
2438        let store = create_test_store();
2439        let cache = store.projection_state_cache();
2440
2441        // Initial state
2442        cache.insert(
2443            "entity_snapshots:user-789".to_string(),
2444            serde_json::json!({"balance": 100}),
2445        );
2446
2447        // Update state
2448        cache.insert(
2449            "entity_snapshots:user-789".to_string(),
2450            serde_json::json!({"balance": 150}),
2451        );
2452
2453        // Verify update
2454        let state = cache.get("entity_snapshots:user-789").unwrap();
2455        assert_eq!(state["balance"], 150);
2456    }
2457
2458    #[tokio::test]
2459    async fn test_event_counter_projection() {
2460        let store = create_test_store();
2461
2462        // Ingest events of different types
2463        store
2464            .ingest(create_test_event("user-1", "user.created"))
2465            .unwrap();
2466        store
2467            .ingest(create_test_event("user-2", "user.created"))
2468            .unwrap();
2469        store
2470            .ingest(create_test_event("user-1", "user.updated"))
2471            .unwrap();
2472
2473        // Get event counter projection
2474        let projection_manager = store.projection_manager();
2475        let counter_projection = projection_manager.get_projection("event_counters").unwrap();
2476
2477        // Check counts
2478        let created_state = counter_projection.get_state("user.created");
2479        assert!(created_state.is_some());
2480        assert_eq!(created_state.unwrap()["count"], 2);
2481
2482        let updated_state = counter_projection.get_state("user.updated");
2483        assert!(updated_state.is_some());
2484        assert_eq!(updated_state.unwrap()["count"], 1);
2485    }
2486
2487    #[tokio::test]
2488    async fn test_projection_state_cache_key_format() {
2489        let store = create_test_store();
2490        let cache = store.projection_state_cache();
2491
2492        // Test standard key format: {projection_name}:{entity_id}
2493        let key = "orders:order-12345".to_string();
2494        cache.insert(key.clone(), serde_json::json!({"total": 99.99}));
2495
2496        let state = cache.get(&key).unwrap();
2497        assert_eq!(state["total"], 99.99);
2498    }
2499
2500    #[tokio::test]
2501    async fn test_projection_state_cache_removal() {
2502        let store = create_test_store();
2503        let cache = store.projection_state_cache();
2504
2505        // Insert and then remove
2506        cache.insert(
2507            "test:entity-1".to_string(),
2508            serde_json::json!({"data": "value"}),
2509        );
2510        assert_eq!(cache.len(), 1);
2511
2512        cache.remove("test:entity-1");
2513        assert_eq!(cache.len(), 0);
2514        assert!(cache.get("test:entity-1").is_none());
2515    }
2516
2517    #[tokio::test]
2518    async fn test_get_nonexistent_projection() {
2519        let store = create_test_store();
2520        let projection_manager = store.projection_manager();
2521
2522        // Requesting a non-existent projection should return None
2523        let projection = projection_manager.get_projection("nonexistent_projection");
2524        assert!(projection.is_none());
2525    }
2526
2527    #[tokio::test]
2528    async fn test_get_nonexistent_entity_state() {
2529        let store = create_test_store();
2530        let projection_manager = store.projection_manager();
2531
2532        // Get state for non-existent entity
2533        let snapshot_projection = projection_manager
2534            .get_projection("entity_snapshots")
2535            .unwrap();
2536        let state = snapshot_projection.get_state("nonexistent-entity-xyz");
2537        assert!(state.is_none());
2538    }
2539
2540    #[tokio::test]
2541    async fn test_projection_state_cache_concurrent_access() {
2542        let store = create_test_store();
2543        let cache = store.projection_state_cache();
2544
2545        // Simulate concurrent writes
2546        let handles: Vec<_> = (0..10)
2547            .map(|i| {
2548                let cache_clone = cache.clone();
2549                tokio::spawn(async move {
2550                    cache_clone.insert(
2551                        format!("concurrent:entity-{}", i),
2552                        serde_json::json!({"thread": i}),
2553                    );
2554                })
2555            })
2556            .collect();
2557
2558        for handle in handles {
2559            handle.await.unwrap();
2560        }
2561
2562        // All 10 entries should be present
2563        assert_eq!(cache.len(), 10);
2564    }
2565
2566    #[tokio::test]
2567    async fn test_projection_state_large_payload() {
2568        let store = create_test_store();
2569        let cache = store.projection_state_cache();
2570
2571        // Create a large JSON payload (~10KB)
2572        let large_array: Vec<serde_json::Value> = (0..1000)
2573            .map(|i| serde_json::json!({"item": i, "description": "test item with some padding data to increase size"}))
2574            .collect();
2575
2576        cache.insert(
2577            "large:entity-1".to_string(),
2578            serde_json::json!({"items": large_array}),
2579        );
2580
2581        let state = cache.get("large:entity-1").unwrap();
2582        let items = state["items"].as_array().unwrap();
2583        assert_eq!(items.len(), 1000);
2584    }
2585
2586    #[tokio::test]
2587    async fn test_projection_state_complex_json() {
2588        let store = create_test_store();
2589        let cache = store.projection_state_cache();
2590
2591        // Complex nested JSON structure
2592        let complex_state = serde_json::json!({
2593            "user": {
2594                "id": "user-123",
2595                "profile": {
2596                    "name": "John Doe",
2597                    "email": "john@example.com",
2598                    "settings": {
2599                        "theme": "dark",
2600                        "notifications": true
2601                    }
2602                },
2603                "roles": ["admin", "user"],
2604                "metadata": {
2605                    "created_at": "2025-01-01T00:00:00Z",
2606                    "last_login": null
2607                }
2608            }
2609        });
2610
2611        cache.insert("complex:user-123".to_string(), complex_state);
2612
2613        let state = cache.get("complex:user-123").unwrap();
2614        assert_eq!(state["user"]["profile"]["name"], "John Doe");
2615        assert_eq!(state["user"]["roles"][0], "admin");
2616        assert!(state["user"]["metadata"]["last_login"].is_null());
2617    }
2618
2619    #[tokio::test]
2620    async fn test_projection_state_cache_iteration() {
2621        let store = create_test_store();
2622        let cache = store.projection_state_cache();
2623
2624        // Insert entries
2625        for i in 0..5 {
2626            cache.insert(
2627                format!("iter:entity-{}", i),
2628                serde_json::json!({"index": i}),
2629            );
2630        }
2631
2632        // Iterate over all entries
2633        let entries: Vec<_> = cache.iter().map(|entry| entry.key().clone()).collect();
2634        assert_eq!(entries.len(), 5);
2635    }
2636
2637    #[tokio::test]
2638    async fn test_projection_manager_get_entity_snapshots() {
2639        let store = create_test_store();
2640        let projection_manager = store.projection_manager();
2641
2642        // Get entity_snapshots projection specifically
2643        let projection = projection_manager.get_projection("entity_snapshots");
2644        assert!(projection.is_some());
2645        assert_eq!(projection.unwrap().name(), "entity_snapshots");
2646    }
2647
2648    #[tokio::test]
2649    async fn test_projection_manager_get_event_counters() {
2650        let store = create_test_store();
2651        let projection_manager = store.projection_manager();
2652
2653        // Get event_counters projection specifically
2654        let projection = projection_manager.get_projection("event_counters");
2655        assert!(projection.is_some());
2656        assert_eq!(projection.unwrap().name(), "event_counters");
2657    }
2658
2659    #[tokio::test]
2660    async fn test_projection_state_cache_overwrite() {
2661        let store = create_test_store();
2662        let cache = store.projection_state_cache();
2663
2664        // Initial value
2665        cache.insert(
2666            "overwrite:entity-1".to_string(),
2667            serde_json::json!({"version": 1}),
2668        );
2669
2670        // Overwrite with new value
2671        cache.insert(
2672            "overwrite:entity-1".to_string(),
2673            serde_json::json!({"version": 2}),
2674        );
2675
2676        // Overwrite again
2677        cache.insert(
2678            "overwrite:entity-1".to_string(),
2679            serde_json::json!({"version": 3}),
2680        );
2681
2682        let state = cache.get("overwrite:entity-1").unwrap();
2683        assert_eq!(state["version"], 3);
2684
2685        // Should still be only 1 entry
2686        assert_eq!(cache.len(), 1);
2687    }
2688
2689    #[tokio::test]
2690    async fn test_projection_state_multiple_projections() {
2691        let store = create_test_store();
2692        let cache = store.projection_state_cache();
2693
2694        // Store states for different projections
2695        cache.insert(
2696            "entity_snapshots:user-1".to_string(),
2697            serde_json::json!({"name": "Alice"}),
2698        );
2699        cache.insert(
2700            "event_counters:user.created".to_string(),
2701            serde_json::json!({"count": 5}),
2702        );
2703        cache.insert(
2704            "custom_projection:order-1".to_string(),
2705            serde_json::json!({"total": 150.0}),
2706        );
2707
2708        // Verify each projection's state
2709        assert_eq!(
2710            cache.get("entity_snapshots:user-1").unwrap()["name"],
2711            "Alice"
2712        );
2713        assert_eq!(
2714            cache.get("event_counters:user.created").unwrap()["count"],
2715            5
2716        );
2717        assert_eq!(
2718            cache.get("custom_projection:order-1").unwrap()["total"],
2719            150.0
2720        );
2721    }
2722
2723    #[tokio::test]
2724    async fn test_bulk_projection_state_access() {
2725        let store = create_test_store();
2726
2727        // Ingest multiple events for different entities
2728        for i in 0..5 {
2729            let event = create_test_event(&format!("bulk-user-{}", i), "user.created");
2730            store.ingest(event).unwrap();
2731        }
2732
2733        // Get projection and verify bulk access
2734        let projection_manager = store.projection_manager();
2735        let snapshot_projection = projection_manager
2736            .get_projection("entity_snapshots")
2737            .unwrap();
2738
2739        // Verify we can access all entities
2740        for i in 0..5 {
2741            let state = snapshot_projection.get_state(&format!("bulk-user-{}", i));
2742            assert!(state.is_some(), "Entity bulk-user-{} should have state", i);
2743        }
2744    }
2745
2746    #[tokio::test]
2747    async fn test_bulk_save_projection_states() {
2748        let store = create_test_store();
2749        let cache = store.projection_state_cache();
2750
2751        // Simulate bulk save request
2752        let states = vec![
2753            BulkSaveStateItem {
2754                entity_id: "bulk-entity-1".to_string(),
2755                state: serde_json::json!({"name": "Entity 1", "value": 100}),
2756            },
2757            BulkSaveStateItem {
2758                entity_id: "bulk-entity-2".to_string(),
2759                state: serde_json::json!({"name": "Entity 2", "value": 200}),
2760            },
2761            BulkSaveStateItem {
2762                entity_id: "bulk-entity-3".to_string(),
2763                state: serde_json::json!({"name": "Entity 3", "value": 300}),
2764            },
2765        ];
2766
2767        let projection_name = "test_projection";
2768
2769        // Save states to cache (simulating bulk_save_projection_states handler)
2770        for item in &states {
2771            cache.insert(
2772                format!("{projection_name}:{}", item.entity_id),
2773                item.state.clone(),
2774            );
2775        }
2776
2777        // Verify all states were saved
2778        assert_eq!(cache.len(), 3);
2779
2780        let state1 = cache.get("test_projection:bulk-entity-1").unwrap();
2781        assert_eq!(state1["name"], "Entity 1");
2782        assert_eq!(state1["value"], 100);
2783
2784        let state2 = cache.get("test_projection:bulk-entity-2").unwrap();
2785        assert_eq!(state2["name"], "Entity 2");
2786        assert_eq!(state2["value"], 200);
2787
2788        let state3 = cache.get("test_projection:bulk-entity-3").unwrap();
2789        assert_eq!(state3["name"], "Entity 3");
2790        assert_eq!(state3["value"], 300);
2791    }
2792
2793    #[tokio::test]
2794    async fn test_bulk_save_empty_states() {
2795        let store = create_test_store();
2796        let cache = store.projection_state_cache();
2797
2798        // Clear cache
2799        cache.clear();
2800
2801        // Empty states should work fine
2802        let states: Vec<BulkSaveStateItem> = vec![];
2803        assert_eq!(states.len(), 0);
2804
2805        // Cache should remain empty
2806        assert_eq!(cache.len(), 0);
2807    }
2808
2809    #[tokio::test]
2810    async fn test_bulk_save_overwrites_existing() {
2811        let store = create_test_store();
2812        let cache = store.projection_state_cache();
2813
2814        // Insert initial state
2815        cache.insert(
2816            "test:entity-1".to_string(),
2817            serde_json::json!({"version": 1, "data": "initial"}),
2818        );
2819
2820        // Bulk save with updated state
2821        let new_state = serde_json::json!({"version": 2, "data": "updated"});
2822        cache.insert("test:entity-1".to_string(), new_state);
2823
2824        // Verify overwrite
2825        let state = cache.get("test:entity-1").unwrap();
2826        assert_eq!(state["version"], 2);
2827        assert_eq!(state["data"], "updated");
2828    }
2829
2830    #[tokio::test]
2831    async fn test_bulk_save_high_volume() {
2832        let store = create_test_store();
2833        let cache = store.projection_state_cache();
2834
2835        // Simulate high volume save (1000 entities)
2836        for i in 0..1000 {
2837            cache.insert(
2838                format!("volume_test:entity-{}", i),
2839                serde_json::json!({"index": i, "status": "active"}),
2840            );
2841        }
2842
2843        // Verify count
2844        assert_eq!(cache.len(), 1000);
2845
2846        // Spot check some entries
2847        assert_eq!(cache.get("volume_test:entity-0").unwrap()["index"], 0);
2848        assert_eq!(cache.get("volume_test:entity-500").unwrap()["index"], 500);
2849        assert_eq!(cache.get("volume_test:entity-999").unwrap()["index"], 999);
2850    }
2851
2852    #[tokio::test]
2853    async fn test_bulk_save_different_projections() {
2854        let store = create_test_store();
2855        let cache = store.projection_state_cache();
2856
2857        // Save to multiple projections in bulk
2858        let projections = ["entity_snapshots", "event_counters", "custom_analytics"];
2859
2860        for proj in projections.iter() {
2861            for i in 0..5 {
2862                cache.insert(
2863                    format!("{proj}:entity-{i}"),
2864                    serde_json::json!({"projection": proj, "id": i}),
2865                );
2866            }
2867        }
2868
2869        // Verify total count (3 projections * 5 entities)
2870        assert_eq!(cache.len(), 15);
2871
2872        // Verify each projection
2873        for proj in projections.iter() {
2874            let state = cache.get(&format!("{proj}:entity-0")).unwrap();
2875            assert_eq!(state["projection"], *proj);
2876        }
2877    }
2878}