use std::collections::HashMap;
use std::sync::Arc;
use std::sync::atomic::{AtomicUsize, Ordering};
use std::time::{Duration, Instant};
use blazen_events::{AnyEvent, DynamicEvent, Event, EventEnvelope, InputRequestEvent, StopEvent};
use chrono::Utc;
use tokio::sync::{mpsc, oneshot};
use tokio::task::JoinSet;
use uuid::Uuid;
use tracing::Instrument;
use crate::builder::InputHandlerFn;
use crate::context::Context;
use crate::error::WorkflowError;
use crate::handler::WorkflowControl;
use crate::session_ref::{
RefLifetime, SERIALIZED_SESSION_REFS_META_KEY, SessionPausePolicy, SessionRefRegistry,
};
use crate::snapshot::{SNAPSHOT_VERSION, WorkflowSnapshot};
use crate::step::{StepOutput, StepRegistration};
/// Auto-checkpoint settings handed to the event loop.
///
/// Only compiled when the `persist` feature is enabled.
#[cfg(feature = "persist")]
pub(crate) struct CheckpointConfig {
/// Store that receives checkpoints. When `None`, the event loop never
/// writes a checkpoint regardless of `after_step`.
pub(crate) store: Option<Arc<dyn blazen_persist::CheckpointStore>>,
/// When `true` (and `store` is set), the event loop saves a checkpoint
/// after each event has been dispatched to its step handlers.
pub(crate) after_step: bool,
}
/// Captures the current context as a [`WorkflowSnapshot`], converts it into a
/// `blazen_persist::WorkflowCheckpoint` and writes it to `store`.
///
/// Saving is best-effort: a failed write is logged at `warn` level and never
/// propagated to the caller. `pending_events` is always stored empty.
#[cfg(feature = "persist")]
async fn save_checkpoint(
    store: &dyn blazen_persist::CheckpointStore,
    ctx: &Context,
    workflow_name: &str,
    run_id: Uuid,
    #[cfg(feature = "telemetry")] history_buffer: &[blazen_telemetry::HistoryEvent],
) {
    // Gather the three context views in the same order every time.
    let state = ctx.snapshot_state().await;
    let collected = ctx.snapshot_collected().await;
    let meta = ctx.snapshot_metadata().await;
    #[cfg(feature = "telemetry")]
    let recorded_history = history_buffer.to_vec();

    let checkpoint: blazen_persist::WorkflowCheckpoint = WorkflowSnapshot {
        version: SNAPSHOT_VERSION,
        workflow_name: workflow_name.to_owned(),
        run_id,
        timestamp: Utc::now(),
        context_state: state,
        collected_events: collected,
        pending_events: Vec::new(),
        metadata: meta,
        #[cfg(feature = "telemetry")]
        history: recorded_history,
    }
    .into();

    match store.save(&checkpoint).await {
        Ok(_) => {
            tracing::debug!(run_id = %run_id, "auto-checkpoint saved");
        }
        Err(save_err) => {
            tracing::warn!(
                run_id = %run_id,
                error = %save_err,
                "auto-checkpoint failed (best-effort)"
            );
        }
    }
}
/// Entry point of a workflow run.
///
/// Runs [`event_loop_inner`] inside a `workflow.run` tracing span and, once
/// the inner loop has returned (for whatever reason), signals end-of-stream
/// on the context so stream consumers can finish.
#[allow(clippy::too_many_arguments, clippy::too_many_lines)]
pub(crate) async fn event_loop(
    event_rx: mpsc::UnboundedReceiver<EventEnvelope>,
    event_tx: mpsc::UnboundedSender<EventEnvelope>,
    registry: HashMap<String, Vec<StepRegistration>>,
    ctx: Context,
    result_tx: oneshot::Sender<Result<Box<dyn AnyEvent>, WorkflowError>>,
    timeout: Option<Duration>,
    control_rx: mpsc::UnboundedReceiver<WorkflowControl>,
    workflow_name: String,
    run_id: Uuid,
    input_handler: Option<InputHandlerFn>,
    auto_publish_events: bool,
    #[cfg(feature = "persist")] checkpoint_config: CheckpointConfig,
    #[cfg(feature = "telemetry")] history_tx: Option<
        mpsc::UnboundedSender<blazen_telemetry::HistoryEvent>,
    >,
) {
    // Keep a handle to the context: `ctx` itself is moved into the inner loop.
    let end_of_stream_ctx = ctx.clone();
    let run_span = tracing::info_span!(
        "workflow.run",
        workflow_name = %workflow_name,
        run_id = %run_id,
    );

    let inner_loop = event_loop_inner(
        event_rx,
        event_tx,
        registry,
        ctx,
        result_tx,
        timeout,
        control_rx,
        workflow_name,
        run_id,
        input_handler,
        auto_publish_events,
        #[cfg(feature = "persist")]
        checkpoint_config,
        #[cfg(feature = "telemetry")]
        history_tx,
    );
    inner_loop.instrument(run_span).await;

    end_of_stream_ctx.signal_stream_end().await;
}
/// Records one history event.
///
/// A copy is forwarded to `tx` when a sender is present (a closed receiver is
/// silently ignored), and the event itself is always appended to `buffer`.
#[cfg(feature = "telemetry")]
fn emit_history(
    tx: Option<&mpsc::UnboundedSender<blazen_telemetry::HistoryEvent>>,
    buffer: &mut Vec<blazen_telemetry::HistoryEvent>,
    event: blazen_telemetry::HistoryEvent,
) {
    if let Some(live_sender) = tx {
        let forwarded = event.clone();
        // Forwarding is best-effort; the buffer below is the durable record.
        let _ = live_sender.send(forwarded);
    }
    buffer.push(event);
}
/// Core event loop of a single workflow run.
///
/// Each iteration waits, in `biased` (top-to-bottom) priority order, on:
/// 1. a failure reported by a spawned step task (`error_rx`),
/// 2. the next event (`event_rx`) - skipped while the loop is parked,
/// 3. the overall timeout (only when `timeout` is `Some`),
/// 4. a control message (`control_rx`).
///
/// A received event is then handled as follows:
/// - `StopEvent`: the run finishes and `Ok(final_event)` is sent on `result_tx`;
/// - `InputRequestEvent`: answered by `input_handler` if one is configured,
///   otherwise the request is stored in metadata and the loop parks;
/// - anything else: dispatched to the handlers registered for its type in
///   `registry`, or the run fails with `WorkflowError::NoHandler`.
///
/// The function returns after sending exactly one value on `result_tx`
/// (send failures are ignored). Returning drops `in_flight`; per tokio's
/// `JoinSet` documentation this aborts any step tasks that are still running.
///
/// With the `telemetry` feature, every history event emitted here is also kept
/// in a local buffer that is included in snapshots and checkpoints.
#[allow(clippy::too_many_arguments, clippy::too_many_lines)]
async fn event_loop_inner(
mut event_rx: mpsc::UnboundedReceiver<EventEnvelope>,
event_tx: mpsc::UnboundedSender<EventEnvelope>,
registry: HashMap<String, Vec<StepRegistration>>,
ctx: Context,
result_tx: oneshot::Sender<Result<Box<dyn AnyEvent>, WorkflowError>>,
timeout: Option<Duration>,
mut control_rx: mpsc::UnboundedReceiver<WorkflowControl>,
workflow_name: String,
run_id: Uuid,
input_handler: Option<InputHandlerFn>,
auto_publish_events: bool,
#[cfg(feature = "persist")] checkpoint_config: CheckpointConfig,
#[cfg(feature = "telemetry")] history_tx: Option<
mpsc::UnboundedSender<blazen_telemetry::HistoryEvent>,
>,
) {
// Reference point for both the timeout budget and all reported durations.
let start = Instant::now();
#[cfg(feature = "telemetry")]
let mut history_buffer: Vec<blazen_telemetry::HistoryEvent> = Vec::new();
// NOTE(review): every history event in this function is emitted with
// `sequence: 0` - presumably the real sequence number is assigned by the
// consumer; confirm.
#[cfg(feature = "telemetry")]
emit_history(
history_tx.as_ref(),
&mut history_buffer,
blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::WorkflowStarted {
input: serde_json::json!({}),
},
},
);
// Spawned step tasks report their failures through this channel.
let (error_tx, mut error_rx) = mpsc::unbounded_channel::<WorkflowError>();
// Owns the spawned step tasks for the lifetime of the loop.
let mut in_flight: JoinSet<()> = JoinSet::new();
// Incremented/decremented by `dispatch_to_handlers`; not read in this function.
let in_flight_count = Arc::new(AtomicUsize::new(0));
// While `true`, the event-receive branch of `select!` is disabled; errors,
// the timeout and control messages are still processed.
let mut parked = false;
// Builds a `blazen::lifecycle` dynamic event from the given optional fields
// and writes it to the context's stream. Arguments are copied into owned
// values so the returned future does not borrow from the caller.
let publish_lifecycle = |ctx: &Context,
kind: &str,
step_name: Option<&str>,
event_type_str: Option<&str>,
duration_ms: Option<u64>,
error: Option<&str>| {
let ctx = ctx.clone();
let kind = kind.to_owned();
let step_name = step_name.map(ToOwned::to_owned);
let event_type_str = event_type_str.map(ToOwned::to_owned);
let error = error.map(ToOwned::to_owned);
async move {
let mut data = serde_json::Map::new();
data.insert("kind".into(), serde_json::Value::String(kind));
if let Some(s) = step_name {
data.insert("step_name".into(), serde_json::Value::String(s));
}
if let Some(e) = event_type_str {
data.insert("event_type".into(), serde_json::Value::String(e));
}
if let Some(d) = duration_ms {
data.insert("duration_ms".into(), serde_json::Value::Number(d.into()));
}
if let Some(e) = error {
data.insert("error".into(), serde_json::Value::String(e));
}
ctx.write_event_to_stream(DynamicEvent {
event_type: "blazen::lifecycle".to_owned(),
data: serde_json::Value::Object(data),
})
.await;
}
};
loop {
// `recv_result` is `Ok(envelope)` for a received event and `Err(())` when
// the event channel is closed. Every other `select!` branch either
// `continue`s or `return`s and therefore never produces a value here.
let recv_result = if let Some(timeout_dur) = timeout {
// The budget is recomputed from `start` on every iteration, so the
// timeout covers the whole run, including time spent parked.
let remaining = timeout_dur.saturating_sub(start.elapsed());
if remaining.is_zero() {
#[cfg(feature = "telemetry")]
emit_history(
history_tx.as_ref(),
&mut history_buffer,
blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::WorkflowTimedOut {
elapsed_ms: u64::try_from(start.elapsed().as_millis())
.unwrap_or(u64::MAX),
},
},
);
let _ = result_tx.send(Err(WorkflowError::Timeout {
elapsed: start.elapsed(),
}));
return;
}
tokio::select! {
// `biased` polls the branches in the order written, so a pending
// step failure wins over a pending event.
biased;
err = error_rx.recv() => {
if let Some(workflow_err) = err {
#[cfg(feature = "telemetry")]
emit_history(
history_tx.as_ref(),
&mut history_buffer,
blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::WorkflowFailed {
error: workflow_err.to_string(),
duration_ms: u64::try_from(start.elapsed().as_millis()).unwrap_or(u64::MAX),
},
},
);
let _ = result_tx.send(Err(workflow_err));
return;
}
// `None` would mean every error sender is gone; `error_tx` is
// still owned by this function, so this is not expected.
continue;
}
maybe_envelope = event_rx.recv(), if !parked => {
maybe_envelope.ok_or(())
}
() = tokio::time::sleep(remaining) => {
#[cfg(feature = "telemetry")]
emit_history(
history_tx.as_ref(),
&mut history_buffer,
blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::WorkflowTimedOut {
elapsed_ms: u64::try_from(start.elapsed().as_millis()).unwrap_or(u64::MAX),
},
},
);
let _ = result_tx.send(Err(WorkflowError::Timeout {
elapsed: start.elapsed(),
}));
return;
}
// The `Some(..)` pattern disables this branch once the control
// channel is closed.
Some(control) = control_rx.recv() => {
match control {
WorkflowControl::Pause => {
// Stop pulling events; in-flight step tasks are not touched here.
parked = true;
#[cfg(feature = "telemetry")]
emit_history(
history_tx.as_ref(),
&mut history_buffer,
blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::WorkflowPaused {
reason: blazen_telemetry::PauseReason::Manual,
pending_count: 0,
},
},
);
continue;
}
WorkflowControl::Resume => {
// No history event is emitted for a resume.
parked = false;
continue;
}
WorkflowControl::Snapshot { reply } => {
// Build the snapshot without stopping the loop; a dropped
// `reply` receiver is ignored.
let snap = build_snapshot_in_place(
&ctx,
&workflow_name,
run_id,
#[cfg(feature = "telemetry")]
&history_buffer,
).await;
let _ = reply.send(snap);
continue;
}
WorkflowControl::Abort => {
// NOTE(review): an abort is reported to the caller as
// `WorkflowError::Paused` - confirm this is intended.
let _ = result_tx.send(Err(WorkflowError::Paused));
return;
}
WorkflowControl::InputResponse(response) => {
// Unpark and re-inject the response as a regular event so
// that a later iteration routes it to its handlers.
parked = false;
let envelope = EventEnvelope::new(
Box::new(response),
Some("__human_input".into()),
);
let _ = event_tx.send(envelope);
continue;
}
}
}
}
} else {
// Same as the branch above, minus the timeout arm.
tokio::select! {
biased;
err = error_rx.recv() => {
if let Some(workflow_err) = err {
#[cfg(feature = "telemetry")]
emit_history(
history_tx.as_ref(),
&mut history_buffer,
blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::WorkflowFailed {
error: workflow_err.to_string(),
duration_ms: u64::try_from(start.elapsed().as_millis()).unwrap_or(u64::MAX),
},
},
);
let _ = result_tx.send(Err(workflow_err));
return;
}
continue;
}
maybe_envelope = event_rx.recv(), if !parked => {
maybe_envelope.ok_or(())
}
Some(control) = control_rx.recv() => {
match control {
WorkflowControl::Pause => {
parked = true;
#[cfg(feature = "telemetry")]
emit_history(
history_tx.as_ref(),
&mut history_buffer,
blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::WorkflowPaused {
reason: blazen_telemetry::PauseReason::Manual,
pending_count: 0,
},
},
);
continue;
}
WorkflowControl::Resume => {
parked = false;
continue;
}
WorkflowControl::Snapshot { reply } => {
let snap = build_snapshot_in_place(
&ctx,
&workflow_name,
run_id,
#[cfg(feature = "telemetry")]
&history_buffer,
).await;
let _ = reply.send(snap);
continue;
}
WorkflowControl::Abort => {
// NOTE(review): reported as `WorkflowError::Paused`, as in the
// timeout-enabled branch - confirm this is intended.
let _ = result_tx.send(Err(WorkflowError::Paused));
return;
}
WorkflowControl::InputResponse(response) => {
parked = false;
let envelope = EventEnvelope::new(
Box::new(response),
Some("__human_input".into()),
);
let _ = event_tx.send(envelope);
continue;
}
}
}
}
};
// `Err(())` means `event_rx.recv()` returned `None`: the event channel is closed.
let Ok(envelope) = recv_result else {
let _ = result_tx.send(Err(WorkflowError::ChannelClosed));
return;
};
// Partial move: `envelope.source_step` is still read below.
let event = envelope.event;
let event_type = event.event_type_id();
#[cfg(feature = "telemetry")]
emit_history(
history_tx.as_ref(),
&mut history_buffer,
blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::EventReceived {
event_type: event_type.to_string(),
source_step: envelope.source_step.clone(),
},
},
);
if auto_publish_events {
publish_lifecycle(&ctx, "event_routed", None, Some(event_type), None, None).await;
}
{
// The span guard is dropped at the end of this block, so only the debug
// log below is recorded inside `workflow.event`.
let _event_span = tracing::debug_span!(
"workflow.event",
event_type = %event_type,
source_step = ?envelope.source_step,
)
.entered();
tracing::debug!(
event_type,
source_step = ?envelope.source_step,
"event loop received event"
);
}
// --- StopEvent: finish the run successfully -----------------------------
if event_type == StopEvent::event_type() {
tracing::info!("workflow completed via StopEvent");
#[cfg(feature = "telemetry")]
emit_history(
history_tx.as_ref(),
&mut history_buffer,
blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::WorkflowCompleted {
duration_ms: u64::try_from(start.elapsed().as_millis()).unwrap_or(u64::MAX),
},
},
);
// Normalise whatever carried the stop type id into a concrete `StopEvent`:
// a typed `StopEvent` is passed through unchanged; a `DynamicEvent` is
// deserialized, falling back to wrapping its raw data as the result; any
// other event is converted to JSON and its "result" field (or the whole
// JSON value when that field is absent) becomes the result.
let final_event: Box<dyn AnyEvent> =
if event.as_any().downcast_ref::<StopEvent>().is_some() {
event
} else if let Some(dynamic) = event.as_any().downcast_ref::<DynamicEvent>() {
match serde_json::from_value::<StopEvent>(dynamic.data.clone()) {
Ok(stop) => Box::new(stop),
Err(_) => {
Box::new(StopEvent {
result: dynamic.data.clone(),
})
}
}
} else {
let json = event.to_json();
Box::new(StopEvent {
result: json.get("result").cloned().unwrap_or(json),
})
};
let _ = result_tx.send(Ok(final_event));
return;
}
// --- InputRequestEvent: ask the handler, or park until a response ------
if event_type == InputRequestEvent::event_type() {
// Recover a typed request; an event that cannot be interpreted as an
// `InputRequestEvent` ends the run with a `Context` error.
let request = if let Some(req) = event.as_any().downcast_ref::<InputRequestEvent>() {
req.clone()
} else if let Some(dynamic) = event.as_any().downcast_ref::<DynamicEvent>() {
if let Ok(req) = serde_json::from_value::<InputRequestEvent>(dynamic.data.clone()) {
req
} else {
let _ = result_tx.send(Err(WorkflowError::Context(
"failed to deserialize InputRequestEvent from DynamicEvent".into(),
)));
return;
}
} else {
let _ = result_tx.send(Err(WorkflowError::Context(
"InputRequestEvent type mismatch".into(),
)));
return;
};
#[cfg(feature = "telemetry")]
emit_history(
history_tx.as_ref(),
&mut history_buffer,
blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::InputRequested {
request_id: request.request_id.clone(),
prompt: request.prompt.clone(),
},
},
);
// With a handler configured the request is answered inline: the handler
// is awaited here, so no other event or control message is processed
// until it returns.
if let Some(ref handler) = input_handler {
match handler(request).await {
Ok(response) => {
// Feed the answer back through the normal event path.
let envelope =
EventEnvelope::new(Box::new(response), Some("__input_handler".into()));
let _ = event_tx.send(envelope);
continue;
}
Err(e) => {
let _ = result_tx.send(Err(e));
return;
}
}
}
// No handler: record the pause, stash the request in metadata under
// "__input_request" and park until a control message unparks the loop.
#[cfg(feature = "telemetry")]
emit_history(
history_tx.as_ref(),
&mut history_buffer,
blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::WorkflowPaused {
reason: blazen_telemetry::PauseReason::InputRequired,
pending_count: 0,
},
},
);
ctx.set_metadata(
"__input_request",
// Panics if the request cannot be serialized to JSON.
serde_json::to_value(&request)
.expect("InputRequestEvent serialization should never fail"),
)
.await;
parked = true;
continue;
}
// --- Regular event: route to the registered step handlers ---------------
let Some(handlers) = registry.get(event_type) else {
// An event nobody handles is fatal for the run.
tracing::warn!(event_type, "no handler registered for event type");
#[cfg(feature = "telemetry")]
emit_history(
history_tx.as_ref(),
&mut history_buffer,
blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::WorkflowFailed {
error: format!("no handler registered for event type: {event_type}"),
duration_ms: u64::try_from(start.elapsed().as_millis()).unwrap_or(u64::MAX),
},
},
);
let _ = result_tx.send(Err(WorkflowError::NoHandler {
event_type: event_type.to_owned(),
}));
return;
};
let handlers = handlers.clone();
ctx.push_collected(&*event).await;
// Spawns one task per handler into `in_flight`; this call does not wait for
// the handlers to finish.
dispatch_to_handlers(
&handlers,
&*event,
&ctx,
&event_tx,
&error_tx,
&mut in_flight,
&in_flight_count,
auto_publish_events,
#[cfg(feature = "telemetry")]
history_tx.as_ref(),
);
// NOTE(review): the checkpoint is taken right after dispatch, so the
// handlers spawned above may still be running when state is captured.
#[cfg(feature = "persist")]
if checkpoint_config.after_step
&& let Some(ref store) = checkpoint_config.store
{
save_checkpoint(
&**store,
&ctx,
&workflow_name,
run_id,
#[cfg(feature = "telemetry")]
&history_buffer,
)
.await;
}
}
}
/// Builds a [`WorkflowSnapshot`] of the running workflow without stopping it.
///
/// The context's state, collected events and metadata are captured first;
/// the session pause policy is then applied to the metadata and may reject
/// the snapshot.
///
/// # Errors
///
/// Propagates any error returned by `apply_session_pause_policy`.
async fn build_snapshot_in_place(
    ctx: &Context,
    workflow_name: &str,
    run_id: Uuid,
    #[cfg(feature = "telemetry")] history_buffer: &[blazen_telemetry::HistoryEvent],
) -> Result<WorkflowSnapshot, WorkflowError> {
    let state = ctx.snapshot_state().await;
    let collected = ctx.snapshot_collected().await;
    let mut meta = ctx.snapshot_metadata().await;

    // May add bookkeeping entries to `meta`, or fail the whole snapshot.
    apply_session_pause_policy(ctx, &mut meta).await?;

    #[cfg(feature = "telemetry")]
    let recorded_history = history_buffer.to_vec();

    let snapshot = WorkflowSnapshot {
        version: SNAPSHOT_VERSION,
        workflow_name: workflow_name.to_owned(),
        run_id,
        timestamp: Utc::now(),
        context_state: state,
        collected_events: collected,
        // Pending events are never captured by an in-place snapshot.
        pending_events: Vec::new(),
        metadata: meta,
        #[cfg(feature = "telemetry")]
        history: recorded_history,
    };
    Ok(snapshot)
}
/// Removes every session ref whose lifetime is `RefLifetime::UntilSnapshot`
/// from `registry`, logging each removal at `debug` level.
async fn purge_until_snapshot_refs(registry: &SessionRefRegistry) {
    let candidate_keys = registry.keys().await;
    for ref_key in candidate_keys {
        let lifetime = registry.lifetime_of(ref_key).await;
        if lifetime != Some(RefLifetime::UntilSnapshot) {
            // Any other lifetime (or a ref that vanished meanwhile) is left alone.
            continue;
        }
        registry.remove(ref_key).await;
        tracing::debug!(
            key = %ref_key,
            "purged UntilSnapshot session ref before snapshot walk"
        );
    }
}
/// Applies the context's [`SessionPausePolicy`] to the live session refs
/// before a snapshot is produced.
///
/// Refs with an `UntilSnapshot` lifetime are purged first. If the registry is
/// empty afterwards there is nothing to do. Otherwise the policy decides:
///
/// - `HardError`: the snapshot is rejected, listing the offending keys.
/// - `WarnDrop`: the keys are logged and recorded in `metadata` under
///   `"__blazen_dropped_session_refs"`.
/// - `PickleOrError`: handled like `WarnDrop` with a different log message.
///   NOTE(review): this arm never returns an error despite the policy's
///   name - confirm that is intended.
/// - `PickleOrSerialize`: delegated to `apply_pickle_or_serialize_policy`.
///
/// # Errors
///
/// Returns `WorkflowError::SessionRefsNotSerializable` under `HardError` when
/// live session refs remain after the purge.
async fn apply_session_pause_policy(
    ctx: &Context,
    metadata: &mut HashMap<String, serde_json::Value>,
) -> Result<(), WorkflowError> {
    let policy = ctx.session_pause_policy().await;
    let registry = ctx.session_refs_arc().await;
    // Fix: the argument had been mangled to `®istry` (`&reg` rendered as an
    // HTML entity), which is not valid Rust; it is a borrow of `registry`.
    purge_until_snapshot_refs(&registry).await;
    if registry.is_empty().await {
        return Ok(());
    }
    match policy {
        SessionPausePolicy::HardError => {
            let keys: Vec<String> = registry
                .keys()
                .await
                .iter()
                .map(std::string::ToString::to_string)
                .collect();
            Err(WorkflowError::SessionRefsNotSerializable { keys })
        }
        SessionPausePolicy::WarnDrop => {
            let keys = registry.keys().await;
            // Re-checked because the registry is queried again after `is_empty`.
            if !keys.is_empty() {
                let key_strs: Vec<String> =
                    keys.iter().map(std::string::ToString::to_string).collect();
                tracing::warn!(
                    count = keys.len(),
                    keys = ?key_strs,
                    "dropping live session refs from snapshot (WarnDrop policy)"
                );
                metadata.insert(
                    "__blazen_dropped_session_refs".to_owned(),
                    serde_json::to_value(&key_strs).unwrap_or_default(),
                );
            }
            Ok(())
        }
        SessionPausePolicy::PickleOrError => {
            let keys = registry.keys().await;
            if !keys.is_empty() {
                let key_strs: Vec<String> =
                    keys.iter().map(std::string::ToString::to_string).collect();
                tracing::warn!(
                    count = keys.len(),
                    keys = ?key_strs,
                    "dropping live session refs from snapshot \
                     (PickleOrError policy, no pickler registered)"
                );
                metadata.insert(
                    "__blazen_dropped_session_refs".to_owned(),
                    serde_json::to_value(&key_strs).unwrap_or_default(),
                );
            }
            Ok(())
        }
        SessionPausePolicy::PickleOrSerialize => {
            // Same fix as above: borrow the registry for the helper.
            apply_pickle_or_serialize_policy(&registry, metadata).await;
            Ok(())
        }
    }
}
/// Implements the `PickleOrSerialize` pause policy.
///
/// Every entry returned by `registry.serializable_entries()` is serialized
/// and stored, together with its type tag, in `metadata` under
/// `SERIALIZED_SESSION_REFS_META_KEY`. Every registry key that was not
/// captured this way (including entries whose serialization failed) is logged
/// and listed under `"__blazen_dropped_session_refs"`.
async fn apply_pickle_or_serialize_policy(
    registry: &SessionRefRegistry,
    metadata: &mut HashMap<String, serde_json::Value>,
) {
    let every_key = registry.keys().await;
    let candidates = registry.serializable_entries().await;

    let mut captured: HashMap<String, serde_json::Value> =
        HashMap::with_capacity(candidates.len());
    for (key, entry) in &candidates {
        let type_tag = entry.blazen_type_tag();
        let bytes = match entry.blazen_serialize() {
            Ok(bytes) => bytes,
            Err(err) => {
                tracing::warn!(
                    key = %key,
                    type_tag = %type_tag,
                    error = %err,
                    "session ref serialization failed; dropping entry from snapshot"
                );
                continue;
            }
        };
        // A payload that cannot be represented as JSON degrades to `null`.
        let payload = serde_json::to_value(crate::value::BytesWrapper(bytes))
            .unwrap_or(serde_json::Value::Null);
        let record: serde_json::Map<String, serde_json::Value> = [
            (
                "type_tag".to_owned(),
                serde_json::Value::String(type_tag.to_owned()),
            ),
            ("data".to_owned(), payload),
        ]
        .into_iter()
        .collect();
        captured.insert(key.to_string(), serde_json::Value::Object(record));
    }

    if !captured.is_empty() {
        metadata.insert(
            SERIALIZED_SESSION_REFS_META_KEY.to_owned(),
            serde_json::to_value(&captured).unwrap_or_default(),
        );
    }

    // Whatever is in the registry but was not captured is lost in the snapshot.
    let dropped: Vec<String> = every_key
        .iter()
        .map(|key| key.to_string())
        .filter(|name| !captured.contains_key(name))
        .collect();
    if dropped.is_empty() {
        return;
    }
    tracing::warn!(
        count = dropped.len(),
        keys = ?dropped,
        "dropping live session refs from snapshot \
         (PickleOrSerialize policy, entries did not \
         implement SessionRefSerializable)"
    );
    metadata.insert(
        "__blazen_dropped_session_refs".to_owned(),
        serde_json::to_value(&dropped).unwrap_or_default(),
    );
}
#[allow(clippy::too_many_arguments, clippy::too_many_lines)]
fn dispatch_to_handlers(
handlers: &[StepRegistration],
event: &dyn AnyEvent,
ctx: &Context,
event_tx: &mpsc::UnboundedSender<EventEnvelope>,
error_tx: &mpsc::UnboundedSender<WorkflowError>,
in_flight: &mut JoinSet<()>,
in_flight_count: &Arc<AtomicUsize>,
auto_publish_events: bool,
#[cfg(feature = "telemetry")] history_tx: Option<
&mpsc::UnboundedSender<blazen_telemetry::HistoryEvent>,
>,
) {
for step in handlers {
let event_clone = event.clone_boxed();
let ctx_clone = ctx.clone();
let handler = step.handler.clone();
let step_name = step.name.clone();
let event_tx_clone = event_tx.clone();
let error_tx_clone = error_tx.clone();
let counter = Arc::clone(in_flight_count);
let event_type = event.event_type_id().to_owned();
let semaphore = step.semaphore.clone();
#[cfg(feature = "telemetry")]
let htx = history_tx.cloned();
#[cfg(feature = "telemetry")]
if let Some(ref tx) = htx {
let _ = tx.send(blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::StepDispatched {
step_name: step_name.clone(),
event_type: event_type.clone(),
},
});
}
let stream_ctx = if auto_publish_events {
Some(ctx.clone())
} else {
None
};
counter.fetch_add(1, Ordering::Relaxed);
let step_span = tracing::info_span!(
"workflow.step",
step_name = %step_name,
event_type = %event_type,
otel.status_code = tracing::field::Empty,
duration_ms = tracing::field::Empty,
);
let step_span_clone = step_span.clone();
in_flight.spawn(
async move {
let _permit = match semaphore {
Some(ref sem) => Some(sem.acquire().await.expect("semaphore closed")),
None => None,
};
if let Some(ref sctx) = stream_ctx {
let mut data = serde_json::Map::new();
data.insert(
"kind".into(),
serde_json::Value::String("step_started".into()),
);
data.insert(
"step_name".into(),
serde_json::Value::String(step_name.clone()),
);
data.insert(
"event_type".into(),
serde_json::Value::String(event_type.clone()),
);
sctx.write_event_to_stream(DynamicEvent {
event_type: "blazen::lifecycle".to_owned(),
data: serde_json::Value::Object(data),
})
.await;
}
let start = Instant::now();
match handler(event_clone, ctx_clone).await {
Ok(StepOutput::Single(output_event)) => {
let duration =
u64::try_from(start.elapsed().as_millis()).unwrap_or(u64::MAX);
step_span_clone.record("duration_ms", duration);
step_span_clone.record("otel.status_code", "OK");
#[cfg(feature = "telemetry")]
if let Some(ref tx) = htx {
let output_type = output_event.event_type_id().to_owned();
let _ = tx.send(blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::StepCompleted {
step_name: step_name.clone(),
duration_ms: duration,
output_type,
},
});
}
if let Some(ref sctx) = stream_ctx {
let mut data = serde_json::Map::new();
data.insert(
"kind".into(),
serde_json::Value::String("step_completed".into()),
);
data.insert(
"step_name".into(),
serde_json::Value::String(step_name.clone()),
);
data.insert(
"duration_ms".into(),
serde_json::Value::Number(duration.into()),
);
sctx.write_event_to_stream(DynamicEvent {
event_type: "blazen::lifecycle".to_owned(),
data: serde_json::Value::Object(data),
})
.await;
}
let envelope = EventEnvelope::new(output_event, Some(step_name));
let _ = event_tx_clone.send(envelope);
}
Ok(StepOutput::Multiple(events)) => {
let duration =
u64::try_from(start.elapsed().as_millis()).unwrap_or(u64::MAX);
step_span_clone.record("duration_ms", duration);
step_span_clone.record("otel.status_code", "OK");
#[cfg(feature = "telemetry")]
if let Some(ref tx) = htx {
let _ = tx.send(blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::StepCompleted {
step_name: step_name.clone(),
duration_ms: duration,
output_type: "Multiple".to_owned(),
},
});
}
if let Some(ref sctx) = stream_ctx {
let mut data = serde_json::Map::new();
data.insert(
"kind".into(),
serde_json::Value::String("step_completed".into()),
);
data.insert(
"step_name".into(),
serde_json::Value::String(step_name.clone()),
);
data.insert(
"duration_ms".into(),
serde_json::Value::Number(duration.into()),
);
sctx.write_event_to_stream(DynamicEvent {
event_type: "blazen::lifecycle".to_owned(),
data: serde_json::Value::Object(data),
})
.await;
}
for e in events {
let envelope = EventEnvelope::new(e, Some(step_name.clone()));
let _ = event_tx_clone.send(envelope);
}
}
Ok(StepOutput::None) => {
let duration =
u64::try_from(start.elapsed().as_millis()).unwrap_or(u64::MAX);
step_span_clone.record("duration_ms", duration);
step_span_clone.record("otel.status_code", "OK");
#[cfg(feature = "telemetry")]
if let Some(ref tx) = htx {
let _ = tx.send(blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::StepCompleted {
step_name: step_name.clone(),
duration_ms: duration,
output_type: "None".to_owned(),
},
});
}
if let Some(ref sctx) = stream_ctx {
let mut data = serde_json::Map::new();
data.insert(
"kind".into(),
serde_json::Value::String("step_completed".into()),
);
data.insert(
"step_name".into(),
serde_json::Value::String(step_name.clone()),
);
data.insert(
"duration_ms".into(),
serde_json::Value::Number(duration.into()),
);
sctx.write_event_to_stream(DynamicEvent {
event_type: "blazen::lifecycle".to_owned(),
data: serde_json::Value::Object(data),
})
.await;
}
}
Err(err) => {
let duration =
u64::try_from(start.elapsed().as_millis()).unwrap_or(u64::MAX);
step_span_clone.record("duration_ms", duration);
step_span_clone.record("otel.status_code", "ERROR");
let err_str = err.to_string();
#[cfg(feature = "telemetry")]
if let Some(ref tx) = htx {
let _ = tx.send(blazen_telemetry::HistoryEvent {
timestamp: Utc::now(),
sequence: 0,
kind: blazen_telemetry::HistoryEventKind::StepFailed {
step_name: step_name.clone(),
error: err_str.clone(),
duration_ms: duration,
},
});
}
if let Some(ref sctx) = stream_ctx {
let mut data = serde_json::Map::new();
data.insert(
"kind".into(),
serde_json::Value::String("step_failed".into()),
);
data.insert(
"step_name".into(),
serde_json::Value::String(step_name.clone()),
);
data.insert(
"duration_ms".into(),
serde_json::Value::Number(duration.into()),
);
data.insert("error".into(), serde_json::Value::String(err_str));
sctx.write_event_to_stream(DynamicEvent {
event_type: "blazen::lifecycle".to_owned(),
data: serde_json::Value::Object(data),
})
.await;
}
tracing::error!(
step = %step_name,
error = %err,
"step failed"
);
let _ = error_tx_clone.send(WorkflowError::StepFailed {
step_name,
source: Box::new(err),
});
}
}
counter.fetch_sub(1, Ordering::Relaxed);
}
.instrument(step_span),
);
}
}