pub type ExecutionContext = ServerStreamingEngine<PreprocessedRequest, ExecutionOutputStream>;
Expand description
Context for executing LLM inference: the engine consumes backend input and produces an execution output stream.
Aliased Type§
pub struct ExecutionContext { /* private fields */ }