realizar 0.8.5

Pure Rust ML inference engine built from scratch - model serving for GGUF and safetensors
1
2
3
4
5
6
7
8
9
10
11
12
13
//! Batched forward pass operations for multi-sequence inference
//!
//! Extracted from layer.rs (PMAT-802) to reduce module size.
//! Contains:
//! - PAR-111: forward_batched_to_token_ids
//! - PAR-121: forward_batched_to_token_ids_graphed

// The glob import below is exactly what `clippy::wildcard_imports` flags, so
// the lint is silenced for this module rather than enumerating every name.
#![allow(clippy::wildcard_imports)]

// Glob-import every item visible from the grandparent module (`super::super`).
use super::super::*;

// `include!` splices each file's source textually into this module, so the
// included items are compiled here and resolve names through the glob import
// above. Paths are resolved relative to this file.
// NOTE(review): presumably these files hold the batched forward-pass code
// listed in the module docs — confirm against the files themselves.
include!("rmsnorm_ptr.rs");
include!("batched_03.rs");