pub async fn batch_attention_compute(
queries: Vec<Float32Array>,
keys: Vec<Vec<Float32Array>>,
values: Vec<Vec<Float32Array>>,
dim: u32,
) -> Result<BatchResult>

Process a batch of attention computations.
pub async fn batch_attention_compute(
queries: Vec<Float32Array>,
keys: Vec<Vec<Float32Array>>,
values: Vec<Vec<Float32Array>>,
dim: u32,
) -> Result<BatchResult>

Process a batch of attention computations.