pub async fn compute_attention_async(
query: Float32Array,
keys: Vec<Float32Array>,
values: Vec<Float32Array>,
dim: u32,
) -> Result<Float32Array>

Async scaled dot-product attention computation.
pub async fn compute_attention_async(
query: Float32Array,
keys: Vec<Float32Array>,
values: Vec<Float32Array>,
dim: u32,
) -> Result<Float32Array>

Async scaled dot-product attention computation.