use scirs2_core::ndarray::{Array1, Array2};
use scirs2_core::numeric::{Float, FromPrimitive};
use std::fmt::Debug;
use super::lstm::LSTMCell;
use crate::error::Result;
/// State for an attention layer: two size parameters and three weight matrices.
///
/// NOTE(review): in the implementation visible alongside this struct, `forward`
/// does not read any of these fields. They are only written by `new`, which is
/// why dead-code warnings are silenced for the whole struct rather than
/// field by field.
#[derive(Debug)]
#[allow(dead_code)]
pub struct FlashAttention<F: Float + Debug> {
    /// Model dimension handed to `new`; also used for both size arguments when
    /// the weight matrices are created.
    model_dim: usize,
    /// Head count handed to `new`; stored as given, with no validation.
    num_heads: usize,
    /// Weight matrix named for the query projection; created in `new` via
    /// `LSTMCell::random_matrix(model_dim, model_dim, ..)`.
    w_query: Array2<F>,
    /// Weight matrix named for the key projection; created the same way.
    w_key: Array2<F>,
    /// Weight matrix named for the value projection; created the same way.
    w_value: Array2<F>,
}
impl<F: Float + Debug + Clone + FromPrimitive> FlashAttention<F> {
    /// Creates a layer with three freshly generated weight matrices.
    ///
    /// Each matrix is produced by `LSTMCell::random_matrix(model_dim, model_dim, s)`
    /// where `s = sqrt(2 / model_dim)`. `num_heads` is stored unchanged and is
    /// not validated against `model_dim`.
    ///
    /// # Panics
    ///
    /// Panics if the constant `2.0` or `model_dim` cannot be converted to `F`.
    pub fn new(model_dim: usize, num_heads: usize) -> Self {
        // Convert the numerator first, then the denominator, so a failing
        // conversion reports the same message it always did.
        let two = F::from(2.0).expect("Failed to convert constant to float");
        let dim = F::from(model_dim).expect("Failed to convert to float");
        let std_dev = (two / dim).sqrt();

        // Matrices are generated in query -> key -> value order; keep it that
        // way in case `random_matrix` draws from a shared random source.
        let w_query: Array2<F> = LSTMCell::random_matrix(model_dim, model_dim, std_dev);
        let w_key: Array2<F> = LSTMCell::random_matrix(model_dim, model_dim, std_dev);
        let w_value: Array2<F> = LSTMCell::random_matrix(model_dim, model_dim, std_dev);

        Self {
            model_dim,
            num_heads,
            w_query,
            w_key,
            w_value,
        }
    }

    /// Runs the layer on `input`.
    ///
    /// At present this is a pass-through: the result is an owned clone of
    /// `input`, and none of the stored weights are applied.
    ///
    /// # Errors
    ///
    /// The visible implementation never returns `Err`; the `Result` wrapper is
    /// part of the signature only.
    pub fn forward(&self, input: &Array2<F>) -> Result<Array2<F>> {
        let passthrough = input.clone();
        Ok(passthrough)
    }
}