god_graph/transformer/
mod.rs1#![cfg(feature = "tensor")]
14
15pub mod autograd;
16pub mod layers;
17pub mod loader;
18pub mod model;
19pub mod generation;
20pub mod graph_transformer;
21pub mod kv_cache;
22#[cfg(feature = "tensor")]
23pub mod sparse_attention;
24pub mod batch;
25#[cfg(feature = "tensor")]
26pub mod quantization;
27pub mod perf;
28pub mod optimization;
29
30pub use autograd::{ComputeGraph, DifferentiableTensor, Op, Optimizer};
32pub use layers::{MultiHeadAttention, RMSNorm, LayerNorm, RoPE, FeedForward};
33pub use loader::{SafetensorsLoader, ModelConfig};
34pub use model::{LlamaModel, LlamaConfig};
35pub use generation::{GenerationConfig, TextGenerator};
36pub use graph_transformer::{GraphExecutor, GraphTransformer, GraphNode, GraphEdge};
37pub use kv_cache::KVCache;
38#[cfg(feature = "tensor")]
39pub use sparse_attention::SparseAttention;
40pub use batch::BatchInference;
41pub use quantization::{QuantizedTensor, QuantizationConfig};
42pub use perf::{TransformerMemoryPool, softmax_inplace_simd, matmul_with_buffer};