// burn_dragon_kernel 0.5.0
//
// Fused GPU kernel crate for burn_dragon execution paths.

/// A bundle of five `usize` sizes describing one `Rwkv8` bench case.
///
/// The type derives `Copy`, so values can be passed around by value and used
/// to initialise `const` items.
///
/// NOTE(review): the per-field notes below are inferred from the field names
/// alone; confirm them against the code that consumes this struct.
#[derive(Debug, Copy, Clone)]
pub struct Rwkv8BenchCase {
    /// Batch size (presumably the number of independent sequences).
    pub batch: usize,
    /// Head count (presumably the number of heads per layer).
    pub heads: usize,
    /// Time extent (presumably the sequence length in steps).
    pub time: usize,
    /// Latent size (presumably the width of the latent/state dimension).
    pub latent: usize,
    /// Embedding size (presumably the model embedding width).
    pub embd: usize,
}

/// Predefined bench case: batch 1, 8 heads, 256 time steps, latent 8192,
/// embd 1024.
///
/// NOTE(review): what "rung" refers to is not visible in this file; the name
/// suggests this is the large entry of a series of cases. Confirm with the
/// benchmark driver before relying on that reading.
pub const LARGE_RUNG_CASE: Rwkv8BenchCase = Rwkv8BenchCase {
    batch: 1,
    heads: 8,
    time: 256,
    latent: 8_192,
    embd: 1_024,
};