[package]
edition = "2021"
name = "ferrum-kernels"
version = "0.7.2"
authors = ["Ferrum Team"]
build = "build.rs"
autolib = false
autobins = false
autoexamples = false
autotests = false
autobenches = false
description = "Unified compute kernels (CUDA/Metal/CPU) and model runner for Ferrum inference"
readme = "README.md"
license = "MIT"
[features]
cuda = [
"candle-core/cuda",
"dep:cudarc",
"marlin",
"cudarc?/nccl",
]
default = []
marlin = []
metal = [
"dep:metal",
"dep:ferrum-attention",
"ferrum-attention/metal",
]
tensor-parallel = ["cuda"]
triton-kernels = ["cuda"]
[lib]
name = "ferrum_kernels"
path = "src/lib.rs"
[[test]]
name = "cudarc_graph_repro"
path = "tests/cudarc_graph_repro.rs"
[[test]]
name = "triton_add_bias_eq"
path = "tests/triton_add_bias_eq.rs"
[[test]]
name = "triton_fused_add_rms_norm_eq"
path = "tests/triton_fused_add_rms_norm_eq.rs"
[[test]]
name = "triton_fused_silu_mul_eq"
path = "tests/triton_fused_silu_mul_eq.rs"
[[test]]
name = "triton_gelu_eq"
path = "tests/triton_gelu_eq.rs"
[[test]]
name = "triton_layer_norm_eq"
path = "tests/triton_layer_norm_eq.rs"
[[test]]
name = "triton_residual_add_eq"
path = "tests/triton_residual_add_eq.rs"
[[test]]
name = "triton_residual_add_inplace_eq"
path = "tests/triton_residual_add_inplace_eq.rs"
[[test]]
name = "triton_rms_norm_eq"
path = "tests/triton_rms_norm_eq.rs"
[[test]]
name = "triton_softmax_eq"
path = "tests/triton_softmax_eq.rs"
[[test]]
name = "triton_w4a16_eq"
path = "tests/triton_w4a16_eq.rs"
[dependencies.candle-core]
version = "0.9.2"
[dependencies.cudarc]
version = "0.19"
features = [
"driver",
"cublas",
"f16",
"nvrtc",
]
optional = true
default-features = false
[dependencies.ferrum-attention]
version = "0.7.0"
optional = true
[dependencies.ferrum-types]
version = "0.7.2"
[dependencies.half]
version = "2.5.0"
features = [
"num-traits",
"use-intrinsics",
"rand_distr",
]
[dependencies.metal]
version = "0.31"
optional = true
[dependencies.tracing]
version = "0.1"
[build-dependencies.bindgen_cuda]
version = "0.1.6"