ferrum-kernels 0.7.2

Unified compute kernels (CUDA/Metal/CPU) and model runner for Ferrum inference
Documentation
# THIS FILE IS AUTOMATICALLY GENERATED BY CARGO
#
# When uploading crates to the registry Cargo will automatically
# "normalize" Cargo.toml files for maximal compatibility
# with all versions of Cargo and also rewrite `path` dependencies
# to registry (e.g., crates.io) dependencies.
#
# If you are reading this file be aware that the original Cargo.toml
# will likely look very different (and much more reasonable).
# See Cargo.toml.orig for the original contents.

[package]
edition = "2021"
name = "ferrum-kernels"
version = "0.7.2"
authors = ["Ferrum Team"]
build = "build.rs"
autolib = false
autobins = false
autoexamples = false
autotests = false
autobenches = false
description = "Unified compute kernels (CUDA/Metal/CPU) and model runner for Ferrum inference"
readme = "README.md"
license = "MIT"

[features]
cuda = [
    "candle-core/cuda",
    "dep:cudarc",
    "marlin",
    "cudarc?/nccl",
]
default = []
marlin = []
metal = [
    "dep:metal",
    "dep:ferrum-attention",
    "ferrum-attention/metal",
]
tensor-parallel = ["cuda"]
triton-kernels = ["cuda"]

[lib]
name = "ferrum_kernels"
path = "src/lib.rs"

[[test]]
name = "cudarc_graph_repro"
path = "tests/cudarc_graph_repro.rs"

[[test]]
name = "triton_add_bias_eq"
path = "tests/triton_add_bias_eq.rs"

[[test]]
name = "triton_fused_add_rms_norm_eq"
path = "tests/triton_fused_add_rms_norm_eq.rs"

[[test]]
name = "triton_fused_silu_mul_eq"
path = "tests/triton_fused_silu_mul_eq.rs"

[[test]]
name = "triton_gelu_eq"
path = "tests/triton_gelu_eq.rs"

[[test]]
name = "triton_layer_norm_eq"
path = "tests/triton_layer_norm_eq.rs"

[[test]]
name = "triton_residual_add_eq"
path = "tests/triton_residual_add_eq.rs"

[[test]]
name = "triton_residual_add_inplace_eq"
path = "tests/triton_residual_add_inplace_eq.rs"

[[test]]
name = "triton_rms_norm_eq"
path = "tests/triton_rms_norm_eq.rs"

[[test]]
name = "triton_softmax_eq"
path = "tests/triton_softmax_eq.rs"

[[test]]
name = "triton_w4a16_eq"
path = "tests/triton_w4a16_eq.rs"

[dependencies.candle-core]
version = "0.9.2"

[dependencies.cudarc]
version = "0.19"
features = [
    "driver",
    "cublas",
    "f16",
    "nvrtc",
]
optional = true
default-features = false

[dependencies.ferrum-attention]
version = "0.7.0"
optional = true

[dependencies.ferrum-types]
version = "0.7.2"

[dependencies.half]
version = "2.5.0"
features = [
    "num-traits",
    "use-intrinsics",
    "rand_distr",
]

[dependencies.metal]
version = "0.31"
optional = true

[dependencies.tracing]
version = "0.1"

[build-dependencies.bindgen_cuda]
version = "0.1.6"