# Package metadata for the `bitmamba` crate.
[package]
name = "bitmamba"
version = "0.1.0"
authors = ["Riley Seaburg <riley@seaburg.dev>"]
categories = ["science", "command-line-utilities", "web-programming"]
# This manifest declares two [[bin]] targets, so a bare `cargo run` cannot
# pick one on its own and errors out unless a default is named here.
# `--bin <name>` still overrides this.
# NOTE(review): defaults to the `bitmamba` binary (src/main.rs); switch to
# "bitmamba-server" if the server should be the default instead.
default-run = "bitmamba"
documentation = "https://docs.rs/bitmamba"
edition = "2021"
# Left out of the packaged crate: the distill_cache/ directory and any
# *.pt / *.safetensors files (presumably model weights - confirm).
exclude = ["distill_cache/", "*.pt", "*.safetensors"]
homepage = "https://github.com/rileyseaburg/bitmamba"
keywords = ["llm", "mamba", "bitnet", "inference", "ai"]
license = "MIT"
readme = "README.md"
repository = "https://github.com/rileyseaburg/bitmamba"
description = "BitMamba: 1.58-bit Mamba language model with infinite context window - includes OpenAI-compatible API server"

# Build targets: one library plus two executables, each with an explicit
# source path.

# Library crate.
[lib]
name = "bitmamba"
path = "src/lib.rs"

# `bitmamba-server` executable, built from src/server.rs.
[[bin]]
name = "bitmamba-server"
path = "src/server.rs"

# `bitmamba` executable, built from src/main.rs.
[[bin]]
name = "bitmamba"
path = "src/main.rs"

# Runtime dependencies, kept in alphabetical order.
# candle-core and candle-nn are pinned to the same 0.8 line; the `cuda`
# feature in [features] is forwarded to both of them.
[dependencies]
anyhow = "1.0"
async-stream = "0.3"
axum = { version = "0.7", features = ["macros"] }
candle-core = "0.8"
candle-nn = "0.8"
chrono = "0.4"
futures = "0.3"
hf-hub = "0.3.2"
rand = "0.8"
serde = { version = "1.0", features = ["derive"] }
serde_json = "1.0"
tokenizers = "0.20"
tokio = { version = "1", features = ["full"] }
tokio-stream = "0.1"
tower-http = { version = "0.5", features = ["cors"] }
uuid = { version = "1", features = ["v4"] }

# Optional Cargo features. Nothing is enabled by default.
[features]
default = []
# Opt-in: turns on the `cuda` feature of both candle crates.
cuda = [
    "candle-core/cuda",
    "candle-nn/cuda",
]