# Binary target `bitmamba`, with src/main.rs as its crate root.
[[bin]]
path = "src/main.rs"
name = "bitmamba"
# Binary target `bitmamba-server`, with src/server.rs as its crate root.
[[bin]]
path = "src/server.rs"
name = "bitmamba-server"
# Dependencies, kept in alphabetical order. A bare string is shorthand for
# `{ version = "..." }`; crates that also select features use an inline table.
[dependencies]
anyhow = "1.0"
async-stream = "0.3"
axum = { version = "0.7", features = ["macros"] }
candle-core = "0.8"
candle-nn = "0.8"
chrono = "0.4"
futures = "0.3"
hf-hub = "0.3.2"
rand = "0.8"
serde = { version = "1.0", features = ["derive"] }
serde_json = "1.0"
tokenizers = "0.20"
tokio = { version = "1", features = ["full"] }
tokio-stream = "0.1"
tower-http = { version = "0.5", features = ["cors"] }
uuid = { version = "1", features = ["v4"] }
# Cargo features exposed by this crate.
[features]
# No feature is switched on by default.
default = []
# Forwards to the `cuda` feature of both candle crates.
cuda = [
    "candle-core/cuda",
    "candle-nn/cuda",
]
# Library target `bitmamba`, with src/lib.rs as its crate root.
[lib]
path = "src/lib.rs"
name = "bitmamba"
# Package metadata: name and version first, remaining keys alphabetical,
# description last.
[package]
name = "bitmamba"
version = "0.1.0"
authors = ["Riley Seaburg <riley@seaburg.dev>"]
# Every target auto-discovery switch is turned off in this manifest.
autobenches = false
autobins = false
autoexamples = false
autolib = false
autotests = false
# No build script is configured.
build = false
categories = [
    "science",
    "command-line-utilities",
    "web-programming",
]
documentation = "https://docs.rs/bitmamba"
edition = "2021"
# Paths and glob patterns left out of the packaged crate.
exclude = [
    "distill_cache/",
    "*.pt",
    "*.safetensors",
]
homepage = "https://github.com/rileyseaburg/bitmamba"
keywords = [
    "llm",
    "mamba",
    "bitnet",
    "inference",
    "ai",
]
license = "MIT"
readme = "README.md"
repository = "https://github.com/rileyseaburg/bitmamba"
description = "BitMamba: 1.58-bit Mamba language model with infinite context window - includes OpenAI-compatible API server"