# llmux 0.2.0
#
# Zero-reload model switching for vLLM - manages multiple models on shared GPU
# Documentation
# THIS FILE IS AUTOMATICALLY GENERATED BY CARGO
#
# When uploading crates to the registry Cargo will automatically
# "normalize" Cargo.toml files for maximal compatibility
# with all versions of Cargo and also rewrite `path` dependencies
# to registry (e.g., crates.io) dependencies.
#
# If you are reading this file be aware that the original Cargo.toml
# will likely look very different (and much more reasonable).
# See Cargo.toml.orig for the original contents.

[package]
name = "llmux"
version = "0.2.0"
# Target auto-discovery is switched off; the lib, bin and test targets are
# declared explicitly in their own tables in this manifest.
autobenches = false
autobins = false
autoexamples = false
autolib = false
autotests = false
# No build script is run for this package.
build = false
edition = "2024"
license = "MIT"
readme = "README.md"
repository = "https://github.com/doublewordai/llmux"
# Minimum Rust toolchain version declared for this crate.
rust-version = "1.88.0"
description = "Zero-reload model switching for vLLM - manages multiple models on shared GPU"

# Library target `llmux`, rooted at src/lib.rs. Declared explicitly because
# `autolib = false` in [package] disables automatic discovery.
[lib]
name = "llmux"
path = "src/lib.rs"

# Binary target `llmux`, built from src/main.rs. Declared explicitly because
# `autobins = false` in [package] disables automatic discovery.
[[bin]]
name = "llmux"
path = "src/main.rs"

# Second binary target, `mock-vllm`, built from src/bin/mock_vllm.rs.
# NOTE(review): presumably a stand-in vLLM server used for testing; confirm
# against the source file.
[[bin]]
name = "mock-vllm"
path = "src/bin/mock_vllm.rs"

# Integration test target, built from tests/integration_test.rs. Declared
# explicitly because `autotests = false` in [package] disables discovery.
[[test]]
name = "integration_test"
path = "tests/integration_test.rs"

# Runtime dependencies, one inline table per crate, sorted alphabetically.
# Version strings are plain SemVer requirements (implicit caret).
[dependencies]
anyhow = { version = "1.0.98", features = ["backtrace"] }
async-trait = { version = "0.1.88" }
axum = { version = "0.8.4" }
bytes = { version = "1.10" }
clap = { version = "4.5.40", features = ["derive", "env"] }
dashmap = { version = "6.1.0" }
futures-util = { version = "0.3" }
http = { version = "1.0" }
http-body = { version = "1.0" }
http-body-util = { version = "0.1.3" }
hyper = { version = "1.0" }
libc = { version = "0.2" }
onwards = { version = "0.11" }
pin-project-lite = { version = "0.2" }
reqwest = { version = "0.12", features = ["json"] }
serde = { version = "1.0.219", features = ["derive"] }
serde_json = { version = "1.0.140" }
thiserror = { version = "2.0" }
tower = { version = "0.5", features = ["util"] }
tracing = { version = "0.1.41" }
tracing-subscriber = { version = "0.3.18", features = ["env-filter"] }
url = { version = "2.5", features = ["serde"] }

# Crates with longer feature lists keep their own sub-table so that each
# feature sits on its own line.
[dependencies.hyper-util]
version = "0.1.0"
features = [
    "client",
    "client-legacy",
    "http1",
    "tokio",
]

[dependencies.tokio]
version = "1.45.1"
features = [
    "rt-multi-thread",
    "macros",
    "net",
    "fs",
    "sync",
    "time",
    "process",
    "io-util",
]

# Dependencies needed only when building tests, examples and benchmarks.
[dev-dependencies]
rstest = { version = "0.26.1" }
serial_test = { version = "3.2" }