# Package metadata for the TensorRT runner crate of atomr-infer.
[package]
name = "atomr-infer-runtime-tensorrt"
version = "0.8.0"
authors = ["atomr-infer contributors"]
edition = "2021"
rust-version = "1.78"
license = "Apache-2.0"
readme = "README.md"
homepage = "https://github.com/rustakka/atomr-infer"
repository = "https://github.com/rustakka/atomr-infer"
documentation = "https://docs.rs/atomr-infer-runtime-tensorrt"
keywords = ["llm", "inference", "atomr", "actor", "openai"]
categories = ["concurrency", "asynchronous", "science"]
# No build script, and automatic target discovery is turned off for every
# target kind; targets are declared explicitly (see the [lib] table).
build = false
autolib = false
autobins = false
autoexamples = false
autotests = false
autobenches = false
description = "TensorRT runner for atomr-infer. Wraps atomr-accel-tensorrt's TrtRuntime / ExecutionContext / ExecutionBindings behind the ModelRunner trait."
# Nothing is enabled by default: the TensorRT backend is strictly opt-in.
[features]
default = []
# Base backend feature; activates the three optional dependencies it needs.
tensorrt = [
    "dep:atomr-accel-tensorrt",
    "dep:cudarc",
    "dep:parking_lot",
]
# Each feature below turns on `tensorrt` and forwards to the identically
# named feature of atomr-accel-tensorrt.
tensorrt-fp8 = ["tensorrt", "atomr-accel-tensorrt/tensorrt-fp8"]
tensorrt-int8 = ["tensorrt", "atomr-accel-tensorrt/tensorrt-int8"]
tensorrt-link = ["tensorrt", "atomr-accel-tensorrt/tensorrt-link"]
tensorrt-onnx = ["tensorrt", "atomr-accel-tensorrt/tensorrt-onnx"]
tensorrt-plugin = ["tensorrt", "atomr-accel-tensorrt/tensorrt-plugin"]
# Explicit library target (automatic lib discovery is disabled in [package]).
[lib]
path = "src/lib.rs"
name = "atomr_infer_runtime_tensorrt"
# Runtime dependencies. Entries marked `optional = true` are only built when
# the `tensorrt` feature (or a feature that implies it) is enabled.
[dependencies]
async-trait = "0.1"
atomr-accel-tensorrt = { version = "0.10.0", optional = true }
atomr-infer-core = "0.8.0"
atomr-infer-runtime = "0.8.0"
parking_lot = { version = "0.12", optional = true }
serde = { version = "1", features = ["derive"] }
tracing = "0.1"

# Kept as its own table because the feature list is too long for a readable
# inline spec.
[dependencies.cudarc]
version = "0.19.4"
optional = true
features = [
    "cuda-version-from-build-system",
    "fallback-latest",
]
# Dependencies used only by tests, examples and benchmarks.
[dev-dependencies]
tempfile = "3"
# tokio's "full" feature already enables "macros" and "rt", so listing them
# separately was redundant; the resolved feature set is unchanged.
tokio = { version = "1.39", features = ["full"] }