pub struct LlmBenchArgs {
pub url: String,
pub model: String,
pub start: Option<String>,
pub health_timeout: String,
pub prompt_profile: String,
pub prompt_file: Option<PathBuf>,
pub warmup: String,
pub duration: String,
pub concurrency: usize,
pub runs: usize,
pub cooldown: String,
pub baseline: Option<PathBuf>,
pub fail_on_regression: Option<f64>,
pub runtime_name: String,
pub output: Option<PathBuf>,
pub stream: bool,
pub trace_level: Option<String>,
pub num_layers: Option<u32>,
}
Arguments for `probador llm bench` (full benchmark lifecycle).
Fields§
url: String — Base URL of the LLM API server
model: String — Model name to include in requests
start: Option<String> — Shell command to start the server (optional)
health_timeout: String — Maximum time to wait for server readiness (e.g., 120s)
prompt_profile: String — Prompt profile: micro, short, medium, long
prompt_file: Option<PathBuf> — Path to YAML prompt file (overrides `--prompt-profile`)
warmup: String — Warmup duration before measurement (e.g., 10s)
duration: String — Per-run measurement duration (e.g., 60s)
concurrency: usize — Number of concurrent workers
runs: usize — Number of measurement runs
cooldown: String — Cooldown between runs (e.g., 5s)
baseline: Option<PathBuf> — Baseline JSON file for regression detection
fail_on_regression: Option<f64> — Percentage threshold for regression detection (exit 1 if exceeded)
runtime_name: String — Runtime name for reporting (e.g., apr-gguf-gpu)
output: Option<PathBuf> — Output file path for JSON results
stream: bool — Use SSE streaming for real per-token timing (TTFT, TPOT, ITL). Use `--stream false` to disable.
trace_level: Option<String> — Trace level for brick profiler data (GH-114): brick, step, layer
num_layers: Option<u32> — Number of transformer layers in the model (e.g., 28 for Qwen 1.5B). Computes per-layer decode time for cross-runtime comparison.
Trait Implementations§
Source§impl Args for LlmBenchArgs
impl Args for LlmBenchArgs
Source§fn augment_args<'b>(__clap_app: Command) -> Command
fn augment_args<'b>(__clap_app: Command) -> Command
Source§fn augment_args_for_update<'b>(__clap_app: Command) -> Command
fn augment_args_for_update<'b>(__clap_app: Command) -> Command
Append to Command so it can instantiate self via
FromArgMatches::update_from_arg_matches_mut. Read more
Source§impl CommandFactory for LlmBenchArgs
impl CommandFactory for LlmBenchArgs
Source§impl Debug for LlmBenchArgs
impl Debug for LlmBenchArgs
Source§impl FromArgMatches for LlmBenchArgs
impl FromArgMatches for LlmBenchArgs
Source§fn from_arg_matches(__clap_arg_matches: &ArgMatches) -> Result<Self, Error>
fn from_arg_matches(__clap_arg_matches: &ArgMatches) -> Result<Self, Error>
Source§fn from_arg_matches_mut(
__clap_arg_matches: &mut ArgMatches,
) -> Result<Self, Error>
fn from_arg_matches_mut( __clap_arg_matches: &mut ArgMatches, ) -> Result<Self, Error>
Source§fn update_from_arg_matches(
&mut self,
__clap_arg_matches: &ArgMatches,
) -> Result<(), Error>
fn update_from_arg_matches( &mut self, __clap_arg_matches: &ArgMatches, ) -> Result<(), Error>
Assign values from ArgMatches to self.
Source§fn update_from_arg_matches_mut(
&mut self,
__clap_arg_matches: &mut ArgMatches,
) -> Result<(), Error>
fn update_from_arg_matches_mut( &mut self, __clap_arg_matches: &mut ArgMatches, ) -> Result<(), Error>
Assign values from ArgMatches to self.
Source§impl Parser for LlmBenchArgs
impl Parser for LlmBenchArgs
Source§fn parse_from<I, T>(itr: I) -> Self
fn parse_from<I, T>(itr: I) -> Self
Source§fn try_parse_from<I, T>(itr: I) -> Result<Self, Error>
fn try_parse_from<I, T>(itr: I) -> Result<Self, Error>
Source§fn update_from<I, T>(&mut self, itr: I)
fn update_from<I, T>(&mut self, itr: I)
Auto Trait Implementations§
impl Freeze for LlmBenchArgs
impl RefUnwindSafe for LlmBenchArgs
impl Send for LlmBenchArgs
impl Sync for LlmBenchArgs
impl Unpin for LlmBenchArgs
impl UnsafeUnpin for LlmBenchArgs
impl UnwindSafe for LlmBenchArgs
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
impl<A, B, T> HttpServerConnExec<A, B> for T where
B: Body,
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self>
if into_left is true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self>
if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read more