Skip to main content

LlmLoadArgs

Struct LlmLoadArgs 

Source
pub struct LlmLoadArgs {
Show 23 fields pub url: String, pub model: String, pub concurrency: usize, pub duration: String, pub runtime_name: String, pub prompt_profile: Option<String>, pub prompt_file: Option<PathBuf>, pub warmup: String, pub output: Option<PathBuf>, pub stream: bool, pub rate: Option<f64>, pub rate_distribution: String, pub num_layers: Option<u32>, pub validate: String, pub fail_on_quality: Option<f64>, pub spike_threshold: f64, pub gpu_telemetry: bool, pub gpu_poll_interval: String, pub expected_clock_mhz: Option<u32>, pub skip_health_check: bool, pub dataset: Option<PathBuf>, pub max_tokens: Option<u32>, pub max_tokens_distribution: Option<String>,
}
Expand description

Arguments for probador llm load

Fields§

§url: String

Base URL of the LLM API server

§model: String

Model name to include in requests

§concurrency: usize

Number of concurrent workers

§duration: String

Test duration (e.g., 30s, 2m, 1h)

§runtime_name: String

Runtime name for reporting

§prompt_profile: Option<String>

Prompt profile: micro, short, medium, long

§prompt_file: Option<PathBuf>

Path to YAML prompt file

§warmup: String

Warmup duration before measurement (e.g., 5s, 10s). Default: no warmup.

§output: Option<PathBuf>

Output file path for JSON results

§stream: bool

Use SSE streaming for real per-token timing (TTFT, TPOT, ITL). Use --stream false to disable.

§rate: Option<f64>

Target request rate (req/s). Omit for max throughput (closed-loop).

§rate_distribution: String

Rate distribution: poisson (default) or constant. Only used with --rate.

§num_layers: Option<u32>

Number of transformer layers in the model (e.g., 28 for Qwen 1.5B). Computes per-layer decode time for cross-runtime comparison.

§validate: String

Inline correctness validation: none, basic, contains:X, pattern:X

§fail_on_quality: Option<f64>

Exit non-zero if quality pass rate drops below this threshold (e.g., 0.95)

§spike_threshold: f64

Multiplier of median ITL for spike detection (default: 5.0)

§gpu_telemetry: bool

Enable GPU telemetry collection via nvidia-smi

§gpu_poll_interval: String

GPU telemetry polling interval (e.g., 1s, 2s)

§expected_clock_mhz: Option<u32>

Expected GPU clock speed in MHz for throttle detection (auto-detect if omitted)

§skip_health_check: bool

Skip the pre-flight health check (not recommended)

§dataset: Option<PathBuf>

Path to JSONL dataset file for workload-driven benchmarking

§max_tokens: Option<u32>

Override max_tokens for all requests (e.g., --max-tokens 128)

§max_tokens_distribution: Option<String>

Max tokens distribution: uniform:MIN,MAX or fixed:N. Creates heterogeneous traffic with staggered completion times. Example: --max-tokens-distribution uniform:16,128

Trait Implementations§

Source§

impl Args for LlmLoadArgs

Source§

fn group_id() -> Option<Id>

Report the ArgGroup::id for this set of arguments
Source§

fn augment_args<'b>(__clap_app: Command) -> Command

Append to Command so it can instantiate Self via FromArgMatches::from_arg_matches_mut Read more
Source§

fn augment_args_for_update<'b>(__clap_app: Command) -> Command

Append to Command so it can instantiate self via FromArgMatches::update_from_arg_matches_mut Read more
Source§

impl CommandFactory for LlmLoadArgs

Source§

fn command<'b>() -> Command

Build a Command that can instantiate Self. Read more
Source§

fn command_for_update<'b>() -> Command

Build a Command that can update self. Read more
Source§

impl Debug for LlmLoadArgs

Source§

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more
Source§

impl FromArgMatches for LlmLoadArgs

Source§

fn from_arg_matches(__clap_arg_matches: &ArgMatches) -> Result<Self, Error>

Instantiate Self from ArgMatches, parsing the arguments as needed. Read more
Source§

fn from_arg_matches_mut( __clap_arg_matches: &mut ArgMatches, ) -> Result<Self, Error>

Instantiate Self from ArgMatches, parsing the arguments as needed. Read more
Source§

fn update_from_arg_matches( &mut self, __clap_arg_matches: &ArgMatches, ) -> Result<(), Error>

Assign values from ArgMatches to self.
Source§

fn update_from_arg_matches_mut( &mut self, __clap_arg_matches: &mut ArgMatches, ) -> Result<(), Error>

Assign values from ArgMatches to self.
Source§

impl Parser for LlmLoadArgs

Source§

fn parse() -> Self

Parse from std::env::args_os(), exit on error.
Source§

fn try_parse() -> Result<Self, Error>

Parse from std::env::args_os(), return Err on error.
Source§

fn parse_from<I, T>(itr: I) -> Self
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

Parse from iterator, exit on error.
Source§

fn try_parse_from<I, T>(itr: I) -> Result<Self, Error>
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

Parse from iterator, return Err on error.
Source§

fn update_from<I, T>(&mut self, itr: I)
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

Update from iterator, exit on error. Read more
Source§

fn try_update_from<I, T>(&mut self, itr: I) -> Result<(), Error>
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

Update from iterator, return Err on error.

Auto Trait Implementations§

Blanket Implementations§

Source§

impl<T> Any for T
where T: 'static + ?Sized,

Source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
Source§

impl<T> Borrow<T> for T
where T: ?Sized,

Source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
Source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
Source§

impl<T> From<T> for T

Source§

fn from(t: T) -> T

Returns the argument unchanged.

Source§

impl<A, B, T> HttpServerConnExec<A, B> for T
where B: Body,

Source§

impl<T> Instrument for T

Source§

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more
Source§

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more
Source§

impl<T, U> Into<U> for T
where U: From<T>,

Source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source§

impl<T> IntoEither for T

Source§

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

impl<T> Pointable for T

Source§

const ALIGN: usize

The alignment of pointer.
Source§

type Init = T

The type for initializers.
Source§

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes an object with the given initializer. Read more
Source§

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more
Source§

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more
Source§

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more
Source§

impl<T> PolicyExt for T
where T: ?Sized,

Source§

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow only if self and other return Action::Follow. Read more
Source§

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow if either self or other returns Action::Follow. Read more
Source§

impl<T> Same for T

Source§

type Output = T

Should always be Self
Source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source§

type Error = Infallible

The type returned in the event of a conversion error.
Source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
Source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
Source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
Source§

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source§

fn vzip(self) -> V

Source§

impl<T> WithSubscriber for T

Source§

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more
Source§

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more