Struct LlmLoadArgs

Source

pub struct LlmLoadArgs {
    pub url: String,
    pub model: String,
    pub concurrency: usize,
    pub duration: String,
    pub runtime_name: String,
    pub prompt_profile: Option<String>,
    pub prompt_file: Option<PathBuf>,
    pub warmup: String,
    pub output: Option<PathBuf>,
    pub stream: bool,
    pub rate: Option<f64>,
    pub rate_distribution: String,
    pub num_layers: Option<u32>,
    pub validate: String,
    pub fail_on_quality: Option<f64>,
    pub spike_threshold: f64,
    pub gpu_telemetry: bool,
    pub gpu_poll_interval: String,
    pub expected_clock_mhz: Option<u32>,
    pub skip_health_check: bool,
    pub dataset: Option<PathBuf>,
    pub max_tokens: Option<u32>,
    pub max_tokens_distribution: Option<String>,
}

Expand description

Arguments for probador llm load

Fields§

§url: String

Base URL of the LLM API server

§model: String

Model name to include in requests

§concurrency: usize

Number of concurrent workers

§duration: String

Test duration (e.g., 30s, 2m, 1h)

§runtime_name: String

Runtime name for reporting

§prompt_profile: Option<String>

Prompt profile: micro, short, medium, long

§prompt_file: Option<PathBuf>

Path to YAML prompt file

§warmup: String

Warmup duration before measurement (e.g., 5s, 10s). Default: no warmup.

§output: Option<PathBuf>

Output file path for JSON results

§stream: bool

Use SSE streaming for real per-token timing (TTFT, TPOT, ITL). Use `--stream false` to disable.

§rate: Option<f64>

Target request rate (req/s). Omit for max throughput (closed-loop).

§rate_distribution: String

Rate distribution: poisson (default) or constant. Only used with `--rate`.

§num_layers: Option<u32>

Number of transformer layers in the model (e.g., 28 for Qwen 1.5B). Computes per-layer decode time for cross-runtime comparison.

§validate: String

Inline correctness validation: none, basic, contains:X, pattern:X

§fail_on_quality: Option<f64>

Exit non-zero if quality pass rate drops below this threshold (e.g., 0.95)

§spike_threshold: f64

Multiplier of median ITL for spike detection (default: 5.0)

§gpu_telemetry: bool

Enable GPU telemetry collection via nvidia-smi

§gpu_poll_interval: String

GPU telemetry polling interval (e.g., 1s, 2s)

§expected_clock_mhz: Option<u32>

Expected GPU clock speed in MHz for throttle detection (auto-detect if omitted)

§skip_health_check: bool

Skip the pre-flight health check (not recommended)

§dataset: Option<PathBuf>

Path to JSONL dataset file for workload-driven benchmarking

§max_tokens: Option<u32>

Override max_tokens for all requests (e.g., `--max-tokens 128`)

§max_tokens_distribution: Option<String>

Max tokens distribution: uniform:MIN,MAX or fixed:N. Creates heterogeneous traffic with staggered completion times. Example: `--max-tokens-distribution uniform:16,128`

Trait Implementations§

Source §

impl Args for LlmLoadArgs

Source §

fn group_id() -> Option<Id>

Report the ArgGroup::id for this set of arguments

Source §

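fn augment_args<'b>(__clap_app: Command) -> Command

fn augment_args_for_update<'b>(__clap_app: Command) -> Command

impl CommandFactory for LlmLoadArgs

fn command<'b>() -> Command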

Build a Command that can instantiate Self. Read more

Source §

fn command_for_update<'b>() -> Command

Build a Command that can update self. Read more

Source §

impl Debug for LlmLoadArgs

Source §

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Source §

impl FromArgMatches for LlmLoadArgs

Source §

fn from_arg_matches(__clap_arg_matches: &ArgMatches) -> Result<Self, Error>

Instantiate Self from ArgMatches, parsing the arguments as needed. Read more

Source §

fn from_arg_matches_mut( __clap_arg_matches: &mut ArgMatches, ) -> Result<Self, Error>

Instantiate Self from ArgMatches, parsing the arguments as needed. Read more

Source §

fn update_from_arg_matches( &mut self, __clap_arg_matches: &ArgMatches, ) -> Result<(), Error>

Assign values from ArgMatches to self.

Source §

fn update_from_arg_matches_mut( &mut self, __clap_arg_matches: &mut ArgMatches, ) -> Result<(), Error>

Assign values from ArgMatches to self.

Source §

impl Parser for LlmLoadArgs

Source §

fn parse() -> Self

Parse from std::env::args_os(), exit on error.

Source §

fn try_parse() -> Result<Self, Error>

Parse from std::env::args_os(), return Err on error.

Source §

fn parse_from<I, T>(itr: I) -> Self
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

Parse from iterator, exit on error.

Source §

fn try_parse_from<I, T>(itr: I) -> Result<Self, Error>
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

Parse from iterator, return Err on error.

Source §

fn update_from<I, T>(&mut self, itr: I)
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

Update from iterator, exit on error. Read more

Source §

fn try_update_from<I, T>(&mut self, itr: I) -> Result<(), Error>
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

Update from iterator, return Err on error.

Auto Trait Implementations§

§

impl Freeze for LlmLoadArgs

§

impl RefUnwindSafe for LlmLoadArgs

§

impl Send for LlmLoadArgs

§

impl Sync for LlmLoadArgs

§

impl Unpin for LlmLoadArgs

§

impl UnsafeUnpin for LlmLoadArgs

§

impl UnwindSafe for LlmLoadArgs

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<A, B, T> HttpServerConnExec<A, B> for T
where B: Body,

Source §

impl<T> Instrument for T

Source §

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more

Source §

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> IntoEither for T

Source §

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

impl<T> Pointable for T

Source §

const ALIGN: usize

The alignment of pointer.

Source §

type Init = T

The type for initializers.

Source §

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes a with the given initializer. Read more

Source §

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more

Source §

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more

Source §

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more

Source §

impl<T> PolicyExt for T
where T: ?Sized,

Source §

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow only if self and other return Action::Follow. Read more

Source §

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow if either self or other returns Action::Follow. Read more

Source §

impl<T> Same for T

Source §

type Output = T

Should always be Self

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Source §

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source §

fn vzip(self) -> V

Source §

impl<T> WithSubscriber for T

Source §

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more

Source §

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more

LlmLoadArgs

Struct LlmLoadArgs

Fields§

Trait Implementations§

impl Args for LlmLoadArgs

fn group_id() -> Option<Id>

fn augment_args<'b>(__clap_app: Command) -> Command

fn augment_args_for_update<'b>(__clap_app: Command) -> Command

impl CommandFactory for LlmLoadArgs

fn command<'b>() -> Command

fn command_for_update<'b>() -> Command

impl Debug for LlmLoadArgs

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl FromArgMatches for LlmLoadArgs

fn from_arg_matches(__clap_arg_matches: &ArgMatches) -> Result<Self, Error>

fn from_arg_matches_mut( __clap_arg_matches: &mut ArgMatches, ) -> Result<Self, Error>

fn update_from_arg_matches( &mut self, __clap_arg_matches: &ArgMatches, ) -> Result<(), Error>

fn update_from_arg_matches_mut( &mut self, __clap_arg_matches: &mut ArgMatches, ) -> Result<(), Error>

impl Parser for LlmLoadArgs

fn parse() -> Self

fn try_parse() -> Result<Self, Error>

fn parse_from<I, T>(itr: I) -> Self
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

fn try_parse_from<I, T>(itr: I) -> Result<Self, Error>
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

fn update_from<I, T>(&mut self, itr: I)
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

fn try_update_from<I, T>(&mut self, itr: I) -> Result<(), Error>
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

Auto Trait Implementations§

impl Freeze for LlmLoadArgs

impl RefUnwindSafe for LlmLoadArgs

impl Send for LlmLoadArgs

impl Sync for LlmLoadArgs

impl Unpin for LlmLoadArgs

impl UnsafeUnpin for LlmLoadArgs

impl UnwindSafe for LlmLoadArgs

Blanket Implementations§

impl<T> Any for T
where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T
where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T
where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<A, B, T> HttpServerConnExec<A, B> for T
where B: Body,

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T
where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

impl<T> Same for T

type Output = T

impl<T, U> TryFrom<U> for T
where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct LlmLoadArgs

fn parse_from<I, T>(itr: I) -> Self
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

fn try_parse_from<I, T>(itr: I) -> Result<Self, Error>
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

fn update_from<I, T>(&mut self, itr: I)
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

fn try_update_from<I, T>(&mut self, itr: I) -> Result<(), Error>
where I: IntoIterator<Item = T>, T: Into<OsString> + Clone,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<A, B, T> HttpServerConnExec<A, B> for T
where B: Body,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,