pub struct GenerationParams {
pub temperature: f64,
pub top_p: Option<f64>,
pub top_k: Option<usize>,
pub max_tokens: usize,
pub seed: u64,
pub repeat_penalty: f32,
pub repeat_last_n: usize,
}
Expand description
Sampling / generation parameters for Candle local inference.
Used inside [llm.candle.generation] or a [[llm.providers]] Candle entry.
Fields§
§temperature: f64
Sampling temperature. Higher values produce more creative outputs. Default: 0.7.
top_p: Option<f64>
Nucleus sampling threshold. When set, tokens with cumulative probability above
this value are excluded. Default: None (disabled).
top_k: Option<usize>
Top-k sampling. When set, only the top-k most probable tokens are considered.
Default: None (disabled).
max_tokens: usize
Maximum number of tokens to generate per response. Capped at MAX_TOKENS_CAP.
Default: 2048.
seed: u64
Random seed for reproducible outputs. Default: 42.
repeat_penalty: f32
Repetition penalty applied during sampling. Default: 1.1.
repeat_last_n: usize
Number of last tokens to consider for the repetition penalty window. Default: 64.
Implementations§
Source§impl GenerationParams
impl GenerationParams
Sourcepub fn capped_max_tokens(&self) -> usize
pub fn capped_max_tokens(&self) -> usize
Returns max_tokens clamped to MAX_TOKENS_CAP.
§Examples
use zeph_config::GenerationParams;
let params = GenerationParams::default();
assert!(params.capped_max_tokens() <= 32768);
Trait Implementations§
Source§impl Clone for GenerationParams
impl Clone for GenerationParams
Source§fn clone(&self) -> GenerationParams
fn clone(&self) -> GenerationParams
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for GenerationParams
impl Debug for GenerationParams
Source§impl Default for GenerationParams
impl Default for GenerationParams
Source§fn default() -> GenerationParams
fn default() -> GenerationParams
Source§impl<'de> Deserialize<'de> for GenerationParams
impl<'de> Deserialize<'de> for GenerationParams
Source§fn deserialize<__D>(
__deserializer: __D,
) -> Result<GenerationParams, <__D as Deserializer<'de>>::Error>
where
__D: Deserializer<'de>,
fn deserialize<__D>(
__deserializer: __D,
) -> Result<GenerationParams, <__D as Deserializer<'de>>::Error>
where
__D: Deserializer<'de>,
Source§impl Serialize for GenerationParams
impl Serialize for GenerationParams
Source§fn serialize<__S>(
&self,
__serializer: __S,
) -> Result<<__S as Serializer>::Ok, <__S as Serializer>::Error>
where
__S: Serializer,
fn serialize<__S>(
&self,
__serializer: __S,
) -> Result<<__S as Serializer>::Ok, <__S as Serializer>::Error>
where
__S: Serializer,
Auto Trait Implementations§
impl Freeze for GenerationParams
impl RefUnwindSafe for GenerationParams
impl Send for GenerationParams
impl Sync for GenerationParams
impl Unpin for GenerationParams
impl UnsafeUnpin for GenerationParams
impl UnwindSafe for GenerationParams
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
T: ?Sized,
impl<T> BorrowMut<T> for T
where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Source§impl<T> CloneToUninit for T
where
T: Clone,
impl<T> CloneToUninit for T
where
T: Clone,
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self>
if into_left is true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self>
if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read more
Source§impl<T> IntoRequest<T> for T
impl<T> IntoRequest<T> for T
Source§fn into_request(self) -> Request<T>
fn into_request(self) -> Request<T>
Wrap the input message T in a tonic::Request