Struct LlamaContextParams

pub struct LlamaContextParams {
    pub context_params: llama_context_params,
}

Fields§

§context_params: llama_context_params

Implementations§

Trait Implementations§

Returns a duplicate of the value. Read more

Performs copy-assignment from source. Read more

Formats the value using the given formatter. Read more

Returns the “default value” for a type. Read more

Auto Trait Implementations§

Blanket Implementations§

Gets the TypeId of self. Read more

Immutably borrows from an owned value. Read more

Mutably borrows from an owned value. Read more

🔬This is a nightly-only experimental API. (clone_to_uninit)

Performs copy-assignment from self to dest. Read more

Returns the argument unchanged.

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

The alignment of pointer.

The type for initializers.

Initializes a value with the given initializer. Read more

Dereferences the given pointer. Read more

Mutably dereferences the given pointer. Read more

Drops the object pointed to by the given pointer. Read more

The resulting type after obtaining ownership.

Creates owned data from borrowed data, usually by cloning. Read more

Uses borrowed data to replace owned data, usually by cloning. Read more

The type returned in the event of a conversion error.

Performs the conversion.

The type returned in the event of a conversion error.

Performs the conversion.

Struct LlamaContextParams

Fields§

Implementations§

impl LlamaContextParams

pub fn with_n_ctx(self, n_ctx: Option<NonZeroU32>) -> Self

pub const fn n_ctx(&self) -> Option<NonZeroU32>

pub const fn with_n_batch(self, n_batch: u32) -> Self

pub const fn n_batch(&self) -> u32

pub const fn with_n_ubatch(self, n_ubatch: u32) -> Self

pub const fn n_ubatch(&self) -> u32

pub const fn with_flash_attention_policy(self, policy: llama_flash_attn_type) -> Self

pub const fn flash_attention_policy(&self) -> llama_flash_attn_type

pub const fn with_offload_kqv(self, enabled: bool) -> Self

pub const fn offload_kqv(&self) -> bool

pub fn with_rope_scaling_type(self, rope_scaling_type: RopeScalingType) -> Self

pub fn rope_scaling_type(&self) -> RopeScalingType

pub const fn with_rope_freq_base(self, rope_freq_base: f32) -> Self

pub const fn rope_freq_base(&self) -> f32

pub const fn with_rope_freq_scale(self, rope_freq_scale: f32) -> Self

pub const fn rope_freq_scale(&self) -> f32

pub const fn n_threads(&self) -> i32

pub const fn n_threads_batch(&self) -> i32

pub const fn with_n_threads(self, n_threads: i32) -> Self

pub const fn with_n_threads_batch(self, n_threads: i32) -> Self

pub const fn embeddings(&self) -> bool

pub const fn with_embeddings(self, embedding: bool) -> Self

pub fn with_cb_eval(self, cb_eval: ggml_backend_sched_eval_callback) -> Self

pub const fn with_cb_eval_user_data(self, cb_eval_user_data: *mut c_void) -> Self

pub fn with_pooling_type(self, pooling_type: LlamaPoolingType) -> Self

pub fn pooling_type(&self) -> LlamaPoolingType

pub const fn with_swa_full(self, enabled: bool) -> Self

pub const fn swa_full(&self) -> bool

pub const fn with_n_seq_max(self, n_seq_max: u32) -> Self

pub const fn n_seq_max(&self) -> u32

pub fn with_type_k(self, type_k: KvCacheType) -> Self

pub fn type_k(&self) -> KvCacheType

pub fn with_type_v(self, type_v: KvCacheType) -> Self

pub fn type_v(&self) -> KvCacheType

pub fn with_attention_type(self, attention_type: LlamaAttentionType) -> Self

pub fn attention_type(&self) -> LlamaAttentionType

pub const fn with_yarn_ext_factor(self, yarn_ext_factor: f32) -> Self

pub const fn yarn_ext_factor(&self) -> f32

pub const fn with_yarn_attn_factor(self, yarn_attn_factor: f32) -> Self

pub const fn yarn_attn_factor(&self) -> f32

pub const fn with_yarn_beta_fast(self, yarn_beta_fast: f32) -> Self

pub const fn yarn_beta_fast(&self) -> f32

pub const fn with_yarn_beta_slow(self, yarn_beta_slow: f32) -> Self

pub const fn yarn_beta_slow(&self) -> f32

pub const fn with_yarn_orig_ctx(self, yarn_orig_ctx: u32) -> Self

pub const fn yarn_orig_ctx(&self) -> u32

pub const fn with_defrag_thold(self, defrag_thold: f32) -> Self

pub const fn defrag_thold(&self) -> f32

pub const fn with_no_perf(self, no_perf: bool) -> Self

pub const fn no_perf(&self) -> bool

pub const fn with_op_offload(self, op_offload: bool) -> Self

pub const fn op_offload(&self) -> bool

pub const fn with_kv_unified(self, kv_unified: bool) -> Self

pub const fn kv_unified(&self) -> bool

Trait Implementations§

impl Clone for LlamaContextParams

fn clone(&self) -> LlamaContextParams

fn clone_from(&mut self, source: &Self)

impl Debug for LlamaContextParams

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl Default for LlamaContextParams

fn default() -> Self

impl Send for LlamaContextParams

impl Sync for LlamaContextParams

Auto Trait Implementations§

impl Freeze for LlamaContextParams

impl RefUnwindSafe for LlamaContextParams

impl Unpin for LlamaContextParams

impl UnsafeUnpin for LlamaContextParams

impl UnwindSafe for LlamaContextParams

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

Struct LlamaContextParams

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,