Struct llama_cpp_2::llama_batch::LlamaBatch
pub struct LlamaBatch { /* private fields */ }
A safe wrapper around llama_batch.
Implementations
impl LlamaBatch
pub fn clear(&mut self)
Clear the batch. This does not free the memory associated with the batch; it only resets the number of tokens to 0, so the allocation can be reused.
👎Deprecated: not compatible with multiple sequences. prefer setting logits while adding tokens
pub fn set_last_logit(&mut self, value: bool)
Set the logits flag of the last token in the batch to `value`. If `value` is true, the token's logits will be initialized after a decode and can be read from. If `value` is false, they will not be initialized (this is the default).
Panics
Panics if there are no tokens in the batch.
pub fn add(
    &mut self,
    LlamaToken: LlamaToken,
    pos: llama_pos,
    seq_ids: &[i32],
    logits: bool
)
Add a token to the batch for the sequences `seq_ids` at position `pos`. If `logits` is true, the token's logits will be initialized and can be read from after the next decode.
Panics
- Panics if `self.llama_batch.n_tokens` does not fit into a `usize`.
- Panics if `seq_ids.len()` does not fit into a `llama_seq_id`.
pub fn new(n_tokens: usize, embd: i32, n_seq_max: i32) -> Self
Create a new `LlamaBatch` that can contain up to `n_tokens` tokens.
Panics
Panics if n_tokens is greater than i32::MAX.
👎Deprecated: not compatible with multiple sequences. use add_prompt_seq instead
pub fn add_prompt(&mut self, prompt: &[LlamaToken])
Add a prompt to the batch at sequence id 0.
pub fn add_prompt_seq(&mut self, prompt: &[LlamaToken], seq_ids: &[i32])
Add a prompt to the batch under the given sequence ids. This must be the initial prompt, as it will be added to the batch starting at position 0.