pub struct KvCache<B: Backend> {
pub k: B::Buffer,
pub v: B::Buffer,
pub len: usize,
pub capacity: usize,
pub num_kv_heads: usize,
pub head_dim: usize,
}Expand description
Per-layer KV cache. Each model owns its own Vec<KvCache<B>> per sequence.
Fields§
§k: B::Buffer
§v: B::Buffer
§len: usize
§capacity: usize
§num_kv_heads: usize
§head_dim: usize
Auto Trait Implementations§
impl<B> Freeze for KvCache<B>
impl<B> RefUnwindSafe for KvCache<B>
impl<B> Send for KvCache<B>
impl<B> Sync for KvCache<B>
impl<B> Unpin for KvCache<B>
impl<B> UnsafeUnpin for KvCache<B>
impl<B> UnwindSafe for KvCache<B>
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more