pub struct SpeculativeSamplingPlan { /* private fields */ }
Expand description
Speculative-decode verification plan (FlashInfer ChainSpeculativeSampling).
Implementations§
Source§impl SpeculativeSamplingPlan
impl SpeculativeSamplingPlan
Source pub fn select(
_stream: &Stream,
desc: &SpeculativeSamplingDescriptor,
_pref: PlanPreference,
) -> Result<Self>
pub fn select(_stream: &Stream, desc: &SpeculativeSamplingDescriptor, _pref: PlanPreference) -> Result<Self>
Validate the descriptor.
Source pub fn can_implement(&self, args: &SpeculativeSamplingArgs<'_>) -> Result<()>
pub fn can_implement(&self, args: &SpeculativeSamplingArgs<'_>) -> Result<()>
Validate args against the descriptor.
Source pub fn workspace_size(&self) -> usize
pub fn workspace_size(&self) -> usize
Returns the required workspace size in bytes — always 0.
Source pub fn precision_guarantee(&self) -> PrecisionGuarantee
pub fn precision_guarantee(&self) -> PrecisionGuarantee
Returns the plan's numerical precision guarantees.
Auto Trait Implementations§
impl Freeze for SpeculativeSamplingPlan
impl RefUnwindSafe for SpeculativeSamplingPlan
impl Send for SpeculativeSamplingPlan
impl Sync for SpeculativeSamplingPlan
impl Unpin for SpeculativeSamplingPlan
impl UnsafeUnpin for SpeculativeSamplingPlan
impl UnwindSafe for SpeculativeSamplingPlan
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more