pub trait ModelRunner {
// Required methods
fn forward(
&self,
input: &ModelInput,
config: &InferenceConfig,
) -> Result<ModelOutput, SparseInferenceError>;
fn get_predictor(&self, layer_idx: usize) -> Option<&LowRankPredictor>;
fn calibrate(
&mut self,
samples: &[ModelInput],
) -> Result<CalibrationStats, SparseInferenceError>;
fn metadata(&self) -> &ModelMetadata;
}Expand description
Trait for running inference on models
Required Methods
Source fn forward(
&self,
input: &ModelInput,
config: &InferenceConfig,
) -> Result<ModelOutput, SparseInferenceError>
fn forward( &self, input: &ModelInput, config: &InferenceConfig, ) -> Result<ModelOutput, SparseInferenceError>
Forward pass with optional sparse computation
Source fn get_predictor(&self, layer_idx: usize) -> Option<&LowRankPredictor>
fn get_predictor(&self, layer_idx: usize) -> Option<&LowRankPredictor>
Get predictor for a specific layer (if available)
Source fn calibrate(
&mut self,
samples: &[ModelInput],
) -> Result<CalibrationStats, SparseInferenceError>
fn calibrate( &mut self, samples: &[ModelInput], ) -> Result<CalibrationStats, SparseInferenceError>
Calibrate predictors with sample data
Source fn metadata(&self) -> &ModelMetadata
fn metadata(&self) -> &ModelMetadata
Get model metadata