kyro 0.1.1

A high-performance ML inference engine
1
2
3
4
5
6
7
8
9
10
11
// NOTE(review): this suppresses the `dead_code` lint for everything in this
// scope, including the submodules below. The reason is not visible from this
// file — confirm it is still needed, or narrow it to the specific items.
#![allow(dead_code)]

// Public submodules. Presumably one quantization scheme each (AWQ and FP8,
// judging by the names) — confirm against the module contents.
pub mod awq;
pub mod fp8;

use candle_core::{Result, Tensor};

/// Interface for a layer that exposes a tensor-to-tensor [`forward`] call and
/// an [`unpack_weights`] accessor, both returning `candle_core` results.
///
/// [`forward`]: QuantizedLayer::forward
/// [`unpack_weights`]: QuantizedLayer::unpack_weights
// NOTE(review): presumably implemented by the layer types in the `awq` and
// `fp8` submodules — confirm against those modules.
pub trait QuantizedLayer {
    /// Runs the layer's forward computation on `x` and returns the resulting
    /// tensor.
    ///
    /// # Errors
    ///
    /// Returns an error if the implementation's computation fails.
    fn forward(&self, x: &Tensor) -> Result<Tensor>;
    /// Returns the layer's weights as a [`Tensor`].
    ///
    /// # Errors
    ///
    /// Returns an error if the implementation cannot produce the tensor.
    // NOTE(review): the name suggests the result is the unpacked (dequantized)
    // form of the stored weights; shape and dtype are not specified here —
    // confirm against the implementors.
    fn unpack_weights(&self) -> Result<Tensor>;
}