use crate::{
channel::ComputeChannel,
server::{ComputeServer, Handle},
tune::{AutotuneOperationSet, Tuner},
};
use alloc::vec::Vec;
use alloc::{boxed::Box, sync::Arc};
use burn_common::reader::Reader;
use burn_common::stub::RwLock;
/// Client-side handle bundling a compute channel with a shared tuner.
///
/// The tuner sits behind an `Arc<RwLock<..>>`, so several clients can point at
/// the same tuner instance.
#[derive(Debug)]
pub struct ComputeClient<Server, Channel>
where
    Server: ComputeServer,
{
    /// Channel that every server-facing call is forwarded to.
    channel: Channel,
    /// Reference-counted, lock-guarded tuner used by the autotune methods.
    tuner: Arc<RwLock<Tuner<Server, Channel>>>,
}
impl<S, C> Clone for ComputeClient<S, C>
where
S: ComputeServer,
C: ComputeChannel<S>,
{
fn clone(&self) -> Self {
Self {
channel: self.channel.clone(),
tuner: self.tuner.clone(),
}
}
}
impl<Server, Channel> ComputeClient<Server, Channel>
where
Server: ComputeServer,
Channel: ComputeChannel<Server>,
{
pub fn new(channel: Channel, tuner: Arc<RwLock<Tuner<Server, Channel>>>) -> Self {
Self { channel, tuner }
}
pub fn read(&self, handle: &Handle<Server>) -> Reader<Vec<u8>> {
self.channel.read(handle)
}
pub fn create(&self, data: &[u8]) -> Handle<Server> {
self.channel.create(data)
}
pub fn empty(&self, size: usize) -> Handle<Server> {
self.channel.empty(size)
}
pub fn execute(&self, kernel: Server::Kernel, handles: &[&Handle<Server>]) {
self.channel.execute(kernel, handles)
}
pub fn sync(&self) {
self.channel.sync()
}
pub fn autotune_execute(
&self,
autotune_operation_set: Box<dyn AutotuneOperationSet<Server::AutotuneKey>>,
) {
self.tuner
.write()
.unwrap()
.execute_autotune(autotune_operation_set, self);
}
pub fn autotune_result(&self, key: &Server::AutotuneKey) -> Option<usize> {
self.tuner.read().unwrap().autotune_fastest(key)
}
}