use crate::tokenizer::Tokenizer;
use std::sync::Arc;
pub mod api_model;
pub mod local_model;
pub mod tokenizer;
#[allow(unused_imports)]
pub(crate) use anyhow::{Error, Result, anyhow, bail};
#[allow(unused_imports)]
pub(crate) use tracing::{Level, debug, error, info, span, trace, warn};
#[derive(Clone)]
pub struct LLMModelBase {
pub model_id: String,
pub model_ctx_size: u64,
pub inference_ctx_size: u64,
pub tokenizer: Arc<Tokenizer>,
}