from __future__ import annotations
from oxillama_py.callback import StreamingCallback, TokenCallback
from oxillama_py.tqdm_helper import CollectTokens, TqdmProgress
from oxillama_py.utils import decode_from_logits
# Pull the engine classes and the exception types from the
# ``oxillama_py.oxillama_py`` submodule (presumably the compiled native
# extension -- TODO confirm).  If that import fails, every name is bound to
# ``None`` instead, so importing this package still succeeds and the
# pure-Python helpers remain usable.
try:
    from oxillama_py.oxillama_py import (
        # Classes
        Engine,
        EngineConfig,
        Lora,
        SamplerConfig,
        SpeculativeConfig,
        SpeculativeEngine,
        Tokenizer,
        # Exception types
        GenerateError,
        GrammarError,
        LoadError,
        OxiLlamaError,
        QuantError,
        TokenizerError,
    )
except ImportError:
    # Placeholders only: callers must check for ``None`` before using any of
    # these names when the submodule could not be imported.
    Engine = EngineConfig = Lora = None
    SamplerConfig = SpeculativeConfig = SpeculativeEngine = None
    Tokenizer = None
    GenerateError = GrammarError = LoadError = None
    OxiLlamaError = QuantError = TokenizerError = None
# Version string of this Python package.
__version__ = "0.1.0"

# Names exported by ``from oxillama_py import *``.  Every name imported into
# this module at the top of the file is listed, so the wildcard export matches
# what ``oxillama_py.<name>`` attribute access already provides.
__all__ = [
    # Imported from ``oxillama_py.oxillama_py`` (each is ``None`` when that
    # import fails).
    "EngineConfig",
    "Engine",
    "SamplerConfig",
    "SpeculativeConfig",
    "SpeculativeEngine",
    "Lora",
    "Tokenizer",
    "OxiLlamaError",
    "LoadError",
    "GenerateError",
    "TokenizerError",
    "GrammarError",
    "QuantError",
    # Imported from ``oxillama_py.callback``.
    "StreamingCallback",
    "TokenCallback",
    # Imported from ``oxillama_py.tqdm_helper``.
    "CollectTokens",
    "TqdmProgress",
    # Imported from ``oxillama_py.utils``.
    "decode_from_logits",
]