pub struct TokenizerTrainingMetrics {
pub training_time_sec: u64,
}
pub struct TokenizerVocabMetrics {
pub vocab_size: usize,
pub avg_token_length: f64,
pub max_token_length: usize,
pub min_token_length: usize,
}
pub struct TokenizerInferenceMetrics {
pub avg_encode_time_ns: f64,
pub avg_decode_time_ns: f64,
pub encode_throughput_tokens_per_sec: f64,
pub decode_throughput_tokens_per_sec: f64,
pub corpus_token_count: usize,
}
pub struct TokenizerDevelopmentResult {
pub version: String,
pub corpus_name: String,
pub corpus_size_bytes: u64,
pub training_metrics: TokenizerTrainingMetrics,
pub vocab_metrics: TokenizerVocabMetrics,
pub inference_metrics: TokenizerInferenceMetrics,
}