hermes-llm 1.3.3

LLM training from scratch using Candle
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
// Public modules that make up the crate's API surface. Each `pub mod` line
// declares a submodule whose source lives in a sibling file or directory.

/// Defines `Config`, which is re-exported at the crate root.
pub mod config;
/// NOTE(review): presumably dataset loading/batching; contents are not visible
/// from this file, so confirm against the module itself.
pub mod data;
/// Defines `DistributedConfig` and `NcclCommunicator`, both re-exported at the
/// crate root.
pub mod distributed;
/// NOTE(review): the name suggests Direct Preference Optimization; contents
/// are not visible from this file, so confirm against the module itself.
pub mod dpo;
/// NOTE(review): presumably input/output helpers (e.g. checkpoints); contents
/// are not visible from this file, so confirm against the module itself.
pub mod io;
/// Defines `GPT`, which is re-exported at the crate root.
pub mod model;
/// NOTE(review): presumably tokenizer support; contents are not visible from
/// this file, so confirm against the module itself.
pub mod tokenizer;
/// Defines `Trainer`, which is re-exported at the crate root.
pub mod training;

// Convenience re-exports: callers can name these types directly from the
// crate root instead of spelling out the full module path.
pub use config::Config;
pub use distributed::{DistributedConfig, NcclCommunicator};
pub use model::GPT;
pub use training::Trainer;