base_d/lib.rs
1//! # base-d
2//!
3//! A universal, multi-alphabet encoding library for Rust.
4//!
5//! Encode binary data to 33+ alphabets including RFC standards, ancient scripts,
6//! emoji, playing cards, and more. Supports three encoding modes: mathematical
7//! base conversion, RFC 4648 chunked encoding, and direct byte-range mapping.
8//!
9//! ## Quick Start
10//!
11//! ```
12//! use base_d::{AlphabetsConfig, Alphabet, encode, decode};
13//!
14//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
15//! // Load built-in alphabets
16//! let config = AlphabetsConfig::load_default()?;
17//! let base64_config = config.get_alphabet("base64").unwrap();
18//!
19//! // Create alphabet
20//! let chars: Vec<char> = base64_config.chars.chars().collect();
21//! let padding = base64_config.padding.as_ref().and_then(|s| s.chars().next());
22//! let alphabet = Alphabet::new_with_mode(
23//! chars,
24//! base64_config.mode.clone(),
25//! padding
26//! )?;
27//!
28//! // Encode and decode
29//! let data = b"Hello, World!";
30//! let encoded = encode(data, &alphabet);
31//! let decoded = decode(&encoded, &alphabet)?;
32//! assert_eq!(data, &decoded[..]);
33//! # Ok(())
34//! # }
35//! ```
36//!
37//! ## Features
38//!
39//! - **33 Built-in Alphabets**: RFC standards, emoji, ancient scripts, and more
40//! - **3 Encoding Modes**: Mathematical, chunked (RFC-compliant), byte-range
41//! - **Streaming Support**: Memory-efficient processing for large files
42//! - **Custom Alphabets**: Define your own via TOML configuration
43//! - **User Configuration**: Load alphabets from `~/.config/base-d/alphabets.toml`
44//!
45//! ## Encoding Modes
46//!
47//! ### Mathematical Base Conversion
48//!
49//! Treats data as a large number. Works with any alphabet size.
50//!
51//! ```
52//! use base_d::{Alphabet, EncodingMode, encode};
53//!
54//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
55//! let chars: Vec<char> = "😀😁😂🤣😃😄😅😆".chars().collect();
56//! let alphabet = Alphabet::new_with_mode(
57//! chars,
58//! EncodingMode::BaseConversion,
59//! None
60//! )?;
61//!
62//! let encoded = encode(b"Hi", &alphabet);
63//! # Ok(())
64//! # }
65//! ```
66//!
67//! ### Chunked Mode (RFC 4648)
68//!
69//! Fixed-size bit groups, compatible with standard base64/base32.
70//!
71//! ```
72//! use base_d::{Alphabet, EncodingMode, encode};
73//!
74//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
75//! let chars: Vec<char> = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/"
76//! .chars().collect();
77//! let alphabet = Alphabet::new_with_mode(
78//! chars,
79//! EncodingMode::Chunked,
80//! Some('=')
81//! )?;
82//!
83//! let encoded = encode(b"Hello", &alphabet);
84//! assert_eq!(encoded, "SGVsbG8=");
85//! # Ok(())
86//! # }
87//! ```
88//!
89//! ### Byte Range Mode
90//!
91//! Direct 1:1 byte-to-emoji mapping. Zero encoding overhead.
92//!
93//! ```
94//! use base_d::{Alphabet, EncodingMode, encode};
95//!
96//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
97//! let alphabet = Alphabet::new_with_mode_and_range(
98//! Vec::new(),
99//! EncodingMode::ByteRange,
100//! None,
101//! Some(127991) // U+1F3F7
102//! )?;
103//!
104//! let data = b"Hi";
105//! let encoded = encode(data, &alphabet);
106//! assert_eq!(encoded.chars().count(), 2); // 1:1 mapping
107//! # Ok(())
108//! # }
109//! ```
110//!
111//! ## Streaming
112//!
113//! For large files, use streaming to avoid loading entire file into memory:
114//!
115//! ```no_run
116//! use base_d::{AlphabetsConfig, StreamingEncoder};
117//! use std::fs::File;
118//!
119//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
120//! let config = AlphabetsConfig::load_default()?;
121//! let alphabet_config = config.get_alphabet("base64").unwrap();
122//!
123//! // ... create alphabet from config
124//! # let chars: Vec<char> = alphabet_config.chars.chars().collect();
125//! # let padding = alphabet_config.padding.as_ref().and_then(|s| s.chars().next());
126//! # let alphabet = base_d::Alphabet::new_with_mode(chars, alphabet_config.mode.clone(), padding)?;
127//!
128//! let mut input = File::open("large_file.bin")?;
129//! let output = File::create("encoded.txt")?;
130//!
131//! let mut encoder = StreamingEncoder::new(&alphabet, output);
132//! encoder.encode(&mut input)?;
133//! # Ok(())
134//! # }
135//! ```
136
137mod core;
138mod encoders;
139
140pub use core::alphabet::Alphabet;
141pub use core::config::{AlphabetsConfig, AlphabetConfig, EncodingMode};
142pub use encoders::streaming::{StreamingEncoder, StreamingDecoder};
143pub use encoders::encoding::DecodeError;
144
145/// Encodes binary data using the specified alphabet.
146///
147/// Automatically selects the appropriate encoding strategy based on the
148/// alphabet's mode (BaseConversion, Chunked, or ByteRange).
149///
150/// # Arguments
151///
152/// * `data` - The binary data to encode
153/// * `alphabet` - The alphabet to use for encoding
154///
155/// # Returns
156///
157/// A string containing the encoded data
158///
159/// # Examples
160///
161/// ```
162/// use base_d::{Alphabet, EncodingMode};
163///
164/// # fn main() -> Result<(), Box<dyn std::error::Error>> {
165/// let chars: Vec<char> = "01".chars().collect();
166/// let alphabet = Alphabet::new_with_mode(chars, EncodingMode::BaseConversion, None)?;
167/// let encoded = base_d::encode(b"Hi", &alphabet);
168/// # Ok(())
169/// # }
170/// ```
171pub fn encode(data: &[u8], alphabet: &Alphabet) -> String {
172 match alphabet.mode() {
173 EncodingMode::BaseConversion => encoders::encoding::encode(data, alphabet),
174 EncodingMode::Chunked => encoders::chunked::encode_chunked(data, alphabet),
175 EncodingMode::ByteRange => encoders::byte_range::encode_byte_range(data, alphabet),
176 }
177}
178
179/// Decodes a string back to binary data using the specified alphabet.
180///
181/// Automatically selects the appropriate decoding strategy based on the
182/// alphabet's mode (BaseConversion, Chunked, or ByteRange).
183///
184/// # Arguments
185///
186/// * `encoded` - The encoded string to decode
187/// * `alphabet` - The alphabet used for encoding
188///
189/// # Returns
190///
191/// A `Result` containing the decoded binary data, or a `DecodeError` if
192/// the input is invalid
193///
194/// # Errors
195///
196/// Returns `DecodeError` if:
197/// - The input contains invalid characters
198/// - The input is empty
199/// - The padding is invalid (for chunked mode)
200///
201/// # Examples
202///
203/// ```
204/// use base_d::{Alphabet, EncodingMode, encode, decode};
205///
206/// # fn main() -> Result<(), Box<dyn std::error::Error>> {
207/// let chars: Vec<char> = "01".chars().collect();
208/// let alphabet = Alphabet::new_with_mode(chars, EncodingMode::BaseConversion, None)?;
209/// let data = b"Hi";
210/// let encoded = encode(data, &alphabet);
211/// let decoded = decode(&encoded, &alphabet)?;
212/// assert_eq!(data, &decoded[..]);
213/// # Ok(())
214/// # }
215/// ```
216pub fn decode(encoded: &str, alphabet: &Alphabet) -> Result<Vec<u8>, DecodeError> {
217 match alphabet.mode() {
218 EncodingMode::BaseConversion => encoders::encoding::decode(encoded, alphabet),
219 EncodingMode::Chunked => encoders::chunked::decode_chunked(encoded, alphabet),
220 EncodingMode::ByteRange => encoders::byte_range::decode_byte_range(encoded, alphabet),
221 }
222}
223
224#[cfg(test)]
225mod tests;