base_d/lib.rs
1//! # base-d
2//!
3//! A universal, multi-alphabet encoding library for Rust.
4//!
5//! Encode binary data to 33+ alphabets including RFC standards, ancient scripts,
6//! emoji, playing cards, and more. Supports three encoding modes: mathematical
7//! base conversion, RFC 4648 chunked encoding, and direct byte-range mapping.
8//!
9//! ## Quick Start
10//!
11//! ```
12//! use base_d::{AlphabetsConfig, Alphabet, encode, decode};
13//!
14//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
15//! // Load built-in alphabets
16//! let config = AlphabetsConfig::load_default()?;
17//! let base64_config = config.get_alphabet("base64").unwrap();
18//!
19//! // Create alphabet
20//! let chars: Vec<char> = base64_config.chars.chars().collect();
21//! let padding = base64_config.padding.as_ref().and_then(|s| s.chars().next());
22//! let alphabet = Alphabet::new_with_mode(
23//! chars,
24//! base64_config.mode.clone(),
25//! padding
26//! )?;
27//!
28//! // Encode and decode
29//! let data = b"Hello, World!";
30//! let encoded = encode(data, &alphabet);
31//! let decoded = decode(&encoded, &alphabet)?;
32//! assert_eq!(data, &decoded[..]);
33//! # Ok(())
34//! # }
35//! ```
36//!
37//! ## Features
38//!
39//! - **33 Built-in Alphabets**: RFC standards, emoji, ancient scripts, and more
40//! - **3 Encoding Modes**: Mathematical, chunked (RFC-compliant), byte-range
41//! - **Streaming Support**: Memory-efficient processing for large files
42//! - **Custom Alphabets**: Define your own via TOML configuration
43//! - **User Configuration**: Load alphabets from `~/.config/base-d/alphabets.toml`
44//!
45//! ## Encoding Modes
46//!
47//! ### Mathematical Base Conversion
48//!
49//! Treats data as a large number. Works with any alphabet size.
50//!
51//! ```
52//! use base_d::{Alphabet, EncodingMode, encode};
53//!
54//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
55//! let chars: Vec<char> = "😀😁😂🤣😃😄😅😆".chars().collect();
56//! let alphabet = Alphabet::new_with_mode(
57//! chars,
58//! EncodingMode::BaseConversion,
59//! None
60//! )?;
61//!
62//! let encoded = encode(b"Hi", &alphabet);
63//! # Ok(())
64//! # }
65//! ```
66//!
67//! ### Chunked Mode (RFC 4648)
68//!
69//! Fixed-size bit groups, compatible with standard base64/base32.
70//!
71//! ```
72//! use base_d::{Alphabet, EncodingMode, encode};
73//!
74//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
75//! let chars: Vec<char> = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/"
76//! .chars().collect();
77//! let alphabet = Alphabet::new_with_mode(
78//! chars,
79//! EncodingMode::Chunked,
80//! Some('=')
81//! )?;
82//!
83//! let encoded = encode(b"Hello", &alphabet);
84//! assert_eq!(encoded, "SGVsbG8=");
85//! # Ok(())
86//! # }
87//! ```
88//!
89//! ### Byte Range Mode
90//!
91//! Direct 1:1 byte-to-emoji mapping. Zero encoding overhead.
92//!
93//! ```
94//! use base_d::{Alphabet, EncodingMode, encode};
95//!
96//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
97//! let alphabet = Alphabet::new_with_mode_and_range(
98//! Vec::new(),
99//! EncodingMode::ByteRange,
100//! None,
101//! Some(127991) // U+1F3F7
102//! )?;
103//!
104//! let data = b"Hi";
105//! let encoded = encode(data, &alphabet);
106//! assert_eq!(encoded.chars().count(), 2); // 1:1 mapping
107//! # Ok(())
108//! # }
109//! ```
110//!
111//! ## Streaming
112//!
113//! For large files, use streaming to avoid loading entire file into memory:
114//!
115//! ```no_run
116//! use base_d::{AlphabetsConfig, StreamingEncoder};
117//! use std::fs::File;
118//!
119//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
120//! let config = AlphabetsConfig::load_default()?;
121//! let alphabet_config = config.get_alphabet("base64").unwrap();
122//!
123//! // ... create alphabet from config
124//! # let chars: Vec<char> = alphabet_config.chars.chars().collect();
125//! # let padding = alphabet_config.padding.as_ref().and_then(|s| s.chars().next());
126//! # let alphabet = base_d::Alphabet::new_with_mode(chars, alphabet_config.mode.clone(), padding)?;
127//!
128//! let mut input = File::open("large_file.bin")?;
129//! let output = File::create("encoded.txt")?;
130//!
131//! let mut encoder = StreamingEncoder::new(&alphabet, output);
132//! encoder.encode(&mut input)?;
133//! # Ok(())
134//! # }
135//! ```
136
137mod alphabet;
138mod encoding;
139mod chunked;
140mod byte_range;
141mod config;
142mod streaming;
143
144pub use alphabet::Alphabet;
145pub use config::{AlphabetsConfig, AlphabetConfig, EncodingMode};
146pub use streaming::{StreamingEncoder, StreamingDecoder};
147pub use encoding::DecodeError;
148
149/// Encodes binary data using the specified alphabet.
150///
151/// Automatically selects the appropriate encoding strategy based on the
152/// alphabet's mode (BaseConversion, Chunked, or ByteRange).
153///
154/// # Arguments
155///
156/// * `data` - The binary data to encode
157/// * `alphabet` - The alphabet to use for encoding
158///
159/// # Returns
160///
161/// A string containing the encoded data
162///
163/// # Examples
164///
165/// ```
166/// use base_d::{Alphabet, EncodingMode};
167///
168/// # fn main() -> Result<(), Box<dyn std::error::Error>> {
169/// let chars: Vec<char> = "01".chars().collect();
170/// let alphabet = Alphabet::new_with_mode(chars, EncodingMode::BaseConversion, None)?;
171/// let encoded = base_d::encode(b"Hi", &alphabet);
172/// # Ok(())
173/// # }
174/// ```
175pub fn encode(data: &[u8], alphabet: &Alphabet) -> String {
176 match alphabet.mode() {
177 EncodingMode::BaseConversion => encoding::encode(data, alphabet),
178 EncodingMode::Chunked => chunked::encode_chunked(data, alphabet),
179 EncodingMode::ByteRange => byte_range::encode_byte_range(data, alphabet),
180 }
181}
182
183/// Decodes a string back to binary data using the specified alphabet.
184///
185/// Automatically selects the appropriate decoding strategy based on the
186/// alphabet's mode (BaseConversion, Chunked, or ByteRange).
187///
188/// # Arguments
189///
190/// * `encoded` - The encoded string to decode
191/// * `alphabet` - The alphabet used for encoding
192///
193/// # Returns
194///
195/// A `Result` containing the decoded binary data, or a `DecodeError` if
196/// the input is invalid
197///
198/// # Errors
199///
200/// Returns `DecodeError` if:
201/// - The input contains invalid characters
202/// - The input is empty
203/// - The padding is invalid (for chunked mode)
204///
205/// # Examples
206///
207/// ```
208/// use base_d::{Alphabet, EncodingMode, encode, decode};
209///
210/// # fn main() -> Result<(), Box<dyn std::error::Error>> {
211/// let chars: Vec<char> = "01".chars().collect();
212/// let alphabet = Alphabet::new_with_mode(chars, EncodingMode::BaseConversion, None)?;
213/// let data = b"Hi";
214/// let encoded = encode(data, &alphabet);
215/// let decoded = decode(&encoded, &alphabet)?;
216/// assert_eq!(data, &decoded[..]);
217/// # Ok(())
218/// # }
219/// ```
220pub fn decode(encoded: &str, alphabet: &Alphabet) -> Result<Vec<u8>, DecodeError> {
221 match alphabet.mode() {
222 EncodingMode::BaseConversion => encoding::decode(encoded, alphabet),
223 EncodingMode::Chunked => chunked::decode_chunked(encoded, alphabet),
224 EncodingMode::ByteRange => byte_range::decode_byte_range(encoded, alphabet),
225 }
226}
227
228#[cfg(test)]
229mod tests;