linear_srgb/
lut.rs

1//! Lookup table (LUT) based sRGB conversions.
2//!
3//! This module provides two types of lookup tables:
4//!
5//! ## Build-time Tables (Recommended)
6//!
7//! [`SrgbConverter`] uses pre-computed const tables embedded in the binary:
8//! - **Zero initialization cost** - tables exist at compile time
9//! - **8-bit linearization** (256 entries, 1KB): Direct lookup for sRGB u8 → linear f32
10//! - **12-bit encoding** (4096 entries, 16KB): Interpolated lookup for linear f32 → sRGB f32
11//!
12//! ## Runtime Tables (For Custom Bit Depths)
13//!
14//! [`LinearizationTable`] and [`EncodingTable`] generate tables at runtime:
15//! - Use when you need non-standard bit depths (10-bit, 16-bit, etc.)
16//! - Incur one-time allocation and computation cost
17//! - Table sizes:
18//!   - 8-bit: 256 entries (1KB for f32)
19//!   - 10-bit: 1024 entries (4KB for f32)
20//!   - 12-bit: 4096 entries (16KB for f32)
21//!   - 16-bit: 65536 entries (256KB for f32)
22
23#[cfg(not(feature = "std"))]
24use alloc::{boxed::Box, vec};
25
26use crate::mlaf::{mlaf, neg_mlaf};
27use crate::transfer::{linear_to_srgb_f64, srgb_to_linear_f64};
28
29/// Pre-computed linearization table for sRGB to linear conversion.
30pub struct LinearizationTable<const N: usize> {
31    table: Box<[f32; N]>,
32}
33
34impl<const N: usize> LinearizationTable<N> {
35    /// Create a linearization table for the given bit depth.
36    ///
37    /// N must equal 2^BIT_DEPTH (e.g., N=256 for 8-bit, N=65536 for 16-bit).
38    pub fn new() -> Self {
39        let mut table = vec![0.0f32; N].into_boxed_slice();
40        let max_value = (N - 1) as f64;
41
42        for (i, entry) in table.iter_mut().enumerate() {
43            let srgb = i as f64 / max_value;
44            *entry = srgb_to_linear_f64(srgb) as f32;
45        }
46
47        // Convert boxed slice to boxed array (safe - size is guaranteed by const N)
48        let table: Box<[f32; N]> = table.try_into().expect("size mismatch");
49
50        Self { table }
51    }
52
53    /// Direct lookup (no interpolation) - for exact bit-depth matches.
54    #[inline]
55    pub fn lookup(&self, index: usize) -> f32 {
56        self.table[index.min(N - 1)]
57    }
58
59    /// Get the raw table for custom interpolation.
60    #[inline]
61    pub fn as_slice(&self) -> &[f32] {
62        &self.table[..]
63    }
64}
65
66impl<const N: usize> Default for LinearizationTable<N> {
67    fn default() -> Self {
68        Self::new()
69    }
70}
71
72/// Pre-computed encoding table for linear to sRGB conversion.
73pub struct EncodingTable<const N: usize> {
74    table: Box<[f32; N]>,
75}
76
77impl<const N: usize> EncodingTable<N> {
78    /// Create an encoding table for the given resolution.
79    ///
80    /// Higher N means finer granularity for interpolation.
81    pub fn new() -> Self {
82        let mut table = vec![0.0f32; N].into_boxed_slice();
83        let max_value = (N - 1) as f64;
84
85        for (i, entry) in table.iter_mut().enumerate() {
86            let linear = i as f64 / max_value;
87            *entry = linear_to_srgb_f64(linear) as f32;
88        }
89
90        // Convert boxed slice to boxed array (safe - size is guaranteed by const N)
91        let table: Box<[f32; N]> = table.try_into().expect("size mismatch");
92
93        Self { table }
94    }
95
96    /// Direct lookup (no interpolation).
97    #[inline]
98    pub fn lookup(&self, index: usize) -> f32 {
99        self.table[index.min(N - 1)]
100    }
101
102    /// Get the raw table for custom interpolation.
103    #[inline]
104    pub fn as_slice(&self) -> &[f32] {
105        &self.table[..]
106    }
107}
108
109impl<const N: usize> Default for EncodingTable<N> {
110    fn default() -> Self {
111        Self::new()
112    }
113}
114
115/// Linear interpolation in a float LUT.
116///
117/// `x` should be in [0, 1]. Values outside are clamped.
118/// Uses FMA for the interpolation calculation.
119#[inline]
120pub fn lut_interp_linear_float(x: f32, table: &[f32]) -> f32 {
121    let x = x.clamp(0.0, 1.0);
122    let value = x * (table.len() - 1) as f32;
123
124    let upper = value.ceil() as usize;
125    let lower = value.floor() as usize;
126
127    // Safety: upper and lower are bounded by table.len() - 1 due to clamping
128    let tu = table[upper.min(table.len() - 1)];
129    let tl = table[lower];
130
131    let diff = upper as f32 - value;
132
133    // result = tl * diff + tu * (1 - diff)
134    // Using FMA: neg_mlaf(tu, tu, diff) = tu - tu*diff = tu*(1-diff)
135    // Then: mlaf(tu*(1-diff), tl, diff) = tu*(1-diff) + tl*diff
136    mlaf(neg_mlaf(tu, tu, diff), tl, diff)
137}
138
139/// Linear interpolation in a u16 LUT using fixed-point arithmetic.
140///
141/// Avoids floating-point entirely for integer-only pipelines.
142#[inline]
143pub fn lut_interp_linear_u16(input_value: u16, table: &[u16]) -> u16 {
144    let table_len = table.len() as u32;
145    let mut value: u32 = input_value as u32 * (table_len - 1);
146
147    let upper = value.div_ceil(65535) as usize;
148    let lower = (value / 65535) as usize;
149    let interp: u32 = value % 65535;
150
151    // Safety: upper and lower are bounded
152    let upper = upper.min(table.len() - 1);
153    let lower = lower.min(table.len() - 1);
154
155    value = (table[upper] as u32 * interp + table[lower] as u32 * (65535 - interp)) / 65535;
156    value as u16
157}
158
159/// Pre-computed 8-bit linearization table (256 entries).
160pub type LinearTable8 = LinearizationTable<256>;
161
162/// Pre-computed 10-bit linearization table (1024 entries).
163pub type LinearTable10 = LinearizationTable<1024>;
164
165/// Pre-computed 12-bit linearization table (4096 entries).
166pub type LinearTable12 = LinearizationTable<4096>;
167
168/// Pre-computed 16-bit linearization table (65536 entries).
169pub type LinearTable16 = LinearizationTable<65536>;
170
171/// Pre-computed 8-bit encoding table (256 entries).
172pub type EncodeTable8 = EncodingTable<256>;
173
174/// Pre-computed 12-bit encoding table (4096 entries).
175pub type EncodeTable12 = EncodingTable<4096>;
176
177/// Pre-computed 16-bit encoding table (65536 entries).
178pub type EncodeTable16 = EncodingTable<65536>;
179
180/// Converter using pre-computed const LUTs for fast batch conversion.
181///
182/// This is a **zero-sized type** - the tables are embedded in the binary at
183/// compile time with no runtime initialization cost. This is the recommended
184/// approach for standard 8-bit sRGB workflows.
185///
186/// # Example
187///
188/// ```rust
189/// use linear_srgb::SrgbConverter;
190///
191/// let conv = SrgbConverter::new();  // No allocation, just a marker type
192///
193/// // Fast 8-bit lookups
194/// let linear = conv.srgb_u8_to_linear(128);
195/// let srgb = conv.linear_to_srgb_u8(linear);
196/// ```
197///
198/// # Implementation Details
199///
200/// - Uses a 256-entry const table for sRGB u8 → linear f32 (direct lookup)
201/// - Uses a 4096-entry const table for linear f32 → sRGB f32 (linear interpolation)
202pub struct SrgbConverter;
203
204impl SrgbConverter {
205    /// Create a new converter.
206    ///
207    /// This is a no-op since tables are const and embedded in binary.
208    #[inline]
209    pub const fn new() -> Self {
210        Self
211    }
212
213    /// Convert 8-bit sRGB to linear using direct table lookup.
214    #[inline]
215    pub fn srgb_u8_to_linear(&self, value: u8) -> f32 {
216        crate::const_luts::LINEAR_TABLE_8[value as usize]
217    }
218
219    /// Convert linear to sRGB using table interpolation.
220    #[inline]
221    pub fn linear_to_srgb(&self, linear: f32) -> f32 {
222        lut_interp_linear_float(linear, &crate::const_luts::ENCODE_TABLE_12)
223    }
224
225    /// Convert linear to 8-bit sRGB.
226    #[inline]
227    pub fn linear_to_srgb_u8(&self, linear: f32) -> u8 {
228        (self.linear_to_srgb(linear) * 255.0 + 0.5) as u8
229    }
230
231    /// Batch convert sRGB u8 values to linear f32.
232    #[inline]
233    pub fn batch_srgb_to_linear(&self, input: &[u8], output: &mut [f32]) {
234        assert_eq!(input.len(), output.len());
235        for (i, o) in input.iter().zip(output.iter_mut()) {
236            *o = self.srgb_u8_to_linear(*i);
237        }
238    }
239
240    /// Batch convert linear f32 values to sRGB u8.
241    #[inline]
242    pub fn batch_linear_to_srgb(&self, input: &[f32], output: &mut [u8]) {
243        assert_eq!(input.len(), output.len());
244        for (i, o) in input.iter().zip(output.iter_mut()) {
245            *o = self.linear_to_srgb_u8(*i);
246        }
247    }
248}
249
250impl Default for SrgbConverter {
251    fn default() -> Self {
252        Self::new()
253    }
254}
255
256#[cfg(test)]
257mod tests {
258    use super::*;
259
260    #[cfg(not(feature = "std"))]
261    use alloc::{vec, vec::Vec};
262
263    #[test]
264    fn test_linearization_table_8bit() {
265        let table = LinearTable8::new();
266
267        // Check boundaries
268        assert_eq!(table.lookup(0), 0.0);
269        assert!((table.lookup(255) - 1.0).abs() < 1e-6);
270
271        // Check middle value
272        let mid = table.lookup(128);
273        assert!(mid > 0.0 && mid < 1.0);
274    }
275
276    #[test]
277    fn test_encoding_table() {
278        let table = EncodeTable12::new();
279
280        assert_eq!(table.lookup(0), 0.0);
281        assert!((table.lookup(4095) - 1.0).abs() < 1e-5);
282    }
283
284    #[test]
285    fn test_lut_interpolation() {
286        let table = EncodeTable12::new();
287
288        // Test interpolation at exact points
289        let result = lut_interp_linear_float(0.0, table.as_slice());
290        assert!((result - 0.0).abs() < 1e-6);
291
292        let result = lut_interp_linear_float(1.0, table.as_slice());
293        assert!((result - 1.0).abs() < 1e-5);
294    }
295
296    #[test]
297    fn test_converter_roundtrip() {
298        let conv = SrgbConverter::new();
299
300        for i in 0..=255u8 {
301            let linear = conv.srgb_u8_to_linear(i);
302            let back = conv.linear_to_srgb_u8(linear);
303            assert!(
304                (i as i32 - back as i32).abs() <= 1,
305                "Roundtrip failed for {}: {} -> {} -> {}",
306                i,
307                i,
308                linear,
309                back
310            );
311        }
312    }
313
314    #[test]
315    fn test_lut_vs_direct() {
316        use crate::transfer::srgb_to_linear;
317
318        let table = LinearTable8::new();
319
320        // Compare LUT to direct computation
321        for i in 0..=255u8 {
322            let lut_result = table.lookup(i as usize);
323            let direct_result = srgb_to_linear(i as f32 / 255.0);
324            assert!(
325                (lut_result - direct_result).abs() < 1e-5,
326                "Mismatch at {}: LUT={}, direct={}",
327                i,
328                lut_result,
329                direct_result
330            );
331        }
332    }
333
334    #[test]
335    fn test_u16_interpolation() {
336        // Create a simple linear ramp table
337        let table: Vec<u16> = (0..=255).map(|i| (i * 257) as u16).collect();
338
339        // Input 0 should give 0
340        assert_eq!(lut_interp_linear_u16(0, &table), 0);
341
342        // Input max should give max
343        assert_eq!(lut_interp_linear_u16(65535, &table), 65535);
344    }
345
346    #[test]
347    fn test_batch_conversion() {
348        let conv = SrgbConverter::new();
349
350        let input: Vec<u8> = (0..=255).collect();
351        let mut linear = vec![0.0f32; 256];
352        let mut back = vec![0u8; 256];
353
354        conv.batch_srgb_to_linear(&input, &mut linear);
355        conv.batch_linear_to_srgb(&linear, &mut back);
356
357        for i in 0..256 {
358            assert!(
359                (input[i] as i32 - back[i] as i32).abs() <= 1,
360                "Batch roundtrip failed at {}",
361                i
362            );
363        }
364    }
365}
linear_srgb/lut.rs

linear_srgb/
lut.rs