linear_srgb/
lut.rs

1//! Lookup table (LUT) based sRGB conversions.
2//!
3//! This module provides two types of lookup tables:
4//!
5//! ## Build-time Tables (Recommended)
6//!
7//! [`SrgbConverter`] uses pre-computed const tables embedded in the binary:
8//! - **Zero initialization cost** - tables exist at compile time
9//! - **8-bit linearization** (256 entries, 1KB): Direct lookup for sRGB u8 → linear f32
10//! - **12-bit encoding** (4096 entries, 16KB): Interpolated lookup for linear f32 → sRGB f32
11//!
12//! ## Runtime Tables (For Custom Bit Depths)
13//!
14//! [`LinearizationTable`] and [`EncodingTable`] generate tables at runtime:
15//! - Use when you need non-standard bit depths (10-bit, 16-bit, etc.)
16//! - Incur one-time allocation and computation cost
17//! - Table sizes:
18//!   - 8-bit: 256 entries (1KB for f32)
19//!   - 10-bit: 1024 entries (4KB for f32)
20//!   - 12-bit: 4096 entries (16KB for f32)
21//!   - 16-bit: 65536 entries (256KB for f32)
22
23#[cfg(not(feature = "std"))]
24use alloc::{boxed::Box, vec};
25
26use crate::mlaf::{mlaf, neg_mlaf};
27use crate::scalar::{linear_to_srgb_f64, srgb_to_linear_f64};
28
29/// Pre-computed linearization table for sRGB to linear conversion.
30pub struct LinearizationTable<const N: usize> {
31    table: Box<[f32; N]>,
32}
33
34impl<const N: usize> LinearizationTable<N> {
35    /// Create a linearization table for the given bit depth.
36    ///
37    /// N must equal 2^BIT_DEPTH (e.g., N=256 for 8-bit, N=65536 for 16-bit).
38    pub fn new() -> Self {
39        let mut table = vec![0.0f32; N].into_boxed_slice();
40        let max_value = (N - 1) as f64;
41
42        for (i, entry) in table.iter_mut().enumerate() {
43            let srgb = i as f64 / max_value;
44            *entry = srgb_to_linear_f64(srgb) as f32;
45        }
46
47        // Convert boxed slice to boxed array (safe - size is guaranteed by const N)
48        let table: Box<[f32; N]> = table.try_into().expect("size mismatch");
49
50        Self { table }
51    }
52
53    /// Direct lookup (no interpolation) - for exact bit-depth matches.
54    #[inline]
55    pub fn lookup(&self, index: usize) -> f32 {
56        self.table[index.min(N - 1)]
57    }
58
59    /// Get the raw table for custom interpolation.
60    #[inline]
61    pub fn as_slice(&self) -> &[f32] {
62        &self.table[..]
63    }
64}
65
66impl<const N: usize> Default for LinearizationTable<N> {
67    fn default() -> Self {
68        Self::new()
69    }
70}
71
72/// Pre-computed encoding table for linear to sRGB conversion.
73pub struct EncodingTable<const N: usize> {
74    table: Box<[f32; N]>,
75}
76
77impl<const N: usize> EncodingTable<N> {
78    /// Create an encoding table for the given resolution.
79    ///
80    /// Higher N means finer granularity for interpolation.
81    pub fn new() -> Self {
82        let mut table = vec![0.0f32; N].into_boxed_slice();
83        let max_value = (N - 1) as f64;
84
85        for (i, entry) in table.iter_mut().enumerate() {
86            let linear = i as f64 / max_value;
87            *entry = linear_to_srgb_f64(linear) as f32;
88        }
89
90        // Convert boxed slice to boxed array (safe - size is guaranteed by const N)
91        let table: Box<[f32; N]> = table.try_into().expect("size mismatch");
92
93        Self { table }
94    }
95
96    /// Direct lookup (no interpolation).
97    #[inline]
98    pub fn lookup(&self, index: usize) -> f32 {
99        self.table[index.min(N - 1)]
100    }
101
102    /// Get the raw table for custom interpolation.
103    #[inline]
104    pub fn as_slice(&self) -> &[f32] {
105        &self.table[..]
106    }
107}
108
109impl<const N: usize> Default for EncodingTable<N> {
110    fn default() -> Self {
111        Self::new()
112    }
113}
114
115/// Linear interpolation in a float LUT.
116///
117/// `x` should be in [0, 1]. Values outside are clamped.
118/// Uses FMA for the interpolation calculation.
119#[inline]
120pub fn lut_interp_linear_float(x: f32, table: &[f32]) -> f32 {
121    let x = x.clamp(0.0, 1.0);
122    let value = x * (table.len() - 1) as f32;
123
124    let upper = value.ceil() as usize;
125    let lower = value.floor() as usize;
126
127    // Safety: upper and lower are bounded by table.len() - 1 due to clamping
128    let tu = table[upper.min(table.len() - 1)];
129    let tl = table[lower];
130
131    let diff = upper as f32 - value;
132
133    // result = tl * diff + tu * (1 - diff)
134    // Using FMA: neg_mlaf(tu, tu, diff) = tu - tu*diff = tu*(1-diff)
135    // Then: mlaf(tu*(1-diff), tl, diff) = tu*(1-diff) + tl*diff
136    mlaf(neg_mlaf(tu, tu, diff), tl, diff)
137}
138
139/// Linear interpolation in a u16 LUT using fixed-point arithmetic.
140///
141/// Avoids floating-point entirely for integer-only pipelines.
142#[inline]
143pub fn lut_interp_linear_u16(input_value: u16, table: &[u16]) -> u16 {
144    let table_len = table.len() as u32;
145    let mut value: u32 = input_value as u32 * (table_len - 1);
146
147    let upper = value.div_ceil(65535) as usize;
148    let lower = (value / 65535) as usize;
149    let interp: u32 = value % 65535;
150
151    // Safety: upper and lower are bounded
152    let upper = upper.min(table.len() - 1);
153    let lower = lower.min(table.len() - 1);
154
155    value = (table[upper] as u32 * interp + table[lower] as u32 * (65535 - interp)) / 65535;
156    value as u16
157}
158
159/// Pre-computed 8-bit linearization table (256 entries).
160pub type LinearTable8 = LinearizationTable<256>;
161
162/// Pre-computed 10-bit linearization table (1024 entries).
163pub type LinearTable10 = LinearizationTable<1024>;
164
165/// Pre-computed 12-bit linearization table (4096 entries).
166pub type LinearTable12 = LinearizationTable<4096>;
167
168/// Pre-computed 16-bit linearization table (65536 entries).
169pub type LinearTable16 = LinearizationTable<65536>;
170
171/// Pre-computed 8-bit encoding table (256 entries).
172pub type EncodeTable8 = EncodingTable<256>;
173
174/// Pre-computed 12-bit encoding table (4096 entries).
175pub type EncodeTable12 = EncodingTable<4096>;
176
177/// Pre-computed 16-bit encoding table (65536 entries).
178pub type EncodeTable16 = EncodingTable<65536>;
179
180/// Converter using pre-computed const LUTs for fast batch conversion.
181///
182/// This is a **zero-sized type** - the tables are embedded in the binary at
183/// compile time with no runtime initialization cost. This is the recommended
184/// approach for standard 8-bit sRGB workflows.
185///
186/// # Example
187///
188/// ```rust
189/// use linear_srgb::lut::SrgbConverter;
190///
191/// let conv = SrgbConverter::new();  // No allocation, just a marker type
192///
193/// // Fast 8-bit lookups
194/// let linear = conv.srgb_u8_to_linear(128);
195/// let srgb = conv.linear_to_srgb_u8(linear);
196/// ```
197///
198/// # Implementation Details
199///
200/// - Uses a 256-entry const table for sRGB u8 → linear f32 (direct lookup)
201/// - Uses a 4096-entry const table for linear f32 → sRGB f32 (linear interpolation)
202pub struct SrgbConverter;
203
204impl SrgbConverter {
205    /// Create a new converter.
206    ///
207    /// This is a no-op since tables are const and embedded in binary.
208    #[inline]
209    pub const fn new() -> Self {
210        Self
211    }
212
213    /// Convert 8-bit sRGB to linear using direct table lookup.
214    #[inline]
215    pub fn srgb_u8_to_linear(&self, value: u8) -> f32 {
216        crate::const_luts::LINEAR_TABLE_8[value as usize]
217    }
218
219    /// Convert linear to sRGB using table interpolation.
220    #[inline]
221    pub fn linear_to_srgb(&self, linear: f32) -> f32 {
222        lut_interp_linear_float(linear, &crate::const_luts::ENCODE_TABLE_12)
223    }
224
225    /// Convert linear to 8-bit sRGB.
226    ///
227    /// # Deprecation
228    ///
229    /// This LUT interpolation method is ~2x slower than SIMD.
230    /// Prefer [`crate::simd::linear_to_srgb_u8_slice`] for batches or
231    /// [`crate::scalar::linear_to_srgb_u8`] for single values.
232    #[deprecated(
233        since = "0.3.0",
234        note = "2x slower than SIMD. Use simd::linear_to_srgb_u8_slice for batches or scalar::linear_to_srgb_u8 for single values."
235    )]
236    #[inline]
237    pub fn linear_to_srgb_u8(&self, linear: f32) -> u8 {
238        (self.linear_to_srgb(linear) * 255.0 + 0.5) as u8
239    }
240
241    /// Batch convert sRGB u8 values to linear f32.
242    #[inline]
243    pub fn batch_srgb_to_linear(&self, input: &[u8], output: &mut [f32]) {
244        assert_eq!(input.len(), output.len());
245        for (i, o) in input.iter().zip(output.iter_mut()) {
246            *o = self.srgb_u8_to_linear(*i);
247        }
248    }
249
250    /// Batch convert linear f32 values to sRGB u8.
251    ///
252    /// # Deprecation
253    ///
254    /// This LUT interpolation method is ~2x slower than SIMD.
255    /// Prefer [`crate::simd::linear_to_srgb_u8_slice`] instead.
256    #[deprecated(
257        since = "0.3.0",
258        note = "2x slower than SIMD. Use simd::linear_to_srgb_u8_slice instead."
259    )]
260    #[inline]
261    #[allow(deprecated)]
262    pub fn batch_linear_to_srgb(&self, input: &[f32], output: &mut [u8]) {
263        assert_eq!(input.len(), output.len());
264        for (i, o) in input.iter().zip(output.iter_mut()) {
265            *o = self.linear_to_srgb_u8(*i);
266        }
267    }
268}
269
270impl Default for SrgbConverter {
271    fn default() -> Self {
272        Self::new()
273    }
274}
275
276#[cfg(test)]
277mod tests {
278    use super::*;
279
280    #[cfg(not(feature = "std"))]
281    use alloc::{vec, vec::Vec};
282
283    #[test]
284    fn test_linearization_table_8bit() {
285        let table = LinearTable8::new();
286
287        // Check boundaries
288        assert_eq!(table.lookup(0), 0.0);
289        assert!((table.lookup(255) - 1.0).abs() < 1e-6);
290
291        // Check middle value
292        let mid = table.lookup(128);
293        assert!(mid > 0.0 && mid < 1.0);
294    }
295
296    #[test]
297    fn test_encoding_table() {
298        let table = EncodeTable12::new();
299
300        assert_eq!(table.lookup(0), 0.0);
301        assert!((table.lookup(4095) - 1.0).abs() < 1e-5);
302    }
303
304    #[test]
305    fn test_lut_interpolation() {
306        let table = EncodeTable12::new();
307
308        // Test interpolation at exact points
309        let result = lut_interp_linear_float(0.0, table.as_slice());
310        assert!((result - 0.0).abs() < 1e-6);
311
312        let result = lut_interp_linear_float(1.0, table.as_slice());
313        assert!((result - 1.0).abs() < 1e-5);
314    }
315
316    #[test]
317    #[allow(deprecated)]
318    fn test_converter_roundtrip() {
319        let conv = SrgbConverter::new();
320
321        for i in 0..=255u8 {
322            let linear = conv.srgb_u8_to_linear(i);
323            let back = conv.linear_to_srgb_u8(linear);
324            assert!(
325                (i as i32 - back as i32).abs() <= 1,
326                "Roundtrip failed for {}: {} -> {} -> {}",
327                i,
328                i,
329                linear,
330                back
331            );
332        }
333    }
334
335    #[test]
336    fn test_lut_vs_direct() {
337        use crate::scalar::srgb_to_linear;
338
339        let table = LinearTable8::new();
340
341        // Compare LUT to direct computation
342        for i in 0..=255u8 {
343            let lut_result = table.lookup(i as usize);
344            let direct_result = srgb_to_linear(i as f32 / 255.0);
345            assert!(
346                (lut_result - direct_result).abs() < 1e-5,
347                "Mismatch at {}: LUT={}, direct={}",
348                i,
349                lut_result,
350                direct_result
351            );
352        }
353    }
354
355    #[test]
356    fn test_u16_interpolation() {
357        // Create a simple linear ramp table
358        let table: Vec<u16> = (0..=255).map(|i| (i * 257) as u16).collect();
359
360        // Input 0 should give 0
361        assert_eq!(lut_interp_linear_u16(0, &table), 0);
362
363        // Input max should give max
364        assert_eq!(lut_interp_linear_u16(65535, &table), 65535);
365    }
366
367    #[test]
368    #[allow(deprecated)]
369    fn test_batch_conversion() {
370        let conv = SrgbConverter::new();
371
372        let input: Vec<u8> = (0..=255).collect();
373        let mut linear = vec![0.0f32; 256];
374        let mut back = vec![0u8; 256];
375
376        conv.batch_srgb_to_linear(&input, &mut linear);
377        conv.batch_linear_to_srgb(&linear, &mut back);
378
379        for i in 0..256 {
380            assert!(
381                (input[i] as i32 - back[i] as i32).abs() <= 1,
382                "Batch roundtrip failed at {}",
383                i
384            );
385        }
386    }
387}