Skip to main content

rar_stream/decompress/
bit_reader.rs

1//! Bit reader for compressed data streams.
2//!
3//! Reads bits from a byte stream, MSB first (RAR convention).
4
5use super::{DecompressError, Result};
6
7/// Bit reader that reads from a byte slice.
8pub struct BitReader<'a> {
9    data: &'a [u8],
10    pos: usize,
11    bit_pos: u32,
12    /// Current bit buffer (up to 32 bits)
13    buffer: u32,
14    /// Bits available in buffer
15    bits_in_buffer: u32,
16}
17
18impl<'a> BitReader<'a> {
19    /// Create a new bit reader from a byte slice.
20    pub fn new(data: &'a [u8]) -> Self {
21        let mut reader = Self {
22            data,
23            pos: 0,
24            bit_pos: 0,
25            buffer: 0,
26            bits_in_buffer: 0,
27        };
28        reader.fill_buffer();
29        reader
30    }
31
32    /// Fill the buffer with more bytes.
33    /// Optimized to read multiple bytes when possible.
34    #[inline(always)]
35    fn fill_buffer(&mut self) {
36        // Fast path: if we need 3+ bytes and have them, read all at once
37        if self.bits_in_buffer <= 8 && self.pos + 3 <= self.data.len() {
38            // Read 3 bytes (24 bits) at once
39            // SAFETY: bounds checked above
40            unsafe {
41                let b0 = *self.data.get_unchecked(self.pos) as u32;
42                let b1 = *self.data.get_unchecked(self.pos + 1) as u32;
43                let b2 = *self.data.get_unchecked(self.pos + 2) as u32;
44                let bytes = (b0 << 16) | (b1 << 8) | b2;
45                self.buffer |= bytes << (8 - self.bits_in_buffer);
46            }
47            self.bits_in_buffer += 24;
48            self.pos += 3;
49            return;
50        }
51
52        // Slow path: read one byte at a time
53        while self.bits_in_buffer <= 24 && self.pos < self.data.len() {
54            // SAFETY: bounds checked above
55            self.buffer |= unsafe {
56                (*self.data.get_unchecked(self.pos) as u32) << (24 - self.bits_in_buffer)
57            };
58            self.bits_in_buffer += 8;
59            self.pos += 1;
60        }
61    }
62
63    /// Peek at the next n bits without consuming them.
64    #[inline(always)]
65    pub fn peek_bits(&self, n: u32) -> u32 {
66        debug_assert!(n <= 16);
67        self.buffer >> (32 - n)
68    }
69
70    /// Read n bits and advance the position.
71    #[inline(always)]
72    pub fn read_bits(&mut self, n: u32) -> Result<u32> {
73        debug_assert!(n <= 16);
74
75        if n > self.bits_in_buffer && self.pos >= self.data.len() {
76            return Err(DecompressError::UnexpectedEof);
77        }
78
79        let value = self.peek_bits(n);
80        self.advance_bits(n);
81        Ok(value)
82    }
83
84    /// Advance by n bits.
85    #[inline(always)]
86    pub fn advance_bits(&mut self, n: u32) {
87        self.buffer <<= n;
88        self.bits_in_buffer = self.bits_in_buffer.saturating_sub(n);
89        self.bit_pos += n;
90        self.fill_buffer();
91    }
92
93    /// Read a single bit.
94    #[inline(always)]
95    pub fn read_bit(&mut self) -> Result<bool> {
96        Ok(self.read_bits(1)? != 0)
97    }
98
99    /// Read a single byte (8 bits).
100    #[inline]
101    pub fn read_byte(&mut self) -> Option<u8> {
102        self.read_bits(8).ok().map(|v| v as u8)
103    }
104
105    /// Align to byte boundary by skipping remaining bits in current byte.
106    #[inline]
107    pub fn align_to_byte(&mut self) {
108        let bits_used_in_byte = self.bit_pos % 8;
109        if bits_used_in_byte > 0 {
110            let skip = 8 - bits_used_in_byte;
111            self.advance_bits(skip);
112        }
113    }
114
115    /// Get the current bit position.
116    pub fn bit_position(&self) -> u64 {
117        self.bit_pos as u64
118    }
119
120    /// Get the current byte position (bytes consumed from stream).
121    pub fn byte_position(&self) -> usize {
122        self.pos
123    }
124
125    /// Check if at end of data.
126    pub fn is_eof(&self) -> bool {
127        self.bits_in_buffer == 0 && self.pos >= self.data.len()
128    }
129
130    /// Remaining bits available.
131    pub fn remaining_bits(&self) -> u64 {
132        self.bits_in_buffer as u64 + ((self.data.len() - self.pos) as u64 * 8)
133    }
134
135    /// Debug helper to show internal state
136    #[cfg(test)]
137    pub fn debug_state(&self) -> String {
138        format!(
139            "BitReader {{ pos: {}, bit_pos: {}, buffer: {:08x}, bits_in_buffer: {} }}",
140            self.pos, self.bit_pos, self.buffer, self.bits_in_buffer
141        )
142    }
143
144    /// Peek at raw bytes from current logical position (for debugging)
145    #[cfg(test)]
146    pub fn peek_bytes(&self, n: usize) -> Vec<u8> {
147        let byte_pos = (self.bit_pos / 8) as usize;
148        self.data
149            .get(byte_pos..byte_pos + n)
150            .map(|s| s.to_vec())
151            .unwrap_or_default()
152    }
153}
154
#[cfg(test)]
mod tests {
    use super::*;

    /// Consecutive reads hand back the input's bits in order, starting from
    /// the most significant bit of the first byte.
    #[test]
    fn test_read_bits() {
        let data = [0b10110100, 0b11001010];
        let mut reader = BitReader::new(&data);

        // (width in bits, value expected from that read)
        let steps: [(u32, u32); 3] = [(4, 0b1011), (4, 0b0100), (8, 0b11001010)];
        for &(width, expected) in steps.iter() {
            assert_eq!(reader.read_bits(width).unwrap(), expected);
        }
    }

    /// Peeking never consumes input, so repeated peeks all start at bit 0.
    #[test]
    fn test_peek_bits() {
        let data = [0b10110100];
        let reader = BitReader::new(&data);

        let probes: [(u32, u32); 2] = [(4, 0b1011), (8, 0b10110100)];
        for &(width, expected) in probes.iter() {
            assert_eq!(reader.peek_bits(width), expected);
        }
    }

    /// A one-byte input reports EOF only after all eight bits are consumed.
    #[test]
    fn test_eof() {
        let data = [0xFF];
        let mut reader = BitReader::new(&data);

        let eof_before = reader.is_eof();
        reader.read_bits(8).unwrap();
        let eof_after = reader.is_eof();

        assert!(!eof_before);
        assert!(eof_after);
    }
}