1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
/// Bitstream reader for parsing H.265 NAL unit RBSP data.
/// Reads bits left-to-right (MSB first).
///
/// The internal buffer is padded with zero bytes so that `read_bit` can skip
/// per-bit bounds checks in the hot path. Only `bits_remaining` and
/// `more_rbsp_data` use the true data length.
pub struct BitstreamReader {
data: Vec<u8>,
data_len: usize, // actual RBSP length (excluding padding)
byte_offset: usize,
bit_offset: u8, // 0-7, bits already consumed in current byte
}
/// Number of zero bytes appended after RBSP data.
/// Must be large enough that reading past the end during multi-CTU
/// end-of-slice detection doesn't cause index-out-of-bounds panics.
const PADDING: usize = 128;
impl BitstreamReader {
pub fn new(rbsp: &[u8]) -> Self {
let data_len = rbsp.len();
let mut data = Vec::with_capacity(data_len + PADDING);
data.extend_from_slice(rbsp);
data.resize(data_len + PADDING, 0);
Self {
data,
data_len,
byte_offset: 0,
bit_offset: 0,
}
}
/// Read a single bit, returning 0 or 1.
/// Does not bounds-check on every call; relies on padding to avoid
/// out-of-bounds reads. Call `bits_remaining` to check before bulk reads.
#[inline(always)]
pub fn read_bit(&mut self) -> Result<u8, &'static str> {
let bit = (self.data[self.byte_offset] >> (7 - self.bit_offset)) & 1;
self.bit_offset += 1;
if self.bit_offset == 8 {
self.bit_offset = 0;
self.byte_offset += 1;
}
Ok(bit)
}
/// Read `n` bits (up to 32) as a u32.
pub fn read_bits(&mut self, n: u8) -> Result<u32, &'static str> {
let mut val: u32 = 0;
for _ in 0..n {
val = (val << 1) | self.read_bit()? as u32;
}
Ok(val)
}
/// Peek at the next `n` bits without consuming them. Zero-pads if fewer bits remain.
pub fn peek_bits(&self, n: u8) -> u32 {
let mut val: u32 = 0;
let mut byte_offset = self.byte_offset;
let mut bit_offset = self.bit_offset;
for _ in 0..n {
if byte_offset < self.data.len() {
val = (val << 1) | ((self.data[byte_offset] >> (7 - bit_offset)) & 1) as u32;
} else {
val <<= 1;
}
bit_offset += 1;
if bit_offset == 8 {
bit_offset = 0;
byte_offset += 1;
}
}
val
}
/// Advance position by `n` bits without reading them.
pub fn skip_bits(&mut self, n: u8) {
let total = self.bit_offset as usize + n as usize;
self.byte_offset += total / 8;
self.bit_offset = (total % 8) as u8;
}
/// Read an unsigned Exp-Golomb coded value (ue(v)).
pub fn read_ue(&mut self) -> Result<u32, &'static str> {
let mut leading_zeros: u32 = 0;
while self.read_bit()? == 0 {
leading_zeros += 1;
if leading_zeros > 31 {
return Err("exp-golomb overflow");
}
}
if leading_zeros == 0 {
return Ok(0);
}
let suffix = self.read_bits(leading_zeros as u8)?;
Ok((1 << leading_zeros) - 1 + suffix)
}
/// Read a signed Exp-Golomb coded value (se(v)).
pub fn read_se(&mut self) -> Result<i32, &'static str> {
let code = self.read_ue()?;
let val = code.div_ceil(2) as i32;
if code % 2 == 0 { Ok(-val) } else { Ok(val) }
}
/// Returns true if there is more RBSP data before the trailing bits.
/// The RBSP trailing bits are: a stop bit (1) followed by zero bits to byte-align.
pub fn more_rbsp_data(&self) -> bool {
if self.byte_offset >= self.data_len {
return false;
}
// Find the position of the last non-zero byte in the actual data
let mut last_nz = self.data_len;
while last_nz > self.byte_offset && self.data[last_nz - 1] == 0 {
last_nz -= 1;
}
if last_nz <= self.byte_offset {
return false;
}
// If we're before the last non-zero byte, there's definitely more data
if self.byte_offset < last_nz - 1 {
return true;
}
// We're in the last non-zero byte. The RBSP stop bit is the lowest set bit.
// Everything above it (towards MSB) is data. Check if there are unconsumed
// data bits above the stop bit.
let byte = self.data[self.byte_offset];
let stop_bit = byte.trailing_zeros();
let data_bits_in_byte = 7 - stop_bit as u8;
self.bit_offset < data_bits_in_byte
}
/// Advance to the next byte boundary.
pub fn align_to_byte(&mut self) {
if self.bit_offset != 0 {
self.bit_offset = 0;
self.byte_offset += 1;
}
}
pub fn position(&self) -> (usize, u8) {
(self.byte_offset, self.bit_offset)
}
pub fn bits_remaining(&self) -> usize {
if self.byte_offset >= self.data_len {
return 0;
}
(self.data_len - self.byte_offset) * 8 - self.bit_offset as usize
}
}
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn test_read_bits() {
let data = [0b1010_0011, 0b1100_0000];
let mut r = BitstreamReader::new(&data);
assert_eq!(r.read_bits(4).unwrap(), 0b1010);
assert_eq!(r.read_bits(4).unwrap(), 0b0011);
assert_eq!(r.read_bits(2).unwrap(), 0b11);
}
#[test]
fn test_read_ue() {
// ue(0) = 1 -> code 0
// ue(1) = 010 -> code 1
// ue(2) = 011 -> code 2
// ue(3) = 00100 -> code 3
// Bit pattern: 1 010 011 00100 = 1010 0110 0100 = 0xA64
let data = [0xA6, 0x40];
let mut r = BitstreamReader::new(&data);
assert_eq!(r.read_ue().unwrap(), 0);
assert_eq!(r.read_ue().unwrap(), 1);
assert_eq!(r.read_ue().unwrap(), 2);
assert_eq!(r.read_ue().unwrap(), 3);
}
#[test]
fn test_read_se() {
// se mapping: code 0->0, 1->1, 2->-1, 3->2, 4->-2
// ue values: 0 1 2 3 4
// bits: 1 010 011 00100 00101
// Combined: 1 010 011 00100 00101 = 1010 0110 0100 0010 1
let data = [0xA6, 0x42, 0x80];
let mut r = BitstreamReader::new(&data);
assert_eq!(r.read_se().unwrap(), 0);
assert_eq!(r.read_se().unwrap(), 1);
assert_eq!(r.read_se().unwrap(), -1);
assert_eq!(r.read_se().unwrap(), 2);
assert_eq!(r.read_se().unwrap(), -2);
}
#[test]
fn test_padding_allows_overread() {
// After reading all real data, reads return 0 (from padding) rather than panicking
let data = [0xFF];
let mut r = BitstreamReader::new(&data);
assert_eq!(r.bits_remaining(), 8);
assert_eq!(r.read_bits(8).unwrap(), 0xFF);
assert_eq!(r.bits_remaining(), 0);
// Reading into padding returns 0 bits without panic
assert_eq!(r.read_bits(8).unwrap(), 0);
}
}