idb/innodb/
compression.rs1use flate2::read::ZlibDecoder;
12use std::io::Read;
13
14use crate::innodb::vendor::VendorInfo;
15
/// Compression algorithm identified for a tablespace or for a single page.
///
/// `Zlib` and `Lz4` can be produced by every detection path in this module.
/// The remaining codecs are only produced when a MariaDB algorithm id is
/// decoded (see `mariadb_algo_from_id`).
///
/// The type is a plain `Copy` tag and also derives `Hash`, so it can be used
/// directly as a key in `HashMap`/`HashSet` (for example to count pages per
/// algorithm).
#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
pub enum CompressionAlgorithm {
    /// No compression detected, or an algorithm id this module does not map.
    None,
    /// zlib; MariaDB algorithm id 1.
    Zlib,
    /// LZ4; MariaDB algorithm id 2.
    Lz4,
    /// LZO; MariaDB algorithm id 3.
    Lzo,
    /// LZMA; MariaDB algorithm id 4.
    Lzma,
    /// bzip2; MariaDB algorithm id 5.
    Bzip2,
    /// Snappy; MariaDB algorithm id 6.
    Snappy,
}
31
32pub fn detect_compression(
41 fsp_flags: u32,
42 vendor_info: Option<&VendorInfo>,
43) -> CompressionAlgorithm {
44 use crate::innodb::constants::*;
45
46 if let Some(vi) = vendor_info {
47 if vi.is_full_crc32() {
48 let algo = (fsp_flags & MARIADB_FSP_FLAGS_FCRC32_COMPRESSED_ALGO_MASK) >> 5;
50 return mariadb_algo_from_id(algo as u8);
51 }
52 if vi.vendor == crate::innodb::vendor::InnoDbVendor::MariaDB {
53 if fsp_flags & MARIADB_FSP_FLAGS_PAGE_COMPRESSION != 0 {
56 return CompressionAlgorithm::Zlib;
59 }
60 return CompressionAlgorithm::None;
61 }
62 }
63
64 let comp_bits = (fsp_flags >> 11) & 0x03;
66 match comp_bits {
67 1 => CompressionAlgorithm::Zlib,
68 2 => CompressionAlgorithm::Lz4,
69 _ => CompressionAlgorithm::None,
70 }
71}
72
73pub fn detect_mariadb_page_compression(page_data: &[u8]) -> Option<CompressionAlgorithm> {
78 if page_data.len() < 27 {
79 return None;
80 }
81 let algo_id = page_data[26];
82 Some(mariadb_algo_from_id(algo_id))
83}
84
85fn mariadb_algo_from_id(id: u8) -> CompressionAlgorithm {
90 match id {
91 1 => CompressionAlgorithm::Zlib,
92 2 => CompressionAlgorithm::Lz4,
93 3 => CompressionAlgorithm::Lzo,
94 4 => CompressionAlgorithm::Lzma,
95 5 => CompressionAlgorithm::Bzip2,
96 6 => CompressionAlgorithm::Snappy,
97 _ => CompressionAlgorithm::None,
98 }
99}
100
101pub fn decompress_zlib(compressed: &[u8]) -> Option<Vec<u8>> {
105 let mut decoder = ZlibDecoder::new(compressed);
106 let mut decompressed = Vec::new();
107 decoder.read_to_end(&mut decompressed).ok()?;
108 Some(decompressed)
109}
110
111pub fn decompress_lz4(compressed: &[u8], uncompressed_len: usize) -> Option<Vec<u8>> {
116 lz4_flex::decompress(compressed, uncompressed_len).ok()
117}
118
/// Heuristically reports whether a page looks hole-punched.
///
/// A page counts as hole-punched when every byte in its last quarter (from
/// `page_size * 3 / 4` up to `page_size`) is zero. Bytes before that range,
/// and any bytes past `page_size`, are not inspected.
///
/// Returns `false` when `page_data` holds fewer than `page_size` bytes. With
/// `page_size == 0` the inspected range is empty and the result is `true`.
pub fn is_hole_punched(page_data: &[u8], page_size: u32) -> bool {
    let page_len = page_size as usize;

    match page_data.get(..page_len) {
        // The buffer does not contain a full page.
        None => false,
        // The start offset is computed only after the length check succeeded,
        // so the multiplication is never evaluated for a too-short buffer.
        Some(page) => !page[page_len * 3 / 4..].iter().any(|&byte| byte != 0),
    }
}
134
135impl std::fmt::Display for CompressionAlgorithm {
136 fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
137 match self {
138 CompressionAlgorithm::None => write!(f, "None"),
139 CompressionAlgorithm::Zlib => write!(f, "Zlib"),
140 CompressionAlgorithm::Lz4 => write!(f, "LZ4"),
141 CompressionAlgorithm::Lzo => write!(f, "LZO"),
142 CompressionAlgorithm::Lzma => write!(f, "LZMA"),
143 CompressionAlgorithm::Bzip2 => write!(f, "bzip2"),
144 CompressionAlgorithm::Snappy => write!(f, "Snappy"),
145 }
146 }
147}
148
#[cfg(test)]
mod tests {
    use super::*;
    use crate::innodb::vendor::MariaDbFormat;

    /// Without vendor information only bits 11-12 of the flags are decoded.
    #[test]
    fn test_detect_compression_mysql() {
        assert_eq!(detect_compression(0, None), CompressionAlgorithm::None);
        assert_eq!(
            detect_compression(1 << 11, None),
            CompressionAlgorithm::Zlib
        );
        assert_eq!(detect_compression(2 << 11, None), CompressionAlgorithm::Lz4);
        // The value 3 has no mapping and falls back to `None`.
        assert_eq!(
            detect_compression(3 << 11, None),
            CompressionAlgorithm::None
        );
        // Unrelated low bits must not influence the result.
        assert_eq!(
            detect_compression(0xFF | (1 << 11), None),
            CompressionAlgorithm::Zlib
        );
    }

    /// For full_crc32 tablespaces the algorithm id is read starting at bit 5.
    #[test]
    fn test_detect_compression_mariadb_full_crc32() {
        let vendor = VendorInfo::mariadb(MariaDbFormat::FullCrc32);
        // NOTE(review): 0x10 is presumably the full_crc32 marker bit; confirm
        // against the flag constants.
        let flags = 0x10 | (1 << 5);
        assert_eq!(
            detect_compression(flags, Some(&vendor)),
            CompressionAlgorithm::Zlib
        );
        let flags = 0x10 | (2 << 5);
        assert_eq!(
            detect_compression(flags, Some(&vendor)),
            CompressionAlgorithm::Lz4
        );
        let flags = 0x10 | (3 << 5);
        assert_eq!(
            detect_compression(flags, Some(&vendor)),
            CompressionAlgorithm::Lzo
        );
    }

    /// The per-page algorithm id is the byte at offset 26.
    #[test]
    fn test_detect_mariadb_page_compression() {
        let mut page = vec![0u8; 38];
        page[26] = 2;
        assert_eq!(
            detect_mariadb_page_compression(&page),
            Some(CompressionAlgorithm::Lz4)
        );
        page[26] = 6;
        assert_eq!(
            detect_mariadb_page_compression(&page),
            Some(CompressionAlgorithm::Snappy)
        );
        // Unknown ids still yield `Some`, wrapping the `None` variant.
        page[26] = 0;
        assert_eq!(
            detect_mariadb_page_compression(&page),
            Some(CompressionAlgorithm::None)
        );
        // A buffer shorter than 27 bytes cannot contain the id byte.
        assert_eq!(detect_mariadb_page_compression(&page[..26]), None);
    }

    /// Round-trips data through flate2's encoder and `decompress_zlib`.
    #[test]
    fn test_decompress_zlib() {
        use flate2::write::ZlibEncoder;
        use flate2::Compression;
        use std::io::Write;

        let original = b"Hello, InnoDB compression test data!";
        let mut encoder = ZlibEncoder::new(Vec::new(), Compression::default());
        encoder.write_all(original).unwrap();
        let compressed = encoder.finish().unwrap();

        let result = decompress_zlib(&compressed).unwrap();
        assert_eq!(result, original);
    }

    /// Round-trips data through lz4_flex and the `decompress_lz4` wrapper.
    #[test]
    fn test_decompress_lz4() {
        let original = b"Hello, LZ4 compression test data for InnoDB!";
        let compressed = lz4_flex::compress_prepend_size(original);
        // Skip the 4-byte size prefix; the wrapper receives the length
        // separately. Going through `decompress_lz4` (rather than calling
        // lz4_flex directly) is what actually exercises this module's code.
        let result = decompress_lz4(&compressed[4..], original.len())
            .expect("valid LZ4 block should decompress");
        assert_eq!(result, original);
    }

    /// Only the last quarter of the page decides the hole-punch verdict.
    #[test]
    fn test_is_hole_punched() {
        let page_size = 16384u32;
        let mut page = vec![0u8; page_size as usize];
        assert!(is_hole_punched(&page, page_size));

        // Data in the first three quarters does not matter.
        page[0] = 0xFF;
        page[100] = 0xAB;
        assert!(is_hole_punched(&page, page_size));

        // A buffer shorter than the page size is never hole-punched.
        assert!(!is_hole_punched(&page[..100], page_size));

        // Any non-zero byte in the last quarter clears the verdict.
        page[page_size as usize - 10] = 0x01;
        assert!(!is_hole_punched(&page, page_size));
    }

    /// Pins the user-facing labels produced by `Display`.
    #[test]
    fn test_display_names() {
        assert_eq!(CompressionAlgorithm::None.to_string(), "None");
        assert_eq!(CompressionAlgorithm::Zlib.to_string(), "Zlib");
        assert_eq!(CompressionAlgorithm::Lz4.to_string(), "LZ4");
        assert_eq!(CompressionAlgorithm::Lzo.to_string(), "LZO");
        assert_eq!(CompressionAlgorithm::Lzma.to_string(), "LZMA");
        assert_eq!(CompressionAlgorithm::Bzip2.to_string(), "bzip2");
        assert_eq!(CompressionAlgorithm::Snappy.to_string(), "Snappy");
    }
}