#![cfg(feature = "lzs")]
use compcol::lzs::{Decoder, Encoder, Lzs};
use compcol::{Algorithm, Decoder as _, Encoder as _, Error, Status};
/// Streams `input` through `enc` in bounded slices and returns everything the encoder emitted.
///
/// * `enc` - encoder to drive; `finish` is called on it before returning, `reset` is not.
/// * `input` - bytes to encode.
/// * `in_chunk` - maximum number of input bytes offered per slice (clamped to at least 1).
/// * `out_chunk` - size of the scratch output buffer (clamped to at least 1).
///
/// # Panics
///
/// Panics if `encode` or `finish` returns an error, or if `finish` reports that it is not
/// done while writing no bytes.
fn encode_chunked(enc: &mut Encoder, input: &[u8], in_chunk: usize, out_chunk: usize) -> Vec<u8> {
    let mut encoded = Vec::new();
    let mut buf = vec![0u8; out_chunk.max(1)];

    // Clamp the slice size the same way the output buffer is clamped: a zero-sized slice
    // would never advance through `input`.
    for chunk in input.chunks(in_chunk.max(1)) {
        let mut consumed = 0;
        while consumed < chunk.len() {
            let (p, status) = enc.encode(&chunk[consumed..], &mut buf).unwrap();
            encoded.extend_from_slice(&buf[..p.written]);
            consumed += p.consumed;
            match status {
                // The encoder is done with this slice; move on to the next one.
                Status::InputEmpty | Status::StreamEnd => break,
                // Scratch buffer was drained above; offer the rest of the slice again.
                Status::OutputFull => {}
            }
        }
    }

    // Flush whatever the encoder still holds, one scratch buffer at a time.
    loop {
        let (p, status) = enc.finish(&mut buf).unwrap();
        encoded.extend_from_slice(&buf[..p.written]);
        match status {
            Status::StreamEnd => break,
            Status::OutputFull | Status::InputEmpty => {
                // No end-of-stream and no output means another call cannot make progress.
                if p.written == 0 {
                    panic!("lzs encoder finish stalled");
                }
            }
        }
    }
    encoded
}
/// Decodes `encoded` with a newly constructed [`Decoder`], forwarding the chunk sizes to
/// [`decode_chunked_with`] and returning its result unchanged.
fn decode_chunked(encoded: &[u8], in_chunk: usize, out_chunk: usize) -> Result<Vec<u8>, Error> {
    decode_chunked_with(&mut Decoder::new(), encoded, in_chunk, out_chunk)
}
/// Streams `encoded` through `dec` in bounded slices and returns the decoded bytes.
///
/// * `dec` - decoder to drive; `finish` is called on it before returning, `reset` is not.
/// * `encoded` - the encoded stream.
/// * `in_chunk` - maximum number of input bytes offered per slice (clamped to at least 1).
/// * `out_chunk` - size of the scratch output buffer (clamped to at least 1).
///
/// # Errors
///
/// Returns the first error reported by `decode` or `finish`.
///
/// # Panics
///
/// Panics if `finish` reports that it is not done while writing no bytes.
fn decode_chunked_with(
    dec: &mut Decoder,
    encoded: &[u8],
    in_chunk: usize,
    out_chunk: usize,
) -> Result<Vec<u8>, Error> {
    let mut decoded = Vec::new();
    let mut buf = vec![0u8; out_chunk.max(1)];

    // Clamp the slice size the same way the output buffer is clamped: a zero-sized slice
    // would never advance through `encoded`.
    for chunk in encoded.chunks(in_chunk.max(1)) {
        let mut consumed = 0;
        while consumed < chunk.len() {
            let (p, status) = dec.decode(&chunk[consumed..], &mut buf)?;
            decoded.extend_from_slice(&buf[..p.written]);
            consumed += p.consumed;
            match status {
                // Stop offering this slice; any later slices are still fed to the decoder.
                Status::StreamEnd | Status::InputEmpty => break,
                // Scratch buffer was drained above; offer the rest of the slice again.
                Status::OutputFull => {}
            }
        }
    }

    // With no input left, keep calling `decode` until it stops producing output.
    loop {
        let (p, _status) = dec.decode(&[], &mut buf)?;
        if p.written == 0 {
            break;
        }
        decoded.extend_from_slice(&buf[..p.written]);
    }

    // Let the decoder close the stream, collecting anything it writes while doing so.
    loop {
        let (p, status) = dec.finish(&mut buf)?;
        decoded.extend_from_slice(&buf[..p.written]);
        match status {
            Status::StreamEnd => break,
            Status::OutputFull | Status::InputEmpty => {
                // No end-of-stream and no output means another call cannot make progress.
                if p.written == 0 {
                    panic!("lzs decoder finish stalled");
                }
            }
        }
    }
    Ok(decoded)
}
/// Encodes `input` with a new [`Encoder`], offering the whole input as a single slice and
/// using a 4096-byte output buffer.
fn encode_all(input: &[u8]) -> Vec<u8> {
    // `max(1)` keeps the slice size non-zero when `input` is empty.
    let whole_input = input.len().max(1);
    encode_chunked(&mut Encoder::new(), input, whole_input, 4096)
}
/// Encodes `input`, decodes the result with 4096-byte chunks, and asserts the decoded bytes
/// equal `input`. Panics if decoding returns an error.
fn round_trip(input: &[u8]) {
    let decoded = decode_chunked(&encode_all(input), 4096, 4096).unwrap();
    assert_eq!(decoded, input, "round-trip mismatch len {}", input.len());
}
/// The `Algorithm` implementation for `Lzs` reports the name `"lzs"`.
#[test]
fn name_is_lzs() {
    let name = <Lzs as Algorithm>::NAME;
    assert_eq!(name, "lzs");
}
/// Empty input still yields a stream of at least nine bytes whose first eight bytes are a
/// little-endian zero, and that stream decodes back to nothing.
#[test]
fn round_trip_empty() {
    let encoded = encode_all(b"");
    assert!(encoded.len() >= 9);

    let header = &encoded[..8];
    assert_eq!(header, &0u64.to_le_bytes());

    let decoded = decode_chunked(&encoded, 4096, 4096).unwrap();
    assert_eq!(decoded, b"");
}
/// A one-byte input survives an encode/decode round trip.
#[test]
fn round_trip_single_byte() {
    let input: &[u8] = b"X";
    round_trip(input);
}
/// A short ASCII phrase survives an encode/decode round trip.
#[test]
fn round_trip_hello_world() {
    let input: &[u8] = b"hello world";
    round_trip(input);
}
/// 1024 copies of the same byte survive an encode/decode round trip.
#[test]
fn round_trip_repeated_bytes() {
    round_trip(&[b'a'; 1024]);
}
/// A phrase repeated until the input reaches at least 64 KiB survives a round trip.
#[test]
fn round_trip_repeated_64kib() {
    let phrase: &[u8] = b"the quick brown fox jumps over the lazy dog ";
    // Smallest whole number of repetitions whose total length is >= 64 KiB.
    let repetitions = (64 * 1024usize).div_ceil(phrase.len());
    let input = phrase.repeat(repetitions);
    round_trip(&input);
}
/// Short runs of repeated bytes, a stretch of text, and one long run survive a round trip.
#[test]
fn round_trip_mixed_short_runs() {
    let input = [
        vec![b'a'; 10],
        vec![b'b'; 3],
        vec![b'c'; 7],
        b"and a quick fox jumps over".to_vec(),
        vec![b'z'; 200],
    ]
    .concat();
    round_trip(&input);
}
/// 8 KiB of deterministic pseudo-random bytes survive a round trip.
///
/// The bytes come from a fixed-seed linear congruential recurrence on a wrapping `u32`;
/// each output byte is bits 16..24 of the updated state.
#[test]
fn round_trip_pseudo_random_8kib() {
    let mut state = 0xC0FFEE_u32;
    let input: Vec<u8> = (0..8 * 1024)
        .map(|_| {
            state = state.wrapping_mul(1_664_525).wrapping_add(1_013_904_223);
            (state >> 16) as u8
        })
        .collect();
    round_trip(&input);
}
/// Every byte value from 0 through 255, in ascending order, survives a round trip.
#[test]
fn round_trip_full_byte_range() {
    let input = (u8::MIN..=u8::MAX).collect::<Vec<u8>>();
    round_trip(&input);
}
/// Round trip with one-byte input slices and a one-byte output buffer on both sides.
#[test]
fn round_trip_streaming_one_byte() {
    let input: &[u8] = b"streaming bytes one at a time";
    let encoded = encode_chunked(&mut Encoder::new(), input, 1, 1);
    let decoded = decode_chunked(&encoded, 1, 1).unwrap();
    assert_eq!(decoded, input);
}
/// Round trip with three-byte input slices and a four-byte output buffer on both sides.
#[test]
fn round_trip_streaming_tiny_buffers() {
    // Three back-to-back copies of the sentence, with no separator between them.
    let sentence: &[u8] = b"the quick brown fox jumps over the lazy dog";
    let input = sentence.repeat(3);

    let encoded = encode_chunked(&mut Encoder::new(), &input, 3, 4);
    let decoded = decode_chunked(&encoded, 3, 4).unwrap();
    assert_eq!(decoded, input);
}
/// One encoder, reset between uses, produces two streams that each decode to their own input.
#[test]
fn encoder_reset_allows_reuse() {
    let first: &[u8] = b"alpha alpha alpha alpha alpha";
    let second: &[u8] = b"bravo bravo bravo bravo bravo";

    let mut enc = Encoder::new();
    let encoded_first = encode_chunked(&mut enc, first, 4096, 4096);
    enc.reset();
    let encoded_second = encode_chunked(&mut enc, second, 4096, 4096);

    // Each stream is decoded with its own fresh decoder, in the order it was produced.
    for (stream, expected) in [(&encoded_first, first), (&encoded_second, second)] {
        assert_eq!(decode_chunked(stream, 4096, 4096).unwrap(), expected);
    }
}
/// One decoder, reset between uses, decodes two independent streams correctly.
#[test]
fn decoder_reset_allows_reuse() {
    let mut enc = Encoder::new();
    let hello_stream = encode_chunked(&mut enc, b"hello", 4096, 4096);
    enc.reset();
    let world_stream = encode_chunked(&mut enc, b"world", 4096, 4096);

    let mut dec = Decoder::new();
    let first = decode_chunked_with(&mut dec, &hello_stream, 4096, 4096).unwrap();
    assert_eq!(first, b"hello");

    dec.reset();
    let second = decode_chunked_with(&mut dec, &world_stream, 4096, 4096).unwrap();
    assert_eq!(second, b"world");
}
/// Decodes a hand-assembled stream of three 9-bit groups (a 0 bit followed by the byte's
/// bits, most significant first) and expects `abc`.
#[test]
fn decode_fixture_three_literals() {
    let bits = [
        0u8, 0, 1, 1, 0, 0, 0, 0, 1, // 0 + 0x61 ('a')
        0, 0, 1, 1, 0, 0, 0, 1, 0, // 0 + 0x62 ('b')
        0, 0, 1, 1, 0, 0, 0, 1, 1, // 0 + 0x63 ('c')
        1, 1, 0, 0, 0, 0, 0, 0, 0, // closing pattern shared by the fixtures in this file
    ];

    // 8-byte little-endian header (3, matching the expected output length), then the bits.
    let mut framed = 3u64.to_le_bytes().to_vec();
    framed.extend(pack_msb(&bits));

    let decoded = decode_chunked(&framed, 4096, 4096).unwrap();
    assert_eq!(decoded, b"abc");
}
/// Decodes a hand-assembled stream of two literal groups followed by a back-reference group
/// and expects `abababab`.
#[test]
fn decode_fixture_match_short_offset_len2() {
    let bits = [
        0u8, 0, 1, 1, 0, 0, 0, 0, 1, // 0 + 0x61 ('a')
        0, 0, 1, 1, 0, 0, 0, 1, 0, // 0 + 0x62 ('b')
        1, 1, 0, 0, 0, 0, 0, 1, 0, // 1,1 + 7-bit value 2 (presumably the match offset)
        1, 1, 0, 1, // 4-bit group (presumably the match length code)
        1, 1, 0, 0, 0, 0, 0, 0, 0, // closing pattern shared by the fixtures in this file
    ];

    // 8-byte little-endian header (8, matching the expected output length), then the bits.
    let mut framed = 8u64.to_le_bytes().to_vec();
    framed.extend(pack_msb(&bits));

    let decoded = decode_chunked(&framed, 4096, 4096).unwrap();
    assert_eq!(decoded, b"abababab");
}
/// Decodes 256 literal groups followed by a group carrying an 11-bit value of 200, and
/// expects the 256 bytes plus four bytes copied from 200 positions back.
#[test]
fn decode_fixture_long_offset() {
    let mut bits: Vec<u8> = Vec::new();

    // One 9-bit group per byte value: a 0 bit, then the byte MSB first.
    for byte in 0..=u8::MAX {
        bits.push(0);
        bits.extend((0..8).rev().map(|shift| (byte >> shift) & 1));
    }

    // 1,0 prefix followed by the 11-bit value, MSB first.
    bits.extend_from_slice(&[1, 0]);
    let off: u16 = 200;
    bits.extend((0..11).rev().map(|shift| ((off >> shift) & 1) as u8));

    // Two more bits (presumably the length code), then the closing pattern.
    bits.extend_from_slice(&[1, 0]);
    bits.extend_from_slice(&[1, 1, 0, 0, 0, 0, 0, 0, 0]);

    // 8-byte little-endian header (260, matching the expected output length), then the bits.
    let mut framed = 260u64.to_le_bytes().to_vec();
    framed.extend(pack_msb(&bits));

    let decoded = decode_chunked(&framed, 4096, 4096).unwrap();

    // Model the copy: each new byte repeats the one 200 positions before the current end.
    let mut expected: Vec<u8> = (0..=255u8).collect();
    for _ in 0..4 {
        let copied = expected[expected.len() - 200];
        expected.push(copied);
    }
    assert_eq!(decoded, expected);
}
/// Decodes one literal `a` followed by a back-reference group with a 12-bit length field and
/// expects 24 copies of `a`.
#[test]
fn decode_fixture_extended_length() {
    // Literal group: a 0 bit, then 0x61 MSB first.
    let mut bits: Vec<u8> = vec![0];
    bits.extend((0..8).rev().map(|shift| (0x61u8 >> shift) & 1));

    // 1,1 prefix followed by the 7-bit value 1, MSB first.
    bits.extend_from_slice(&[1, 1]);
    let off: u8 = 1;
    bits.extend((0..7).rev().map(|shift| (off >> shift) & 1));

    // Three 4-bit groups (presumably an extended length code), then the closing pattern.
    bits.extend_from_slice(&[1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]);
    bits.extend_from_slice(&[1, 1, 0, 0, 0, 0, 0, 0, 0]);

    // 8-byte little-endian header (24, matching the expected output length), then the bits.
    let mut framed = 24u64.to_le_bytes().to_vec();
    framed.extend(pack_msb(&bits));

    let decoded = decode_chunked(&framed, 4096, 4096).unwrap();
    assert_eq!(decoded, vec![b'a'; 24]);
}
/// Packs a sequence of 0/1 values into bytes, placing the first bit of each group of eight
/// in the most significant position.
///
/// A trailing group shorter than eight bits is padded on the right with 1 bits. In builds
/// with debug assertions enabled, any element greater than 1 triggers a panic; otherwise
/// only the lowest bit of each element is used.
fn pack_msb(bits: &[u8]) -> Vec<u8> {
    bits.chunks(8)
        .map(|group| {
            let packed = group.iter().fold(0u8, |acc, &bit| {
                debug_assert!(bit <= 1);
                (acc << 1) | (bit & 1)
            });
            match 8 - group.len() {
                0 => packed,
                // Shift the partial group up and fill the vacated low bits with ones.
                missing => (packed << missing) | ((1u8 << missing) - 1),
            }
        })
        .collect()
}
/// Feeding only three bytes and then finishing must fail with `UnexpectedEnd` or `Corrupt`.
#[test]
fn truncated_header_rejected() {
    let mut dec = Decoder::new();
    let mut scratch = [0u8; 16];

    // The three bytes themselves must be accepted without error; the failure is
    // expected from `finish`.
    let _ = dec.decode(&[0u8; 3], &mut scratch).unwrap();

    let err = dec.finish(&mut scratch).unwrap_err();
    assert!(
        matches!(err, Error::UnexpectedEnd | Error::Corrupt),
        "unexpected error: {:?}",
        err
    );
}
/// A stream consisting only of an 8-byte little-endian header (value 10) with nothing after
/// it must fail with `UnexpectedEnd` or `Corrupt`.
#[test]
fn truncated_payload_rejected() {
    let header_only = 10u64.to_le_bytes();
    let err = decode_chunked(&header_only, 4096, 4096).unwrap_err();
    assert!(
        matches!(err, Error::UnexpectedEnd | Error::Corrupt),
        "unexpected error: {:?}",
        err
    );
}
/// A stream whose very first group is a back-reference (nothing has been output yet) must
/// fail with `InvalidDistance`.
#[test]
fn match_before_any_output_rejected() {
    let bits = [
        1u8, 1, 0, 0, 0, 0, 0, 0, 1, // 1,1 + 7-bit value 1 (presumably the match offset)
        0, 0, // 2-bit group (presumably the match length code)
        1, 1, 0, 0, 0, 0, 0, 0, 0, // closing pattern shared by the fixtures in this file
    ];

    // 8-byte little-endian header (value 8), then the packed bits.
    let mut framed = 8u64.to_le_bytes().to_vec();
    framed.extend(pack_msb(&bits));

    let err = decode_chunked(&framed, 4096, 4096).unwrap_err();
    assert_eq!(err, Error::InvalidDistance);
}
/// A header value of 99 in front of a payload holding a single literal must fail with
/// `TrailerMismatch`, `UnexpectedEnd`, or `Corrupt`.
#[test]
fn length_mismatch_rejected() {
    // Literal group for 'X': a 0 bit, then the byte MSB first, then the closing pattern.
    let mut bits: Vec<u8> = vec![0];
    bits.extend((0..8).rev().map(|shift| (b'X' >> shift) & 1));
    bits.extend_from_slice(&[1, 1, 0, 0, 0, 0, 0, 0, 0]);

    // The header deliberately disagrees with the one byte the payload describes.
    let mut framed = 99u64.to_le_bytes().to_vec();
    framed.extend(pack_msb(&bits));

    let err = decode_chunked(&framed, 4096, 4096).unwrap_err();
    assert!(
        matches!(
            err,
            Error::TrailerMismatch | Error::UnexpectedEnd | Error::Corrupt
        ),
        "unexpected error: {:?}",
        err
    );
}
/// Round trip using the encoder and decoder obtained through the `Algorithm` trait's
/// constructors instead of the concrete types' `new`.
#[test]
fn algorithm_encoder_decoder_round_trip() {
    let mut enc = <Lzs as Algorithm>::encoder();
    let mut dec = <Lzs as Algorithm>::decoder();
    let input = b"compcol Algorithm trait roundtrip for lzs!";
    let mut scratch = vec![0u8; 256];

    // Feed the input until it is fully consumed or the encoder asks for more.
    let mut encoded = Vec::new();
    let mut fed = 0;
    while fed < input.len() {
        let (progress, status) = enc.encode(&input[fed..], &mut scratch).unwrap();
        encoded.extend_from_slice(&scratch[..progress.written]);
        fed += progress.consumed;
        if let Status::InputEmpty = status {
            break;
        }
    }

    // Flush the encoder; a call that neither ends the stream nor writes anything is a stall.
    loop {
        let (progress, status) = enc.finish(&mut scratch).unwrap();
        encoded.extend_from_slice(&scratch[..progress.written]);
        match status {
            Status::StreamEnd => break,
            Status::OutputFull | Status::InputEmpty if progress.written == 0 => {
                panic!("finish stalled")
            }
            Status::OutputFull | Status::InputEmpty => {}
        }
    }

    // Decode until the decoder reports anything other than a full output buffer.
    let mut decoded = Vec::new();
    let mut taken = 0;
    loop {
        let (progress, status) = dec.decode(&encoded[taken..], &mut scratch).unwrap();
        decoded.extend_from_slice(&scratch[..progress.written]);
        taken += progress.consumed;
        match status {
            Status::StreamEnd | Status::InputEmpty => break,
            Status::OutputFull => {}
        }
    }

    let (_, final_status) = dec.finish(&mut scratch).unwrap();
    assert!(matches!(final_status, Status::StreamEnd));
    assert_eq!(decoded, input);
}
/// Tests for reaching the LZS codec through the name-based `factory` API; compiled only when
/// the `factory` feature is enabled.
#[cfg(feature = "factory")]
mod factory {
    use compcol::Status;
    use compcol::factory;

    /// Both an encoder and a decoder can be looked up under the name `"lzs"`.
    #[test]
    fn lookup_known() {
        let encoder = factory::encoder_by_name("lzs");
        let decoder = factory::decoder_by_name("lzs");
        assert!(encoder.is_some());
        assert!(decoder.is_some());
    }

    /// The list of registered names includes `"lzs"`.
    #[test]
    fn names_contains_lzs() {
        let names = factory::names();
        assert!(names.contains(&"lzs"));
    }

    /// The extension reported for `"lzs"` is `"lzs"`.
    #[test]
    fn extension_is_lzs() {
        let extension = factory::extension("lzs");
        assert_eq!(extension, Some("lzs"));
    }

    /// Round trip through the encoder and decoder returned by the factory lookups.
    #[test]
    fn boxed_round_trip() {
        let mut enc = factory::encoder_by_name("lzs").unwrap();
        let mut dec = factory::decoder_by_name("lzs").unwrap();
        let input = b"factory boxed round-trip for lzs";
        let mut scratch = vec![0u8; 256];

        // Feed the input until it is fully consumed or the encoder asks for more.
        let mut encoded = Vec::new();
        let mut fed = 0;
        while fed < input.len() {
            let (progress, status) = enc.encode(&input[fed..], &mut scratch).unwrap();
            encoded.extend_from_slice(&scratch[..progress.written]);
            fed += progress.consumed;
            if let Status::InputEmpty = status {
                break;
            }
        }

        // Flush the encoder; a call that neither ends the stream nor writes is a stall.
        loop {
            let (progress, status) = enc.finish(&mut scratch).unwrap();
            encoded.extend_from_slice(&scratch[..progress.written]);
            match status {
                Status::StreamEnd => break,
                Status::OutputFull | Status::InputEmpty if progress.written == 0 => {
                    panic!("finish stalled")
                }
                Status::OutputFull | Status::InputEmpty => {}
            }
        }

        // Decode until the decoder reports anything other than a full output buffer.
        let mut decoded = Vec::new();
        let mut taken = 0;
        loop {
            let (progress, status) = dec.decode(&encoded[taken..], &mut scratch).unwrap();
            decoded.extend_from_slice(&scratch[..progress.written]);
            taken += progress.consumed;
            match status {
                Status::StreamEnd | Status::InputEmpty => break,
                Status::OutputFull => {}
            }
        }

        let (_, final_status) = dec.finish(&mut scratch).unwrap();
        assert!(matches!(final_status, Status::StreamEnd));
        assert_eq!(&decoded[..], input);
    }
}