aehobak 0.0.18

Transcoder for bsdiff binary patches.
Documentation
/*-
 * Copyright 2025 David Michael Barr
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted providing that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
 * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
 * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#![doc = include_str!("../README.md")]

mod control;
mod decode;
mod diff;
mod encode;
mod patch;

pub use decode::decode;
pub use diff::diff;
pub use encode::encode;
pub use patch::patch;

#[cfg(test)]
mod tests {
    use super::*;
    use bsdiff;
    use quickcheck::{quickcheck, TestResult};
    use rand_xoshiro::rand_core::{RngCore, SeedableRng};
    use rand_xoshiro::Xoshiro256Plus;
    use std::collections::LinkedList;

    quickcheck! {
        fn round_trip(old: Vec<u8>, new: Vec<u8>) -> bool {
            let mut patch = Vec::new();
            let mut encoded = Vec::new();
            let mut decoded = Vec::new();
            bsdiff::diff(&old, &new, &mut patch).unwrap();
            encode(&patch, &mut encoded).unwrap();
            decode(&mut encoded.as_slice(), &mut decoded).unwrap();
            decoded == patch
        }

        fn replace_one(old: Vec<u8>, idx: usize) -> bool {
            let mut new = old.clone();
            if !new.is_empty() {
                let idx = idx % new.len();
                new[idx] = new[idx].wrapping_add(1);
            }
            let mut patch = Vec::new();
            let mut encoded = Vec::new();
            let mut decoded = Vec::new();
            bsdiff::diff(&old, &new, &mut patch).unwrap();
            encode(&patch, &mut encoded).unwrap();
            decode(&mut encoded.as_slice(), &mut decoded).unwrap();
            decoded == patch
        }

        fn direct_patch(old: Vec<u8>, idx: usize) -> bool {
            let mut new = old.clone();
            if !new.is_empty() {
                let idx = idx % new.len();
                new[idx] = new[idx].wrapping_add(1);
            }
            let mut bspatch = Vec::new();
            let mut encoded = Vec::new();
            let mut result = Vec::with_capacity(new.len());
            bsdiff::diff(&old, &new, &mut bspatch).unwrap();
            encode(&bspatch, &mut encoded).unwrap();
            patch(&old, &encoded, &mut result).unwrap();
            result == new
        }

        fn direct_patch_truncated(old: Vec<u8>, idx: usize, sub: usize) -> bool {
            let mut new = old.clone();
            if !new.is_empty() {
                let idx = idx % new.len();
                new[idx] = new[idx].wrapping_add(1);
            }
            let mut bspatch = Vec::new();
            let mut encoded = Vec::new();
            let mut result = Vec::with_capacity(new.len());
            bsdiff::diff(&old, &new, &mut bspatch).unwrap();
            encode(&bspatch, &mut encoded).unwrap();
            if encoded.is_empty() {
                return true;
            }
            encoded.truncate(encoded.len().saturating_sub(sub.max(1)).max(1));
            patch(&old, &encoded, &mut result).is_err() || new.is_empty()
        }

        fn direct_patch_nospace(old: Vec<u8>, idx: usize) -> bool {
            let mut new = old.clone();
            if !new.is_empty() {
                let idx = idx % new.len();
                new[idx] = new[idx].wrapping_add(1);
            }
            let mut bspatch = Vec::new();
            let mut encoded = Vec::new();
            let mut result = Vec::with_capacity(new.len() / 2);
            bsdiff::diff(&old, &new, &mut bspatch).unwrap();
            encode(&bspatch, &mut encoded).unwrap();
            patch(&old, &encoded, &mut result).is_err() || new.len() < 2
        }

        fn direct_diff(old: Vec<u8>, idx: usize) -> bool {
            let mut new = old.clone();
            if !new.is_empty() {
                let idx = idx % new.len();
                new[idx] = new[idx].wrapping_add(1);
            }
            let mut encoded = Vec::new();
            diff(&old, &new, &mut encoded).unwrap();
            let mut result = Vec::with_capacity(new.len());
            let mut decoded = Vec::new();
            decode(&mut encoded.as_slice(), &mut decoded).unwrap();
            bsdiff::patch(&old, &mut decoded.as_slice(), &mut result).unwrap();
            result == new
        }

        fn direct_diff_nospace(old: Vec<u8>, idx: usize) -> TestResult {
            let mut new = old.clone();
            if new.is_empty() {
                return TestResult::discard();
            }
            let idx = idx % new.len();
            new[idx] = new[idx].wrapping_add(1);
            let mut patch:[u8; 0] = [];
            TestResult::from_bool(diff(&old, &new, &mut patch.as_mut_slice()).is_err())
        }

        #[cfg_attr(miri, ignore)] // Slow
        fn arbitrary_patch(skeleton: LinkedList<(u8,u8,i8)>, period: u8, phase: u8) -> bool {
            use std::io::ErrorKind::{InvalidData, UnexpectedEof};
            let (bspatch, old_len, new_len) = gen_bspatch(skeleton, period, phase);
            let mut encoded = Vec::new();
            let mut result = Vec::with_capacity(new_len);
            let old = vec![0; old_len];
            encode(&bspatch, &mut encoded).unwrap();
            match patch(&old, &encoded, &mut result) {
                Err(e) if e.kind() == InvalidData => true,
                Err(e) if e.kind() == UnexpectedEof => true,
                Ok(_) => {
                    let mut reference = Vec::new();
                    bsdiff::patch(&old, &mut bspatch.as_slice(), &mut reference).unwrap();
                    reference == result
                }
                _ => false,
            }
        }

        #[cfg_attr(miri, ignore)] // Slow
        fn arbitrary_diff(skeleton: LinkedList<(u8,u8,i8)>, period: u8, phase: u8) -> TestResult {
            if let Some((old, new)) = gen_old_new(skeleton, period, phase) {
                let mut encoded = Vec::with_capacity(new.len());
                if diff(&old, &new, &mut encoded).is_err() {
                    return TestResult::failed();
                }
                let mut result = Vec::with_capacity(new.len());
                let mut decoded = Vec::new();
                decode(&mut encoded.as_slice(), &mut decoded).unwrap();
                bsdiff::patch(&old, &mut decoded.as_slice(), &mut result).unwrap();
                TestResult::from_bool(result == new)
            } else {
                TestResult::discard()
            }
        }
    }

    #[test]
    #[cfg_attr(miri, ignore)] // Slow
    fn direct_diff_huge() {
        let mut old = Vec::with_capacity(i32::MAX as usize + 1);
        old.resize(old.capacity(), 0);
        let mut patch = Vec::new();
        assert!(diff(&old, &old, &mut patch.as_mut_slice()).is_err());
    }

    #[test]
    fn arbitrary_diff_vectors() {
        #[rustfmt::skip]
        let skeleton: Vec<(u8, i8)> = vec![
            (208, -5), (167, -8), (246, 46), (155, -30), (180, 112), (219, 0), (220, -81),
            (170, 3), (223, 49), (29, 57), (144, 56), (169, 100), (170, -105), (147, 121),
            (74, 1), (125, -99), (214, 115), (9, 73), (114, 123), (9, 80), (9, 0)
        ];
        let skeleton = skeleton.into_iter().map(|(a, b)| (a, 0, b)).collect();
        let period = 20;
        let phase = 0;
        let (old, new) = gen_old_new(skeleton, period, phase).unwrap();
        let mut encoded = Vec::with_capacity(new.len());
        diff(&old, &new, &mut encoded).unwrap();
        let mut result = Vec::with_capacity(new.len());
        patch(&old, &encoded, &mut result).unwrap();
        assert!(result == new)
    }

    fn gen_old_new(
        skeleton: LinkedList<(u8, u8, i8)>,
        period: u8,
        phase: u8,
    ) -> Option<(Vec<u8>, Vec<u8>)> {
        let (bspatch, old_len, new_len) = gen_bspatch(skeleton, period, phase);
        let mut new = Vec::with_capacity(new_len);
        let mut old = vec![0; old_len];
        let mut rng = Xoshiro256Plus::seed_from_u64(0xeba2fa67e5a81121);
        rng.fill_bytes(&mut old);
        if bsdiff::patch(&old, &mut bspatch.as_slice(), &mut new).is_err() {
            return None;
        }
        Some((old, new))
    }

    fn gen_bspatch(
        skeleton: LinkedList<(u8, u8, i8)>,
        period: u8,
        phase: u8,
    ) -> (Vec<u8>, usize, usize) {
        use crate::control::{Aehobak, Bsdiff};
        let mut bspatch = Vec::new();
        let mut diffs = phase as usize;
        let mut old_len = 0;
        let mut new_len = 0;
        let mut cursor = 0;
        let mut rng = Xoshiro256Plus::seed_from_u64(0x75efdb1b26806fd8);
        for (add, copy, seek) in skeleton {
            let (add, copy, seek) = (add as u32, copy as u32, seek as i32);
            let seek = (seek << 1 ^ seek >> 31) as u32;
            let control: Bsdiff =
                (&Aehobak::try_from([add, copy, seek].as_slice()).unwrap()).into();
            control.encode(&mut bspatch);
            for _ in 0..add {
                bspatch.push((diffs % (1 + period as usize) == 0) as u8);
                diffs += 1;
            }
            cursor += add as usize;
            old_len = old_len.max(cursor);
            cursor = (cursor as i64 + seek as i64).max(0) as usize;
            let bspatch_len = bspatch.len();
            bspatch.resize(bspatch_len + copy as usize, 0);
            rng.fill_bytes(&mut bspatch[bspatch_len..]);
            new_len += copy as usize + add as usize;
        }
        (bspatch, old_len, new_len)
    }
}