use crate::*;
/// Base guest address used by the memory-operand tests: it (or an offset from it) is loaded
/// into RAX and the operand bytes are written starting here.
const ALIGNED_ADDR: u64 = 0x3000;
/// Second guest address, 0x100 bytes above `ALIGNED_ADDR`.
// NOTE(review): not referenced by any test visible in this section — confirm it is still needed.
const ALIGNED_ADDR2: u64 = 0x3100;
/// Executes `vpsadbw ymm0, ymm1, ymm2` followed by `hlt`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
// NOTE(review): the source registers are not written by this test, so their contents are
// whatever `emu64()` provides — confirm that matches the "all zeros" intent.
#[test]
fn test_vpsadbw_ymm0_ymm1_ymm2_all_zeros() {
    // c5 f5 f6 c2 = vpsadbw ymm0, ymm1, ymm2 ; f4 = hlt
    let program: [u8; 5] = [0xc5, 0xf5, 0xf6, 0xc2, 0xf4];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm3, ymm4, ymm5` followed by `hlt`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
// NOTE(review): the source registers are not written by this test — confirm how the
// "all ones" input named in the test is meant to be set up.
#[test]
fn test_vpsadbw_ymm3_ymm4_ymm5_all_ones() {
    // c5 dd f6 dd = vpsadbw ymm3, ymm4, ymm5 ; f4 = hlt
    let program: [u8; 5] = [0xc5, 0xdd, 0xf6, 0xdd, 0xf4];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm6, ymm7, ymm8` followed by `hlt`.
///
/// `ymm8` as the r/m operand needs the VEX.B extension bit, which only exists in the
/// three-byte VEX form, so the instruction is encoded with a `c4` prefix:
///
/// * `c4`  – three-byte VEX escape
/// * `c1`  – R̄=1, X̄=1, B̄=0 (extends r/m to ymm8), map 0F
/// * `45`  – W=0, vvvv=!7 (ymm7), L=1 (256-bit), pp=01 (66)
/// * `f6`  – PSADBW opcode
/// * `f0`  – ModRM: mod=11, reg=110 (ymm6), r/m=000 (+B → ymm8)
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_ymm6_ymm7_ymm8_identical() {
    // vpsadbw ymm6, ymm7, ymm8 ; hlt
    let program: [u8; 6] = [0xc4, 0xc1, 0x45, 0xf6, 0xf0, 0xf4];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm9, ymm10, ymm11` (three-byte VEX form) followed by `hlt`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_ymm9_ymm10_ymm11_mixed_values() {
    // c4 41 2d f6 cb = vpsadbw ymm9, ymm10, ymm11 ; f4 = hlt
    let program: [u8; 6] = [0xc4, 0x41, 0x2d, 0xf6, 0xcb, 0xf4];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm12, ymm13, ymm14` (three-byte VEX form) followed by `hlt`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_ymm12_ymm13_ymm14_alternating() {
    // c4 41 15 f6 e6 = vpsadbw ymm12, ymm13, ymm14 ; f4 = hlt
    let program: [u8; 6] = [0xc4, 0x41, 0x15, 0xf6, 0xe6, 0xf4];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm15, ymm0, ymm1` followed by `hlt`.
///
/// The destination `ymm15` requires the VEX.R extension bit (stored inverted), while the
/// r/m operand `ymm1` must NOT have VEX.B set:
///
/// * `c4`  – three-byte VEX escape
/// * `61`  – R̄=0 (extends reg to ymm15), X̄=1, B̄=1, map 0F
/// * `7d`  – W=0, vvvv=!0 (ymm0), L=1 (256-bit), pp=01 (66)
/// * `f6`  – PSADBW opcode
/// * `f9`  – ModRM: mod=11, reg=111 (+R → ymm15), r/m=001 (ymm1)
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_ymm15_ymm0_ymm1_high_reg() {
    // vpsadbw ymm15, ymm0, ymm1 ; hlt
    let program: [u8; 6] = [0xc4, 0x61, 0x7d, 0xf6, 0xf9, 0xf4];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at 32 bytes of `0x11`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_ymm0_ymm1_mem() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &[0x11u8; 32]);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm2, ymm3, [rax]` with RAX pointing at 32 bytes of `0xFF`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_ymm2_ymm3_mem_max() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xe5, 0xf6, 0x10, 0xf4][..], // vpsadbw ymm2, ymm3, [rax] ; hlt
    ]
    .concat();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &[0xFFu8; 32]);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm4, ymm5, [rax]` with RAX pointing at the bytes `0, 1, …, 31`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_ymm4_ymm5_mem_sequential() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xd5, 0xf6, 0x20, 0xf4][..], // vpsadbw ymm4, ymm5, [rax] ; hlt
    ]
    .concat();
    // Ascending byte values 0x00..=0x1F.
    let operand = (0u8..32).collect::<Vec<u8>>();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm6, ymm7, [rax]` with RAX pointing at 32 bytes alternating
/// `0xFF, 0x00`.
///
/// Encoding of the instruction (two-byte VEX form):
///
/// * `c5`  – two-byte VEX escape
/// * `c5`  – R̄=1 (no register extension, so reg stays ymm6), vvvv=!7 (ymm7),
///           L=1 (256-bit), pp=01 (66)
/// * `f6`  – PSADBW opcode
/// * `30`  – ModRM: mod=00, reg=110 (ymm6), r/m=000 ([rax])
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_ymm6_ymm7_mem_alternating() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xc5, 0xf6, 0x30, 0xf4][..], // vpsadbw ymm6, ymm7, [rax] ; hlt
    ]
    .concat();
    // Even byte offsets hold 0xFF, odd byte offsets hold 0x00.
    let pattern: Vec<u8> = [0xFFu8, 0x00].repeat(16);

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &pattern);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at 32 bytes of `0xFF`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_absolute_difference() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    let operand: Vec<u8> = vec![0xFF; 32];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, ymm1` followed by `hlt`; both source operands are the
/// same register.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_zero_difference() {
    // c5 f5 f6 c1 = vpsadbw ymm0, ymm1, ymm1 ; f4 = hlt
    let program: [u8; 5] = [0xc5, 0xf5, 0xf6, 0xc1, 0xf4];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at 32 bytes of `0xFF`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
// NOTE(review): ymm1 is not written by this test, so whether the difference is actually
// maximal depends on the register state `emu64()` provides — confirm.
#[test]
fn test_vpsadbw_max_difference() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &[0xFFu8; 32]);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` where the first 16 operand bytes are `0x01` and
/// the last 16 are `0x02`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_lane_independence() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // Bytes 0..16 and bytes 16..32 carry distinct fill values.
    let operand: Vec<u8> = [[0x01u8; 16], [0x02u8; 16]].concat();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` where the operand's four 8-byte groups are
/// `0x00`, `0xFF`, `0x00`, `0xFF` in that order.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_qword_grouping() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // Even-numbered 8-byte groups are zero-filled, odd-numbered groups are 0xFF-filled.
    let operand: Vec<u8> = (0..32)
        .map(|idx| if (idx / 8) % 2 == 0 { 0x00u8 } else { 0xFF })
        .collect();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes two back-to-back instructions, `vpsadbw ymm0, ymm1, ymm2` and then
/// `vpsadbw ymm0, ymm0, ymm3`, followed by `hlt`. The second instruction reads the
/// destination of the first.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_chain_multiple_ops() {
    let program: [u8; 9] = [
        0xc5, 0xf5, 0xf6, 0xc2, // vpsadbw ymm0, ymm1, ymm2
        0xc5, 0xfd, 0xf6, 0xc3, // vpsadbw ymm0, ymm0, ymm3
        0xf4, // hlt
    ];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX set to `ALIGNED_ADDR + 1`.
///
/// 33 bytes of `0x42` are written starting at `ALIGNED_ADDR`, so the 32 bytes starting
/// one past the base address are all covered by the written data.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_mem_unaligned_offset() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                     // mov rax, imm64
        &(ALIGNED_ADDR + 1).to_le_bytes()[..], // imm64 = ALIGNED_ADDR + 1
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..],   // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &[0x42u8; 33]);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm8, ymm9, ymm10` followed by `hlt`.
///
/// Encoding of the instruction (three-byte VEX form):
///
/// * `c4`  – three-byte VEX escape
/// * `41`  – R̄=0 (extends reg to ymm8), X̄=1, B̄=0 (extends r/m to ymm10), map 0F
/// * `35`  – W=0, vvvv=!9 (ymm9), L=1 (256-bit), pp=01 (66)
/// * `f6`  – PSADBW opcode
/// * `c2`  – ModRM: mod=11, reg=000 (+R → ymm8), r/m=010 (+B → ymm10)
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_extended_regs_r8_r9_r10() {
    // vpsadbw ymm8, ymm9, ymm10 ; hlt
    let program: [u8; 6] = [0xc4, 0x41, 0x35, 0xf6, 0xc2, 0xf4];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm11, ymm12, ymm13` (three-byte VEX form) followed by `hlt`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_extended_regs_r11_r12_r13() {
    // c4 41 1d f6 dd = vpsadbw ymm11, ymm12, ymm13 ; f4 = hlt
    let program: [u8; 6] = [0xc4, 0x41, 0x1d, 0xf6, 0xdd, 0xf4];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm14, ymm15, ymm8` (three-byte VEX form) followed by `hlt`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_extended_regs_r14_r15_r8() {
    // c4 41 05 f6 f0 = vpsadbw ymm14, ymm15, ymm8 ; f4 = hlt
    let program: [u8; 6] = [0xc4, 0x41, 0x05, 0xf6, 0xf0, 0xf4];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at the even numbers
/// `0, 2, 4, …, 62`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_pattern_1() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // 32 values: every second integer below 64.
    let operand = (0u8..64).step_by(2).collect::<Vec<u8>>();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at 32 bytes of `0x01`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_pattern_2() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    let operand: Vec<u8> = vec![0x01; 32];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at 32 bytes alternating
/// `0x80, 0x7F`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_pattern_3() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // Even byte offsets hold 0x80, odd byte offsets hold 0x7F.
    let operand: Vec<u8> = [0x80u8, 0x7F].repeat(16);

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at the 8-byte sequence
/// `00 01 7F 80 81 FE FF 00` repeated four times.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_boundary_values() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // One 8-byte group of edge values, cycled until 32 bytes are produced.
    let operand: Vec<u8> = [0x00u8, 0x01, 0x7F, 0x80, 0x81, 0xFE, 0xFF, 0x00]
        .iter()
        .copied()
        .cycle()
        .take(32)
        .collect();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at the bytes `31, 30, …, 0`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_reverse_sequential() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // Descending byte values 0x1F down to 0x00.
    let operand: Vec<u8> = (0u8..32).map(|idx| 31 - idx).collect();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at 32 bytes of `0x02`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_small_differences() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    let operand: Vec<u8> = vec![0x02; 32];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at the sequence `1, 2, …, 8`
/// repeated four times.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_mixed_differences() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // Position within each 8-byte group, shifted to start at 1.
    let operand: Vec<u8> = (0u8..32).map(|idx| idx % 8 + 1).collect();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at the powers of two
/// `0x01, 0x02, …, 0x80` repeated four times.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_powers_of_two() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // Byte at offset k is a single set bit at position k mod 8.
    let operand: Vec<u8> = (0..32).map(|idx| 1u8 << (idx % 8)).collect();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at 32 bytes where the byte at
/// offset `k` is `(k * 16) mod 256`, i.e. `0x00, 0x10, …, 0xF0` twice.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_gradient_pattern() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // Wrapping u8 multiplication is the same as reducing the product modulo 256.
    let operand: Vec<u8> = (0u8..32).map(|idx| idx.wrapping_mul(16)).collect();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at 32 bytes alternating
/// `0xAA, 0x55`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_checkerboard_pattern() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // Even byte offsets hold 0xAA, odd byte offsets hold 0x55.
    let operand: Vec<u8> = [0xAAu8, 0x55].repeat(16);

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at 32 bytes where the byte at
/// offset `k` is `(k * 7 + 13) mod 256`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_diagonal_pattern() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // Wrapping u8 arithmetic is the same as reducing modulo 256 (the largest value here,
    // 31 * 7 + 13 = 230, does not actually wrap).
    let operand: Vec<u8> = (0u8..32)
        .map(|idx| idx.wrapping_mul(7).wrapping_add(13))
        .collect();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at the 16-byte palindrome
/// `1, 2, …, 8, 8, 7, …, 1` repeated twice.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_symmetric_pattern() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // Rising run 1..=8 followed by its mirror image, cycled to fill 32 bytes.
    let operand: Vec<u8> = (1u8..=8)
        .chain((1u8..=8).rev())
        .cycle()
        .take(32)
        .collect();

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at 32 zero bytes.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
// NOTE(review): ymm1 is not written by this test, so whether the difference against the
// zero operand is maximal depends on the register state `emu64()` provides — confirm.
#[test]
fn test_vpsadbw_all_max_diff() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    let operand: Vec<u8> = vec![0x00; 32];

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at 32 bytes where every fourth
/// byte (offsets 0, 4, 8, …) is `0x00` and all others are `0x10`.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_partial_match() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();
    // One 4-byte group (00 10 10 10) repeated eight times.
    let operand: Vec<u8> = [0x00u8, 0x10, 0x10, 0x10].repeat(8);

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}
/// Executes `vpsadbw ymm0, ymm1, [rax]` with RAX pointing at the first 32 terms of the
/// Fibonacci recurrence starting `0, 1`, computed with wrapping `u8` addition.
///
/// The test only requires `run` to unwrap successfully; no register value is inspected.
#[test]
fn test_vpsadbw_fibonacci_like() {
    let program: Vec<u8> = [
        &[0x48, 0xb8][..],                   // mov rax, imm64
        &ALIGNED_ADDR.to_le_bytes()[..],     // imm64 = ALIGNED_ADDR
        &[0xc5, 0xf5, 0xf6, 0x00, 0xf4][..], // vpsadbw ymm0, ymm1, [rax] ; hlt
    ]
    .concat();

    // Carry the two most recent terms instead of indexing back into the vector.
    let mut operand: Vec<u8> = Vec::with_capacity(32);
    let (mut current, mut following) = (0u8, 1u8);
    for _ in 0..32 {
        operand.push(current);
        let sum = current.wrapping_add(following);
        current = following;
        following = sum;
    }

    let mut emu = emu64();
    emu.load_code_bytes(&program);
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &operand);
    emu.run(None).unwrap();
}