use crate::*;
// Guest address used by the memory-operand tests below: they load it into RAX
// (`mov rax, imm64`) and write the operand bytes there before running.
const ALIGNED_ADDR: u64 = 0x3000;
// Second guest address, 0x100 bytes above ALIGNED_ADDR.
// NOTE(review): not referenced by any test visible in this section — confirm it is still needed.
const ALIGNED_ADDR2: u64 = 0x3100;
/// Smoke test for `vpmullw ymm0, ymm1, ymm2`.
///
/// No register contents are set up by the test; the only check is that
/// `run` completes and its result unwraps.
#[test]
fn test_vpmullw_ymm0_ymm1_ymm2_all_zeros() {
    // c5 f5 d5 c2 = vpmullw ymm0, ymm1, ymm2 ; f4 = hlt
    let program = [0xc5, 0xf5, 0xd5, 0xc2, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm3, ymm4, ymm5`.
///
/// The test does not initialise any registers; it passes when `run`
/// returns a value that unwraps.
#[test]
fn test_vpmullw_ymm3_ymm4_ymm5_all_ones() {
    // c5 dd d5 dd = vpmullw ymm3, ymm4, ymm5 ; f4 = hlt
    let program = [0xc5, 0xdd, 0xd5, 0xdd, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm6, ymm7, ymm8`.
///
/// The previous byte sequence (`c5 45 d5 f0`) used the 2-byte VEX prefix with
/// the inverted R bit cleared, which decodes as `vpmullw ymm14, ymm7, ymm0`.
/// Addressing ymm8 in ModRM.rm needs VEX.B, which only the 3-byte VEX prefix
/// carries, so the instruction is now encoded with `c4`.
///
/// No register contents are set up; the only check is that `run` unwraps.
#[test]
fn test_vpmullw_ymm6_ymm7_ymm8_by_two() {
    let mut emu = emu64();
    let code = [
        // VEX3: c4, then c1 = ~R=1 ~X=1 ~B=0 map=0F, then 45 = W=0 vvvv=~ymm7 L=1 pp=66
        0xc4, 0xc1, 0x45,
        // opcode D5 (pmullw), ModRM f0 = mod 11, reg 6 (ymm6), rm 0 (+B => ymm8)
        0xd5, 0xf0,
        // hlt
        0xf4,
    ];
    emu.load_code_bytes(&code);
    emu.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm9, ymm10, ymm11` (3-byte VEX, all operands in ymm8+).
///
/// Registers are left as `emu64()` created them; success means `run` unwrapped.
#[test]
fn test_vpmullw_ymm9_ymm10_ymm11_overflow() {
    // c4 41 2d d5 cb = vpmullw ymm9, ymm10, ymm11 ; f4 = hlt
    let program = [0xc4, 0x41, 0x2d, 0xd5, 0xcb, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm12, ymm13, ymm14`.
///
/// Nothing is asserted about the result; the test only requires `run` to unwrap.
#[test]
fn test_vpmullw_ymm12_ymm13_ymm14_mixed() {
    // c4 41 15 d5 e6 = vpmullw ymm12, ymm13, ymm14 ; f4 = hlt
    let program = [0xc4, 0x41, 0x15, 0xd5, 0xe6, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm15, ymm0, ymm1` (high destination register).
///
/// The previous bytes (`c4 c1 7d d5 f9`) set VEX.B instead of VEX.R, which
/// decodes as `vpmullw ymm7, ymm0, ymm9`. Only ModRM.reg needs extending here,
/// so the 2-byte VEX form with the inverted R bit cleared is sufficient.
///
/// No register contents are set up; the only check is that `run` unwraps.
#[test]
fn test_vpmullw_ymm15_ymm0_ymm1_high_reg() {
    let mut emu = emu64();
    let code = [
        // VEX2: c5, then 7d = ~R=0 (reg += 8), vvvv=~ymm0, L=1, pp=66
        0xc5, 0x7d,
        // opcode D5 (pmullw), ModRM f9 = mod 11, reg 7 (+R => ymm15), rm 1 (ymm1)
        0xd5, 0xf9,
        // hlt
        0xf4,
    ];
    emu.load_code_bytes(&code);
    emu.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm0, ymm1, [rax]` with RAX pointing at `ALIGNED_ADDR`.
///
/// The memory operand is filled with the little-endian words 0..16 after the
/// code is loaded. Only successful completion of `run` is checked.
#[test]
fn test_vpmullw_ymm0_ymm1_mem() {
    // mov rax, ALIGNED_ADDR
    let mut program = vec![0x48u8, 0xb8];
    program.extend_from_slice(&ALIGNED_ADDR.to_le_bytes());
    // vpmullw ymm0, ymm1, [rax] ; hlt
    program.extend_from_slice(&[0xc5, 0xf5, 0xd5, 0x00, 0xf4]);

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    let words: Vec<u8> = (0u16..16).flat_map(u16::to_le_bytes).collect();
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &words);

    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm2, ymm3, [rax]` where the memory operand is all 0xFF bytes.
///
/// RAX is loaded with `ALIGNED_ADDR`; the test passes when `run` unwraps.
#[test]
fn test_vpmullw_ymm2_ymm3_mem_max_values() {
    // mov rax, ALIGNED_ADDR
    let mut program = vec![0x48u8, 0xb8];
    program.extend_from_slice(&ALIGNED_ADDR.to_le_bytes());
    // vpmullw ymm2, ymm3, [rax] ; hlt
    program.extend_from_slice(&[0xc5, 0xe5, 0xd5, 0x10, 0xf4]);

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    // Every word of the memory operand is 0xFFFF.
    let all_ones = [0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF];
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &all_ones);

    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm4, ymm5, [rax]` with a memory operand holding
/// the sixteen words 1 << 0 through 1 << 15 (little-endian).
///
/// Only successful completion of `run` is checked.
#[test]
fn test_vpmullw_ymm4_ymm5_mem_powers_of_two() {
    // mov rax, ALIGNED_ADDR ; vpmullw ymm4, ymm5, [rax] ; hlt
    let program = [
        &[0x48u8, 0xb8][..],
        &ALIGNED_ADDR.to_le_bytes()[..],
        &[0xc5, 0xd5, 0xd5, 0x20, 0xf4][..],
    ]
    .concat();

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    let mut operand: Vec<u8> = Vec::new();
    for bit in 0u32..16 {
        operand.extend_from_slice(&(1u16 << bit).to_le_bytes());
    }
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &operand);

    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm6, ymm7, [rax]` with the words 1..=16 in memory.
///
/// The previous VEX byte (`0x45`) had the inverted R bit cleared, so the
/// instruction decoded as `vpmullw ymm14, ymm7, [rax]`. The destination is
/// ymm6, which needs no extension, so the byte is now `0xc5`.
///
/// RAX is loaded with `ALIGNED_ADDR`; only completion of `run` is checked.
#[test]
fn test_vpmullw_ymm6_ymm7_mem_sequential() {
    let mut emu = emu64();
    // mov rax, imm64
    let code = [0x48, 0xb8];
    let mut full_code = code.to_vec();
    full_code.extend_from_slice(&ALIGNED_ADDR.to_le_bytes());
    full_code.extend_from_slice(&[
        // VEX2: c5, then c5 = ~R=1, vvvv=~ymm7, L=1, pp=66
        0xc5, 0xc5,
        // opcode D5 (pmullw), ModRM 30 = mod 00, reg 6 (ymm6), rm 0 ([rax])
        0xd5, 0x30,
        // hlt
        0xf4,
    ]);
    emu.load_code_bytes(&full_code);
    let data: Vec<u8> = (1..=16).flat_map(|i| (i as u16).to_le_bytes()).collect();
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &data);
    emu.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm0, ymm1, ymm2`.
///
/// The test body sets no register values, so the "small values" in the name are
/// not established here. Success means `run` unwrapped.
#[test]
fn test_vpmullw_ymm0_ymm1_ymm2_small_values() {
    // c5 f5 d5 c2 = vpmullw ymm0, ymm1, ymm2 ; f4 = hlt
    let program = [0xc5, 0xf5, 0xd5, 0xc2, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm3, ymm4, ymm5`.
///
/// No operand values are written by the test; it only requires `run` to unwrap.
#[test]
fn test_vpmullw_ymm3_ymm4_ymm5_negative_representation() {
    // c5 dd d5 dd = vpmullw ymm3, ymm4, ymm5 ; f4 = hlt
    let program = [0xc5, 0xdd, 0xd5, 0xdd, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm8, ymm9, ymm10`.
///
/// Registers are not initialised by the test; it passes when `run` unwraps.
#[test]
fn test_vpmullw_ymm8_ymm9_ymm10_alternating() {
    // c4 41 35 d5 c2 = vpmullw ymm8, ymm9, ymm10 ; f4 = hlt
    let program = [0xc4, 0x41, 0x35, 0xd5, 0xc2, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm11, ymm12, ymm13`.
///
/// The only check is that `run` returns something that unwraps.
#[test]
fn test_vpmullw_ymm11_ymm12_ymm13_pattern() {
    // c4 41 1d d5 dd = vpmullw ymm11, ymm12, ymm13 ; f4 = hlt
    let program = [0xc4, 0x41, 0x1d, 0xd5, 0xdd, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test running two dependent `vpmullw` instructions back to back:
/// the second multiplies the first one's destination (ymm0) by ymm3.
///
/// Only successful completion of `run` is checked.
#[test]
fn test_vpmullw_chain_operations() {
    let program = [
        // vpmullw ymm0, ymm1, ymm2
        0xc5, 0xf5, 0xd5, 0xc2,
        // vpmullw ymm0, ymm0, ymm3
        0xc5, 0xfd, 0xd5, 0xc3,
        // hlt
        0xf4,
    ];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm0, ymm1, [rax]` with a memory operand that
/// alternates the words 0x000A and 0x0005 (sixteen words, starting with 0x000A).
///
/// RAX is loaded with `ALIGNED_ADDR`; only completion of `run` is checked.
#[test]
fn test_vpmullw_mem_different_patterns() {
    // mov rax, ALIGNED_ADDR
    let mut program = vec![0x48u8, 0xb8];
    program.extend_from_slice(&ALIGNED_ADDR.to_le_bytes());
    // vpmullw ymm0, ymm1, [rax] ; hlt
    program.extend_from_slice(&[0xc5, 0xf5, 0xd5, 0x00, 0xf4]);

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    let alternating: Vec<u8> = [0x000Au16, 0x0005u16]
        .iter()
        .cycle()
        .take(16)
        .flat_map(|word| word.to_le_bytes())
        .collect();
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &alternating);

    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm0, ymm1, [rax]` where every word of the memory
/// operand is 0x8000.
///
/// RAX is loaded with `ALIGNED_ADDR`; the test passes when `run` unwraps.
#[test]
fn test_vpmullw_mem_large_multipliers() {
    // mov rax, ALIGNED_ADDR ; vpmullw ymm0, ymm1, [rax] ; hlt
    let program = [
        &[0x48u8, 0xb8][..],
        &ALIGNED_ADDR.to_le_bytes()[..],
        &[0xc5, 0xf5, 0xd5, 0x00, 0xf4][..],
    ]
    .concat();

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    // Sixteen copies of the little-endian word 0x8000.
    let operand: Vec<u8> = 0x8000u16.to_le_bytes().repeat(16);
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &operand);

    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm0, ymm1, ymm2`.
///
/// No register contents are set up by the test; the only check is that
/// `run` completes and its result unwraps.
#[test]
fn test_vpmulld_ymm0_ymm1_ymm2_all_zeros() {
    // c4 e2 75 40 c2 = vpmulld ymm0, ymm1, ymm2 ; f4 = hlt
    let program = [0xc4, 0xe2, 0x75, 0x40, 0xc2, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm3, ymm4, ymm5`.
///
/// The test does not initialise any registers; it passes when `run` unwraps.
#[test]
fn test_vpmulld_ymm3_ymm4_ymm5_all_ones() {
    // c4 e2 5d 40 dd = vpmulld ymm3, ymm4, ymm5 ; f4 = hlt
    let program = [0xc4, 0xe2, 0x5d, 0x40, 0xdd, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm6, ymm7, ymm8` (VEX.B extends the r/m operand to ymm8).
///
/// Registers are left as `emu64()` created them; success means `run` unwrapped.
#[test]
fn test_vpmulld_ymm6_ymm7_ymm8_by_two() {
    // c4 c2 45 40 f0 = vpmulld ymm6, ymm7, ymm8 ; f4 = hlt
    let program = [0xc4, 0xc2, 0x45, 0x40, 0xf0, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm9, ymm10, ymm11`.
///
/// Nothing is asserted about the product; the test only requires `run` to unwrap.
#[test]
fn test_vpmulld_ymm9_ymm10_ymm11_overflow() {
    // c4 42 2d 40 cb = vpmulld ymm9, ymm10, ymm11 ; f4 = hlt
    let program = [0xc4, 0x42, 0x2d, 0x40, 0xcb, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm12, ymm13, ymm14`.
///
/// The only check is that `run` returns something that unwraps.
#[test]
fn test_vpmulld_ymm12_ymm13_ymm14_mixed() {
    // c4 42 15 40 e6 = vpmulld ymm12, ymm13, ymm14 ; f4 = hlt
    let program = [0xc4, 0x42, 0x15, 0x40, 0xe6, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm15, ymm0, ymm1` (high destination register).
///
/// The previous second VEX byte (`0xc2`) set VEX.B instead of VEX.R, which
/// decodes as `vpmulld ymm7, ymm0, ymm9`. The byte is now `0x62` so that
/// ModRM.reg is extended (ymm15) and ModRM.rm is not (ymm1).
///
/// No register contents are set up; the only check is that `run` unwraps.
#[test]
fn test_vpmulld_ymm15_ymm0_ymm1_high_reg() {
    let mut emu = emu64();
    let code = [
        // VEX3: c4, then 62 = ~R=0 (reg += 8) ~X=1 ~B=1 map=0F38, then 7d = W=0 vvvv=~ymm0 L=1 pp=66
        0xc4, 0x62, 0x7d,
        // opcode 40 (pmulld), ModRM f9 = mod 11, reg 7 (+R => ymm15), rm 1 (ymm1)
        0x40, 0xf9,
        // hlt
        0xf4,
    ];
    emu.load_code_bytes(&code);
    emu.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm0, ymm1, [rax]` with RAX pointing at `ALIGNED_ADDR`.
///
/// The memory operand is filled with the little-endian dwords 0..8 after the
/// code is loaded. Only successful completion of `run` is checked.
#[test]
fn test_vpmulld_ymm0_ymm1_mem() {
    // mov rax, ALIGNED_ADDR
    let mut program = vec![0x48u8, 0xb8];
    program.extend_from_slice(&ALIGNED_ADDR.to_le_bytes());
    // vpmulld ymm0, ymm1, [rax] ; hlt
    program.extend_from_slice(&[0xc4, 0xe2, 0x75, 0x40, 0x00, 0xf4]);

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    let dwords: Vec<u8> = (0u32..8).flat_map(u32::to_le_bytes).collect();
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &dwords);

    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm2, ymm3, [rax]` where the memory operand is all 0xFF bytes.
///
/// RAX is loaded with `ALIGNED_ADDR`; the test passes when `run` unwraps.
#[test]
fn test_vpmulld_ymm2_ymm3_mem_max_values() {
    // mov rax, ALIGNED_ADDR
    let mut program = vec![0x48u8, 0xb8];
    program.extend_from_slice(&ALIGNED_ADDR.to_le_bytes());
    // vpmulld ymm2, ymm3, [rax] ; hlt
    program.extend_from_slice(&[0xc4, 0xe2, 0x65, 0x40, 0x10, 0xf4]);

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    // Every dword of the memory operand is 0xFFFF_FFFF.
    let all_ones = [0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF];
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &all_ones);

    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm4, ymm5, [rax]` with a memory operand holding
/// the eight dwords 1 << 0 through 1 << 7 (little-endian).
///
/// Only successful completion of `run` is checked.
#[test]
fn test_vpmulld_ymm4_ymm5_mem_powers_of_two() {
    // mov rax, ALIGNED_ADDR ; vpmulld ymm4, ymm5, [rax] ; hlt
    let program = [
        &[0x48u8, 0xb8][..],
        &ALIGNED_ADDR.to_le_bytes()[..],
        &[0xc4, 0xe2, 0x55, 0x40, 0x20, 0xf4][..],
    ]
    .concat();

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    let mut operand: Vec<u8> = Vec::new();
    for bit in 0u32..8 {
        operand.extend_from_slice(&(1u32 << bit).to_le_bytes());
    }
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &operand);

    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm6, ymm7, [rax]` with the dwords 1..=8 in memory.
///
/// The previous second VEX byte (`0xc2`) set VEX.B, which turns the memory
/// operand into `[r8]` even though the test only loads RAX with
/// `ALIGNED_ADDR`. The byte is now `0xe2` (no register extensions), so the
/// instruction reads the data written below.
///
/// Only successful completion of `run` is checked.
#[test]
fn test_vpmulld_ymm6_ymm7_mem_sequential() {
    let mut emu = emu64();
    // mov rax, imm64
    let code = [0x48, 0xb8];
    let mut full_code = code.to_vec();
    full_code.extend_from_slice(&ALIGNED_ADDR.to_le_bytes());
    full_code.extend_from_slice(&[
        // VEX3: c4, then e2 = ~R=1 ~X=1 ~B=1 map=0F38, then 45 = W=0 vvvv=~ymm7 L=1 pp=66
        0xc4, 0xe2, 0x45,
        // opcode 40 (pmulld), ModRM 30 = mod 00, reg 6 (ymm6), rm 0 ([rax])
        0x40, 0x30,
        // hlt
        0xf4,
    ]);
    emu.load_code_bytes(&full_code);
    let data: Vec<u8> = (1..=8).flat_map(|i| (i as u32).to_le_bytes()).collect();
    emu.maps.write_bytes_slice(ALIGNED_ADDR, &data);
    emu.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm0, ymm1, ymm2`.
///
/// The test body sets no register values, so the "small values" in the name are
/// not established here. Success means `run` unwrapped.
#[test]
fn test_vpmulld_ymm0_ymm1_ymm2_small_values() {
    // c4 e2 75 40 c2 = vpmulld ymm0, ymm1, ymm2 ; f4 = hlt
    let program = [0xc4, 0xe2, 0x75, 0x40, 0xc2, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm3, ymm4, ymm5`.
///
/// No operand values are written by the test; it only requires `run` to unwrap.
#[test]
fn test_vpmulld_ymm3_ymm4_ymm5_negative_representation() {
    // c4 e2 5d 40 dd = vpmulld ymm3, ymm4, ymm5 ; f4 = hlt
    let program = [0xc4, 0xe2, 0x5d, 0x40, 0xdd, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm8, ymm9, ymm10`.
///
/// Registers are not initialised by the test; it passes when `run` unwraps.
#[test]
fn test_vpmulld_ymm8_ymm9_ymm10_alternating() {
    // c4 42 35 40 c2 = vpmulld ymm8, ymm9, ymm10 ; f4 = hlt
    let program = [0xc4, 0x42, 0x35, 0x40, 0xc2, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm11, ymm12, ymm13`.
///
/// The only check is that `run` returns something that unwraps.
#[test]
fn test_vpmulld_ymm11_ymm12_ymm13_pattern() {
    // c4 42 1d 40 dd = vpmulld ymm11, ymm12, ymm13 ; f4 = hlt
    let program = [0xc4, 0x42, 0x1d, 0x40, 0xdd, 0xf4];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test running two dependent `vpmulld` instructions back to back:
/// the second multiplies the first one's destination (ymm0) by ymm3.
///
/// Only successful completion of `run` is checked.
#[test]
fn test_vpmulld_chain_operations() {
    let program = [
        // vpmulld ymm0, ymm1, ymm2
        0xc4, 0xe2, 0x75, 0x40, 0xc2,
        // vpmulld ymm0, ymm0, ymm3
        0xc4, 0xe2, 0x7d, 0x40, 0xc3,
        // hlt
        0xf4,
    ];

    let mut machine = emu64();
    machine.load_code_bytes(&program);
    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm0, ymm1, [rax]` with a memory operand that
/// alternates the dwords 10 and 5 (eight dwords, starting with 10).
///
/// RAX is loaded with `ALIGNED_ADDR`; only completion of `run` is checked.
#[test]
fn test_vpmulld_mem_different_patterns() {
    // mov rax, ALIGNED_ADDR
    let mut program = vec![0x48u8, 0xb8];
    program.extend_from_slice(&ALIGNED_ADDR.to_le_bytes());
    // vpmulld ymm0, ymm1, [rax] ; hlt
    program.extend_from_slice(&[0xc4, 0xe2, 0x75, 0x40, 0x00, 0xf4]);

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    let alternating: Vec<u8> = [10u32, 5u32]
        .iter()
        .cycle()
        .take(8)
        .flat_map(|dword| dword.to_le_bytes())
        .collect();
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &alternating);

    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm0, ymm1, [rax]` where every dword of the memory
/// operand is 0x8000_0000.
///
/// RAX is loaded with `ALIGNED_ADDR`; the test passes when `run` unwraps.
#[test]
fn test_vpmulld_mem_large_multipliers() {
    // mov rax, ALIGNED_ADDR ; vpmulld ymm0, ymm1, [rax] ; hlt
    let program = [
        &[0x48u8, 0xb8][..],
        &ALIGNED_ADDR.to_le_bytes()[..],
        &[0xc4, 0xe2, 0x75, 0x40, 0x00, 0xf4][..],
    ]
    .concat();

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    // Eight copies of the little-endian dword 0x80000000.
    let operand: Vec<u8> = 0x80000000u32.to_le_bytes().repeat(8);
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &operand);

    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm0, ymm1, [rax]` with the first eight primes
/// stored as little-endian dwords at `ALIGNED_ADDR`.
///
/// Only successful completion of `run` is checked.
#[test]
fn test_vpmulld_mem_prime_numbers() {
    // mov rax, ALIGNED_ADDR
    let mut program = vec![0x48u8, 0xb8];
    program.extend_from_slice(&ALIGNED_ADDR.to_le_bytes());
    // vpmulld ymm0, ymm1, [rax] ; hlt
    program.extend_from_slice(&[0xc4, 0xe2, 0x75, 0x40, 0x00, 0xf4]);

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    let mut operand: Vec<u8> = Vec::new();
    for prime in [2u32, 3, 5, 7, 11, 13, 17, 19].iter() {
        operand.extend_from_slice(&prime.to_le_bytes());
    }
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &operand);

    machine.run(None).unwrap();
}
/// Smoke test for `vpmullw ymm0, ymm1, [rax]` with RAX set to `ALIGNED_ADDR + 2`,
/// i.e. a memory operand that does not start on the base address.
///
/// A run of 0x03 bytes is written starting at `ALIGNED_ADDR` itself. Only
/// successful completion of `run` is checked.
#[test]
fn test_vpmullw_mem_unaligned() {
    let operand_addr = ALIGNED_ADDR + 2;

    // mov rax, ALIGNED_ADDR + 2
    let mut program = vec![0x48u8, 0xb8];
    program.extend_from_slice(&operand_addr.to_le_bytes());
    // vpmullw ymm0, ymm1, [rax] ; hlt
    program.extend_from_slice(&[0xc5, 0xf5, 0xd5, 0x00, 0xf4]);

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    let fill = [0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03, 0x03];
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &fill);

    machine.run(None).unwrap();
}
/// Smoke test for `vpmulld ymm0, ymm1, [rax]` with RAX set to `ALIGNED_ADDR + 4`,
/// i.e. a memory operand that does not start on the base address.
///
/// A run of 0x02 bytes is written starting at `ALIGNED_ADDR` itself. Only
/// successful completion of `run` is checked.
#[test]
fn test_vpmulld_mem_unaligned() {
    let operand_addr = ALIGNED_ADDR + 4;

    // mov rax, ALIGNED_ADDR + 4
    let mut program = vec![0x48u8, 0xb8];
    program.extend_from_slice(&operand_addr.to_le_bytes());
    // vpmulld ymm0, ymm1, [rax] ; hlt
    program.extend_from_slice(&[0xc4, 0xe2, 0x75, 0x40, 0x00, 0xf4]);

    let mut machine = emu64();
    machine.load_code_bytes(&program);

    let fill = [0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02];
    machine.maps.write_bytes_slice(ALIGNED_ADDR, &fill);

    machine.run(None).unwrap();
}