1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
use stdsimd::vendor::*;
use vecs::{u8x64, u8x32, u8x16, i8x64, i8x32, i8x16, u16x32, u16x16, u16x8, i16x32, i16x16, i16x8, u32x16, u32x8, u32x4, i32x16, i32x8, i32x4, f32x16, f32x8, f32x4, u64x8, u64x4, u64x2, i64x8, i64x4, i64x2, f64x8, f64x4, f64x2};
pub trait PackedSqrt {
fn sqrt(&self) -> Self;
}
rust_fallback_impl! {
impl PackedSqrt for f32x8 where "avx" {
sqrt => _mm256_sqrt_ps(), [0, 1, 2, 3, 4, 5, 6, 7];
}
}
rust_fallback_impl! {
impl PackedSqrt for f64x4 where "avx" {
sqrt => _mm256_sqrt_pd(), [0, 1, 2, 3];
}
}
rust_fallback_impl! {
impl PackedSqrt for f32x4 where "sse" {
sqrt => _mm_sqrt_ps(), [0, 1, 2, 3];
}
}
rust_fallback_impl! {
impl PackedSqrt for f64x2 where "sse2" {
sqrt => _mm_sqrt_pd(), [0, 1];
}
}
#[cfg(test)]
mod tests {
use vecs::*;
use intrin::*;
#[test]
fn sqrt_f64s() {
assert_eq!(f64s::splat(1.0).sqrt(), f64s::splat(1.0));
assert!(f64s::splat(9.0).sqrt().max(f64s::splat(2.999)) == f64s::splat(9.0).sqrt());
assert!(f64s::splat(9.0).sqrt().min(f64s::splat(3.001)) == f64s::splat(9.0).sqrt());
}
#[test]
fn sqrt_f32s() {
assert_eq!(f32s::splat(1.0).sqrt(), f32s::splat(1.0));
assert!(f32s::splat(9.0).sqrt().max(f32s::splat(2.999)) == f32s::splat(9.0).sqrt());
assert!(f32s::splat(9.0).sqrt().min(f32s::splat(3.001)) == f32s::splat(9.0).sqrt());
}
}