105 lines
2.7 KiB
Rust
105 lines
2.7 KiB
Rust
//@ run-pass
|
|
//@ ignore-emscripten FIXME(#45351) hits an LLVM assert
|
|
|
|
#![feature(repr_simd, intrinsics, concat_idents)]
|
|
#![allow(non_camel_case_types)]
|
|
|
|
#[repr(simd)]
|
|
#[derive(Copy, Clone)]
|
|
struct i32x4([i32; 4]);
|
|
#[repr(simd)]
|
|
#[derive(Copy, Clone)]
|
|
struct u32x4(pub [u32; 4]);
|
|
#[repr(simd)]
|
|
#[derive(Copy, Clone)]
|
|
struct f32x4(pub [f32; 4]);
|
|
|
|
extern "rust-intrinsic" {
|
|
fn simd_eq<T, U>(x: T, y: T) -> U;
|
|
fn simd_ne<T, U>(x: T, y: T) -> U;
|
|
fn simd_lt<T, U>(x: T, y: T) -> U;
|
|
fn simd_le<T, U>(x: T, y: T) -> U;
|
|
fn simd_gt<T, U>(x: T, y: T) -> U;
|
|
fn simd_ge<T, U>(x: T, y: T) -> U;
|
|
}
|
|
|
|
macro_rules! cmp {
|
|
($method: ident($lhs: expr, $rhs: expr)) => {{
|
|
let lhs = $lhs;
|
|
let rhs = $rhs;
|
|
let e: u32x4 = concat_idents!(simd_, $method)($lhs, $rhs);
|
|
// assume the scalar version is correct/the behaviour we want.
|
|
assert!((e.0[0] != 0) == lhs.0[0] .$method(&rhs.0[0]));
|
|
assert!((e.0[1] != 0) == lhs.0[1] .$method(&rhs.0[1]));
|
|
assert!((e.0[2] != 0) == lhs.0[2] .$method(&rhs.0[2]));
|
|
assert!((e.0[3] != 0) == lhs.0[3] .$method(&rhs.0[3]));
|
|
}}
|
|
}
|
|
macro_rules! tests {
|
|
($($lhs: ident, $rhs: ident;)*) => {{
|
|
$(
|
|
(|| {
|
|
cmp!(eq($lhs, $rhs));
|
|
cmp!(ne($lhs, $rhs));
|
|
|
|
// test both directions
|
|
cmp!(lt($lhs, $rhs));
|
|
cmp!(lt($rhs, $lhs));
|
|
|
|
cmp!(le($lhs, $rhs));
|
|
cmp!(le($rhs, $lhs));
|
|
|
|
cmp!(gt($lhs, $rhs));
|
|
cmp!(gt($rhs, $lhs));
|
|
|
|
cmp!(ge($lhs, $rhs));
|
|
cmp!(ge($rhs, $lhs));
|
|
})();
|
|
)*
|
|
}}
|
|
}
|
|
fn main() {
|
|
// 13 vs. -100 tests that we get signed vs. unsigned comparisons
|
|
// correct (i32: 13 > -100, u32: 13 < -100). let i1 = i32x4(10, -11, 12, 13);
|
|
let i1 = i32x4([10, -11, 12, 13]);
|
|
let i2 = i32x4([5, -5, 20, -100]);
|
|
let i3 = i32x4([10, -11, 20, -100]);
|
|
|
|
let u1 = u32x4([10, !11+1, 12, 13]);
|
|
let u2 = u32x4([5, !5+1, 20, !100+1]);
|
|
let u3 = u32x4([10, !11+1, 20, !100+1]);
|
|
|
|
let f1 = f32x4([10.0, -11.0, 12.0, 13.0]);
|
|
let f2 = f32x4([5.0, -5.0, 20.0, -100.0]);
|
|
let f3 = f32x4([10.0, -11.0, 20.0, -100.0]);
|
|
|
|
unsafe {
|
|
tests! {
|
|
i1, i1;
|
|
u1, u1;
|
|
f1, f1;
|
|
|
|
i1, i2;
|
|
u1, u2;
|
|
f1, f2;
|
|
|
|
i1, i3;
|
|
u1, u3;
|
|
f1, f3;
|
|
}
|
|
}
|
|
|
|
// NAN comparisons are special:
|
|
// -11 (*) 13
|
|
// -5 -100 (*)
|
|
let f4 = f32x4([f32::NAN, f1.0[1], f32::NAN, f2.0[3]]);
|
|
|
|
unsafe {
|
|
tests! {
|
|
f1, f4;
|
|
f2, f4;
|
|
f4, f4;
|
|
}
|
|
}
|
|
}
|