Auto merge of #3204 - RalfJung:simd, r=RalfJung
add new SIMD intrinsics
This commit is contained in:
commit
28f9fe3262
@ -1,6 +1,7 @@
|
|||||||
use rustc_apfloat::{Float, Round};
|
use rustc_apfloat::{Float, Round};
|
||||||
use rustc_middle::ty::layout::{HasParamEnv, LayoutOf};
|
use rustc_middle::ty::layout::{HasParamEnv, LayoutOf};
|
||||||
use rustc_middle::{mir, ty, ty::FloatTy};
|
use rustc_middle::{mir, ty, ty::FloatTy};
|
||||||
|
use rustc_span::{sym, Symbol};
|
||||||
use rustc_target::abi::{Endian, HasDataLayout};
|
use rustc_target::abi::{Endian, HasDataLayout};
|
||||||
|
|
||||||
use crate::*;
|
use crate::*;
|
||||||
@ -25,7 +26,12 @@ fn emulate_simd_intrinsic(
|
|||||||
| "floor"
|
| "floor"
|
||||||
| "round"
|
| "round"
|
||||||
| "trunc"
|
| "trunc"
|
||||||
| "fsqrt" => {
|
| "fsqrt"
|
||||||
|
| "ctlz"
|
||||||
|
| "cttz"
|
||||||
|
| "bswap"
|
||||||
|
| "bitreverse"
|
||||||
|
=> {
|
||||||
let [op] = check_arg_count(args)?;
|
let [op] = check_arg_count(args)?;
|
||||||
let (op, op_len) = this.operand_to_simd(op)?;
|
let (op, op_len) = this.operand_to_simd(op)?;
|
||||||
let (dest, dest_len) = this.place_to_simd(dest)?;
|
let (dest, dest_len) = this.place_to_simd(dest)?;
|
||||||
@ -38,6 +44,7 @@ enum Op {
|
|||||||
Abs,
|
Abs,
|
||||||
Sqrt,
|
Sqrt,
|
||||||
Round(rustc_apfloat::Round),
|
Round(rustc_apfloat::Round),
|
||||||
|
Numeric(Symbol),
|
||||||
}
|
}
|
||||||
let which = match intrinsic_name {
|
let which = match intrinsic_name {
|
||||||
"neg" => Op::MirOp(mir::UnOp::Neg),
|
"neg" => Op::MirOp(mir::UnOp::Neg),
|
||||||
@ -47,6 +54,10 @@ enum Op {
|
|||||||
"floor" => Op::Round(rustc_apfloat::Round::TowardNegative),
|
"floor" => Op::Round(rustc_apfloat::Round::TowardNegative),
|
||||||
"round" => Op::Round(rustc_apfloat::Round::NearestTiesToAway),
|
"round" => Op::Round(rustc_apfloat::Round::NearestTiesToAway),
|
||||||
"trunc" => Op::Round(rustc_apfloat::Round::TowardZero),
|
"trunc" => Op::Round(rustc_apfloat::Round::TowardZero),
|
||||||
|
"ctlz" => Op::Numeric(sym::ctlz),
|
||||||
|
"cttz" => Op::Numeric(sym::cttz),
|
||||||
|
"bswap" => Op::Numeric(sym::bswap),
|
||||||
|
"bitreverse" => Op::Numeric(sym::bitreverse),
|
||||||
_ => unreachable!(),
|
_ => unreachable!(),
|
||||||
};
|
};
|
||||||
|
|
||||||
@ -101,6 +112,20 @@ enum Op {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
Op::Numeric(name) => {
|
||||||
|
assert!(op.layout.ty.is_integral());
|
||||||
|
let size = op.layout.size;
|
||||||
|
let bits = op.to_scalar().to_bits(size).unwrap();
|
||||||
|
let extra = 128u128.checked_sub(u128::from(size.bits())).unwrap();
|
||||||
|
let bits_out = match name {
|
||||||
|
sym::ctlz => u128::from(bits.leading_zeros()).checked_sub(extra).unwrap(),
|
||||||
|
sym::cttz => u128::from((bits << extra).trailing_zeros()).checked_sub(extra).unwrap(),
|
||||||
|
sym::bswap => (bits << extra).swap_bytes(),
|
||||||
|
sym::bitreverse => (bits << extra).reverse_bits(),
|
||||||
|
_ => unreachable!(),
|
||||||
|
};
|
||||||
|
Scalar::from_uint(bits_out, size)
|
||||||
|
}
|
||||||
};
|
};
|
||||||
this.write_scalar(val, &dest)?;
|
this.write_scalar(val, &dest)?;
|
||||||
}
|
}
|
||||||
@ -126,7 +151,8 @@ enum Op {
|
|||||||
| "fmin"
|
| "fmin"
|
||||||
| "saturating_add"
|
| "saturating_add"
|
||||||
| "saturating_sub"
|
| "saturating_sub"
|
||||||
| "arith_offset" => {
|
| "arith_offset"
|
||||||
|
=> {
|
||||||
use mir::BinOp;
|
use mir::BinOp;
|
||||||
|
|
||||||
let [left, right] = check_arg_count(args)?;
|
let [left, right] = check_arg_count(args)?;
|
||||||
@ -386,7 +412,6 @@ enum Op {
|
|||||||
let (dest, dest_len) = this.place_to_simd(dest)?;
|
let (dest, dest_len) = this.place_to_simd(dest)?;
|
||||||
let bitmask_len = dest_len.max(8);
|
let bitmask_len = dest_len.max(8);
|
||||||
|
|
||||||
assert!(mask.layout.ty.is_integral());
|
|
||||||
assert!(bitmask_len <= 64);
|
assert!(bitmask_len <= 64);
|
||||||
assert_eq!(bitmask_len, mask.layout.size.bits());
|
assert_eq!(bitmask_len, mask.layout.size.bits());
|
||||||
assert_eq!(dest_len, yes_len);
|
assert_eq!(dest_len, yes_len);
|
||||||
@ -394,8 +419,18 @@ enum Op {
|
|||||||
let dest_len = u32::try_from(dest_len).unwrap();
|
let dest_len = u32::try_from(dest_len).unwrap();
|
||||||
let bitmask_len = u32::try_from(bitmask_len).unwrap();
|
let bitmask_len = u32::try_from(bitmask_len).unwrap();
|
||||||
|
|
||||||
let mask: u64 =
|
// The mask can be a single integer or an array.
|
||||||
this.read_scalar(mask)?.to_bits(mask.layout.size)?.try_into().unwrap();
|
let mask: u64 = match mask.layout.ty.kind() {
|
||||||
|
ty::Int(..) | ty::Uint(..) =>
|
||||||
|
this.read_scalar(mask)?.to_bits(mask.layout.size)?.try_into().unwrap(),
|
||||||
|
ty::Array(elem, _) if matches!(elem.kind(), ty::Uint(ty::UintTy::U8)) => {
|
||||||
|
let mask_ty = this.machine.layouts.uint(mask.layout.size).unwrap();
|
||||||
|
let mask = mask.transmute(mask_ty, this)?;
|
||||||
|
this.read_scalar(&mask)?.to_bits(mask_ty.size)?.try_into().unwrap()
|
||||||
|
}
|
||||||
|
_ => bug!("simd_select_bitmask: invalid mask type {}", mask.layout.ty),
|
||||||
|
};
|
||||||
|
|
||||||
for i in 0..dest_len {
|
for i in 0..dest_len {
|
||||||
let mask = mask
|
let mask = mask
|
||||||
& 1u64
|
& 1u64
|
||||||
|
@ -197,6 +197,24 @@ fn simd_ops_i32() {
|
|||||||
assert_eq!(b.reduce_or(), -1);
|
assert_eq!(b.reduce_or(), -1);
|
||||||
assert_eq!(a.reduce_xor(), 0);
|
assert_eq!(a.reduce_xor(), 0);
|
||||||
assert_eq!(b.reduce_xor(), -4);
|
assert_eq!(b.reduce_xor(), -4);
|
||||||
|
|
||||||
|
assert_eq!(b.leading_zeros(), u32x4::from_array([31, 30, 30, 0]));
|
||||||
|
assert_eq!(b.trailing_zeros(), u32x4::from_array([0, 1, 0, 2]));
|
||||||
|
assert_eq!(b.leading_ones(), u32x4::from_array([0, 0, 0, 30]));
|
||||||
|
assert_eq!(b.trailing_ones(), u32x4::from_array([1, 0, 2, 0]));
|
||||||
|
assert_eq!(
|
||||||
|
b.swap_bytes(),
|
||||||
|
i32x4::from_array([0x01000000, 0x02000000, 0x03000000, 0xfcffffffu32 as i32])
|
||||||
|
);
|
||||||
|
assert_eq!(
|
||||||
|
b.reverse_bits(),
|
||||||
|
i32x4::from_array([
|
||||||
|
0x80000000u32 as i32,
|
||||||
|
0x40000000,
|
||||||
|
0xc0000000u32 as i32,
|
||||||
|
0x3fffffffu32 as i32
|
||||||
|
])
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
fn simd_mask() {
|
fn simd_mask() {
|
||||||
@ -247,6 +265,22 @@ fn simd_mask() {
|
|||||||
assert_eq!(bitmask2, [0b0001]);
|
assert_eq!(bitmask2, [0b0001]);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// This used to cause an ICE.
|
||||||
|
let bitmask = u8x8::from_array([0b01000101, 0, 0, 0, 0, 0, 0, 0]);
|
||||||
|
assert_eq!(
|
||||||
|
mask32x8::from_bitmask_vector(bitmask),
|
||||||
|
mask32x8::from_array([true, false, true, false, false, false, true, false]),
|
||||||
|
);
|
||||||
|
let bitmask =
|
||||||
|
u8x16::from_array([0b01000101, 0b11110000, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]);
|
||||||
|
assert_eq!(
|
||||||
|
mask32x16::from_bitmask_vector(bitmask),
|
||||||
|
mask32x16::from_array([
|
||||||
|
true, false, true, false, false, false, true, false, false, false, false, false, true,
|
||||||
|
true, true, true,
|
||||||
|
]),
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
fn simd_cast() {
|
fn simd_cast() {
|
||||||
|
Loading…
Reference in New Issue
Block a user