Rollup merge of #112096 - workingjubilee:array-unzip, r=scottmcm
Remove array_zip `[T; N]::zip` is "eager" but most zips are mapped. This causes poor optimization in generated code. This is a fundamental design issue and "zip" is "prime real estate" in terms of function names, so let's free it up again. - FCP concluded in https://github.com/rust-lang/rust/issues/80094#issuecomment-1468300057 - Closes https://github.com/rust-lang/rust/issues/80094 - Closes https://github.com/rust-lang/rust/issues/103555 Could use review to make sure we aren't losing any essential codegen tests. r? `@scottmcm`
This commit is contained in:
commit
88160ab94c
@ -538,29 +538,6 @@ macro_rules! array_impl_default {
|
||||
drain_array_with(self, |iter| try_from_trusted_iterator(iter.map(f)))
|
||||
}
|
||||
|
||||
/// 'Zips up' two arrays into a single array of pairs.
|
||||
///
|
||||
/// `zip()` returns a new array where every element is a tuple where the
|
||||
/// first element comes from the first array, and the second element comes
|
||||
/// from the second array. In other words, it zips two arrays together,
|
||||
/// into a single one.
|
||||
///
|
||||
/// # Examples
|
||||
///
|
||||
/// ```
|
||||
/// #![feature(array_zip)]
|
||||
/// let x = [1, 2, 3];
|
||||
/// let y = [4, 5, 6];
|
||||
/// let z = x.zip(y);
|
||||
/// assert_eq!(z, [(1, 4), (2, 5), (3, 6)]);
|
||||
/// ```
|
||||
#[unstable(feature = "array_zip", issue = "80094")]
|
||||
pub fn zip<U>(self, rhs: [U; N]) -> [(T, U); N] {
|
||||
drain_array_with(self, |lhs| {
|
||||
drain_array_with(rhs, |rhs| from_trusted_iterator(crate::iter::zip(lhs, rhs)))
|
||||
})
|
||||
}
|
||||
|
||||
/// Returns a slice containing the entire array. Equivalent to `&s[..]`.
|
||||
#[stable(feature = "array_as_slice", since = "1.57.0")]
|
||||
#[rustc_const_stable(feature = "array_as_slice", since = "1.57.0")]
|
||||
|
@ -4,7 +4,6 @@
|
||||
// ignore-debug (the extra assertions get in the way)
|
||||
|
||||
#![crate_type = "lib"]
|
||||
#![feature(array_zip)]
|
||||
|
||||
// CHECK-LABEL: @short_integer_map
|
||||
#[no_mangle]
|
||||
@ -16,16 +15,6 @@
|
||||
x.map(|x| 2 * x + 1)
|
||||
}
|
||||
|
||||
// CHECK-LABEL: @short_integer_zip_map
|
||||
#[no_mangle]
|
||||
pub fn short_integer_zip_map(x: [u32; 8], y: [u32; 8]) -> [u32; 8] {
|
||||
// CHECK: %[[A:.+]] = load <8 x i32>
|
||||
// CHECK: %[[B:.+]] = load <8 x i32>
|
||||
// CHECK: sub <8 x i32> %[[B]], %[[A]]
|
||||
// CHECK: store <8 x i32>
|
||||
x.zip(y).map(|(x, y)| x - y)
|
||||
}
|
||||
|
||||
// This test is checking that LLVM can SRoA away a bunch of the overhead,
|
||||
// like fully moving the iterators to registers. Notably, previous implementations
|
||||
// of `map` ended up `alloca`ing the whole `array::IntoIterator`, meaning both a
|
||||
|
@ -1,7 +1,6 @@
|
||||
// compile-flags: -C opt-level=3 -Z merge-functions=disabled
|
||||
// only-x86_64
|
||||
#![crate_type = "lib"]
|
||||
#![feature(array_zip)]
|
||||
|
||||
// CHECK-LABEL: @auto_vectorize_direct
|
||||
#[no_mangle]
|
||||
@ -32,12 +31,12 @@
|
||||
c
|
||||
}
|
||||
|
||||
// CHECK-LABEL: @auto_vectorize_array_zip_map
|
||||
// CHECK-LABEL: @auto_vectorize_array_from_fn
|
||||
#[no_mangle]
|
||||
pub fn auto_vectorize_array_zip_map(a: [f32; 4], b: [f32; 4]) -> [f32; 4] {
|
||||
pub fn auto_vectorize_array_from_fn(a: [f32; 4], b: [f32; 4]) -> [f32; 4] {
|
||||
// CHECK: load <4 x float>
|
||||
// CHECK: load <4 x float>
|
||||
// CHECK: fadd <4 x float>
|
||||
// CHECK: store <4 x float>
|
||||
a.zip(b).map(|(a, b)| a + b)
|
||||
std::array::from_fn(|i| a[i] + b[i])
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user