convert _mm_mask_i32gather_epi32 to const generics
This commit is contained in:
parent
48c7ba0886
commit
a93607a9f2
1 changed file with 6 additions and 12 deletions
|
|
@@ -1109,26 +1109,21 @@ pub unsafe fn _mm_i32gather_epi32<const SCALE: i32>(
|
|||
/// [Intel's documentation](https://software.intel.com/sites/landingpage/IntrinsicsGuide/#text=_mm_mask_i32gather_epi32)
|
||||
#[inline]
|
||||
#[target_feature(enable = "avx2")]
|
||||
#[cfg_attr(test, assert_instr(vpgatherdd, scale = 1))]
|
||||
#[rustc_args_required_const(4)]
|
||||
#[cfg_attr(test, assert_instr(vpgatherdd, SCALE = 1))]
|
||||
#[rustc_legacy_const_generics(4)]
|
||||
#[stable(feature = "simd_x86", since = "1.27.0")]
|
||||
pub unsafe fn _mm_mask_i32gather_epi32(
|
||||
pub unsafe fn _mm_mask_i32gather_epi32<const SCALE: i32>(
|
||||
src: __m128i,
|
||||
slice: *const i32,
|
||||
offsets: __m128i,
|
||||
mask: __m128i,
|
||||
scale: i32,
|
||||
) -> __m128i {
|
||||
static_assert_imm8_scale!(SCALE);
|
||||
let src = src.as_i32x4();
|
||||
let mask = mask.as_i32x4();
|
||||
let offsets = offsets.as_i32x4();
|
||||
let slice = slice as *const i8;
|
||||
macro_rules! call {
|
||||
($imm8:expr) => {
|
||||
pgatherdd(src, slice, offsets, mask, $imm8)
|
||||
};
|
||||
}
|
||||
let r = constify_imm8_gather!(scale, call);
|
||||
let r = pgatherdd(src, slice, offsets, mask, SCALE as i8);
|
||||
transmute(r)
|
||||
}
|
||||
|
||||
|
|
@@ -5583,12 +5578,11 @@ mod tests {
|
|||
arr[i as usize] = i;
|
||||
}
|
||||
// A multiplier of 4 is word-addressing
|
||||
let r = _mm_mask_i32gather_epi32(
|
||||
let r = _mm_mask_i32gather_epi32::<4>(
|
||||
_mm_set1_epi32(256),
|
||||
arr.as_ptr(),
|
||||
_mm_setr_epi32(0, 16, 64, 96),
|
||||
_mm_setr_epi32(-1, -1, -1, 0),
|
||||
4,
|
||||
);
|
||||
assert_eq_m128i(r, _mm_setr_epi32(0, 16, 64, 256));
|
||||
}
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue