Fixed missing tmp var needed for use with gather intrinsic
This commit is contained in:
@@ -1589,11 +1589,6 @@ CAST_BITS_SCALAR(double, int64_t)
|
||||
///////////////////////////////////////////////////////////////////////////
|
||||
// various math functions
|
||||
|
||||
/*
|
||||
static FORCEINLINE void __fastmath() {
|
||||
}
|
||||
*/
|
||||
|
||||
/* Rounds a single scalar float to the nearest integral value (still
 * represented as a float) by delegating to the C library's roundf(),
 * which rounds halfway cases away from zero. */
static FORCEINLINE float __round_uniform_float(float v) {
    const float rounded = roundf(v);
    return rounded;
}
|
||||
@@ -1943,7 +1938,7 @@ static FORCEINLINE void __masked_store_blend_float(void *p, __vec16_f val,
|
||||
static FORCEINLINE __vec16_i32
|
||||
__gather_base_offsets32_i32(uint8_t *base, uint32_t scale, __vec16_i32 offsets,
|
||||
__vec16_i1 mask) {
|
||||
// Loop is generated by intrinsic
|
||||
__vec16_i32 tmp = _mm512_undefined_epi32();
|
||||
__vec16_i32 ret = _mm512_mask_i32extgather_epi32(tmp, mask, offsets, base,
|
||||
_MM_UPCONV_EPI32_NONE, scale,
|
||||
_MM_HINT_NONE);
|
||||
@@ -1953,7 +1948,7 @@ __gather_base_offsets32_i32(uint8_t *base, uint32_t scale, __vec16_i32 offsets,
|
||||
static FORCEINLINE __vec16_f
|
||||
__gather_base_offsets32_float(uint8_t *base, uint32_t scale, __vec16_i32 offsets,
|
||||
__vec16_i1 mask) {
|
||||
// Loop is generated by intrinsic
|
||||
__vec16_f tmp = _mm512_undefined_ps();
|
||||
__vec16_f ret = _mm512_mask_i32extgather_ps(tmp, mask, offsets, base,
|
||||
_MM_UPCONV_PS_NONE, scale,
|
||||
_MM_HINT_NONE);
|
||||
|
||||
Reference in New Issue
Block a user