Saturating multiplication for int64 was added.
This commit is contained in:
36
stdlib.ispc
36
stdlib.ispc
@@ -4885,6 +4885,28 @@ static inline varying int32 saturating_mul(varying int32 a, varying int32 b) {
|
|||||||
return result;
|
return result;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Saturating multiplication of two uniform signed 64-bit integers.
// Returns a * b when the exact product fits in int64. Otherwise the result
// is clamped to INT64_MAX (product would be positive) or INT64_MIN (product
// would be negative). A zero operand always yields 0.
static inline uniform int64 saturating_mul(uniform int64 a, uniform int64 b) {
    // Magnitudes are held in unsigned variables so that |INT64_MIN| = 2^63 is
    // representable; negating INT64_MIN in the signed type would overflow.
    uniform unsigned int64 a_abs = (a < 0) ? ((uniform unsigned int64) 0 - (uniform unsigned int64) a)
                                           : (uniform unsigned int64) a;
    uniform unsigned int64 b_abs = (b < 0) ? ((uniform unsigned int64) 0 - (uniform unsigned int64) b)
                                           : (uniform unsigned int64) b;
    // The product is negative only when the operands have strictly opposite signs.
    uniform bool negative = ((a < 0) && (b > 0)) || ((a > 0) && (b < 0));
    // Largest magnitude the result may have: 2^63 if negative, 2^63 - 1 otherwise.
    uniform unsigned int64 limit = (uniform unsigned int64) INT64_MAX;
    if (negative)
        limit = limit + 1;
    // Substitute 1 for a zero divisor so the division below never divides by zero.
    uniform unsigned int64 divisor = (b_abs == 0) ? (uniform unsigned int64) 1 : b_abs;
    if ((b_abs != 0) && (a_abs > (limit / divisor))) {
        if (negative)
            return INT64_MIN;
        else
            return INT64_MAX;
    }
    return a * b;
}
|
||||||
|
|
||||||
|
// Saturating multiplication of two varying signed 64-bit integers.
// For each program instance, returns a * b when the exact product fits in
// int64. Otherwise the result is clamped to INT64_MAX (product would be
// positive) or INT64_MIN (product would be negative). A zero operand always
// yields 0.
static inline varying int64 saturating_mul(varying int64 a, varying int64 b) {
    // Magnitudes are held in unsigned variables so that |INT64_MIN| = 2^63 is
    // representable; negating INT64_MIN in the signed type would overflow.
    varying unsigned int64 a_abs = (a < 0) ? ((varying unsigned int64) 0 - (varying unsigned int64) a)
                                           : (varying unsigned int64) a;
    varying unsigned int64 b_abs = (b < 0) ? ((varying unsigned int64) 0 - (varying unsigned int64) b)
                                           : (varying unsigned int64) b;
    // The product is negative only when the operands have strictly opposite signs.
    varying bool negative = ((a < 0) && (b > 0)) || ((a > 0) && (b < 0));
    // Largest magnitude the result may have: 2^63 if negative, 2^63 - 1 otherwise.
    varying unsigned int64 limit = (varying unsigned int64) INT64_MAX;
    if (negative)
        limit = limit + 1;
    // Substitute 1 for a zero divisor so no lane ever divides by zero.
    varying unsigned int64 divisor = (b_abs == 0) ? (varying unsigned int64) 1 : b_abs;
    if ((b_abs != 0) && (a_abs > (limit / divisor))) {
        if (negative)
            return INT64_MIN;
        else
            return INT64_MAX;
    }
    return a * b;
}
|
||||||
|
|
||||||
static inline uniform unsigned int8 saturating_mul(uniform unsigned int8 a,
|
static inline uniform unsigned int8 saturating_mul(uniform unsigned int8 a,
|
||||||
uniform unsigned int8 b) {
|
uniform unsigned int8 b) {
|
||||||
uniform unsigned int16 result = (uniform unsigned int16) a *
|
uniform unsigned int16 result = (uniform unsigned int16) a *
|
||||||
@@ -4938,6 +4960,20 @@ static inline varying unsigned int32 saturating_mul(varying unsigned int32 a,
|
|||||||
varying unsigned int32 lo = result;
|
varying unsigned int32 lo = result;
|
||||||
return lo | - (varying int32) !! hi;
|
return lo | - (varying int32) !! hi;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Saturating multiplication of two uniform unsigned 64-bit integers.
// Returns a * b when the exact product fits in unsigned int64, otherwise
// UINT64_MAX. A zero operand always yields 0.
static inline uniform unsigned int64 saturating_mul(uniform unsigned int64 a,
                                                    uniform unsigned int64 b) {
    // Substitute 1 for a zero divisor so the overflow check never divides by
    // zero; with b == 0 the check is false and a * b below evaluates to 0.
    uniform unsigned int64 divisor = (b == 0) ? (uniform unsigned int64) 1 : b;
    if (a > (UINT64_MAX / divisor))
        return UINT64_MAX;
    return a * b;
}
|
||||||
|
|
||||||
|
// Saturating multiplication of two varying unsigned 64-bit integers.
// For each program instance, returns a * b when the exact product fits in
// unsigned int64, otherwise UINT64_MAX. A zero operand always yields 0.
static inline varying unsigned int64 saturating_mul(varying unsigned int64 a,
                                                    varying unsigned int64 b) {
    // Substitute 1 for a zero divisor so no lane ever divides by zero; with
    // b == 0 the check is false and a * b below evaluates to 0.
    varying unsigned int64 divisor = (b == 0) ? (varying unsigned int64) 1 : b;
    if (a > (UINT64_MAX / divisor))
        return UINT64_MAX;
    return a * b;
}
|
||||||
///////////////////////////////////////////////////////////////////////////
|
///////////////////////////////////////////////////////////////////////////
|
||||||
// rdrand
|
// rdrand
|
||||||
|
|
||||||
|
|||||||
28
tests/pmuls_i64.ispc
Normal file
28
tests/pmuls_i64.ispc
Normal file
@@ -0,0 +1,28 @@
|
|||||||
|
|
||||||
|
// Returns the built-in programCount value to the caller.
export uniform int width() {
    uniform int count = programCount;
    return count;
}
|
||||||
|
|
||||||
|
// Exercises the uniform int64 overload of saturating_mul.
// Lanes are split by programIndex % 3:
//   0 -> INT64 max * b, 1 -> INT64 min * b, 2 -> b * b.
// aFOO is not read. The matching result() expects 25 for the b * b lanes,
// so b is presumably 5 (TODO confirm against the test harness).
export void f_fu(uniform float RET[], uniform float aFOO[], uniform float b) {
    uniform int64 a_max = 0x7FFFFFFFFFFFFFFF; // max signed int64
    uniform int64 a_min = -0x8000000000000000; // min signed int64
    int lane_kind = programIndex % 3;
    if (lane_kind == 0) {
        RET[programIndex] = saturating_mul(a_max, (uniform int64) b);
    }
    else if (lane_kind == 1) {
        RET[programIndex] = saturating_mul(a_min, (uniform int64) b);
    }
    else {
        RET[programIndex] = saturating_mul((uniform int64) b, (uniform int64) b);
    }
}
|
||||||
|
|
||||||
|
// Writes the expected per-lane values for the uniform int64 test:
// programIndex % 3 == 0 -> max signed int64, == 1 -> min signed int64,
// otherwise 25.
export void result(uniform float RET[]) {
    int lane_kind = programIndex % 3;
    if (lane_kind == 0) {
        RET[programIndex] = (uniform int64) 0x7FFFFFFFFFFFFFFF; // max signed int64
    }
    else if (lane_kind == 1) {
        RET[programIndex] = (uniform int64) -0x8000000000000000; // min signed int64
    }
    else {
        RET[programIndex] = (uniform int64) 25;
    }
}
|
||||||
28
tests/pmuls_vi64.ispc
Normal file
28
tests/pmuls_vi64.ispc
Normal file
@@ -0,0 +1,28 @@
|
|||||||
|
|
||||||
|
// Returns the built-in programCount value to the caller.
export uniform int width() {
    uniform int count = programCount;
    return count;
}
|
||||||
|
|
||||||
|
// Exercises the varying int64 overload of saturating_mul.
// Lanes are split by programIndex % 3:
//   0 -> INT64 max * b, 1 -> INT64 min * b, 2 -> b * b.
// aFOO is not read. The matching result() expects 25 for the b * b lanes,
// so b is presumably 5 (TODO confirm against the test harness).
export void f_fu(uniform float RET[], uniform float aFOO[], uniform float b) {
    varying int64 a_max = 0x7FFFFFFFFFFFFFFF; // max signed int64
    varying int64 a_min = -0x8000000000000000; // min signed int64
    int lane_kind = programIndex % 3;
    if (lane_kind == 0) {
        RET[programIndex] = saturating_mul(a_max, (varying int64) b);
    }
    else if (lane_kind == 1) {
        RET[programIndex] = saturating_mul(a_min, (varying int64) b);
    }
    else {
        RET[programIndex] = saturating_mul((varying int64) b, (varying int64) b);
    }
}
|
||||||
|
|
||||||
|
// Writes the expected per-lane values for the varying int64 test:
// programIndex % 3 == 0 -> max signed int64, == 1 -> min signed int64,
// otherwise 25.
export void result(uniform float RET[]) {
    int lane_kind = programIndex % 3;
    if (lane_kind == 0) {
        RET[programIndex] = (varying int64) 0x7FFFFFFFFFFFFFFF; // max signed int64
    }
    else if (lane_kind == 1) {
        RET[programIndex] = (varying int64) -0x8000000000000000; // min signed int64
    }
    else {
        RET[programIndex] = (varying int64) 25;
    }
}
|
||||||
28
tests/pmulus_i64.ispc
Normal file
28
tests/pmulus_i64.ispc
Normal file
@@ -0,0 +1,28 @@
|
|||||||
|
|
||||||
|
// Returns the built-in programCount value to the caller.
export uniform int width() {
    uniform int count = programCount;
    return count;
}
|
||||||
|
|
||||||
|
// Exercises the uniform unsigned int64 overload of saturating_mul.
// Lanes are split by programIndex % 3:
//   0 -> UINT64 max * b, 1 -> 0 * b, 2 -> b * b.
// aFOO is not read. The matching result() expects 25 for the b * b lanes,
// so b is presumably 5 (TODO confirm against the test harness).
export void f_fu(uniform float RET[], uniform float aFOO[], uniform float b) {
    uniform unsigned int64 a_max = 0xFFFFFFFFFFFFFFFF, a_min = 0; // max and min unsigned int64
    if (programIndex % 3 == 0) {
        RET[programIndex] = saturating_mul(a_max, (uniform unsigned int64) b);
    }
    else if (programIndex % 3 == 1) {
        // b is converted as-is rather than negated first: for a positive b,
        // -b is negative and out of range for an unsigned conversion, so the
        // operand would be unspecified. The expected product with 0 is
        // unchanged.
        RET[programIndex] = saturating_mul(a_min, (uniform unsigned int64) b);
    }
    else {
        RET[programIndex] = saturating_mul((uniform unsigned int64) b,
                                           (uniform unsigned int64) b);
    }
}
|
||||||
|
|
||||||
|
// Writes the expected per-lane values for the uniform unsigned int64 test:
// programIndex % 3 == 0 -> max unsigned int64, == 1 -> 0, otherwise 25.
export void result(uniform float RET[]) {
    int lane_kind = programIndex % 3;
    if (lane_kind == 0) {
        RET[programIndex] = (uniform unsigned int64) 0xFFFFFFFFFFFFFFFF; // max unsigned int64
    }
    else if (lane_kind == 1) {
        RET[programIndex] = (uniform unsigned int64) 0; // min unsigned int64
    }
    else {
        RET[programIndex] = (uniform unsigned int64) 25;
    }
}
|
||||||
28
tests/pmulus_vi64.ispc
Normal file
28
tests/pmulus_vi64.ispc
Normal file
@@ -0,0 +1,28 @@
|
|||||||
|
|
||||||
|
// Returns the built-in programCount value to the caller.
export uniform int width() {
    uniform int count = programCount;
    return count;
}
|
||||||
|
|
||||||
|
// Exercises the varying unsigned int64 overload of saturating_mul.
// Lanes are split by programIndex % 3:
//   0 -> UINT64 max * b, 1 -> 0 * b, 2 -> b * b.
// aFOO is not read. The matching result() expects 25 for the b * b lanes,
// so b is presumably 5 (TODO confirm against the test harness).
export void f_fu(uniform float RET[], uniform float aFOO[], uniform float b) {
    varying unsigned int64 a_max = 0xFFFFFFFFFFFFFFFF, a_min = 0; // max and min unsigned int64
    if (programIndex % 3 == 0) {
        RET[programIndex] = saturating_mul(a_max, (varying unsigned int64) b);
    }
    else if (programIndex % 3 == 1) {
        // b is converted as-is rather than negated first: for a positive b,
        // -b is negative and out of range for an unsigned conversion, so the
        // operand would be unspecified. The expected product with 0 is
        // unchanged.
        RET[programIndex] = saturating_mul(a_min, (varying unsigned int64) b);
    }
    else {
        RET[programIndex] = saturating_mul((varying unsigned int64) b,
                                           (varying unsigned int64) b);
    }
}
|
||||||
|
|
||||||
|
// Writes the expected per-lane values for the varying unsigned int64 test:
// programIndex % 3 == 0 -> max unsigned int64, == 1 -> 0, otherwise 25.
export void result(uniform float RET[]) {
    int lane_kind = programIndex % 3;
    if (lane_kind == 0) {
        RET[programIndex] = (varying unsigned int64) 0xFFFFFFFFFFFFFFFF; // max unsigned int64
    }
    else if (lane_kind == 1) {
        RET[programIndex] = (varying unsigned int64) 0; // min unsigned int64
    }
    else {
        RET[programIndex] = (varying unsigned int64) 25;
    }
}
|
||||||
Reference in New Issue
Block a user