Saturating multiplication for int64 was added.

This commit is contained in:
Vsevolod Livinskij
2014-02-23 19:48:03 +04:00
parent 1f2541fbec
commit af836cda27
5 changed files with 148 additions and 0 deletions

View File

@@ -4885,6 +4885,28 @@ static inline varying int32 saturating_mul(varying int32 a, varying int32 b) {
return result;
}
static inline uniform int64 saturating_mul(uniform int64 a, uniform int64 b) {
uniform int64 a_abs = (a > 0) ? a : -a;
uniform int64 b_abs = (b > 0) ? b : -b;
if (a_abs > (INT64_MAX / b_abs))
if (((a > 0) && (b > 0)) || ((a < 0) && (b < 0)))
return INT64_MAX;
else
return INT64_MIN;
return a * b;
}
static inline varying int64 saturating_mul(varying int64 a, varying int64 b) {
varying int64 a_abs = (a > 0) ? a : -a;
varying int64 b_abs = (b > 0) ? b : -b;
if (a_abs > (INT64_MAX / b_abs))
if (((a > 0) && (b > 0)) || ((a < 0) && (b < 0)))
return INT64_MAX;
else
return INT64_MIN;
return a * b;
}
static inline uniform unsigned int8 saturating_mul(uniform unsigned int8 a,
uniform unsigned int8 b) {
uniform unsigned int16 result = (uniform unsigned int16) a *
@@ -4938,6 +4960,20 @@ static inline varying unsigned int32 saturating_mul(varying unsigned int32 a,
varying unsigned int32 lo = result;
return lo | - (varying int32) !! hi;
}
static inline uniform unsigned int64 saturating_mul(uniform unsigned int64 a,
uniform unsigned int64 b) {
if (a > (UINT64_MAX / b))
return UINT64_MAX;
return a * b;
}
static inline varying unsigned int64 saturating_mul(varying unsigned int64 a,
varying unsigned int64 b) {
if (a > (UINT64_MAX / b))
return UINT64_MAX;
return a * b;
}
///////////////////////////////////////////////////////////////////////////
// rdrand

28
tests/pmuls_i64.ispc Normal file
View File

@@ -0,0 +1,28 @@
export uniform int width() { return programCount; }
export void f_fu(uniform float RET[], uniform float aFOO[], uniform float b) {
uniform int64 a_max = 0x7FFFFFFFFFFFFFFF, a_min = -0x8000000000000000; // max and min signed int64
if (programIndex % 3 == 0) {
RET[programIndex] = saturating_mul(a_max, (uniform int64) b);
}
else if (programIndex % 3 == 1) {
RET[programIndex] = saturating_mul(a_min, (uniform int64) b);
}
else {
RET[programIndex] = saturating_mul((uniform int64) b,
(uniform int64) b);
}
}
export void result(uniform float RET[]) {
if (programIndex % 3 == 0) {
RET[programIndex] = (uniform int64) 0x7FFFFFFFFFFFFFFF; // max signed int64
}
else if (programIndex % 3 == 1) {
RET[programIndex] = (uniform int64) -0x8000000000000000; // min signed int64
}
else {
RET[programIndex] = (uniform int64) 25;
}
}

28
tests/pmuls_vi64.ispc Normal file
View File

@@ -0,0 +1,28 @@
export uniform int width() { return programCount; }
export void f_fu(uniform float RET[], uniform float aFOO[], uniform float b) {
varying int64 a_max = 0x7FFFFFFFFFFFFFFF, a_min = -0x8000000000000000; // max and min signed int64
if (programIndex % 3 == 0) {
RET[programIndex] = saturating_mul(a_max, (varying int64) b);
}
else if (programIndex % 3 == 1) {
RET[programIndex] = saturating_mul(a_min, (varying int64) b);
}
else {
RET[programIndex] = saturating_mul((varying int64) b,
(varying int64) b);
}
}
export void result(uniform float RET[]) {
if (programIndex % 3 == 0) {
RET[programIndex] = (varying int64) 0x7FFFFFFFFFFFFFFF; // max signed int64
}
else if (programIndex % 3 == 1) {
RET[programIndex] = (varying int64) -0x8000000000000000; // min signed int64
}
else {
RET[programIndex] = (varying int64) 25;
}
}

28
tests/pmulus_i64.ispc Normal file
View File

@@ -0,0 +1,28 @@
export uniform int width() { return programCount; }
export void f_fu(uniform float RET[], uniform float aFOO[], uniform float b) {
uniform unsigned int64 a_max = 0xFFFFFFFFFFFFFFFF, a_min = 0; // max and min unsigned int64
if (programIndex % 3 == 0) {
RET[programIndex] = saturating_mul(a_max, (uniform unsigned int64) b);
}
else if (programIndex % 3 == 1) {
RET[programIndex] = saturating_mul(a_min, (uniform unsigned int64) -b);
}
else {
RET[programIndex] = saturating_mul((uniform unsigned int64) b,
(uniform unsigned int64) b);
}
}
export void result(uniform float RET[]) {
if (programIndex % 3 == 0) {
RET[programIndex] = (uniform unsigned int64) 0xFFFFFFFFFFFFFFFF; // max unsigned int64
}
else if (programIndex % 3 == 1) {
RET[programIndex] = (uniform unsigned int64) 0; // min unsigned int64
}
else {
RET[programIndex] = (uniform unsigned int64) 25;
}
}

28
tests/pmulus_vi64.ispc Normal file
View File

@@ -0,0 +1,28 @@
export uniform int width() { return programCount; }
export void f_fu(uniform float RET[], uniform float aFOO[], uniform float b) {
varying unsigned int64 a_max = 0xFFFFFFFFFFFFFFFF, a_min = 0; // max and min unsigned int64
if (programIndex % 3 == 0) {
RET[programIndex] = saturating_mul(a_max, (varying unsigned int64) b);
}
else if (programIndex % 3 == 1) {
RET[programIndex] = saturating_mul(a_min, (varying unsigned int64) -b);
}
else {
RET[programIndex] = saturating_mul((varying unsigned int64) b,
(varying unsigned int64) b);
}
}
export void result(uniform float RET[]) {
if (programIndex % 3 == 0) {
RET[programIndex] = (varying unsigned int64) 0xFFFFFFFFFFFFFFFF; // max unsigned int64
}
else if (programIndex % 3 == 1) {
RET[programIndex] = (varying unsigned int64) 0; // min unsigned int64
}
else {
RET[programIndex] = (varying unsigned int64) 25;
}
}