On a target with a 16-bit mask (for example), we would choose the type of an integer literal "1024" to be an int16. Previously, we used an int32, which is a worse fit and leads to less efficient code than an int16 on a 16-bit mask target. (However, we'd still give an integer literal 1000000 the type int32, even in a 16-bit target.) Updated the tests to still pass with 8 and 16-bit targets, given this change.
21 lines
611 B
Plaintext
21 lines
611 B
Plaintext
|
|
export uniform int width() { return programCount; }
|
|
|
|
uniform unsigned int64 s = 0xffffffffff000000;
|
|
|
|
export void f_f(uniform float RET[], uniform float aFOO[]) {
|
|
float a = aFOO[programIndex];
|
|
float b = 0;
|
|
if (programIndex < 32 && (programIndex & 1))
|
|
b = atomic_or_local(&s, (1ul << programIndex));
|
|
RET[programIndex] = (s>>20);
|
|
}
|
|
|
|
export void result(uniform float RET[]) {
|
|
uniform int sum = 0;
|
|
for (uniform int i = 0; i < min(32, programCount); ++i)
|
|
if (i & 1)
|
|
sum += (1ul << i);
|
|
RET[programIndex] = ((unsigned int64)(0xffffffffff000000 | sum)) >> 20;
|
|
}
|