1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35
|
#include "test_static.isph"
// rule: skip on arch=xe64
#define THREADS 4
task void f_f_task(uniform float RET[], uniform float aFOO[]) {
uniform float val[programCount];
for (uniform int i = 0; i < programCount; ++i)
val[i] = 0;
foreach (i = 0 ... programCount)
val[i] += aFOO[programCount*taskIndex + i] - 1;
uniform float sum = 0;
for (uniform int i = 0; i < programCount; ++i)
sum += val[i];
if (programIndex < programCount/THREADS)
RET[programCount/THREADS*taskIndex + programIndex] = sum;
}
task void f_f(uniform float RET[], uniform float aFOO[])
{
launch[THREADS] f_f_task(RET, aFOO);
}
task void result_task(uniform float RET[])
{
const uniform float ret = reduce_add(programIndex + programCount*taskIndex);
if (programIndex < programCount/THREADS)
RET[programCount/THREADS*taskIndex + programIndex] = ret;
}
task void result(uniform float RET[]) {
launch[THREADS] result_task(RET);
}
|