1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46
|
#include "Halide.h"
namespace {
// Halide generator for a 2-D int32 pipeline that adds the constant 2 to
// every element of `input`. When the build target reports a GPU feature,
// the output is scheduled in 16x16 GPU tiles; otherwise no explicit
// schedule is applied.
class GpuAdd : public Halide::Generator<GpuAdd> {
public:
    Input<Buffer<int32_t, 2>> input{"input"};
    Output<Buffer<int32_t, 2>> output{"output"};

    void generate() {
        Var x("x");
        Var y("y");

        // Algorithm: offset each pixel value by 2.
        output(x, y) = input(x, y) + 2;

        // Schedule: nothing more to do unless a GPU feature is enabled.
        if (!get_target().has_gpu_feature()) {
            return;
        }

        // Edge length of the square tile handed to gpu_tile().
        constexpr int kTileEdge = 16;

        // Outer/inner variables produced by splitting x and y into tiles.
        Var x_outer;
        Var y_outer;
        Var x_inner;
        Var y_inner;
        output.gpu_tile(x, y, x_outer, y_outer, x_inner, y_inner, kTileEdge, kTileEdge);
    }
};
// Halide generator for a 2-D int32 pipeline that multiplies every element
// of `input` by 2. When the build target reports a GPU feature, the output
// is scheduled in 16x16 GPU tiles; otherwise no explicit schedule is
// applied.
class GpuMul : public Halide::Generator<GpuMul> {
public:
    Input<Buffer<int32_t, 2>> input{"input"};
    Output<Buffer<int32_t, 2>> output{"output"};

    void generate() {
        Var x("x");
        Var y("y");

        // Algorithm: scale each pixel value by 2.
        output(x, y) = input(x, y) * 2;

        // Schedule: nothing more to do unless a GPU feature is enabled.
        if (!get_target().has_gpu_feature()) {
            return;
        }

        // Edge length of the square tile handed to gpu_tile().
        constexpr int kTileEdge = 16;

        // Outer/inner variables produced by splitting x and y into tiles.
        Var x_outer;
        Var y_outer;
        Var x_inner;
        Var y_inner;
        output.gpu_tile(x, y, x_outer, y_outer, x_inner, y_inner, kTileEdge, kTileEdge);
    }
};
} // namespace
// Register each generator class with Halide; the second macro argument is
// the generator name it is registered under (GpuAdd as
// gpu_multi_context_threaded_add, GpuMul as gpu_multi_context_threaded_mul).
HALIDE_REGISTER_GENERATOR(GpuAdd, gpu_multi_context_threaded_add)
HALIDE_REGISTER_GENERATOR(GpuMul, gpu_multi_context_threaded_mul)
|