1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112
|
#include "Halide.h"
// Avoid the need to link this test to libjpeg and libpng
#define HALIDE_NO_JPEG
#define HALIDE_NO_PNG
#include "halide_image_io.h"
#include "halide_test_dirs.h"
#include <cstdio>
using namespace Halide;
int main(int argc, char **argv) {
if (get_jit_target_from_environment().arch == Target::WebAssembly) {
printf("[SKIP] WebAssembly JIT does not support debug_to_file() yet.\n");
return 0;
}
std::vector<std::string> formats = {"npy", "mat"};
for (const auto &format : formats) {
std::cout << "Testing format " << format << "...\n";
std::string f_path = Internal::get_test_tmp_dir() + "f." + format;
std::string g_path = Internal::get_test_tmp_dir() + "g." + format;
std::string h_path = Internal::get_test_tmp_dir() + "h." + format;
Internal::ensure_no_file_exists(f_path);
Internal::ensure_no_file_exists(g_path);
Internal::ensure_no_file_exists(h_path);
{
Func f, g, h, j;
Var x, y, z;
f(x, y, z) = cast<int32_t>(x + y + z);
g(x, y) = cast<float>(f(x, y, 0) + f(x + 1, y, 1));
h(x, y) = cast<int32_t>(f(x, y, -1) + g(x, y));
Target target = get_jit_target_from_environment();
if (target.has_gpu_feature()) {
Var xi, yi;
f.compute_root().gpu_tile(x, y, xi, yi, 1, 1).debug_to_file(f_path);
g.compute_root().gpu_tile(x, y, xi, yi, 1, 1).debug_to_file(g_path);
h.compute_root().gpu_tile(x, y, xi, yi, 1, 1).debug_to_file(h_path);
} else {
f.compute_root().debug_to_file(f_path);
g.compute_root().debug_to_file(g_path);
h.compute_root().debug_to_file(h_path);
}
Buffer<int32_t> im = h.realize({10, 10}, target);
}
{
Internal::assert_file_exists(f_path);
Internal::assert_file_exists(g_path);
Internal::assert_file_exists(h_path);
Buffer<int32_t> f = Tools::load_image(f_path);
assert(f.dimensions() == 3 &&
f.dim(0).extent() == 11 &&
f.dim(1).extent() == 10 &&
f.dim(2).extent() == 3);
for (int z = 0; z < 3; z++) {
for (int y = 0; y < 10; y++) {
for (int x = 0; x < 11; x++) {
int32_t val = f(x, y, z);
// The min coord gets lost on debug_to_file, so f should be shifted up by one.
if (val != x + y + z - 1) {
printf("f(%d, %d, %d) = %d instead of %d\n", x, y, z, val, x + y);
return 1;
}
}
}
}
Buffer<float> g = Tools::load_image(g_path);
assert(g.dimensions() == 2 &&
g.dim(0).extent() == 10 &&
g.dim(1).extent() == 10);
for (int y = 0; y < 10; y++) {
for (int x = 0; x < 10; x++) {
float val = g(x, y);
float correct = (float)(f(x, y, 1) + f(x + 1, y, 2));
if (val != correct) {
printf("g(%d, %d) = %f instead of %f\n", x, y, val, correct);
return 1;
}
}
}
Buffer<int32_t> h = Tools::load_image(h_path);
assert(h.dimensions() == 2 &&
h.dim(0).extent() == 10 &&
h.dim(1).extent() == 10);
for (int y = 0; y < 10; y++) {
for (int x = 0; x < 10; x++) {
int32_t val = h(x, y);
int32_t correct = f(x, y, 0) + g(x, y);
if (val != correct) {
printf("h(%d, %d) = %d instead of %d\n", x, y, val, correct);
return 1;
}
}
}
}
}
printf("Success!\n");
return 0;
}
|