File: hello_generator.cpp

package info (click to toggle)
halide 21.0.0-4
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 55,752 kB
  • sloc: cpp: 289,334; ansic: 22,751; python: 7,486; makefile: 4,299; sh: 2,508; java: 1,549; javascript: 282; pascal: 207; xml: 127; asm: 9
file content (49 lines) | stat: -rw-r--r-- 1,353 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
#include "Halide.h"

using namespace Halide;

namespace {

class Hello : public Generator<Hello> {
public:
    Input<Buffer<uint8_t, 2>> input{"input"};
    Output<Buffer<uint8_t, 2>> result{"result"};

    void generate() {
        tone_curve(x) = cast<int16_t>(pow(cast<float>(x) / 256.0f, 1.8f) * 256.0f);

        Func clamped = BoundaryConditions::repeat_edge(input);

        curved(x, y) = tone_curve(clamped(x, y));

        Func sharper;
        sharper(x, y) = 9 * curved(x, y) - 2 * (curved(x - 1, y) + curved(x + 1, y) + curved(x, y - 1) + curved(x, y + 1));

        result(x, y) = cast<uint8_t>(clamp(sharper(x, y), 0, 255));
    }

    void schedule() {
        Var yi;

        tone_curve.compute_root();
        result.split(y, y, yi, 60).vectorize(x, 8).parallel(y);
        curved.store_at(result, y).compute_at(result, yi);

        // We want to handle inputs that may be rotated 180 due to camera module placement.

        // Unset the default stride constraint
        input.dim(0).set_stride(Expr());

        // Make specialized versions for input stride +/-1 to get dense vector loads
        curved.specialize(input.dim(0).stride() == 1);
        curved.specialize(input.dim(0).stride() == -1);
    }

private:
    Var x{"x"}, y{"y"};
    Func tone_curve, curved;
};

}  // namespace

HALIDE_REGISTER_GENERATOR(Hello, hello)