File: main.hip

package info (click to toggle)
cmake 3.25.1-1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 121,376 kB
  • sloc: ansic: 361,053; cpp: 250,806; sh: 3,828; yacc: 3,243; python: 2,707; lex: 1,328; lisp: 382; asm: 371; f90: 314; java: 266; perl: 217; objc: 212; xml: 202; cs: 200; fortran: 131; makefile: 99; javascript: 83; pascal: 63; tcl: 55; php: 25; ruby: 22
file content (40 lines) | stat: -rw-r--r-- 903 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40

#include <stdexcept>
#include <cmath>
#include <math.h>
#include <memory>

#include <hip/hip_runtime.h>
#include <hip/hip_fp16.h>

namespace {
// Kernel trampoline: calls the device callable `f` and stores what it returns
// in the first element addressed by `out`. There is no per-thread indexing, so
// every thread that executes the kernel writes to that same slot.
template <typename T, typename F>
__global__ void global_entry_point(F f, T* out)
{
  out[0] = f();
}

template <class T, class F>
bool verify(F f, T expected)
{
  std::unique_ptr<T> cpu_T(new T);
  T* gpu_T = nullptr;
  hipMalloc((void**)&gpu_T, sizeof(T));
  hipLaunchKernelGGL(global_entry_point, 1, 1, 0, 0, f, gpu_T);
  hipMemcpy(cpu_T.get(), gpu_T, sizeof(T), hipMemcpyDeviceToHost);
  hipFree(gpu_T);
  return (*cpu_T == expected);
}
}

// Runs three device-side math checks (std::round on float, and max/min
// instantiated for _Float16) and reports the combined outcome as the process
// exit code: 0 when every check passes, 1 otherwise.
int main(int argc, char** argv)
{
  // Each check is evaluated in its own statement so all three always run,
  // regardless of earlier results.
  const bool round_ok =
    verify([] __device__ () { return std::round(1.4f); }, 1.0f);
  const bool max_ok =
    verify([] __device__ () { return max<_Float16>(1.0f, 2.0f); }, 2.0f);
  const bool min_ok =
    verify([] __device__ () { return min<_Float16>(1.0f, 2.0f); }, 1.0f);

  return (round_ok && max_ok && min_ok) ? 0 : 1;
}