File: copy_kernel_timestamps.builtin_kernel

package info (click to toggle)
intel-compute-runtime 20.44.18297-1
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 34,780 kB
  • sloc: cpp: 379,729; lisp: 4,931; python: 299; sh: 196; makefile: 8
file content (52 lines) | stat: -rw-r--r-- 1,717 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
/*
 * Copyright (C) 2020 Intel Corporation
 *
 * SPDX-License-Identifier: MIT
 *
 */

R"===(
/*
 * QueryKernelTimestamps
 *
 * Each work-item (indexed by its global id in dimension 0) handles one entry
 * of srcEvents. The entry is a 64-bit value that is reinterpreted as the
 * address of an array of 32-bit words in global memory. Four ulong results
 * are stored at dst[4 * gid] .. dst[4 * gid + 3]:
 *
 *   slot 0: word 1
 *   slot 1: word 3
 *   slot 2: word 1 if useOnlyGlobalTimestamps != 0, otherwise word 0
 *   slot 3: word 3 if useOnlyGlobalTimestamps != 0, otherwise word 2
 *
 * NOTE(review): judging by the parameter name, words 1/3 are presumably the
 * global start/end timestamps and words 0/2 the context ones - confirm
 * against the timestamp packet layout used by the caller.
 */
__kernel void QueryKernelTimestamps(__global ulong* srcEvents, __global ulong* dst, uint useOnlyGlobalTimestamps) {
    const ulong low32Mask = 0xFFFFFFFFUL;
    const uint workItem = get_global_id(0);
    const uint base = workItem * 4;

    // Clear all four output slots before any source data is read.
    for (uint slot = 0; slot < 4; ++slot) {
        dst[base + slot] = 0;
    }

    // The event entry is an address stored as an integer; view it as 32-bit words.
    __global uint *words = (__global uint *) srcEvents[workItem];

    // Slots 2 and 3 either repeat words 1/3 or take words 0/2.
    const uint startWord = (useOnlyGlobalTimestamps != 0) ? 1 : 0;
    const uint endWord = startWord + 2;

    dst[base] = words[1] & low32Mask;
    dst[base + 1] = words[3] & low32Mask;
    dst[base + 2] = words[startWord] & low32Mask;
    dst[base + 3] = words[endWord] & low32Mask;
}

/*
 * QueryKernelTimestampsWithOffsets
 *
 * Each work-item (indexed by its global id in dimension 0) handles one entry
 * of srcEvents. The entry is a 64-bit value that is reinterpreted as the
 * address of an array of 32-bit words in global memory. offsets[gid] is
 * divided by 8 (the size of one ulong element of dst) to obtain the index of
 * the first of four consecutive ulong output slots in dst:
 *
 *   slot 0: word 1
 *   slot 1: word 3
 *   slot 2: word 1 if useOnlyGlobalTimestamps != 0, otherwise word 0
 *   slot 3: word 3 if useOnlyGlobalTimestamps != 0, otherwise word 2
 *
 * NOTE(review): judging by the parameter name, words 1/3 are presumably the
 * global start/end timestamps and words 0/2 the context ones - confirm
 * against the timestamp packet layout used by the caller.
 */
__kernel void QueryKernelTimestampsWithOffsets(__global ulong* srcEvents, __global ulong* dst, __global ulong *offsets, uint useOnlyGlobalTimestamps) {
    uint gid = get_global_id(0);
    const ulong tsMask = (1ull << 32) - 1;

    // Keep the element index 64-bit: offsets[] holds ulong values, and
    // narrowing the quotient to uint would silently wrap for large offsets
    // and redirect the stores to the wrong place in dst.
    const ulong currentOffset = offsets[gid] / 8;

    // Clear all four output slots before any source data is read.
    dst[currentOffset] = 0;
    dst[currentOffset + 1] = 0;
    dst[currentOffset + 2] = 0;
    dst[currentOffset + 3] = 0;

    // The event entry is an address stored as an integer; view it as 32-bit words.
    ulong srcPtr = srcEvents[gid];
    __global uint *src = (__global uint *) srcPtr;

    dst[currentOffset] = src[1] & tsMask;
    dst[currentOffset + 1] = src[3] & tsMask;
    if (useOnlyGlobalTimestamps != 0) {
        // Repeat words 1/3 in the second pair of slots.
        dst[currentOffset + 2] = src[1] & tsMask;
        dst[currentOffset + 3] = src[3] & tsMask;
    } else {
        // Second pair of slots comes from words 0/2.
        dst[currentOffset + 2] = src[0] & tsMask;
        dst[currentOffset + 3] = src[2] & tsMask;
    }
}
)==="