File: cpuintrinsics.cpp

package info (click to toggle)
intel-compute-runtime 25.44.36015.8-1
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 79,632 kB
  • sloc: cpp: 931,547; lisp: 2,074; sh: 719; makefile: 162; python: 21
file content (106 lines) | stat: -rw-r--r-- 2,844 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
/*
 * Copyright (C) 2020-2025 Intel Corporation
 *
 * SPDX-License-Identifier: MIT
 *
 */

#include "shared/source/utilities/cpuintrinsics.h"

#include "shared/source/command_stream/task_count_helper.h"
#include "shared/source/helpers/ptr_math.h"

#include <atomic>
#include <cstdint>
#include <functional>

namespace CpuIntrinsicsTests {
// State written and read by the NEO::CpuIntrinsics functions defined later in this file.
// std::atomic is used so these values stay sanitizer-clean in multi-threaded (MT) tests.

// clFlush(): last pointer passed in (as an integer) and number of calls.
std::atomic<uintptr_t> lastClFlushedPtr{0u};
std::atomic<uint32_t> clFlushCounter{0u};

// Call counters for pause(), sfence() and mfence().
std::atomic<uint32_t> pauseCounter{0u};
std::atomic<uint32_t> sfenceCounter{0u};
std::atomic<uint32_t> mfenceCounter{0u};

// umwait(): last `counter` and `ctrl` arguments, and number of calls.
std::atomic<uint64_t> lastUmwaitCounter{0u};
std::atomic<unsigned int> lastUmwaitControl{0u};
std::atomic<uint32_t> umwaitCounter{0u};

// umonitor(): last pointer passed in (as an integer) and number of calls.
std::atomic<uintptr_t> lastUmonitorPtr{0u};
std::atomic<uint32_t> umonitorCounter{0u};

// Call counter for rdtsc().
std::atomic<uint32_t> rdtscCounter{0u};

// Call counter for tpause().
std::atomic<uint32_t> tpauseCounter{0u};

// pause(): when pauseAddress is non-null, pauseValue is written through it on each call.
volatile TagAddressType *pauseAddress{nullptr};
TaskCountType pauseValue{0u};
// pause(): offset handed to ptrOffset() to move pauseAddress when setupPauseAddress is empty.
uint32_t pauseOffset{0u};
// Value returned by rdtsc().
uint64_t rdtscRetValue{0};
// Value returned by umwait().
unsigned char umwaitRetValue{0};

// Optional hook invoked by pause() after the write through pauseAddress.
std::function<void()> setupPauseAddress;
// Optional hook invoked by umwait() before it returns umwaitRetValue.
std::function<void()> controlUmwait;
} // namespace CpuIntrinsicsTests

namespace NEO {
namespace CpuIntrinsics {

// Records a clFlush request: bumps CpuIntrinsicsTests::clFlushCounter, then
// remembers the address in CpuIntrinsicsTests::lastClFlushedPtr.
// Nothing else is done with `ptr` here.
void clFlush(void const *ptr) {
    const auto flushedAddress = reinterpret_cast<uintptr_t>(ptr);
    CpuIntrinsicsTests::clFlushCounter.fetch_add(1u);
    CpuIntrinsicsTests::lastClFlushedPtr.store(flushedAddress);
}

// Forwards to clFlush(), so the call is recorded in the same counter and
// last-pointer slot as a plain clFlush().
void clFlushOpt(void *ptr) {
    void const *flushTarget = ptr;
    clFlush(flushTarget);
}

// Counts the call in CpuIntrinsicsTests::sfenceCounter; no other work is done.
void sfence() {
    CpuIntrinsicsTests::sfenceCounter.fetch_add(1u);
}

// Counts the call in CpuIntrinsicsTests::mfenceCounter; no other work is done.
void mfence() {
    CpuIntrinsicsTests::mfenceCounter.fetch_add(1u);
}

// Counts the call in CpuIntrinsicsTests::pauseCounter. If a pause address is
// configured, writes CpuIntrinsicsTests::pauseValue through it and then either
// runs the setupPauseAddress hook (when set) or replaces pauseAddress with
// ptrOffset(pauseAddress, pauseOffset).
void pause() {
    CpuIntrinsicsTests::pauseCounter.fetch_add(1u);

    // Nothing to write when no address has been configured.
    if (CpuIntrinsicsTests::pauseAddress == nullptr) {
        return;
    }

    *CpuIntrinsicsTests::pauseAddress = CpuIntrinsicsTests::pauseValue;

    // Without a hook, move on to the next address using the configured offset.
    if (!CpuIntrinsicsTests::setupPauseAddress) {
        CpuIntrinsicsTests::pauseAddress = ptrOffset(CpuIntrinsicsTests::pauseAddress, CpuIntrinsicsTests::pauseOffset);
        return;
    }

    // The hook decides what happens to pauseAddress for the next call.
    CpuIntrinsicsTests::setupPauseAddress();
}

// Counts the call in CpuIntrinsicsTests::tpauseCounter.
// Both arguments are ignored and the result is always 0.
uint8_t tpause(uint32_t control, uint64_t counter) {
    CpuIntrinsicsTests::tpauseCounter.fetch_add(1u);
    const uint8_t result = 0;
    return result;
}

// Records the arguments in CpuIntrinsicsTests::lastUmwaitControl and
// lastUmwaitCounter, bumps umwaitCounter, then runs the controlUmwait hook if
// one is set. Returns CpuIntrinsicsTests::umwaitRetValue, which is read after
// the hook has run.
unsigned char umwait(unsigned int ctrl, uint64_t counter) {
    CpuIntrinsicsTests::lastUmwaitControl.store(ctrl);
    CpuIntrinsicsTests::lastUmwaitCounter.store(counter);
    CpuIntrinsicsTests::umwaitCounter.fetch_add(1u);

    if (CpuIntrinsicsTests::controlUmwait) {
        CpuIntrinsicsTests::controlUmwait();
    }
    return CpuIntrinsicsTests::umwaitRetValue;
}

// Remembers the monitored address in CpuIntrinsicsTests::lastUmonitorPtr,
// then counts the call in CpuIntrinsicsTests::umonitorCounter.
void umonitor(void *a) {
    const auto monitoredAddress = reinterpret_cast<uintptr_t>(a);
    CpuIntrinsicsTests::lastUmonitorPtr.store(monitoredAddress);
    CpuIntrinsicsTests::umonitorCounter.fetch_add(1u);
}

// Counts the call in CpuIntrinsicsTests::rdtscCounter and returns the
// value currently held in CpuIntrinsicsTests::rdtscRetValue.
uint64_t rdtsc() {
    CpuIntrinsicsTests::rdtscCounter.fetch_add(1u);
    const uint64_t timestamp = CpuIntrinsicsTests::rdtscRetValue;
    return timestamp;
}

} // namespace CpuIntrinsics
} // namespace NEO