File: printf_handler.cpp

package info (click to toggle)
intel-compute-runtime 25.44.36015.8-1
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 79,632 kB
  • sloc: cpp: 931,547; lisp: 2,074; sh: 719; makefile: 162; python: 21
file content (86 lines) | stat: -rw-r--r-- 4,272 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
/*
 * Copyright (C) 2020-2025 Intel Corporation
 *
 * SPDX-License-Identifier: MIT
 *
 */

#include "level_zero/core/source/printf_handler/printf_handler.h"

#include "shared/source/command_stream/command_stream_receiver.h"
#include "shared/source/execution_environment/execution_environment.h"
#include "shared/source/helpers/blit_properties.h"
#include "shared/source/helpers/engine_node_helper.h"
#include "shared/source/memory_manager/allocation_properties.h"
#include "shared/source/memory_manager/memory_manager.h"
#include "shared/source/program/print_formatter.h"

#include "level_zero/core/source/device/device_imp.h"

namespace L0 {

NEO::GraphicsAllocation *PrintfHandler::createPrintfBuffer(Device *device) {
    NEO::AllocationProperties properties(
        device->getRootDeviceIndex(), PrintfHandler::printfBufferSize, NEO::AllocationType::printfSurface, device->getNEODevice()->getDeviceBitfield());
    properties.alignment = MemoryConstants::pageSize64k;
    auto allocation = device->getNEODevice()->getMemoryManager()->allocateGraphicsMemoryWithProperties(properties);

    *reinterpret_cast<uint32_t *>(allocation->getUnderlyingBuffer()) =
        PrintfHandler::printfSurfaceInitialDataSize;
    return allocation;
}

void PrintfHandler::printOutput(const KernelImmutableData *kernelData,
                                NEO::GraphicsAllocation *printfBuffer, Device *device, bool useInternalBlitter) {
    bool using32BitGpuPointers = kernelData->getDescriptor().kernelAttributes.gpuPointerSize == 4u;
    auto usesStringMap = kernelData->getDescriptor().kernelAttributes.usesStringMap();

    auto printfOutputBuffer = static_cast<uint8_t *>(printfBuffer->getUnderlyingBuffer());
    auto printfOutputSize = static_cast<uint32_t>(printfBuffer->getUnderlyingBufferSize());
    std::unique_ptr<uint8_t[]> printfOutputTemporary;

    if (useInternalBlitter) {
        auto selectedDevice = device->getNEODevice()->getNearestGenericSubDevice(0);
        auto &selectorCopyEngine = selectedDevice->getSelectorCopyEngine();
        auto deviceBitfield = selectedDevice->getDeviceBitfield();
        const auto internalUsage = true;
        auto bcsEngineType = NEO::EngineHelpers::getBcsEngineType(selectedDevice->getRootDeviceEnvironment(), deviceBitfield, selectorCopyEngine, internalUsage);
        auto bcsEngineUsage = NEO::EngineUsage::internal;
        auto bcsEngine = selectedDevice->tryGetEngine(bcsEngineType, bcsEngineUsage);

        if (bcsEngine) {
            printfOutputTemporary = std::make_unique<uint8_t[]>(printfOutputSize);
            printfOutputBuffer = printfOutputTemporary.get();

            NEO::BlitPropertiesContainer blitPropertiesContainer;
            blitPropertiesContainer.push_back(
                NEO::BlitProperties::constructPropertiesForReadWrite(BlitterConstants::BlitDirection::bufferToHostPtr,
                                                                     *bcsEngine->commandStreamReceiver, printfBuffer, nullptr,
                                                                     printfOutputBuffer,
                                                                     printfBuffer->getGpuAddress(),
                                                                     0, 0, 0, Vec3<size_t>(printfOutputSize, 0, 0), 0, 0, 0, 0));

            const auto newTaskCount = bcsEngine->commandStreamReceiver->flushBcsTask(blitPropertiesContainer, true, *selectedDevice);
            if (newTaskCount == NEO::CompletionStamp::gpuHang) {
                PRINT_DEBUG_STRING(NEO::debugManager.flags.PrintDebugMessages.get(), stderr, "Failed to copy printf buffer.\n", "");
                printfOutputBuffer = static_cast<uint8_t *>(printfBuffer->getUnderlyingBuffer());
            }
        }
    }

    NEO::PrintFormatter printfFormatter{
        printfOutputBuffer,
        printfOutputSize,
        using32BitGpuPointers,
        usesStringMap ? &kernelData->getDescriptor().kernelMetadata.printfStringsMap : nullptr};
    printfFormatter.printKernelOutput();

    *reinterpret_cast<uint32_t *>(printfBuffer->getUnderlyingBuffer()) =
        PrintfHandler::printfSurfaceInitialDataSize;
}

size_t PrintfHandler::getPrintBufferSize() {
    return PrintfHandler::printfBufferSize;
}

} // namespace L0