File: ModuleSplitter.cpp

package info (click to toggle)
intel-graphics-compiler 1.0.12504.6-1%2Bdeb12u1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 83,912 kB
  • sloc: cpp: 910,147; lisp: 202,655; ansic: 15,197; python: 4,025; yacc: 2,241; lex: 1,570; pascal: 244; sh: 104; makefile: 25
file content (113 lines) | stat: -rw-r--r-- 3,376 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
/*========================== begin_copyright_notice ============================

Copyright (C) 2021 Intel Corporation

SPDX-License-Identifier: MIT

============================= end_copyright_notice ===========================*/

#include "common/LLVMWarningsPush.hpp"
#include <llvm/ADT/SetVector.h>
#include <llvm/IR/InstIterator.h>
#include <llvm/Transforms/Utils/Cloning.h>
#include <llvm/Transforms/IPO.h>
#include "common/LLVMWarningsPop.hpp"

#include <common/LLVMUtils.h>
#include <common/ModuleSplitter.h>
#include <Compiler/CodeGenPublic.h>

namespace IGC {
// Sets up a splitter for the given OpenCL program context and source module.
// The splitter starts without a split module; one is only produced by
// splitModuleForKernel().
KernelModuleSplitter::KernelModuleSplitter(
    IGC::OpenCLProgramContext &oclContext, llvm::Module &module)
    : _oclContext(oclContext),
      _originalModule(module),
      _splittedModule(nullptr)
{
}

// On destruction, point the OpenCL context back at the original module.
// restoreOclContextModule() does nothing when no split module is held.
KernelModuleSplitter::~KernelModuleSplitter()
{
    restoreOclContextModule();
}

// Builds a reduced copy of the original module for a single kernel and stores
// it as the current split module.
//
// The copy keeps the definitions of:
//   - kernelF itself,
//   - every defined function reachable from kernelF through direct calls
//     (call sites whose getCalledFunction() is null are not followed),
//   - every global variable of the original module.
// A small cleanup pipeline then removes whatever ended up unused.
//
// kernelF must not be null (enforced by IGC_ASSERT_EXIT_MESSAGE).
//
// NOTE(review): this only stores the new module; it does not touch the module
// registered in the OCL context. Presumably callers follow up with
// setSplittedModuleInOCLContext() - confirm.
void KernelModuleSplitter::splitModuleForKernel(const llvm::Function* kernelF) {
    using namespace llvm;
    IGC_ASSERT_EXIT_MESSAGE(kernelF != nullptr, "Cannot split for null function!");

    // Values whose definitions must survive the clone, and the stack of
    // functions whose bodies still have to be scanned for calls.
    SetVector<const GlobalValue*> keptValues;
    std::vector<const Function*> pending;

    // Seed the traversal with the kernel itself.
    keptValues.insert(kernelF);
    pending.push_back(kernelF);

    // Walk the direct-call graph starting at the kernel.
    while (!pending.empty())
    {
        const Function* current = pending.back();
        pending.pop_back();

        for (const auto& inst : instructions(current))
        {
            const auto* call = dyn_cast<CallBase>(&inst);
            if (call == nullptr)
                continue;

            const Function* callee = call->getCalledFunction();
            if (callee == nullptr || callee->isDeclaration())
                continue;

            // insert() reports whether the callee is new; only newly seen
            // definitions need their own calls scanned.
            if (keptValues.insert(callee))
                pending.push_back(callee);
        }
    }

    // Keep every global variable: letting the cleanup passes drop the unused
    // ones is simpler than working out here which ones are referenced.
    for (const auto& global : _originalModule.globals()) {
        keptValues.insert(&global);
    }

    // Clone the module, keeping definitions only for the selected values.
    const auto shouldKeepDefinition = [&keptValues](const GlobalValue* GV) {
        return keptValues.count(GV) != 0;
    };
    ValueToValueMapTy VMap;
    std::unique_ptr<Module> kernelM =
        CloneModule(_originalModule, VMap, shouldKeepDefinition);
    IGC_ASSERT_EXIT_MESSAGE(kernelM, "Cloning module failed!");

    // Strip what the clone no longer needs.
    IGC::IGCPassManager mpm(&_oclContext, "CleanupAfterModuleSplitting");
    mpm.add(createGlobalDCEPass());           // unreachable globals
    mpm.add(createStripDeadDebugInfoPass());  // dead debug info
    mpm.add(createStripDeadPrototypesPass()); // dead function declarations
    mpm.run(*kernelM);

    _splittedModule = std::move(kernelM);
}

// Discards the current split module, if any: first points the OpenCL context
// back at the original module, then destroys the split module. Does nothing
// when no split module is held.
void KernelModuleSplitter::retry()
{
    if (!_splittedModule)
        return;

    // Restore first: restoreOclContextModule() only acts while the split
    // module is still held.
    restoreOclContextModule();

    // Let the smart pointer destroy the module instead of a manual
    // release-and-delete.
    _splittedModule.reset();
}

// Makes the OpenCL context use the original module again. Calls clearMD() on
// the context before switching the module. Does nothing when no split module
// is held.
void KernelModuleSplitter::restoreOclContextModule()
{
    if (!_splittedModule)
        return;

    _oclContext.clearMD();
    _oclContext.setModule(&_originalModule);
}

// Makes the OpenCL context use the current split module. Calls clearMD() on
// the context before switching the module. Does nothing when no split module
// is held.
void KernelModuleSplitter::setSplittedModuleInOCLContext()
{
    if (!_splittedModule)
        return;

    _oclContext.clearMD();
    _oclContext.setModule(_splittedModule.get());
}
} // namespace IGC