1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70
|
/*========================== begin_copyright_notice ============================
Copyright (C) 2021 Intel Corporation
SPDX-License-Identifier: MIT
============================= end_copyright_notice ===========================*/
#pragma once
#include "IGC/common/StringMacros.hpp"
#include "Compiler/CodeGenPublic.h"
#include "Compiler/CISACodeGen/helper.h"
#include "Compiler/MetaDataUtilsWrapper.h"
#include "Compiler/CISACodeGen/WIAnalysis.hpp"
#include "common/LLVMWarningsPush.hpp"
#include <llvm/IR/PassManager.h>
#include "common/LLVMWarningsPop.hpp"
namespace IGC {
/// Module pass (LLVM legacy pass manager) declared for kernels whose barriers
/// may be reached divergently.
///
/// NOTE(review): only the declarations are visible in this header. The
/// per-member summaries below that are marked "presumably" are inferred from
/// names and signatures and must be confirmed against the implementation file.
class DivergentBarrierPass : public llvm::ModulePass {
public:
  /// Constructs the pass and stores the opaque \p Ctx pointer.
  ///
  /// Declared `explicit` so that an unrelated pointer can never be converted
  /// into a pass object implicitly; direct construction with or without an
  /// argument keeps working unchanged.
  explicit DivergentBarrierPass(void *Ctx = nullptr) : llvm::ModulePass(ID), Ctx(Ctx) {}

  /// Pass entry point; returns whether the module was modified (the standard
  /// llvm::ModulePass contract).
  bool runOnModule(llvm::Module &M) override;

  /// Declares the analyses that must be available before this pass runs:
  /// the metadata utilities wrapper and the code-gen context wrapper.
  void getAnalysisUsage(llvm::AnalysisUsage &AU) const override {
    AU.addRequired<MetaDataUtilsWrapper>();
    AU.addRequired<CodeGenContextWrapper>();
  }

  /// Pass identification token; its address is what the pass infrastructure
  /// uses, so it is defined once in the implementation file.
  static char ID;

  /// Human-readable name reported for this pass.
  llvm::StringRef getPassName() const override { return "DivergentBarrierPass"; }

private:
  /// Set of fence options, each starting at the default shown here.
  /// The flags are filled in by updateFenceArgs() and consumed by
  /// insertFence() / generateBody(); the exact hardware meaning of every flag
  /// is defined by the fence intrinsic and is not visible in this header.
  struct FenceArgs {
    bool CommitEnable = true;
    bool L3_Flush_RW_Data = false;
    bool L3_Flush_Constant_Data = false;
    bool L3_Flush_Texture_Data = false;
    bool L3_Flush_Instructions = false;
    bool Global = false;
    bool L1_Invalidate = false;
    bool L1_Evict = false;
    // Scope starts as GROUP, the scope that should be used for SLM barriers,
    // so that it stays consistent with Global being initialized to false.
    uint Scope = LSC_SCOPE_GROUP;
  };

  /// Maps a 64-bit slot key to a work-item dependency classification.
  /// NOTE(review): what the key identifies (offset, index, ...) is decided by
  /// handleSpillFill() in the implementation file - confirm there.
  using SlotDepMap = llvm::DenseMap<uint64_t, WIAnalysis::WIDependancy>;

  /// Code-gen context; null until assigned by the implementation
  /// (presumably from CodeGenContextWrapper in runOnModule - TODO confirm).
  CodeGenContext *m_CGCtx = nullptr;

  /// Metadata utilities; null until assigned by the implementation
  /// (presumably from MetaDataUtilsWrapper in runOnModule - TODO confirm).
  IGCMD::MetaDataUtils *m_MDUtils = nullptr;

  /// Processes a single function; presumably returns true when \p F was
  /// changed - TODO confirm.
  bool processShader(llvm::Function *F);

  /// Reports whether any instruction in \p Barriers is considered divergent
  /// according to \p WI (presumably; the criterion lives in the .cpp).
  bool hasDivergentBarrier(const std::vector<llvm::Instruction *> &Barriers, WIAnalysisRunner &WI) const;

  /// Creates a new function starting from \p EntryBB and returns it.
  /// NOTE(review): how the block is split out is not visible here.
  llvm::Function *createContinuation(llvm::BasicBlock *EntryBB);

  /// Updates \p Args from the intrinsic call \p I; does not modify the pass
  /// object itself (const member).
  void updateFenceArgs(const llvm::GenIntrinsicInst *I, FenceArgs &Args) const;

  /// Emits the body of \p Wrapper using \p Entry, the list of
  /// \p Continuations and the fence options \p FA.
  /// NOTE(review): the dispatch scheme is defined in the .cpp - confirm.
  void generateBody(llvm::Function *Wrapper, llvm::Function *Entry, const std::vector<llvm::Function *> &Continuations,
                    const FenceArgs &FA);

  /// Returns a value representing the group size for \p F (presumably the
  /// work-group size - TODO confirm).
  llvm::Value *getGroupSize(llvm::Function &F) const;

  /// Returns a value referring to storage obtained through \p IRB
  /// (presumably shared local memory, judging by the name - TODO confirm).
  llvm::Value *allocateSLM(llvm::IRBuilder<> &IRB);

  /// Inserts a fence call configured by \p FA through \p IRB and returns the
  /// created call instruction.
  llvm::CallInst *insertFence(llvm::IRBuilder<> &IRB, const FenceArgs &FA) const;

  /// Spill/fill handling for \p F that reads and/or updates \p depMap.
  /// NOTE(review): details are only in the implementation file.
  void handleSpillFill(llvm::Function *F, SlotDepMap &depMap);

  /// Opaque pointer supplied at construction; its use is not visible in this
  /// header.
  void *Ctx = nullptr;
};
// Registration hook taking the pass registry. Only declared here;
// presumably defined by the pass-initialization macros in the implementation
// file - TODO confirm.
void initializeDivergentBarrierPassPass(llvm::PassRegistry &);
// Factory returning a module pass for the given opaque Ctx pointer.
// NOTE(review): presumably returns a newly allocated DivergentBarrierPass
// constructed with Ctx; ownership is expected to pass to the caller / pass
// manager - confirm against the definition.
llvm::ModulePass *createDivergentBarrierPass(void *Ctx);
} // namespace IGC
|