File: DivergentBarrierPass.h

package info (click to toggle)
intel-graphics-compiler2 2.16.0-2
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 106,644 kB
  • sloc: cpp: 805,640; lisp: 287,672; ansic: 16,414; python: 3,952; yacc: 2,588; lex: 1,666; pascal: 313; sh: 186; makefile: 35
file content (70 lines) | stat: -rw-r--r-- 2,532 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
/*========================== begin_copyright_notice ============================

Copyright (C) 2021 Intel Corporation

SPDX-License-Identifier: MIT

============================= end_copyright_notice ===========================*/

#pragma once
#include "IGC/common/StringMacros.hpp"
#include "Compiler/CodeGenPublic.h"
#include "Compiler/CISACodeGen/helper.h"
#include "Compiler/MetaDataUtilsWrapper.h"
#include "Compiler/CISACodeGen/WIAnalysis.hpp"

#include "common/LLVMWarningsPush.hpp"
#include <llvm/IR/PassManager.h>
#include "common/LLVMWarningsPop.hpp"

namespace IGC {
// Legacy-pass-manager module pass (derives from llvm::ModulePass).
//
// NOTE(review): judging by the class name and the hasDivergentBarrier()
// helper, this pass deals with barriers that are reached under divergent
// control flow. The implementation lives outside this header, so the exact
// transformation should be confirmed against the .cpp file.
class DivergentBarrierPass : public llvm::ModulePass {
public:
  // Ctx is an opaque pointer that is stored as-is in the Ctx member.
  // The constructor is explicit so that an arbitrary pointer can never be
  // implicitly converted into a pass object; default construction
  // (no arguments) and direct construction from a pointer still work.
  explicit DivergentBarrierPass(void *Ctx = nullptr) : llvm::ModulePass(ID), Ctx(Ctx) {}

  // Pass entry point; defined out of line.
  bool runOnModule(llvm::Module &M) override;

  // Declares the analyses this pass requires: the metadata utilities wrapper
  // and the code-generation context wrapper.
  void getAnalysisUsage(llvm::AnalysisUsage &AU) const override {
    AU.addRequired<MetaDataUtilsWrapper>();
    AU.addRequired<CodeGenContextWrapper>();
  }

  // Pass identification; its address is handed to the llvm::ModulePass base.
  static char ID;

  // Human-readable pass name.
  llvm::StringRef getPassName() const override { return "DivergentBarrierPass"; }

private:
  // Bundle of fence parameters. It is filled in by updateFenceArgs() and
  // consumed by generateBody() and insertFence().
  struct FenceArgs {
    bool CommitEnable = true;
    bool L3_Flush_RW_Data = false;
    bool L3_Flush_Constant_Data = false;
    bool L3_Flush_Texture_Data = false;
    bool L3_Flush_Instructions = false;
    bool Global = false;
    bool L1_Invalidate = false;
    bool L1_Evict = false;
    // Scope starts as GROUP, which should be used for SLM barriers, so that
    // it stays consistent with the Global argument being initialized to false.
    uint Scope = LSC_SCOPE_GROUP;
  };

  // Maps a 64-bit key to a work-item dependency kind.
  // NOTE(review): the key is presumably a spill/fill slot identifier, given
  // the alias name and its use in handleSpillFill() - confirm in the .cpp.
  using SlotDepMap = llvm::DenseMap<uint64_t, WIAnalysis::WIDependancy>;

  // NOTE(review): presumably cached from the required analyses when the pass
  // runs; both are null until then.
  CodeGenContext *m_CGCtx = nullptr;
  IGCMD::MetaDataUtils *m_MDUtils = nullptr;

  // Helper routines, all defined out of line. Their behavior is not visible
  // from this header; consult the implementation file for details.
  bool processShader(llvm::Function *F);
  bool hasDivergentBarrier(const std::vector<llvm::Instruction *> &Barriers, WIAnalysisRunner &WI) const;
  llvm::Function *createContinuation(llvm::BasicBlock *EntryBB);
  void updateFenceArgs(const llvm::GenIntrinsicInst *I, FenceArgs &Args) const;
  void generateBody(llvm::Function *Wrapper, llvm::Function *Entry, const std::vector<llvm::Function *> &Continuations,
                    const FenceArgs &FA);
  llvm::Value *getGroupSize(llvm::Function &F) const;
  llvm::Value *allocateSLM(llvm::IRBuilder<> &IRB);
  llvm::CallInst *insertFence(llvm::IRBuilder<> &IRB, const FenceArgs &FA) const;
  void handleSpillFill(llvm::Function *F, SlotDepMap &depMap);

  // Opaque pointer supplied at construction time; its meaning is not visible
  // in this header.
  void *Ctx = nullptr;
};

// Pass-registry hook for DivergentBarrierPass; defined outside this header.
// NOTE(review): the name follows LLVM's initialize<PassName>Pass convention,
// so the definition is presumably produced by the INITIALIZE_PASS-style
// macros in the .cpp - confirm.
void initializeDivergentBarrierPassPass(llvm::PassRegistry &);
// Factory for the pass; defined outside this header.
// NOTE(review): presumably returns a newly allocated DivergentBarrierPass
// constructed with Ctx. Ownership of the returned pointer and the meaning of
// Ctx are not visible here - confirm against the implementation.
llvm::ModulePass *createDivergentBarrierPass(void *Ctx);
} // namespace IGC