File: LegalizationPass.hpp

package info (click to toggle)
intel-graphics-compiler2 2.16.0-2
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 106,644 kB
  • sloc: cpp: 805,640; lisp: 287,672; ansic: 16,414; python: 3,952; yacc: 2,588; lex: 1,666; pascal: 313; sh: 186; makefile: 35
file content (105 lines) | stat: -rw-r--r-- 3,744 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
/*========================== begin_copyright_notice ============================

Copyright (C) 2017-2024 Intel Corporation

SPDX-License-Identifier: MIT

============================= end_copyright_notice ===========================*/

#pragma once

#include "Compiler/MetaDataUtilsWrapper.h"
#include "Compiler/CodeGenContextWrapper.hpp"

#include "common/LLVMWarningsPush.hpp"
#include <llvm/Pass.h>
#include <llvm/IR/DataLayout.h>
#include <llvm/IR/Function.h>
#include <llvm/IR/InstVisitor.h>
#include <llvm/IR/IRBuilder.h>
#include "common/LLVMWarningsPop.hpp"

// Forward declaration of IGC::CodeGenContext. This header only uses the type
// through a pointer (see Legalization::m_ctx below).
namespace IGC {
class CodeGenContext;
}

namespace IGC {
/// \brief Function pass named "Legalization Pass".
///
/// The class is both an llvm::FunctionPass and an
/// llvm::InstVisitor<Legalization>; the visit*() members below are the
/// per-instruction (and per-basic-block) visitor hooks. All of them are
/// defined out of line, so their exact rewrites are not visible from this
/// header.
class Legalization : public llvm::FunctionPass, public llvm::InstVisitor<Legalization> {
  // NOTE(review): presumably set from the constructor's `preserveNan`
  // argument - confirm in the .cpp. Defaulted here so the member is never
  // indeterminate, matching the other in-class initializers below.
  bool m_preserveNan = false;

  // With the option "-finite-math-only", IGC ignores all NaNs but still keeps
  // isnan checks; that is, isnan is honored even in fast mode. We also
  // *assume* that every isnan check has been lowered into one of these forms:
  //   %b = fcmp uno float %x, 0.000000e+00
  //   %b = fcmp une float %x, %x
  // Any other form will be optimized away. This is a less-than-ideal
  // workaround meant to limit the scope of the change. The proper fix is to
  // keep the isnan check as an intrinsic call, but that requires rewriting
  // the OCL builtins.
  bool m_preserveNanCheck = false;

  // Data layout pointer; null until assigned by the implementation.
  const llvm::DataLayout *m_DL = nullptr;
  // NOTE(review): by its name, a list of instructions queued for removal -
  // confirm where it is drained in the .cpp.
  std::vector<llvm::Instruction *> m_instructionsToRemove;
  llvm::IRBuilder<> *m_builder = nullptr;
  IGC::CodeGenContext *m_ctx = nullptr;

public:
  /// Pass identification.
  static char ID;

  /// \param preserveNan Defaults to false. NOTE(review): presumably stored
  /// in m_preserveNan - the definition is not in this header.
  Legalization(bool preserveNan = false);

  ~Legalization() override = default;

  /// Declares MetaDataUtilsWrapper and CodeGenContextWrapper as required
  /// analyses of this pass.
  void getAnalysisUsage(llvm::AnalysisUsage &AU) const override {
    AU.addRequired<MetaDataUtilsWrapper>();
    AU.addRequired<CodeGenContextWrapper>();
  }

  /// Pass entry point; defined out of line.
  bool runOnFunction(llvm::Function &F) override;

  llvm::StringRef getPassName() const override { return "Legalization Pass"; }

  // InstVisitor hooks, one per handled IR construct.
  void visitInstruction(llvm::Instruction &I);
  void visitCallInst(llvm::CallInst &I);
  void visitSelectInst(llvm::SelectInst &I);
  void visitPHINode(llvm::PHINode &I);
  void visitICmpInst(llvm::ICmpInst &IC);
  void visitFCmpInst(llvm::FCmpInst &FC);
  // The "Undordered" spelling in the next two names is part of the existing
  // interface and is kept as-is for compatibility with the definitions.
  void visitFCmpInstUndorderedPredicate(llvm::FCmpInst &FC);
  void visitFCmpInstUndorderedFlushNan(llvm::FCmpInst &FC);
  void visitInsertElementInst(llvm::InsertElementInst &I);
  void visitShuffleVectorInst(llvm::ShuffleVectorInst &I);
  void visitStoreInst(llvm::StoreInst &I);
  void visitLoadInst(llvm::LoadInst &I);
  void visitAlloca(llvm::AllocaInst &I);
  void visitIntrinsicInst(llvm::IntrinsicInst &I);
  void visitBitCastInst(llvm::BitCastInst &I);
  void visitBasicBlock(llvm::BasicBlock &BB);
  void visitTruncInst(llvm::TruncInst &);
  void visitUnaryInstruction(llvm::UnaryInstruction &I);
  void visitBinaryOperator(llvm::BinaryOperator &I);
  void visitAddrSpaceCastInst(llvm::AddrSpaceCastInst &);

protected:
  // Helpers used by the visitor hooks; all defined out of line.
  llvm::Value *addFCmpWithORD(llvm::FCmpInst &FC);
  llvm::Value *addFCmpWithUNO(llvm::FCmpInst &FC);
  llvm::Value *findInsert(llvm::Value *vector, unsigned int index);
  llvm::Type *LegalAllocaType(llvm::Type *type) const;
  llvm::Type *LegalStructAllocaType(llvm::Type *type) const;

  void RecursivelyChangePointerType(llvm::Instruction *oldPtr, llvm::Type *Ty, llvm::Instruction *newPtr);
  void PromoteFp16ToFp32OnGenSampleCall(llvm::CallInst &I);
  void PromoteInsertElement(llvm::Value *I, llvm::Value *newVec);

  /// \brief Ensure a function has a unique return instruction.
  void unifyReturnInsts(llvm::Function &F);

private:
  // Value-to-value map. NOTE(review): the name suggests it tracks
  // floating-point replacement values - confirm against the .cpp.
  llvm::DenseMap<llvm::Value *, llvm::Value *> fpMap;
};

/// \brief Factory for the pass that legalizes IR coming out of LLVM
/// optimization passes (such as GVN).
/// \return Pointer to an llvm::FunctionPass. The definition is not in this
/// header. NOTE(review): ownership presumably passes to the caller / pass
/// manager - confirm at the definition.
llvm::FunctionPass *createGenOptLegalizer();

/// \brief Factory for the pass that emulates FDIV instructions.
/// \return Pointer to an llvm::FunctionPass. The definition is not in this
/// header. NOTE(review): ownership presumably passes to the caller / pass
/// manager - confirm at the definition.
llvm::FunctionPass *createGenFDIVEmulation();

} // namespace IGC