File: HandleFRemInstructions.cpp

package info (click to toggle)
intel-graphics-compiler2 2.16.0-2
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 106,644 kB
  • sloc: cpp: 805,640; lisp: 287,672; ansic: 16,414; python: 3,952; yacc: 2,588; lex: 1,666; pascal: 313; sh: 186; makefile: 35
file content (100 lines) | stat: -rw-r--r-- 3,709 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
/*========================== begin_copyright_notice ============================

Copyright (C) 2019-2021 Intel Corporation

SPDX-License-Identifier: MIT

============================= end_copyright_notice ===========================*/

#include "Compiler/HandleFRemInstructions.hpp"
#include "common/LLVMWarningsPush.hpp"
#include <llvm/IR/Module.h>
#include <llvm/IR/Instructions.h>
#include <llvm/Transforms/Utils/BasicBlockUtils.h>
#include "llvmWrapper/IR/DerivedTypes.h"
#include "common/LLVMWarningsPop.hpp"
#include "Compiler/IGCPassSupport.h"
#include "Probe/Assertion.h"

using namespace llvm;
using namespace IGC;

// Parameters handed to the IGC pass-registration macros below.
// PASS_FLAG is the pass's short string identifier and PASS_DESCRIPTION its
// human-readable summary.
#define PASS_FLAG "igc-handle-frem-inst"
#define PASS_DESCRIPTION "Replace FRem instructions with proper builtin calls"
// NOTE(review): presumably these two follow the LLVM INITIALIZE_PASS
// "CFG only" / "is analysis" arguments - confirm against IGCPassSupport.h.
#define PASS_CFG_ONLY false
#define PASS_ANALYSIS false
// No dependencies are declared between BEGIN and END.
// NOTE(review): these macros presumably define
// initializeHandleFRemInstructionsPass(), which the constructor calls - confirm.
IGC_INITIALIZE_PASS_BEGIN(HandleFRemInstructions, PASS_FLAG, PASS_DESCRIPTION, PASS_CFG_ONLY, PASS_ANALYSIS)
IGC_INITIALIZE_PASS_END(HandleFRemInstructions, PASS_FLAG, PASS_DESCRIPTION, PASS_CFG_ONLY, PASS_ANALYSIS)

// Storage for the pass identifier that the constructor forwards to ModulePass.
char HandleFRemInstructions::ID = 0;

/// Constructs the pass as a ModulePass identified by `ID` and runs the pass
/// initializer against the registry returned by PassRegistry::getPassRegistry().
HandleFRemInstructions::HandleFRemInstructions() : ModulePass(ID) {
  PassRegistry &Registry = *PassRegistry::getPassRegistry();
  initializeHandleFRemInstructionsPass(Registry);
}

/// Replaces one `frem` instruction with a call to the matching builtin.
///
/// The callee is named `__builtin_spirv_OpFRem_<T>_<T>`, where `<T>` is an
/// optional vector prefix (`v2`, `v3`, `v4`, `v8`, `v16`) followed by the
/// floating point width (`f16`, `f32`, `f64`). The declaration is obtained
/// from (or inserted into) `m_module`.
///
/// bfloat operands have no builtin of their own: both operands are extended
/// to float (scalar or vector of the same width), the `f32` builtin is
/// called, and the result is truncated back to the original operand type.
///
/// Unsupported scalar types and vector widths trigger an assertion. If the
/// assertion does not stop execution (NOTE(review): presumably the case when
/// IGC assertions are compiled out - confirm), the function returns without
/// modifying the IR instead of emitting a call to a malformed or mismatched
/// builtin name.
///
/// \param I the `frem` instruction to replace; it is erased on success.
void HandleFRemInstructions::visitFRem(llvm::BinaryOperator &I) {
  Value *Val1 = I.getOperand(0);
  Value *Val2 = I.getOperand(1);
  Type *const OrigType = Val1->getType();
  Type *const ScalarType = OrigType->getScalarType();

  IGC_ASSERT_MESSAGE(Val1->getType() == Val2->getType(), "Operands of frem instruction must have same type");
  IGC_ASSERT_MESSAGE(ScalarType->isFloatingPointTy(), "Operands of frem instruction must have floating point type");

  // --- Validation phase: nothing below this comment touches the IR until
  // --- both the element type and the vector width are known to be supported.
  const bool IsBFloat = IGCLLVM::isBFloatTy(ScalarType);

  std::string FpTypeStr;
  if (ScalarType->isHalfTy() || ScalarType->isFloatTy() || ScalarType->isDoubleTy()) {
    FpTypeStr = "f" + std::to_string(ScalarType->getScalarSizeInBits());
  } else if (IsBFloat) {
    // bfloat is computed through the float builtin.
    FpTypeStr = "f32";
  } else {
    IGC_ASSERT_MESSAGE(0, "Unsupported type");
    return;
  }

  std::string VecStr;
  unsigned VecCount = 0;
  if (OrigType->isVectorTy()) {
    VecCount = static_cast<unsigned>(cast<IGCLLVM::FixedVectorType>(OrigType)->getNumElements());
    const bool IsSupportedWidth =
        VecCount == 2 || VecCount == 3 || VecCount == 4 || VecCount == 8 || VecCount == 16;
    if (!IsSupportedWidth) {
      IGC_ASSERT_MESSAGE(0, "Unsupported vector size");
      return;
    }
    VecStr = "v" + std::to_string(VecCount);
  }

  // --- Rewrite phase.
  // Type used for the builtin's parameters and return value.
  Type *CallType = OrigType;
  if (IsBFloat) {
    Type *FloatTy = Type::getFloatTy(I.getContext());
    CallType = OrigType->isVectorTy() ? IGCLLVM::FixedVectorType::get(FloatTy, VecCount) : FloatTy;

    // Extend both operands right before the frem so the call can consume them.
    auto Val1Float = new FPExtInst(Val1, CallType, "", &I);
    Val1Float->setDebugLoc(I.getDebugLoc());
    auto Val2Float = new FPExtInst(Val2, CallType, "", &I);
    Val2Float->setDebugLoc(I.getDebugLoc());
    Val1 = Val1Float;
    Val2 = Val2Float;
  }

  SmallVector<Type *, 2> ArgsTypes{CallType, CallType};
  const std::string TypeStr = "_" + VecStr + FpTypeStr;
  const std::string FuncName = "__builtin_spirv_OpFRem" + TypeStr + TypeStr;
  auto FT = FunctionType::get(CallType, ArgsTypes, false);
  auto Callee = m_module->getOrInsertFunction(FuncName, FT);
  SmallVector<Value *, 2> FuncArgs{Val1, Val2};
  Instruction *NewFRem = CallInst::Create(Callee, FuncArgs, "");
  if (IsBFloat) {
    // The float call is an intermediate value: place it explicitly, then make
    // the truncation back to the original type the instruction that replaces I.
    NewFRem->insertBefore(&I);
    NewFRem->setDebugLoc(I.getDebugLoc());
    NewFRem = new FPTruncInst(NewFRem, OrigType);
  }
  ReplaceInstWithInst(&I, NewFRem);
  m_changed = true;
}

/// Pass entry point: processes module \p M and reports whether it was modified.
///
/// `m_module` points at \p M only for the duration of the traversal, so that
/// visitFRem can look up or insert builtin declarations; it is cleared again
/// before returning.
///
/// \param M module to process.
/// \return the value of `m_changed`, which visitFRem sets to true whenever it
///         replaces an instruction.
bool HandleFRemInstructions::runOnModule(llvm::Module &M) {
  // Reset per-run state before walking the module.
  m_module = &M;
  m_changed = false;

  // NOTE(review): presumably the InstVisitor traversal that dispatches to
  // visitFRem - the class declaration is not visible in this file.
  visit(M);

  // Drop the module pointer so it is not retained after this run.
  m_module = nullptr;

  return m_changed;
}