File: BreakdownIntrinsic.cpp

package info (click to toggle)
intel-graphics-compiler2 2.16.0-2
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 106,644 kB
  • sloc: cpp: 805,640; lisp: 287,672; ansic: 16,414; python: 3,952; yacc: 2,588; lex: 1,666; pascal: 313; sh: 186; makefile: 35
file content (65 lines) | stat: -rw-r--r-- 2,499 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
/*========================== begin_copyright_notice ============================

Copyright (C) 2017-2021 Intel Corporation

SPDX-License-Identifier: MIT

============================= end_copyright_notice ===========================*/

#include "Compiler/Optimizer/OpenCLPasses/BreakdownIntrinsic/BreakdownIntrinsic.h"
#include "Compiler/IGCPassSupport.h"
#include "Compiler/CodeGenPublic.h"

#include "common/LLVMWarningsPush.hpp"
#include <llvm/IR/Function.h>
#include "common/LLVMWarningsPop.hpp"

using namespace llvm;
using namespace IGC;
using namespace IGC::IGCMD;

// Register pass to igc-opt
#define PASS_FLAG "breakdown-intrinsics"
#define PASS_DESCRIPTION "Breakdown intrinsics into simpler operations to enable better optimization"
#define PASS_CFG_ONLY false
// This pass rewrites IR (fmuladd/fma calls are replaced by fmul + fadd), so it
// is a transformation and must not be registered as an analysis pass.
#define PASS_ANALYSIS false
IGC_INITIALIZE_PASS_BEGIN(BreakdownIntrinsicPass, PASS_FLAG, PASS_DESCRIPTION, PASS_CFG_ONLY, PASS_ANALYSIS)
IGC_INITIALIZE_PASS_END(BreakdownIntrinsicPass, PASS_FLAG, PASS_DESCRIPTION, PASS_CFG_ONLY, PASS_ANALYSIS)

// Storage for the pass identifier handed to the FunctionPass base constructor.
char BreakdownIntrinsicPass::ID = 0;

// Builds the pass with the change flag cleared and both metadata pointers
// null, then calls initializeBreakdownIntrinsicPassPass on the global
// pass registry.
BreakdownIntrinsicPass::BreakdownIntrinsicPass()
    : FunctionPass(ID),
      m_changed(false),
      m_pMdUtils(nullptr),
      modMD(nullptr) {
  PassRegistry &registry = *PassRegistry::getPassRegistry();
  initializeBreakdownIntrinsicPassPass(registry);
}

// Visitor callback for intrinsic calls: splits a fused multiply-add intrinsic
// into a separate fmul followed by an fadd.
//
// llvm.fmuladd is always split; llvm.fma is split only when the module
// metadata has compOpt.UnsafeMathOptimizations set. Any other intrinsic is
// left untouched. When a split happens the intrinsic call is erased (so `I`
// must not be used afterwards) and m_changed is set.
void BreakdownIntrinsicPass::visitIntrinsicInst(llvm::IntrinsicInst &I) {
  // Named moduleMD (not modMD) so the class member of that name is not shadowed.
  ModuleMetaData &moduleMD = *(getAnalysis<MetaDataUtilsWrapper>().getModuleMetaData());

  const llvm::Intrinsic::ID intrinsicID = I.getIntrinsicID();
  const bool isFMulAdd = intrinsicID == llvm::Intrinsic::fmuladd;
  // For FMA only break it up if unsafe math optimizations are set
  const bool isBreakableFma = intrinsicID == llvm::Intrinsic::fma && moduleMD.compOpt.UnsafeMathOptimizations;
  if (!isFMulAdd && !isBreakableFma)
    return;

  // The builder inserts the replacement instructions right before the call.
  llvm::IRBuilder<> builder(&I);
  llvm::Value *pMulInst = builder.CreateFMul(I.getOperand(0), I.getOperand(1));
  llvm::Value *pAddInst = builder.CreateFAdd(pMulInst, I.getOperand(2));
  I.replaceAllUsesWith(pAddInst);
  I.eraseFromParent();
  m_changed = true;

  // The presence of fmuladd indicates that the fp_contract needs to be set.
  // The code-gen context is only needed on this path, so it is looked up here
  // rather than for every visited intrinsic.
  auto pCtx = getAnalysis<CodeGenContextWrapper>().getCodeGenContext();
  if (pCtx->m_DriverInfo.NeedsBreakdownMulAdd()) {
    moduleMD.compOpt.MadEnable = true;
  }
}

// Runs the intrinsic breakdown over every instruction of F.
//
// Caches the MetaDataUtils pointer in m_pMdUtils, visits F (which dispatches
// to visitIntrinsicInst), and returns true only if this call modified F.
bool BreakdownIntrinsicPass::runOnFunction(llvm::Function &F) {
  // m_changed is otherwise only initialized in the constructor; clear it here
  // so a rewrite made in a previously processed function is not reported as a
  // modification of this one.
  m_changed = false;
  m_pMdUtils = getAnalysis<MetaDataUtilsWrapper>().getMetaDataUtils();
  visit(F);
  return m_changed;
}