File: fma.ll

package info (click to toggle)
intel-graphics-compiler 1.0.17791.18-1
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 102,312 kB
  • sloc: cpp: 935,343; lisp: 286,143; ansic: 16,196; python: 3,279; yacc: 2,487; lex: 1,642; pascal: 300; sh: 174; makefile: 27
file content (23 lines) | stat: -rw-r--r-- 1,250 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
;=========================== begin_copyright_notice ============================
;
; Copyright (C) 2023 Intel Corporation
;
; SPDX-License-Identifier: MIT
;
;============================ end_copyright_notice =============================

; RUN: %opt %use_old_pass_manager% -GenXLegalization -march=genx64 -mcpu=XeHPG -mtriple=spir64-unknown-unknown -S < %s | FileCheck %s
; RUN: %opt %use_old_pass_manager% -GenXLegalization -march=genx64 -mcpu=XeHPC -mtriple=spir64-unknown-unknown -S < %s | FileCheck --check-prefix=CHECK-WIDE %s

; Module-level target description for the test input.
; Data layout string: little-endian ("e"), 64-bit pointers with 64-bit
; alignment ("p:64:64"), i64 aligned to 64 bits ("i64:64"), and native integer
; widths of 8, 16 and 32 bits ("n8:16:32").
target datalayout = "e-p:64:64-i64:64-n8:16:32"
; NOTE(review): the module declares a genx64 triple here, while both opt
; command lines at the top of the file pass -mtriple=spir64-unknown-unknown.
; Presumably the command-line value is the one the pass sees; confirm.
target triple = "genx64-unknown-unknown"

; Fused multiply-add intrinsic, overloaded on <32 x float>. This is the only
; operation the test function below performs.
declare <32 x float> @llvm.fma.v32f32(<32 x float>, <32 x float>, <32 x float>)

; Test input: one 32-wide float fma whose result is returned directly.
; The two opt invocations at the top of the file run GenXLegalization on this
; function with different -mcpu values and verify different outputs:
;   * -mcpu=XeHPG, default check prefix: two 16-wide fma calls are expected.
;   * -mcpu=XeHPC, CHECK-WIDE prefix: the 32-wide call is expected as written.
define <32 x float> @test(<32 x float> %a, <32 x float> %b, <32 x float> %c) {
  ; Default prefix: two <16 x float> fma calls must appear, in this order.
  ; Operand names are wildcarded (any text up to the next ',' or ')'), so the
  ; checks do not depend on how the pass names the values it creates. Other
  ; output lines may appear before, between and after the two matches.
  ; CHECK: call <16 x float> @llvm.fma.v16f32(<16 x float> %{{[^,]+}}, <16 x float> %{{[^,]+}}, <16 x float> %{{[^)]+}})
  ; CHECK: call <16 x float> @llvm.fma.v16f32(<16 x float> %{{[^,]+}}, <16 x float> %{{[^,]+}}, <16 x float> %{{[^)]+}})
  ; Wide prefix: the call must be present with its original result name and
  ; its original operands %a, %b and %c.
  ; CHECK-WIDE: %r = call <32 x float> @llvm.fma.v32f32(<32 x float> %a, <32 x float> %b, <32 x float> %c)
  %r = call <32 x float> @llvm.fma.v32f32(<32 x float> %a, <32 x float> %b, <32 x float> %c)
  ret <32 x float> %r
}