File: scalarize-two-calls.ll

package info (click to toggle)
llvm-toolchain-21 1:21.1.0-1
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 2,235,796 kB
  • sloc: cpp: 7,617,614; ansic: 1,433,901; asm: 1,058,726; python: 252,096; f90: 94,671; objc: 70,753; lisp: 42,813; pascal: 18,401; sh: 10,032; ml: 5,111; perl: 4,720; awk: 3,523; makefile: 3,401; javascript: 2,272; xml: 892; fortran: 770
file content (27 lines) | stat: -rw-r--r-- 1,636 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
; RUN: llc %s -mtriple=dxil-pc-shadermodel6.3-library --filetype=asm -o - | FileCheck %s

; CHECK: target triple = "dxilv1.3-pc-shadermodel6.3-library"
; CHECK-LABEL: cos_sin_float_test
; Chains two vector intrinsics: llvm.sin.v4f32 is applied to %a and its result
; is fed to llvm.cos.v4f32. The FileCheck patterns in the body expect, in this
; order: each lane of %a extracted and passed to dx.op.unary.f32 with opcode 13,
; those four scalar results passed to dx.op.unary.f32 with opcode 12, and a
; <4 x float> rebuilt lane by lane with insertelement, starting from poison.
; NOTE(review): opcodes 13 and 12 are presumably the DXIL Sin and Cos ops,
; matching the sin-then-cos order of the IR below; confirm against the DXIL
; operation table.
define noundef <4 x float> @cos_sin_float_test(<4 x float> noundef %a) #0 {
    ; First stage: one extractelement plus one opcode-13 call per lane of %a.
    ; CHECK: [[ee0:%.*]] = extractelement <4 x float> %a, i32 0
    ; CHECK: [[ie0:%.*]] = call float @dx.op.unary.f32(i32 13, float [[ee0]])
    ; CHECK: [[ee1:%.*]] = extractelement <4 x float> %a, i32 1
    ; CHECK: [[ie1:%.*]] = call float @dx.op.unary.f32(i32 13, float [[ee1]])
    ; CHECK: [[ee2:%.*]] = extractelement <4 x float> %a, i32 2
    ; CHECK: [[ie2:%.*]] = call float @dx.op.unary.f32(i32 13, float [[ee2]])
    ; CHECK: [[ee3:%.*]] = extractelement <4 x float> %a, i32 3
    ; CHECK: [[ie3:%.*]] = call float @dx.op.unary.f32(i32 13, float [[ee3]])
    ; Second stage: the opcode-12 calls consume the first-stage scalars directly
    ; (the captured ie0..ie3), not lanes re-extracted from a rebuilt vector.
    ; CHECK: [[ie4:%.*]] = call float @dx.op.unary.f32(i32 12, float [[ie0]])
    ; CHECK: [[ie5:%.*]] = call float @dx.op.unary.f32(i32 12, float [[ie1]])
    ; CHECK: [[ie6:%.*]] = call float @dx.op.unary.f32(i32 12, float [[ie2]])
    ; CHECK: [[ie7:%.*]] = call float @dx.op.unary.f32(i32 12, float [[ie3]])
    ; Result vector: lanes 0..3 are filled from the second-stage scalars.
    ; CHECK: insertelement <4 x float> poison, float [[ie4]], i32 0
    ; CHECK: insertelement <4 x float> %{{.*}}, float [[ie5]], i32 1
    ; CHECK: insertelement <4 x float> %{{.*}}, float [[ie6]], i32 2
    ; CHECK: insertelement <4 x float> %{{.*}}, float [[ie7]], i32 3
    ; Input IR under test: vector sin of %a, then vector cos of that result.
    %2 = tail call <4 x float> @llvm.sin.v4f32(<4 x float> %a) 
    %3 = tail call <4 x float> @llvm.cos.v4f32(<4 x float> %2) 
    ret <4 x float> %3 
} 

; Attribute group #0, referenced by the definition of @cos_sin_float_test.
attributes #0 = { convergent norecurse nounwind "hlsl.export"}