File: vector_times_matrix.spt

package info (click to toggle)
spirv-llvm-translator-15 15.0.0-2
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 14,028 kB
  • sloc: cpp: 43,715; lisp: 3,497; sh: 153; python: 43; makefile: 26
file content (112 lines) | stat: -rw-r--r-- 5,301 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
119734787 65536 458752 21 0
2 Capability Addresses
2 Capability Linkage
2 Capability Kernel
2 Capability Float64
2 Capability Matrix
3 MemoryModel 2 2
8 EntryPoint 6 20 "vector_times_matrix"
3 Source 3 102000
3 Name 12 "res"
3 Name 13 "lhs"
3 Name 14 "rhs"

2 TypeVoid 5
3 TypeFloat 6 32
4 TypeVector 7 6 4
4 TypeMatrix 8 7 4
4 TypePointer 9 7 8
4 TypePointer 10 7 7
6 TypeFunction 11 5 10 10 9

5 Function 5 20 0 11
3 FunctionParameter 10 12
3 FunctionParameter 10 13
3 FunctionParameter 9 14

2 Label 15
4 Load 7 16 13
4 Load 8 17 14
5 VectorTimesMatrix 7 18 16 17
3 Store 12 18
1 Return

1 FunctionEnd

; RUN: llvm-spirv %s -to-binary -o %t.spv
; RUN: spirv-val %t.spv
; RUN: llvm-spirv -r %t.spv -o %t.bc
; RUN: llvm-dis < %t.bc | FileCheck %s --check-prefix=CHECK-LLVM

; CHECK-LLVM: %1 = load <4 x float>, <4 x float>* %lhs
; CHECK-LLVM: %2 = load [4 x <4 x float>], [4 x <4 x float>]* %rhs
; CHECK-LLVM: %3 = extractelement <4 x float> %1, i32 0
; CHECK-LLVM: %.splatinsert = insertelement <4 x float> poison, float %3, i32 0
; CHECK-LLVM: %.splat = shufflevector <4 x float> %.splatinsert, <4 x float> poison, <4 x i32> zeroinitializer
; CHECK-LLVM: %4 = extractvalue [4 x <4 x float>] %2, 0
; CHECK-LLVM: %5 = extractelement <4 x float> %4, i32 0
; CHECK-LLVM: %6 = insertelement <4 x float> undef, float %5, i32 0
; CHECK-LLVM: %7 = extractvalue [4 x <4 x float>] %2, 1
; CHECK-LLVM: %8 = extractelement <4 x float> %7, i32 0
; CHECK-LLVM: %9 = insertelement <4 x float> %6, float %8, i32 1
; CHECK-LLVM: %10 = extractvalue [4 x <4 x float>] %2, 2
; CHECK-LLVM: %11 = extractelement <4 x float> %10, i32 0
; CHECK-LLVM: %12 = insertelement <4 x float> %9, float %11, i32 2
; CHECK-LLVM: %13 = extractvalue [4 x <4 x float>] %2, 3
; CHECK-LLVM: %14 = extractelement <4 x float> %13, i32 0
; CHECK-LLVM: %15 = insertelement <4 x float> %12, float %14, i32 3
; CHECK-LLVM: %16 = fmul <4 x float> %.splat, %15
; CHECK-LLVM: %17 = fadd <4 x float> zeroinitializer, %16
; CHECK-LLVM: %18 = extractelement <4 x float> %1, i32 1
; CHECK-LLVM: %.splatinsert1 = insertelement <4 x float> poison, float %18, i32 0
; CHECK-LLVM: %.splat2 = shufflevector <4 x float> %.splatinsert1, <4 x float> poison, <4 x i32> zeroinitializer
; CHECK-LLVM: %19 = extractvalue [4 x <4 x float>] %2, 0
; CHECK-LLVM: %20 = extractelement <4 x float> %19, i32 1
; CHECK-LLVM: %21 = insertelement <4 x float> undef, float %20, i32 0
; CHECK-LLVM: %22 = extractvalue [4 x <4 x float>] %2, 1
; CHECK-LLVM: %23 = extractelement <4 x float> %22, i32 1
; CHECK-LLVM: %24 = insertelement <4 x float> %21, float %23, i32 1
; CHECK-LLVM: %25 = extractvalue [4 x <4 x float>] %2, 2
; CHECK-LLVM: %26 = extractelement <4 x float> %25, i32 1
; CHECK-LLVM: %27 = insertelement <4 x float> %24, float %26, i32 2
; CHECK-LLVM: %28 = extractvalue [4 x <4 x float>] %2, 3
; CHECK-LLVM: %29 = extractelement <4 x float> %28, i32 1
; CHECK-LLVM: %30 = insertelement <4 x float> %27, float %29, i32 3
; CHECK-LLVM: %31 = fmul <4 x float> %.splat2, %30
; CHECK-LLVM: %32 = fadd <4 x float> %17, %31
; CHECK-LLVM: %33 = extractelement <4 x float> %1, i32 2
; CHECK-LLVM: %.splatinsert3 = insertelement <4 x float> poison, float %33, i32 0
; CHECK-LLVM: %.splat4 = shufflevector <4 x float> %.splatinsert3, <4 x float> poison, <4 x i32> zeroinitializer
; CHECK-LLVM: %34 = extractvalue [4 x <4 x float>] %2, 0
; CHECK-LLVM: %35 = extractelement <4 x float> %34, i32 2
; CHECK-LLVM: %36 = insertelement <4 x float> undef, float %35, i32 0
; CHECK-LLVM: %37 = extractvalue [4 x <4 x float>] %2, 1
; CHECK-LLVM: %38 = extractelement <4 x float> %37, i32 2
; CHECK-LLVM: %39 = insertelement <4 x float> %36, float %38, i32 1
; CHECK-LLVM: %40 = extractvalue [4 x <4 x float>] %2, 2
; CHECK-LLVM: %41 = extractelement <4 x float> %40, i32 2
; CHECK-LLVM: %42 = insertelement <4 x float> %39, float %41, i32 2
; CHECK-LLVM: %43 = extractvalue [4 x <4 x float>] %2, 3
; CHECK-LLVM: %44 = extractelement <4 x float> %43, i32 2
; CHECK-LLVM: %45 = insertelement <4 x float> %42, float %44, i32 3
; CHECK-LLVM: %46 = fmul <4 x float> %.splat4, %45
; CHECK-LLVM: %47 = fadd <4 x float> %32, %46
; CHECK-LLVM: %48 = extractelement <4 x float> %1, i32 3
; CHECK-LLVM: %.splatinsert5 = insertelement <4 x float> poison, float %48, i32 0
; CHECK-LLVM: %.splat6 = shufflevector <4 x float> %.splatinsert5, <4 x float> poison, <4 x i32> zeroinitializer
; CHECK-LLVM: %49 = extractvalue [4 x <4 x float>] %2, 0
; CHECK-LLVM: %50 = extractelement <4 x float> %49, i32 3
; CHECK-LLVM: %51 = insertelement <4 x float> undef, float %50, i32 0
; CHECK-LLVM: %52 = extractvalue [4 x <4 x float>] %2, 1
; CHECK-LLVM: %53 = extractelement <4 x float> %52, i32 3
; CHECK-LLVM: %54 = insertelement <4 x float> %51, float %53, i32 1
; CHECK-LLVM: %55 = extractvalue [4 x <4 x float>] %2, 2
; CHECK-LLVM: %56 = extractelement <4 x float> %55, i32 3
; CHECK-LLVM: %57 = insertelement <4 x float> %54, float %56, i32 2
; CHECK-LLVM: %58 = extractvalue [4 x <4 x float>] %2, 3
; CHECK-LLVM: %59 = extractelement <4 x float> %58, i32 3
; CHECK-LLVM: %60 = insertelement <4 x float> %57, float %59, i32 3
; CHECK-LLVM: %61 = fmul <4 x float> %.splat6, %60
; CHECK-LLVM: %62 = fadd <4 x float> %47, %61
; CHECK-LLVM: store <4 x float> %62, <4 x float>* %res
; CHECK-LLVM: ret void