; Register-usage test for the AMDGPU GCN iterative machine schedulers.
; Each llc invocation below picks a scheduler with -misched (gcn-iterative-minreg
; or gcn-iterative-max-occupancy-experimental) for -mcpu=tahiti or -mcpu=fiji, and
; FileCheck then bounds the NumSgprs / NumVgprs values reported for the kernel.
; RUN: llc -march=amdgcn -mcpu=tahiti -enable-amdgpu-aa=0 -misched=gcn-iterative-minreg -verify-machineinstrs < %s | FileCheck --check-prefix=SI-MINREG %s
; RUN: llc -march=amdgcn -mcpu=tahiti -enable-amdgpu-aa=0 -misched=gcn-iterative-max-occupancy-experimental -verify-machineinstrs < %s | FileCheck --check-prefix=SI-MAXOCC %s
; RUN: llc -march=amdgcn -mcpu=fiji -enable-amdgpu-aa=0 -misched=gcn-iterative-minreg -verify-machineinstrs < %s | FileCheck --check-prefix=VI %s
; RUN: llc -march=amdgcn -mcpu=fiji -enable-amdgpu-aa=0 -misched=gcn-iterative-max-occupancy-experimental -verify-machineinstrs < %s | FileCheck --check-prefix=VI %s
; SI-MINREG: NumSgprs: {{[1-9]$}}
; SI-MINREG: NumVgprs: {{[1-9]$}}
; SI-MAXOCC: NumSgprs: {{[1-4]?[0-9]$}}
; SI-MAXOCC: NumVgprs: {{[1-4]?[0-9]$}}
; stores may alias loads
; VI: NumSgprs: {{[0-9]$}}
; VI: NumVgprs: {{[1-3][0-9]$}}
; Kernel under test. It reads 30 (a, b, c) float triples through %in_arg
; (addrspace(3)), computes llvm.fmuladd(a, b, c) for each triple, and writes the
; 30 results through %out_arg (addrspace(1)) at every second float slot.
;
; In source order the body has four phases: all 90 input addresses, all 90
; loads, all 30 fmuladd calls, then the 29 output addresses and the 30 stores.
; NOTE(review): this phase ordering presumably matters to the schedulers being
; exercised by this test; confirm before reordering or simplifying anything.
define amdgpu_kernel void @load_fma_store(ptr addrspace(3) nocapture readonly %in_arg, ptr addrspace(1) nocapture %out_arg) {
bb:
; Phase 1: input addresses, expressed as float-element offsets from %in_arg.
; For triple i: a.i = 20004 + 768*i, b.i = a.i + 248, c.i = a.i + 504.
%adr.a.0 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 20004
%adr.b.0 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 20252
%adr.c.0 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 20508
%adr.a.1 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 20772
%adr.b.1 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 21020
%adr.c.1 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 21276
%adr.a.2 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 21540
%adr.b.2 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 21788
%adr.c.2 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 22044
%adr.a.3 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 22308
%adr.b.3 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 22556
%adr.c.3 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 22812
%adr.a.4 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 23076
%adr.b.4 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 23324
%adr.c.4 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 23580
%adr.a.5 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 23844
%adr.b.5 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 24092
%adr.c.5 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 24348
%adr.a.6 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 24612
%adr.b.6 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 24860
%adr.c.6 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 25116
%adr.a.7 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 25380
%adr.b.7 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 25628
%adr.c.7 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 25884
%adr.a.8 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 26148
%adr.b.8 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 26396
%adr.c.8 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 26652
%adr.a.9 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 26916
%adr.b.9 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 27164
%adr.c.9 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 27420
%adr.a.10 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 27684
%adr.b.10 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 27932
%adr.c.10 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 28188
%adr.a.11 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 28452
%adr.b.11 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 28700
%adr.c.11 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 28956
%adr.a.12 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 29220
%adr.b.12 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 29468
%adr.c.12 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 29724
%adr.a.13 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 29988
%adr.b.13 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 30236
%adr.c.13 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 30492
%adr.a.14 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 30756
%adr.b.14 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 31004
%adr.c.14 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 31260
%adr.a.15 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 31524
%adr.b.15 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 31772
%adr.c.15 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 32028
%adr.a.16 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 32292
%adr.b.16 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 32540
%adr.c.16 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 32796
%adr.a.17 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 33060
%adr.b.17 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 33308
%adr.c.17 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 33564
%adr.a.18 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 33828
%adr.b.18 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 34076
%adr.c.18 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 34332
%adr.a.19 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 34596
%adr.b.19 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 34844
%adr.c.19 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 35100
%adr.a.20 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 35364
%adr.b.20 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 35612
%adr.c.20 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 35868
%adr.a.21 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 36132
%adr.b.21 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 36380
%adr.c.21 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 36636
%adr.a.22 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 36900
%adr.b.22 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 37148
%adr.c.22 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 37404
%adr.a.23 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 37668
%adr.b.23 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 37916
%adr.c.23 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 38172
%adr.a.24 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 38436
%adr.b.24 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 38684
%adr.c.24 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 38940
%adr.a.25 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 39204
%adr.b.25 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 39452
%adr.c.25 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 39708
%adr.a.26 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 39972
%adr.b.26 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 40220
%adr.c.26 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 40476
%adr.a.27 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 40740
%adr.b.27 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 40988
%adr.c.27 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 41244
%adr.a.28 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 41508
%adr.b.28 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 41756
%adr.c.28 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 42012
%adr.a.29 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 42276
%adr.b.29 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 42524
%adr.c.29 = getelementptr inbounds float, ptr addrspace(3) %in_arg, i32 42780
; Phase 2: load every a/b/c operand (4-byte-aligned float loads). All 90 loads
; appear before the first use of any loaded value.
%a.0 = load float, ptr addrspace(3) %adr.a.0, align 4
%b.0 = load float, ptr addrspace(3) %adr.b.0, align 4
%c.0 = load float, ptr addrspace(3) %adr.c.0, align 4
%a.1 = load float, ptr addrspace(3) %adr.a.1, align 4
%b.1 = load float, ptr addrspace(3) %adr.b.1, align 4
%c.1 = load float, ptr addrspace(3) %adr.c.1, align 4
%a.2 = load float, ptr addrspace(3) %adr.a.2, align 4
%b.2 = load float, ptr addrspace(3) %adr.b.2, align 4
%c.2 = load float, ptr addrspace(3) %adr.c.2, align 4
%a.3 = load float, ptr addrspace(3) %adr.a.3, align 4
%b.3 = load float, ptr addrspace(3) %adr.b.3, align 4
%c.3 = load float, ptr addrspace(3) %adr.c.3, align 4
%a.4 = load float, ptr addrspace(3) %adr.a.4, align 4
%b.4 = load float, ptr addrspace(3) %adr.b.4, align 4
%c.4 = load float, ptr addrspace(3) %adr.c.4, align 4
%a.5 = load float, ptr addrspace(3) %adr.a.5, align 4
%b.5 = load float, ptr addrspace(3) %adr.b.5, align 4
%c.5 = load float, ptr addrspace(3) %adr.c.5, align 4
%a.6 = load float, ptr addrspace(3) %adr.a.6, align 4
%b.6 = load float, ptr addrspace(3) %adr.b.6, align 4
%c.6 = load float, ptr addrspace(3) %adr.c.6, align 4
%a.7 = load float, ptr addrspace(3) %adr.a.7, align 4
%b.7 = load float, ptr addrspace(3) %adr.b.7, align 4
%c.7 = load float, ptr addrspace(3) %adr.c.7, align 4
%a.8 = load float, ptr addrspace(3) %adr.a.8, align 4
%b.8 = load float, ptr addrspace(3) %adr.b.8, align 4
%c.8 = load float, ptr addrspace(3) %adr.c.8, align 4
%a.9 = load float, ptr addrspace(3) %adr.a.9, align 4
%b.9 = load float, ptr addrspace(3) %adr.b.9, align 4
%c.9 = load float, ptr addrspace(3) %adr.c.9, align 4
%a.10 = load float, ptr addrspace(3) %adr.a.10, align 4
%b.10 = load float, ptr addrspace(3) %adr.b.10, align 4
%c.10 = load float, ptr addrspace(3) %adr.c.10, align 4
%a.11 = load float, ptr addrspace(3) %adr.a.11, align 4
%b.11 = load float, ptr addrspace(3) %adr.b.11, align 4
%c.11 = load float, ptr addrspace(3) %adr.c.11, align 4
%a.12 = load float, ptr addrspace(3) %adr.a.12, align 4
%b.12 = load float, ptr addrspace(3) %adr.b.12, align 4
%c.12 = load float, ptr addrspace(3) %adr.c.12, align 4
%a.13 = load float, ptr addrspace(3) %adr.a.13, align 4
%b.13 = load float, ptr addrspace(3) %adr.b.13, align 4
%c.13 = load float, ptr addrspace(3) %adr.c.13, align 4
%a.14 = load float, ptr addrspace(3) %adr.a.14, align 4
%b.14 = load float, ptr addrspace(3) %adr.b.14, align 4
%c.14 = load float, ptr addrspace(3) %adr.c.14, align 4
%a.15 = load float, ptr addrspace(3) %adr.a.15, align 4
%b.15 = load float, ptr addrspace(3) %adr.b.15, align 4
%c.15 = load float, ptr addrspace(3) %adr.c.15, align 4
%a.16 = load float, ptr addrspace(3) %adr.a.16, align 4
%b.16 = load float, ptr addrspace(3) %adr.b.16, align 4
%c.16 = load float, ptr addrspace(3) %adr.c.16, align 4
%a.17 = load float, ptr addrspace(3) %adr.a.17, align 4
%b.17 = load float, ptr addrspace(3) %adr.b.17, align 4
%c.17 = load float, ptr addrspace(3) %adr.c.17, align 4
%a.18 = load float, ptr addrspace(3) %adr.a.18, align 4
%b.18 = load float, ptr addrspace(3) %adr.b.18, align 4
%c.18 = load float, ptr addrspace(3) %adr.c.18, align 4
%a.19 = load float, ptr addrspace(3) %adr.a.19, align 4
%b.19 = load float, ptr addrspace(3) %adr.b.19, align 4
%c.19 = load float, ptr addrspace(3) %adr.c.19, align 4
%a.20 = load float, ptr addrspace(3) %adr.a.20, align 4
%b.20 = load float, ptr addrspace(3) %adr.b.20, align 4
%c.20 = load float, ptr addrspace(3) %adr.c.20, align 4
%a.21 = load float, ptr addrspace(3) %adr.a.21, align 4
%b.21 = load float, ptr addrspace(3) %adr.b.21, align 4
%c.21 = load float, ptr addrspace(3) %adr.c.21, align 4
%a.22 = load float, ptr addrspace(3) %adr.a.22, align 4
%b.22 = load float, ptr addrspace(3) %adr.b.22, align 4
%c.22 = load float, ptr addrspace(3) %adr.c.22, align 4
%a.23 = load float, ptr addrspace(3) %adr.a.23, align 4
%b.23 = load float, ptr addrspace(3) %adr.b.23, align 4
%c.23 = load float, ptr addrspace(3) %adr.c.23, align 4
%a.24 = load float, ptr addrspace(3) %adr.a.24, align 4
%b.24 = load float, ptr addrspace(3) %adr.b.24, align 4
%c.24 = load float, ptr addrspace(3) %adr.c.24, align 4
%a.25 = load float, ptr addrspace(3) %adr.a.25, align 4
%b.25 = load float, ptr addrspace(3) %adr.b.25, align 4
%c.25 = load float, ptr addrspace(3) %adr.c.25, align 4
%a.26 = load float, ptr addrspace(3) %adr.a.26, align 4
%b.26 = load float, ptr addrspace(3) %adr.b.26, align 4
%c.26 = load float, ptr addrspace(3) %adr.c.26, align 4
%a.27 = load float, ptr addrspace(3) %adr.a.27, align 4
%b.27 = load float, ptr addrspace(3) %adr.b.27, align 4
%c.27 = load float, ptr addrspace(3) %adr.c.27, align 4
%a.28 = load float, ptr addrspace(3) %adr.a.28, align 4
%b.28 = load float, ptr addrspace(3) %adr.b.28, align 4
%c.28 = load float, ptr addrspace(3) %adr.c.28, align 4
%a.29 = load float, ptr addrspace(3) %adr.a.29, align 4
%b.29 = load float, ptr addrspace(3) %adr.b.29, align 4
%c.29 = load float, ptr addrspace(3) %adr.c.29, align 4
; Phase 3: res.i = fmuladd(a.i, b.i, c.i); the 30 calls are independent of one
; another (each uses only its own triple).
%res.0 = tail call float @llvm.fmuladd.f32(float %a.0, float %b.0, float %c.0)
%res.1 = tail call float @llvm.fmuladd.f32(float %a.1, float %b.1, float %c.1)
%res.2 = tail call float @llvm.fmuladd.f32(float %a.2, float %b.2, float %c.2)
%res.3 = tail call float @llvm.fmuladd.f32(float %a.3, float %b.3, float %c.3)
%res.4 = tail call float @llvm.fmuladd.f32(float %a.4, float %b.4, float %c.4)
%res.5 = tail call float @llvm.fmuladd.f32(float %a.5, float %b.5, float %c.5)
%res.6 = tail call float @llvm.fmuladd.f32(float %a.6, float %b.6, float %c.6)
%res.7 = tail call float @llvm.fmuladd.f32(float %a.7, float %b.7, float %c.7)
%res.8 = tail call float @llvm.fmuladd.f32(float %a.8, float %b.8, float %c.8)
%res.9 = tail call float @llvm.fmuladd.f32(float %a.9, float %b.9, float %c.9)
%res.10 = tail call float @llvm.fmuladd.f32(float %a.10, float %b.10, float %c.10)
%res.11 = tail call float @llvm.fmuladd.f32(float %a.11, float %b.11, float %c.11)
%res.12 = tail call float @llvm.fmuladd.f32(float %a.12, float %b.12, float %c.12)
%res.13 = tail call float @llvm.fmuladd.f32(float %a.13, float %b.13, float %c.13)
%res.14 = tail call float @llvm.fmuladd.f32(float %a.14, float %b.14, float %c.14)
%res.15 = tail call float @llvm.fmuladd.f32(float %a.15, float %b.15, float %c.15)
%res.16 = tail call float @llvm.fmuladd.f32(float %a.16, float %b.16, float %c.16)
%res.17 = tail call float @llvm.fmuladd.f32(float %a.17, float %b.17, float %c.17)
%res.18 = tail call float @llvm.fmuladd.f32(float %a.18, float %b.18, float %c.18)
%res.19 = tail call float @llvm.fmuladd.f32(float %a.19, float %b.19, float %c.19)
%res.20 = tail call float @llvm.fmuladd.f32(float %a.20, float %b.20, float %c.20)
%res.21 = tail call float @llvm.fmuladd.f32(float %a.21, float %b.21, float %c.21)
%res.22 = tail call float @llvm.fmuladd.f32(float %a.22, float %b.22, float %c.22)
%res.23 = tail call float @llvm.fmuladd.f32(float %a.23, float %b.23, float %c.23)
%res.24 = tail call float @llvm.fmuladd.f32(float %a.24, float %b.24, float %c.24)
%res.25 = tail call float @llvm.fmuladd.f32(float %a.25, float %b.25, float %c.25)
%res.26 = tail call float @llvm.fmuladd.f32(float %a.26, float %b.26, float %c.26)
%res.27 = tail call float @llvm.fmuladd.f32(float %a.27, float %b.27, float %c.27)
%res.28 = tail call float @llvm.fmuladd.f32(float %a.28, float %b.28, float %c.28)
%res.29 = tail call float @llvm.fmuladd.f32(float %a.29, float %b.29, float %c.29)
; Phase 4a: output addresses. Result i is written to float index 2*i of
; %out_arg; res.0 needs no GEP because it goes to %out_arg itself.
%adr.res.1 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 2
%adr.res.2 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 4
%adr.res.3 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 6
%adr.res.4 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 8
%adr.res.5 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 10
%adr.res.6 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 12
%adr.res.7 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 14
%adr.res.8 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 16
%adr.res.9 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 18
%adr.res.10 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 20
%adr.res.11 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 22
%adr.res.12 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 24
%adr.res.13 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 26
%adr.res.14 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 28
%adr.res.15 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 30
%adr.res.16 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 32
%adr.res.17 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 34
%adr.res.18 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 36
%adr.res.19 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 38
%adr.res.20 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 40
%adr.res.21 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 42
%adr.res.22 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 44
%adr.res.23 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 46
%adr.res.24 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 48
%adr.res.25 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 50
%adr.res.26 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 52
%adr.res.27 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 54
%adr.res.28 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 56
%adr.res.29 = getelementptr inbounds float, ptr addrspace(1) %out_arg, i64 58
; Phase 4b: store the 30 results (4-byte-aligned float stores), in index order.
store float %res.0, ptr addrspace(1) %out_arg, align 4
store float %res.1, ptr addrspace(1) %adr.res.1, align 4
store float %res.2, ptr addrspace(1) %adr.res.2, align 4
store float %res.3, ptr addrspace(1) %adr.res.3, align 4
store float %res.4, ptr addrspace(1) %adr.res.4, align 4
store float %res.5, ptr addrspace(1) %adr.res.5, align 4
store float %res.6, ptr addrspace(1) %adr.res.6, align 4
store float %res.7, ptr addrspace(1) %adr.res.7, align 4
store float %res.8, ptr addrspace(1) %adr.res.8, align 4
store float %res.9, ptr addrspace(1) %adr.res.9, align 4
store float %res.10, ptr addrspace(1) %adr.res.10, align 4
store float %res.11, ptr addrspace(1) %adr.res.11, align 4
store float %res.12, ptr addrspace(1) %adr.res.12, align 4
store float %res.13, ptr addrspace(1) %adr.res.13, align 4
store float %res.14, ptr addrspace(1) %adr.res.14, align 4
store float %res.15, ptr addrspace(1) %adr.res.15, align 4
store float %res.16, ptr addrspace(1) %adr.res.16, align 4
store float %res.17, ptr addrspace(1) %adr.res.17, align 4
store float %res.18, ptr addrspace(1) %adr.res.18, align 4
store float %res.19, ptr addrspace(1) %adr.res.19, align 4
store float %res.20, ptr addrspace(1) %adr.res.20, align 4
store float %res.21, ptr addrspace(1) %adr.res.21, align 4
store float %res.22, ptr addrspace(1) %adr.res.22, align 4
store float %res.23, ptr addrspace(1) %adr.res.23, align 4
store float %res.24, ptr addrspace(1) %adr.res.24, align 4
store float %res.25, ptr addrspace(1) %adr.res.25, align 4
store float %res.26, ptr addrspace(1) %adr.res.26, align 4
store float %res.27, ptr addrspace(1) %adr.res.27, align 4
store float %res.28, ptr addrspace(1) %adr.res.28, align 4
store float %res.29, ptr addrspace(1) %adr.res.29, align 4
ret void
}
; Intrinsic called once per (a, b, c) triple in @load_fma_store. Per the LLVM
; Language Reference it represents a * b + c, which the code generator may emit
; either as a fused multiply-add or as a separate multiply and add.
declare float @llvm.fmuladd.f32(float, float, float) #0
; Attribute group #0, referenced by the declaration above.
attributes #0 = { nounwind readnone }
|