File: ldu-reg-plus-offset.ll

package info (click to toggle)
llvm-toolchain-3.4 1%3A3.4.2-13
  • links: PTS, VCS
  • area: main
  • in suites: jessie, jessie-kfreebsd
  • size: 253,236 kB
  • ctags: 276,203
  • sloc: cpp: 1,665,580; ansic: 298,647; asm: 206,157; objc: 84,350; python: 73,119; sh: 23,466; perl: 5,679; makefile: 5,542; ml: 5,250; pascal: 2,467; lisp: 1,420; xml: 679; cs: 236; csh: 117
file content (21 lines) | stat: -rw-r--r-- 768 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s

target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v32:32:32-v64:64:64-v128:128:128-n16:32:64"


define void @reg_plus_offset(i32* %a) {
; CHECK:        ldu.global.u32  %r{{[0-9]+}}, [%r{{[0-9]+}}+32];
; CHECK:        ldu.global.u32  %r{{[0-9]+}}, [%r{{[0-9]+}}+36];
  %p2 = getelementptr i32* %a, i32 8
  %t1 = call i32 @llvm.nvvm.ldu.global.i.i32(i32* %p2), !align !1
  %p3 = getelementptr i32* %a, i32 9
  %t2 = call i32 @llvm.nvvm.ldu.global.i.i32(i32* %p3), !align !1
  %t3 = mul i32 %t1, %t2
  store i32 %t3, i32* %a
  ret void
}

!1 = metadata !{ i32 4 }

declare i32 @llvm.nvvm.ldu.global.i.i32(i32*)
declare i32 @llvm.nvvm.read.ptx.sreg.tid.x()