1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123
|
; RUN: opt -mtriple amdgcn-unknown-amdhsa -passes='print<uniformity>' -disable-output %s 2>&1 | FileCheck %s
; AMDGPU intrinsics called by the kernels in this file. Every declaration
; carries attribute group #0.
; Work-item id queries, one declaration per dimension (x, y, z).
declare i32 @llvm.amdgcn.workitem.id.x() #0
declare i32 @llvm.amdgcn.workitem.id.y() #0
declare i32 @llvm.amdgcn.workitem.id.z() #0
; mbcnt.lo / mbcnt.hi each take two i32 operands and return an i32.
declare i32 @llvm.amdgcn.mbcnt.lo(i32, i32) #0
declare i32 @llvm.amdgcn.mbcnt.hi(i32, i32) #0
; CHECK: DIVERGENT: %id.x = call i32 @llvm.amdgcn.workitem.id.x()
; Kernel with attribute group #1 (no work-group size restriction) that reads
; workitem.id.x. The directive above expects this call to be reported as
; divergent, and it matches the printed instruction text, so the value name
; %id.x must stay as is.
define amdgpu_kernel void @workitem_id_x() #1 {
%id.x = call i32 @llvm.amdgcn.workitem.id.x()
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %id.x, ptr addrspace(1) undef
ret void
}
; CHECK: DIVERGENT: %id.y = call i32 @llvm.amdgcn.workitem.id.y()
; Kernel with attribute group #1 (no work-group size restriction) that reads
; workitem.id.y. The directive above expects this call to be reported as
; divergent, and it matches the printed instruction text, so the value name
; %id.y must stay as is.
define amdgpu_kernel void @workitem_id_y() #1 {
%id.y = call i32 @llvm.amdgcn.workitem.id.y()
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %id.y, ptr addrspace(1) undef
ret void
}
; CHECK: DIVERGENT: %id.z = call i32 @llvm.amdgcn.workitem.id.z()
; Kernel with attribute group #1 (no work-group size restriction) that reads
; workitem.id.z. The directive above expects this call to be reported as
; divergent, and it matches the printed instruction text, so the value name
; %id.z must stay as is.
define amdgpu_kernel void @workitem_id_z() #1 {
%id.z = call i32 @llvm.amdgcn.workitem.id.z()
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %id.z, ptr addrspace(1) undef
ret void
}
; CHECK: DIVERGENT: %mbcnt.lo = call i32 @llvm.amdgcn.mbcnt.lo(i32 0, i32 0)
; Kernel with attribute group #1 that calls mbcnt.lo with both operands zero.
; The directive above expects this call to be reported as divergent and
; matches the printed instruction text, including the value name %mbcnt.lo.
define amdgpu_kernel void @mbcnt_lo() #1 {
%mbcnt.lo = call i32 @llvm.amdgcn.mbcnt.lo(i32 0, i32 0)
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %mbcnt.lo, ptr addrspace(1) undef
ret void
}
; CHECK: DIVERGENT: %mbcnt.hi = call i32 @llvm.amdgcn.mbcnt.hi(i32 0, i32 0)
; Kernel with attribute group #1 that calls mbcnt.hi with both operands zero.
; The directive above expects this call to be reported as divergent and
; matches the printed instruction text, including the value name %mbcnt.hi.
define amdgpu_kernel void @mbcnt_hi() #1 {
%mbcnt.hi = call i32 @llvm.amdgcn.mbcnt.hi(i32 0, i32 0)
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %mbcnt.hi, ptr addrspace(1) undef
ret void
}
; CHECK-LABEL: UniformityInfo for function 'workitem_id_x_singlethreaded':
; CHECK-NOT: DIVERGENT
; Kernel with attribute group #2 ("amdgpu-flat-work-group-size"="1,1") that
; reads workitem.id.x. The directives above expect that nothing in this
; function is reported as divergent.
define amdgpu_kernel void @workitem_id_x_singlethreaded() #2 {
%id.x = call i32 @llvm.amdgcn.workitem.id.x()
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %id.x, ptr addrspace(1) undef
ret void
}
; CHECK-LABEL: UniformityInfo for function 'workitem_id_y_singlethreaded':
; CHECK-NOT: DIVERGENT
; Kernel with attribute group #2 ("amdgpu-flat-work-group-size"="1,1") that
; reads workitem.id.y. The directives above expect that nothing in this
; function is reported as divergent.
; The result is named %id.y to match the dimension actually queried; only a
; negative directive covers this function, so no check depends on the name.
define amdgpu_kernel void @workitem_id_y_singlethreaded() #2 {
%id.y = call i32 @llvm.amdgcn.workitem.id.y()
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %id.y, ptr addrspace(1) undef
ret void
}
; CHECK-LABEL: UniformityInfo for function 'workitem_id_z_singlethreaded':
; CHECK-NOT: DIVERGENT
; Kernel with attribute group #2 ("amdgpu-flat-work-group-size"="1,1") that
; reads workitem.id.z. The directives above expect that nothing in this
; function is reported as divergent.
; This kernel must query the z dimension: calling the y intrinsic here would
; duplicate the y test and leave z untested in this configuration.
define amdgpu_kernel void @workitem_id_z_singlethreaded() #2 {
%id.z = call i32 @llvm.amdgcn.workitem.id.z()
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %id.z, ptr addrspace(1) undef
ret void
}
; CHECK-LABEL: UniformityInfo for function 'workitem_id_x_singlethreaded_md':
; CHECK-NOT: DIVERGENT
; Kernel tagged with !reqd_work_group_size !0 (1 x 1 x 1) that reads
; workitem.id.x. The directives above expect that nothing in this function is
; reported as divergent.
define amdgpu_kernel void @workitem_id_x_singlethreaded_md() !reqd_work_group_size !0 {
%id.x = call i32 @llvm.amdgcn.workitem.id.x()
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %id.x, ptr addrspace(1) undef
ret void
}
; CHECK-LABEL: UniformityInfo for function 'workitem_id_y_singlethreaded_md':
; CHECK-NOT: DIVERGENT
; Kernel tagged with !reqd_work_group_size !0 (1 x 1 x 1) that reads
; workitem.id.y. The directives above expect that nothing in this function is
; reported as divergent.
; The result is named %id.y to match the dimension actually queried; only a
; negative directive covers this function, so no check depends on the name.
define amdgpu_kernel void @workitem_id_y_singlethreaded_md() !reqd_work_group_size !0 {
%id.y = call i32 @llvm.amdgcn.workitem.id.y()
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %id.y, ptr addrspace(1) undef
ret void
}
; CHECK-LABEL: UniformityInfo for function 'workitem_id_z_singlethreaded_md':
; CHECK-NOT: DIVERGENT
; Kernel tagged with !reqd_work_group_size !0 (1 x 1 x 1) that reads
; workitem.id.z. The directives above expect that nothing in this function is
; reported as divergent.
; This kernel must query the z dimension: calling the y intrinsic here would
; duplicate the y test and leave z untested in this configuration.
define amdgpu_kernel void @workitem_id_z_singlethreaded_md() !reqd_work_group_size !0 {
%id.z = call i32 @llvm.amdgcn.workitem.id.z()
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %id.z, ptr addrspace(1) undef
ret void
}
; CHECK-LABEL: UniformityInfo for function 'workitem_id_x_not_singlethreaded_dimx':
; CHECK: DIVERGENT: %id.x = call i32 @llvm.amdgcn.workitem.id.x()
; Kernel tagged with !reqd_work_group_size !1 (2 x 1 x 1) that reads
; workitem.id.x. The directive above expects the call to be reported as
; divergent and matches the printed instruction text, including %id.x.
define amdgpu_kernel void @workitem_id_x_not_singlethreaded_dimx() !reqd_work_group_size !1 {
%id.x = call i32 @llvm.amdgcn.workitem.id.x()
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %id.x, ptr addrspace(1) undef
ret void
}
; CHECK-LABEL: UniformityInfo for function 'workitem_id_x_not_singlethreaded_dimy':
; CHECK: DIVERGENT: %id.x = call i32 @llvm.amdgcn.workitem.id.x()
; Kernel tagged with !reqd_work_group_size !2 (1 x 2 x 1) that reads
; workitem.id.x. The directive above expects the call to be reported as
; divergent even though the size in the x dimension is 1; it matches the
; printed instruction text, including %id.x.
define amdgpu_kernel void @workitem_id_x_not_singlethreaded_dimy() !reqd_work_group_size !2 {
%id.x = call i32 @llvm.amdgcn.workitem.id.x()
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %id.x, ptr addrspace(1) undef
ret void
}
; CHECK-LABEL: UniformityInfo for function 'workitem_id_x_not_singlethreaded_dimz':
; CHECK: DIVERGENT: %id.x = call i32 @llvm.amdgcn.workitem.id.x()
; Kernel tagged with !reqd_work_group_size !3 (1 x 1 x 2) that reads
; workitem.id.x. The directive above expects the call to be reported as
; divergent even though the size in the x dimension is 1; it matches the
; printed instruction text, including %id.x.
define amdgpu_kernel void @workitem_id_x_not_singlethreaded_dimz() !reqd_work_group_size !3 {
%id.x = call i32 @llvm.amdgcn.workitem.id.x()
; Volatile store to an undef addrspace(1) pointer gives the call result a use.
store volatile i32 %id.x, ptr addrspace(1) undef
ret void
}
; #0: attached to the intrinsic declarations.
attributes #0 = { nounwind readnone }
; #1: attached to the kernels whose intrinsic calls are expected to be divergent.
attributes #1 = { nounwind }
; #2: attached to the *_singlethreaded kernels, which are expected to contain
; no divergent values. NOTE(review): the "1,1" value is presumably the min,max
; flat work-group size -- confirm against the AMDGPU usage guide.
attributes #2 = { "amdgpu-flat-work-group-size"="1,1" }
; Operands for !reqd_work_group_size, three i32 values per node.
; !0 is all ones (used by the *_singlethreaded_md kernels); !1, !2 and !3 each
; set exactly one of the three entries to 2 (used by the *_not_singlethreaded_dim*
; kernels).
!0 = !{i32 1, i32 1, i32 1}
!1 = !{i32 2, i32 1, i32 1}
!2 = !{i32 1, i32 2, i32 1}
!3 = !{i32 1, i32 1, i32 2}
|