Files
clang-p2996/libclc/amdgpu/lib/workitem/get_num_groups.ll
Matt Arsenault a48e15c6cb Split sources for amdgcn and r600
Most files remain in a common amdgpu directory.

Also switches barriers to use convergent,
and use llvm.amdgcn.s.barrier.

This now requires 3.9/trunk to build amdgcn.

llvm-svn: 260777
2016-02-13 01:01:59 +00:00

19 lines
610 B
LLVM

; Declarations of the three intrinsics called by @get_num_groups, one per
; dimension suffix (x, y, z). Each takes no arguments and returns an i32, and
; is declared nounwind/readnone.
; NOTE(review): going by the names, these presumably yield the number of
; work-groups along the corresponding axis -- confirm against the target docs.
declare i32 @llvm.r600.read.ngroups.x() nounwind readnone
declare i32 @llvm.r600.read.ngroups.y() nounwind readnone
declare i32 @llvm.r600.read.ngroups.z() nounwind readnone
; get_num_groups(dim): dispatches on the dimension index and returns the value
; of the matching llvm.r600.read.ngroups.* intrinsic.
;
;   %dim == 0  ->  @llvm.r600.read.ngroups.x()
;   %dim == 1  ->  @llvm.r600.read.ngroups.y()
;   %dim == 2  ->  @llvm.r600.read.ngroups.z()
;   otherwise  ->  1
;
; The OpenCL C specification requires get_num_groups() to return 1 (not 0) for
; a dimension index outside the valid range, so the fall-through case yields 1.
; This also keeps callers that multiply or divide by the group count safe.
define i32 @get_num_groups(i32 %dim) nounwind readnone alwaysinline {
  switch i32 %dim, label %default [
    i32 0, label %x_dim
    i32 1, label %y_dim
    i32 2, label %z_dim
  ]

x_dim:
  %x = call i32 @llvm.r600.read.ngroups.x() nounwind readnone
  ret i32 %x

y_dim:
  %y = call i32 @llvm.r600.read.ngroups.y() nounwind readnone
  ret i32 %y

z_dim:
  %z = call i32 @llvm.r600.read.ngroups.z() nounwind readnone
  ret i32 %z

default:
  ; Out-of-range dimension index: the spec-mandated result is 1.
  ret i32 1
}