Files
clang-p2996/llvm/test/CodeGen/AMDGPU/divergence-driven-min-max.ll
alex-t 98d09705e1 [AMDGPU] Re-enabling divergence predicates for min/max
This patch enables divergence predicates for min/max nodes.
It makes ISD::MIN/MAX nodes select to S_MIN_I(U)32/S_MAX_I(U)32 when uniform, or to V_MIN_I(U)32_e64/V_MAX_I(U)32_e64 when divergent.

Reviewed By: rampitec

Differential Revision: https://reviews.llvm.org/D115954
2021-12-20 16:10:55 +03:00

74 lines
2.3 KiB
LLVM
Executable File

; RUN: llc -march=amdgcn -stop-after=amdgpu-isel < %s | FileCheck -check-prefix=GCN %s
; Signed i32 min of two kernel arguments, written as icmp sle + select.
; Declared amdgpu_kernel; the expectation below is the scalar (S_) opcode.
; GCN-LABEL: name: uniform_imin
; GCN: S_MIN_I32
define amdgpu_kernel void @uniform_imin(i32 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
  ; nounwind is spelled inline rather than through an attribute group.
  %cmp = icmp sle i32 %a, %b                 ; signed a <= b
  %val = select i1 %cmp, i32 %a, i32 %b      ; a when a <= b, otherwise b
  store i32 %val, i32 addrspace(1)* %out, align 4
  ret void
}
; Signed i32 min of two function arguments, written as icmp sle + select.
; Plain (non-kernel) function; the expectation below is the vector (V_..._e64)
; opcode.
; GCN-LABEL: name: divergent_imin
; GCN: V_MIN_I32_e64
define void @divergent_imin(i32 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
  ; nounwind is spelled inline rather than through an attribute group.
  %cmp = icmp sle i32 %a, %b                 ; signed a <= b
  %val = select i1 %cmp, i32 %a, i32 %b      ; a when a <= b, otherwise b
  store i32 %val, i32 addrspace(1)* %out, align 4
  ret void
}
; Unsigned i32 min of two kernel arguments, written as icmp ule + select.
; Declared amdgpu_kernel; the expectation below is the scalar (S_) opcode.
; GCN-LABEL: name: uniform_umin
; GCN: S_MIN_U32
define amdgpu_kernel void @uniform_umin(i32 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
  ; nounwind is spelled inline rather than through an attribute group.
  %cmp = icmp ule i32 %a, %b                 ; unsigned a <= b
  %val = select i1 %cmp, i32 %a, i32 %b      ; a when a <= b, otherwise b
  store i32 %val, i32 addrspace(1)* %out, align 8
  ret void
}
; Unsigned i32 min of two function arguments, written as icmp ule + select.
; Plain (non-kernel) function; the expectation below is the vector (V_..._e64)
; opcode.
; GCN-LABEL: name: divergent_umin
; GCN: V_MIN_U32_e64
define void @divergent_umin(i32 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
  ; nounwind is spelled inline rather than through an attribute group.
  %cmp = icmp ule i32 %a, %b                 ; unsigned a <= b
  %val = select i1 %cmp, i32 %a, i32 %b      ; a when a <= b, otherwise b
  store i32 %val, i32 addrspace(1)* %out, align 8
  ret void
}
; Signed i32 max inside an amdgpu_kernel, expressed as an sge compare feeding
; a select. The expectation below is the scalar (S_) max opcode.
; GCN-LABEL: name: uniform_imax
; GCN: S_MAX_I32
define amdgpu_kernel void @uniform_imax(i32 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
  %a_ge_b = icmp sge i32 %a, %b                  ; signed a >= b
  %larger = select i1 %a_ge_b, i32 %a, i32 %b    ; a when a >= b, otherwise b
  store i32 %larger, i32 addrspace(1)* %out, align 4
  ret void
}
; Signed i32 max inside a plain (non-kernel) function, expressed as an sge
; compare feeding a select. The expectation below is the vector (V_..._e64)
; max opcode.
; GCN-LABEL: name: divergent_imax
; GCN: V_MAX_I32_e64
define void @divergent_imax(i32 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
  %a_ge_b = icmp sge i32 %a, %b                  ; signed a >= b
  %larger = select i1 %a_ge_b, i32 %a, i32 %b    ; a when a >= b, otherwise b
  store i32 %larger, i32 addrspace(1)* %out, align 4
  ret void
}
; Unsigned i32 max inside an amdgpu_kernel, expressed as a uge compare feeding
; a select. The expectation below is the scalar (S_) max opcode.
; GCN-LABEL: name: uniform_umax
; GCN: S_MAX_U32
define amdgpu_kernel void @uniform_umax(i32 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
  %a_uge_b = icmp uge i32 %a, %b                 ; unsigned a >= b
  %larger = select i1 %a_uge_b, i32 %a, i32 %b   ; a when a >= b, otherwise b
  store i32 %larger, i32 addrspace(1)* %out, align 4
  ret void
}
; Unsigned i32 max inside a plain (non-kernel) function, expressed as a uge
; compare feeding a select. The expectation below is the vector (V_..._e64)
; max opcode.
; GCN-LABEL: name: divergent_umax
; GCN: V_MAX_U32_e64
define void @divergent_umax(i32 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
  %a_uge_b = icmp uge i32 %a, %b                 ; unsigned a >= b
  %larger = select i1 %a_uge_b, i32 %a, i32 %b   ; a when a >= b, otherwise b
  store i32 %larger, i32 addrspace(1)* %out, align 4
  ret void
}