Implements elementwise firstbithigh hlsl builtin. Implements firstbituhigh intrinsic for spirv and directx, which handles unsigned integers Implements firstbitshigh intrinsic for spirv and directx, which handles signed integers. Fixes #113486 Closes #99115
92 lines
3.8 KiB
LLVM
92 lines
3.8 KiB
LLVM
; RUN: opt -S -scalarizer -dxil-op-lower -mtriple=dxil-pc-shadermodel6.3-library %s | FileCheck %s
|
|
|
|
; Make sure dxil operation function calls for firstbithigh are generated for all integer types.
|
|
|
|
define noundef i32 @test_firstbithigh_ushort(i16 noundef %a) {
|
|
entry:
|
|
; CHECK: call i32 @dx.op.unaryBits.i16(i32 33, i16 %{{.*}})
|
|
%elt.firstbithigh = call i32 @llvm.dx.firstbituhigh.i16(i16 %a)
|
|
ret i32 %elt.firstbithigh
|
|
}
|
|
|
|
define noundef i32 @test_firstbithigh_short(i16 noundef %a) {
|
|
entry:
|
|
; CHECK: call i32 @dx.op.unaryBits.i16(i32 34, i16 %{{.*}})
|
|
%elt.firstbithigh = call i32 @llvm.dx.firstbitshigh.i16(i16 %a)
|
|
ret i32 %elt.firstbithigh
|
|
}
|
|
|
|
define noundef i32 @test_firstbithigh_uint(i32 noundef %a) {
|
|
entry:
|
|
; CHECK: call i32 @dx.op.unaryBits.i32(i32 33, i32 %{{.*}})
|
|
%elt.firstbithigh = call i32 @llvm.dx.firstbituhigh.i32(i32 %a)
|
|
ret i32 %elt.firstbithigh
|
|
}
|
|
|
|
define noundef i32 @test_firstbithigh_int(i32 noundef %a) {
|
|
entry:
|
|
; CHECK: call i32 @dx.op.unaryBits.i32(i32 34, i32 %{{.*}})
|
|
%elt.firstbithigh = call i32 @llvm.dx.firstbitshigh.i32(i32 %a)
|
|
ret i32 %elt.firstbithigh
|
|
}
|
|
|
|
define noundef i32 @test_firstbithigh_ulong(i64 noundef %a) {
|
|
entry:
|
|
; CHECK: call i32 @dx.op.unaryBits.i64(i32 33, i64 %{{.*}})
|
|
%elt.firstbithigh = call i32 @llvm.dx.firstbituhigh.i64(i64 %a)
|
|
ret i32 %elt.firstbithigh
|
|
}
|
|
|
|
define noundef i32 @test_firstbithigh_long(i64 noundef %a) {
|
|
entry:
|
|
; CHECK: call i32 @dx.op.unaryBits.i64(i32 34, i64 %{{.*}})
|
|
%elt.firstbithigh = call i32 @llvm.dx.firstbitshigh.i64(i64 %a)
|
|
ret i32 %elt.firstbithigh
|
|
}
|
|
|
|
define noundef <4 x i32> @test_firstbituhigh_vec4_i32(<4 x i32> noundef %a) {
|
|
entry:
|
|
; CHECK: [[ee0:%.*]] = extractelement <4 x i32> %a, i64 0
|
|
; CHECK: [[ie0:%.*]] = call i32 @dx.op.unaryBits.i32(i32 33, i32 [[ee0]])
|
|
; CHECK: [[ee1:%.*]] = extractelement <4 x i32> %a, i64 1
|
|
; CHECK: [[ie1:%.*]] = call i32 @dx.op.unaryBits.i32(i32 33, i32 [[ee1]])
|
|
; CHECK: [[ee2:%.*]] = extractelement <4 x i32> %a, i64 2
|
|
; CHECK: [[ie2:%.*]] = call i32 @dx.op.unaryBits.i32(i32 33, i32 [[ee2]])
|
|
; CHECK: [[ee3:%.*]] = extractelement <4 x i32> %a, i64 3
|
|
; CHECK: [[ie3:%.*]] = call i32 @dx.op.unaryBits.i32(i32 33, i32 [[ee3]])
|
|
; CHECK: insertelement <4 x i32> poison, i32 [[ie0]], i64 0
|
|
; CHECK: insertelement <4 x i32> %{{.*}}, i32 [[ie1]], i64 1
|
|
; CHECK: insertelement <4 x i32> %{{.*}}, i32 [[ie2]], i64 2
|
|
; CHECK: insertelement <4 x i32> %{{.*}}, i32 [[ie3]], i64 3
|
|
%2 = call <4 x i32> @llvm.dx.firstbituhigh.v4i32(<4 x i32> %a)
|
|
ret <4 x i32> %2
|
|
}
|
|
|
|
define noundef <4 x i32> @test_firstbitshigh_vec4_i32(<4 x i32> noundef %a) {
|
|
entry:
|
|
; CHECK: [[ee0:%.*]] = extractelement <4 x i32> %a, i64 0
|
|
; CHECK: [[ie0:%.*]] = call i32 @dx.op.unaryBits.i32(i32 34, i32 [[ee0]])
|
|
; CHECK: [[ee1:%.*]] = extractelement <4 x i32> %a, i64 1
|
|
; CHECK: [[ie1:%.*]] = call i32 @dx.op.unaryBits.i32(i32 34, i32 [[ee1]])
|
|
; CHECK: [[ee2:%.*]] = extractelement <4 x i32> %a, i64 2
|
|
; CHECK: [[ie2:%.*]] = call i32 @dx.op.unaryBits.i32(i32 34, i32 [[ee2]])
|
|
; CHECK: [[ee3:%.*]] = extractelement <4 x i32> %a, i64 3
|
|
; CHECK: [[ie3:%.*]] = call i32 @dx.op.unaryBits.i32(i32 34, i32 [[ee3]])
|
|
; CHECK: insertelement <4 x i32> poison, i32 [[ie0]], i64 0
|
|
; CHECK: insertelement <4 x i32> %{{.*}}, i32 [[ie1]], i64 1
|
|
; CHECK: insertelement <4 x i32> %{{.*}}, i32 [[ie2]], i64 2
|
|
; CHECK: insertelement <4 x i32> %{{.*}}, i32 [[ie3]], i64 3
|
|
%2 = call <4 x i32> @llvm.dx.firstbitshigh.v4i32(<4 x i32> %a)
|
|
ret <4 x i32> %2
|
|
}
|
|
|
|
declare i32 @llvm.dx.firstbituhigh.i16(i16)
|
|
declare i32 @llvm.dx.firstbituhigh.i32(i32)
|
|
declare i32 @llvm.dx.firstbituhigh.i64(i64)
|
|
declare <4 x i32> @llvm.dx.firstbituhigh.v4i32(<4 x i32>)
|
|
|
|
declare i32 @llvm.dx.firstbitshigh.i16(i16)
|
|
declare i32 @llvm.dx.firstbitshigh.i32(i32)
|
|
declare i32 @llvm.dx.firstbitshigh.i64(i64)
|
|
declare <4 x i32> @llvm.dx.firstbitshigh.v4i32(<4 x i32>)
|