Completes #83626 - `CGBuiltin.cpp` - modify `getDotProductIntrinsic` to be able to emit `dot2`, `dot3`, and `dot4` intrinsics based on element count - `IntrinsicsDirectX.td` - for floating point add `dot2`, `dot3`, and `dot4` intrinsics - `DXIL.td` - add dxilop intrinsic lowering for `dot2`, `dot3`, & `dot4`. - `DXILOpLowering.cpp` - add vector arg flattening for dot product. - `DXILOpBuilder.h` - modify `createDXILOpCall` to take a `SmallVector` instead of an iterator - `DXILOpBuilder.cpp` - modify `createDXILOpCall` by moving the small vector up to the calling function in `DXILOpLowering.cpp`. - Moving one function up gives us access to the `CallInst` and `Function` which were needed to distinguish the dot product intrinsics and get the operands without using the iterator.
95 lines
4.1 KiB
LLVM
95 lines
4.1 KiB
LLVM
; RUN: opt -S -dxil-op-lower < %s | FileCheck %s
|
|
|
|
; Make sure dxil operation function calls for dot are generated for half/float vectors.
|
|
|
|
; dot_half2: dot product of two <2 x half> vectors.
; Expected output: each lane of %a, then each lane of %b, is pulled out with
; extractelement, followed by one call to @dx.op.dot2.f16 whose first operand
; is i32 54 and whose remaining four operands are half scalars.
; CHECK-LABEL: dot_half2
; CHECK: extractelement <2 x half> %a, i32 0
; CHECK: extractelement <2 x half> %a, i32 1
; CHECK: extractelement <2 x half> %b, i32 0
; CHECK: extractelement <2 x half> %b, i32 1
; CHECK: call half @dx.op.dot2.f16(i32 54, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}})
define noundef half @dot_half2(<2 x half> noundef %a, <2 x half> noundef %b) {
entry:
  %res = call half @llvm.dx.dot2.v2f16(<2 x half> %a, <2 x half> %b)
  ret half %res
}
|
|
|
|
; dot_half3: dot product of two <3 x half> vectors.
; Expected output: each lane of %a, then each lane of %b, is pulled out with
; extractelement, followed by one call to @dx.op.dot3.f16 whose first operand
; is i32 55 and whose remaining six operands are half scalars.
; CHECK-LABEL: dot_half3
; CHECK: extractelement <3 x half> %a, i32 0
; CHECK: extractelement <3 x half> %a, i32 1
; CHECK: extractelement <3 x half> %a, i32 2
; CHECK: extractelement <3 x half> %b, i32 0
; CHECK: extractelement <3 x half> %b, i32 1
; CHECK: extractelement <3 x half> %b, i32 2
; CHECK: call half @dx.op.dot3.f16(i32 55, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}})
define noundef half @dot_half3(<3 x half> noundef %a, <3 x half> noundef %b) {
entry:
  %res = call half @llvm.dx.dot3.v3f16(<3 x half> %a, <3 x half> %b)
  ret half %res
}
|
|
|
|
; dot_half4: dot product of two <4 x half> vectors.
; Expected output: each lane of %a, then each lane of %b, is pulled out with
; extractelement, followed by one call to @dx.op.dot4.f16 whose first operand
; is i32 56 and whose remaining eight operands are half scalars.
; CHECK-LABEL: dot_half4
; CHECK: extractelement <4 x half> %a, i32 0
; CHECK: extractelement <4 x half> %a, i32 1
; CHECK: extractelement <4 x half> %a, i32 2
; CHECK: extractelement <4 x half> %a, i32 3
; CHECK: extractelement <4 x half> %b, i32 0
; CHECK: extractelement <4 x half> %b, i32 1
; CHECK: extractelement <4 x half> %b, i32 2
; CHECK: extractelement <4 x half> %b, i32 3
; CHECK: call half @dx.op.dot4.f16(i32 56, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}}, half %{{.*}})
define noundef half @dot_half4(<4 x half> noundef %a, <4 x half> noundef %b) {
entry:
  %res = call half @llvm.dx.dot4.v4f16(<4 x half> %a, <4 x half> %b)
  ret half %res
}
|
|
|
|
; dot_float2: dot product of two <2 x float> vectors.
; Expected output: each lane of %a, then each lane of %b, is pulled out with
; extractelement, followed by one call to @dx.op.dot2.f32 whose first operand
; is i32 54 and whose remaining four operands are float scalars.
; CHECK-LABEL: dot_float2
; CHECK: extractelement <2 x float> %a, i32 0
; CHECK: extractelement <2 x float> %a, i32 1
; CHECK: extractelement <2 x float> %b, i32 0
; CHECK: extractelement <2 x float> %b, i32 1
; CHECK: call float @dx.op.dot2.f32(i32 54, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}})
define noundef float @dot_float2(<2 x float> noundef %a, <2 x float> noundef %b) {
entry:
  %res = call float @llvm.dx.dot2.v2f32(<2 x float> %a, <2 x float> %b)
  ret float %res
}
|
|
|
|
; dot_float3: dot product of two <3 x float> vectors.
; Expected output: each lane of %a, then each lane of %b, is pulled out with
; extractelement, followed by one call to @dx.op.dot3.f32 whose first operand
; is i32 55 and whose remaining six operands are float scalars.
; CHECK-LABEL: dot_float3
; CHECK: extractelement <3 x float> %a, i32 0
; CHECK: extractelement <3 x float> %a, i32 1
; CHECK: extractelement <3 x float> %a, i32 2
; CHECK: extractelement <3 x float> %b, i32 0
; CHECK: extractelement <3 x float> %b, i32 1
; CHECK: extractelement <3 x float> %b, i32 2
; CHECK: call float @dx.op.dot3.f32(i32 55, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}})
define noundef float @dot_float3(<3 x float> noundef %a, <3 x float> noundef %b) {
entry:
  %res = call float @llvm.dx.dot3.v3f32(<3 x float> %a, <3 x float> %b)
  ret float %res
}
|
|
|
|
; dot_float4: dot product of two <4 x float> vectors.
; Expected output: each lane of %a, then each lane of %b, is pulled out with
; extractelement, followed by one call to @dx.op.dot4.f32 whose first operand
; is i32 56 and whose remaining eight operands are float scalars.
; CHECK-LABEL: dot_float4
; CHECK: extractelement <4 x float> %a, i32 0
; CHECK: extractelement <4 x float> %a, i32 1
; CHECK: extractelement <4 x float> %a, i32 2
; CHECK: extractelement <4 x float> %a, i32 3
; CHECK: extractelement <4 x float> %b, i32 0
; CHECK: extractelement <4 x float> %b, i32 1
; CHECK: extractelement <4 x float> %b, i32 2
; CHECK: extractelement <4 x float> %b, i32 3
; CHECK: call float @dx.op.dot4.f32(i32 56, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}}, float %{{.*}})
define noundef float @dot_float4(<4 x float> noundef %a, <4 x float> noundef %b) {
entry:
  %res = call float @llvm.dx.dot4.v4f32(<4 x float> %a, <4 x float> %b)
  ret float %res
}
|
|
|
|
; Declarations of the dot-product intrinsics called by the test functions in
; this file. The element-count suffix in the intrinsic name (dot2 / dot3 /
; dot4) must agree with the vector width in the type suffix (v2 / v3 / v4),
; matching the names used at the call sites.
declare half @llvm.dx.dot2.v2f16(<2 x half>, <2 x half>)
declare half @llvm.dx.dot3.v3f16(<3 x half>, <3 x half>)
declare half @llvm.dx.dot4.v4f16(<4 x half>, <4 x half>)
declare float @llvm.dx.dot2.v2f32(<2 x float>, <2 x float>)
declare float @llvm.dx.dot3.v3f32(<3 x float>, <3 x float>)
declare float @llvm.dx.dot4.v4f32(<4 x float>, <4 x float>)
|