Files
clang-p2996/llvm/test/CodeGen/DirectX/lerp.ll
Farzon Lotfi de1a97db39 [DXIL] exp, any, lerp, & rcp Intrinsic Lowering (#84526)
This change implements lowering for #70076, #70100, #70072, & #70102 
`CGBuiltin.cpp` - - simplify `lerp` intrinsic
`IntrinsicsDirectX.td` - simplify `lerp` intrinsic
`SemaChecking.cpp` - remove unnecessary check
`DXILIntrinsicExpansion.*` - add intrinsic to instruction expansion
cases
`DXILOpLowering.cpp` - make sure `DXILIntrinsicExpansion` happens first
`DirectX.h` - changes to support new pass
`DirectXTargetMachine.cpp` - changes to support new pass

Why `any`, and `lerp` as instruction expansion just for DXIL?
- SPIR-V there is an
[OpAny](https://registry.khronos.org/SPIR-V/specs/unified1/SPIRV.html#OpAny)
- SPIR-V has a GLSL lerp extension via
[Fmix](https://registry.khronos.org/SPIR-V/specs/1.0/GLSL.std.450.html#FMix)

Why `exp` instruction expansion?
- We have an `exp2` opcode and `exp` reuses that opcode. So instruction
expansion is a convenient way to do preprocessing.
- Further SPIR-V has a GLSL exp extension via
[Exp](https://registry.khronos.org/SPIR-V/specs/1.0/GLSL.std.450.html#Exp)
and
[Exp2](https://registry.khronos.org/SPIR-V/specs/1.0/GLSL.std.450.html#Exp2)

Why `rcp` as instruction expansion?
This one is a bit of the odd man out and might have to move to
`cgbuiltins` when we better understand SPIRV requirements. However I
included it because it seems like [fast math mode has an AllowRecip
flag](https://registry.khronos.org/SPIR-V/specs/unified1/SPIRV.html#_fp_fast_math_mode)
which lets you compute the reciprocal without performing the division.
We don't have that in DXIL so thought to include it.
2024-03-14 20:25:57 -04:00

57 lines
2.0 KiB
LLVM

; RUN: opt -S -dxil-op-lower < %s | FileCheck %s
; Make sure dxil operation function calls for lerp are generated for float and half.
; CHECK-LABEL: lerp_half
; CHECK: fsub half %{{.*}}, %{{.*}}
; CHECK: fmul half %{{.*}}, %{{.*}}
; CHECK: fadd half %{{.*}}, %{{.*}}
define noundef half @lerp_half(half noundef %p0) {
entry:
%p0.addr = alloca half, align 2
store half %p0, ptr %p0.addr, align 2
%0 = load half, ptr %p0.addr, align 2
%1 = load half, ptr %p0.addr, align 2
%2 = load half, ptr %p0.addr, align 2
%dx.lerp = call half @llvm.dx.lerp.f16(half %0, half %1, half %2)
ret half %dx.lerp
}
; CHECK-LABEL: lerp_float
; CHECK: fsub float %{{.*}}, %{{.*}}
; CHECK: fmul float %{{.*}}, %{{.*}}
; CHECK: fadd float %{{.*}}, %{{.*}}
define noundef float @lerp_float(float noundef %p0, float noundef %p1) {
entry:
%p1.addr = alloca float, align 4
%p0.addr = alloca float, align 4
store float %p1, ptr %p1.addr, align 4
store float %p0, ptr %p0.addr, align 4
%0 = load float, ptr %p0.addr, align 4
%1 = load float, ptr %p0.addr, align 4
%2 = load float, ptr %p0.addr, align 4
%dx.lerp = call float @llvm.dx.lerp.f32(float %0, float %1, float %2)
ret float %dx.lerp
}
; CHECK-LABEL: lerp_float4
; CHECK: fsub <4 x float> %{{.*}}, %{{.*}}
; CHECK: fmul <4 x float> %{{.*}}, %{{.*}}
; CHECK: fadd <4 x float> %{{.*}}, %{{.*}}
define noundef <4 x float> @lerp_float4(<4 x float> noundef %p0, <4 x float> noundef %p1) {
entry:
%p1.addr = alloca <4 x float>, align 16
%p0.addr = alloca <4 x float>, align 16
store <4 x float> %p1, ptr %p1.addr, align 16
store <4 x float> %p0, ptr %p0.addr, align 16
%0 = load <4 x float>, ptr %p0.addr, align 16
%1 = load <4 x float>, ptr %p0.addr, align 16
%2 = load <4 x float>, ptr %p0.addr, align 16
%dx.lerp = call <4 x float> @llvm.dx.lerp.v4f32(<4 x float> %0, <4 x float> %1, <4 x float> %2)
ret <4 x float> %dx.lerp
}
declare half @llvm.dx.lerp.f16(half, half, half)
declare float @llvm.dx.lerp.f32(float, float, float)
declare <4 x float> @llvm.dx.lerp.v4f32(<4 x float>, <4 x float>, <4 x float>)