This change implements lowering for #70076, #70100, #70072, & #70102 `CGBuiltin.cpp` - - simplify `lerp` intrinsic `IntrinsicsDirectX.td` - simplify `lerp` intrinsic `SemaChecking.cpp` - remove unnecessary check `DXILIntrinsicExpansion.*` - add intrinsic to instruction expansion cases `DXILOpLowering.cpp` - make sure `DXILIntrinsicExpansion` happens first `DirectX.h` - changes to support new pass `DirectXTargetMachine.cpp` - changes to support new pass Why `any`, and `lerp` as instruction expansion just for DXIL? - SPIR-V there is an [OpAny](https://registry.khronos.org/SPIR-V/specs/unified1/SPIRV.html#OpAny) - SPIR-V has a GLSL lerp extension via [Fmix](https://registry.khronos.org/SPIR-V/specs/1.0/GLSL.std.450.html#FMix) Why `exp` instruction expansion? - We have an `exp2` opcode and `exp` reuses that opcode. So instruction expansion is a convenient way to do preprocessing. - Further SPIR-V has a GLSL exp extension via [Exp](https://registry.khronos.org/SPIR-V/specs/1.0/GLSL.std.450.html#Exp) and [Exp2](https://registry.khronos.org/SPIR-V/specs/1.0/GLSL.std.450.html#Exp2) Why `rcp` as instruction expansion? This one is a bit of the odd man out and might have to move to `cgbuiltins` when we better understand SPIRV requirements. However I included it because it seems like [fast math mode has an AllowRecip flag](https://registry.khronos.org/SPIR-V/specs/unified1/SPIRV.html#_fp_fast_math_mode) which lets you compute the reciprocal without performing the division. We don't have that in DXIL so thought to include it.
32 lines
977 B
LLVM
32 lines
977 B
LLVM
; RUN: opt -S -dxil-op-lower < %s | FileCheck %s
|
|
|
|
; Make sure dxil operation function calls for exp are generated for float and half.
|
|
|
|
; CHECK-LABEL: exp_float
|
|
; CHECK: fmul float 0x3FF7154760000000, %{{.*}}
|
|
; CHECK: call float @dx.op.unary.f32(i32 21, float %{{.*}})
|
|
define noundef float @exp_float(float noundef %a) {
|
|
entry:
|
|
%a.addr = alloca float, align 4
|
|
store float %a, ptr %a.addr, align 4
|
|
%0 = load float, ptr %a.addr, align 4
|
|
%elt.exp = call float @llvm.exp.f32(float %0)
|
|
ret float %elt.exp
|
|
}
|
|
|
|
; CHECK-LABEL: exp_half
|
|
; CHECK: fmul half 0xH3DC5, %{{.*}}
|
|
; CHECK: call half @dx.op.unary.f16(i32 21, half %{{.*}})
|
|
; Function Attrs: noinline nounwind optnone
|
|
define noundef half @exp_half(half noundef %a) {
|
|
entry:
|
|
%a.addr = alloca half, align 2
|
|
store half %a, ptr %a.addr, align 2
|
|
%0 = load half, ptr %a.addr, align 2
|
|
%elt.exp = call half @llvm.exp.f16(half %0)
|
|
ret half %elt.exp
|
|
}
|
|
|
|
declare half @llvm.exp.f16(half)
|
|
declare float @llvm.exp.f32(float)
|