Files
clang-p2996/llvm/test/CodeGen/X86/jcc-indirect-thunk-kernel.ll
Joao Moreira eac3e5c3fb [X86] Do not emit JCC to __x86_indirect_thunk
Clang may optimize conditional tailcall blocks with the following layout:

cmp <condition>
je  tailcall_target
ret

When retpoline is in place, indirect calls are converted into direct calls to a retpoline thunk. When these indirect calls are tail calls, they may be subject to the above-described optimization (there is no indirect JCC, but since the jump is now direct it can be made conditional). The above layout is non-ideal for the Linux kernel scenario because the branches into thunks may be patched back into indirect branches at runtime depending on the underlying CPU features, which would not be feasible if the binary is emitted with the optimized layout above.

Thus, prevent clang from emitting this layout if CodeModel is Kernel.

Feature request from the respective kernel mailing list: https://lore.kernel.org/llvm/Yv3uI%2FMoJVctmBCh@worktop.programming.kicks-ass.net/

Reviewed By: nickdesaulniers, pengfei

Differential Revision: https://reviews.llvm.org/D134915
2022-10-06 11:09:24 -07:00

33 lines
893 B
LLVM

; RUN: llc < %s -O2 --code-model=kernel | FileCheck %s
; The intent of the test is that we do not generate conditional
; tail calls to the thunk.
; The module is compiled by llc at -O2 with the kernel code model, and the
; emitted assembly is matched against the FileCheck directives inside @foo.
target triple = "x86_64-unknown-linux-gnu"
; @foo loads a function pointer from %something and tail-calls it when it is
; non-null; when the pointer is null the function simply returns.
define dso_local void @foo(ptr %something) #0 {
; Expected assembly: the loaded pointer is placed in %r11 and tested; a JE
; branches over an unconditional JMP to __x86_indirect_thunk_r11 and lands on
; the RETQ, so the jump into the thunk itself is never conditional.
; CHECK-LABEL: foo:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: movq (%rdi), %r11
; CHECK-NEXT: testq %r11, %r11
; Make sure that a JNE was not generated instead of a JE + JMP sequence
; CHECK-NOT: jne
; CHECK-NEXT: je .LBB0_1
; CHECK-NEXT: bb.2: # %if.then
; CHECK-NEXT: jmp __x86_indirect_thunk_r11
; CHECK-NEXT: LBB0_1:
; CHECK-NEXT: retq
entry:
; Load the candidate callee pointer stored at %something.
%0 = load ptr, ptr %something, align 8
; %tobool.not is true when the loaded pointer is null.
%tobool.not = icmp eq ptr %0, null
; Null pointer: skip the call and return; otherwise go make the call.
br i1 %tobool.not, label %if.end, label %if.then
if.then:
; Indirect tail call through the loaded pointer. The expectations above require
; it to be emitted as an unconditional jump to the thunk.
tail call void %0()
br label %if.end
if.end:
ret void
}
; Attribute group #0 marks @foo as optsize and enables the
; retpoline-external-thunk target feature.
attributes #0 = { optsize "target-features"="+retpoline-external-thunk" }