Files
clang-p2996/llvm/test/CodeGen/X86/pr63692.ll
Jeremy Morse e6bf48d110 [X86] Don't request 0x90 nop filling in p2align directives (#110134)
As of rev ea222be0d, LLVM's assembler will actually try to honour the
"fill value" part of p2align directives. X86 printed these as 0x90, which
isn't actually what it wanted: we want multi-byte nops for .text
padding. Compiling via a textual assembly file produces single-byte
nop padding since ea222be0d but the built-in assembler will produce
multi-byte nops. This divergent behaviour is undesirable.

To fix: don't set the byte padding field for x86, which allows the
assembler to pick multi-byte nops. Test that we get the same multi-byte
padding when compiled via textual assembly or directly to object file.
Added same-align-bytes-with-llasm-llobj.ll to that effect, and updated
numerous other tests so they no longer contain check-lines for the explicit padding.
2024-10-02 11:14:05 +01:00

32 lines
1.2 KiB
LLVM

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 3
; RUN: llc < %s -mtriple=x86_64-- | FileCheck %s
; Regression test; the file name suggests it covers PR63692 (confirm against
; the bug tracker).
;
; @prefault walks the address range [%range_start, %range_end) in 4096-byte
; steps and performs a volatile, monotonic `atomicrmw or` with an i8 0 operand
; on the byte at each step. OR-ing with 0 leaves the stored value unchanged and
; the result (%0) is never used, yet the expected x86-64 assembly below still
; contains `lock orb $0, (%rdi)` inside the loop, i.e. the operation is
; expected to be emitted as a real locked read-modify-write instruction.
; NOTE(review): presumably the point is that the volatile RMW must not be
; dropped or weakened into a plain load/fence -- confirm.
;
; The loop header is expected to be aligned with a bare `.p2align 4`, with no
; fill-value operand.
define void @prefault(ptr noundef %range_start, ptr noundef readnone %range_end) {
; CHECK-LABEL: prefault:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: cmpq %rsi, %rdi
; CHECK-NEXT: jae .LBB0_3
; CHECK-NEXT: .p2align 4
; CHECK-NEXT: .LBB0_1: # %while.body
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
; CHECK-NEXT: lock orb $0, (%rdi)
; CHECK-NEXT: addq $4096, %rdi # imm = 0x1000
; CHECK-NEXT: cmpq %rsi, %rdi
; CHECK-NEXT: jb .LBB0_1
; CHECK-NEXT: .LBB0_3: # %while.end
; CHECK-NEXT: retq
entry:
; Skip the loop entirely when the range is empty
; (%range_start >= %range_end, compared as unsigned).
%cmp3 = icmp ult ptr %range_start, %range_end
br i1 %cmp3, label %while.body, label %while.end
while.body: ; preds = %entry, %while.body
; %start.04 is the current address: %range_start on the first iteration,
; %add.ptr on every back-edge.
%start.04 = phi ptr [ %add.ptr, %while.body ], [ %range_start, %entry ]
; Volatile atomic OR of 0 into the byte at %start.04; the stored value is
; unchanged and the returned old value is unused.
%0 = atomicrmw volatile or ptr %start.04, i8 0 monotonic, align 1
; Advance by 4096 bytes (presumably one page -- confirm).
%add.ptr = getelementptr inbounds i8, ptr %start.04, i64 4096
; Keep looping while the next address is still below %range_end (unsigned).
%cmp = icmp ult ptr %add.ptr, %range_end
br i1 %cmp, label %while.body, label %while.end
while.end: ; preds = %while.body, %entry
ret void
}