Files
clang-p2996/llvm/test/CodeGen/X86/pr33290.ll
Jeremy Morse e6bf48d110 [X86] Don't request 0x90 nop filling in p2align directives (#110134)
As of rev ea222be0d, LLVM's assembler will actually try to honour the
"fill value" part of p2align directives. X86 printed these as 0x90, which
isn't actually what it wanted: we want multi-byte nops for .text
padding. Compiling via a textual assembly file produces single-byte
nop padding since ea222be0d but the built-in assembler will produce
multi-byte nops. This divergent behaviour is undesirable.

To fix: don't set the byte padding field for x86, which allows the
assembler to pick multi-byte nops. Test that we get the same multi-byte
padding when compiled via textual assembly or directly to object file.
Added same-align-bytes-with-llasm-llobj.ll to that effect, updated
numerous other tests to not contain check-lines for the explicit padding.
2024-10-02 11:14:05 +01:00

51 lines
1.6 KiB
LLVM

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=i686-unknown-unknown | FileCheck %s --check-prefix=X86
; RUN: llc < %s -mtriple=x86_64-unknown-unknown | FileCheck %s --check-prefix=X64
; Globals referenced by @e. All three have common linkage and a zero/null
; initializer.
; @a: never loaded or stored in this file; only its address is used, as an
; integer operand of the 128-bit add in @e.
@a = common dso_local global i32 0, align 4
; @c: single byte that @e loads and then overwrites on every loop iteration.
@c = common dso_local local_unnamed_addr global i8 0, align 1
; @b: pointer that @e loads once before its loop; the 32-bit result is stored
; through it.
@b = common dso_local local_unnamed_addr global ptr null, align 8
; @e: endless loop doing 128-bit arithmetic on the address of a global.
; Each iteration zero-extends the byte in @c to i128, adds (address of @a) + 2,
; writes bits 64..71 of the sum back to @c, and stores the low 32 bits of the
; sum through the pointer that was loaded from @b before the loop.
;
; The assertions inside the function are autogenerated (see the NOTE line at
; the top of the test); regenerate them with utils/update_llc_test_checks.py
; instead of editing them by hand.
; Expected code, per the assertions: for the i686 triple the store to c is a
; constant 0 and the add is folded into a single leal; for the x86-64 triple
; the carries out of the two 64-bit adds are collected with setb/adcb and that
; byte is stored to c.
; NOTE(review): presumably a regression test for LLVM PR33290, going by the
; file name -- confirm against the bug tracker.
define dso_local void @e() {
; X86-LABEL: e:
; X86: # %bb.0: # %entry
; X86-NEXT: movl b, %eax
; X86-NEXT: .p2align 4
; X86-NEXT: .LBB0_1: # %for.cond
; X86-NEXT: # =>This Inner Loop Header: Depth=1
; X86-NEXT: movzbl c, %ecx
; X86-NEXT: movb $0, c
; X86-NEXT: leal a+2(%ecx), %ecx
; X86-NEXT: movl %ecx, (%eax)
; X86-NEXT: jmp .LBB0_1
;
; X64-LABEL: e:
; X64: # %bb.0: # %entry
; X64-NEXT: movq b(%rip), %rax
; X64-NEXT: .p2align 4
; X64-NEXT: .LBB0_1: # %for.cond
; X64-NEXT: # =>This Inner Loop Header: Depth=1
; X64-NEXT: movzbl c(%rip), %ecx
; X64-NEXT: addq $a, %rcx
; X64-NEXT: setb %dl
; X64-NEXT: addq $2, %rcx
; X64-NEXT: adcb $0, %dl
; X64-NEXT: movb %dl, c(%rip)
; X64-NEXT: movl %ecx, (%rax)
; X64-NEXT: jmp .LBB0_1
entry:
; The destination pointer is read once, outside the loop.
%0 = load ptr, ptr @b, align 8
br label %for.cond
for.cond:
%1 = load i8, ptr @c, align 1
%conv = zext i8 %1 to i128
; The second operand is a constant expression: the address of @a converted to
; i128, plus 2.
%add = add nuw nsw i128 %conv, add (i128 ptrtoint (ptr @a to i128), i128 2)
; Shift the sum right by 64 and keep the lowest byte of what remains; that
; byte replaces the value in @c.
%2 = lshr i128 %add, 64
%conv1 = trunc i128 %2 to i8
store i8 %conv1, ptr @c, align 1
; The low 32 bits of the sum go through the pointer loaded in the entry block.
%conv2 = trunc i128 %add to i32
store i32 %conv2, ptr %0, align 4
; No exit edge: this block branches back to itself unconditionally.
br label %for.cond
}