This essentially reverts the x86-64 side effect of r327198. For x86-32, @PLT (R_386_PLT32) is not suitable in -fno-pic mode so the code forces MO_NO_FLAG (like a forced dso_local) (https://bugs.llvm.org//show_bug.cgi?id=36674#c6). For x86-64, both `call/jmp foo` and `call/jmp foo@PLT` emit R_X86_64_PLT32 (https://sourceware.org/bugzilla/show_bug.cgi?id=22791) so there is no difference using @PLT. Using @PLT is actually favorable because this drops a difference with -fpie/-fpic code and makes it possible to avoid a canonical PLT entry when taking the address of an undefined function symbol.
100 lines
2.8 KiB
LLVM
100 lines
2.8 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=avx | FileCheck %s
|
|
|
|
declare double @sin(double %f)
|
|
|
|
; When the subs are strict, they can't be removed because of signed zero.
|
|
|
|
define double @strict(double %e) nounwind {
|
|
; CHECK-LABEL: strict:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: pushq %rax
|
|
; CHECK-NEXT: vxorpd %xmm1, %xmm1, %xmm1
|
|
; CHECK-NEXT: vsubsd %xmm0, %xmm1, %xmm0
|
|
; CHECK-NEXT: callq sin
|
|
; CHECK-NEXT: vxorpd %xmm1, %xmm1, %xmm1
|
|
; CHECK-NEXT: vsubsd %xmm0, %xmm1, %xmm0
|
|
; CHECK-NEXT: popq %rax
|
|
; CHECK-NEXT: retq
|
|
%f = fsub double 0.0, %e
|
|
%g = call double @sin(double %f) readonly
|
|
%h = fsub double 0.0, %g
|
|
ret double %h
|
|
}
|
|
|
|
; 'fast' implies no-signed-zeros, so the negates fold away.
|
|
; The 'sin' does not need any fast-math-flags for this transform.
|
|
|
|
define double @fast(double %e) nounwind {
|
|
; CHECK-LABEL: fast:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: jmp sin@PLT # TAILCALL
|
|
%f = fsub fast double 0.0, %e
|
|
%g = call double @sin(double %f) readonly
|
|
%h = fsub fast double 0.0, %g
|
|
ret double %h
|
|
}
|
|
|
|
; No-signed-zeros is all that we need for this transform.
|
|
|
|
define double @nsz(double %e) nounwind {
|
|
; CHECK-LABEL: nsz:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: jmp sin@PLT # TAILCALL
|
|
%f = fsub nsz double 0.0, %e
|
|
%g = call double @sin(double %f) readonly
|
|
%h = fsub nsz double 0.0, %g
|
|
ret double %h
|
|
}
|
|
|
|
; The 1st negate is strict, so we can't kill that sub, but the 2nd disappears.
|
|
|
|
define double @semi_strict1(double %e) nounwind {
|
|
; CHECK-LABEL: semi_strict1:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: pushq %rax
|
|
; CHECK-NEXT: vxorpd %xmm1, %xmm1, %xmm1
|
|
; CHECK-NEXT: vsubsd %xmm0, %xmm1, %xmm0
|
|
; CHECK-NEXT: callq sin
|
|
; CHECK-NEXT: vxorpd {{.*}}(%rip), %xmm0, %xmm0
|
|
; CHECK-NEXT: popq %rax
|
|
; CHECK-NEXT: retq
|
|
%f = fsub double 0.0, %e
|
|
%g = call double @sin(double %f) readonly
|
|
%h = fsub nsz double 0.0, %g
|
|
ret double %h
|
|
}
|
|
|
|
; The 2nd negate is strict, so we can't kill it. It becomes an add of zero instead.
|
|
|
|
define double @semi_strict2(double %e) nounwind {
|
|
; CHECK-LABEL: semi_strict2:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: pushq %rax
|
|
; CHECK-NEXT: callq sin
|
|
; CHECK-NEXT: vxorpd %xmm1, %xmm1, %xmm1
|
|
; CHECK-NEXT: vaddsd %xmm1, %xmm0, %xmm0
|
|
; CHECK-NEXT: popq %rax
|
|
; CHECK-NEXT: retq
|
|
%f = fsub nsz double 0.0, %e
|
|
%g = call double @sin(double %f) readonly
|
|
%h = fsub double 0.0, %g
|
|
ret double %h
|
|
}
|
|
|
|
; FIXME:
|
|
; Auto-upgrade function attribute to IR-level fast-math-flags.
|
|
|
|
define double @fn_attr(double %e) nounwind #0 {
|
|
; CHECK-LABEL: fn_attr:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: jmp sin@PLT # TAILCALL
|
|
%f = fsub double 0.0, %e
|
|
%g = call double @sin(double %f) readonly
|
|
%h = fsub double 0.0, %g
|
|
ret double %h
|
|
}
|
|
|
|
attributes #0 = { "unsafe-fp-math"="true" "no-signed-zeros-fp-math"="true" }
|
|
|