Files
clang-p2996/llvm/test/CodeGen/ARM/cortex-a57-misched-basic.ll
Kristof Beyls eecb353d0e [ARM] Make -mcpu=generic schedule for an in-order core (Cortex-A8).
The benchmarking summarized in
http://lists.llvm.org/pipermail/llvm-dev/2017-May/113525.html showed
this is beneficial for a wide range of cores.

As is to be expected, quite a few small adaptations are needed to the
regressions tests, as the difference in scheduling results in:
- Quite a few small instruction schedule differences.
- A few changes in register allocation decisions caused by different
 instruction schedules.
- A few changes in IfConversion decisions, due to a difference in
 instruction schedule and/or the estimated cost of a branch mispredict.

llvm-svn: 306514
2017-06-28 07:07:03 +00:00

54 lines
1.7 KiB
LLVM

; REQUIRES: asserts
; RUN: llc < %s -mtriple=armv8r-eabi -mcpu=cortex-a57 -enable-misched -verify-misched -debug-only=machine-scheduler -o - 2>&1 > /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=A57_SCHED
; RUN: llc < %s -mtriple=armv8r-eabi -mcpu=generic -enable-misched -verify-misched -debug-only=machine-scheduler -o - 2>&1 > /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=GENERIC
; Check the latency for instructions for both generic and cortex-a57.
; SDIV should be scheduled at the block's begin (20 cyc of independent M unit).
;
; CHECK: ********** MI Scheduling **********
; CHECK: foo:BB#0 entry
; GENERIC: LDRi12
; GENERIC: Latency : 1
; GENERIC: EORrr
; GENERIC: Latency : 1
; GENERIC: ADDrr
; GENERIC: Latency : 1
; GENERIC: SDIV
; GENERIC: Latency : 0
; GENERIC: SUBrr
; GENERIC: Latency : 1
; A57_SCHED: SDIV
; A57_SCHED: Latency : 20
; A57_SCHED: EORrr
; A57_SCHED: Latency : 1
; A57_SCHED: LDRi12
; A57_SCHED: Latency : 4
; A57_SCHED: ADDrr
; A57_SCHED: Latency : 1
; A57_SCHED: SUBrr
; A57_SCHED: Latency : 1
; CHECK: ** Final schedule for BB#0 ***
; GENERIC: LDRi12
; GENERIC: SDIV
; A57_SCHED: SDIV
; A57_SCHED: LDRi12
; CHECK: ********** INTERVALS **********
target datalayout = "e-m:e-p:32:32-i64:64-v128:64:128-a:0:32-n32-S64"
target triple = "armv8r-arm-none-eabi"
; Function Attrs: norecurse nounwind readnone
define hidden i32 @foo(i32 %a, i32 %b, i32 %c, i32* %d) local_unnamed_addr #0 {
entry:
%xor = xor i32 %c, %b
%ld = load i32, i32* %d
%add = add nsw i32 %xor, %ld
%div = sdiv i32 %a, %b
%sub = sub i32 %div, %add
ret i32 %sub
}