Files
clang-p2996/llvm/test/Transforms/LoopStrengthReduce/AArch64/pr53625.ll
Harvin Iriawan db158c7c83 [AArch64] Update generic sched model to A510
Refresh of the generic scheduling model to use A510 instead of A55.
  Main benefits are to the little core, and introducing SVE scheduling information.
  Changes tested on various OoO cores, no performance degradation is seen.

  Differential Revision: https://reviews.llvm.org/D156799
2023-08-21 12:25:15 +01:00

173 lines
6.3 KiB
LLVM

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=aarch64-unknown-unknown | FileCheck %s
target datalayout = "e-m:w-p:64:64-i32:32-i64:64-i128:128-n32:64-S128"
; we need to generate post index load for this case
define i32 @test(i32 %c, ptr %a, ptr %b) {
; CHECK-LABEL: test:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: cmp w0, #1
; CHECK-NEXT: b.lt .LBB0_4
; CHECK-NEXT: // %bb.1: // %for.body.preheader
; CHECK-NEXT: mov w8, w0
; CHECK-NEXT: .LBB0_2: // %for.body
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
; CHECK-NEXT: ldr w9, [x1], #4
; CHECK-NEXT: cbnz w9, .LBB0_5
; CHECK-NEXT: // %bb.3: // %for.cond
; CHECK-NEXT: // in Loop: Header=BB0_2 Depth=1
; CHECK-NEXT: subs x8, x8, #1
; CHECK-NEXT: b.ne .LBB0_2
; CHECK-NEXT: .LBB0_4:
; CHECK-NEXT: mov w0, wzr
; CHECK-NEXT: ret
; CHECK-NEXT: .LBB0_5:
; CHECK-NEXT: mov w0, #1 // =0x1
; CHECK-NEXT: ret
entry:
%cmp13 = icmp sgt i32 %c, 0
br i1 %cmp13, label %for.body.preheader, label %return
for.body.preheader: ; preds = %entry
%wide.trip.count = zext i32 %c to i64
br label %for.body
for.cond: ; preds = %for.body
%iv.next = add nuw nsw i64 %iv, 1
%exitcond.not = icmp eq i64 %iv.next, %wide.trip.count
br i1 %exitcond.not, label %return, label %for.body
for.body: ; preds = %for.body.preheader, %for.cond
%iv = phi i64 [ 0, %for.body.preheader ], [ %iv.next, %for.cond ]
%arrayidx = getelementptr inbounds i32, ptr %a, i64 %iv
%val = load i32, ptr %arrayidx, align 4
%tobool3.not = icmp eq i32 %val, 0
br i1 %tobool3.not, label %for.cond, label %return
return: ; preds = %for.cond, %for.body, %entry
%retval.1 = phi i32 [ 0, %entry ], [ 0, %for.cond ], [ 1, %for.body ]
ret i32 %retval.1
}
; negative case: %arrayidx.b is not in header
define i64 @IVIncHoist_not_all_user_in_header(i32 %c, ptr %a, ptr %b) {
; CHECK-LABEL: IVIncHoist_not_all_user_in_header:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: cmp w0, #1
; CHECK-NEXT: b.lt .LBB1_5
; CHECK-NEXT: // %bb.1: // %for.body.preheader
; CHECK-NEXT: mov x8, xzr
; CHECK-NEXT: mov w9, w0
; CHECK-NEXT: add x10, x1, #4
; CHECK-NEXT: add x11, x2, #8
; CHECK-NEXT: mov w0, #1 // =0x1
; CHECK-NEXT: .LBB1_2: // %for.body
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
; CHECK-NEXT: ldr w12, [x10, x8, lsl #2]
; CHECK-NEXT: cbnz w12, .LBB1_7
; CHECK-NEXT: // %bb.3: // %if.then
; CHECK-NEXT: // in Loop: Header=BB1_2 Depth=1
; CHECK-NEXT: ldr w12, [x11, x8, lsl #2]
; CHECK-NEXT: cbnz w12, .LBB1_6
; CHECK-NEXT: // %bb.4: // %for.cond
; CHECK-NEXT: // in Loop: Header=BB1_2 Depth=1
; CHECK-NEXT: add x8, x8, #1
; CHECK-NEXT: cmp x9, x8
; CHECK-NEXT: b.ne .LBB1_2
; CHECK-NEXT: .LBB1_5:
; CHECK-NEXT: mov x0, xzr
; CHECK-NEXT: ret
; CHECK-NEXT: .LBB1_6: // %if.then.return.loopexit_crit_edge
; CHECK-NEXT: add x0, x8, #3
; CHECK-NEXT: .LBB1_7: // %return
; CHECK-NEXT: ret
entry:
%cmp13 = icmp sgt i32 %c, 0
br i1 %cmp13, label %for.body.preheader, label %return
for.body.preheader: ; preds = %entry
%wide.trip.count = zext i32 %c to i64
br label %for.body
for.cond: ; preds = %for.body
%iv.next = add nuw nsw i64 %iv, 1
%exitcond.not = icmp eq i64 %iv.next, %wide.trip.count
br i1 %exitcond.not, label %return, label %for.body
for.body: ; preds = %for.body.preheader, %for.cond
%iv = phi i64 [ 0, %for.body.preheader ], [ %iv.next, %for.cond ]
%iv.a = phi i64 [ 1, %for.body.preheader ], [ %iv.next.a, %for.cond ]
%iv.b = phi i64 [ 2, %for.body.preheader ], [ %iv.next.b, %for.cond ]
%arrayidx.a = getelementptr inbounds i32, ptr %a, i64 %iv.a
%iv.next.a = add nuw nsw i64 %iv.a, 1
%val.a = load i32, ptr %arrayidx.a, align 4
%tobool3.not = icmp eq i32 %val.a, 0
br i1 %tobool3.not, label %if.then, label %return
if.then:
%arrayidx.b = getelementptr inbounds i32, ptr %b, i64 %iv.b
%iv.next.b = add nuw nsw i64 %iv.b, 1
%val.b = load i32, ptr %arrayidx.b, align 4
%tobool4.not = icmp eq i32 %val.b, 0
br i1 %tobool4.not, label %for.cond, label %return
return: ; preds = %for.cond, %for.body, %entry
%retval.1 = phi i64 [ 0, %entry ], [ 0, %for.cond ], [ 1, %for.body ], [ %iv.next.b, %if.then ]
ret i64 %retval.1
}
%struct.A = type { i32 }
; this used to crash because the load type is struct
define i32 @negative_test_type_is_struct(i32 %c, ptr %a, ptr %b) {
; CHECK-LABEL: negative_test_type_is_struct:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: cmp w0, #1
; CHECK-NEXT: b.lt .LBB2_4
; CHECK-NEXT: // %bb.1: // %for.body.preheader
; CHECK-NEXT: mov w8, w0
; CHECK-NEXT: .LBB2_2: // %for.body
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
; CHECK-NEXT: ldr w9, [x1]
; CHECK-NEXT: cbnz w9, .LBB2_5
; CHECK-NEXT: // %bb.3: // %for.cond
; CHECK-NEXT: // in Loop: Header=BB2_2 Depth=1
; CHECK-NEXT: subs x8, x8, #1
; CHECK-NEXT: add x1, x1, #4
; CHECK-NEXT: b.ne .LBB2_2
; CHECK-NEXT: .LBB2_4:
; CHECK-NEXT: mov w0, wzr
; CHECK-NEXT: ret
; CHECK-NEXT: .LBB2_5:
; CHECK-NEXT: mov w0, #1 // =0x1
; CHECK-NEXT: ret
entry:
%cmp13 = icmp sgt i32 %c, 0
br i1 %cmp13, label %for.body.preheader, label %return
for.body.preheader: ; preds = %entry
%wide.trip.count = zext i32 %c to i64
br label %for.body
for.cond: ; preds = %for.body
%iv.next = add nuw nsw i64 %iv, 1
%exitcond.not = icmp eq i64 %iv.next, %wide.trip.count
br i1 %exitcond.not, label %return, label %for.body
for.body: ; preds = %for.body.preheader, %for.cond
%iv = phi i64 [ 0, %for.body.preheader ], [ %iv.next, %for.cond ]
%arrayidx = getelementptr inbounds i32, ptr %a, i64 %iv
%str.val = load %struct.A, ptr %arrayidx
%val = extractvalue %struct.A %str.val, 0
%tobool3.not = icmp eq i32 %val, 0
br i1 %tobool3.not, label %for.cond, label %return
return: ; preds = %for.cond, %for.body, %entry
%retval.1 = phi i32 [ 0, %entry ], [ 0, %for.cond ], [ 1, %for.body ]
ret i32 %retval.1
}