Files
clang-p2996/llvm/test/Transforms/LoopStrengthReduce/AArch64/pr53625.ll
sgokhale c4a60c9d34 [CodeGen][ShrinkWrap] Enable PostShrinkWrap by default
This is an attempt to reland D42600 and enable this optimisation by default.

This also resolves the issue pointed out in the context of PGO build.

Differential Revision: https://reviews.llvm.org/D42600
2023-05-25 13:56:29 +05:30

173 lines
6.3 KiB
LLVM

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; The command below feeds this file to llc with a generic AArch64 triple and
; pipes the emitted assembly to FileCheck, which verifies it against the
; assertion comments placed at the top of each function.
; RUN: llc < %s -mtriple=aarch64-unknown-unknown | FileCheck %s
; Data layout: little-endian ("e"), Windows COFF symbol mangling ("m:w"),
; 64-bit pointers, native integer widths of 32 and 64 bits, and a 128-bit
; natural stack alignment.
target datalayout = "e-m:w-p:64:64-i32:32-i64:64-i128:128-n32:64-S128"
; Positive case: we need to generate a post-indexed load here. The only memory
; access in the loop is the i32 load of %a[%iv] in the loop header, and the
; expected assembly folds the pointer increment into it: `ldr w9, [x1], #4`.
;
; Rough C equivalent:
;   for (i = 0; i < c; i++) if (a[i] != 0) return 1;
;   return 0;
; The %b argument is not used by this function.
define i32 @test(i32 %c, ptr %a, ptr %b) {
; CHECK-LABEL: test:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: cmp w0, #1
; CHECK-NEXT: b.lt .LBB0_4
; CHECK-NEXT: // %bb.1: // %for.body.preheader
; CHECK-NEXT: mov w8, w0
; CHECK-NEXT: .LBB0_2: // %for.body
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
; CHECK-NEXT: ldr w9, [x1], #4
; CHECK-NEXT: cbnz w9, .LBB0_5
; CHECK-NEXT: // %bb.3: // %for.cond
; CHECK-NEXT: // in Loop: Header=BB0_2 Depth=1
; CHECK-NEXT: subs x8, x8, #1
; CHECK-NEXT: b.ne .LBB0_2
; CHECK-NEXT: .LBB0_4:
; CHECK-NEXT: mov w0, wzr
; CHECK-NEXT: ret
; CHECK-NEXT: .LBB0_5:
; CHECK-NEXT: mov w0, #1 // =0x1
; CHECK-NEXT: ret
entry:
; Guard: enter the loop only when %c > 0 (signed); otherwise return 0.
%cmp13 = icmp sgt i32 %c, 0
br i1 %cmp13, label %for.body.preheader, label %return
for.body.preheader: ; preds = %entry
; The trip count is %c widened to i64 so it can be compared with the i64 IV.
%wide.trip.count = zext i32 %c to i64
br label %for.body
for.cond: ; preds = %for.body
; Latch: step the induction variable and leave with 0 once it reaches the
; trip count.
%iv.next = add nuw nsw i64 %iv, 1
%exitcond.not = icmp eq i64 %iv.next, %wide.trip.count
br i1 %exitcond.not, label %return, label %for.body
for.body: ; preds = %for.body.preheader, %for.cond
; Header: load %a[%iv]; a non-zero element takes the early exit that yields 1.
%iv = phi i64 [ 0, %for.body.preheader ], [ %iv.next, %for.cond ]
%arrayidx = getelementptr inbounds i32, ptr %a, i64 %iv
%val = load i32, ptr %arrayidx, align 4
%tobool3.not = icmp eq i32 %val, 0
br i1 %tobool3.not, label %for.cond, label %return
return: ; preds = %for.cond, %for.body, %entry
; 1 only when arriving from the early exit in %for.body; 0 on every other path.
%retval.1 = phi i32 [ 0, %entry ], [ 0, %for.cond ], [ 1, %for.body ]
ret i32 %retval.1
}
; Negative case: %arrayidx.b (and the load through it) lives in %if.then, not
; in the loop header, so not every induction-variable user is in the header.
; The expected assembly therefore uses register-offset loads that share one
; index register (`ldr w12, [x10, x8, lsl #2]` and `ldr w12, [x11, x8, lsl #2]`)
; instead of post-indexed loads.
;
; Three induction variables advance in lock step: %iv from 0, %iv.a from 1 and
; %iv.b from 2. The function returns 1 if %a[%iv.a] is non-zero, %iv.b + 1 if
; %b[%iv.b] is non-zero, and 0 if the loop runs to completion or %c <= 0.
define i64 @IVIncHoist_not_all_user_in_header(i32 %c, ptr %a, ptr %b) {
; CHECK-LABEL: IVIncHoist_not_all_user_in_header:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: cmp w0, #1
; CHECK-NEXT: b.lt .LBB1_5
; CHECK-NEXT: // %bb.1: // %for.body.preheader
; CHECK-NEXT: mov x8, xzr
; CHECK-NEXT: mov w9, w0
; CHECK-NEXT: add x10, x1, #4
; CHECK-NEXT: add x11, x2, #8
; CHECK-NEXT: mov w0, #1 // =0x1
; CHECK-NEXT: .LBB1_2: // %for.body
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
; CHECK-NEXT: ldr w12, [x10, x8, lsl #2]
; CHECK-NEXT: cbnz w12, .LBB1_7
; CHECK-NEXT: // %bb.3: // %if.then
; CHECK-NEXT: // in Loop: Header=BB1_2 Depth=1
; CHECK-NEXT: ldr w12, [x11, x8, lsl #2]
; CHECK-NEXT: cbnz w12, .LBB1_6
; CHECK-NEXT: // %bb.4: // %for.cond
; CHECK-NEXT: // in Loop: Header=BB1_2 Depth=1
; CHECK-NEXT: add x8, x8, #1
; CHECK-NEXT: cmp x9, x8
; CHECK-NEXT: b.ne .LBB1_2
; CHECK-NEXT: .LBB1_5:
; CHECK-NEXT: mov x0, xzr
; CHECK-NEXT: ret
; CHECK-NEXT: .LBB1_6: // %if.then.return.loopexit_crit_edge
; CHECK-NEXT: add x0, x8, #3
; CHECK-NEXT: .LBB1_7: // %return
; CHECK-NEXT: ret
entry:
; Guard: enter the loop only when %c > 0 (signed); otherwise return 0.
%cmp13 = icmp sgt i32 %c, 0
br i1 %cmp13, label %for.body.preheader, label %return
for.body.preheader: ; preds = %entry
; The trip count is %c widened to i64 so it can be compared with the i64 IV.
%wide.trip.count = zext i32 %c to i64
br label %for.body
for.cond: ; preds = %if.then
; Latch: only %iv is stepped here; %iv.a and %iv.b are stepped in the blocks
; that use them. Leaves with 0 once %iv reaches the trip count.
%iv.next = add nuw nsw i64 %iv, 1
%exitcond.not = icmp eq i64 %iv.next, %wide.trip.count
br i1 %exitcond.not, label %return, label %for.body
for.body: ; preds = %for.body.preheader, %for.cond
; Header: holds all three IV phis but uses only %iv.a for addressing.
; A non-zero %a[%iv.a] takes the early exit that yields 1.
%iv = phi i64 [ 0, %for.body.preheader ], [ %iv.next, %for.cond ]
%iv.a = phi i64 [ 1, %for.body.preheader ], [ %iv.next.a, %for.cond ]
%iv.b = phi i64 [ 2, %for.body.preheader ], [ %iv.next.b, %for.cond ]
%arrayidx.a = getelementptr inbounds i32, ptr %a, i64 %iv.a
%iv.next.a = add nuw nsw i64 %iv.a, 1
%val.a = load i32, ptr %arrayidx.a, align 4
%tobool3.not = icmp eq i32 %val.a, 0
br i1 %tobool3.not, label %if.then, label %return
if.then: ; preds = %for.body
; Non-header user of an IV: %iv.b addresses %b here, and %iv.next.b is also
; the value returned when %b[%iv.b] is non-zero.
%arrayidx.b = getelementptr inbounds i32, ptr %b, i64 %iv.b
%iv.next.b = add nuw nsw i64 %iv.b, 1
%val.b = load i32, ptr %arrayidx.b, align 4
%tobool4.not = icmp eq i32 %val.b, 0
br i1 %tobool4.not, label %for.cond, label %return
return: ; preds = %if.then, %for.cond, %for.body, %entry
; 0 from the guard or a completed loop, 1 from the header's early exit, and
; %iv.next.b from the early exit in %if.then.
%retval.1 = phi i64 [ 0, %entry ], [ 0, %for.cond ], [ 1, %for.body ], [ %iv.next.b, %if.then ]
ret i64 %retval.1
}
; Single-field struct wrapping an i32; used as the load type in the test below.
%struct.A = type { i32 }
; Regression test: this used to crash because the load type is a struct.
; Same loop shape as @test, but the header loads a whole %struct.A and then
; extracts field 0. The expected assembly keeps a plain `ldr w9, [x1]` and a
; separate `add x1, x1, #4` in the latch rather than a post-indexed load.
; The %b argument is not used by this function.
define i32 @negative_test_type_is_struct(i32 %c, ptr %a, ptr %b) {
; CHECK-LABEL: negative_test_type_is_struct:
; CHECK: // %bb.0: // %entry
; CHECK-NEXT: cmp w0, #1
; CHECK-NEXT: b.lt .LBB2_4
; CHECK-NEXT: // %bb.1: // %for.body.preheader
; CHECK-NEXT: mov w8, w0
; CHECK-NEXT: .LBB2_2: // %for.body
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
; CHECK-NEXT: ldr w9, [x1]
; CHECK-NEXT: cbnz w9, .LBB2_5
; CHECK-NEXT: // %bb.3: // %for.cond
; CHECK-NEXT: // in Loop: Header=BB2_2 Depth=1
; CHECK-NEXT: add x1, x1, #4
; CHECK-NEXT: subs x8, x8, #1
; CHECK-NEXT: b.ne .LBB2_2
; CHECK-NEXT: .LBB2_4:
; CHECK-NEXT: mov w0, wzr
; CHECK-NEXT: ret
; CHECK-NEXT: .LBB2_5:
; CHECK-NEXT: mov w0, #1 // =0x1
; CHECK-NEXT: ret
entry:
; Guard: enter the loop only when %c > 0 (signed); otherwise return 0.
%cmp13 = icmp sgt i32 %c, 0
br i1 %cmp13, label %for.body.preheader, label %return
for.body.preheader: ; preds = %entry
; The trip count is %c widened to i64 so it can be compared with the i64 IV.
%wide.trip.count = zext i32 %c to i64
br label %for.body
for.cond: ; preds = %for.body
; Latch: step the induction variable and leave with 0 once it reaches the
; trip count.
%iv.next = add nuw nsw i64 %iv, 1
%exitcond.not = icmp eq i64 %iv.next, %wide.trip.count
br i1 %exitcond.not, label %return, label %for.body
for.body: ; preds = %for.body.preheader, %for.cond
; Header: the address is computed with i32 element stride, but the load itself
; has the aggregate type %struct.A; the i32 payload is then pulled out with
; extractvalue. A non-zero payload takes the early exit that yields 1.
%iv = phi i64 [ 0, %for.body.preheader ], [ %iv.next, %for.cond ]
%arrayidx = getelementptr inbounds i32, ptr %a, i64 %iv
%str.val = load %struct.A, ptr %arrayidx
%val = extractvalue %struct.A %str.val, 0
%tobool3.not = icmp eq i32 %val, 0
br i1 %tobool3.not, label %for.cond, label %return
return: ; preds = %for.cond, %for.body, %entry
; 1 only when arriving from the early exit in %for.body; 0 on every other path.
%retval.1 = phi i32 [ 0, %entry ], [ 0, %for.cond ], [ 1, %for.body ]
ret i32 %retval.1
}