Files
clang-p2996/llvm/test/CodeGen/PowerPC/noPermuteFormasking.ll
Nemanja Ivanovic 6cc31ca814 [PowerPC] Do not emit record-form rotates when record-form andi suffices
Up until Power9, the performance profiles of rlwinm., rldicl. and andi. were
more or less equivalent. On Power9, however, the rotates are still 2-way
cracked, whereas the and-immediate is not.

This patch just ensures that we don't emit record-form rotates when an andi.
is adequate.

This was first pointed out by Carrot in https://bugs.llvm.org/show_bug.cgi?id=30833;
this patch is a fix for that PR.

Differential Revision: https://reviews.llvm.org/D43977

llvm-svn: 326736
2018-03-05 19:27:16 +00:00

43 lines
1.5 KiB
LLVM

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; Compile this file for a little-endian 64-bit PowerPC target tuned for pwr9,
; with the machine verifier enabled, and match llc's output against the
; assertions embedded in the function below.
; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
; RUN: -verify-machineinstrs -O2 < %s | FileCheck %s
; COMDAT named "test" with selection kind "any"; @test below is marked comdat.
$test = comdat any
; Function Attrs: noinline nounwind
; Codegen regression test. The IR masks the low two bits of a pointer value and
; compares the result with zero; the autogenerated assertions below pin the
; expected lowering to a record-form and-immediate (andi.) whose CR result is
; combined with the signed compare via crand and consumed by isel.
; NOTE(review): attribute group #0 is referenced here but its definition is not
; visible in this excerpt -- confirm it matches the "Function Attrs" line above.
define void @test() local_unnamed_addr #0 comdat align 2 {
; CHECK-LABEL: test:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: ld 3, 0(3)
; CHECK-NEXT: cmpdi 1, 3, 0
; CHECK-NEXT: andi. 4, 3, 3
; CHECK-NEXT: crand 20, 2, 5
; CHECK-NEXT: isel 3, 0, 3, 20
; CHECK-NEXT: addi 3, 3, -1
; CHECK-NEXT: cmpldi 3, 3
; CHECK-NEXT: bltlr+ 0
; CHECK-NEXT: # %bb.1: # %for.body.i.i.i.i.i.i.i
entry:
; Both loads read through undef pointers, and the GEP index is undef as well.
%0 = load float*, float** undef, align 8
%1 = load i64, i64* undef, align 8
%add.ptr.i.i.i.i = getelementptr inbounds float, float* %0, i64 undef
; Convert the address to an integer, keep its low two bits, and test them
; against zero.
%2 = ptrtoint float* %add.ptr.i.i.i.i to i64
%and.i.i.i.i.i.i.i = and i64 %2, 3
%tobool.i.i.i.i.i.i.i = icmp eq i64 %and.i.i.i.i.i.i.i, 0
; Signed test that the loaded i64 is greater than zero.
%cmp.i.i.i.i.i.i.i = icmp slt i64 0, %1
; When both conditions hold the select yields 0, otherwise the loaded value.
%3 = and i1 %tobool.i.i.i.i.i.i.i, %cmp.i.i.i.i.i.i.i
%spec.select.i.i.i.i.i.i.i = select i1 %3, i64 0, i64 %1
%4 = add i64 %spec.select.i.i.i.i.i.i.i, -1
; Subtracting zero leaves the value unchanged; %5 carries the same value as %4.
%5 = sub i64 %4, 0
br label %for.body.i.i.i.i.i.i.i.prol.loopexit
for.body.i.i.i.i.i.i.i.prol.loopexit: ; preds = %entry
; Unsigned compare against 3: below 3 goes to exitBB, otherwise to the block
; that ends in unreachable.
%6 = icmp ult i64 %5, 3
br i1 %6, label %exitBB, label %for.body.i.i.i.i.i.i.i
for.body.i.i.i.i.i.i.i: ; preds = %for.body.i.i.i.i.i.i.i.prol.loopexit
unreachable
exitBB: ; preds = %for.body.i.i.i.i.i.i.i.prol.loopexit
ret void
}