With this patch, an undefined mask element in a shufflevector is printed as poison. This change supports the new shufflevector semantics for undefined mask elements. Differential Revision: https://reviews.llvm.org/D149210
51 lines
2.3 KiB
LLVM
51 lines
2.3 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
; RUN: opt --passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu -mcpu=icelake-server -S < %s | FileCheck %s

; SLP vectorizer test: @test takes no arguments and returns an i1.
;
; The scalar body builds eight i64 values from constant-derived operands
; (six `or`s and two `sub`s), compares each of them `ult 0`, and folds the
; eight i1 results together with a chain of scalar `or`s.
;
; The CHECK lines expect the vectorizer to turn this into one <8 x i64> `or`
; and one <8 x i64> `sub` blended by a shufflevector, a single <8 x i64>
; `icmp ult`, and a call to @llvm.vector.reduce.or.v8i1. The first expected
; shufflevector carries a `poison` mask element.
;
; The CHECK lines are autogenerated; regenerate them with
; utils/update_test_checks.py rather than editing them by hand.
define i1 @test() {
; CHECK-LABEL: define i1 @test
; CHECK-SAME: () #[[ATTR0:[0-9]+]] {
; CHECK-NEXT: entry:
; CHECK-NEXT: [[TMP0:%.*]] = shl i64 0, 0
; CHECK-NEXT: [[TMP1:%.*]] = insertelement <8 x i64> <i64 poison, i64 poison, i64 0, i64 poison, i64 0, i64 0, i64 0, i64 0>, i64 [[TMP0]], i32 0
; CHECK-NEXT: [[TMP2:%.*]] = insertelement <8 x i64> [[TMP1]], i64 0, i32 1
; CHECK-NEXT: [[TMP3:%.*]] = insertelement <8 x i64> [[TMP2]], i64 0, i32 3
; CHECK-NEXT: [[TMP4:%.*]] = shufflevector <8 x i64> [[TMP3]], <8 x i64> poison, <4 x i32> <i32 3, i32 poison, i32 1, i32 0>
; CHECK-NEXT: [[TMP5:%.*]] = shufflevector <8 x i64> <i64 undef, i64 0, i64 undef, i64 undef, i64 undef, i64 undef, i64 undef, i64 undef>, <8 x i64> [[TMP3]], <8 x i32> <i32 11, i32 11, i32 11, i32 1, i32 9, i32 9, i32 1, i32 8>
; CHECK-NEXT: [[TMP6:%.*]] = or <8 x i64> [[TMP3]], [[TMP5]]
; CHECK-NEXT: [[TMP7:%.*]] = sub <8 x i64> [[TMP3]], [[TMP5]]
; CHECK-NEXT: [[TMP8:%.*]] = shufflevector <8 x i64> [[TMP6]], <8 x i64> [[TMP7]], <8 x i32> <i32 0, i32 1, i32 2, i32 11, i32 12, i32 5, i32 6, i32 7>
; CHECK-NEXT: [[TMP9:%.*]] = icmp ult <8 x i64> [[TMP8]], zeroinitializer
; CHECK-NEXT: [[TMP10:%.*]] = call i1 @llvm.vector.reduce.or.v8i1(<8 x i1> [[TMP9]])
; CHECK-NEXT: ret i1 [[TMP10]]
;
entry:
  %0 = shl i64 0, 0
  %1 = add i64 0, 0
  %2 = add i64 0, 0
  %3 = or i64 %2, %1
  %cmp750 = icmp ult i64 %3, 0
  %4 = or i64 %0, %1
  %cmp752 = icmp ult i64 %4, 0
  %or753 = or i1 %cmp750, %cmp752
  %5 = or i64 0, %1
  %cmp754 = icmp ult i64 %5, 0
  %or755 = or i1 %or753, %cmp754
  %6 = extractelement <16 x i64> zeroinitializer, i32 0
  %7 = sub i64 %1, %6
  %cmp756 = icmp ult i64 %7, 0
  %or757 = or i1 %or755, %cmp756
  %8 = sub i64 0, %2
  %cmp758 = icmp ult i64 %8, 0
  %or759 = or i1 %or757, %cmp758
  %9 = or i64 0, %2
  %cmp760 = icmp ult i64 %9, 0
  %or761 = or i1 %or759, %cmp760
  %10 = or i64 0, %6
  %cmp762 = icmp ult i64 %10, 0
  %or763 = or i1 %or761, %cmp762
  %11 = or i64 0, %0
  %cmp764 = icmp ult i64 %11, 0
  %or765 = or i1 %or763, %cmp764
  ret i1 %or765
}