; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt < %s -passes=vector-combine -S -mtriple=x86_64-- -mattr=SSE2 | FileCheck %s --check-prefixes=CHECK,SSE
; RUN: opt < %s -passes=vector-combine -S -mtriple=x86_64-- -mattr=AVX2 | FileCheck %s --check-prefixes=CHECK,AVX

; Insert lane 0 of the narrower <2 x double> %b into lane 0 of the
; <4 x double> %a.
; Expected output (shared by the SSE2 and AVX2 runs): the
; extractelement/insertelement pair is left as written.
; NOTE(review): `#0` is referenced but no `attributes #0` definition is visible
; in this file - confirm that is intentional.
define <4 x double> @src_ins0_v4f64_ext0_v2f64(<4 x double> %a, <2 x double> %b) #0 {
; CHECK-LABEL: @src_ins0_v4f64_ext0_v2f64(
; CHECK-NEXT: [[EXT:%.*]] = extractelement <2 x double> [[B:%.*]], i32 0
; CHECK-NEXT: [[INS:%.*]] = insertelement <4 x double> [[A:%.*]], double [[EXT]], i32 0
; CHECK-NEXT: ret <4 x double> [[INS]]
;
  %ext = extractelement <2 x double> %b, i32 0
  %ins = insertelement <4 x double> %a, double %ext, i32 0
  ret <4 x double> %ins
}
; Insert lane 0 of the narrower <2 x double> %b into lane 1 of the
; <4 x double> %a.
; Expected output (shared by the SSE2 and AVX2 runs): the
; extractelement/insertelement pair is left as written.
define <4 x double> @src_ins1_v4f64_ext0_v2f64(<4 x double> %a, <2 x double> %b) #0 {
; CHECK-LABEL: @src_ins1_v4f64_ext0_v2f64(
; CHECK-NEXT: [[EXT:%.*]] = extractelement <2 x double> [[B:%.*]], i32 0
; CHECK-NEXT: [[INS:%.*]] = insertelement <4 x double> [[A:%.*]], double [[EXT]], i32 1
; CHECK-NEXT: ret <4 x double> [[INS]]
;
  %ext = extractelement <2 x double> %b, i32 0
  %ins = insertelement <4 x double> %a, double %ext, i32 1
  ret <4 x double> %ins
}
; Insert lane 0 of the narrower <2 x double> %b into lane 2 of the
; <4 x double> %a.
; Expected output (shared by the SSE2 and AVX2 runs): the
; extractelement/insertelement pair is left as written.
define <4 x double> @src_ins2_v4f64_ext0_v2f64(<4 x double> %a, <2 x double> %b) #0 {
; CHECK-LABEL: @src_ins2_v4f64_ext0_v2f64(
; CHECK-NEXT: [[EXT:%.*]] = extractelement <2 x double> [[B:%.*]], i32 0
; CHECK-NEXT: [[INS:%.*]] = insertelement <4 x double> [[A:%.*]], double [[EXT]], i32 2
; CHECK-NEXT: ret <4 x double> [[INS]]
;
  %ext = extractelement <2 x double> %b, i32 0
  %ins = insertelement <4 x double> %a, double %ext, i32 2
  ret <4 x double> %ins
}
; Insert lane 0 of the narrower <2 x double> %b into lane 3 of the
; <4 x double> %a.
; Expected output (shared by the SSE2 and AVX2 runs): the
; extractelement/insertelement pair is left as written.
define <4 x double> @src_ins3_v4f64_ext0_v2f64(<4 x double> %a, <2 x double> %b) #0 {
; CHECK-LABEL: @src_ins3_v4f64_ext0_v2f64(
; CHECK-NEXT: [[EXT:%.*]] = extractelement <2 x double> [[B:%.*]], i32 0
; CHECK-NEXT: [[INS:%.*]] = insertelement <4 x double> [[A:%.*]], double [[EXT]], i32 3
; CHECK-NEXT: ret <4 x double> [[INS]]
;
  %ext = extractelement <2 x double> %b, i32 0
  %ins = insertelement <4 x double> %a, double %ext, i32 3
  ret <4 x double> %ins
}
; Insert lane 1 of the narrower <2 x double> %b into lane 0 of the
; <4 x double> %a. The two runs expect different output:
;  - SSE2 run: two shufflevectors. The first widens %b to four lanes keeping
;    its lane 1 in place; the second selects mask index 5 (lane 1 of the
;    widened vector) for result lane 0 and lanes 1-3 of %a for the rest.
;  - AVX2 run: the extractelement/insertelement pair is left as written.
define <4 x double> @src_ins0_v4f64_ext1_v2f64(<4 x double> %a, <2 x double> %b) #0 {
; SSE-LABEL: @src_ins0_v4f64_ext1_v2f64(
; SSE-NEXT: [[TMP1:%.*]] = shufflevector <2 x double> [[B:%.*]], <2 x double> poison, <4 x i32> <i32 poison, i32 1, i32 poison, i32 poison>
; SSE-NEXT: [[INS:%.*]] = shufflevector <4 x double> [[A:%.*]], <4 x double> [[TMP1]], <4 x i32> <i32 5, i32 1, i32 2, i32 3>
; SSE-NEXT: ret <4 x double> [[INS]]
;
; AVX-LABEL: @src_ins0_v4f64_ext1_v2f64(
; AVX-NEXT: [[EXT:%.*]] = extractelement <2 x double> [[B:%.*]], i32 1
; AVX-NEXT: [[INS:%.*]] = insertelement <4 x double> [[A:%.*]], double [[EXT]], i32 0
; AVX-NEXT: ret <4 x double> [[INS]]
;
  %ext = extractelement <2 x double> %b, i32 1
  %ins = insertelement <4 x double> %a, double %ext, i32 0
  ret <4 x double> %ins
}
; Insert lane 1 of the narrower <2 x double> %b into lane 1 of the
; <4 x double> %a (same lane index on both sides).
; Expected output (shared by the SSE2 and AVX2 runs): two shufflevectors.
; The first widens %b to four lanes keeping its lane 1 in place; the second
; selects mask index 5 (lane 1 of the widened vector) for result lane 1 and
; takes lanes 0, 2 and 3 from %a.
define <4 x double> @src_ins1_v4f64_ext1_v2f64(<4 x double> %a, <2 x double> %b) #0 {
; CHECK-LABEL: @src_ins1_v4f64_ext1_v2f64(
; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <2 x double> [[B:%.*]], <2 x double> poison, <4 x i32> <i32 poison, i32 1, i32 poison, i32 poison>
; CHECK-NEXT: [[INS:%.*]] = shufflevector <4 x double> [[A:%.*]], <4 x double> [[TMP1]], <4 x i32> <i32 0, i32 5, i32 2, i32 3>
; CHECK-NEXT: ret <4 x double> [[INS]]
;
  %ext = extractelement <2 x double> %b, i32 1
  %ins = insertelement <4 x double> %a, double %ext, i32 1
  ret <4 x double> %ins
}
; Insert lane 1 of the narrower <2 x double> %b into lane 2 of the
; <4 x double> %a.
; Expected output (shared by the SSE2 and AVX2 runs): two shufflevectors.
; The first widens %b to four lanes keeping its lane 1 in place; the second
; selects mask index 5 (lane 1 of the widened vector) for result lane 2 and
; takes lanes 0, 1 and 3 from %a.
define <4 x double> @src_ins2_v4f64_ext1_v2f64(<4 x double> %a, <2 x double> %b) #0 {
; CHECK-LABEL: @src_ins2_v4f64_ext1_v2f64(
; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <2 x double> [[B:%.*]], <2 x double> poison, <4 x i32> <i32 poison, i32 1, i32 poison, i32 poison>
; CHECK-NEXT: [[INS:%.*]] = shufflevector <4 x double> [[A:%.*]], <4 x double> [[TMP1]], <4 x i32> <i32 0, i32 1, i32 5, i32 3>
; CHECK-NEXT: ret <4 x double> [[INS]]
;
  %ext = extractelement <2 x double> %b, i32 1
  %ins = insertelement <4 x double> %a, double %ext, i32 2
  ret <4 x double> %ins
}
; Insert lane 1 of the narrower <2 x double> %b into lane 3 of the
; <4 x double> %a.
; Expected output (shared by the SSE2 and AVX2 runs): two shufflevectors.
; The first widens %b to four lanes keeping its lane 1 in place; the second
; selects mask index 5 (lane 1 of the widened vector) for result lane 3 and
; takes lanes 0, 1 and 2 from %a.
define <4 x double> @src_ins3_v4f64_ext1_v2f64(<4 x double> %a, <2 x double> %b) #0 {
; CHECK-LABEL: @src_ins3_v4f64_ext1_v2f64(
; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <2 x double> [[B:%.*]], <2 x double> poison, <4 x i32> <i32 poison, i32 1, i32 poison, i32 poison>
; CHECK-NEXT: [[INS:%.*]] = shufflevector <4 x double> [[A:%.*]], <4 x double> [[TMP1]], <4 x i32> <i32 0, i32 1, i32 2, i32 5>
; CHECK-NEXT: ret <4 x double> [[INS]]
;
  %ext = extractelement <2 x double> %b, i32 1
  %ins = insertelement <4 x double> %a, double %ext, i32 3
  ret <4 x double> %ins
}
; Insert lane 0 of the wider <4 x double> %b into lane 0 of the
; <2 x double> %a.
; Expected output (shared by the SSE2 and AVX2 runs): two shufflevectors.
; The first narrows %b to two lanes with %b's lane 0 in lane 0; the second
; selects mask index 2 (lane 0 of the narrowed vector) for result lane 0 and
; keeps lane 1 of %a.
define <2 x double> @src_ins0_v2f64_ext0_v4f64(<2 x double> %a, <4 x double> %b) {
; CHECK-LABEL: @src_ins0_v2f64_ext0_v4f64(
; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <4 x double> [[B:%.*]], <4 x double> poison, <2 x i32> <i32 0, i32 poison>
; CHECK-NEXT: [[INS:%.*]] = shufflevector <2 x double> [[A:%.*]], <2 x double> [[TMP1]], <2 x i32> <i32 2, i32 1>
; CHECK-NEXT: ret <2 x double> [[INS]]
;
  %ext = extractelement <4 x double> %b, i32 0
  %ins = insertelement <2 x double> %a, double %ext, i32 0
  ret <2 x double> %ins
}
; Insert lane 1 of the wider <4 x double> %b into lane 0 of the
; <2 x double> %a.
; Expected output (shared by the SSE2 and AVX2 runs): two shufflevectors.
; The first narrows %b to two lanes keeping %b's lane 1 in lane 1; the second
; selects mask index 3 (lane 1 of the narrowed vector) for result lane 0 and
; keeps lane 1 of %a.
define <2 x double> @src_ins0_v2f64_ext1_v4f64(<2 x double> %a, <4 x double> %b) {
; CHECK-LABEL: @src_ins0_v2f64_ext1_v4f64(
; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <4 x double> [[B:%.*]], <4 x double> poison, <2 x i32> <i32 poison, i32 1>
; CHECK-NEXT: [[INS:%.*]] = shufflevector <2 x double> [[A:%.*]], <2 x double> [[TMP1]], <2 x i32> <i32 3, i32 1>
; CHECK-NEXT: ret <2 x double> [[INS]]
;
  %ext = extractelement <4 x double> %b, i32 1
  %ins = insertelement <2 x double> %a, double %ext, i32 0
  ret <2 x double> %ins
}
; Insert lane 2 of the wider <4 x double> %b into lane 0 of the
; <2 x double> %a. The two runs expect different output:
;  - SSE2 run: two shufflevectors. The first narrows %b to two lanes with
;    %b's lane 2 moved to lane 0; the second selects mask index 2 (lane 0 of
;    the narrowed vector) for result lane 0 and keeps lane 1 of %a.
;  - AVX2 run: the extractelement/insertelement pair is left as written.
define <2 x double> @src_ins0_v2f64_ext2_v4f64(<2 x double> %a, <4 x double> %b) {
; SSE-LABEL: @src_ins0_v2f64_ext2_v4f64(
; SSE-NEXT: [[TMP1:%.*]] = shufflevector <4 x double> [[B:%.*]], <4 x double> poison, <2 x i32> <i32 2, i32 poison>
; SSE-NEXT: [[INS:%.*]] = shufflevector <2 x double> [[A:%.*]], <2 x double> [[TMP1]], <2 x i32> <i32 2, i32 1>
; SSE-NEXT: ret <2 x double> [[INS]]
;
; AVX-LABEL: @src_ins0_v2f64_ext2_v4f64(
; AVX-NEXT: [[EXT:%.*]] = extractelement <4 x double> [[B:%.*]], i32 2
; AVX-NEXT: [[INS:%.*]] = insertelement <2 x double> [[A:%.*]], double [[EXT]], i32 0
; AVX-NEXT: ret <2 x double> [[INS]]
;
  %ext = extractelement <4 x double> %b, i32 2
  %ins = insertelement <2 x double> %a, double %ext, i32 0
  ret <2 x double> %ins
}
; Insert lane 3 of the wider <4 x double> %b into lane 0 of the
; <2 x double> %a.
; Expected output (shared by the SSE2 and AVX2 runs): two shufflevectors.
; The first narrows %b to two lanes with %b's lane 3 moved to lane 0; the
; second selects mask index 2 (lane 0 of the narrowed vector) for result
; lane 0 and keeps lane 1 of %a.
define <2 x double> @src_ins0_v2f64_ext3_v4f64(<2 x double> %a, <4 x double> %b) {
; CHECK-LABEL: @src_ins0_v2f64_ext3_v4f64(
; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <4 x double> [[B:%.*]], <4 x double> poison, <2 x i32> <i32 3, i32 poison>
; CHECK-NEXT: [[INS:%.*]] = shufflevector <2 x double> [[A:%.*]], <2 x double> [[TMP1]], <2 x i32> <i32 2, i32 1>
; CHECK-NEXT: ret <2 x double> [[INS]]
;
  %ext = extractelement <4 x double> %b, i32 3
  %ins = insertelement <2 x double> %a, double %ext, i32 0
  ret <2 x double> %ins
}
; Insert lane 0 of the wider <4 x double> %b into lane 1 of the
; <2 x double> %a.
; Expected output (shared by the SSE2 and AVX2 runs): two shufflevectors.
; The first narrows %b to two lanes with %b's lane 0 in lane 0; the second
; keeps lane 0 of %a and selects mask index 2 (lane 0 of the narrowed
; vector) for result lane 1.
define <2 x double> @src_ins1_v2f64_ext0_v4f64(<2 x double> %a, <4 x double> %b) {
; CHECK-LABEL: @src_ins1_v2f64_ext0_v4f64(
; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <4 x double> [[B:%.*]], <4 x double> poison, <2 x i32> <i32 0, i32 poison>
; CHECK-NEXT: [[INS:%.*]] = shufflevector <2 x double> [[A:%.*]], <2 x double> [[TMP1]], <2 x i32> <i32 0, i32 2>
; CHECK-NEXT: ret <2 x double> [[INS]]
;
  %ext = extractelement <4 x double> %b, i32 0
  %ins = insertelement <2 x double> %a, double %ext, i32 1
  ret <2 x double> %ins
}
; Insert lane 1 of the wider <4 x double> %b into lane 1 of the
; <2 x double> %a (same lane index on both sides).
; Expected output (shared by the SSE2 and AVX2 runs): two shufflevectors.
; The first narrows %b to two lanes keeping %b's lane 1 in lane 1; the second
; keeps lane 0 of %a and selects mask index 3 (lane 1 of the narrowed
; vector) for result lane 1.
define <2 x double> @src_ins1_v2f64_ext1_v4f64(<2 x double> %a, <4 x double> %b) {
; CHECK-LABEL: @src_ins1_v2f64_ext1_v4f64(
; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <4 x double> [[B:%.*]], <4 x double> poison, <2 x i32> <i32 poison, i32 1>
; CHECK-NEXT: [[INS:%.*]] = shufflevector <2 x double> [[A:%.*]], <2 x double> [[TMP1]], <2 x i32> <i32 0, i32 3>
; CHECK-NEXT: ret <2 x double> [[INS]]
;
  %ext = extractelement <4 x double> %b, i32 1
  %ins = insertelement <2 x double> %a, double %ext, i32 1
  ret <2 x double> %ins
}
; Insert lane 2 of the wider <4 x double> %b into lane 1 of the
; <2 x double> %a. The two runs expect different output:
;  - SSE2 run: two shufflevectors. The first narrows %b to two lanes with
;    %b's lane 2 moved to lane 0; the second keeps lane 0 of %a and selects
;    mask index 2 (lane 0 of the narrowed vector) for result lane 1.
;  - AVX2 run: the extractelement/insertelement pair is left as written.
define <2 x double> @src_ins1_v2f64_ext2_v4f64(<2 x double> %a, <4 x double> %b) {
; SSE-LABEL: @src_ins1_v2f64_ext2_v4f64(
; SSE-NEXT: [[TMP1:%.*]] = shufflevector <4 x double> [[B:%.*]], <4 x double> poison, <2 x i32> <i32 2, i32 poison>
; SSE-NEXT: [[INS:%.*]] = shufflevector <2 x double> [[A:%.*]], <2 x double> [[TMP1]], <2 x i32> <i32 0, i32 2>
; SSE-NEXT: ret <2 x double> [[INS]]
;
; AVX-LABEL: @src_ins1_v2f64_ext2_v4f64(
; AVX-NEXT: [[EXT:%.*]] = extractelement <4 x double> [[B:%.*]], i32 2
; AVX-NEXT: [[INS:%.*]] = insertelement <2 x double> [[A:%.*]], double [[EXT]], i32 1
; AVX-NEXT: ret <2 x double> [[INS]]
;
  %ext = extractelement <4 x double> %b, i32 2
  %ins = insertelement <2 x double> %a, double %ext, i32 1
  ret <2 x double> %ins
}
; Insert lane 3 of the wider <4 x double> %b into lane 1 of the
; <2 x double> %a.
; Expected output (shared by the SSE2 and AVX2 runs): two shufflevectors.
; The first narrows %b to two lanes with %b's lane 3 moved to lane 0; the
; second keeps lane 0 of %a and selects mask index 2 (lane 0 of the narrowed
; vector) for result lane 1.
define <2 x double> @src_ins1_v2f64_ext3_v4f64(<2 x double> %a, <4 x double> %b) {
; CHECK-LABEL: @src_ins1_v2f64_ext3_v4f64(
; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <4 x double> [[B:%.*]], <4 x double> poison, <2 x i32> <i32 3, i32 poison>
; CHECK-NEXT: [[INS:%.*]] = shufflevector <2 x double> [[A:%.*]], <2 x double> [[TMP1]], <2 x i32> <i32 0, i32 2>
; CHECK-NEXT: ret <2 x double> [[INS]]
;
  %ext = extractelement <4 x double> %b, i32 3
  %ins = insertelement <2 x double> %a, double %ext, i32 1
  ret <2 x double> %ins
}