Enables interaleaved stores, results in better estimation for segmented stores for RISC-V Reviewers: preames, topperc, RKSimon Reviewed By: RKSimon Pull Request: https://github.com/llvm/llvm-project/pull/115354
45 lines
2.0 KiB
LLVM
45 lines
2.0 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
|
|
; RUN: opt -S --passes=slp-vectorizer -mtriple=riscv64-unknown-linux -mattr=+v -pass-remarks-output=%t -mcpu=sifive-p670 < %s | FileCheck %s
|
|
; RUN: FileCheck %s --check-prefix YAML --input-file=%t
|
|
|
|
; YAML-LABEL: --- !Passed
|
|
; YAML-NEXT: Pass: slp-vectorizer
|
|
; YAML-NEXT: Name: StoresVectorized
|
|
; YAML-NEXT: Function: test
|
|
; YAML-NEXT: Args:
|
|
; YAML-NEXT: - String: 'Stores SLP vectorized with cost '
|
|
; YAML-NEXT: - Cost: '-2'
|
|
; YAML-NEXT: - String: ' and with tree size '
|
|
; YAML-NEXT: - TreeSize: '2'
|
|
define void @test(ptr %h) {
|
|
; CHECK-LABEL: define void @test(
|
|
; CHECK-SAME: ptr [[H:%.*]]) #[[ATTR0:[0-9]+]] {
|
|
; CHECK-NEXT: [[ENTRY:.*:]]
|
|
; CHECK-NEXT: [[DCT2X211:%.*]] = alloca [0 x [0 x [8 x i64]]], i32 0, align 16
|
|
; CHECK-NEXT: [[CHROMA_DC209:%.*]] = getelementptr i8, ptr [[H]], i64 0
|
|
; CHECK-NEXT: [[TMP0:%.*]] = load <4 x i64>, ptr [[DCT2X211]], align 16
|
|
; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <4 x i64> [[TMP0]], <4 x i64> poison, <4 x i32> <i32 0, i32 2, i32 1, i32 3>
|
|
; CHECK-NEXT: store <4 x i64> [[TMP1]], ptr [[CHROMA_DC209]], align 2
|
|
; CHECK-NEXT: ret void
|
|
;
|
|
entry:
|
|
%dct2x211 = alloca [0 x [0 x [8 x i64]]], i32 0, align 16
|
|
%chroma_dc209 = getelementptr i8, ptr %h, i64 0
|
|
%arrayidx30.i = getelementptr i8, ptr %dct2x211, i64 16
|
|
%arrayidx33.i = getelementptr i8, ptr %dct2x211, i64 8
|
|
%arrayidx36.i181 = getelementptr i8, ptr %dct2x211, i64 24
|
|
%0 = load i64, ptr %dct2x211, align 16
|
|
store i64 %0, ptr %chroma_dc209, align 2
|
|
%1 = load i64, ptr %arrayidx30.i, align 4
|
|
%arrayidx3.i224 = getelementptr i8, ptr %h, i64 8
|
|
store i64 %1, ptr %arrayidx3.i224, align 2
|
|
%2 = load i64, ptr %arrayidx33.i, align 2
|
|
%arrayidx5.i226 = getelementptr i8, ptr %h, i64 16
|
|
store i64 %2, ptr %arrayidx5.i226, align 2
|
|
%3 = load i64, ptr %arrayidx36.i181, align 2
|
|
%arrayidx7.i228 = getelementptr i8, ptr %h, i64 24
|
|
store i64 %3, ptr %arrayidx7.i228, align 2
|
|
ret void
|
|
}
|
|
|