Files
clang-p2996/llvm/test/CodeGen/SystemZ/vec-mul-10.ll
Ulrich Weigand 80267f8148 Support z17 processor name and scheduler description (#135254)
The recently announced IBM z17 processor implements the architecture
already supported as "arch15" in LLVM. This patch adds support for "z17"
as an alternate architecture name for arch15.

This patch also add the scheduler description for the z17 processor,
provided by Jonas Paulsson.
2025-04-11 00:20:58 +02:00

73 lines
2.4 KiB
LLVM

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
; Test widening vector multiply-and-add on z17.
;
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z17 | FileCheck %s
; Test a v2i64 (even) -> i128 unsigned widening multiply-and-add.
define i128 @f1(<2 x i64> %val1, <2 x i64> %val2, i128 %val3) {
; CHECK-LABEL: f1:
; CHECK: # %bb.0:
; CHECK-NEXT: vl %v0, 0(%r3), 3
; CHECK-NEXT: vmaleg %v0, %v24, %v26, %v0
; CHECK-NEXT: vst %v0, 0(%r2), 3
; CHECK-NEXT: br %r14
%elt1 = extractelement <2 x i64> %val1, i32 0
%zext1 = zext i64 %elt1 to i128
%elt2 = extractelement <2 x i64> %val2, i32 0
%zext2 = zext i64 %elt2 to i128
%mul = mul i128 %zext1, %zext2
%ret = add i128 %mul, %val3
ret i128 %ret
}
; Test a v2i64 (odd) -> i128 unsigned widening multiply-and-add.
define i128 @f2(<2 x i64> %val1, <2 x i64> %val2, i128 %val3) {
; CHECK-LABEL: f2:
; CHECK: # %bb.0:
; CHECK-NEXT: vl %v0, 0(%r3), 3
; CHECK-NEXT: vmalog %v0, %v24, %v26, %v0
; CHECK-NEXT: vst %v0, 0(%r2), 3
; CHECK-NEXT: br %r14
%elt1 = extractelement <2 x i64> %val1, i32 1
%zext1 = zext i64 %elt1 to i128
%elt2 = extractelement <2 x i64> %val2, i32 1
%zext2 = zext i64 %elt2 to i128
%mul = mul i128 %zext1, %zext2
%ret = add i128 %mul, %val3
ret i128 %ret
}
; Test a v2i64 (even) -> i128 signed widening multiply-and-add.
define i128 @f3(<2 x i64> %val1, <2 x i64> %val2, i128 %val3) {
; CHECK-LABEL: f3:
; CHECK: # %bb.0:
; CHECK-NEXT: vl %v0, 0(%r3), 3
; CHECK-NEXT: vmaeg %v0, %v24, %v26, %v0
; CHECK-NEXT: vst %v0, 0(%r2), 3
; CHECK-NEXT: br %r14
%elt1 = extractelement <2 x i64> %val1, i32 0
%sext1 = sext i64 %elt1 to i128
%elt2 = extractelement <2 x i64> %val2, i32 0
%sext2 = sext i64 %elt2 to i128
%mul = mul i128 %sext1, %sext2
%ret = add i128 %mul, %val3
ret i128 %ret
}
; Test a v2i64 (odd) -> i128 signed widening multiply-and-add.
define i128 @f4(<2 x i64> %val1, <2 x i64> %val2, i128 %val3) {
; CHECK-LABEL: f4:
; CHECK: # %bb.0:
; CHECK-NEXT: vl %v0, 0(%r3), 3
; CHECK-NEXT: vmaog %v0, %v24, %v26, %v0
; CHECK-NEXT: vst %v0, 0(%r2), 3
; CHECK-NEXT: br %r14
%elt1 = extractelement <2 x i64> %val1, i32 1
%sext1 = sext i64 %elt1 to i128
%elt2 = extractelement <2 x i64> %val2, i32 1
%sext2 = sext i64 %elt2 to i128
%mul = mul i128 %sext1, %sext2
%ret = add i128 %mul, %val3
ret i128 %ret
}