Detect (non-intrinsic) IR patterns corresponding to the semantics of the various widening and high-word multiplication instructions. Specifically, this is done by: - Recognizing even/odd widening multiplication patterns in DAGCombine - Recognizing widening multiply-and-add on top during ISel - Implementing the standard MULHS/MUHLU IR opcodes - Detecting high-word multiply-and-add (which common code does not) Depending on architecture level, this can support all integer vector types as well as the scalar i128 type. Fixes: https://github.com/llvm/llvm-project/issues/129705
33 lines
1.1 KiB
LLVM
33 lines
1.1 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
|
|
; Test high-part vector multiplication on arch15
|
|
;
|
|
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=arch15 | FileCheck %s
|
|
|
|
; Test a v2i64 unsigned high-part multiplication.
|
|
define <2 x i64> @f1(<2 x i64> %val1, <2 x i64> %val2) {
|
|
; CHECK-LABEL: f1:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vmlhg %v24, %v24, %v26
|
|
; CHECK-NEXT: br %r14
|
|
%zext1 = zext <2 x i64> %val1 to <2 x i128>
|
|
%zext2 = zext <2 x i64> %val2 to <2 x i128>
|
|
%mulx = mul <2 x i128> %zext1, %zext2
|
|
%highx = lshr <2 x i128> %mulx, splat(i128 64)
|
|
%high = trunc <2 x i128> %highx to <2 x i64>
|
|
ret <2 x i64> %high
|
|
}
|
|
|
|
; Test a v2i64 signed high-part multiplication.
|
|
define <2 x i64> @f2(<2 x i64> %val1, <2 x i64> %val2) {
|
|
; CHECK-LABEL: f2:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vmhg %v24, %v24, %v26
|
|
; CHECK-NEXT: br %r14
|
|
%sext1 = sext <2 x i64> %val1 to <2 x i128>
|
|
%sext2 = sext <2 x i64> %val2 to <2 x i128>
|
|
%mulx = mul <2 x i128> %sext1, %sext2
|
|
%highx = lshr <2 x i128> %mulx, splat(i128 64)
|
|
%high = trunc <2 x i128> %highx to <2 x i64>
|
|
ret <2 x i64> %high
|
|
}
|