On processors supporting vector registers and SIMD instructions, enable i128 as legal type in VRs. This allows many operations to be implemented via native instructions directly in VRs (including add, subtract, logical operations and shifts). For a few other operations (e.g. multiply and divide, as well as atomic operations), we need to move the i128 value back to a GPR pair to use the corresponding instruction there. Overall, this is still beneficial. The patch includes the following LLVM changes: - Enable i128 as legal type - Set up legal operations (in SystemZInstrVector.td) - Custom expansion for i128 add/subtract with carry - Custom expansion for i128 comparisons and selects - Support for moving i128 to/from GPR pairs when required - Handle 128-bit integer constant values everywhere - Use i128 as intrinsic operand type where appropriate - Updated and new test cases In addition, clang builtins are updated to reflect the intrinsic operand type changes (which also improves compatibility with GCC).
186 lines
5.5 KiB
LLVM
186 lines
5.5 KiB
LLVM
; Test 128-bit compare and swap.
|
|
;
|
|
; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-Z10
|
|
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-Z13
|
|
|
|
; Check CDSG without a displacement.
|
|
define i128 @f1(i128 %cmp, i128 %swap, ptr %src) {
|
|
; CHECK-LABEL: f1:
|
|
; CHECK-DAG: lg %r1, 8(%r4)
|
|
; CHECK-DAG: lg %r0, 0(%r4)
|
|
; CHECK-DAG: lg %r13, 8(%r3)
|
|
; CHECK-DAG: lg %r12, 0(%r3)
|
|
; CHECK: cdsg %r12, %r0, 0(%r5)
|
|
; CHECK-DAG: stg %r13, 8(%r2)
|
|
; CHECK-DAG: stg %r12, 0(%r2)
|
|
; CHECK: br %r14
|
|
%pairval = cmpxchg ptr %src, i128 %cmp, i128 %swap seq_cst seq_cst
|
|
%val = extractvalue { i128, i1 } %pairval, 0
|
|
ret i128 %val
|
|
}
|
|
|
|
; Check the high end of the aligned CDSG range.
|
|
define i128 @f2(i128 %cmp, i128 %swap, ptr %src) {
|
|
; CHECK-LABEL: f2:
|
|
; CHECK: cdsg {{%r[0-9]+}}, {{%r[0-9]+}}, 524272(%r5)
|
|
; CHECK: br %r14
|
|
%ptr = getelementptr i128, ptr %src, i128 32767
|
|
%pairval = cmpxchg ptr %ptr, i128 %cmp, i128 %swap seq_cst seq_cst
|
|
%val = extractvalue { i128, i1 } %pairval, 0
|
|
ret i128 %val
|
|
}
|
|
|
|
; Check the next doubleword up, which needs separate address logic.
|
|
; Other sequences besides this one would be OK.
|
|
define i128 @f3(i128 %cmp, i128 %swap, ptr %src) {
|
|
; CHECK-LABEL: f3:
|
|
; CHECK: agfi %r5, 524288
|
|
; CHECK: cdsg {{%r[0-9]+}}, {{%r[0-9]+}}, 0(%r5)
|
|
; CHECK: br %r14
|
|
%ptr = getelementptr i128, ptr %src, i128 32768
|
|
%pairval = cmpxchg ptr %ptr, i128 %cmp, i128 %swap seq_cst seq_cst
|
|
%val = extractvalue { i128, i1 } %pairval, 0
|
|
ret i128 %val
|
|
}
|
|
|
|
; Check the high end of the negative aligned CDSG range.
|
|
define i128 @f4(i128 %cmp, i128 %swap, ptr %src) {
|
|
; CHECK-LABEL: f4:
|
|
; CHECK: cdsg {{%r[0-9]+}}, {{%r[0-9]+}}, -16(%r5)
|
|
; CHECK: br %r14
|
|
%ptr = getelementptr i128, ptr %src, i128 -1
|
|
%pairval = cmpxchg ptr %ptr, i128 %cmp, i128 %swap seq_cst seq_cst
|
|
%val = extractvalue { i128, i1 } %pairval, 0
|
|
ret i128 %val
|
|
}
|
|
|
|
; Check the low end of the CDSG range.
|
|
define i128 @f5(i128 %cmp, i128 %swap, ptr %src) {
|
|
; CHECK-LABEL: f5:
|
|
; CHECK: cdsg {{%r[0-9]+}}, {{%r[0-9]+}}, -524288(%r5)
|
|
; CHECK: br %r14
|
|
%ptr = getelementptr i128, ptr %src, i128 -32768
|
|
%pairval = cmpxchg ptr %ptr, i128 %cmp, i128 %swap seq_cst seq_cst
|
|
%val = extractvalue { i128, i1 } %pairval, 0
|
|
ret i128 %val
|
|
}
|
|
|
|
; Check the next doubleword down, which needs separate address logic.
|
|
; Other sequences besides this one would be OK.
|
|
define i128 @f6(i128 %cmp, i128 %swap, ptr %src) {
|
|
; CHECK-LABEL: f6:
|
|
; CHECK: agfi %r5, -524304
|
|
; CHECK: cdsg {{%r[0-9]+}}, {{%r[0-9]+}}, 0(%r5)
|
|
; CHECK: br %r14
|
|
%ptr = getelementptr i128, ptr %src, i128 -32769
|
|
%pairval = cmpxchg ptr %ptr, i128 %cmp, i128 %swap seq_cst seq_cst
|
|
%val = extractvalue { i128, i1 } %pairval, 0
|
|
ret i128 %val
|
|
}
|
|
|
|
; Check that CDSG does not allow an index.
|
|
define i128 @f7(i128 %cmp, i128 %swap, i64 %src, i64 %index) {
|
|
; CHECK-LABEL: f7:
|
|
; CHECK: agr %r5, %r6
|
|
; CHECK: cdsg {{%r[0-9]+}}, {{%r[0-9]+}}, 0(%r5)
|
|
; CHECK: br %r14
|
|
%add1 = add i64 %src, %index
|
|
%ptr = inttoptr i64 %add1 to ptr
|
|
%pairval = cmpxchg ptr %ptr, i128 %cmp, i128 %swap seq_cst seq_cst
|
|
%val = extractvalue { i128, i1 } %pairval, 0
|
|
ret i128 %val
|
|
}
|
|
|
|
; Check that a constant %cmp value is loaded into a register first.
|
|
define i128 @f8(i128 %swap, ptr %ptr) {
|
|
; CHECK-LABEL: f8:
|
|
; CHECK: lghi {{%r[0-9]+}}, 1001
|
|
; CHECK: cdsg {{%r[0-9]+}}, {{%r[0-9]+}}, 0(%r4)
|
|
; CHECK: br %r14
|
|
%pairval = cmpxchg ptr %ptr, i128 1001, i128 %swap seq_cst seq_cst
|
|
%val = extractvalue { i128, i1 } %pairval, 0
|
|
ret i128 %val
|
|
}
|
|
|
|
; Check that a constant %swap value is loaded into a register first.
|
|
define i128 @f9(i128 %cmp, ptr %ptr) {
|
|
; CHECK-LABEL: f9:
|
|
; CHECK: lghi {{%r[0-9]+}}, 1002
|
|
; CHECK: cdsg {{%r[0-9]+}}, {{%r[0-9]+}}, 0(%r4)
|
|
; CHECK: br %r14
|
|
%pairval = cmpxchg ptr %ptr, i128 %cmp, i128 1002 seq_cst seq_cst
|
|
%val = extractvalue { i128, i1 } %pairval, 0
|
|
ret i128 %val
|
|
}
|
|
|
|
; Check generating the comparison result.
|
|
; CHECK-LABEL: f10
|
|
; CHECK-DAG: lg %r1, 8(%r3)
|
|
; CHECK-DAG: lg %r0, 0(%r3)
|
|
; CHECK-DAG: lg %r13, 8(%r2)
|
|
; CHECK-DAG: lg %r12, 0(%r2)
|
|
; CHECK-Z13: lhi %r2, 0
|
|
; CHECK: cdsg %r12, %r0, 0(%r4)
|
|
; CHECK-Z10-NEXT: ipm %r2
|
|
; CHECK-Z10-NEXT: afi %r2, -268435456
|
|
; CHECK-Z10-NEXT: srl %r2, 31
|
|
; CHECK-Z13-NEXT: lochie %r2, 1
|
|
; CHECK: br %r14
|
|
define i32 @f10(i128 %cmp, i128 %swap, ptr %src) {
|
|
%pairval = cmpxchg ptr %src, i128 %cmp, i128 %swap seq_cst seq_cst
|
|
%val = extractvalue { i128, i1 } %pairval, 1
|
|
%res = zext i1 %val to i32
|
|
ret i32 %res
|
|
}
|
|
|
|
declare void @g()
|
|
|
|
; Check using the comparison result for a branch.
|
|
; CHECK-LABEL: f11
|
|
; CHECK-DAG: lg %r1, 8(%r3)
|
|
; CHECK-DAG: lg %r0, 0(%r3)
|
|
; CHECK-DAG: lg %r13, 8(%r2)
|
|
; CHECK-DAG: lg %r12, 0(%r2)
|
|
; CHECK: cdsg %r12, %r0, 0(%r4)
|
|
; CHECK-NEXT: jl [[LABEL:\.[^ ]*]]
|
|
; CHECK: jg g
|
|
; CHECK: [[LABEL]]:
|
|
; CHECK: br %r14
|
|
define void @f11(i128 %cmp, i128 %swap, ptr %src) {
|
|
%pairval = cmpxchg ptr %src, i128 %cmp, i128 %swap seq_cst seq_cst
|
|
%cond = extractvalue { i128, i1 } %pairval, 1
|
|
br i1 %cond, label %call, label %exit
|
|
|
|
call:
|
|
tail call void @g()
|
|
br label %exit
|
|
|
|
exit:
|
|
ret void
|
|
}
|
|
|
|
; ... and the same with the inverted direction.
|
|
; CHECK-LABEL: f12
|
|
; CHECK-DAG: lg %r1, 8(%r3)
|
|
; CHECK-DAG: lg %r0, 0(%r3)
|
|
; CHECK-DAG: lg %r13, 8(%r2)
|
|
; CHECK-DAG: lg %r12, 0(%r2)
|
|
; CHECK: cdsg %r12, %r0, 0(%r4)
|
|
; CHECK-NEXT: jl [[LABEL:\.[^ ]*]]
|
|
; CHECK: br %r14
|
|
; CHECK: [[LABEL]]:
|
|
; CHECK: jg g
|
|
define void @f12(i128 %cmp, i128 %swap, ptr %src) {
|
|
%pairval = cmpxchg ptr %src, i128 %cmp, i128 %swap seq_cst seq_cst
|
|
%cond = extractvalue { i128, i1 } %pairval, 1
|
|
br i1 %cond, label %exit, label %call
|
|
|
|
call:
|
|
tail call void @g()
|
|
br label %exit
|
|
|
|
exit:
|
|
ret void
|
|
}
|
|
|