On processors supporting vector registers and SIMD instructions, enable i128 as legal type in VRs. This allows many operations to be implemented via native instructions directly in VRs (including add, subtract, logical operations and shifts). For a few other operations (e.g. multiply and divide, as well as atomic operations), we need to move the i128 value back to a GPR pair to use the corresponding instruction there. Overall, this is still beneficial. The patch includes the following LLVM changes: - Enable i128 as legal type - Set up legal operations (in SystemZInstrVector.td) - Custom expansion for i128 add/subtract with carry - Custom expansion for i128 comparisons and selects - Support for moving i128 to/from GPR pairs when required - Handle 128-bit integer constant values everywhere - Use i128 as intrinsic operand type where appropriate - Updated and new test cases In addition, clang builtins are updated to reflect the intrinsic operand type changes (which also improves compatibility with GCC).
409 lines
14 KiB
LLVM
409 lines
14 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2
|
|
; Test i128 atomicrmw operations.
|
|
;
|
|
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z15 | FileCheck %s
|
|
;
|
|
; Test expansion of AtomicRMW instructions, which assume a natural alignment.
|
|
; Note that the multiple regmoves inside the CDSG loops hopefully will go away
|
|
; when the new i128 support is added.
|
|
|
|
; Check register exchange.
|
|
define i128 @atomicrmw_xchg(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_xchg:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vl %v1, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v0, 0(%r3), 4
|
|
; CHECK-NEXT: vlgvg %r1, %v1, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v1, 0
|
|
; CHECK-NEXT: .LBB0_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: vlgvg %r5, %v0, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v0, 0
|
|
; CHECK-NEXT: cdsg %r4, %r0, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v0, %r4, %r5
|
|
; CHECK-NEXT: jl .LBB0_1
|
|
; CHECK-NEXT: # %bb.2: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v0, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw xchg ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|
|
|
|
; Check addition of a variable.
|
|
define i128 @atomicrmw_add(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_add:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vl %v0, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v1, 0(%r3), 4
|
|
; CHECK-NEXT: .LBB1_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: vaq %v2, %v1, %v0
|
|
; CHECK-NEXT: vlgvg %r1, %v2, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v2, 0
|
|
; CHECK-NEXT: vlgvg %r5, %v1, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v1, 0
|
|
; CHECK-NEXT: cdsg %r4, %r0, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v1, %r4, %r5
|
|
; CHECK-NEXT: jl .LBB1_1
|
|
; CHECK-NEXT: # %bb.2: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v1, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw add ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|
|
|
|
; Check subtraction of a variable.
|
|
define i128 @atomicrmw_sub(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_sub:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vl %v0, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v1, 0(%r3), 4
|
|
; CHECK-NEXT: .LBB2_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: vsq %v2, %v1, %v0
|
|
; CHECK-NEXT: vlgvg %r1, %v2, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v2, 0
|
|
; CHECK-NEXT: vlgvg %r5, %v1, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v1, 0
|
|
; CHECK-NEXT: cdsg %r4, %r0, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v1, %r4, %r5
|
|
; CHECK-NEXT: jl .LBB2_1
|
|
; CHECK-NEXT: # %bb.2: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v1, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw sub ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|
|
|
|
; Check AND of a variable.
|
|
define i128 @atomicrmw_and(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_and:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vl %v0, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v1, 0(%r3), 4
|
|
; CHECK-NEXT: .LBB3_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: vn %v2, %v1, %v0
|
|
; CHECK-NEXT: vlgvg %r1, %v2, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v2, 0
|
|
; CHECK-NEXT: vlgvg %r5, %v1, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v1, 0
|
|
; CHECK-NEXT: cdsg %r4, %r0, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v1, %r4, %r5
|
|
; CHECK-NEXT: jl .LBB3_1
|
|
; CHECK-NEXT: # %bb.2: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v1, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw and ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|
|
|
|
; Check NAND of a variable.
|
|
define i128 @atomicrmw_nand(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_nand:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vl %v0, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v1, 0(%r3), 4
|
|
; CHECK-NEXT: .LBB4_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: vlgvg %r1, %v1, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v1, 0
|
|
; CHECK-NEXT: vnn %v1, %v1, %v0
|
|
; CHECK-NEXT: vlgvg %r5, %v1, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v1, 0
|
|
; CHECK-NEXT: cdsg %r0, %r4, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v1, %r0, %r1
|
|
; CHECK-NEXT: jl .LBB4_1
|
|
; CHECK-NEXT: # %bb.2: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v1, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw nand ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|
|
|
|
; Check OR of a variable.
|
|
define i128 @atomicrmw_or(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_or:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vl %v0, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v1, 0(%r3), 4
|
|
; CHECK-NEXT: .LBB5_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: vo %v2, %v1, %v0
|
|
; CHECK-NEXT: vlgvg %r1, %v2, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v2, 0
|
|
; CHECK-NEXT: vlgvg %r5, %v1, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v1, 0
|
|
; CHECK-NEXT: cdsg %r4, %r0, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v1, %r4, %r5
|
|
; CHECK-NEXT: jl .LBB5_1
|
|
; CHECK-NEXT: # %bb.2: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v1, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw or ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|
|
|
|
; Check XOR of a variable.
|
|
define i128 @atomicrmw_xor(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_xor:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vl %v0, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v1, 0(%r3), 4
|
|
; CHECK-NEXT: .LBB6_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: vx %v2, %v1, %v0
|
|
; CHECK-NEXT: vlgvg %r1, %v2, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v2, 0
|
|
; CHECK-NEXT: vlgvg %r5, %v1, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v1, 0
|
|
; CHECK-NEXT: cdsg %r4, %r0, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v1, %r4, %r5
|
|
; CHECK-NEXT: jl .LBB6_1
|
|
; CHECK-NEXT: # %bb.2: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v1, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw xor ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|
|
|
|
; Check signed minimum.
|
|
define i128 @atomicrmw_min(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_min:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vl %v0, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v1, 0(%r3), 4
|
|
; CHECK-NEXT: j .LBB7_2
|
|
; CHECK-NEXT: .LBB7_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB7_2 Depth=1
|
|
; CHECK-NEXT: vlgvg %r1, %v1, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v1, 0
|
|
; CHECK-NEXT: vlgvg %r5, %v2, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v2, 0
|
|
; CHECK-NEXT: cdsg %r0, %r4, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v1, %r0, %r1
|
|
; CHECK-NEXT: je .LBB7_6
|
|
; CHECK-NEXT: .LBB7_2: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: vecg %v0, %v1
|
|
; CHECK-NEXT: jlh .LBB7_4
|
|
; CHECK-NEXT: # %bb.3: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB7_2 Depth=1
|
|
; CHECK-NEXT: vchlgs %v2, %v1, %v0
|
|
; CHECK-NEXT: .LBB7_4: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB7_2 Depth=1
|
|
; CHECK-NEXT: vlr %v2, %v1
|
|
; CHECK-NEXT: jnl .LBB7_1
|
|
; CHECK-NEXT: # %bb.5: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB7_2 Depth=1
|
|
; CHECK-NEXT: vlr %v2, %v0
|
|
; CHECK-NEXT: j .LBB7_1
|
|
; CHECK-NEXT: .LBB7_6: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v1, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw min ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|
|
|
|
; Check signed maximum.
|
|
define i128 @atomicrmw_max(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_max:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vl %v0, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v1, 0(%r3), 4
|
|
; CHECK-NEXT: j .LBB8_2
|
|
; CHECK-NEXT: .LBB8_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB8_2 Depth=1
|
|
; CHECK-NEXT: vlgvg %r1, %v1, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v1, 0
|
|
; CHECK-NEXT: vlgvg %r5, %v2, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v2, 0
|
|
; CHECK-NEXT: cdsg %r0, %r4, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v1, %r0, %r1
|
|
; CHECK-NEXT: je .LBB8_6
|
|
; CHECK-NEXT: .LBB8_2: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: vecg %v0, %v1
|
|
; CHECK-NEXT: jlh .LBB8_4
|
|
; CHECK-NEXT: # %bb.3: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB8_2 Depth=1
|
|
; CHECK-NEXT: vchlgs %v2, %v1, %v0
|
|
; CHECK-NEXT: .LBB8_4: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB8_2 Depth=1
|
|
; CHECK-NEXT: vlr %v2, %v1
|
|
; CHECK-NEXT: jl .LBB8_1
|
|
; CHECK-NEXT: # %bb.5: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB8_2 Depth=1
|
|
; CHECK-NEXT: vlr %v2, %v0
|
|
; CHECK-NEXT: j .LBB8_1
|
|
; CHECK-NEXT: .LBB8_6: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v1, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw max ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|
|
|
|
; Check unsigned minimum.
|
|
define i128 @atomicrmw_umin(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_umin:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vl %v0, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v1, 0(%r3), 4
|
|
; CHECK-NEXT: j .LBB9_2
|
|
; CHECK-NEXT: .LBB9_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB9_2 Depth=1
|
|
; CHECK-NEXT: vlgvg %r1, %v1, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v1, 0
|
|
; CHECK-NEXT: vlgvg %r5, %v2, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v2, 0
|
|
; CHECK-NEXT: cdsg %r0, %r4, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v1, %r0, %r1
|
|
; CHECK-NEXT: je .LBB9_6
|
|
; CHECK-NEXT: .LBB9_2: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: veclg %v0, %v1
|
|
; CHECK-NEXT: jlh .LBB9_4
|
|
; CHECK-NEXT: # %bb.3: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB9_2 Depth=1
|
|
; CHECK-NEXT: vchlgs %v2, %v1, %v0
|
|
; CHECK-NEXT: .LBB9_4: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB9_2 Depth=1
|
|
; CHECK-NEXT: vlr %v2, %v1
|
|
; CHECK-NEXT: jnl .LBB9_1
|
|
; CHECK-NEXT: # %bb.5: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB9_2 Depth=1
|
|
; CHECK-NEXT: vlr %v2, %v0
|
|
; CHECK-NEXT: j .LBB9_1
|
|
; CHECK-NEXT: .LBB9_6: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v1, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw umin ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|
|
|
|
; Check unsigned maximum.
|
|
define i128 @atomicrmw_umax(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_umax:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vl %v0, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v1, 0(%r3), 4
|
|
; CHECK-NEXT: j .LBB10_2
|
|
; CHECK-NEXT: .LBB10_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB10_2 Depth=1
|
|
; CHECK-NEXT: vlgvg %r1, %v1, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v1, 0
|
|
; CHECK-NEXT: vlgvg %r5, %v2, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v2, 0
|
|
; CHECK-NEXT: cdsg %r0, %r4, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v1, %r0, %r1
|
|
; CHECK-NEXT: je .LBB10_6
|
|
; CHECK-NEXT: .LBB10_2: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: veclg %v0, %v1
|
|
; CHECK-NEXT: jlh .LBB10_4
|
|
; CHECK-NEXT: # %bb.3: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB10_2 Depth=1
|
|
; CHECK-NEXT: vchlgs %v2, %v1, %v0
|
|
; CHECK-NEXT: .LBB10_4: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB10_2 Depth=1
|
|
; CHECK-NEXT: vlr %v2, %v1
|
|
; CHECK-NEXT: jl .LBB10_1
|
|
; CHECK-NEXT: # %bb.5: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB10_2 Depth=1
|
|
; CHECK-NEXT: vlr %v2, %v0
|
|
; CHECK-NEXT: j .LBB10_1
|
|
; CHECK-NEXT: .LBB10_6: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v1, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw umax ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|
|
|
|
; Check increment with wraparound.
|
|
define i128 @atomicrmw_uinc_wrap(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_uinc_wrap:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: larl %r1, .LCPI11_0
|
|
; CHECK-NEXT: vl %v0, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v2, 0(%r3), 4
|
|
; CHECK-NEXT: vl %v1, 0(%r1), 3
|
|
; CHECK-NEXT: j .LBB11_2
|
|
; CHECK-NEXT: .LBB11_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB11_2 Depth=1
|
|
; CHECK-NEXT: vlgvg %r1, %v2, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v2, 0
|
|
; CHECK-NEXT: vlgvg %r5, %v3, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v3, 0
|
|
; CHECK-NEXT: cdsg %r0, %r4, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v2, %r0, %r1
|
|
; CHECK-NEXT: je .LBB11_6
|
|
; CHECK-NEXT: .LBB11_2: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: veclg %v2, %v0
|
|
; CHECK-NEXT: jlh .LBB11_4
|
|
; CHECK-NEXT: # %bb.3: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB11_2 Depth=1
|
|
; CHECK-NEXT: vchlgs %v3, %v0, %v2
|
|
; CHECK-NEXT: .LBB11_4: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB11_2 Depth=1
|
|
; CHECK-NEXT: vgbm %v3, 0
|
|
; CHECK-NEXT: jnl .LBB11_1
|
|
; CHECK-NEXT: # %bb.5: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB11_2 Depth=1
|
|
; CHECK-NEXT: vaq %v3, %v2, %v1
|
|
; CHECK-NEXT: j .LBB11_1
|
|
; CHECK-NEXT: .LBB11_6: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v2, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw uinc_wrap ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|
|
|
|
; Check decrement with wraparound.
|
|
define i128 @atomicrmw_udec_wrap(ptr %src, i128 %b) {
|
|
; CHECK-LABEL: atomicrmw_udec_wrap:
|
|
; CHECK: # %bb.0:
|
|
; CHECK-NEXT: vl %v0, 0(%r4), 3
|
|
; CHECK-NEXT: vl %v3, 0(%r3), 4
|
|
; CHECK-NEXT: vgbm %v1, 65535
|
|
; CHECK-NEXT: vgbm %v2, 0
|
|
; CHECK-NEXT: j .LBB12_2
|
|
; CHECK-NEXT: .LBB12_1: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB12_2 Depth=1
|
|
; CHECK-NEXT: vlgvg %r1, %v3, 1
|
|
; CHECK-NEXT: vlgvg %r0, %v3, 0
|
|
; CHECK-NEXT: vlgvg %r5, %v4, 1
|
|
; CHECK-NEXT: vlgvg %r4, %v4, 0
|
|
; CHECK-NEXT: cdsg %r0, %r4, 0(%r3)
|
|
; CHECK-NEXT: vlvgp %v3, %r0, %r1
|
|
; CHECK-NEXT: je .LBB12_8
|
|
; CHECK-NEXT: .LBB12_2: # %atomicrmw.start
|
|
; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
|
|
; CHECK-NEXT: veclg %v0, %v3
|
|
; CHECK-NEXT: jlh .LBB12_4
|
|
; CHECK-NEXT: # %bb.3: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB12_2 Depth=1
|
|
; CHECK-NEXT: vchlgs %v4, %v3, %v0
|
|
; CHECK-NEXT: .LBB12_4: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB12_2 Depth=1
|
|
; CHECK-NEXT: vlr %v5, %v0
|
|
; CHECK-NEXT: jl .LBB12_6
|
|
; CHECK-NEXT: # %bb.5: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB12_2 Depth=1
|
|
; CHECK-NEXT: vaq %v5, %v3, %v1
|
|
; CHECK-NEXT: .LBB12_6: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB12_2 Depth=1
|
|
; CHECK-NEXT: vceqgs %v4, %v3, %v2
|
|
; CHECK-NEXT: vlr %v4, %v0
|
|
; CHECK-NEXT: je .LBB12_1
|
|
; CHECK-NEXT: # %bb.7: # %atomicrmw.start
|
|
; CHECK-NEXT: # in Loop: Header=BB12_2 Depth=1
|
|
; CHECK-NEXT: vlr %v4, %v5
|
|
; CHECK-NEXT: j .LBB12_1
|
|
; CHECK-NEXT: .LBB12_8: # %atomicrmw.end
|
|
; CHECK-NEXT: vst %v3, 0(%r2), 3
|
|
; CHECK-NEXT: br %r14
|
|
%res = atomicrmw udec_wrap ptr %src, i128 %b seq_cst
|
|
ret i128 %res
|
|
}
|