Improve the codegen for uaddo node for i64 in 64-bit mode and i32 in 32-bit mode by custom lowering.
63 lines
2.1 KiB
LLVM
63 lines
2.1 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
|
|
; RUN: llc < %s -mtriple=powerpc64-unknown-linux-gnu | FileCheck %s
|
|
; RUN: llc < %s -mtriple=powerpc64-ibm-aix-xcoff | FileCheck %s
|
|
|
|
define noundef i64 @add(i64 noundef %a, i64 noundef %b, ptr nocapture noundef writeonly %ovf) {
|
|
; CHECK-LABEL: add:
|
|
; CHECK: # %bb.0: # %entry
|
|
; CHECK-NEXT: li 6, 0
|
|
; CHECK-NEXT: addc 3, 3, 4
|
|
; CHECK-NEXT: addze 4, 6
|
|
; CHECK-NEXT: std 4, 0(5)
|
|
; CHECK-NEXT: blr
|
|
entry:
|
|
%0 = tail call { i64, i1 } @llvm.uadd.with.overflow.i64(i64 %a, i64 %b)
|
|
%1 = extractvalue { i64, i1 } %0, 1
|
|
%2 = extractvalue { i64, i1 } %0, 0
|
|
%3 = zext i1 %1 to i64
|
|
store i64 %3, ptr %ovf, align 8
|
|
ret i64 %2
|
|
}
|
|
|
|
declare { i64, i1 } @llvm.uadd.with.overflow.i64(i64, i64)
|
|
|
|
define noundef zeroext i1 @add_overflow(i64 noundef %a, i64 noundef %b, ptr nocapture noundef writeonly %ovf) {
|
|
; CHECK-LABEL: add_overflow:
|
|
; CHECK: # %bb.0: # %entry
|
|
; CHECK-NEXT: li 6, 0
|
|
; CHECK-NEXT: addc 4, 3, 4
|
|
; CHECK-NEXT: addze 3, 6
|
|
; CHECK-NEXT: std 4, 0(5)
|
|
; CHECK-NEXT: blr
|
|
entry:
|
|
%0 = tail call { i64, i1 } @llvm.uadd.with.overflow.i64(i64 %a, i64 %b)
|
|
%1 = extractvalue { i64, i1 } %0, 1
|
|
%2 = extractvalue { i64, i1 } %0, 0
|
|
store i64 %2, ptr %ovf, align 8
|
|
ret i1 %1
|
|
}
|
|
|
|
define noundef i64 @addWithCarryIn (i64 noundef %a, i64 noundef %b, i64 noundef %c, ptr nocapture noundef writeonly %ovf) {
|
|
; CHECK-LABEL: addWithCarryIn:
|
|
; CHECK: # %bb.0: # %entry
|
|
; CHECK-NEXT: li 7, 0
|
|
; CHECK-NEXT: addc 3, 3, 4
|
|
; CHECK-NEXT: addze 4, 7
|
|
; CHECK-NEXT: addc 3, 3, 5
|
|
; CHECK-NEXT: addze 5, 7
|
|
; CHECK-NEXT: or 4, 4, 5
|
|
; CHECK-NEXT: std 4, 0(6)
|
|
; CHECK-NEXT: blr
|
|
entry:
|
|
%0 = tail call { i64, i1 } @llvm.uadd.with.overflow.i64(i64 %a, i64 %b)
|
|
%1 = extractvalue { i64, i1 } %0, 1
|
|
%2 = extractvalue { i64, i1 } %0, 0
|
|
%3 = tail call { i64, i1 } @llvm.uadd.with.overflow.i64(i64 %2, i64 %c)
|
|
%4 = extractvalue { i64, i1 } %3, 1
|
|
%5 = extractvalue { i64, i1 } %3, 0
|
|
%6 = or i1 %1, %4
|
|
%7 = zext i1 %6 to i64
|
|
store i64 %7, ptr %ovf, align 8
|
|
ret i64 %5
|
|
}
|