Recommit "[SCCP] Use range info to prove AddInst has NUW flag."
This reverts commit531756b954. The recommitted version fixes a crash when one of the operands is a constant other than a ConstantInt. Test for that case have been added in5b16cd97b8. It splits off the new logic into a separate function because setting the flags is quite different compared to the other cases handled in replaceSignedInst which all require replacing an existing instruction. It also guards makeGuaranteedNoWrapRegion by `if (!Inst.hasNoUnsignedWrap())` as discussed in the review. Fixes #60280. Fixes #60278. Original message: This patch updates SCCP to use the value ranges of AddInst operands to try to prove the AddInst does not overflow in the unsigned sense and adds the NUW flag. The reasoning is done with makeGuaranteedNoWrapRegion (thanks @nikic for point it out!). Follow-ups will include adding NSW and extension to more OverflowingBinaryOperators. Reviewed By: nikic Differential Revision: https://reviews.llvm.org/D142387
This commit is contained in:
@@ -41,6 +41,14 @@ static ValueLatticeElement::MergeOptions getMaxWidenStepsOpts() {
|
||||
MaxNumRangeExtensions);
|
||||
}
|
||||
|
||||
static ConstantRange getConstantRange(const ValueLatticeElement &LV, Type *Ty,
|
||||
bool UndefAllowed = true) {
|
||||
assert(Ty->isIntOrIntVectorTy() && "Should be int or int vector");
|
||||
if (LV.isConstantRange(UndefAllowed))
|
||||
return LV.getConstantRange();
|
||||
return ConstantRange::getFull(Ty->getScalarSizeInBits());
|
||||
}
|
||||
|
||||
namespace llvm {
|
||||
|
||||
bool SCCPSolver::isConstant(const ValueLatticeElement &LV) {
|
||||
@@ -115,6 +123,37 @@ bool SCCPSolver::tryToReplaceWithConstant(Value *V) {
|
||||
return true;
|
||||
}
|
||||
|
||||
/// Try to use \p Inst's value range from \p Solver to infer the NUW flag.
|
||||
static bool refineInstruction(SCCPSolver &Solver,
|
||||
const SmallPtrSetImpl<Value *> &InsertedValues,
|
||||
Instruction &Inst) {
|
||||
if (Inst.getOpcode() != Instruction::Add)
|
||||
return false;
|
||||
|
||||
auto GetRange = [&Solver, &InsertedValues](Value *Op) {
|
||||
if (auto *Const = dyn_cast<ConstantInt>(Op))
|
||||
return ConstantRange(Const->getValue());
|
||||
if (isa<Constant>(Op) || InsertedValues.contains(Op)) {
|
||||
unsigned Bitwidth = Op->getType()->getScalarSizeInBits();
|
||||
return ConstantRange::getFull(Bitwidth);
|
||||
}
|
||||
return getConstantRange(Solver.getLatticeValueFor(Op), Op->getType(),
|
||||
/*UndefAllowed=*/false);
|
||||
};
|
||||
auto RangeA = GetRange(Inst.getOperand(0));
|
||||
auto RangeB = GetRange(Inst.getOperand(1));
|
||||
if (!Inst.hasNoUnsignedWrap()) {
|
||||
auto NUWRange = ConstantRange::makeGuaranteedNoWrapRegion(
|
||||
Instruction::Add, RangeB, OverflowingBinaryOperator::NoUnsignedWrap);
|
||||
if (NUWRange.contains(RangeA)) {
|
||||
Inst.setHasNoUnsignedWrap();
|
||||
return true;
|
||||
}
|
||||
}
|
||||
|
||||
return false;
|
||||
}
|
||||
|
||||
/// Try to replace signed instructions with their unsigned equivalent.
|
||||
static bool replaceSignedInst(SCCPSolver &Solver,
|
||||
SmallPtrSetImpl<Value *> &InsertedValues,
|
||||
@@ -195,6 +234,8 @@ bool SCCPSolver::simplifyInstsInBlock(BasicBlock &BB,
|
||||
} else if (replaceSignedInst(*this, InsertedValues, Inst)) {
|
||||
MadeChanges = true;
|
||||
++InstReplacedStat;
|
||||
} else if (refineInstruction(*this, InsertedValues, Inst)) {
|
||||
MadeChanges = true;
|
||||
}
|
||||
}
|
||||
return MadeChanges;
|
||||
@@ -682,7 +723,6 @@ public:
|
||||
bool isStructLatticeConstant(Function *F, StructType *STy);
|
||||
|
||||
Constant *getConstant(const ValueLatticeElement &LV) const;
|
||||
ConstantRange getConstantRange(const ValueLatticeElement &LV, Type *Ty) const;
|
||||
|
||||
SmallPtrSetImpl<Function *> &getArgumentTrackedFunctions() {
|
||||
return TrackingIncomingArguments;
|
||||
@@ -783,15 +823,6 @@ Constant *SCCPInstVisitor::getConstant(const ValueLatticeElement &LV) const {
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
ConstantRange
|
||||
SCCPInstVisitor::getConstantRange(const ValueLatticeElement &LV,
|
||||
Type *Ty) const {
|
||||
assert(Ty->isIntOrIntVectorTy() && "Should be int or int vector");
|
||||
if (LV.isConstantRange())
|
||||
return LV.getConstantRange();
|
||||
return ConstantRange::getFull(Ty->getScalarSizeInBits());
|
||||
}
|
||||
|
||||
void SCCPInstVisitor::markArgInFuncSpecialization(
|
||||
Function *F, const SmallVectorImpl<ArgInfo> &Args) {
|
||||
assert(!Args.empty() && "Specialization without arguments");
|
||||
|
||||
@@ -5,8 +5,8 @@ define i8 @range_from_lshr(i8 %a) {
|
||||
; CHECK-LABEL: @range_from_lshr(
|
||||
; CHECK-NEXT: entry:
|
||||
; CHECK-NEXT: [[A_SHR:%.*]] = lshr i8 [[A:%.*]], 1
|
||||
; CHECK-NEXT: [[ADD_1:%.*]] = add i8 [[A_SHR]], 1
|
||||
; CHECK-NEXT: [[ADD_2:%.*]] = add i8 [[A_SHR]], -128
|
||||
; CHECK-NEXT: [[ADD_1:%.*]] = add nuw i8 [[A_SHR]], 1
|
||||
; CHECK-NEXT: [[ADD_2:%.*]] = add nuw i8 [[A_SHR]], -128
|
||||
; CHECK-NEXT: [[ADD_3:%.*]] = add i8 [[A_SHR]], -127
|
||||
; CHECK-NEXT: [[ADD_4:%.*]] = add i8 [[A_SHR]], -1
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = xor i8 [[ADD_1]], [[ADD_2]]
|
||||
@@ -30,7 +30,7 @@ define i8 @a_and_15_add_1(i8 %a) {
|
||||
; CHECK-LABEL: @a_and_15_add_1(
|
||||
; CHECK-NEXT: entry:
|
||||
; CHECK-NEXT: [[A_AND:%.*]] = and i8 [[A:%.*]], 15
|
||||
; CHECK-NEXT: [[ADD_1:%.*]] = add i8 [[A_AND]], 1
|
||||
; CHECK-NEXT: [[ADD_1:%.*]] = add nuw i8 [[A_AND]], 1
|
||||
; CHECK-NEXT: ret i8 [[ADD_1]]
|
||||
;
|
||||
entry:
|
||||
@@ -73,9 +73,9 @@ define i8 @sge_0_and_sle_90(i8 %a) {
|
||||
; CHECK-NEXT: [[AND:%.*]] = and i1 [[SGT]], [[SLT]]
|
||||
; CHECK-NEXT: br i1 [[AND]], label [[THEN:%.*]], label [[ELSE:%.*]]
|
||||
; CHECK: then:
|
||||
; CHECK-NEXT: [[ADD_1:%.*]] = add i8 [[A]], 1
|
||||
; CHECK-NEXT: [[ADD_1:%.*]] = add nuw i8 [[A]], 1
|
||||
; CHECK-NEXT: [[ADD_2:%.*]] = add i8 [[A]], -1
|
||||
; CHECK-NEXT: [[ADD_3:%.*]] = add i8 [[A]], -91
|
||||
; CHECK-NEXT: [[ADD_3:%.*]] = add nuw i8 [[A]], -91
|
||||
; CHECK-NEXT: [[ADD_4:%.*]] = add i8 [[A]], -90
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = xor i8 [[ADD_1]], [[ADD_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = xor i8 [[RES_1]], [[ADD_3]]
|
||||
@@ -125,8 +125,8 @@ define i16 @sge_with_sext_to_zext_conversion(i8 %a) {
|
||||
; CHECK-NEXT: br i1 [[CMP]], label [[THEN:%.*]], label [[ELSE:%.*]]
|
||||
; CHECK: then:
|
||||
; CHECK-NEXT: [[SEXT:%.*]] = zext i8 [[A]] to i16
|
||||
; CHECK-NEXT: [[ADD_1:%.*]] = add i16 [[SEXT]], 1
|
||||
; CHECK-NEXT: [[ADD_2:%.*]] = add i16 [[SEXT]], -128
|
||||
; CHECK-NEXT: [[ADD_1:%.*]] = add nuw i16 [[SEXT]], 1
|
||||
; CHECK-NEXT: [[ADD_2:%.*]] = add nuw i16 [[SEXT]], -128
|
||||
; CHECK-NEXT: [[ADD_3:%.*]] = add i16 [[SEXT]], -127
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = xor i16 [[ADD_1]], [[ADD_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = xor i16 [[RES_1]], [[ADD_3]]
|
||||
|
||||
@@ -36,7 +36,7 @@ entry:
|
||||
define void @add_constexpr(i32 %a) {
|
||||
; CHECK-LABEL: @add_constexpr(
|
||||
; CHECK-NEXT: entry:
|
||||
; CHECK-NEXT: [[ADD_1:%.*]] = add i32 0, [[A:%.*]]
|
||||
; CHECK-NEXT: [[ADD_1:%.*]] = add nuw i32 0, [[A:%.*]]
|
||||
; CHECK-NEXT: call void @use.i32(i32 [[ADD_1]])
|
||||
; CHECK-NEXT: [[ADD_2:%.*]] = add i32 20, [[A]]
|
||||
; CHECK-NEXT: call void @use.i32(i32 [[ADD_2]])
|
||||
|
||||
@@ -8,7 +8,7 @@ declare void @use(i1)
|
||||
define void @val_undef_eq() {
|
||||
; CHECK-LABEL: @val_undef_eq(
|
||||
; CHECK-NEXT: entry:
|
||||
; CHECK-NEXT: [[A:%.*]] = add i32 undef, 0
|
||||
; CHECK-NEXT: [[A:%.*]] = add nuw i32 undef, 0
|
||||
; CHECK-NEXT: [[BC_1:%.*]] = icmp eq i32 [[A]], 10
|
||||
; CHECK-NEXT: br i1 [[BC_1]], label [[TRUE:%.*]], label [[FALSE:%.*]]
|
||||
; CHECK: true:
|
||||
@@ -41,7 +41,7 @@ declare void @use.i32(i32)
|
||||
define void @val_undef_range() {
|
||||
; CHECK-LABEL: @val_undef_range(
|
||||
; CHECK-NEXT: entry:
|
||||
; CHECK-NEXT: [[A:%.*]] = add i32 undef, 0
|
||||
; CHECK-NEXT: [[A:%.*]] = add nuw i32 undef, 0
|
||||
; CHECK-NEXT: [[BC_1:%.*]] = icmp ult i32 [[A]], 127
|
||||
; CHECK-NEXT: br i1 [[BC_1]], label [[TRUE:%.*]], label [[FALSE:%.*]]
|
||||
; CHECK: true:
|
||||
|
||||
@@ -7,7 +7,7 @@ define void @f1(i32 %a, i32 %b) {
|
||||
; CHECK-LABEL: @f1(
|
||||
; CHECK-NEXT: entry:
|
||||
; CHECK-NEXT: [[A_255:%.*]] = and i32 [[A:%.*]], 255
|
||||
; CHECK-NEXT: [[A_2:%.*]] = add i32 [[A_255]], 20
|
||||
; CHECK-NEXT: [[A_2:%.*]] = add nuw i32 [[A_255]], 20
|
||||
; CHECK-NEXT: [[BC:%.*]] = icmp ugt i32 [[B:%.*]], [[A_2]]
|
||||
; CHECK-NEXT: br i1 [[BC]], label [[TRUE:%.*]], label [[FALSE:%.*]]
|
||||
; CHECK: true:
|
||||
@@ -260,7 +260,7 @@ define void @f8_nested_conds(i32 %a, i32 %b) {
|
||||
; CHECK-LABEL: @f8_nested_conds(
|
||||
; CHECK-NEXT: entry:
|
||||
; CHECK-NEXT: [[A_255:%.*]] = and i32 [[A:%.*]], 255
|
||||
; CHECK-NEXT: [[A_2:%.*]] = add i32 [[A_255]], 20
|
||||
; CHECK-NEXT: [[A_2:%.*]] = add nuw i32 [[A_255]], 20
|
||||
; CHECK-NEXT: [[BC_1:%.*]] = icmp ugt i32 [[B:%.*]], [[A_2]]
|
||||
; CHECK-NEXT: br i1 [[BC_1]], label [[TRUE:%.*]], label [[FALSE:%.*]]
|
||||
; CHECK: true:
|
||||
@@ -718,7 +718,7 @@ define void @loop() {
|
||||
; CHECK-NEXT: [[INC27]] = add nsw i32 [[I_0]], 1
|
||||
; CHECK-NEXT: br label [[FOR_COND]]
|
||||
; CHECK: for.body14:
|
||||
; CHECK-NEXT: [[INC]] = add nsw i32 [[J_0]], 1
|
||||
; CHECK-NEXT: [[INC]] = add nuw nsw i32 [[J_0]], 1
|
||||
; CHECK-NEXT: br label [[FOR_COND11]]
|
||||
;
|
||||
entry:
|
||||
|
||||
@@ -15,7 +15,7 @@ define i32 @caller1() {
|
||||
; CHECK-LABEL: @caller1(
|
||||
; CHECK-NEXT: [[C1:%.*]] = call i32 @callee(i32 10), !range [[RNG0:![0-9]+]]
|
||||
; CHECK-NEXT: [[C2:%.*]] = call i32 @callee(i32 20), !range [[RNG0]]
|
||||
; CHECK-NEXT: [[A:%.*]] = add i32 [[C1]], [[C2]]
|
||||
; CHECK-NEXT: [[A:%.*]] = add nuw i32 [[C1]], [[C2]]
|
||||
; CHECK-NEXT: ret i32 [[A]]
|
||||
;
|
||||
%c1 = call i32 @callee(i32 10)
|
||||
|
||||
@@ -33,9 +33,9 @@ define internal i32 @f2(i32 %x) {
|
||||
; CHECK-NEXT: [[CMP4:%.*]] = icmp ugt i32 [[X]], 300
|
||||
; CHECK-NEXT: [[RES1:%.*]] = select i1 [[CMP]], i32 1, i32 2
|
||||
; CHECK-NEXT: [[RES4:%.*]] = select i1 [[CMP4]], i32 3, i32 4
|
||||
; CHECK-NEXT: [[RES6:%.*]] = add i32 [[RES1]], 3
|
||||
; CHECK-NEXT: [[RES7:%.*]] = add i32 5, [[RES4]]
|
||||
; CHECK-NEXT: [[RES:%.*]] = add i32 [[RES6]], 5
|
||||
; CHECK-NEXT: [[RES6:%.*]] = add nuw i32 [[RES1]], 3
|
||||
; CHECK-NEXT: [[RES7:%.*]] = add nuw i32 5, [[RES4]]
|
||||
; CHECK-NEXT: [[RES:%.*]] = add nuw i32 [[RES6]], 5
|
||||
; CHECK-NEXT: ret i32 [[RES]]
|
||||
;
|
||||
entry:
|
||||
@@ -63,8 +63,8 @@ define i32 @caller1() {
|
||||
; CHECK-NEXT: [[CALL2:%.*]] = tail call i32 @f1(i32 47, i32 999)
|
||||
; CHECK-NEXT: [[CALL3:%.*]] = tail call i32 @f2(i32 47)
|
||||
; CHECK-NEXT: [[CALL4:%.*]] = tail call i32 @f2(i32 301)
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add nsw i32 12, [[CALL3]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add nsw i32 [[RES_1]], [[CALL4]]
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add nuw nsw i32 12, [[CALL3]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add nuw nsw i32 [[RES_1]], [[CALL4]]
|
||||
; CHECK-NEXT: ret i32 [[RES_2]]
|
||||
;
|
||||
entry:
|
||||
|
||||
@@ -5,13 +5,13 @@
|
||||
; x + y = [110, 221)
|
||||
define internal i1 @f.add(i32 %x, i32 %y) {
|
||||
; CHECK-LABEL: @f.add(
|
||||
; CHECK-NEXT: [[A_1:%.*]] = add i32 [[X:%.*]], [[Y:%.*]]
|
||||
; CHECK-NEXT: [[A_1:%.*]] = add nuw i32 [[X:%.*]], [[Y:%.*]]
|
||||
; CHECK-NEXT: [[C_2:%.*]] = icmp sgt i32 [[A_1]], 219
|
||||
; CHECK-NEXT: [[C_4:%.*]] = icmp slt i32 [[A_1]], 111
|
||||
; CHECK-NEXT: [[C_5:%.*]] = icmp eq i32 [[A_1]], 150
|
||||
; CHECK-NEXT: [[C_6:%.*]] = icmp slt i32 [[A_1]], 150
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add i1 [[RES_1]], false
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add nuw i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add nuw i1 [[RES_1]], false
|
||||
; CHECK-NEXT: [[RES_3:%.*]] = add i1 [[RES_2]], [[C_4]]
|
||||
; CHECK-NEXT: [[RES_4:%.*]] = add i1 [[RES_3]], [[C_5]]
|
||||
; CHECK-NEXT: [[RES_5:%.*]] = add i1 [[RES_4]], [[C_6]]
|
||||
@@ -55,8 +55,8 @@ define internal i1 @f.sub(i32 %x, i32 %y) {
|
||||
; CHECK-NEXT: [[C_4:%.*]] = icmp slt i32 [[A_1]], -189
|
||||
; CHECK-NEXT: [[C_5:%.*]] = icmp eq i32 [[A_1]], -150
|
||||
; CHECK-NEXT: [[C_6:%.*]] = icmp slt i32 [[A_1]], -150
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add i1 [[RES_1]], false
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add nuw i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add nuw i1 [[RES_1]], false
|
||||
; CHECK-NEXT: [[RES_3:%.*]] = add i1 [[RES_2]], [[C_4]]
|
||||
; CHECK-NEXT: [[RES_4:%.*]] = add i1 [[RES_3]], [[C_5]]
|
||||
; CHECK-NEXT: [[RES_5:%.*]] = add i1 [[RES_4]], [[C_6]]
|
||||
@@ -99,8 +99,8 @@ define internal i1 @f.mul(i32 %x, i32 %y) {
|
||||
; CHECK-NEXT: [[C_4:%.*]] = icmp slt i32 [[A_1]], 1001
|
||||
; CHECK-NEXT: [[C_5:%.*]] = icmp eq i32 [[A_1]], 1500
|
||||
; CHECK-NEXT: [[C_6:%.*]] = icmp slt i32 [[A_1]], 1500
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add i1 [[RES_1]], false
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add nuw i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add nuw i1 [[RES_1]], false
|
||||
; CHECK-NEXT: [[RES_3:%.*]] = add i1 [[RES_2]], [[C_4]]
|
||||
; CHECK-NEXT: [[RES_4:%.*]] = add i1 [[RES_3]], [[C_5]]
|
||||
; CHECK-NEXT: [[RES_5:%.*]] = add i1 [[RES_4]], [[C_6]]
|
||||
|
||||
@@ -7,8 +7,8 @@ define internal i1 @f.trunc(i32 %x) {
|
||||
; CHECK-NEXT: [[T_1:%.*]] = trunc i32 [[X:%.*]] to i16
|
||||
; CHECK-NEXT: [[C_2:%.*]] = icmp sgt i16 [[T_1]], 299
|
||||
; CHECK-NEXT: [[C_4:%.*]] = icmp slt i16 [[T_1]], 101
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add i1 [[RES_1]], false
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add nuw i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add nuw i1 [[RES_1]], false
|
||||
; CHECK-NEXT: [[RES_3:%.*]] = add i1 [[RES_2]], [[C_4]]
|
||||
; CHECK-NEXT: [[T_2:%.*]] = trunc i32 [[X]] to i8
|
||||
; CHECK-NEXT: [[C_5:%.*]] = icmp sgt i8 [[T_2]], 44
|
||||
@@ -62,8 +62,8 @@ define internal i1 @f.zext(i32 %x, i32 %y) {
|
||||
; CHECK-NEXT: [[T_1:%.*]] = zext i32 [[X:%.*]] to i64
|
||||
; CHECK-NEXT: [[C_2:%.*]] = icmp sgt i64 [[T_1]], 299
|
||||
; CHECK-NEXT: [[C_4:%.*]] = icmp slt i64 [[T_1]], 101
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add i1 [[RES_1]], false
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add nuw i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add nuw i1 [[RES_1]], false
|
||||
; CHECK-NEXT: [[RES_3:%.*]] = add i1 [[RES_2]], [[C_4]]
|
||||
; CHECK-NEXT: [[T_2:%.*]] = zext i32 [[Y:%.*]] to i64
|
||||
; CHECK-NEXT: [[C_5:%.*]] = icmp sgt i64 [[T_2]], 300
|
||||
@@ -71,7 +71,7 @@ define internal i1 @f.zext(i32 %x, i32 %y) {
|
||||
; CHECK-NEXT: [[C_8:%.*]] = icmp slt i64 [[T_2]], 1
|
||||
; CHECK-NEXT: [[RES_4:%.*]] = add i1 [[RES_3]], [[C_5]]
|
||||
; CHECK-NEXT: [[RES_5:%.*]] = add i1 [[RES_4]], [[C_6]]
|
||||
; CHECK-NEXT: [[RES_6:%.*]] = add i1 [[RES_5]], false
|
||||
; CHECK-NEXT: [[RES_6:%.*]] = add nuw i1 [[RES_5]], false
|
||||
; CHECK-NEXT: [[RES_7:%.*]] = add i1 [[RES_6]], [[C_8]]
|
||||
; CHECK-NEXT: ret i1 [[RES_7]]
|
||||
;
|
||||
@@ -115,15 +115,15 @@ define internal i1 @f.sext(i32 %x, i32 %y) {
|
||||
; CHECK-NEXT: [[T_1:%.*]] = zext i32 [[X:%.*]] to i64
|
||||
; CHECK-NEXT: [[C_2:%.*]] = icmp sgt i64 [[T_1]], 299
|
||||
; CHECK-NEXT: [[C_4:%.*]] = icmp slt i64 [[T_1]], 101
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add i1 [[RES_1]], false
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add nuw i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add nuw i1 [[RES_1]], false
|
||||
; CHECK-NEXT: [[RES_3:%.*]] = add i1 [[RES_2]], [[C_4]]
|
||||
; CHECK-NEXT: [[T_2:%.*]] = sext i32 [[Y:%.*]] to i64
|
||||
; CHECK-NEXT: [[C_6:%.*]] = icmp sgt i64 [[T_2]], 899
|
||||
; CHECK-NEXT: [[C_8:%.*]] = icmp slt i64 [[T_2]], -119
|
||||
; CHECK-NEXT: [[RES_4:%.*]] = add i1 [[RES_3]], false
|
||||
; CHECK-NEXT: [[RES_4:%.*]] = add nuw i1 [[RES_3]], false
|
||||
; CHECK-NEXT: [[RES_5:%.*]] = add i1 [[RES_4]], [[C_6]]
|
||||
; CHECK-NEXT: [[RES_6:%.*]] = add i1 [[RES_5]], false
|
||||
; CHECK-NEXT: [[RES_6:%.*]] = add nuw i1 [[RES_5]], false
|
||||
; CHECK-NEXT: [[RES_7:%.*]] = add i1 [[RES_6]], [[C_8]]
|
||||
; CHECK-NEXT: ret i1 [[RES_7]]
|
||||
;
|
||||
|
||||
@@ -55,12 +55,12 @@ define internal i32 @f2(i32 %x, i32 %y, i32 %z, i1 %cmp.1, i1 %cmp.2) {
|
||||
; CHECK-NEXT: [[V_1:%.*]] = select i1 [[C_1]], i32 10, i32 100
|
||||
; CHECK-NEXT: [[V_2:%.*]] = select i1 [[C_2]], i32 20, i32 200
|
||||
; CHECK-NEXT: [[V_3:%.*]] = select i1 [[C_3]], i32 30, i32 300
|
||||
; CHECK-NEXT: [[R_1:%.*]] = add i32 [[V_1]], [[V_2]]
|
||||
; CHECK-NEXT: [[R_2:%.*]] = add i32 [[R_1]], [[V_3]]
|
||||
; CHECK-NEXT: [[R_3:%.*]] = add i32 [[R_2]], 400
|
||||
; CHECK-NEXT: [[R_4:%.*]] = add i32 [[R_3]], 50
|
||||
; CHECK-NEXT: [[R_5:%.*]] = add i32 [[R_4]], 60
|
||||
; CHECK-NEXT: [[R_6:%.*]] = add i32 [[R_4]], 700
|
||||
; CHECK-NEXT: [[R_1:%.*]] = add nuw i32 [[V_1]], [[V_2]]
|
||||
; CHECK-NEXT: [[R_2:%.*]] = add nuw i32 [[R_1]], [[V_3]]
|
||||
; CHECK-NEXT: [[R_3:%.*]] = add nuw i32 [[R_2]], 400
|
||||
; CHECK-NEXT: [[R_4:%.*]] = add nuw i32 [[R_3]], 50
|
||||
; CHECK-NEXT: [[R_5:%.*]] = add nuw i32 [[R_4]], 60
|
||||
; CHECK-NEXT: [[R_6:%.*]] = add nuw i32 [[R_4]], 700
|
||||
; CHECK-NEXT: ret i32 [[R_6]]
|
||||
;
|
||||
|
||||
@@ -154,12 +154,12 @@ define internal i32 @f3(i32 %x, i32 %y, i1 %cmp.1) {
|
||||
; CHECK-NEXT: [[V_5:%.*]] = select i1 [[C_5]], i32 50, i32 500
|
||||
; CHECK-NEXT: [[V_6:%.*]] = select i1 [[C_6]], i32 60, i32 600
|
||||
; CHECK-NEXT: [[V_7:%.*]] = select i1 [[C_7]], i32 70, i32 700
|
||||
; CHECK-NEXT: [[R_1:%.*]] = add i32 [[V_1]], [[V_2]]
|
||||
; CHECK-NEXT: [[R_2:%.*]] = add i32 [[R_1]], [[V_3]]
|
||||
; CHECK-NEXT: [[R_3:%.*]] = add i32 [[R_2]], [[V_4]]
|
||||
; CHECK-NEXT: [[R_4:%.*]] = add i32 [[R_3]], [[V_5]]
|
||||
; CHECK-NEXT: [[R_5:%.*]] = add i32 [[R_4]], [[V_6]]
|
||||
; CHECK-NEXT: [[R_6:%.*]] = add i32 [[R_4]], [[V_7]]
|
||||
; CHECK-NEXT: [[R_1:%.*]] = add nuw i32 [[V_1]], [[V_2]]
|
||||
; CHECK-NEXT: [[R_2:%.*]] = add nuw i32 [[R_1]], [[V_3]]
|
||||
; CHECK-NEXT: [[R_3:%.*]] = add nuw i32 [[R_2]], [[V_4]]
|
||||
; CHECK-NEXT: [[R_4:%.*]] = add nuw i32 [[R_3]], [[V_5]]
|
||||
; CHECK-NEXT: [[R_5:%.*]] = add nuw i32 [[R_4]], [[V_6]]
|
||||
; CHECK-NEXT: [[R_6:%.*]] = add nuw i32 [[R_4]], [[V_7]]
|
||||
; CHECK-NEXT: ret i32 [[R_6]]
|
||||
;
|
||||
|
||||
|
||||
@@ -44,9 +44,9 @@ define internal i1 @f1(i32 %x, i32 %y, i1 %cmp) {
|
||||
; CHECK-NEXT: [[SEL_1:%.*]] = select i1 [[CMP]], i32 [[X]], i32 [[Y]]
|
||||
; CHECK-NEXT: [[C_2:%.*]] = icmp sgt i32 [[SEL_1]], 100
|
||||
; CHECK-NEXT: [[C_3:%.*]] = icmp eq i32 [[SEL_1]], 50
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_1:%.*]] = add nuw i1 false, [[C_2]]
|
||||
; CHECK-NEXT: [[RES_2:%.*]] = add i1 [[RES_1]], [[C_3]]
|
||||
; CHECK-NEXT: [[RES_3:%.*]] = add i1 [[RES_2]], false
|
||||
; CHECK-NEXT: [[RES_3:%.*]] = add nuw i1 [[RES_2]], false
|
||||
; CHECK-NEXT: ret i1 [[RES_3]]
|
||||
;
|
||||
%sel.1 = select i1 %cmp, i32 %x, i32 %y
|
||||
|
||||
@@ -33,7 +33,7 @@ F: ; preds = %0
|
||||
;; value
|
||||
define internal { i32, i32 } @foo(i32 %A, i32 %B) {
|
||||
; CHECK-LABEL: @foo(
|
||||
; CHECK-NEXT: [[X:%.*]] = add i32 [[A:%.*]], [[B:%.*]]
|
||||
; CHECK-NEXT: [[X:%.*]] = add nuw i32 [[A:%.*]], [[B:%.*]]
|
||||
; CHECK-NEXT: [[Y:%.*]] = insertvalue { i32, i32 } undef, i32 [[A]], 0
|
||||
; CHECK-NEXT: [[Z:%.*]] = insertvalue { i32, i32 } [[Y]], i32 [[X]], 1
|
||||
; CHECK-NEXT: ret { i32, i32 } [[Z]]
|
||||
@@ -54,7 +54,7 @@ define void @caller(i1 %C) personality ptr @__gxx_personality_v0 {
|
||||
; CHECK-NEXT: to label [[OK:%.*]] unwind label [[LPAD:%.*]]
|
||||
; CHECK: OK:
|
||||
; CHECK-NEXT: [[X2:%.*]] = extractvalue { i32, i32 } [[S2]], 0
|
||||
; CHECK-NEXT: [[Z:%.*]] = add i32 [[X1]], [[X2]]
|
||||
; CHECK-NEXT: [[Z:%.*]] = add nuw i32 [[X1]], [[X2]]
|
||||
; CHECK-NEXT: store i32 [[Z]], ptr [[W]], align 4
|
||||
; CHECK-NEXT: br label [[RET:%.*]]
|
||||
; CHECK: LPAD:
|
||||
|
||||
@@ -50,7 +50,7 @@ define %0 @caller(i1 %Q) {
|
||||
; CHECK-NEXT: [[B:%.*]] = extractvalue [[TMP0]] [[X]], 1
|
||||
; CHECK-NEXT: [[Y:%.*]] = call [[TMP0]] @bar(i1 [[Q]])
|
||||
; CHECK-NEXT: [[D:%.*]] = extractvalue [[TMP0]] [[Y]], 1
|
||||
; CHECK-NEXT: [[N:%.*]] = add i32 [[B]], [[D]]
|
||||
; CHECK-NEXT: [[N:%.*]] = add nuw i32 [[B]], [[D]]
|
||||
; CHECK-NEXT: ret [[TMP0]] [[X]]
|
||||
;
|
||||
%X = call %0 @foo(i1 %Q)
|
||||
|
||||
@@ -16,7 +16,7 @@ define void @test_2_incoming_constants(i32 %x) {
|
||||
; SCCP-NEXT: br label [[EXIT]]
|
||||
; SCCP: exit:
|
||||
; SCCP-NEXT: [[P:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ 1, [[BB1]] ]
|
||||
; SCCP-NEXT: [[A:%.*]] = add i32 [[P]], 1
|
||||
; SCCP-NEXT: [[A:%.*]] = add nuw i32 [[P]], 1
|
||||
; SCCP-NEXT: call void @use(i1 true)
|
||||
; SCCP-NEXT: call void @use(i1 false)
|
||||
; SCCP-NEXT: ret void
|
||||
@@ -29,7 +29,7 @@ define void @test_2_incoming_constants(i32 %x) {
|
||||
; IPSCCP-NEXT: br label [[EXIT]]
|
||||
; IPSCCP: exit:
|
||||
; IPSCCP-NEXT: [[P:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ 1, [[BB1]] ]
|
||||
; IPSCCP-NEXT: [[A:%.*]] = add i32 [[P]], 1
|
||||
; IPSCCP-NEXT: [[A:%.*]] = add nuw i32 [[P]], 1
|
||||
; IPSCCP-NEXT: call void @use(i1 true)
|
||||
; IPSCCP-NEXT: call void @use(i1 false)
|
||||
; IPSCCP-NEXT: ret void
|
||||
@@ -63,7 +63,7 @@ define void @test_3_incoming_constants(i32 %x) {
|
||||
; SCCP-NEXT: br label [[EXIT]]
|
||||
; SCCP: exit:
|
||||
; SCCP-NEXT: [[P:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ 1, [[BB1]] ], [ 2, [[BB2]] ]
|
||||
; SCCP-NEXT: [[A:%.*]] = add i32 [[P]], 1
|
||||
; SCCP-NEXT: [[A:%.*]] = add nuw i32 [[P]], 1
|
||||
; SCCP-NEXT: call void @use(i1 true)
|
||||
; SCCP-NEXT: call void @use(i1 false)
|
||||
; SCCP-NEXT: ret void
|
||||
@@ -79,7 +79,7 @@ define void @test_3_incoming_constants(i32 %x) {
|
||||
; IPSCCP-NEXT: br label [[EXIT]]
|
||||
; IPSCCP: exit:
|
||||
; IPSCCP-NEXT: [[P:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ 1, [[BB1]] ], [ 2, [[BB2]] ]
|
||||
; IPSCCP-NEXT: [[A:%.*]] = add i32 [[P]], 1
|
||||
; IPSCCP-NEXT: [[A:%.*]] = add nuw i32 [[P]], 1
|
||||
; IPSCCP-NEXT: call void @use(i1 true)
|
||||
; IPSCCP-NEXT: call void @use(i1 false)
|
||||
; IPSCCP-NEXT: ret void
|
||||
@@ -123,7 +123,7 @@ define void @test_5_incoming_constants(i32 %x) {
|
||||
; SCCP-NEXT: br label [[EXIT]]
|
||||
; SCCP: exit:
|
||||
; SCCP-NEXT: [[P:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ 1, [[BB1]] ], [ 2, [[BB2]] ], [ 3, [[BB3]] ], [ 4, [[BB4]] ]
|
||||
; SCCP-NEXT: [[A:%.*]] = add i32 [[P]], 1
|
||||
; SCCP-NEXT: [[A:%.*]] = add nuw i32 [[P]], 1
|
||||
; SCCP-NEXT: call void @use(i1 true)
|
||||
; SCCP-NEXT: call void @use(i1 false)
|
||||
; SCCP-NEXT: ret void
|
||||
@@ -145,7 +145,7 @@ define void @test_5_incoming_constants(i32 %x) {
|
||||
; IPSCCP-NEXT: br label [[EXIT]]
|
||||
; IPSCCP: exit:
|
||||
; IPSCCP-NEXT: [[P:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ 1, [[BB1]] ], [ 2, [[BB2]] ], [ 3, [[BB3]] ], [ 4, [[BB4]] ]
|
||||
; IPSCCP-NEXT: [[A:%.*]] = add i32 [[P]], 1
|
||||
; IPSCCP-NEXT: [[A:%.*]] = add nuw i32 [[P]], 1
|
||||
; IPSCCP-NEXT: call void @use(i1 true)
|
||||
; IPSCCP-NEXT: call void @use(i1 false)
|
||||
; IPSCCP-NEXT: ret void
|
||||
@@ -196,7 +196,7 @@ define void @rotated_loop_2(i32 %x) {
|
||||
; SCCP-NEXT: br label [[EXIT]]
|
||||
; SCCP: exit:
|
||||
; SCCP-NEXT: [[P:%.*]] = phi i32 [ 1, [[ENTRY:%.*]] ], [ 3, [[BB1]] ], [ 2, [[BB2]] ], [ 5, [[BB3]] ]
|
||||
; SCCP-NEXT: [[A:%.*]] = add i32 [[P]], 1
|
||||
; SCCP-NEXT: [[A:%.*]] = add nuw i32 [[P]], 1
|
||||
; SCCP-NEXT: call void @use(i1 true)
|
||||
; SCCP-NEXT: call void @use(i1 false)
|
||||
; SCCP-NEXT: br label [[EXIT_1:%.*]]
|
||||
@@ -217,7 +217,7 @@ define void @rotated_loop_2(i32 %x) {
|
||||
; IPSCCP-NEXT: br label [[EXIT]]
|
||||
; IPSCCP: exit:
|
||||
; IPSCCP-NEXT: [[P:%.*]] = phi i32 [ 1, [[ENTRY:%.*]] ], [ 3, [[BB1]] ], [ 2, [[BB2]] ], [ 5, [[BB3]] ]
|
||||
; IPSCCP-NEXT: [[A:%.*]] = add i32 [[P]], 1
|
||||
; IPSCCP-NEXT: [[A:%.*]] = add nuw i32 [[P]], 1
|
||||
; IPSCCP-NEXT: call void @use(i1 true)
|
||||
; IPSCCP-NEXT: call void @use(i1 false)
|
||||
; IPSCCP-NEXT: br label [[EXIT_1:%.*]]
|
||||
@@ -358,7 +358,7 @@ define void @loop_with_header_1(i32 %x) {
|
||||
; IPSCCP-NEXT: br i1 [[C_1]], label [[LOOP_BODY]], label [[EXIT:%.*]]
|
||||
; IPSCCP: loop.body:
|
||||
; IPSCCP-NEXT: call void @use(i1 true)
|
||||
; IPSCCP-NEXT: [[IV_NEXT]] = add nsw i32 [[IV]], 1
|
||||
; IPSCCP-NEXT: [[IV_NEXT]] = add nuw nsw i32 [[IV]], 1
|
||||
; IPSCCP-NEXT: br label [[LOOP_HEADER]]
|
||||
; IPSCCP: exit:
|
||||
; IPSCCP-NEXT: ret void
|
||||
|
||||
Reference in New Issue
Block a user