2010-01-05 15:50:36 +08:00
|
|
|
//===- InstCombineAndOrXor.cpp --------------------------------------------===//
|
|
|
|
//
|
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// This file implements the visitAnd, visitOr, and visitXor functions.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
2015-01-22 13:25:13 +08:00
|
|
|
#include "InstCombineInternal.h"
|
2010-01-05 15:50:36 +08:00
|
|
|
#include "llvm/Analysis/InstructionSimplify.h"
|
2014-03-04 20:24:34 +08:00
|
|
|
#include "llvm/IR/ConstantRange.h"
|
2013-01-02 19:36:10 +08:00
|
|
|
#include "llvm/IR/Intrinsics.h"
|
2014-03-04 19:08:18 +08:00
|
|
|
#include "llvm/IR/PatternMatch.h"
|
2012-12-04 00:50:05 +08:00
|
|
|
#include "llvm/Transforms/Utils/CmpInstAnalysis.h"
|
2016-01-15 17:20:19 +08:00
|
|
|
#include "llvm/Transforms/Utils/Local.h"
|
2010-01-05 15:50:36 +08:00
|
|
|
using namespace llvm;
|
|
|
|
using namespace PatternMatch;
|
|
|
|
|
2014-04-22 10:55:47 +08:00
|
|
|
#define DEBUG_TYPE "instcombine"
|
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
/// Try to view \p V as the bitwise 'not' of some other value.
///
/// \returns the operand of a 'not' instruction when IsFreeToInvert rejects
/// that operand (a not-of-not style pattern is deliberately left alone so the
/// two not's get folded first), the complemented constant when \p V is a
/// ConstantInt, and null in every other case.
static inline Value *dyn_castNotVal(Value *V) {
  if (BinaryOperator::isNot(V)) {
    Value *Inverted = BinaryOperator::getNotArgument(V);
    const bool FreeToInvert = IsFreeToInvert(Inverted, Inverted->hasOneUse());
    if (!FreeToInvert)
      return Inverted;
  }

  // A constant can always be treated as the 'not' of its complement.
  auto *CI = dyn_cast<ConstantInt>(V);
  if (!CI)
    return nullptr;
  return ConstantInt::get(CI->getType(), ~CI->getValue());
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// Similar to getICmpCode but for FCmpInst. This encodes a fcmp predicate into
|
[InstCombine] Simplify and correct folding fcmps with the same children
Summary: Take advantage of FCmpInst::Predicate's bit pattern and handle (fcmp *, x, y) | (fcmp *, x, y) and (fcmp *, x, y) & (fcmp *, x, y) more consistently. Also fold more FCmpInst::FCMP_FALSE and FCmpInst::FCMP_TRUE to constants.
Currently InstCombine wrongly folds (fcmp ogt, x, y) | (fcmp ord, x, y) to (fcmp ogt, x, y); this patch also fixes that.
Reviewers: spatel
Subscribers: llvm-commits, iteratee, echristo
Differential Revision: http://reviews.llvm.org/D21775
llvm-svn: 274156
2016-06-30 04:10:17 +08:00
|
|
|
/// a four bit mask.
|
|
|
|
static unsigned getFCmpCode(FCmpInst::Predicate CC) {
|
|
|
|
assert(FCmpInst::FCMP_FALSE <= CC && CC <= FCmpInst::FCMP_TRUE &&
|
|
|
|
"Unexpected FCmp predicate!");
|
|
|
|
// Take advantage of the bit pattern of FCmpInst::Predicate here.
|
|
|
|
// U L G E
|
|
|
|
static_assert(FCmpInst::FCMP_FALSE == 0, ""); // 0 0 0 0
|
|
|
|
static_assert(FCmpInst::FCMP_OEQ == 1, ""); // 0 0 0 1
|
|
|
|
static_assert(FCmpInst::FCMP_OGT == 2, ""); // 0 0 1 0
|
|
|
|
static_assert(FCmpInst::FCMP_OGE == 3, ""); // 0 0 1 1
|
|
|
|
static_assert(FCmpInst::FCMP_OLT == 4, ""); // 0 1 0 0
|
|
|
|
static_assert(FCmpInst::FCMP_OLE == 5, ""); // 0 1 0 1
|
|
|
|
static_assert(FCmpInst::FCMP_ONE == 6, ""); // 0 1 1 0
|
|
|
|
static_assert(FCmpInst::FCMP_ORD == 7, ""); // 0 1 1 1
|
|
|
|
static_assert(FCmpInst::FCMP_UNO == 8, ""); // 1 0 0 0
|
|
|
|
static_assert(FCmpInst::FCMP_UEQ == 9, ""); // 1 0 0 1
|
|
|
|
static_assert(FCmpInst::FCMP_UGT == 10, ""); // 1 0 1 0
|
|
|
|
static_assert(FCmpInst::FCMP_UGE == 11, ""); // 1 0 1 1
|
|
|
|
static_assert(FCmpInst::FCMP_ULT == 12, ""); // 1 1 0 0
|
|
|
|
static_assert(FCmpInst::FCMP_ULE == 13, ""); // 1 1 0 1
|
|
|
|
static_assert(FCmpInst::FCMP_UNE == 14, ""); // 1 1 1 0
|
|
|
|
static_assert(FCmpInst::FCMP_TRUE == 15, ""); // 1 1 1 1
|
|
|
|
return CC;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// This is the complement of getICmpCode, which turns an opcode and two
|
|
|
|
/// operands into either a constant true or false, or a brand new ICmp
|
|
|
|
/// instruction. The sign is passed in to determine which kind of predicate to
|
|
|
|
/// use in the new icmp instruction.
|
2012-02-06 19:28:19 +08:00
|
|
|
static Value *getNewICmpValue(bool Sign, unsigned Code, Value *LHS, Value *RHS,
|
|
|
|
InstCombiner::BuilderTy *Builder) {
|
2011-12-17 09:20:32 +08:00
|
|
|
ICmpInst::Predicate NewPred;
|
|
|
|
if (Value *NewConstant = getICmpValue(Sign, Code, LHS, RHS, NewPred))
|
|
|
|
return NewConstant;
|
|
|
|
return Builder->CreateICmp(NewPred, LHS, RHS);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// This is the complement of getFCmpCode, which turns an opcode and two
|
[InstCombine] Simplify and correct folding fcmps with the same children
Summary: Take advantage of FCmpInst::Predicate's bit pattern and handle (fcmp *, x, y) | (fcmp *, x, y) and (fcmp *, x, y) & (fcmp *, x, y) more consistently. Also fold more FCmpInst::FCMP_FALSE and FCmpInst::FCMP_TRUE to constants.
Currently InstCombine wrongly folds (fcmp ogt, x, y) | (fcmp ord, x, y) to (fcmp ogt, x, y); this patch also fixes that.
Reviewers: spatel
Subscribers: llvm-commits, iteratee, echristo
Differential Revision: http://reviews.llvm.org/D21775
llvm-svn: 274156
2016-06-30 04:10:17 +08:00
|
|
|
/// operands into either a FCmp instruction, or a true/false constant.
|
|
|
|
static Value *getFCmpValue(unsigned Code, Value *LHS, Value *RHS,
|
2010-03-05 16:46:26 +08:00
|
|
|
InstCombiner::BuilderTy *Builder) {
|
[InstCombine] Simplify and correct folding fcmps with the same children
Summary: Take advantage of FCmpInst::Predicate's bit pattern and handle (fcmp *, x, y) | (fcmp *, x, y) and (fcmp *, x, y) & (fcmp *, x, y) more consistently. Also fold more FCmpInst::FCMP_FALSE and FCmpInst::FCMP_TRUE to constants.
Currently InstCombine wrongly folds (fcmp ogt, x, y) | (fcmp ord, x, y) to (fcmp ogt, x, y); this patch also fixes that.
Reviewers: spatel
Subscribers: llvm-commits, iteratee, echristo
Differential Revision: http://reviews.llvm.org/D21775
llvm-svn: 274156
2016-06-30 04:10:17 +08:00
|
|
|
const auto Pred = static_cast<FCmpInst::Predicate>(Code);
|
|
|
|
assert(FCmpInst::FCMP_FALSE <= Pred && Pred <= FCmpInst::FCMP_TRUE &&
|
|
|
|
"Unexpected FCmp predicate!");
|
|
|
|
if (Pred == FCmpInst::FCMP_FALSE)
|
|
|
|
return ConstantInt::get(CmpInst::makeCmpResultType(LHS->getType()), 0);
|
|
|
|
if (Pred == FCmpInst::FCMP_TRUE)
|
|
|
|
return ConstantInt::get(CmpInst::makeCmpResultType(LHS->getType()), 1);
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateFCmp(Pred, LHS, RHS);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2014-12-04 17:44:01 +08:00
|
|
|
/// \brief Transform BITWISE_OP(BSWAP(A),BSWAP(B)) to BSWAP(BITWISE_OP(A, B))
|
|
|
|
/// \param I Binary operator to transform.
|
|
|
|
/// \return Pointer to node that must replace the original binary operator, or
|
|
|
|
/// null pointer if no transformation was made.
|
|
|
|
Value *InstCombiner::SimplifyBSwap(BinaryOperator &I) {
|
|
|
|
IntegerType *ITy = dyn_cast<IntegerType>(I.getType());
|
|
|
|
|
|
|
|
// Can't do vectors.
|
|
|
|
if (I.getType()->isVectorTy()) return nullptr;
|
|
|
|
|
|
|
|
// Can only do bitwise ops.
|
|
|
|
unsigned Op = I.getOpcode();
|
|
|
|
if (Op != Instruction::And && Op != Instruction::Or &&
|
|
|
|
Op != Instruction::Xor)
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
Value *OldLHS = I.getOperand(0);
|
|
|
|
Value *OldRHS = I.getOperand(1);
|
|
|
|
ConstantInt *ConstLHS = dyn_cast<ConstantInt>(OldLHS);
|
|
|
|
ConstantInt *ConstRHS = dyn_cast<ConstantInt>(OldRHS);
|
|
|
|
IntrinsicInst *IntrLHS = dyn_cast<IntrinsicInst>(OldLHS);
|
|
|
|
IntrinsicInst *IntrRHS = dyn_cast<IntrinsicInst>(OldRHS);
|
|
|
|
bool IsBswapLHS = (IntrLHS && IntrLHS->getIntrinsicID() == Intrinsic::bswap);
|
|
|
|
bool IsBswapRHS = (IntrRHS && IntrRHS->getIntrinsicID() == Intrinsic::bswap);
|
|
|
|
|
|
|
|
if (!IsBswapLHS && !IsBswapRHS)
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
if (!IsBswapLHS && !ConstLHS)
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
if (!IsBswapRHS && !ConstRHS)
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
/// OP( BSWAP(x), BSWAP(y) ) -> BSWAP( OP(x, y) )
|
|
|
|
/// OP( BSWAP(x), CONSTANT ) -> BSWAP( OP(x, BSWAP(CONSTANT) ) )
|
|
|
|
Value *NewLHS = IsBswapLHS ? IntrLHS->getOperand(0) :
|
|
|
|
Builder->getInt(ConstLHS->getValue().byteSwap());
|
|
|
|
|
|
|
|
Value *NewRHS = IsBswapRHS ? IntrRHS->getOperand(0) :
|
|
|
|
Builder->getInt(ConstRHS->getValue().byteSwap());
|
|
|
|
|
|
|
|
Value *BinOp = nullptr;
|
|
|
|
if (Op == Instruction::And)
|
|
|
|
BinOp = Builder->CreateAnd(NewLHS, NewRHS);
|
|
|
|
else if (Op == Instruction::Or)
|
|
|
|
BinOp = Builder->CreateOr(NewLHS, NewRHS);
|
|
|
|
else //if (Op == Instruction::Xor)
|
|
|
|
BinOp = Builder->CreateXor(NewLHS, NewRHS);
|
|
|
|
|
2015-12-15 01:24:23 +08:00
|
|
|
Function *F = Intrinsic::getDeclaration(I.getModule(), Intrinsic::bswap, ITy);
|
2014-12-04 17:44:01 +08:00
|
|
|
return Builder->CreateCall(F, BinOp);
|
|
|
|
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// This handles expressions of the form ((val OP C1) & C2). Where
|
|
|
|
/// the Op parameter is 'OP', OpRHS is 'C1', and AndRHS is 'C2'. Op is
|
|
|
|
/// guaranteed to be a binary operator.
|
2010-01-05 15:50:36 +08:00
|
|
|
Instruction *InstCombiner::OptAndOp(Instruction *Op,
|
|
|
|
ConstantInt *OpRHS,
|
|
|
|
ConstantInt *AndRHS,
|
|
|
|
BinaryOperator &TheAnd) {
|
|
|
|
Value *X = Op->getOperand(0);
|
2014-04-25 13:29:35 +08:00
|
|
|
Constant *Together = nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
if (!Op->isShift())
|
|
|
|
Together = ConstantExpr::getAnd(AndRHS, OpRHS);
|
|
|
|
|
|
|
|
switch (Op->getOpcode()) {
|
|
|
|
case Instruction::Xor:
|
|
|
|
if (Op->hasOneUse()) {
|
|
|
|
// (X ^ C1) & C2 --> (X & C2) ^ (C1&C2)
|
|
|
|
Value *And = Builder->CreateAnd(X, AndRHS);
|
|
|
|
And->takeName(Op);
|
|
|
|
return BinaryOperator::CreateXor(And, Together);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case Instruction::Or:
|
2010-09-14 01:59:27 +08:00
|
|
|
if (Op->hasOneUse()){
|
|
|
|
if (Together != OpRHS) {
|
|
|
|
// (X | C1) & C2 --> (X | (C1&C2)) & C2
|
|
|
|
Value *Or = Builder->CreateOr(X, Together);
|
|
|
|
Or->takeName(Op);
|
|
|
|
return BinaryOperator::CreateAnd(Or, AndRHS);
|
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-09-14 01:59:27 +08:00
|
|
|
ConstantInt *TogetherCI = dyn_cast<ConstantInt>(Together);
|
|
|
|
if (TogetherCI && !TogetherCI->isZero()){
|
|
|
|
// (X | C1) & C2 --> (X & (C2^(C1&C2))) | C1
|
|
|
|
// NOTE: This reduces the number of bits set in the & mask, which
|
|
|
|
// can expose opportunities for store narrowing.
|
|
|
|
Together = ConstantExpr::getXor(AndRHS, Together);
|
|
|
|
Value *And = Builder->CreateAnd(X, Together);
|
|
|
|
And->takeName(Op);
|
|
|
|
return BinaryOperator::CreateOr(And, OpRHS);
|
|
|
|
}
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
break;
|
|
|
|
case Instruction::Add:
|
|
|
|
if (Op->hasOneUse()) {
|
|
|
|
// Adding a one to a single bit bit-field should be turned into an XOR
|
|
|
|
// of the bit. First thing to check is to see if this AND is with a
|
|
|
|
// single bit constant.
|
2013-06-06 08:49:57 +08:00
|
|
|
const APInt &AndRHSV = AndRHS->getValue();
|
2010-01-05 15:50:36 +08:00
|
|
|
|
|
|
|
// If there is only one bit set.
|
|
|
|
if (AndRHSV.isPowerOf2()) {
|
|
|
|
// Ok, at this point, we know that we are masking the result of the
|
|
|
|
// ADD down to exactly one bit. If the constant we are adding has
|
|
|
|
// no bits set below this bit, then we can eliminate the ADD.
|
2013-06-06 08:49:57 +08:00
|
|
|
const APInt& AddRHS = OpRHS->getValue();
|
2010-01-05 15:50:36 +08:00
|
|
|
|
|
|
|
// Check to see if any bits below the one bit set in AndRHSV are set.
|
|
|
|
if ((AddRHS & (AndRHSV-1)) == 0) {
|
|
|
|
// If not, the only thing that can effect the output of the AND is
|
|
|
|
// the bit specified by AndRHSV. If that bit is set, the effect of
|
|
|
|
// the XOR is to toggle the bit. If it is clear, then the ADD has
|
|
|
|
// no effect.
|
|
|
|
if ((AddRHS & AndRHSV) == 0) { // Bit is not set, noop
|
|
|
|
TheAnd.setOperand(0, X);
|
|
|
|
return &TheAnd;
|
|
|
|
} else {
|
|
|
|
// Pull the XOR out of the AND.
|
|
|
|
Value *NewAnd = Builder->CreateAnd(X, AndRHS);
|
|
|
|
NewAnd->takeName(Op);
|
|
|
|
return BinaryOperator::CreateXor(NewAnd, AndRHS);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case Instruction::Shl: {
|
|
|
|
// We know that the AND will not produce any of the bits shifted in, so if
|
|
|
|
// the anded constant includes them, clear them now!
|
|
|
|
//
|
|
|
|
uint32_t BitWidth = AndRHS->getType()->getBitWidth();
|
|
|
|
uint32_t OpRHSVal = OpRHS->getLimitedValue(BitWidth);
|
|
|
|
APInt ShlMask(APInt::getHighBitsSet(BitWidth, BitWidth-OpRHSVal));
|
2013-06-06 08:37:23 +08:00
|
|
|
ConstantInt *CI = Builder->getInt(AndRHS->getValue() & ShlMask);
|
2010-01-05 15:50:36 +08:00
|
|
|
|
2011-02-15 09:56:08 +08:00
|
|
|
if (CI->getValue() == ShlMask)
|
|
|
|
// Masking out bits that the shift already masks.
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(TheAnd, Op); // No need for the and.
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2011-02-15 09:56:08 +08:00
|
|
|
if (CI != AndRHS) { // Reducing bits set in and.
|
2010-01-05 15:50:36 +08:00
|
|
|
TheAnd.setOperand(1, CI);
|
|
|
|
return &TheAnd;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case Instruction::LShr: {
|
|
|
|
// We know that the AND will not produce any of the bits shifted in, so if
|
|
|
|
// the anded constant includes them, clear them now! This only applies to
|
|
|
|
// unsigned shifts, because a signed shr may bring in set bits!
|
|
|
|
//
|
|
|
|
uint32_t BitWidth = AndRHS->getType()->getBitWidth();
|
|
|
|
uint32_t OpRHSVal = OpRHS->getLimitedValue(BitWidth);
|
|
|
|
APInt ShrMask(APInt::getLowBitsSet(BitWidth, BitWidth - OpRHSVal));
|
2013-06-06 08:37:23 +08:00
|
|
|
ConstantInt *CI = Builder->getInt(AndRHS->getValue() & ShrMask);
|
2010-01-05 15:50:36 +08:00
|
|
|
|
2011-02-15 09:56:08 +08:00
|
|
|
if (CI->getValue() == ShrMask)
|
|
|
|
// Masking out bits that the shift already masks.
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(TheAnd, Op);
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2011-02-15 09:56:08 +08:00
|
|
|
if (CI != AndRHS) {
|
2010-01-05 15:50:36 +08:00
|
|
|
TheAnd.setOperand(1, CI); // Reduce bits set in and cst.
|
|
|
|
return &TheAnd;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case Instruction::AShr:
|
|
|
|
// Signed shr.
|
|
|
|
// See if this is shifting in some sign extension, then masking it out
|
|
|
|
// with an and.
|
|
|
|
if (Op->hasOneUse()) {
|
|
|
|
uint32_t BitWidth = AndRHS->getType()->getBitWidth();
|
|
|
|
uint32_t OpRHSVal = OpRHS->getLimitedValue(BitWidth);
|
|
|
|
APInt ShrMask(APInt::getLowBitsSet(BitWidth, BitWidth - OpRHSVal));
|
2013-06-06 08:37:23 +08:00
|
|
|
Constant *C = Builder->getInt(AndRHS->getValue() & ShrMask);
|
2010-01-05 15:50:36 +08:00
|
|
|
if (C == AndRHS) { // Masking out bits shifted in.
|
|
|
|
// (Val ashr C1) & C2 -> (Val lshr C1) & C2
|
|
|
|
// Make the argument unsigned.
|
|
|
|
Value *ShVal = Op->getOperand(0);
|
|
|
|
ShVal = Builder->CreateLShr(ShVal, OpRHS, Op->getName());
|
|
|
|
return BinaryOperator::CreateAnd(ShVal, AndRHS, TheAnd.getName());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2013-04-06 05:20:12 +08:00
|
|
|
/// Emit a computation of: (V >= Lo && V < Hi) if Inside is true, otherwise
|
|
|
|
/// (V < Lo || V >= Hi). In practice, we emit the more efficient
|
2012-11-15 08:35:50 +08:00
|
|
|
/// (V-Lo) \<u Hi-Lo. This method expects that Lo <= Hi. isSigned indicates
|
2010-01-05 15:50:36 +08:00
|
|
|
/// whether to treat the V, Lo and HI as signed or not. IB is the location to
|
|
|
|
/// insert new instructions.
|
2010-03-05 16:46:26 +08:00
|
|
|
Value *InstCombiner::InsertRangeTest(Value *V, Constant *Lo, Constant *Hi,
|
|
|
|
bool isSigned, bool Inside) {
|
2012-12-20 15:09:41 +08:00
|
|
|
assert(cast<ConstantInt>(ConstantExpr::getICmp((isSigned ?
|
2010-01-05 15:50:36 +08:00
|
|
|
ICmpInst::ICMP_SLE:ICmpInst::ICMP_ULE), Lo, Hi))->getZExtValue() &&
|
|
|
|
"Lo is not <= Hi in range emission code!");
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (Inside) {
|
|
|
|
if (Lo == Hi) // Trivially false.
|
2013-06-06 08:37:23 +08:00
|
|
|
return Builder->getFalse();
|
2010-01-05 15:50:36 +08:00
|
|
|
|
|
|
|
// V >= Min && V < Hi --> V < Hi
|
|
|
|
if (cast<ConstantInt>(Lo)->isMinValue(isSigned)) {
|
2012-12-20 15:09:41 +08:00
|
|
|
ICmpInst::Predicate pred = (isSigned ?
|
2010-01-05 15:50:36 +08:00
|
|
|
ICmpInst::ICMP_SLT : ICmpInst::ICMP_ULT);
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateICmp(pred, V, Hi);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Emit V-Lo <u Hi-Lo
|
|
|
|
Constant *NegLo = ConstantExpr::getNeg(Lo);
|
|
|
|
Value *Add = Builder->CreateAdd(V, NegLo, V->getName()+".off");
|
|
|
|
Constant *UpperBound = ConstantExpr::getAdd(NegLo, Hi);
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateICmpULT(Add, UpperBound);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if (Lo == Hi) // Trivially true.
|
2013-06-06 08:37:23 +08:00
|
|
|
return Builder->getTrue();
|
2010-01-05 15:50:36 +08:00
|
|
|
|
|
|
|
// V < Min || V >= Hi -> V > Hi-1
|
|
|
|
Hi = SubOne(cast<ConstantInt>(Hi));
|
|
|
|
if (cast<ConstantInt>(Lo)->isMinValue(isSigned)) {
|
2012-12-20 15:09:41 +08:00
|
|
|
ICmpInst::Predicate pred = (isSigned ?
|
2010-01-05 15:50:36 +08:00
|
|
|
ICmpInst::ICMP_SGT : ICmpInst::ICMP_UGT);
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateICmp(pred, V, Hi);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Emit V-Lo >u Hi-1-Lo
|
|
|
|
// Note that Hi has already had one subtracted from it, above.
|
|
|
|
ConstantInt *NegLo = cast<ConstantInt>(ConstantExpr::getNeg(Lo));
|
|
|
|
Value *Add = Builder->CreateAdd(V, NegLo, V->getName()+".off");
|
|
|
|
Constant *LowerBound = ConstantExpr::getAdd(NegLo, Hi);
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateICmpUGT(Add, LowerBound);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// Returns true iff Val consists of one contiguous run of 1s with any number
|
|
|
|
/// of 0s on either side. The 1s are allowed to wrap from LSB to MSB,
|
|
|
|
/// so 0x000FFF0, 0x0000FFFF, and 0xFF0000FF are all runs. 0x0F0F0000 is
|
|
|
|
/// not, since all 1s are not contiguous.
|
2010-01-05 15:50:36 +08:00
|
|
|
static bool isRunOfOnes(ConstantInt *Val, uint32_t &MB, uint32_t &ME) {
|
|
|
|
const APInt& V = Val->getValue();
|
|
|
|
uint32_t BitWidth = Val->getType()->getBitWidth();
|
|
|
|
if (!APIntOps::isShiftedMask(BitWidth, V)) return false;
|
|
|
|
|
|
|
|
// look for the first zero bit after the run of ones
|
|
|
|
MB = BitWidth - ((V - 1) ^ V).countLeadingZeros();
|
|
|
|
// look for the first non-zero bit
|
2012-12-20 15:09:41 +08:00
|
|
|
ME = V.getActiveBits();
|
2010-01-05 15:50:36 +08:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// This is part of an expression (LHS +/- RHS) & Mask, where isSub determines
|
|
|
|
/// whether the operator is a sub. If we can fold one of the following xforms:
|
2012-12-20 15:09:41 +08:00
|
|
|
///
|
2012-09-27 18:14:43 +08:00
|
|
|
/// ((A & N) +/- B) & Mask -> (A +/- B) & Mask iff N&Mask == Mask
|
|
|
|
/// ((A | N) +/- B) & Mask -> (A +/- B) & Mask iff N&Mask == 0
|
|
|
|
/// ((A ^ N) +/- B) & Mask -> (A +/- B) & Mask iff N&Mask == 0
|
2010-01-05 15:50:36 +08:00
|
|
|
///
|
|
|
|
/// return (A +/- B).
|
|
|
|
///
|
|
|
|
Value *InstCombiner::FoldLogicalPlusAnd(Value *LHS, Value *RHS,
|
|
|
|
ConstantInt *Mask, bool isSub,
|
|
|
|
Instruction &I) {
|
|
|
|
Instruction *LHSI = dyn_cast<Instruction>(LHS);
|
|
|
|
if (!LHSI || LHSI->getNumOperands() != 2 ||
|
2014-04-25 13:29:35 +08:00
|
|
|
!isa<ConstantInt>(LHSI->getOperand(1))) return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
|
|
|
|
ConstantInt *N = cast<ConstantInt>(LHSI->getOperand(1));
|
|
|
|
|
|
|
|
switch (LHSI->getOpcode()) {
|
2014-04-25 13:29:35 +08:00
|
|
|
default: return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
case Instruction::And:
|
|
|
|
if (ConstantExpr::getAnd(N, Mask) == Mask) {
|
|
|
|
// If the AndRHS is a power of two minus one (0+1+), this is simple.
|
2012-12-20 15:09:41 +08:00
|
|
|
if ((Mask->getValue().countLeadingZeros() +
|
|
|
|
Mask->getValue().countPopulation()) ==
|
2010-01-05 15:50:36 +08:00
|
|
|
Mask->getValue().getBitWidth())
|
|
|
|
break;
|
|
|
|
|
|
|
|
// Otherwise, if Mask is 0+1+0+, and if B is known to have the low 0+
|
|
|
|
// part, we don't need any explicit masks to take them out of A. If that
|
|
|
|
// is all N is, ignore it.
|
|
|
|
uint32_t MB = 0, ME = 0;
|
|
|
|
if (isRunOfOnes(Mask, MB, ME)) { // begin/end bit of run, inclusive
|
|
|
|
uint32_t BitWidth = cast<IntegerType>(RHS->getType())->getBitWidth();
|
|
|
|
APInt Mask(APInt::getLowBitsSet(BitWidth, MB-1));
|
Make use of @llvm.assume in ValueTracking (computeKnownBits, etc.)
This change, which allows @llvm.assume to be used from within computeKnownBits
(and other associated functions in ValueTracking), adds some (optional)
parameters to computeKnownBits and friends. These functions now (optionally)
take a "context" instruction pointer, an AssumptionTracker pointer, and also a
DomTree pointer, and most of the changes are just to pass this new information
when it is easily available from InstSimplify, InstCombine, etc.
As explained below, the significant conceptual change is that known properties
of a value might depend on the control-flow location of the use (because we
care that the @llvm.assume dominates the use because assumptions have
control-flow dependencies). This means that, when we ask if bits are known in a
value, we might get different answers for different uses.
The significant changes are all in ValueTracking. Two main changes: First, as
with the rest of the code, new parameters need to be passed around. To make
this easier, I grouped them into a structure, and I made internal static
versions of the relevant functions that take this structure as a parameter. The
new code does as you might expect, it looks for @llvm.assume calls that make
use of the value we're trying to learn something about (often indirectly),
attempts to pattern match that expression, and uses the result if successful.
By making use of the AssumptionTracker, the process of finding @llvm.assume
calls is not expensive.
Part of the structure being passed around inside ValueTracking is a set of
already-considered @llvm.assume calls. This is to prevent a query using, for
example, the assume(a == b), to recurse on itself. The context and DT params
are used to find applicable assumptions. An assumption needs to dominate the
context instruction, or come after it deterministically. In this latter case we
only handle the specific case where both the assumption and the context
instruction are in the same block, and we need to exclude assumptions from
being used to simplify their own ephemeral values (those which contribute only
to the assumption) because otherwise the assumption would prove its feeding
comparison trivial and would be removed.
This commit adds the plumbing and the logic for a simple masked-bit propagation
(just enough to write a regression test). Future commits add more patterns
(and, correspondingly, more regression tests).
llvm-svn: 217342
2014-09-08 02:57:58 +08:00
|
|
|
if (MaskedValueIsZero(RHS, Mask, 0, &I))
|
2010-01-05 15:50:36 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
case Instruction::Or:
|
|
|
|
case Instruction::Xor:
|
|
|
|
// If the AndRHS is a power of two minus one (0+1+), and N&Mask == 0
|
2012-12-20 15:09:41 +08:00
|
|
|
if ((Mask->getValue().countLeadingZeros() +
|
2010-01-05 15:50:36 +08:00
|
|
|
Mask->getValue().countPopulation()) == Mask->getValue().getBitWidth()
|
|
|
|
&& ConstantExpr::getAnd(N, Mask)->isNullValue())
|
|
|
|
break;
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (isSub)
|
|
|
|
return Builder->CreateSub(LHSI->getOperand(0), RHS, "fold");
|
|
|
|
return Builder->CreateAdd(LHSI->getOperand(0), RHS, "fold");
|
|
|
|
}
|
|
|
|
|
2010-09-09 06:16:17 +08:00
|
|
|
/// Classification flags for (icmp eq (A & B), C) and (icmp ne (A & B), C).
///
/// One of A and B is considered the mask and the other the value; the
/// "AMask" / "BMask" part of a name says which. Names containing only "Mask"
/// apply when both A and B can be considered masks.
///
/// A qualifies as the mask once it is proven that (A & C) == C. That is
/// trivial if C == A or C == 0, and easy when both A and C are constants.
/// The explanations below assume that A is the mask.
///
/// "AllOnes": the comparison is true only if (A & B) == A, i.e. all bits of
///   A are set in B.
///   Example: (icmp eq (A & 3), 3) -> FoldMskICmp_AMask_AllOnes
/// "AllZeroes": the comparison is true only if (A & B) == 0, i.e. all bits
///   of A are cleared in B.
///   Example: (icmp eq (A & 3), 0) -> FoldMskICmp_Mask_AllZeroes
/// "Mixed": (A & B) == C, where C might or might not contain any number of
///   one bits and zero bits.
///   Example: (icmp eq (A & 3), 1) -> FoldMskICmp_AMask_Mixed
/// "Not": in the descriptions above "==" is replaced by "!=".
///   Example: (icmp ne (A & 3), 3) -> FoldMskICmp_AMask_NotAllOnes
///
/// If the mask A contains a single bit, then the following is equivalent:
///    (icmp eq (A & B), A) equals (icmp ne (A & B), 0)
///    (icmp ne (A & B), A) equals (icmp eq (A & B), 0)
///
/// Every flag occupies its own bit, with each "Not" flag placed one bit above
/// the flag it negates.
enum MaskedICmpType {
  FoldMskICmp_AMask_AllOnes     = 1 << 0,
  FoldMskICmp_AMask_NotAllOnes  = 1 << 1,
  FoldMskICmp_BMask_AllOnes     = 1 << 2,
  FoldMskICmp_BMask_NotAllOnes  = 1 << 3,
  FoldMskICmp_Mask_AllZeroes    = 1 << 4,
  FoldMskICmp_Mask_NotAllZeroes = 1 << 5,
  FoldMskICmp_AMask_Mixed       = 1 << 6,
  FoldMskICmp_AMask_NotMixed    = 1 << 7,
  FoldMskICmp_BMask_Mixed       = 1 << 8,
  FoldMskICmp_BMask_NotMixed    = 1 << 9
};
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// Return the set of pattern classes (from MaskedICmpType)
|
|
|
|
/// that (icmp SCC (A & B), C) satisfies.
|
2012-12-20 15:09:41 +08:00
|
|
|
static unsigned getTypeOfMaskedICmp(Value* A, Value* B, Value* C,
|
2010-09-09 06:16:17 +08:00
|
|
|
ICmpInst::Predicate SCC)
|
|
|
|
{
|
|
|
|
ConstantInt *ACst = dyn_cast<ConstantInt>(A);
|
|
|
|
ConstantInt *BCst = dyn_cast<ConstantInt>(B);
|
|
|
|
ConstantInt *CCst = dyn_cast<ConstantInt>(C);
|
|
|
|
bool icmp_eq = (SCC == ICmpInst::ICMP_EQ);
|
2014-04-25 13:29:35 +08:00
|
|
|
bool icmp_abit = (ACst && !ACst->isZero() &&
|
2010-09-09 06:16:17 +08:00
|
|
|
ACst->getValue().isPowerOf2());
|
2014-04-25 13:29:35 +08:00
|
|
|
bool icmp_bbit = (BCst && !BCst->isZero() &&
|
2010-09-09 06:16:17 +08:00
|
|
|
BCst->getValue().isPowerOf2());
|
|
|
|
unsigned result = 0;
|
2014-04-25 13:29:35 +08:00
|
|
|
if (CCst && CCst->isZero()) {
|
2010-09-09 06:16:17 +08:00
|
|
|
// if C is zero, then both A and B qualify as mask
|
|
|
|
result |= (icmp_eq ? (FoldMskICmp_Mask_AllZeroes |
|
|
|
|
FoldMskICmp_AMask_Mixed |
|
|
|
|
FoldMskICmp_BMask_Mixed)
|
|
|
|
: (FoldMskICmp_Mask_NotAllZeroes |
|
|
|
|
FoldMskICmp_AMask_NotMixed |
|
|
|
|
FoldMskICmp_BMask_NotMixed));
|
|
|
|
if (icmp_abit)
|
|
|
|
result |= (icmp_eq ? (FoldMskICmp_AMask_NotAllOnes |
|
2012-12-20 15:09:41 +08:00
|
|
|
FoldMskICmp_AMask_NotMixed)
|
2010-09-09 06:16:17 +08:00
|
|
|
: (FoldMskICmp_AMask_AllOnes |
|
|
|
|
FoldMskICmp_AMask_Mixed));
|
|
|
|
if (icmp_bbit)
|
|
|
|
result |= (icmp_eq ? (FoldMskICmp_BMask_NotAllOnes |
|
2012-12-20 15:09:41 +08:00
|
|
|
FoldMskICmp_BMask_NotMixed)
|
2010-09-09 06:16:17 +08:00
|
|
|
: (FoldMskICmp_BMask_AllOnes |
|
|
|
|
FoldMskICmp_BMask_Mixed));
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
if (A == C) {
|
|
|
|
result |= (icmp_eq ? (FoldMskICmp_AMask_AllOnes |
|
|
|
|
FoldMskICmp_AMask_Mixed)
|
|
|
|
: (FoldMskICmp_AMask_NotAllOnes |
|
|
|
|
FoldMskICmp_AMask_NotMixed));
|
|
|
|
if (icmp_abit)
|
|
|
|
result |= (icmp_eq ? (FoldMskICmp_Mask_NotAllZeroes |
|
|
|
|
FoldMskICmp_AMask_NotMixed)
|
|
|
|
: (FoldMskICmp_Mask_AllZeroes |
|
|
|
|
FoldMskICmp_AMask_Mixed));
|
2014-04-25 13:29:35 +08:00
|
|
|
} else if (ACst && CCst &&
|
2012-12-20 15:15:54 +08:00
|
|
|
ConstantExpr::getAnd(ACst, CCst) == CCst) {
|
2010-09-09 06:16:17 +08:00
|
|
|
result |= (icmp_eq ? FoldMskICmp_AMask_Mixed
|
|
|
|
: FoldMskICmp_AMask_NotMixed);
|
|
|
|
}
|
2012-12-20 15:15:54 +08:00
|
|
|
if (B == C) {
|
2010-09-09 06:16:17 +08:00
|
|
|
result |= (icmp_eq ? (FoldMskICmp_BMask_AllOnes |
|
|
|
|
FoldMskICmp_BMask_Mixed)
|
|
|
|
: (FoldMskICmp_BMask_NotAllOnes |
|
|
|
|
FoldMskICmp_BMask_NotMixed));
|
|
|
|
if (icmp_bbit)
|
|
|
|
result |= (icmp_eq ? (FoldMskICmp_Mask_NotAllZeroes |
|
2012-12-20 15:09:41 +08:00
|
|
|
FoldMskICmp_BMask_NotMixed)
|
2010-09-09 06:16:17 +08:00
|
|
|
: (FoldMskICmp_Mask_AllZeroes |
|
|
|
|
FoldMskICmp_BMask_Mixed));
|
2014-04-25 13:29:35 +08:00
|
|
|
} else if (BCst && CCst &&
|
2012-12-20 15:15:54 +08:00
|
|
|
ConstantExpr::getAnd(BCst, CCst) == CCst) {
|
2010-09-09 06:16:17 +08:00
|
|
|
result |= (icmp_eq ? FoldMskICmp_BMask_Mixed
|
|
|
|
: FoldMskICmp_BMask_NotMixed);
|
|
|
|
}
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2013-09-04 19:57:13 +08:00
|
|
|
/// Convert an analysis of a masked ICmp into its equivalent if all boolean
|
|
|
|
/// operations had the opposite sense. Since each "NotXXX" flag (recording !=)
|
|
|
|
/// is adjacent to the corresponding normal flag (recording ==), this just
|
|
|
|
/// involves swapping those bits over.
|
|
|
|
static unsigned conjugateICmpMask(unsigned Mask) {
|
|
|
|
unsigned NewMask;
|
|
|
|
NewMask = (Mask & (FoldMskICmp_AMask_AllOnes | FoldMskICmp_BMask_AllOnes |
|
|
|
|
FoldMskICmp_Mask_AllZeroes | FoldMskICmp_AMask_Mixed |
|
|
|
|
FoldMskICmp_BMask_Mixed))
|
|
|
|
<< 1;
|
|
|
|
|
|
|
|
NewMask |=
|
|
|
|
(Mask & (FoldMskICmp_AMask_NotAllOnes | FoldMskICmp_BMask_NotAllOnes |
|
|
|
|
FoldMskICmp_Mask_NotAllZeroes | FoldMskICmp_AMask_NotMixed |
|
|
|
|
FoldMskICmp_BMask_NotMixed))
|
|
|
|
>> 1;
|
|
|
|
|
|
|
|
return NewMask;
|
|
|
|
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// Decompose an icmp into the form ((X & Y) pred Z) if possible.
|
|
|
|
/// The returned predicate is either == or !=. Returns false if
|
2012-01-10 01:23:27 +08:00
|
|
|
/// decomposition fails.
|
|
|
|
static bool decomposeBitTestICmp(const ICmpInst *I, ICmpInst::Predicate &Pred,
|
|
|
|
Value *&X, Value *&Y, Value *&Z) {
|
2014-02-12 05:09:03 +08:00
|
|
|
ConstantInt *C = dyn_cast<ConstantInt>(I->getOperand(1));
|
|
|
|
if (!C)
|
|
|
|
return false;
|
2012-01-10 01:23:27 +08:00
|
|
|
|
2014-02-12 05:09:03 +08:00
|
|
|
switch (I->getPredicate()) {
|
|
|
|
default:
|
|
|
|
return false;
|
|
|
|
case ICmpInst::ICMP_SLT:
|
|
|
|
// X < 0 is equivalent to (X & SignBit) != 0.
|
|
|
|
if (!C->isZero())
|
|
|
|
return false;
|
|
|
|
Y = ConstantInt::get(I->getContext(), APInt::getSignBit(C->getBitWidth()));
|
|
|
|
Pred = ICmpInst::ICMP_NE;
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_SGT:
|
|
|
|
// X > -1 is equivalent to (X & SignBit) == 0.
|
|
|
|
if (!C->isAllOnesValue())
|
|
|
|
return false;
|
|
|
|
Y = ConstantInt::get(I->getContext(), APInt::getSignBit(C->getBitWidth()));
|
|
|
|
Pred = ICmpInst::ICMP_EQ;
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_ULT:
|
|
|
|
// X <u 2^n is equivalent to (X & ~(2^n-1)) == 0.
|
|
|
|
if (!C->getValue().isPowerOf2())
|
|
|
|
return false;
|
|
|
|
Y = ConstantInt::get(I->getContext(), -C->getValue());
|
|
|
|
Pred = ICmpInst::ICMP_EQ;
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_UGT:
|
|
|
|
// X >u 2^n-1 is equivalent to (X & ~(2^n-1)) != 0.
|
|
|
|
if (!(C->getValue() + 1).isPowerOf2())
|
|
|
|
return false;
|
|
|
|
Y = ConstantInt::get(I->getContext(), ~C->getValue());
|
|
|
|
Pred = ICmpInst::ICMP_NE;
|
|
|
|
break;
|
|
|
|
}
|
2012-01-10 01:23:27 +08:00
|
|
|
|
2014-02-12 05:09:03 +08:00
|
|
|
X = I->getOperand(0);
|
|
|
|
Z = ConstantInt::getNullValue(C->getType());
|
|
|
|
return true;
|
2012-01-10 01:23:27 +08:00
|
|
|
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// Handle (icmp(A & B) ==/!= C) &/| (icmp(A & D) ==/!= E)
|
|
|
|
/// Return the set of pattern classes (from MaskedICmpType)
|
|
|
|
/// that both LHS and RHS satisfy.
|
2012-12-20 15:09:41 +08:00
|
|
|
static unsigned foldLogOpOfMaskedICmpsHelper(Value*& A,
|
2010-09-09 06:16:17 +08:00
|
|
|
Value*& B, Value*& C,
|
|
|
|
Value*& D, Value*& E,
|
2012-01-10 01:23:27 +08:00
|
|
|
ICmpInst *LHS, ICmpInst *RHS,
|
|
|
|
ICmpInst::Predicate &LHSCC,
|
|
|
|
ICmpInst::Predicate &RHSCC) {
|
2010-09-09 06:16:17 +08:00
|
|
|
if (LHS->getOperand(0)->getType() != RHS->getOperand(0)->getType()) return 0;
|
|
|
|
// vectors are not (yet?) supported
|
|
|
|
if (LHS->getOperand(0)->getType()->isVectorTy()) return 0;
|
|
|
|
|
|
|
|
// Here comes the tricky part:
|
2012-12-20 15:09:41 +08:00
|
|
|
// LHS might be of the form L11 & L12 == X, X == L21 & L22,
|
2010-09-09 06:16:17 +08:00
|
|
|
// and L11 & L12 == L21 & L22. The same goes for RHS.
|
|
|
|
// Now we must find those components L** and R**, that are equal, so
|
2012-12-20 15:09:41 +08:00
|
|
|
// that we can extract the parameters A, B, C, D, and E for the canonical
|
2010-09-09 06:16:17 +08:00
|
|
|
// above.
|
|
|
|
Value *L1 = LHS->getOperand(0);
|
|
|
|
Value *L2 = LHS->getOperand(1);
|
|
|
|
Value *L11,*L12,*L21,*L22;
|
2012-01-10 01:23:27 +08:00
|
|
|
// Check whether the icmp can be decomposed into a bit test.
|
|
|
|
if (decomposeBitTestICmp(LHS, LHSCC, L11, L12, L2)) {
|
2014-04-25 13:29:35 +08:00
|
|
|
L21 = L22 = L1 = nullptr;
|
2012-01-10 01:23:27 +08:00
|
|
|
} else {
|
|
|
|
// Look for ANDs in the LHS icmp.
|
2013-09-04 19:57:17 +08:00
|
|
|
if (!L1->getType()->isIntegerTy()) {
|
|
|
|
// You can icmp pointers, for example. They really aren't masks.
|
2014-04-25 13:29:35 +08:00
|
|
|
L11 = L12 = nullptr;
|
2013-09-04 19:57:17 +08:00
|
|
|
} else if (!match(L1, m_And(m_Value(L11), m_Value(L12)))) {
|
|
|
|
// Any icmp can be viewed as being trivially masked; if it allows us to
|
|
|
|
// remove one, it's worth it.
|
|
|
|
L11 = L1;
|
|
|
|
L12 = Constant::getAllOnesValue(L1->getType());
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!L2->getType()->isIntegerTy()) {
|
|
|
|
// You can icmp pointers, for example. They really aren't masks.
|
2014-04-25 13:29:35 +08:00
|
|
|
L21 = L22 = nullptr;
|
2013-09-04 19:57:17 +08:00
|
|
|
} else if (!match(L2, m_And(m_Value(L21), m_Value(L22)))) {
|
|
|
|
L21 = L2;
|
|
|
|
L22 = Constant::getAllOnesValue(L2->getType());
|
2012-01-10 01:23:27 +08:00
|
|
|
}
|
2010-09-09 06:16:17 +08:00
|
|
|
}
|
|
|
|
|
2012-01-10 01:23:27 +08:00
|
|
|
// Bail if LHS was a icmp that can't be decomposed into an equality.
|
|
|
|
if (!ICmpInst::isEquality(LHSCC))
|
|
|
|
return 0;
|
|
|
|
|
2010-09-09 06:16:17 +08:00
|
|
|
Value *R1 = RHS->getOperand(0);
|
|
|
|
Value *R2 = RHS->getOperand(1);
|
|
|
|
Value *R11,*R12;
|
|
|
|
bool ok = false;
|
2012-01-10 01:23:27 +08:00
|
|
|
if (decomposeBitTestICmp(RHS, RHSCC, R11, R12, R2)) {
|
|
|
|
if (R11 == L11 || R11 == L12 || R11 == L21 || R11 == L22) {
|
|
|
|
A = R11; D = R12;
|
|
|
|
} else if (R12 == L11 || R12 == L12 || R12 == L21 || R12 == L22) {
|
|
|
|
A = R12; D = R11;
|
|
|
|
} else {
|
|
|
|
return 0;
|
2010-09-09 06:16:17 +08:00
|
|
|
}
|
2014-04-25 13:29:35 +08:00
|
|
|
E = R2; R1 = nullptr; ok = true;
|
2013-09-04 19:57:17 +08:00
|
|
|
} else if (R1->getType()->isIntegerTy()) {
|
|
|
|
if (!match(R1, m_And(m_Value(R11), m_Value(R12)))) {
|
|
|
|
// As before, model no mask as a trivial mask if it'll let us do an
|
2014-08-19 14:41:55 +08:00
|
|
|
// optimization.
|
2013-09-04 19:57:17 +08:00
|
|
|
R11 = R1;
|
|
|
|
R12 = Constant::getAllOnesValue(R1->getType());
|
|
|
|
}
|
|
|
|
|
2012-01-10 01:23:27 +08:00
|
|
|
if (R11 == L11 || R11 == L12 || R11 == L21 || R11 == L22) {
|
|
|
|
A = R11; D = R12; E = R2; ok = true;
|
|
|
|
} else if (R12 == L11 || R12 == L12 || R12 == L21 || R12 == L22) {
|
2010-09-09 06:16:17 +08:00
|
|
|
A = R12; D = R11; E = R2; ok = true;
|
|
|
|
}
|
|
|
|
}
|
2012-01-10 01:23:27 +08:00
|
|
|
|
|
|
|
// Bail if RHS was a icmp that can't be decomposed into an equality.
|
|
|
|
if (!ICmpInst::isEquality(RHSCC))
|
|
|
|
return 0;
|
|
|
|
|
2016-05-10 05:37:43 +08:00
|
|
|
// Look for ANDs on the right side of the RHS icmp.
|
2013-09-04 19:57:17 +08:00
|
|
|
if (!ok && R2->getType()->isIntegerTy()) {
|
|
|
|
if (!match(R2, m_And(m_Value(R11), m_Value(R12)))) {
|
|
|
|
R11 = R2;
|
|
|
|
R12 = Constant::getAllOnesValue(R2->getType());
|
|
|
|
}
|
|
|
|
|
2012-01-10 01:23:27 +08:00
|
|
|
if (R11 == L11 || R11 == L12 || R11 == L21 || R11 == L22) {
|
|
|
|
A = R11; D = R12; E = R1; ok = true;
|
|
|
|
} else if (R12 == L11 || R12 == L12 || R12 == L21 || R12 == L22) {
|
2010-09-09 06:16:17 +08:00
|
|
|
A = R12; D = R11; E = R1; ok = true;
|
2012-01-10 01:23:27 +08:00
|
|
|
} else {
|
2010-09-09 06:16:17 +08:00
|
|
|
return 0;
|
2012-01-10 01:23:27 +08:00
|
|
|
}
|
2010-09-09 06:16:17 +08:00
|
|
|
}
|
|
|
|
if (!ok)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
if (L11 == A) {
|
|
|
|
B = L12; C = L2;
|
2012-12-20 15:15:54 +08:00
|
|
|
} else if (L12 == A) {
|
2010-09-09 06:16:17 +08:00
|
|
|
B = L11; C = L2;
|
2012-12-20 15:15:54 +08:00
|
|
|
} else if (L21 == A) {
|
2010-09-09 06:16:17 +08:00
|
|
|
B = L22; C = L1;
|
2012-12-20 15:15:54 +08:00
|
|
|
} else if (L22 == A) {
|
2010-09-09 06:16:17 +08:00
|
|
|
B = L21; C = L1;
|
|
|
|
}
|
|
|
|
|
2016-01-19 02:28:09 +08:00
|
|
|
unsigned LeftType = getTypeOfMaskedICmp(A, B, C, LHSCC);
|
|
|
|
unsigned RightType = getTypeOfMaskedICmp(A, D, E, RHSCC);
|
|
|
|
return LeftType & RightType;
|
2010-09-09 06:16:17 +08:00
|
|
|
}
|
2015-09-09 02:24:36 +08:00
|
|
|
|
|
|
|
/// Try to fold (icmp(A & B) ==/!= C) &/| (icmp(A & D) ==/!= E)
|
|
|
|
/// into a single (icmp(A & X) ==/!= Y).
|
2014-11-18 17:31:36 +08:00
|
|
|
static Value *foldLogOpOfMaskedICmps(ICmpInst *LHS, ICmpInst *RHS, bool IsAnd,
|
|
|
|
llvm::InstCombiner::BuilderTy *Builder) {
|
2014-04-25 13:29:35 +08:00
|
|
|
Value *A = nullptr, *B = nullptr, *C = nullptr, *D = nullptr, *E = nullptr;
|
2012-01-10 01:23:27 +08:00
|
|
|
ICmpInst::Predicate LHSCC = LHS->getPredicate(), RHSCC = RHS->getPredicate();
|
2016-01-19 02:28:09 +08:00
|
|
|
unsigned Mask = foldLogOpOfMaskedICmpsHelper(A, B, C, D, E, LHS, RHS,
|
2012-01-10 01:23:27 +08:00
|
|
|
LHSCC, RHSCC);
|
2016-01-19 02:28:09 +08:00
|
|
|
if (Mask == 0) return nullptr;
|
2012-01-10 01:23:27 +08:00
|
|
|
assert(ICmpInst::isEquality(LHSCC) && ICmpInst::isEquality(RHSCC) &&
|
|
|
|
"foldLogOpOfMaskedICmpsHelper must return an equality predicate.");
|
2010-09-09 06:16:17 +08:00
|
|
|
|
2013-09-04 19:57:13 +08:00
|
|
|
// In full generality:
|
|
|
|
// (icmp (A & B) Op C) | (icmp (A & D) Op E)
|
|
|
|
// == ![ (icmp (A & B) !Op C) & (icmp (A & D) !Op E) ]
|
|
|
|
//
|
|
|
|
// If the latter can be converted into (icmp (A & X) Op Y) then the former is
|
|
|
|
// equivalent to (icmp (A & X) !Op Y).
|
|
|
|
//
|
|
|
|
// Therefore, we can pretend for the rest of this function that we're dealing
|
|
|
|
// with the conjunction, provided we flip the sense of any comparisons (both
|
|
|
|
// input and output).
|
|
|
|
|
|
|
|
// In most cases we're going to produce an EQ for the "&&" case.
|
2016-01-19 02:28:09 +08:00
|
|
|
ICmpInst::Predicate NewCC = IsAnd ? ICmpInst::ICMP_EQ : ICmpInst::ICMP_NE;
|
2013-09-04 19:57:13 +08:00
|
|
|
if (!IsAnd) {
|
|
|
|
// Convert the masking analysis into its equivalent with negated
|
|
|
|
// comparisons.
|
2016-01-19 02:28:09 +08:00
|
|
|
Mask = conjugateICmpMask(Mask);
|
2013-09-04 19:57:13 +08:00
|
|
|
}
|
2010-09-09 06:16:17 +08:00
|
|
|
|
2016-01-19 02:28:09 +08:00
|
|
|
if (Mask & FoldMskICmp_Mask_AllZeroes) {
|
2012-12-20 15:09:41 +08:00
|
|
|
// (icmp eq (A & B), 0) & (icmp eq (A & D), 0)
|
2010-09-09 06:16:17 +08:00
|
|
|
// -> (icmp eq (A & (B|D)), 0)
|
2016-01-19 02:28:09 +08:00
|
|
|
Value *NewOr = Builder->CreateOr(B, D);
|
|
|
|
Value *NewAnd = Builder->CreateAnd(A, NewOr);
|
|
|
|
// We can't use C as zero because we might actually handle
|
2012-12-20 15:09:41 +08:00
|
|
|
// (icmp ne (A & B), B) & (icmp ne (A & D), D)
|
2016-01-19 02:28:09 +08:00
|
|
|
// with B and D, having a single bit set.
|
|
|
|
Value *Zero = Constant::getNullValue(A->getType());
|
|
|
|
return Builder->CreateICmp(NewCC, NewAnd, Zero);
|
2010-09-09 06:16:17 +08:00
|
|
|
}
|
2016-01-19 02:28:09 +08:00
|
|
|
if (Mask & FoldMskICmp_BMask_AllOnes) {
|
2012-12-20 15:09:41 +08:00
|
|
|
// (icmp eq (A & B), B) & (icmp eq (A & D), D)
|
2010-09-09 06:16:17 +08:00
|
|
|
// -> (icmp eq (A & (B|D)), (B|D))
|
2016-01-19 02:28:09 +08:00
|
|
|
Value *NewOr = Builder->CreateOr(B, D);
|
|
|
|
Value *NewAnd = Builder->CreateAnd(A, NewOr);
|
|
|
|
return Builder->CreateICmp(NewCC, NewAnd, NewOr);
|
2012-12-20 15:09:41 +08:00
|
|
|
}
|
2016-01-19 02:28:09 +08:00
|
|
|
if (Mask & FoldMskICmp_AMask_AllOnes) {
|
2012-12-20 15:09:41 +08:00
|
|
|
// (icmp eq (A & B), A) & (icmp eq (A & D), A)
|
2010-09-09 06:16:17 +08:00
|
|
|
// -> (icmp eq (A & (B&D)), A)
|
2016-01-19 02:28:09 +08:00
|
|
|
Value *NewAnd1 = Builder->CreateAnd(B, D);
|
|
|
|
Value *NewAnd2 = Builder->CreateAnd(A, NewAnd1);
|
|
|
|
return Builder->CreateICmp(NewCC, NewAnd2, A);
|
2010-09-09 06:16:17 +08:00
|
|
|
}
|
2013-09-04 19:57:13 +08:00
|
|
|
|
|
|
|
// Remaining cases assume at least that B and D are constant, and depend on
|
2016-01-19 02:28:09 +08:00
|
|
|
// their actual values. This isn't strictly necessary, just a "handle the
|
2013-09-04 19:57:13 +08:00
|
|
|
// easy cases for now" decision.
|
|
|
|
ConstantInt *BCst = dyn_cast<ConstantInt>(B);
|
2014-04-25 13:29:35 +08:00
|
|
|
if (!BCst) return nullptr;
|
2013-09-04 19:57:13 +08:00
|
|
|
ConstantInt *DCst = dyn_cast<ConstantInt>(D);
|
2014-04-25 13:29:35 +08:00
|
|
|
if (!DCst) return nullptr;
|
2013-09-04 19:57:13 +08:00
|
|
|
|
2016-01-19 02:28:09 +08:00
|
|
|
if (Mask & (FoldMskICmp_Mask_NotAllZeroes | FoldMskICmp_BMask_NotAllOnes)) {
|
2013-09-04 19:57:13 +08:00
|
|
|
// (icmp ne (A & B), 0) & (icmp ne (A & D), 0) and
|
|
|
|
// (icmp ne (A & B), B) & (icmp ne (A & D), D)
|
|
|
|
// -> (icmp ne (A & B), 0) or (icmp ne (A & D), 0)
|
|
|
|
// Only valid if one of the masks is a superset of the other (check "B&D" is
|
|
|
|
// the same as either B or D).
|
|
|
|
APInt NewMask = BCst->getValue() & DCst->getValue();
|
|
|
|
|
|
|
|
if (NewMask == BCst->getValue())
|
|
|
|
return LHS;
|
|
|
|
else if (NewMask == DCst->getValue())
|
|
|
|
return RHS;
|
|
|
|
}
|
2016-01-19 02:28:09 +08:00
|
|
|
if (Mask & FoldMskICmp_AMask_NotAllOnes) {
|
2013-09-04 19:57:13 +08:00
|
|
|
// (icmp ne (A & B), B) & (icmp ne (A & D), D)
|
|
|
|
// -> (icmp ne (A & B), A) or (icmp ne (A & D), A)
|
|
|
|
// Only valid if one of the masks is a superset of the other (check "B|D" is
|
|
|
|
// the same as either B or D).
|
|
|
|
APInt NewMask = BCst->getValue() | DCst->getValue();
|
|
|
|
|
|
|
|
if (NewMask == BCst->getValue())
|
|
|
|
return LHS;
|
|
|
|
else if (NewMask == DCst->getValue())
|
|
|
|
return RHS;
|
|
|
|
}
|
2016-01-19 02:28:09 +08:00
|
|
|
if (Mask & FoldMskICmp_BMask_Mixed) {
|
2012-12-20 15:09:41 +08:00
|
|
|
// (icmp eq (A & B), C) & (icmp eq (A & D), E)
|
2010-09-09 06:16:17 +08:00
|
|
|
// We already know that B & C == C && D & E == E.
|
|
|
|
// If we can prove that (B & D) & (C ^ E) == 0, that is, the bits of
|
|
|
|
// C and E, which are shared by both the mask B and the mask D, don't
|
|
|
|
// contradict, then we can transform to
|
|
|
|
// -> (icmp eq (A & (B|D)), (C|E))
|
|
|
|
// Currently, we only handle the case of B, C, D, and E being constant.
|
2016-01-19 02:28:09 +08:00
|
|
|
// We can't simply use C and E because we might actually handle
|
2012-12-20 15:09:41 +08:00
|
|
|
// (icmp ne (A & B), B) & (icmp eq (A & D), D)
|
2016-01-19 02:28:09 +08:00
|
|
|
// with B and D, having a single bit set.
|
2010-09-09 06:16:17 +08:00
|
|
|
ConstantInt *CCst = dyn_cast<ConstantInt>(C);
|
2014-04-25 13:29:35 +08:00
|
|
|
if (!CCst) return nullptr;
|
2010-09-09 06:16:17 +08:00
|
|
|
ConstantInt *ECst = dyn_cast<ConstantInt>(E);
|
2014-04-25 13:29:35 +08:00
|
|
|
if (!ECst) return nullptr;
|
2016-01-19 02:28:09 +08:00
|
|
|
if (LHSCC != NewCC)
|
2014-11-18 17:31:36 +08:00
|
|
|
CCst = cast<ConstantInt>(ConstantExpr::getXor(BCst, CCst));
|
2016-01-19 02:28:09 +08:00
|
|
|
if (RHSCC != NewCC)
|
2014-11-18 17:31:36 +08:00
|
|
|
ECst = cast<ConstantInt>(ConstantExpr::getXor(DCst, ECst));
|
2016-01-19 02:28:09 +08:00
|
|
|
// If there is a conflict, we should actually return a false for the
|
|
|
|
// whole construct.
|
2014-11-18 17:31:36 +08:00
|
|
|
if (((BCst->getValue() & DCst->getValue()) &
|
|
|
|
(CCst->getValue() ^ ECst->getValue())) != 0)
|
2014-11-18 17:31:41 +08:00
|
|
|
return ConstantInt::get(LHS->getType(), !IsAnd);
|
2016-01-19 02:28:09 +08:00
|
|
|
Value *NewOr1 = Builder->CreateOr(B, D);
|
|
|
|
Value *NewOr2 = ConstantExpr::getOr(CCst, ECst);
|
|
|
|
Value *NewAnd = Builder->CreateAnd(A, NewOr1);
|
|
|
|
return Builder->CreateICmp(NewCC, NewAnd, NewOr2);
|
2010-09-09 06:16:17 +08:00
|
|
|
}
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2010-09-09 06:16:17 +08:00
|
|
|
}
|
|
|
|
|
2014-12-03 18:39:15 +08:00
|
|
|
/// Try to fold a signed range checked with lower bound 0 to an unsigned icmp.
|
|
|
|
/// Example: (icmp sge x, 0) & (icmp slt x, n) --> icmp ult x, n
|
|
|
|
/// If \p Inverted is true then the check is for the inverted range, e.g.
|
|
|
|
/// (icmp slt x, 0) | (icmp sgt x, n) --> icmp ugt x, n
|
|
|
|
Value *InstCombiner::simplifyRangeCheck(ICmpInst *Cmp0, ICmpInst *Cmp1,
|
|
|
|
bool Inverted) {
|
|
|
|
// Check the lower range comparison, e.g. x >= 0
|
|
|
|
// InstCombine already ensured that if there is a constant it's on the RHS.
|
|
|
|
ConstantInt *RangeStart = dyn_cast<ConstantInt>(Cmp0->getOperand(1));
|
|
|
|
if (!RangeStart)
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
ICmpInst::Predicate Pred0 = (Inverted ? Cmp0->getInversePredicate() :
|
|
|
|
Cmp0->getPredicate());
|
|
|
|
|
|
|
|
// Accept x > -1 or x >= 0 (after potentially inverting the predicate).
|
|
|
|
if (!((Pred0 == ICmpInst::ICMP_SGT && RangeStart->isMinusOne()) ||
|
|
|
|
(Pred0 == ICmpInst::ICMP_SGE && RangeStart->isZero())))
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
ICmpInst::Predicate Pred1 = (Inverted ? Cmp1->getInversePredicate() :
|
|
|
|
Cmp1->getPredicate());
|
|
|
|
|
|
|
|
Value *Input = Cmp0->getOperand(0);
|
|
|
|
Value *RangeEnd;
|
|
|
|
if (Cmp1->getOperand(0) == Input) {
|
|
|
|
// For the upper range compare we have: icmp x, n
|
|
|
|
RangeEnd = Cmp1->getOperand(1);
|
|
|
|
} else if (Cmp1->getOperand(1) == Input) {
|
|
|
|
// For the upper range compare we have: icmp n, x
|
|
|
|
RangeEnd = Cmp1->getOperand(0);
|
|
|
|
Pred1 = ICmpInst::getSwappedPredicate(Pred1);
|
|
|
|
} else {
|
|
|
|
return nullptr;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Check the upper range comparison, e.g. x < n
|
|
|
|
ICmpInst::Predicate NewPred;
|
|
|
|
switch (Pred1) {
|
|
|
|
case ICmpInst::ICMP_SLT: NewPred = ICmpInst::ICMP_ULT; break;
|
|
|
|
case ICmpInst::ICMP_SLE: NewPred = ICmpInst::ICMP_ULE; break;
|
|
|
|
default: return nullptr;
|
|
|
|
}
|
|
|
|
|
|
|
|
// This simplification is only valid if the upper range is not negative.
|
|
|
|
bool IsNegative, IsNotNegative;
|
2014-12-26 17:10:14 +08:00
|
|
|
ComputeSignBit(RangeEnd, IsNotNegative, IsNegative, /*Depth=*/0, Cmp1);
|
2014-12-03 18:39:15 +08:00
|
|
|
if (!IsNotNegative)
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
if (Inverted)
|
|
|
|
NewPred = ICmpInst::getInversePredicate(NewPred);
|
|
|
|
|
|
|
|
return Builder->CreateICmp(NewPred, Input, RangeEnd);
|
|
|
|
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// Fold (icmp)&(icmp) if possible.
|
2010-03-05 16:46:26 +08:00
|
|
|
Value *InstCombiner::FoldAndOfICmps(ICmpInst *LHS, ICmpInst *RHS) {
|
2010-01-05 15:50:36 +08:00
|
|
|
ICmpInst::Predicate LHSCC = LHS->getPredicate(), RHSCC = RHS->getPredicate();
|
|
|
|
|
|
|
|
// (icmp1 A, B) & (icmp2 A, B) --> (icmp3 A, B)
|
|
|
|
if (PredicatesFoldable(LHSCC, RHSCC)) {
|
|
|
|
if (LHS->getOperand(0) == RHS->getOperand(1) &&
|
|
|
|
LHS->getOperand(1) == RHS->getOperand(0))
|
|
|
|
LHS->swapOperands();
|
|
|
|
if (LHS->getOperand(0) == RHS->getOperand(0) &&
|
|
|
|
LHS->getOperand(1) == RHS->getOperand(1)) {
|
|
|
|
Value *Op0 = LHS->getOperand(0), *Op1 = LHS->getOperand(1);
|
|
|
|
unsigned Code = getICmpCode(LHS) & getICmpCode(RHS);
|
|
|
|
bool isSigned = LHS->isSigned() || RHS->isSigned();
|
2011-12-17 09:20:32 +08:00
|
|
|
return getNewICmpValue(isSigned, Code, Op0, Op1, Builder);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
}
|
2010-09-09 06:16:17 +08:00
|
|
|
|
2011-02-10 13:17:27 +08:00
|
|
|
// handle (roughly): (icmp eq (A & B), C) & (icmp eq (A & D), E)
|
2013-09-04 19:57:13 +08:00
|
|
|
if (Value *V = foldLogOpOfMaskedICmps(LHS, RHS, true, Builder))
|
2011-02-10 13:17:27 +08:00
|
|
|
return V;
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2014-12-03 18:39:15 +08:00
|
|
|
// E.g. (icmp sge x, 0) & (icmp slt x, n) --> icmp ult x, n
|
|
|
|
if (Value *V = simplifyRangeCheck(LHS, RHS, /*Inverted=*/false))
|
|
|
|
return V;
|
|
|
|
|
|
|
|
// E.g. (icmp slt x, n) & (icmp sge x, 0) --> icmp ult x, n
|
|
|
|
if (Value *V = simplifyRangeCheck(RHS, LHS, /*Inverted=*/false))
|
|
|
|
return V;
|
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// This only handles icmp of constants: (icmp1 A, C1) & (icmp2 B, C2).
|
|
|
|
Value *Val = LHS->getOperand(0), *Val2 = RHS->getOperand(0);
|
|
|
|
ConstantInt *LHSCst = dyn_cast<ConstantInt>(LHS->getOperand(1));
|
|
|
|
ConstantInt *RHSCst = dyn_cast<ConstantInt>(RHS->getOperand(1));
|
2014-04-25 13:29:35 +08:00
|
|
|
if (!LHSCst || !RHSCst) return nullptr;
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (LHSCst == RHSCst && LHSCC == RHSCC) {
|
|
|
|
// (icmp ult A, C) & (icmp ult B, C) --> (icmp ult (A|B), C)
|
2016-01-19 03:17:58 +08:00
|
|
|
// where C is a power of 2 or
|
2010-01-05 15:50:36 +08:00
|
|
|
// (icmp eq A, 0) & (icmp eq B, 0) --> (icmp eq (A|B), 0)
|
2016-01-19 03:17:58 +08:00
|
|
|
if ((LHSCC == ICmpInst::ICMP_ULT && LHSCst->getValue().isPowerOf2()) ||
|
|
|
|
(LHSCC == ICmpInst::ICMP_EQ && LHSCst->isZero())) {
|
2010-01-05 15:50:36 +08:00
|
|
|
Value *NewOr = Builder->CreateOr(Val, Val2);
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateICmp(LHSCC, NewOr, LHSCst);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
}
|
2011-04-29 00:58:40 +08:00
|
|
|
|
2011-04-29 04:09:57 +08:00
|
|
|
// (trunc x) == C1 & (and x, CA) == C2 -> (and x, CA|CMAX) == C1|C2
|
2011-04-29 00:58:40 +08:00
|
|
|
// where CMAX is the all ones value for the truncated type,
|
2012-09-27 18:14:43 +08:00
|
|
|
// iff the lower bits of C2 and CA are zero.
|
2012-02-29 09:46:50 +08:00
|
|
|
if (LHSCC == ICmpInst::ICMP_EQ && LHSCC == RHSCC &&
|
2011-04-29 00:58:40 +08:00
|
|
|
LHS->hasOneUse() && RHS->hasOneUse()) {
|
|
|
|
Value *V;
|
2014-04-25 13:29:35 +08:00
|
|
|
ConstantInt *AndCst, *SmallCst = nullptr, *BigCst = nullptr;
|
2011-04-29 00:58:40 +08:00
|
|
|
|
|
|
|
// (trunc x) == C1 & (and x, CA) == C2
|
2012-12-20 15:15:54 +08:00
|
|
|
// (and x, CA) == C2 & (trunc x) == C1
|
2011-04-29 00:58:40 +08:00
|
|
|
if (match(Val2, m_Trunc(m_Value(V))) &&
|
|
|
|
match(Val, m_And(m_Specific(V), m_ConstantInt(AndCst)))) {
|
|
|
|
SmallCst = RHSCst;
|
|
|
|
BigCst = LHSCst;
|
2012-12-20 15:15:54 +08:00
|
|
|
} else if (match(Val, m_Trunc(m_Value(V))) &&
|
|
|
|
match(Val2, m_And(m_Specific(V), m_ConstantInt(AndCst)))) {
|
2011-04-29 00:58:40 +08:00
|
|
|
SmallCst = LHSCst;
|
|
|
|
BigCst = RHSCst;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (SmallCst && BigCst) {
|
|
|
|
unsigned BigBitSize = BigCst->getType()->getBitWidth();
|
|
|
|
unsigned SmallBitSize = SmallCst->getType()->getBitWidth();
|
|
|
|
|
|
|
|
// Check that the low bits are zero.
|
|
|
|
APInt Low = APInt::getLowBitsSet(BigBitSize, SmallBitSize);
|
2011-04-29 05:38:51 +08:00
|
|
|
if ((Low & AndCst->getValue()) == 0 && (Low & BigCst->getValue()) == 0) {
|
2011-04-29 00:58:40 +08:00
|
|
|
Value *NewAnd = Builder->CreateAnd(V, Low | AndCst->getValue());
|
|
|
|
APInt N = SmallCst->getValue().zext(BigBitSize) | BigCst->getValue();
|
|
|
|
Value *NewVal = ConstantInt::get(AndCst->getType()->getContext(), N);
|
|
|
|
return Builder->CreateICmp(LHSCC, NewAnd, NewVal);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2012-01-09 02:32:24 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// From here on, we only handle:
|
|
|
|
// (icmp1 A, C1) & (icmp2 A, C2) --> something simpler.
|
2014-04-25 13:29:35 +08:00
|
|
|
if (Val != Val2) return nullptr;
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// ICMP_[US][GL]E X, CST is folded to ICMP_[US][GL]T elsewhere.
|
|
|
|
if (LHSCC == ICmpInst::ICMP_UGE || LHSCC == ICmpInst::ICMP_ULE ||
|
|
|
|
RHSCC == ICmpInst::ICMP_UGE || RHSCC == ICmpInst::ICMP_ULE ||
|
|
|
|
LHSCC == ICmpInst::ICMP_SGE || LHSCC == ICmpInst::ICMP_SLE ||
|
|
|
|
RHSCC == ICmpInst::ICMP_SGE || RHSCC == ICmpInst::ICMP_SLE)
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2011-03-01 23:05:01 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// We can't fold (ugt x, C) & (sgt x, C2).
|
|
|
|
if (!PredicatesFoldable(LHSCC, RHSCC))
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// Ensure that the larger constant is on the RHS.
|
|
|
|
bool ShouldSwap;
|
|
|
|
if (CmpInst::isSigned(LHSCC) ||
|
2012-12-20 15:09:41 +08:00
|
|
|
(ICmpInst::isEquality(LHSCC) &&
|
2010-01-05 15:50:36 +08:00
|
|
|
CmpInst::isSigned(RHSCC)))
|
|
|
|
ShouldSwap = LHSCst->getValue().sgt(RHSCst->getValue());
|
|
|
|
else
|
|
|
|
ShouldSwap = LHSCst->getValue().ugt(RHSCst->getValue());
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (ShouldSwap) {
|
|
|
|
std::swap(LHS, RHS);
|
|
|
|
std::swap(LHSCst, RHSCst);
|
|
|
|
std::swap(LHSCC, RHSCC);
|
|
|
|
}
|
|
|
|
|
2010-02-11 00:03:48 +08:00
|
|
|
// At this point, we know we have two icmp instructions
|
2010-01-05 15:50:36 +08:00
|
|
|
// comparing a value against two constants and and'ing the result
|
|
|
|
// together. Because of the above check, we know that we only have
|
2012-12-20 15:09:41 +08:00
|
|
|
// icmp eq, icmp ne, icmp [su]lt, and icmp [SU]gt here. We also know
|
|
|
|
// (from the icmp folding check above), that the two constants
|
2010-01-05 15:50:36 +08:00
|
|
|
// are not equal and that the larger constant is on the RHS
|
|
|
|
assert(LHSCst != RHSCst && "Compares not folded above?");
|
|
|
|
|
|
|
|
switch (LHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_EQ:
|
|
|
|
switch (RHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_NE: // (X == 13 & X != 15) -> X == 13
|
|
|
|
case ICmpInst::ICMP_ULT: // (X == 13 & X < 15) -> X == 13
|
|
|
|
case ICmpInst::ICMP_SLT: // (X == 13 & X < 15) -> X == 13
|
2010-03-05 16:46:26 +08:00
|
|
|
return LHS;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
case ICmpInst::ICMP_NE:
|
|
|
|
switch (RHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_ULT:
|
|
|
|
if (LHSCst == SubOne(RHSCst)) // (X != 13 & X u< 14) -> X < 13
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateICmpULT(Val, LHSCst);
|
2014-10-12 22:02:34 +08:00
|
|
|
if (LHSCst->isNullValue()) // (X != 0 & X u< 14) -> X-1 u< 13
|
|
|
|
return InsertRangeTest(Val, AddOne(LHSCst), RHSCst, false, true);
|
2010-01-05 15:50:36 +08:00
|
|
|
break; // (X != 13 & X u< 15) -> no change
|
|
|
|
case ICmpInst::ICMP_SLT:
|
|
|
|
if (LHSCst == SubOne(RHSCst)) // (X != 13 & X s< 14) -> X < 13
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateICmpSLT(Val, LHSCst);
|
2010-01-05 15:50:36 +08:00
|
|
|
break; // (X != 13 & X s< 15) -> no change
|
|
|
|
case ICmpInst::ICMP_EQ: // (X != 13 & X == 15) -> X == 15
|
|
|
|
case ICmpInst::ICMP_UGT: // (X != 13 & X u> 15) -> X u> 15
|
|
|
|
case ICmpInst::ICMP_SGT: // (X != 13 & X s> 15) -> X s> 15
|
2010-03-05 16:46:26 +08:00
|
|
|
return RHS;
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_NE:
|
2013-08-16 08:15:20 +08:00
|
|
|
// Special case to get the ordering right when the values wrap around
|
|
|
|
// zero.
|
2013-08-17 01:03:36 +08:00
|
|
|
if (LHSCst->getValue() == 0 && RHSCst->getValue().isAllOnesValue())
|
2013-08-16 08:15:20 +08:00
|
|
|
std::swap(LHSCst, RHSCst);
|
2010-01-05 15:50:36 +08:00
|
|
|
if (LHSCst == SubOne(RHSCst)){// (X != 13 & X != 14) -> X-13 >u 1
|
|
|
|
Constant *AddCST = ConstantExpr::getNeg(LHSCst);
|
|
|
|
Value *Add = Builder->CreateAdd(Val, AddCST, Val->getName()+".off");
|
2013-08-16 08:15:20 +08:00
|
|
|
return Builder->CreateICmpUGT(Add, ConstantInt::get(Add->getType(), 1),
|
|
|
|
Val->getName()+".cmp");
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
break; // (X != 13 & X != 15) -> no change
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_ULT:
|
|
|
|
switch (RHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_EQ: // (X u< 13 & X == 15) -> false
|
|
|
|
case ICmpInst::ICMP_UGT: // (X u< 13 & X u> 15) -> false
|
2010-03-05 16:46:26 +08:00
|
|
|
return ConstantInt::get(CmpInst::makeCmpResultType(LHS->getType()), 0);
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_SGT: // (X u< 13 & X s> 15) -> no change
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_NE: // (X u< 13 & X != 15) -> X u< 13
|
|
|
|
case ICmpInst::ICMP_ULT: // (X u< 13 & X u< 15) -> X u< 13
|
2010-03-05 16:46:26 +08:00
|
|
|
return LHS;
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_SLT: // (X u< 13 & X s< 15) -> no change
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_SLT:
|
|
|
|
switch (RHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_UGT: // (X s< 13 & X u> 15) -> no change
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_NE: // (X s< 13 & X != 15) -> X < 13
|
|
|
|
case ICmpInst::ICMP_SLT: // (X s< 13 & X s< 15) -> X < 13
|
2010-03-05 16:46:26 +08:00
|
|
|
return LHS;
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_ULT: // (X s< 13 & X u< 15) -> no change
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_UGT:
|
|
|
|
switch (RHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_EQ: // (X u> 13 & X == 15) -> X == 15
|
|
|
|
case ICmpInst::ICMP_UGT: // (X u> 13 & X u> 15) -> X u> 15
|
2010-03-05 16:46:26 +08:00
|
|
|
return RHS;
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_SGT: // (X u> 13 & X s> 15) -> no change
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_NE:
|
|
|
|
if (RHSCst == AddOne(LHSCst)) // (X u> 13 & X != 14) -> X u> 14
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateICmp(LHSCC, Val, RHSCst);
|
2010-01-05 15:50:36 +08:00
|
|
|
break; // (X u> 13 & X != 15) -> no change
|
|
|
|
case ICmpInst::ICMP_ULT: // (X u> 13 & X u< 15) -> (X-14) <u 1
|
2010-03-05 16:46:26 +08:00
|
|
|
return InsertRangeTest(Val, AddOne(LHSCst), RHSCst, false, true);
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_SLT: // (X u> 13 & X s< 15) -> no change
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_SGT:
|
|
|
|
switch (RHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_EQ: // (X s> 13 & X == 15) -> X == 15
|
|
|
|
case ICmpInst::ICMP_SGT: // (X s> 13 & X s> 15) -> X s> 15
|
2010-03-05 16:46:26 +08:00
|
|
|
return RHS;
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_UGT: // (X s> 13 & X u> 15) -> no change
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_NE:
|
|
|
|
if (RHSCst == AddOne(LHSCst)) // (X s> 13 & X != 14) -> X s> 14
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateICmp(LHSCC, Val, RHSCst);
|
2010-01-05 15:50:36 +08:00
|
|
|
break; // (X s> 13 & X != 15) -> no change
|
|
|
|
case ICmpInst::ICMP_SLT: // (X s> 13 & X s< 15) -> (X-14) s< 1
|
2010-03-05 16:46:26 +08:00
|
|
|
return InsertRangeTest(Val, AddOne(LHSCst), RHSCst, true, true);
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_ULT: // (X s> 13 & X u< 15) -> no change
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// Optimize (fcmp)&(fcmp). NOTE: Unlike the rest of instcombine, this returns
|
|
|
|
/// a Value which should already be inserted into the function.
|
2010-03-05 16:46:26 +08:00
|
|
|
Value *InstCombiner::FoldAndOfFCmps(FCmpInst *LHS, FCmpInst *RHS) {
|
[InstCombine] Simplify and correct folding fcmps with the same children
Summary: Take advantage of FCmpInst::Predicate's bit pattern and handle (fcmp *, x, y) | (fcmp *, x, y) and (fcmp *, x, y) & (fcmp *, x, y) more consistently. Also fold more FCmpInst::FCMP_FALSE and FCmpInst::FCMP_TRUE to constants.
Currently InstCombine wrongly folds (fcmp ogt, x, y) | (fcmp ord, x, y) to (fcmp ogt, x, y); this patch also fixes that.
Reviewers: spatel
Subscribers: llvm-commits, iteratee, echristo
Differential Revision: http://reviews.llvm.org/D21775
llvm-svn: 274156
2016-06-30 04:10:17 +08:00
|
|
|
Value *Op0LHS = LHS->getOperand(0), *Op0RHS = LHS->getOperand(1);
|
|
|
|
Value *Op1LHS = RHS->getOperand(0), *Op1RHS = RHS->getOperand(1);
|
|
|
|
FCmpInst::Predicate Op0CC = LHS->getPredicate(), Op1CC = RHS->getPredicate();
|
|
|
|
|
|
|
|
if (Op0LHS == Op1RHS && Op0RHS == Op1LHS) {
|
|
|
|
// Swap RHS operands to match LHS.
|
|
|
|
Op1CC = FCmpInst::getSwappedPredicate(Op1CC);
|
|
|
|
std::swap(Op1LHS, Op1RHS);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Simplify (fcmp cc0 x, y) & (fcmp cc1 x, y).
|
|
|
|
// Suppose the relation between x and y is R, where R is one of
|
|
|
|
// U(1000), L(0100), G(0010) or E(0001), and CC0 and CC1 are the bitmasks for
|
|
|
|
// testing the desired relations.
|
|
|
|
//
|
|
|
|
// Since (R & CC0) and (R & CC1) are either R or 0, we actually have this:
|
|
|
|
// bool(R & CC0) && bool(R & CC1)
|
|
|
|
// = bool((R & CC0) & (R & CC1))
|
|
|
|
// = bool(R & (CC0 & CC1)) <= by re-association, commutation, and idempotency
|
|
|
|
if (Op0LHS == Op1LHS && Op0RHS == Op1RHS)
|
|
|
|
return getFCmpValue(getFCmpCode(Op0CC) & getFCmpCode(Op1CC), Op0LHS, Op0RHS,
|
|
|
|
Builder);
|
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (LHS->getPredicate() == FCmpInst::FCMP_ORD &&
|
|
|
|
RHS->getPredicate() == FCmpInst::FCMP_ORD) {
|
2013-04-13 05:56:23 +08:00
|
|
|
if (LHS->getOperand(0)->getType() != RHS->getOperand(0)->getType())
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2013-04-13 05:56:23 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// (fcmp ord x, c) & (fcmp ord y, c) -> (fcmp ord x, y)
|
|
|
|
if (ConstantFP *LHSC = dyn_cast<ConstantFP>(LHS->getOperand(1)))
|
|
|
|
if (ConstantFP *RHSC = dyn_cast<ConstantFP>(RHS->getOperand(1))) {
|
|
|
|
// If either of the constants are nans, then the whole thing returns
|
|
|
|
// false.
|
|
|
|
if (LHSC->getValueAPF().isNaN() || RHSC->getValueAPF().isNaN())
|
2013-06-06 08:37:23 +08:00
|
|
|
return Builder->getFalse();
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateFCmpORD(LHS->getOperand(0), RHS->getOperand(0));
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// Handle vector zeros. This occurs because the canonical form of
|
|
|
|
// "fcmp ord x,x" is "fcmp ord x, 0".
|
|
|
|
if (isa<ConstantAggregateZero>(LHS->getOperand(1)) &&
|
|
|
|
isa<ConstantAggregateZero>(RHS->getOperand(1)))
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateFCmpORD(LHS->getOperand(0), RHS->getOperand(0));
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2015-09-09 04:14:13 +08:00
|
|
|
/// Match De Morgan's Laws:
|
|
|
|
/// (~A & ~B) == (~(A | B))
|
|
|
|
/// (~A | ~B) == (~(A & B))
|
|
|
|
static Instruction *matchDeMorgansLaws(BinaryOperator &I,
|
|
|
|
InstCombiner::BuilderTy *Builder) {
|
|
|
|
auto Opcode = I.getOpcode();
|
|
|
|
assert((Opcode == Instruction::And || Opcode == Instruction::Or) &&
|
|
|
|
"Trying to match De Morgan's Laws with something other than and/or");
|
[InstCombine] match De Morgan's Law hidden by zext ops (PR22723)
This is a fix for PR22723:
https://llvm.org/bugs/show_bug.cgi?id=22723
My first attempt at this was to change what I thought was the root problem:
xor (zext i1 X to i32), 1 --> zext (xor i1 X, true) to i32
...but we create the opposite pattern in InstCombiner::visitZExt(), so infinite loop!
My next idea was to fix the matchIfNot() implementation in PatternMatch, but that would
mean potentially returning a different size for the match than what was input. I think
this would require all users of m_Not to check the size of the returned match, so I
abandoned that idea.
I settled on just fixing the exact case presented in the PR. This patch does allow the
2 functions in PR22723 to compile identically (x86):
bool test(bool x, bool y) { return !x | !y; }
bool test(bool x, bool y) { return !x || !y; }
...
andb %sil, %dil
xorb $1, %dil
movb %dil, %al
retq
Differential Revision: http://reviews.llvm.org/D12705
llvm-svn: 248634
2015-09-26 07:21:38 +08:00
|
|
|
// Flip the logic operation.
|
|
|
|
if (Opcode == Instruction::And)
|
|
|
|
Opcode = Instruction::Or;
|
|
|
|
else
|
|
|
|
Opcode = Instruction::And;
|
2015-09-09 04:14:13 +08:00
|
|
|
|
|
|
|
Value *Op0 = I.getOperand(0);
|
|
|
|
Value *Op1 = I.getOperand(1);
|
|
|
|
// TODO: Use pattern matchers instead of dyn_cast.
|
|
|
|
if (Value *Op0NotVal = dyn_castNotVal(Op0))
|
|
|
|
if (Value *Op1NotVal = dyn_castNotVal(Op1))
|
|
|
|
if (Op0->hasOneUse() && Op1->hasOneUse()) {
|
|
|
|
Value *LogicOp = Builder->CreateBinOp(Opcode, Op0NotVal, Op1NotVal,
|
|
|
|
I.getName() + ".demorgan");
|
|
|
|
return BinaryOperator::CreateNot(LogicOp);
|
|
|
|
}
|
|
|
|
|
[InstCombine] match De Morgan's Law hidden by zext ops (PR22723)
This is a fix for PR22723:
https://llvm.org/bugs/show_bug.cgi?id=22723
My first attempt at this was to change what I thought was the root problem:
xor (zext i1 X to i32), 1 --> zext (xor i1 X, true) to i32
...but we create the opposite pattern in InstCombiner::visitZExt(), so infinite loop!
My next idea was to fix the matchIfNot() implementation in PatternMatch, but that would
mean potentially returning a different size for the match than what was input. I think
this would require all users of m_Not to check the size of the returned match, so I
abandoned that idea.
I settled on just fixing the exact case presented in the PR. This patch does allow the
2 functions in PR22723 to compile identically (x86):
bool test(bool x, bool y) { return !x | !y; }
bool test(bool x, bool y) { return !x || !y; }
...
andb %sil, %dil
xorb $1, %dil
movb %dil, %al
retq
Differential Revision: http://reviews.llvm.org/D12705
llvm-svn: 248634
2015-09-26 07:21:38 +08:00
|
|
|
// De Morgan's Law in disguise:
|
|
|
|
// (zext(bool A) ^ 1) & (zext(bool B) ^ 1) -> zext(~(A | B))
|
|
|
|
// (zext(bool A) ^ 1) | (zext(bool B) ^ 1) -> zext(~(A & B))
|
|
|
|
Value *A = nullptr;
|
|
|
|
Value *B = nullptr;
|
|
|
|
ConstantInt *C1 = nullptr;
|
|
|
|
if (match(Op0, m_OneUse(m_Xor(m_ZExt(m_Value(A)), m_ConstantInt(C1)))) &&
|
|
|
|
match(Op1, m_OneUse(m_Xor(m_ZExt(m_Value(B)), m_Specific(C1))))) {
|
|
|
|
// TODO: This check could be loosened to handle different type sizes.
|
|
|
|
// Alternatively, we could fix the definition of m_Not to recognize a not
|
|
|
|
// operation hidden by a zext?
|
|
|
|
if (A->getType()->isIntegerTy(1) && B->getType()->isIntegerTy(1) &&
|
|
|
|
C1->isOne()) {
|
|
|
|
Value *LogicOp = Builder->CreateBinOp(Opcode, A, B,
|
|
|
|
I.getName() + ".demorgan");
|
|
|
|
Value *Not = Builder->CreateNot(LogicOp);
|
|
|
|
return CastInst::CreateZExtOrBitCast(Not, I.getType());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-09-09 04:14:13 +08:00
|
|
|
return nullptr;
|
|
|
|
}
|
|
|
|
|
2016-02-24 00:36:07 +08:00
|
|
|
/// Attempt to fold a bitwise logic instruction ('and', 'or' or 'xor') whose
/// operands are casts by doing the logic in the casts' source type:
///   logic (bitcast X), C     --> bitcast (logic X, (bitcast C))
///   logic (cast A), (cast B) --> cast (logic A, B)
/// For 'and'/'or' of two casted icmps or two casted fcmps, the compare-folding
/// helpers are tried as well.
///
/// \param I the logic instruction; its opcode is asserted to be and/or/xor.
/// \returns the replacement instruction, or nullptr if no fold applies.
Instruction *InstCombiner::foldCastedBitwiseLogic(BinaryOperator &I) {
  const auto Opc = I.getOpcode();
  assert((Opc == Instruction::And || Opc == Instruction::Or ||
          Opc == Instruction::Xor) &&
         "Unexpected opcode for bitwise logic folding");

  Value *LogicLHS = I.getOperand(0);
  Value *LogicRHS = I.getOperand(1);

  auto *LHSCast = dyn_cast<CastInst>(LogicLHS);
  if (!LHSCast)
    return nullptr;

  // The cast must come from an integer or integer vector type; otherwise the
  // logic operation cannot be expressed in the source type.
  Type *ResultTy = I.getType();
  Type *CastSrcTy = LHSCast->getSrcTy();
  if (!CastSrcTy->isIntOrIntVectorTy())
    return nullptr;

  // Bitcast on the left and a constant on the right: hoist the logic op ahead
  // of the bitcast so it runs in the original type. This can eliminate useless
  // bitcasts and unblock combines the bitcast would otherwise impede.
  // Canonicalization ensures that a constant operand, if any, is the second
  // operand.
  Value *BitCastSrc = nullptr;
  Constant *ConstRHS = nullptr;
  if (match(LogicLHS, m_BitCast(m_Value(BitCastSrc))) &&
      match(LogicRHS, m_Constant(ConstRHS))) {
    // A bitcast of a constant will be removed.
    Value *SrcTyConst = Builder->CreateBitCast(ConstRHS, CastSrcTy);
    Value *SrcTyLogic =
        Builder->CreateBinOp(Opc, BitCastSrc, SrcTyConst, I.getName());
    return CastInst::CreateBitOrPointerCast(SrcTyLogic, ResultTy);
  }

  auto *RHSCast = dyn_cast<CastInst>(LogicRHS);
  if (!RHSCast)
    return nullptr;

  // From here on both operands are casts; they must be the same kind of cast
  // from the same source type.
  const auto CastOpc = LHSCast->getOpcode();
  if (CastOpc != RHSCast->getOpcode() || CastSrcTy != RHSCast->getSrcTy())
    return nullptr;

  Value *LHSSrc = LHSCast->getOperand(0);
  Value *RHSSrc = RHSCast->getOperand(0);

  // fold (logic (cast A), (cast B)) -> (cast (logic A, B))
  // Only do this if the casts both really cause code to be generated. The
  // icmp/icmp pairing is left to the compare-specific folding below.
  const bool BothSrcsAreICmps = isa<ICmpInst>(LHSSrc) && isa<ICmpInst>(RHSSrc);
  if (!BothSrcsAreICmps && ShouldOptimizeCast(CastOpc, LHSSrc, ResultTy) &&
      ShouldOptimizeCast(CastOpc, RHSSrc, ResultTy)) {
    Value *SrcTyLogic = Builder->CreateBinOp(Opc, LHSSrc, RHSSrc, I.getName());
    return CastInst::Create(CastOpc, SrcTyLogic, ResultTy);
  }

  // For now, only 'and'/'or' have optimizations after this.
  if (Opc == Instruction::Xor)
    return nullptr;

  const bool IsAnd = Opc == Instruction::And;

  // If this is logic(cast(icmp), cast(icmp)), try to fold this even if the
  // cast is otherwise not optimizable. This happens for vector sexts.
  auto *LHSICmp = dyn_cast<ICmpInst>(LHSSrc);
  auto *RHSICmp = dyn_cast<ICmpInst>(RHSSrc);
  if (LHSICmp && RHSICmp) {
    Value *Folded;
    if (IsAnd)
      Folded = FoldAndOfICmps(LHSICmp, RHSICmp);
    else
      Folded = FoldOrOfICmps(LHSICmp, RHSICmp, &I);
    return Folded ? CastInst::Create(CastOpc, Folded, ResultTy) : nullptr;
  }

  // If this is logic(cast(fcmp), cast(fcmp)), try to fold this even if the
  // cast is otherwise not optimizable. This happens for vector sexts.
  auto *LHSFCmp = dyn_cast<FCmpInst>(LHSSrc);
  auto *RHSFCmp = dyn_cast<FCmpInst>(RHSSrc);
  if (LHSFCmp && RHSFCmp) {
    Value *Folded;
    if (IsAnd)
      Folded = FoldAndOfFCmps(LHSFCmp, RHSFCmp);
    else
      Folded = FoldOrOfFCmps(LHSFCmp, RHSFCmp);
    return Folded ? CastInst::Create(CastOpc, Folded, ResultTy) : nullptr;
  }

  return nullptr;
}
|
|
|
|
|
2016-05-28 05:41:29 +08:00
|
|
|
/// Fold an 'and' that masks a value with a sign-extended boolean into a
/// select:
///   (and (sext bool to A), B)  --> (select bool, B, 0)
///   (and ~(sext bool to A), B) --> (select bool, 0, B)
/// "bool" means i1 or a vector of i1. Either operand of \p I may be the mask.
///
/// \param I the instruction whose two operands are inspected.
/// \returns the new select (not yet inserted), or nullptr if neither operand
///          is a (possibly inverted) sign-extended boolean.
static Instruction *foldBoolSextMaskToSelect(BinaryOperator &I) {
  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);

  // Try the fold with Mask as the sext'ed boolean and Other as the value that
  // is being masked.
  auto FoldWithMask = [](Value *Mask, Value *Other) -> Instruction * {
    Value *X = nullptr;

    // Fold (and (sext bool to A), B) --> (select bool, B, 0)
    if (match(Mask, m_SExt(m_Value(X))) &&
        X->getType()->getScalarType()->isIntegerTy(1)) {
      Value *Zero = Constant::getNullValue(Other->getType());
      return SelectInst::Create(X, Other, Zero);
    }

    // Fold (and ~(sext bool to A), B) --> (select bool, 0, B)
    if (match(Mask, m_Not(m_SExt(m_Value(X)))) &&
        X->getType()->getScalarType()->isIntegerTy(1)) {
      Value *Zero = Constant::getNullValue(Other->getType());
      return SelectInst::Create(X, Zero, Other);
    }

    return nullptr;
  };

  // Previously the operands were swapped whenever Op1 was *any* sext or not,
  // even one that cannot fold (sext of a non-bool, not of a non-sext). That
  // moved a foldable mask in Op0 out of position, so e.g.
  // (and (sext bool), (not Y)) was missed while its commuted form folded.
  // Trying Op1 as the mask first keeps every result the swap used to produce;
  // falling back to Op0 picks up the missed cases.
  if (Instruction *Sel = FoldWithMask(Op1, Op0))
    return Sel;
  return FoldWithMask(Op0, Op1);
}
|
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
Instruction *InstCombiner::visitAnd(BinaryOperator &I) {
|
2010-11-13 23:10:37 +08:00
|
|
|
bool Changed = SimplifyAssociativeOrCommutative(I);
|
2010-01-05 15:50:36 +08:00
|
|
|
Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
|
|
|
|
|
2014-05-11 16:46:12 +08:00
|
|
|
if (Value *V = SimplifyVectorOp(I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, V);
|
2014-05-11 16:46:12 +08:00
|
|
|
|
2015-01-04 20:03:27 +08:00
|
|
|
if (Value *V = SimplifyAndInst(Op0, Op1, DL, TLI, DT, AC))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, V);
|
2010-01-05 15:50:36 +08:00
|
|
|
|
2010-12-22 21:36:08 +08:00
|
|
|
// (A|B)&(A|C) -> A|(B&C) etc
|
|
|
|
if (Value *V = SimplifyUsingDistributiveLaws(I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, V);
|
2010-11-23 22:23:47 +08:00
|
|
|
|
2012-12-20 15:09:41 +08:00
|
|
|
// See if we can simplify any instructions used by the instruction whose sole
|
2010-01-05 15:50:36 +08:00
|
|
|
// purpose is to compute bits we don't care about.
|
|
|
|
if (SimplifyDemandedInstructionBits(I))
|
2012-12-20 15:09:41 +08:00
|
|
|
return &I;
|
2010-01-05 15:50:36 +08:00
|
|
|
|
2014-12-04 17:44:01 +08:00
|
|
|
if (Value *V = SimplifyBSwap(I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, V);
|
2014-12-04 17:44:01 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (ConstantInt *AndRHS = dyn_cast<ConstantInt>(Op1)) {
|
|
|
|
const APInt &AndRHSMask = AndRHS->getValue();
|
|
|
|
|
|
|
|
// Optimize a variety of ((val OP C1) & C2) combinations...
|
|
|
|
if (BinaryOperator *Op0I = dyn_cast<BinaryOperator>(Op0)) {
|
|
|
|
Value *Op0LHS = Op0I->getOperand(0);
|
|
|
|
Value *Op0RHS = Op0I->getOperand(1);
|
|
|
|
switch (Op0I->getOpcode()) {
|
|
|
|
default: break;
|
|
|
|
case Instruction::Xor:
|
2011-02-10 13:17:27 +08:00
|
|
|
case Instruction::Or: {
|
2010-01-05 15:50:36 +08:00
|
|
|
// If the mask is only needed on one incoming arm, push it up.
|
|
|
|
if (!Op0I->hasOneUse()) break;
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2011-02-10 13:17:27 +08:00
|
|
|
APInt NotAndRHS(~AndRHSMask);
|
Make use of @llvm.assume in ValueTracking (computeKnownBits, etc.)
This change, which allows @llvm.assume to be used from within computeKnownBits
(and other associated functions in ValueTracking), adds some (optional)
parameters to computeKnownBits and friends. These functions now (optionally)
take a "context" instruction pointer, an AssumptionTracker pointer, and also a
DomTree pointer, and most of the changes are just to pass this new information
when it is easily available from InstSimplify, InstCombine, etc.
As explained below, the significant conceptual change is that known properties
of a value might depend on the control-flow location of the use (because we
care that the @llvm.assume dominates the use because assumptions have
control-flow dependencies). This means that, when we ask if bits are known in a
value, we might get different answers for different uses.
The significant changes are all in ValueTracking. Two main changes: First, as
with the rest of the code, new parameters need to be passed around. To make
this easier, I grouped them into a structure, and I made internal static
versions of the relevant functions that take this structure as a parameter. The
new code does as you might expect, it looks for @llvm.assume calls that make
use of the value we're trying to learn something about (often indirectly),
attempts to pattern match that expression, and uses the result if successful.
By making use of the AssumptionTracker, the process of finding @llvm.assume
calls is not expensive.
Part of the structure being passed around inside ValueTracking is a set of
already-considered @llvm.assume calls. This is to prevent a query using, for
example, the assume(a == b), to recurse on itself. The context and DT params
are used to find applicable assumptions. An assumption needs to dominate the
context instruction, or come after it deterministically. In this latter case we
only handle the specific case where both the assumption and the context
instruction are in the same block, and we need to exclude assumptions from
being used to simplify their own ephemeral values (those which contribute only
to the assumption) because otherwise the assumption would prove its feeding
comparison trivial and would be removed.
This commit adds the plumbing and the logic for a simple masked-bit propagation
(just enough to write a regression test). Future commits add more patterns
(and, correspondingly, more regression tests).
llvm-svn: 217342
2014-09-08 02:57:58 +08:00
|
|
|
if (MaskedValueIsZero(Op0LHS, NotAndRHS, 0, &I)) {
|
2010-01-05 15:50:36 +08:00
|
|
|
// Not masking anything out for the LHS, move to RHS.
|
|
|
|
Value *NewRHS = Builder->CreateAnd(Op0RHS, AndRHS,
|
|
|
|
Op0RHS->getName()+".masked");
|
|
|
|
return BinaryOperator::Create(Op0I->getOpcode(), Op0LHS, NewRHS);
|
|
|
|
}
|
|
|
|
if (!isa<Constant>(Op0RHS) &&
|
Make use of @llvm.assume in ValueTracking (computeKnownBits, etc.)
This change, which allows @llvm.assume to be used from within computeKnownBits
(and other associated functions in ValueTracking), adds some (optional)
parameters to computeKnownBits and friends. These functions now (optionally)
take a "context" instruction pointer, an AssumptionTracker pointer, and also a
DomTree pointer, and most of the changes are just to pass this new information
when it is easily available from InstSimplify, InstCombine, etc.
As explained below, the significant conceptual change is that known properties
of a value might depend on the control-flow location of the use (because we
care that the @llvm.assume dominates the use because assumptions have
control-flow dependencies). This means that, when we ask if bits are known in a
value, we might get different answers for different uses.
The significant changes are all in ValueTracking. Two main changes: First, as
with the rest of the code, new parameters need to be passed around. To make
this easier, I grouped them into a structure, and I made internal static
versions of the relevant functions that take this structure as a parameter. The
new code does as you might expect, it looks for @llvm.assume calls that make
use of the value we're trying to learn something about (often indirectly),
attempts to pattern match that expression, and uses the result if successful.
By making use of the AssumptionTracker, the process of finding @llvm.assume
calls is not expensive.
Part of the structure being passed around inside ValueTracking is a set of
already-considered @llvm.assume calls. This is to prevent a query using, for
example, the assume(a == b), to recurse on itself. The context and DT params
are used to find applicable assumptions. An assumption needs to dominate the
context instruction, or come after it deterministically. In this latter case we
only handle the specific case where both the assumption and the context
instruction are in the same block, and we need to exclude assumptions from
being used to simplify their own ephemeral values (those which contribute only
to the assumption) because otherwise the assumption would prove its feeding
comparison trivial and would be removed.
This commit adds the plumbing and the logic for a simple masked-bit propagation
(just enough to write a regression test). Future commits add more patterns
(and, correspondingly, more regression tests).
llvm-svn: 217342
2014-09-08 02:57:58 +08:00
|
|
|
MaskedValueIsZero(Op0RHS, NotAndRHS, 0, &I)) {
|
2010-01-05 15:50:36 +08:00
|
|
|
// Not masking anything out for the RHS, move to LHS.
|
|
|
|
Value *NewLHS = Builder->CreateAnd(Op0LHS, AndRHS,
|
|
|
|
Op0LHS->getName()+".masked");
|
|
|
|
return BinaryOperator::Create(Op0I->getOpcode(), NewLHS, Op0RHS);
|
|
|
|
}
|
|
|
|
|
|
|
|
break;
|
2011-02-10 13:17:27 +08:00
|
|
|
}
|
2010-01-05 15:50:36 +08:00
|
|
|
case Instruction::Add:
|
2012-09-27 18:14:43 +08:00
|
|
|
// ((A & N) + B) & AndRHS -> (A + B) & AndRHS iff N&AndRHS == AndRHS.
|
|
|
|
// ((A | N) + B) & AndRHS -> (A + B) & AndRHS iff N&AndRHS == 0
|
|
|
|
// ((A ^ N) + B) & AndRHS -> (A + B) & AndRHS iff N&AndRHS == 0
|
2010-01-05 15:50:36 +08:00
|
|
|
if (Value *V = FoldLogicalPlusAnd(Op0LHS, Op0RHS, AndRHS, false, I))
|
|
|
|
return BinaryOperator::CreateAnd(V, AndRHS);
|
|
|
|
if (Value *V = FoldLogicalPlusAnd(Op0RHS, Op0LHS, AndRHS, false, I))
|
|
|
|
return BinaryOperator::CreateAnd(V, AndRHS); // Add commutes
|
|
|
|
break;
|
|
|
|
|
|
|
|
case Instruction::Sub:
|
2012-09-27 18:14:43 +08:00
|
|
|
// ((A & N) - B) & AndRHS -> (A - B) & AndRHS iff N&AndRHS == AndRHS.
|
|
|
|
// ((A | N) - B) & AndRHS -> (A - B) & AndRHS iff N&AndRHS == 0
|
|
|
|
// ((A ^ N) - B) & AndRHS -> (A - B) & AndRHS iff N&AndRHS == 0
|
2010-01-05 15:50:36 +08:00
|
|
|
if (Value *V = FoldLogicalPlusAnd(Op0LHS, Op0RHS, AndRHS, true, I))
|
|
|
|
return BinaryOperator::CreateAnd(V, AndRHS);
|
2015-08-20 23:35:00 +08:00
|
|
|
|
|
|
|
// -x & 1 -> x & 1
|
|
|
|
if (AndRHSMask == 1 && match(Op0LHS, m_Zero()))
|
|
|
|
return BinaryOperator::CreateAnd(Op0RHS, AndRHS);
|
2010-01-05 15:50:36 +08:00
|
|
|
|
2012-09-27 18:14:43 +08:00
|
|
|
// (A - N) & AndRHS -> -N & AndRHS iff A&AndRHS==0 and AndRHS
|
2010-01-05 15:50:36 +08:00
|
|
|
// has 1's for all bits that the subtraction with A might affect.
|
2011-02-10 13:17:27 +08:00
|
|
|
if (Op0I->hasOneUse() && !match(Op0LHS, m_Zero())) {
|
2010-01-05 15:50:36 +08:00
|
|
|
uint32_t BitWidth = AndRHSMask.getBitWidth();
|
|
|
|
uint32_t Zeros = AndRHSMask.countLeadingZeros();
|
|
|
|
APInt Mask = APInt::getLowBitsSet(BitWidth, BitWidth - Zeros);
|
|
|
|
|
Make use of @llvm.assume in ValueTracking (computeKnownBits, etc.)
This change, which allows @llvm.assume to be used from within computeKnownBits
(and other associated functions in ValueTracking), adds some (optional)
parameters to computeKnownBits and friends. These functions now (optionally)
take a "context" instruction pointer, an AssumptionTracker pointer, and also a
DomTree pointer, and most of the changes are just to pass this new information
when it is easily available from InstSimplify, InstCombine, etc.
As explained below, the significant conceptual change is that known properties
of a value might depend on the control-flow location of the use (because we
care that the @llvm.assume dominates the use because assumptions have
control-flow dependencies). This means that, when we ask if bits are known in a
value, we might get different answers for different uses.
The significant changes are all in ValueTracking. Two main changes: First, as
with the rest of the code, new parameters need to be passed around. To make
this easier, I grouped them into a structure, and I made internal static
versions of the relevant functions that take this structure as a parameter. The
new code does as you might expect, it looks for @llvm.assume calls that make
use of the value we're trying to learn something about (often indirectly),
attempts to pattern match that expression, and uses the result if successful.
By making use of the AssumptionTracker, the process of finding @llvm.assume
calls is not expensive.
Part of the structure being passed around inside ValueTracking is a set of
already-considered @llvm.assume calls. This is to prevent a query using, for
example, the assume(a == b), to recurse on itself. The context and DT params
are used to find applicable assumptions. An assumption needs to dominate the
context instruction, or come after it deterministically. In this latter case we
only handle the specific case where both the assumption and the context
instruction are in the same block, and we need to exclude assumptions from
being used to simplify their own ephemeral values (those which contribute only
to the assumption) because otherwise the assumption would prove its feeding
comparison trivial and would be removed.
This commit adds the plumbing and the logic for a simple masked-bit propagation
(just enough to write a regression test). Future commits add more patterns
(and, correspondingly, more regression tests).
llvm-svn: 217342
2014-09-08 02:57:58 +08:00
|
|
|
if (MaskedValueIsZero(Op0LHS, Mask, 0, &I)) {
|
2010-01-05 15:50:36 +08:00
|
|
|
Value *NewNeg = Builder->CreateNeg(Op0RHS);
|
|
|
|
return BinaryOperator::CreateAnd(NewNeg, AndRHS);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case Instruction::Shl:
|
|
|
|
case Instruction::LShr:
|
|
|
|
// (1 << x) & 1 --> zext(x == 0)
|
|
|
|
// (1 >> x) & 1 --> zext(x == 0)
|
|
|
|
if (AndRHSMask == 1 && Op0LHS == AndRHS) {
|
|
|
|
Value *NewICmp =
|
|
|
|
Builder->CreateICmpEQ(Op0RHS, Constant::getNullValue(I.getType()));
|
|
|
|
return new ZExtInst(NewICmp, I.getType());
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (ConstantInt *Op0CI = dyn_cast<ConstantInt>(Op0I->getOperand(1)))
|
|
|
|
if (Instruction *Res = OptAndOp(Op0I, Op0CI, AndRHS, I))
|
|
|
|
return Res;
|
2011-02-10 13:17:27 +08:00
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2011-02-10 13:17:27 +08:00
|
|
|
// If this is an integer truncation, and if the source is an 'and' with
|
|
|
|
// immediate, transform it. This frequently occurs for bitfield accesses.
|
|
|
|
{
|
2014-04-25 13:29:35 +08:00
|
|
|
Value *X = nullptr; ConstantInt *YC = nullptr;
|
2011-02-10 13:17:27 +08:00
|
|
|
if (match(Op0, m_Trunc(m_And(m_Value(X), m_ConstantInt(YC))))) {
|
|
|
|
// Change: and (trunc (and X, YC) to T), C2
|
|
|
|
// into : and (trunc X to T), trunc(YC) & C2
|
2012-12-20 15:09:41 +08:00
|
|
|
// This will fold the two constants together, which may allow
|
2011-02-10 13:17:27 +08:00
|
|
|
// other simplifications.
|
|
|
|
Value *NewCast = Builder->CreateTrunc(X, I.getType(), "and.shrunk");
|
|
|
|
Constant *C3 = ConstantExpr::getTrunc(YC, I.getType());
|
|
|
|
C3 = ConstantExpr::getAnd(C3, AndRHS);
|
|
|
|
return BinaryOperator::CreateAnd(NewCast, C3);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Try to fold constant and into select arguments.
|
|
|
|
if (SelectInst *SI = dyn_cast<SelectInst>(Op0))
|
|
|
|
if (Instruction *R = FoldOpIntoSelect(I, SI))
|
|
|
|
return R;
|
|
|
|
if (isa<PHINode>(Op0))
|
|
|
|
if (Instruction *NV = FoldOpIntoPhi(I))
|
|
|
|
return NV;
|
|
|
|
}
|
|
|
|
|
2015-09-09 04:14:13 +08:00
|
|
|
if (Instruction *DeMorgan = matchDeMorgansLaws(I, Builder))
|
|
|
|
return DeMorgan;
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
{
|
2014-04-25 13:29:35 +08:00
|
|
|
Value *A = nullptr, *B = nullptr, *C = nullptr, *D = nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
// (A|B) & ~(A&B) -> A^B
|
|
|
|
if (match(Op0, m_Or(m_Value(A), m_Value(B))) &&
|
|
|
|
match(Op1, m_Not(m_And(m_Value(C), m_Value(D)))) &&
|
|
|
|
((A == C && B == D) || (A == D && B == C)))
|
|
|
|
return BinaryOperator::CreateXor(A, B);
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// ~(A&B) & (A|B) -> A^B
|
|
|
|
if (match(Op1, m_Or(m_Value(A), m_Value(B))) &&
|
|
|
|
match(Op0, m_Not(m_And(m_Value(C), m_Value(D)))) &&
|
|
|
|
((A == C && B == D) || (A == D && B == C)))
|
|
|
|
return BinaryOperator::CreateXor(A, B);
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2011-09-20 05:58:15 +08:00
|
|
|
// A&(A^B) => A & ~B
|
|
|
|
{
|
|
|
|
Value *tmpOp0 = Op0;
|
|
|
|
Value *tmpOp1 = Op1;
|
2016-01-19 02:36:38 +08:00
|
|
|
if (match(Op0, m_OneUse(m_Xor(m_Value(A), m_Value(B))))) {
|
2011-09-20 05:58:15 +08:00
|
|
|
if (A == Op1 || B == Op1 ) {
|
|
|
|
tmpOp1 = Op0;
|
|
|
|
tmpOp0 = Op1;
|
|
|
|
// Simplify below
|
|
|
|
}
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2016-01-19 02:36:38 +08:00
|
|
|
if (match(tmpOp1, m_OneUse(m_Xor(m_Value(A), m_Value(B))))) {
|
2011-09-20 05:58:15 +08:00
|
|
|
if (B == tmpOp0) {
|
|
|
|
std::swap(A, B);
|
|
|
|
}
|
2016-01-19 01:50:23 +08:00
|
|
|
// Notice that the pattern (A&(~B)) is actually (A&(-1^B)), so if
|
2011-09-20 05:58:15 +08:00
|
|
|
// A is originally -1 (or a vector of -1 and undefs), then we enter
|
|
|
|
// an endless loop. By checking that A is non-constant we ensure that
|
|
|
|
// we will never get to the loop.
|
|
|
|
if (A == tmpOp0 && !isa<Constant>(A)) // A&(A^B) -> A & ~B
|
2011-09-28 04:39:19 +08:00
|
|
|
return BinaryOperator::CreateAnd(A, Builder->CreateNot(B));
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// (A&((~A)|B)) -> A&B
|
|
|
|
if (match(Op0, m_Or(m_Not(m_Specific(Op1)), m_Value(A))) ||
|
|
|
|
match(Op0, m_Or(m_Value(A), m_Not(m_Specific(Op1)))))
|
|
|
|
return BinaryOperator::CreateAnd(A, Op1);
|
|
|
|
if (match(Op1, m_Or(m_Not(m_Specific(Op0)), m_Value(A))) ||
|
|
|
|
match(Op1, m_Or(m_Value(A), m_Not(m_Specific(Op0)))))
|
|
|
|
return BinaryOperator::CreateAnd(A, Op0);
|
InstCombine: Simplify (A ^ B) or/and (A ^ B ^ C)
While we can already transform A | (A ^ B) into A | B, things get bad
once we have (A ^ B) | (A ^ B ^ Cst) because reassociation will morph
this into (A ^ B) | ((A ^ Cst) ^ B). Our existing patterns fail once
this happens.
To fix this, we add a new pattern which looks through the tree of xor
binary operators to see that, in fact, there exists a redundant xor
operation.
What follows below is a correctness proof of the transform using CVC3.
$ cat t.cvc
A, B, C : BITVECTOR(64);
QUERY BVXOR(A, B) | BVXOR(BVXOR(B, C), A) = BVXOR(A, B) | C;
QUERY BVXOR(BVXOR(A, C), B) | BVXOR(A, B) = BVXOR(A, B) | C;
QUERY BVXOR(A, B) & BVXOR(BVXOR(B, C), A) = BVXOR(A, B) & ~C;
QUERY BVXOR(BVXOR(A, C), B) & BVXOR(A, B) = BVXOR(A, B) & ~C;
$ cvc3 < t.cvc
Valid.
Valid.
Valid.
Valid.
llvm-svn: 214342
2014-07-31 05:26:37 +08:00
|
|
|
|
|
|
|
// (A ^ B) & ((B ^ C) ^ A) -> (A ^ B) & ~C
|
|
|
|
if (match(Op0, m_Xor(m_Value(A), m_Value(B))))
|
|
|
|
if (match(Op1, m_Xor(m_Xor(m_Specific(B), m_Value(C)), m_Specific(A))))
|
|
|
|
if (Op1->hasOneUse() || cast<BinaryOperator>(Op1)->hasOneUse())
|
|
|
|
return BinaryOperator::CreateAnd(Op0, Builder->CreateNot(C));
|
|
|
|
|
|
|
|
// ((A ^ C) ^ B) & (B ^ A) -> (B ^ A) & ~C
|
|
|
|
if (match(Op0, m_Xor(m_Xor(m_Value(A), m_Value(C)), m_Value(B))))
|
|
|
|
if (match(Op1, m_Xor(m_Specific(B), m_Specific(A))))
|
|
|
|
if (Op0->hasOneUse() || cast<BinaryOperator>(Op0)->hasOneUse())
|
|
|
|
return BinaryOperator::CreateAnd(Op1, Builder->CreateNot(C));
|
2014-08-01 12:59:26 +08:00
|
|
|
|
|
|
|
// (A | B) & ((~A) ^ B) -> (A & B)
|
|
|
|
if (match(Op0, m_Or(m_Value(A), m_Value(B))) &&
|
|
|
|
match(Op1, m_Xor(m_Not(m_Specific(A)), m_Specific(B))))
|
|
|
|
return BinaryOperator::CreateAnd(A, B);
|
|
|
|
|
|
|
|
// ((~A) ^ B) & (A | B) -> (A & B)
|
|
|
|
if (match(Op0, m_Xor(m_Not(m_Value(A)), m_Value(B))) &&
|
|
|
|
match(Op1, m_Or(m_Specific(A), m_Specific(B))))
|
|
|
|
return BinaryOperator::CreateAnd(A, B);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2014-08-30 14:18:20 +08:00
|
|
|
{
|
|
|
|
ICmpInst *LHS = dyn_cast<ICmpInst>(Op0);
|
|
|
|
ICmpInst *RHS = dyn_cast<ICmpInst>(Op1);
|
|
|
|
if (LHS && RHS)
|
2010-03-05 16:46:26 +08:00
|
|
|
if (Value *Res = FoldAndOfICmps(LHS, RHS))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, Res);
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2014-08-30 14:18:20 +08:00
|
|
|
// TODO: Make this recursive; it's a little tricky because an arbitrary
|
|
|
|
// number of 'and' instructions might have to be created.
|
|
|
|
Value *X, *Y;
|
|
|
|
if (LHS && match(Op1, m_OneUse(m_And(m_Value(X), m_Value(Y))))) {
|
|
|
|
if (auto *Cmp = dyn_cast<ICmpInst>(X))
|
|
|
|
if (Value *Res = FoldAndOfICmps(LHS, Cmp))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, Builder->CreateAnd(Res, Y));
|
2014-08-30 14:18:20 +08:00
|
|
|
if (auto *Cmp = dyn_cast<ICmpInst>(Y))
|
|
|
|
if (Value *Res = FoldAndOfICmps(LHS, Cmp))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, Builder->CreateAnd(Res, X));
|
2014-08-30 14:18:20 +08:00
|
|
|
}
|
|
|
|
if (RHS && match(Op0, m_OneUse(m_And(m_Value(X), m_Value(Y))))) {
|
|
|
|
if (auto *Cmp = dyn_cast<ICmpInst>(X))
|
|
|
|
if (Value *Res = FoldAndOfICmps(Cmp, RHS))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, Builder->CreateAnd(Res, Y));
|
2014-08-30 14:18:20 +08:00
|
|
|
if (auto *Cmp = dyn_cast<ICmpInst>(Y))
|
|
|
|
if (Value *Res = FoldAndOfICmps(Cmp, RHS))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, Builder->CreateAnd(Res, X));
|
2014-08-30 14:18:20 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2010-02-11 14:26:33 +08:00
|
|
|
// If and'ing two fcmp, try combine them into one.
|
|
|
|
if (FCmpInst *LHS = dyn_cast<FCmpInst>(I.getOperand(0)))
|
|
|
|
if (FCmpInst *RHS = dyn_cast<FCmpInst>(I.getOperand(1)))
|
2010-03-05 16:46:26 +08:00
|
|
|
if (Value *Res = FoldAndOfFCmps(LHS, RHS))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, Res);
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2016-02-24 00:36:07 +08:00
|
|
|
if (Instruction *CastedAnd = foldCastedBitwiseLogic(I))
|
|
|
|
return CastedAnd;
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2016-05-28 05:41:29 +08:00
|
|
|
if (Instruction *Select = foldBoolSextMaskToSelect(I))
|
|
|
|
return Select;
|
2013-01-30 14:35:22 +08:00
|
|
|
|
2014-04-25 13:29:35 +08:00
|
|
|
return Changed ? &I : nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2016-05-26 00:22:14 +08:00
|
|
|
/// Given an OR instruction, check to see if this is a bswap idiom. If so,
|
|
|
|
/// insert the new intrinsic and return it.
|
|
|
|
Instruction *InstCombiner::MatchBSwap(BinaryOperator &I) {
|
2016-05-26 22:58:51 +08:00
|
|
|
Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
|
|
|
|
|
|
|
|
// Look through zero extends.
|
|
|
|
if (Instruction *Ext = dyn_cast<ZExtInst>(Op0))
|
|
|
|
Op0 = Ext->getOperand(0);
|
|
|
|
|
|
|
|
if (Instruction *Ext = dyn_cast<ZExtInst>(Op1))
|
|
|
|
Op1 = Ext->getOperand(0);
|
|
|
|
|
|
|
|
// (A | B) | C and A | (B | C) -> bswap if possible.
|
|
|
|
bool OrOfOrs = match(Op0, m_Or(m_Value(), m_Value())) ||
|
|
|
|
match(Op1, m_Or(m_Value(), m_Value()));
|
|
|
|
|
|
|
|
// (A >> B) | (C << D) and (A << B) | (B >> C) -> bswap if possible.
|
|
|
|
bool OrOfShifts = match(Op0, m_LogicalShift(m_Value(), m_Value())) &&
|
|
|
|
match(Op1, m_LogicalShift(m_Value(), m_Value()));
|
|
|
|
|
|
|
|
// (A & B) | (C & D) -> bswap if possible.
|
|
|
|
bool OrOfAnds = match(Op0, m_And(m_Value(), m_Value())) &&
|
|
|
|
match(Op1, m_And(m_Value(), m_Value()));
|
|
|
|
|
|
|
|
if (!OrOfOrs && !OrOfShifts && !OrOfAnds)
|
|
|
|
return nullptr;
|
|
|
|
|
2016-01-15 17:20:19 +08:00
|
|
|
SmallVector<Instruction*, 4> Insts;
|
2016-05-26 00:22:14 +08:00
|
|
|
if (!recognizeBSwapOrBitReverseIdiom(&I, true, false, Insts))
|
2015-12-11 18:04:51 +08:00
|
|
|
return nullptr;
|
2016-01-15 17:20:19 +08:00
|
|
|
Instruction *LastInst = Insts.pop_back_val();
|
|
|
|
LastInst->removeFromParent();
|
2015-12-15 01:24:23 +08:00
|
|
|
|
2016-01-15 17:20:19 +08:00
|
|
|
for (auto *Inst : Insts)
|
|
|
|
Worklist.Add(Inst);
|
|
|
|
return LastInst;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2016-06-25 02:26:02 +08:00
|
|
|
/// We have an expression of the form (A & C) | (B & D). If A is (Cond?-1:0)
|
|
|
|
/// and B is ~(Cond?-1,0), then simplify this expression to "Cond ? C : D".
|
2016-06-25 02:55:27 +08:00
|
|
|
static Value *matchSelectFromAndOr(Value *A, Value *C, Value *B, Value *D,
|
[InstCombine] look through bitcasts to find selects
There was concern that creating bitcasts for the simpler potential select pattern:
define <2 x i64> @vecBitcastOp1(<4 x i1> %cmp, <2 x i64> %a) {
%a2 = add <2 x i64> %a, %a
%sext = sext <4 x i1> %cmp to <4 x i32>
%bc = bitcast <4 x i32> %sext to <2 x i64>
%and = and <2 x i64> %a2, %bc
ret <2 x i64> %and
}
might lead to worse code for some targets, so this patch is matching the larger
patterns seen in the test cases.
The motivating example for this patch is this IR produced via SSE intrinsics in C:
define <2 x i64> @gibson(<2 x i64> %a, <2 x i64> %b) {
%t0 = bitcast <2 x i64> %a to <4 x i32>
%t1 = bitcast <2 x i64> %b to <4 x i32>
%cmp = icmp sgt <4 x i32> %t0, %t1
%sext = sext <4 x i1> %cmp to <4 x i32>
%t2 = bitcast <4 x i32> %sext to <2 x i64>
%and = and <2 x i64> %t2, %a
%neg = xor <4 x i32> %sext, <i32 -1, i32 -1, i32 -1, i32 -1>
%neg2 = bitcast <4 x i32> %neg to <2 x i64>
%and2 = and <2 x i64> %neg2, %b
%or = or <2 x i64> %and, %and2
ret <2 x i64> %or
}
For an AVX target, this is currently:
vpcmpgtd %xmm1, %xmm0, %xmm2
vpand %xmm0, %xmm2, %xmm0
vpandn %xmm1, %xmm2, %xmm1
vpor %xmm1, %xmm0, %xmm0
retq
With this patch, it becomes:
vpmaxsd %xmm1, %xmm0, %xmm0
Differential Revision: http://reviews.llvm.org/D20774
llvm-svn: 271676
2016-06-03 22:42:07 +08:00
|
|
|
InstCombiner::BuilderTy &Builder) {
|
2016-06-25 02:55:27 +08:00
|
|
|
// The potential condition of the select may be bitcasted. In that case, look
|
|
|
|
// through its bitcast and the corresponding bitcast of the 'not' condition.
|
|
|
|
Type *OrigType = A->getType();
|
|
|
|
Value *SrcA, *SrcB;
|
|
|
|
if (match(A, m_BitCast(m_Value(SrcA))) &&
|
|
|
|
match(B, m_BitCast(m_Value(SrcB)))) {
|
|
|
|
A = SrcA;
|
|
|
|
B = SrcB;
|
[InstCombine] look through bitcasts to find selects
There was concern that creating bitcasts for the simpler potential select pattern:
define <2 x i64> @vecBitcastOp1(<4 x i1> %cmp, <2 x i64> %a) {
%a2 = add <2 x i64> %a, %a
%sext = sext <4 x i1> %cmp to <4 x i32>
%bc = bitcast <4 x i32> %sext to <2 x i64>
%and = and <2 x i64> %a2, %bc
ret <2 x i64> %and
}
might lead to worse code for some targets, so this patch is matching the larger
patterns seen in the test cases.
The motivating example for this patch is this IR produced via SSE intrinsics in C:
define <2 x i64> @gibson(<2 x i64> %a, <2 x i64> %b) {
%t0 = bitcast <2 x i64> %a to <4 x i32>
%t1 = bitcast <2 x i64> %b to <4 x i32>
%cmp = icmp sgt <4 x i32> %t0, %t1
%sext = sext <4 x i1> %cmp to <4 x i32>
%t2 = bitcast <4 x i32> %sext to <2 x i64>
%and = and <2 x i64> %t2, %a
%neg = xor <4 x i32> %sext, <i32 -1, i32 -1, i32 -1, i32 -1>
%neg2 = bitcast <4 x i32> %neg to <2 x i64>
%and2 = and <2 x i64> %neg2, %b
%or = or <2 x i64> %and, %and2
ret <2 x i64> %or
}
For an AVX target, this is currently:
vpcmpgtd %xmm1, %xmm0, %xmm2
vpand %xmm0, %xmm2, %xmm0
vpandn %xmm1, %xmm2, %xmm1
vpor %xmm1, %xmm0, %xmm0
retq
With this patch, it becomes:
vpmaxsd %xmm1, %xmm0, %xmm0
Differential Revision: http://reviews.llvm.org/D20774
llvm-svn: 271676
2016-06-03 22:42:07 +08:00
|
|
|
}
|
|
|
|
|
2016-06-25 02:55:27 +08:00
|
|
|
// The condition must be a value of -1/0, and B must be the 'not' of that
|
|
|
|
// condition.
|
|
|
|
Value *Cond;
|
|
|
|
if (match(A, m_SExt(m_Value(Cond))) &&
|
|
|
|
Cond->getType()->getScalarType()->isIntegerTy(1) &&
|
|
|
|
match(B, m_CombineOr(m_Not(m_SExt(m_Specific(Cond))),
|
|
|
|
m_SExt(m_Not(m_Specific(Cond)))))) {
|
[InstCombine] look through bitcasts to find selects
There was concern that creating bitcasts for the simpler potential select pattern:
define <2 x i64> @vecBitcastOp1(<4 x i1> %cmp, <2 x i64> %a) {
%a2 = add <2 x i64> %a, %a
%sext = sext <4 x i1> %cmp to <4 x i32>
%bc = bitcast <4 x i32> %sext to <2 x i64>
%and = and <2 x i64> %a2, %bc
ret <2 x i64> %and
}
might lead to worse code for some targets, so this patch is matching the larger
patterns seen in the test cases.
The motivating example for this patch is this IR produced via SSE intrinsics in C:
define <2 x i64> @gibson(<2 x i64> %a, <2 x i64> %b) {
%t0 = bitcast <2 x i64> %a to <4 x i32>
%t1 = bitcast <2 x i64> %b to <4 x i32>
%cmp = icmp sgt <4 x i32> %t0, %t1
%sext = sext <4 x i1> %cmp to <4 x i32>
%t2 = bitcast <4 x i32> %sext to <2 x i64>
%and = and <2 x i64> %t2, %a
%neg = xor <4 x i32> %sext, <i32 -1, i32 -1, i32 -1, i32 -1>
%neg2 = bitcast <4 x i32> %neg to <2 x i64>
%and2 = and <2 x i64> %neg2, %b
%or = or <2 x i64> %and, %and2
ret <2 x i64> %or
}
For an AVX target, this is currently:
vpcmpgtd %xmm1, %xmm0, %xmm2
vpand %xmm0, %xmm2, %xmm0
vpandn %xmm1, %xmm2, %xmm1
vpor %xmm1, %xmm0, %xmm0
retq
With this patch, it becomes:
vpmaxsd %xmm1, %xmm0, %xmm0
Differential Revision: http://reviews.llvm.org/D20774
llvm-svn: 271676
2016-06-03 22:42:07 +08:00
|
|
|
// ((bc Cond) & C) | ((bc ~Cond) & D) --> bc (select Cond, (bc C), (bc D))
|
2016-06-25 02:55:27 +08:00
|
|
|
// The bitcasts will either all exist or all not exist. The builder will
|
|
|
|
// not create unnecessary casts if the types already match.
|
|
|
|
Value *BitcastC = Builder.CreateBitCast(C, A->getType());
|
|
|
|
Value *BitcastD = Builder.CreateBitCast(D, A->getType());
|
|
|
|
Value *Select = Builder.CreateSelect(Cond, BitcastC, BitcastD);
|
|
|
|
return Builder.CreateBitCast(Select, OrigType);
|
[InstCombine] look through bitcasts to find selects
There was concern that creating bitcasts for the simpler potential select pattern:
define <2 x i64> @vecBitcastOp1(<4 x i1> %cmp, <2 x i64> %a) {
%a2 = add <2 x i64> %a, %a
%sext = sext <4 x i1> %cmp to <4 x i32>
%bc = bitcast <4 x i32> %sext to <2 x i64>
%and = and <2 x i64> %a2, %bc
ret <2 x i64> %and
}
might lead to worse code for some targets, so this patch is matching the larger
patterns seen in the test cases.
The motivating example for this patch is this IR produced via SSE intrinsics in C:
define <2 x i64> @gibson(<2 x i64> %a, <2 x i64> %b) {
%t0 = bitcast <2 x i64> %a to <4 x i32>
%t1 = bitcast <2 x i64> %b to <4 x i32>
%cmp = icmp sgt <4 x i32> %t0, %t1
%sext = sext <4 x i1> %cmp to <4 x i32>
%t2 = bitcast <4 x i32> %sext to <2 x i64>
%and = and <2 x i64> %t2, %a
%neg = xor <4 x i32> %sext, <i32 -1, i32 -1, i32 -1, i32 -1>
%neg2 = bitcast <4 x i32> %neg to <2 x i64>
%and2 = and <2 x i64> %neg2, %b
%or = or <2 x i64> %and, %and2
ret <2 x i64> %or
}
For an AVX target, this is currently:
vpcmpgtd %xmm1, %xmm0, %xmm2
vpand %xmm0, %xmm2, %xmm0
vpandn %xmm1, %xmm2, %xmm1
vpor %xmm1, %xmm0, %xmm0
retq
With this patch, it becomes:
vpmaxsd %xmm1, %xmm0, %xmm0
Differential Revision: http://reviews.llvm.org/D20774
llvm-svn: 271676
2016-06-03 22:42:07 +08:00
|
|
|
}
|
2016-06-03 02:03:05 +08:00
|
|
|
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// Fold (icmp)|(icmp) if possible.
|
Make use of @llvm.assume in ValueTracking (computeKnownBits, etc.)
This change, which allows @llvm.assume to be used from within computeKnownBits
(and other associated functions in ValueTracking), adds some (optional)
parameters to computeKnownBits and friends. These functions now (optionally)
take a "context" instruction pointer, an AssumptionTracker pointer, and also a
DomTree pointer, and most of the changes are just to pass this new information
when it is easily available from InstSimplify, InstCombine, etc.
As explained below, the significant conceptual change is that known properties
of a value might depend on the control-flow location of the use (because we
care that the @llvm.assume dominates the use because assumptions have
control-flow dependencies). This means that, when we ask if bits are known in a
value, we might get different answers for different uses.
The significant changes are all in ValueTracking. Two main changes: First, as
with the rest of the code, new parameters need to be passed around. To make
this easier, I grouped them into a structure, and I made internal static
versions of the relevant functions that take this structure as a parameter. The
new code does as you might expect, it looks for @llvm.assume calls that make
use of the value we're trying to learn something about (often indirectly),
attempts to pattern match that expression, and uses the result if successful.
By making use of the AssumptionTracker, the process of finding @llvm.assume
calls is not expensive.
Part of the structure being passed around inside ValueTracking is a set of
already-considered @llvm.assume calls. This is to prevent a query using, for
example, the assume(a == b), to recurse on itself. The context and DT params
are used to find applicable assumptions. An assumption needs to dominate the
context instruction, or come after it deterministically. In this latter case we
only handle the specific case where both the assumption and the context
instruction are in the same block, and we need to exclude assumptions from
being used to simplify their own ephemeral values (those which contribute only
to the assumption) because otherwise the assumption would prove its feeding
comparison trivial and would be removed.
This commit adds the plumbing and the logic for a simple masked-bit propagation
(just enough to write a regression test). Future commits add more patterns
(and, correspondingly, more regression tests).
llvm-svn: 217342
2014-09-08 02:57:58 +08:00
|
|
|
Value *InstCombiner::FoldOrOfICmps(ICmpInst *LHS, ICmpInst *RHS,
|
|
|
|
Instruction *CxtI) {
|
2010-01-05 15:50:36 +08:00
|
|
|
ICmpInst::Predicate LHSCC = LHS->getPredicate(), RHSCC = RHS->getPredicate();
|
|
|
|
|
2013-11-13 06:38:59 +08:00
|
|
|
// Fold (iszero(A & K1) | iszero(A & K2)) -> (A & (K1 | K2)) != (K1 | K2)
|
|
|
|
// if K1 and K2 are a one-bit mask.
|
|
|
|
ConstantInt *LHSCst = dyn_cast<ConstantInt>(LHS->getOperand(1));
|
|
|
|
ConstantInt *RHSCst = dyn_cast<ConstantInt>(RHS->getOperand(1));
|
|
|
|
|
|
|
|
if (LHS->getPredicate() == ICmpInst::ICMP_EQ && LHSCst && LHSCst->isZero() &&
|
|
|
|
RHS->getPredicate() == ICmpInst::ICMP_EQ && RHSCst && RHSCst->isZero()) {
|
|
|
|
|
|
|
|
BinaryOperator *LAnd = dyn_cast<BinaryOperator>(LHS->getOperand(0));
|
|
|
|
BinaryOperator *RAnd = dyn_cast<BinaryOperator>(RHS->getOperand(0));
|
|
|
|
if (LAnd && RAnd && LAnd->hasOneUse() && RHS->hasOneUse() &&
|
|
|
|
LAnd->getOpcode() == Instruction::And &&
|
|
|
|
RAnd->getOpcode() == Instruction::And) {
|
|
|
|
|
2014-04-25 13:29:35 +08:00
|
|
|
Value *Mask = nullptr;
|
|
|
|
Value *Masked = nullptr;
|
2013-11-13 06:38:59 +08:00
|
|
|
if (LAnd->getOperand(0) == RAnd->getOperand(0) &&
|
2015-03-10 10:37:25 +08:00
|
|
|
isKnownToBeAPowerOfTwo(LAnd->getOperand(1), DL, false, 0, AC, CxtI,
|
|
|
|
DT) &&
|
|
|
|
isKnownToBeAPowerOfTwo(RAnd->getOperand(1), DL, false, 0, AC, CxtI,
|
|
|
|
DT)) {
|
2013-11-13 06:38:59 +08:00
|
|
|
Mask = Builder->CreateOr(LAnd->getOperand(1), RAnd->getOperand(1));
|
|
|
|
Masked = Builder->CreateAnd(LAnd->getOperand(0), Mask);
|
|
|
|
} else if (LAnd->getOperand(1) == RAnd->getOperand(1) &&
|
2015-03-10 10:37:25 +08:00
|
|
|
isKnownToBeAPowerOfTwo(LAnd->getOperand(0), DL, false, 0, AC,
|
|
|
|
CxtI, DT) &&
|
|
|
|
isKnownToBeAPowerOfTwo(RAnd->getOperand(0), DL, false, 0, AC,
|
|
|
|
CxtI, DT)) {
|
2013-11-13 06:38:59 +08:00
|
|
|
Mask = Builder->CreateOr(LAnd->getOperand(0), RAnd->getOperand(0));
|
|
|
|
Masked = Builder->CreateAnd(LAnd->getOperand(1), Mask);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Masked)
|
|
|
|
return Builder->CreateICmp(ICmpInst::ICMP_NE, Masked, Mask);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-08-21 06:55:40 +08:00
|
|
|
// Fold (icmp ult/ule (A + C1), C3) | (icmp ult/ule (A + C2), C3)
|
|
|
|
// --> (icmp ult/ule ((A & ~(C1 ^ C2)) + max(C1, C2)), C3)
|
|
|
|
// The original condition actually refers to the following two ranges:
|
|
|
|
// [MAX_UINT-C1+1, MAX_UINT-C1+1+C3] and [MAX_UINT-C2+1, MAX_UINT-C2+1+C3]
|
|
|
|
// We can fold these two ranges if:
|
|
|
|
// 1) C1 and C2 are unsigned greater than C3.
|
|
|
|
// 2) The two ranges are separated.
|
|
|
|
// 3) C1 ^ C2 is one-bit mask.
|
|
|
|
// 4) LowRange1 ^ LowRange2 and HighRange1 ^ HighRange2 are one-bit mask.
|
|
|
|
// This implies all values in the two ranges differ by exactly one bit.
|
|
|
|
|
|
|
|
if ((LHSCC == ICmpInst::ICMP_ULT || LHSCC == ICmpInst::ICMP_ULE) &&
|
|
|
|
LHSCC == RHSCC && LHSCst && RHSCst && LHS->hasOneUse() &&
|
|
|
|
RHS->hasOneUse() && LHSCst->getType() == RHSCst->getType() &&
|
|
|
|
LHSCst->getValue() == (RHSCst->getValue())) {
|
|
|
|
|
|
|
|
Value *LAdd = LHS->getOperand(0);
|
|
|
|
Value *RAdd = RHS->getOperand(0);
|
|
|
|
|
|
|
|
Value *LAddOpnd, *RAddOpnd;
|
|
|
|
ConstantInt *LAddCst, *RAddCst;
|
|
|
|
if (match(LAdd, m_Add(m_Value(LAddOpnd), m_ConstantInt(LAddCst))) &&
|
|
|
|
match(RAdd, m_Add(m_Value(RAddOpnd), m_ConstantInt(RAddCst))) &&
|
|
|
|
LAddCst->getValue().ugt(LHSCst->getValue()) &&
|
|
|
|
RAddCst->getValue().ugt(LHSCst->getValue())) {
|
|
|
|
|
|
|
|
APInt DiffCst = LAddCst->getValue() ^ RAddCst->getValue();
|
|
|
|
if (LAddOpnd == RAddOpnd && DiffCst.isPowerOf2()) {
|
|
|
|
ConstantInt *MaxAddCst = nullptr;
|
|
|
|
if (LAddCst->getValue().ult(RAddCst->getValue()))
|
|
|
|
MaxAddCst = RAddCst;
|
|
|
|
else
|
|
|
|
MaxAddCst = LAddCst;
|
|
|
|
|
|
|
|
APInt RRangeLow = -RAddCst->getValue();
|
|
|
|
APInt RRangeHigh = RRangeLow + LHSCst->getValue();
|
|
|
|
APInt LRangeLow = -LAddCst->getValue();
|
|
|
|
APInt LRangeHigh = LRangeLow + LHSCst->getValue();
|
|
|
|
APInt LowRangeDiff = RRangeLow ^ LRangeLow;
|
|
|
|
APInt HighRangeDiff = RRangeHigh ^ LRangeHigh;
|
|
|
|
APInt RangeDiff = LRangeLow.sgt(RRangeLow) ? LRangeLow - RRangeLow
|
|
|
|
: RRangeLow - LRangeLow;
|
|
|
|
|
|
|
|
if (LowRangeDiff.isPowerOf2() && LowRangeDiff == HighRangeDiff &&
|
|
|
|
RangeDiff.ugt(LHSCst->getValue())) {
|
|
|
|
Value *MaskCst = ConstantInt::get(LAddCst->getType(), ~DiffCst);
|
|
|
|
|
|
|
|
Value *NewAnd = Builder->CreateAnd(LAddOpnd, MaskCst);
|
|
|
|
Value *NewAdd = Builder->CreateAdd(NewAnd, MaxAddCst);
|
|
|
|
return (Builder->CreateICmp(LHS->getPredicate(), NewAdd, LHSCst));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// (icmp1 A, B) | (icmp2 A, B) --> (icmp3 A, B)
|
|
|
|
if (PredicatesFoldable(LHSCC, RHSCC)) {
|
|
|
|
if (LHS->getOperand(0) == RHS->getOperand(1) &&
|
|
|
|
LHS->getOperand(1) == RHS->getOperand(0))
|
|
|
|
LHS->swapOperands();
|
|
|
|
if (LHS->getOperand(0) == RHS->getOperand(0) &&
|
|
|
|
LHS->getOperand(1) == RHS->getOperand(1)) {
|
|
|
|
Value *Op0 = LHS->getOperand(0), *Op1 = LHS->getOperand(1);
|
|
|
|
unsigned Code = getICmpCode(LHS) | getICmpCode(RHS);
|
|
|
|
bool isSigned = LHS->isSigned() || RHS->isSigned();
|
2011-12-17 09:20:32 +08:00
|
|
|
return getNewICmpValue(isSigned, Code, Op0, Op1, Builder);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
}
|
2010-12-21 00:21:59 +08:00
|
|
|
|
|
|
|
// handle (roughly):
|
|
|
|
// (icmp ne (A & B), C) | (icmp ne (A & D), E)
|
2013-09-04 19:57:13 +08:00
|
|
|
if (Value *V = foldLogOpOfMaskedICmps(LHS, RHS, false, Builder))
|
2010-12-21 00:21:59 +08:00
|
|
|
return V;
|
2010-09-09 06:16:17 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
Value *Val = LHS->getOperand(0), *Val2 = RHS->getOperand(0);
|
InstCombine: (icmp eq B, 0) | (icmp ult A, B) -> (icmp ule A, B-1)
This transform allows us to turn IR that looks like:
%1 = icmp eq i64 %b, 0
%2 = icmp ult i64 %a, %b
%3 = or i1 %1, %2
ret i1 %3
into:
%0 = add i64 %b, -1
%1 = icmp uge i64 %0, %a
ret i1 %1
which means we go from lowering:
cmpq %rsi, %rdi
setb %cl
testq %rsi, %rsi
sete %al
orb %cl, %al
ret
to lowering:
decq %rsi
cmpq %rdi, %rsi
setae %al
ret
llvm-svn: 185677
2013-07-05 08:31:17 +08:00
|
|
|
if (LHS->hasOneUse() || RHS->hasOneUse()) {
|
|
|
|
// (icmp eq B, 0) | (icmp ult A, B) -> (icmp ule A, B-1)
|
|
|
|
// (icmp eq B, 0) | (icmp ugt B, A) -> (icmp ule A, B-1)
|
2014-04-25 13:29:35 +08:00
|
|
|
Value *A = nullptr, *B = nullptr;
|
InstCombine: (icmp eq B, 0) | (icmp ult A, B) -> (icmp ule A, B-1)
This transform allows us to turn IR that looks like:
%1 = icmp eq i64 %b, 0
%2 = icmp ult i64 %a, %b
%3 = or i1 %1, %2
ret i1 %3
into:
%0 = add i64 %b, -1
%1 = icmp uge i64 %0, %a
ret i1 %1
which means we go from lowering:
cmpq %rsi, %rdi
setb %cl
testq %rsi, %rsi
sete %al
orb %cl, %al
ret
to lowering:
decq %rsi
cmpq %rdi, %rsi
setae %al
ret
llvm-svn: 185677
2013-07-05 08:31:17 +08:00
|
|
|
if (LHSCC == ICmpInst::ICMP_EQ && LHSCst && LHSCst->isZero()) {
|
|
|
|
B = Val;
|
|
|
|
if (RHSCC == ICmpInst::ICMP_ULT && Val == RHS->getOperand(1))
|
|
|
|
A = Val2;
|
|
|
|
else if (RHSCC == ICmpInst::ICMP_UGT && Val == Val2)
|
|
|
|
A = RHS->getOperand(1);
|
|
|
|
}
|
|
|
|
// (icmp ult A, B) | (icmp eq B, 0) -> (icmp ule A, B-1)
|
|
|
|
// (icmp ugt B, A) | (icmp eq B, 0) -> (icmp ule A, B-1)
|
|
|
|
else if (RHSCC == ICmpInst::ICMP_EQ && RHSCst && RHSCst->isZero()) {
|
|
|
|
B = Val2;
|
|
|
|
if (LHSCC == ICmpInst::ICMP_ULT && Val2 == LHS->getOperand(1))
|
|
|
|
A = Val;
|
|
|
|
else if (LHSCC == ICmpInst::ICMP_UGT && Val2 == Val)
|
|
|
|
A = LHS->getOperand(1);
|
|
|
|
}
|
|
|
|
if (A && B)
|
|
|
|
return Builder->CreateICmp(
|
|
|
|
ICmpInst::ICMP_UGE,
|
|
|
|
Builder->CreateAdd(B, ConstantInt::getSigned(B->getType(), -1)), A);
|
|
|
|
}
|
|
|
|
|
2014-12-03 18:39:15 +08:00
|
|
|
// E.g. (icmp slt x, 0) | (icmp sgt x, n) --> icmp ugt x, n
|
|
|
|
if (Value *V = simplifyRangeCheck(LHS, RHS, /*Inverted=*/true))
|
|
|
|
return V;
|
|
|
|
|
|
|
|
// E.g. (icmp sgt x, n) | (icmp slt x, 0) --> icmp ugt x, n
|
|
|
|
if (Value *V = simplifyRangeCheck(RHS, LHS, /*Inverted=*/true))
|
|
|
|
return V;
|
|
|
|
|
InstCombine: (icmp eq B, 0) | (icmp ult A, B) -> (icmp ule A, B-1)
This transform allows us to turn IR that looks like:
%1 = icmp eq i64 %b, 0
%2 = icmp ult i64 %a, %b
%3 = or i1 %1, %2
ret i1 %3
into:
%0 = add i64 %b, -1
%1 = icmp uge i64 %0, %a
ret i1 %1
which means we go from lowering:
cmpq %rsi, %rdi
setb %cl
testq %rsi, %rsi
sete %al
orb %cl, %al
ret
to lowering:
decq %rsi
cmpq %rdi, %rsi
setae %al
ret
llvm-svn: 185677
2013-07-05 08:31:17 +08:00
|
|
|
// This only handles icmp of constants: (icmp1 A, C1) | (icmp2 B, C2).
|
2014-04-25 13:29:35 +08:00
|
|
|
if (!LHSCst || !RHSCst) return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
|
2010-08-02 17:32:13 +08:00
|
|
|
if (LHSCst == RHSCst && LHSCC == RHSCC) {
|
|
|
|
// (icmp ne A, 0) | (icmp ne B, 0) --> (icmp ne (A|B), 0)
|
|
|
|
if (LHSCC == ICmpInst::ICMP_NE && LHSCst->isZero()) {
|
|
|
|
Value *NewOr = Builder->CreateOr(Val, Val2);
|
|
|
|
return Builder->CreateICmp(LHSCC, NewOr, LHSCst);
|
|
|
|
}
|
2012-01-09 02:32:24 +08:00
|
|
|
}
|
|
|
|
|
2010-12-21 04:00:31 +08:00
|
|
|
// (icmp ult (X + CA), C1) | (icmp eq X, C2) -> (icmp ule (X + CA), C1)
|
2012-09-27 18:14:43 +08:00
|
|
|
// iff C2 + CA == C1.
|
2010-12-21 04:00:31 +08:00
|
|
|
if (LHSCC == ICmpInst::ICMP_ULT && RHSCC == ICmpInst::ICMP_EQ) {
|
2010-12-21 00:18:51 +08:00
|
|
|
ConstantInt *AddCst;
|
|
|
|
if (match(Val, m_Add(m_Specific(Val2), m_ConstantInt(AddCst))))
|
|
|
|
if (RHSCst->getValue() + AddCst->getValue() == LHSCst->getValue())
|
2010-12-21 04:00:31 +08:00
|
|
|
return Builder->CreateICmpULE(Val, LHSCst);
|
2010-12-21 00:18:51 +08:00
|
|
|
}
|
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// From here on, we only handle:
|
|
|
|
// (icmp1 A, C1) | (icmp2 A, C2) --> something simpler.
|
2014-04-25 13:29:35 +08:00
|
|
|
if (Val != Val2) return nullptr;
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// ICMP_[US][GL]E X, CST is folded to ICMP_[US][GL]T elsewhere.
|
|
|
|
if (LHSCC == ICmpInst::ICMP_UGE || LHSCC == ICmpInst::ICMP_ULE ||
|
|
|
|
RHSCC == ICmpInst::ICMP_UGE || RHSCC == ICmpInst::ICMP_ULE ||
|
|
|
|
LHSCC == ICmpInst::ICMP_SGE || LHSCC == ICmpInst::ICMP_SLE ||
|
|
|
|
RHSCC == ICmpInst::ICMP_SGE || RHSCC == ICmpInst::ICMP_SLE)
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// We can't fold (ugt x, C) | (sgt x, C2).
|
|
|
|
if (!PredicatesFoldable(LHSCC, RHSCC))
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// Ensure that the larger constant is on the RHS.
|
|
|
|
bool ShouldSwap;
|
|
|
|
if (CmpInst::isSigned(LHSCC) ||
|
2012-12-20 15:09:41 +08:00
|
|
|
(ICmpInst::isEquality(LHSCC) &&
|
2010-01-05 15:50:36 +08:00
|
|
|
CmpInst::isSigned(RHSCC)))
|
|
|
|
ShouldSwap = LHSCst->getValue().sgt(RHSCst->getValue());
|
|
|
|
else
|
|
|
|
ShouldSwap = LHSCst->getValue().ugt(RHSCst->getValue());
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (ShouldSwap) {
|
|
|
|
std::swap(LHS, RHS);
|
|
|
|
std::swap(LHSCst, RHSCst);
|
|
|
|
std::swap(LHSCC, RHSCC);
|
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-02-11 00:03:48 +08:00
|
|
|
// At this point, we know we have two icmp instructions
|
2010-01-05 15:50:36 +08:00
|
|
|
// comparing a value against two constants and or'ing the result
|
|
|
|
// together. Because of the above check, we know that we only have
|
|
|
|
// ICMP_EQ, ICMP_NE, ICMP_LT, and ICMP_GT here. We also know (from the
|
|
|
|
// icmp folding check above), that the two constants are not
|
|
|
|
// equal.
|
|
|
|
assert(LHSCst != RHSCst && "Compares not folded above?");
|
|
|
|
|
|
|
|
switch (LHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_EQ:
|
|
|
|
switch (RHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_EQ:
|
2012-12-31 08:34:55 +08:00
|
|
|
if (LHS->getOperand(0) == RHS->getOperand(0)) {
|
2012-12-31 09:40:44 +08:00
|
|
|
// if LHSCst and RHSCst differ only by one bit:
|
2015-12-03 00:15:07 +08:00
|
|
|
// (A == C1 || A == C2) -> (A | (C1 ^ C2)) == C2
|
2013-01-01 02:26:42 +08:00
|
|
|
assert(LHSCst->getValue().ule(LHSCst->getValue()));
|
|
|
|
|
2012-12-31 08:34:55 +08:00
|
|
|
APInt Xor = LHSCst->getValue() ^ RHSCst->getValue();
|
|
|
|
if (Xor.isPowerOf2()) {
|
2015-12-03 00:15:07 +08:00
|
|
|
Value *Cst = Builder->getInt(Xor);
|
|
|
|
Value *Or = Builder->CreateOr(LHS->getOperand(0), Cst);
|
|
|
|
return Builder->CreateICmp(ICmpInst::ICMP_EQ, Or, RHSCst);
|
2012-12-31 08:34:55 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-04-15 05:15:43 +08:00
|
|
|
if (LHSCst == SubOne(RHSCst)) {
|
|
|
|
// (X == 13 | X == 14) -> X-13 <u 2
|
|
|
|
Constant *AddCST = ConstantExpr::getNeg(LHSCst);
|
|
|
|
Value *Add = Builder->CreateAdd(Val, AddCST, Val->getName()+".off");
|
|
|
|
AddCST = ConstantExpr::getSub(AddOne(RHSCst), LHSCst);
|
|
|
|
return Builder->CreateICmpULT(Add, AddCST);
|
|
|
|
}
|
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
break; // (X == 13 | X == 15) -> no change
|
|
|
|
case ICmpInst::ICMP_UGT: // (X == 13 | X u> 14) -> no change
|
|
|
|
case ICmpInst::ICMP_SGT: // (X == 13 | X s> 14) -> no change
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_NE: // (X == 13 | X != 15) -> X != 15
|
|
|
|
case ICmpInst::ICMP_ULT: // (X == 13 | X u< 15) -> X u< 15
|
|
|
|
case ICmpInst::ICMP_SLT: // (X == 13 | X s< 15) -> X s< 15
|
2010-03-05 16:46:26 +08:00
|
|
|
return RHS;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_NE:
|
|
|
|
switch (RHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_EQ: // (X != 13 | X == 15) -> X != 13
|
|
|
|
case ICmpInst::ICMP_UGT: // (X != 13 | X u> 15) -> X != 13
|
|
|
|
case ICmpInst::ICMP_SGT: // (X != 13 | X s> 15) -> X != 13
|
2010-03-05 16:46:26 +08:00
|
|
|
return LHS;
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_NE: // (X != 13 | X != 15) -> true
|
|
|
|
case ICmpInst::ICMP_ULT: // (X != 13 | X u< 15) -> true
|
|
|
|
case ICmpInst::ICMP_SLT: // (X != 13 | X s< 15) -> true
|
2013-06-06 08:37:23 +08:00
|
|
|
return Builder->getTrue();
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
case ICmpInst::ICMP_ULT:
|
|
|
|
switch (RHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_EQ: // (X u< 13 | X == 14) -> no change
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_UGT: // (X u< 13 | X u> 15) -> (X-13) u> 2
|
|
|
|
// If RHSCst is [us]MAXINT, it is always false. Not handling
|
|
|
|
// this can cause overflow.
|
|
|
|
if (RHSCst->isMaxValue(false))
|
2010-03-05 16:46:26 +08:00
|
|
|
return LHS;
|
|
|
|
return InsertRangeTest(Val, LHSCst, AddOne(RHSCst), false, false);
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_SGT: // (X u< 13 | X s> 15) -> no change
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_NE: // (X u< 13 | X != 15) -> X != 15
|
|
|
|
case ICmpInst::ICMP_ULT: // (X u< 13 | X u< 15) -> X u< 15
|
2010-03-05 16:46:26 +08:00
|
|
|
return RHS;
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_SLT: // (X u< 13 | X s< 15) -> no change
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_SLT:
|
|
|
|
switch (RHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_EQ: // (X s< 13 | X == 14) -> no change
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_SGT: // (X s< 13 | X s> 15) -> (X-13) s> 2
|
|
|
|
// If RHSCst is [us]MAXINT, it is always false. Not handling
|
|
|
|
// this can cause overflow.
|
|
|
|
if (RHSCst->isMaxValue(true))
|
2010-03-05 16:46:26 +08:00
|
|
|
return LHS;
|
|
|
|
return InsertRangeTest(Val, LHSCst, AddOne(RHSCst), true, false);
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_UGT: // (X s< 13 | X u> 15) -> no change
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_NE: // (X s< 13 | X != 15) -> X != 15
|
|
|
|
case ICmpInst::ICMP_SLT: // (X s< 13 | X s< 15) -> X s< 15
|
2010-03-05 16:46:26 +08:00
|
|
|
return RHS;
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_ULT: // (X s< 13 | X u< 15) -> no change
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_UGT:
|
|
|
|
switch (RHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_EQ: // (X u> 13 | X == 15) -> X u> 13
|
|
|
|
case ICmpInst::ICMP_UGT: // (X u> 13 | X u> 15) -> X u> 13
|
2010-03-05 16:46:26 +08:00
|
|
|
return LHS;
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_SGT: // (X u> 13 | X s> 15) -> no change
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_NE: // (X u> 13 | X != 15) -> true
|
|
|
|
case ICmpInst::ICMP_ULT: // (X u> 13 | X u< 15) -> true
|
2013-06-06 08:37:23 +08:00
|
|
|
return Builder->getTrue();
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_SLT: // (X u> 13 | X s< 15) -> no change
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_SGT:
|
|
|
|
switch (RHSCC) {
|
|
|
|
default: llvm_unreachable("Unknown integer condition code!");
|
|
|
|
case ICmpInst::ICMP_EQ: // (X s> 13 | X == 15) -> X > 13
|
|
|
|
case ICmpInst::ICMP_SGT: // (X s> 13 | X s> 15) -> X > 13
|
2010-03-05 16:46:26 +08:00
|
|
|
return LHS;
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_UGT: // (X s> 13 | X u> 15) -> no change
|
|
|
|
break;
|
|
|
|
case ICmpInst::ICMP_NE: // (X s> 13 | X != 15) -> true
|
|
|
|
case ICmpInst::ICMP_SLT: // (X s> 13 | X s< 15) -> true
|
2013-06-06 08:37:23 +08:00
|
|
|
return Builder->getTrue();
|
2010-01-05 15:50:36 +08:00
|
|
|
case ICmpInst::ICMP_ULT: // (X s> 13 | X u< 15) -> no change
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// Optimize (fcmp)|(fcmp). NOTE: Unlike the rest of instcombine, this returns
|
|
|
|
/// a Value which should already be inserted into the function.
|
2010-03-05 16:46:26 +08:00
|
|
|
Value *InstCombiner::FoldOrOfFCmps(FCmpInst *LHS, FCmpInst *RHS) {
|
[InstCombine] Simplify and correct folding fcmps with the same children
Summary: Take advantage of FCmpInst::Predicate's bit pattern and handle (fcmp *, x, y) | (fcmp *, x, y) and (fcmp *, x, y) & (fcmp *, x, y) more consistently. Also fold more FCmpInst::FCMP_FALSE and FCmpInst::FCMP_TRUE to constants.
Currently InstCombine wrongly folds (fcmp ogt, x, y) | (fcmp ord, x, y) to (fcmp ogt, x, y); this patch also fixes that.
Reviewers: spatel
Subscribers: llvm-commits, iteratee, echristo
Differential Revision: http://reviews.llvm.org/D21775
llvm-svn: 274156
2016-06-30 04:10:17 +08:00
|
|
|
Value *Op0LHS = LHS->getOperand(0), *Op0RHS = LHS->getOperand(1);
|
|
|
|
Value *Op1LHS = RHS->getOperand(0), *Op1RHS = RHS->getOperand(1);
|
|
|
|
FCmpInst::Predicate Op0CC = LHS->getPredicate(), Op1CC = RHS->getPredicate();
|
|
|
|
|
|
|
|
if (Op0LHS == Op1RHS && Op0RHS == Op1LHS) {
|
|
|
|
// Swap RHS operands to match LHS.
|
|
|
|
Op1CC = FCmpInst::getSwappedPredicate(Op1CC);
|
|
|
|
std::swap(Op1LHS, Op1RHS);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Simplify (fcmp cc0 x, y) | (fcmp cc1 x, y).
|
|
|
|
// This is a similar transformation to the one in FoldAndOfFCmps.
|
|
|
|
//
|
|
|
|
// Since (R & CC0) and (R & CC1) are either R or 0, we actually have this:
|
|
|
|
// bool(R & CC0) || bool(R & CC1)
|
|
|
|
// = bool((R & CC0) | (R & CC1))
|
|
|
|
// = bool(R & (CC0 | CC1)) <= by reversed distribution (contribution? ;)
|
|
|
|
if (Op0LHS == Op1LHS && Op0RHS == Op1RHS)
|
|
|
|
return getFCmpValue(getFCmpCode(Op0CC) | getFCmpCode(Op1CC), Op0LHS, Op0RHS,
|
|
|
|
Builder);
|
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (LHS->getPredicate() == FCmpInst::FCMP_UNO &&
|
2012-12-20 15:09:41 +08:00
|
|
|
RHS->getPredicate() == FCmpInst::FCMP_UNO &&
|
2010-01-05 15:50:36 +08:00
|
|
|
LHS->getOperand(0)->getType() == RHS->getOperand(0)->getType()) {
|
|
|
|
if (ConstantFP *LHSC = dyn_cast<ConstantFP>(LHS->getOperand(1)))
|
|
|
|
if (ConstantFP *RHSC = dyn_cast<ConstantFP>(RHS->getOperand(1))) {
|
|
|
|
// If either of the constants are nans, then the whole thing returns
|
|
|
|
// true.
|
|
|
|
if (LHSC->getValueAPF().isNaN() || RHSC->getValueAPF().isNaN())
|
2013-06-06 08:37:23 +08:00
|
|
|
return Builder->getTrue();
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// Otherwise, no need to compare the two constants, compare the
|
|
|
|
// rest.
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateFCmpUNO(LHS->getOperand(0), RHS->getOperand(0));
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// Handle vector zeros. This occurs because the canonical form of
|
|
|
|
// "fcmp uno x,x" is "fcmp uno x, 0".
|
|
|
|
if (isa<ConstantAggregateZero>(LHS->getOperand(1)) &&
|
|
|
|
isa<ConstantAggregateZero>(RHS->getOperand(1)))
|
2010-03-05 16:46:26 +08:00
|
|
|
return Builder->CreateFCmpUNO(LHS->getOperand(0), RHS->getOperand(0));
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2015-09-09 02:24:36 +08:00
|
|
|
/// This helper function folds:
|
2010-01-05 15:50:36 +08:00
|
|
|
///
|
|
|
|
/// ((A | B) & C1) | (B & C2)
|
|
|
|
///
|
|
|
|
/// into:
|
2012-12-20 15:09:41 +08:00
|
|
|
///
|
2010-01-05 15:50:36 +08:00
|
|
|
/// (A & C1) | B
|
|
|
|
///
|
|
|
|
/// when the XOR of the two constants is "all ones" (-1).
|
|
|
|
Instruction *InstCombiner::FoldOrWithConstants(BinaryOperator &I, Value *Op,
|
|
|
|
Value *A, Value *B, Value *C) {
|
|
|
|
ConstantInt *CI1 = dyn_cast<ConstantInt>(C);
|
2014-04-25 13:29:35 +08:00
|
|
|
if (!CI1) return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
|
2014-04-25 13:29:35 +08:00
|
|
|
Value *V1 = nullptr;
|
|
|
|
ConstantInt *CI2 = nullptr;
|
|
|
|
if (!match(Op, m_And(m_Value(V1), m_ConstantInt(CI2)))) return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
|
|
|
|
APInt Xor = CI1->getValue() ^ CI2->getValue();
|
2014-04-25 13:29:35 +08:00
|
|
|
if (!Xor.isAllOnesValue()) return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
|
|
|
|
if (V1 == A || V1 == B) {
|
|
|
|
Value *NewOp = Builder->CreateAnd((V1 == A) ? B : A, CI1);
|
|
|
|
return BinaryOperator::CreateOr(NewOp, V1);
|
|
|
|
}
|
|
|
|
|
2014-04-25 13:29:35 +08:00
|
|
|
return nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
2014-08-21 13:14:48 +08:00
|
|
|
/// \brief This helper function folds:
|
|
|
|
///
|
|
|
|
/// ((A | B) & C1) ^ (B & C2)
|
|
|
|
///
|
|
|
|
/// into:
|
|
|
|
///
|
|
|
|
/// (A & C1) ^ B
|
|
|
|
///
|
|
|
|
/// when the XOR of the two constants is "all ones" (-1).
|
|
|
|
Instruction *InstCombiner::FoldXorWithConstants(BinaryOperator &I, Value *Op,
|
|
|
|
Value *A, Value *B, Value *C) {
|
|
|
|
ConstantInt *CI1 = dyn_cast<ConstantInt>(C);
|
|
|
|
if (!CI1)
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
Value *V1 = nullptr;
|
|
|
|
ConstantInt *CI2 = nullptr;
|
|
|
|
if (!match(Op, m_And(m_Value(V1), m_ConstantInt(CI2))))
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
APInt Xor = CI1->getValue() ^ CI2->getValue();
|
|
|
|
if (!Xor.isAllOnesValue())
|
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
if (V1 == A || V1 == B) {
|
|
|
|
Value *NewOp = Builder->CreateAnd(V1 == A ? B : A, CI1);
|
|
|
|
return BinaryOperator::CreateXor(NewOp, V1);
|
|
|
|
}
|
|
|
|
|
|
|
|
return nullptr;
|
|
|
|
}
|
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
Instruction *InstCombiner::visitOr(BinaryOperator &I) {
|
2010-11-13 23:10:37 +08:00
|
|
|
bool Changed = SimplifyAssociativeOrCommutative(I);
|
2010-01-05 15:50:36 +08:00
|
|
|
Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
|
|
|
|
|
2014-05-11 16:46:12 +08:00
|
|
|
if (Value *V = SimplifyVectorOp(I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, V);
|
2014-05-11 16:46:12 +08:00
|
|
|
|
2015-01-04 20:03:27 +08:00
|
|
|
if (Value *V = SimplifyOrInst(Op0, Op1, DL, TLI, DT, AC))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, V);
|
2010-03-03 08:35:56 +08:00
|
|
|
|
2010-12-22 21:36:08 +08:00
|
|
|
// (A&B)|(A&C) -> A&(B|C) etc
|
|
|
|
if (Value *V = SimplifyUsingDistributiveLaws(I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, V);
|
2010-11-23 22:23:47 +08:00
|
|
|
|
2012-12-20 15:09:41 +08:00
|
|
|
// See if we can simplify any instructions used by the instruction whose sole
|
2010-01-05 15:50:36 +08:00
|
|
|
// purpose is to compute bits we don't care about.
|
|
|
|
if (SimplifyDemandedInstructionBits(I))
|
|
|
|
return &I;
|
|
|
|
|
2014-12-04 17:44:01 +08:00
|
|
|
if (Value *V = SimplifyBSwap(I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, V);
|
2014-12-04 17:44:01 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (ConstantInt *RHS = dyn_cast<ConstantInt>(Op1)) {
|
2014-04-25 13:29:35 +08:00
|
|
|
ConstantInt *C1 = nullptr; Value *X = nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
// (X & C1) | C2 --> (X | C2) & (C1|C2)
|
2012-09-27 18:14:43 +08:00
|
|
|
// iff (C1 & C2) == 0.
|
2010-01-05 15:50:36 +08:00
|
|
|
if (match(Op0, m_And(m_Value(X), m_ConstantInt(C1))) &&
|
2010-03-03 08:35:56 +08:00
|
|
|
(RHS->getValue() & C1->getValue()) != 0 &&
|
2010-01-05 15:50:36 +08:00
|
|
|
Op0->hasOneUse()) {
|
|
|
|
Value *Or = Builder->CreateOr(X, RHS);
|
|
|
|
Or->takeName(Op0);
|
2012-12-20 15:09:41 +08:00
|
|
|
return BinaryOperator::CreateAnd(Or,
|
2013-06-06 08:37:23 +08:00
|
|
|
Builder->getInt(RHS->getValue() | C1->getValue()));
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// (X ^ C1) | C2 --> (X | C2) ^ (C1&~C2)
|
|
|
|
if (match(Op0, m_Xor(m_Value(X), m_ConstantInt(C1))) &&
|
|
|
|
Op0->hasOneUse()) {
|
|
|
|
Value *Or = Builder->CreateOr(X, RHS);
|
|
|
|
Or->takeName(Op0);
|
|
|
|
return BinaryOperator::CreateXor(Or,
|
2013-06-06 08:37:23 +08:00
|
|
|
Builder->getInt(C1->getValue() & ~RHS->getValue()));
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Try to fold constant and into select arguments.
|
|
|
|
if (SelectInst *SI = dyn_cast<SelectInst>(Op0))
|
|
|
|
if (Instruction *R = FoldOpIntoSelect(I, SI))
|
|
|
|
return R;
|
2010-03-03 08:35:56 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (isa<PHINode>(Op0))
|
|
|
|
if (Instruction *NV = FoldOpIntoPhi(I))
|
|
|
|
return NV;
|
|
|
|
}
|
|
|
|
|
2016-05-26 22:58:51 +08:00
|
|
|
// Given an OR instruction, check to see if this is a bswap.
|
|
|
|
if (Instruction *BSwap = MatchBSwap(I))
|
|
|
|
return BSwap;
|
|
|
|
|
2014-04-25 13:29:35 +08:00
|
|
|
Value *A = nullptr, *B = nullptr;
|
|
|
|
ConstantInt *C1 = nullptr, *C2 = nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
|
2012-09-27 18:14:43 +08:00
|
|
|
// (X^C)|Y -> (X|Y)^C iff Y&C == 0
|
2010-01-05 15:50:36 +08:00
|
|
|
if (Op0->hasOneUse() &&
|
|
|
|
match(Op0, m_Xor(m_Value(A), m_ConstantInt(C1))) &&
|
Make use of @llvm.assume in ValueTracking (computeKnownBits, etc.)
This change, which allows @llvm.assume to be used from within computeKnownBits
(and other associated functions in ValueTracking), adds some (optional)
parameters to computeKnownBits and friends. These functions now (optionally)
take a "context" instruction pointer, an AssumptionTracker pointer, and also a
DomTree pointer, and most of the changes are just to pass this new information
when it is easily available from InstSimplify, InstCombine, etc.
As explained below, the significant conceptual change is that known properties
of a value might depend on the control-flow location of the use (because we
care that the @llvm.assume dominates the use because assumptions have
control-flow dependencies). This means that, when we ask if bits are known in a
value, we might get different answers for different uses.
The significant changes are all in ValueTracking. Two main changes: First, as
with the rest of the code, new parameters need to be passed around. To make
this easier, I grouped them into a structure, and I made internal static
versions of the relevant functions that take this structure as a parameter. The
new code does as you might expect, it looks for @llvm.assume calls that make
use of the value we're trying to learn something about (often indirectly),
attempts to pattern match that expression, and uses the result if successful.
By making use of the AssumptionTracker, the process of finding @llvm.assume
calls is not expensive.
Part of the structure being passed around inside ValueTracking is a set of
already-considered @llvm.assume calls. This is to prevent a query using, for
example, the assume(a == b), to recurse on itself. The context and DT params
are used to find applicable assumptions. An assumption needs to dominate the
context instruction, or come after it deterministically. In this latter case we
only handle the specific case where both the assumption and the context
instruction are in the same block, and we need to exclude assumptions from
being used to simplify their own ephemeral values (those which contribute only
to the assumption) because otherwise the assumption would prove its feeding
comparison trivial and would be removed.
This commit adds the plumbing and the logic for a simple masked-bit propagation
(just enough to write a regression test). Future commits add more patterns
(and, correspondingly, more regression tests).
llvm-svn: 217342
2014-09-08 02:57:58 +08:00
|
|
|
MaskedValueIsZero(Op1, C1->getValue(), 0, &I)) {
|
2010-01-05 15:50:36 +08:00
|
|
|
Value *NOr = Builder->CreateOr(A, Op1);
|
|
|
|
NOr->takeName(Op0);
|
|
|
|
return BinaryOperator::CreateXor(NOr, C1);
|
|
|
|
}
|
|
|
|
|
2012-09-27 18:14:43 +08:00
|
|
|
// Y|(X^C) -> (X|Y)^C iff Y&C == 0
|
2010-01-05 15:50:36 +08:00
|
|
|
if (Op1->hasOneUse() &&
|
|
|
|
match(Op1, m_Xor(m_Value(A), m_ConstantInt(C1))) &&
|
Make use of @llvm.assume in ValueTracking (computeKnownBits, etc.)
This change, which allows @llvm.assume to be used from within computeKnownBits
(and other associated functions in ValueTracking), adds some (optional)
parameters to computeKnownBits and friends. These functions now (optionally)
take a "context" instruction pointer, an AssumptionTracker pointer, and also a
DomTree pointer, and most of the changes are just to pass this new information
when it is easily available from InstSimplify, InstCombine, etc.
As explained below, the significant conceptual change is that known properties
of a value might depend on the control-flow location of the use (because we
care that the @llvm.assume dominates the use because assumptions have
control-flow dependencies). This means that, when we ask if bits are known in a
value, we might get different answers for different uses.
The significant changes are all in ValueTracking. Two main changes: First, as
with the rest of the code, new parameters need to be passed around. To make
this easier, I grouped them into a structure, and I made internal static
versions of the relevant functions that take this structure as a parameter. The
new code does as you might expect, it looks for @llvm.assume calls that make
use of the value we're trying to learn something about (often indirectly),
attempts to pattern match that expression, and uses the result if successful.
By making use of the AssumptionTracker, the process of finding @llvm.assume
calls is not expensive.
Part of the structure being passed around inside ValueTracking is a set of
already-considered @llvm.assume calls. This is to prevent a query using, for
example, the assume(a == b), to recurse on itself. The context and DT params
are used to find applicable assumptions. An assumption needs to dominate the
context instruction, or come after it deterministically. In this latter case we
only handle the specific case where both the assumption and the context
instruction are in the same block, and we need to exclude assumptions from
being used to simplify their own ephemeral values (those which contribute only
to the assumption) because otherwise the assumption would prove its feeding
comparison trivial and would be removed.
This commit adds the plumbing and the logic for a simple masked-bit propagation
(just enough to write a regression test). Future commits add more patterns
(and, correspondingly, more regression tests).
llvm-svn: 217342
2014-09-08 02:57:58 +08:00
|
|
|
MaskedValueIsZero(Op0, C1->getValue(), 0, &I)) {
|
2010-01-05 15:50:36 +08:00
|
|
|
Value *NOr = Builder->CreateOr(A, Op0);
|
|
|
|
NOr->takeName(Op0);
|
|
|
|
return BinaryOperator::CreateXor(NOr, C1);
|
|
|
|
}
|
|
|
|
|
2014-07-23 02:09:41 +08:00
|
|
|
// ((~A & B) | A) -> (A | B)
|
|
|
|
if (match(Op0, m_And(m_Not(m_Value(A)), m_Value(B))) &&
|
|
|
|
match(Op1, m_Specific(A)))
|
|
|
|
return BinaryOperator::CreateOr(A, B);
|
|
|
|
|
|
|
|
// ((A & B) | ~A) -> (~A | B)
|
|
|
|
if (match(Op0, m_And(m_Value(A), m_Value(B))) &&
|
|
|
|
match(Op1, m_Not(m_Specific(A))))
|
|
|
|
return BinaryOperator::CreateOr(Builder->CreateNot(A), B);
|
|
|
|
|
2014-08-01 12:50:31 +08:00
|
|
|
// (A & (~B)) | (A ^ B) -> (A ^ B)
|
|
|
|
if (match(Op0, m_And(m_Value(A), m_Not(m_Value(B)))) &&
|
|
|
|
match(Op1, m_Xor(m_Specific(A), m_Specific(B))))
|
|
|
|
return BinaryOperator::CreateXor(A, B);
|
|
|
|
|
|
|
|
// (A ^ B) | ( A & (~B)) -> (A ^ B)
|
|
|
|
if (match(Op0, m_Xor(m_Value(A), m_Value(B))) &&
|
|
|
|
match(Op1, m_And(m_Specific(A), m_Not(m_Specific(B)))))
|
|
|
|
return BinaryOperator::CreateXor(A, B);
|
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// (A & C)|(B & D)
|
2014-04-25 13:29:35 +08:00
|
|
|
Value *C = nullptr, *D = nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
if (match(Op0, m_And(m_Value(A), m_Value(C))) &&
|
|
|
|
match(Op1, m_And(m_Value(B), m_Value(D)))) {
|
2014-04-25 13:29:35 +08:00
|
|
|
Value *V1 = nullptr, *V2 = nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
C1 = dyn_cast<ConstantInt>(C);
|
|
|
|
C2 = dyn_cast<ConstantInt>(D);
|
|
|
|
if (C1 && C2) { // (A & C1)|(B & C2)
|
|
|
|
if ((C1->getValue() & C2->getValue()) == 0) {
|
add one more bitfield optimization, allowing clang to generate
good code on PR4216:
_test_bitfield: ## @test_bitfield
orl $32962, %edi
movl $4294941946, %eax
andq %rdi, %rax
ret
instead of:
_test_bitfield:
movl $4294941696, %ecx
movl %edi, %eax
orl $194, %edi
orl $32768, %eax
andq $250, %rdi
andq %rax, %rcx
movq %rdi, %rax
orq %rcx, %rax
ret
Evan is looking into the remaining andq+imm -> andl optimization.
llvm-svn: 93147
2010-01-11 14:55:24 +08:00
|
|
|
// ((V | N) & C1) | (V & C2) --> (V|N) & (C1|C2)
|
2012-09-27 18:14:43 +08:00
|
|
|
// iff (C1&C2) == 0 and (N&~C1) == 0
|
2010-01-05 15:50:36 +08:00
|
|
|
if (match(A, m_Or(m_Value(V1), m_Value(V2))) &&
|
Make use of @llvm.assume in ValueTracking (computeKnownBits, etc.)
This change, which allows @llvm.assume to be used from within computeKnownBits
(and other associated functions in ValueTracking), adds some (optional)
parameters to computeKnownBits and friends. These functions now (optionally)
take a "context" instruction pointer, an AssumptionTracker pointer, and also a
DomTree pointer, and most of the changes are just to pass this new information
when it is easily available from InstSimplify, InstCombine, etc.
As explained below, the significant conceptual change is that known properties
of a value might depend on the control-flow location of the use (because we
care that the @llvm.assume dominates the use because assumptions have
control-flow dependencies). This means that, when we ask if bits are known in a
value, we might get different answers for different uses.
The significant changes are all in ValueTracking. Two main changes: First, as
with the rest of the code, new parameters need to be passed around. To make
this easier, I grouped them into a structure, and I made internal static
versions of the relevant functions that take this structure as a parameter. The
new code does as you might expect, it looks for @llvm.assume calls that make
use of the value we're trying to learn something about (often indirectly),
attempts to pattern match that expression, and uses the result if successful.
By making use of the AssumptionTracker, the process of finding @llvm.assume
calls is not expensive.
Part of the structure being passed around inside ValueTracking is a set of
already-considered @llvm.assume calls. This is to prevent a query using, for
example, the assume(a == b), to recurse on itself. The context and DT params
are used to find applicable assumptions. An assumption needs to dominate the
context instruction, or come after it deterministically. In this latter case we
only handle the specific case where both the assumption and the context
instruction are in the same block, and we need to exclude assumptions from
being used to simplify their own ephemeral values (those which contribute only
to the assumption) because otherwise the assumption would prove its feeding
comparison trivial and would be removed.
This commit adds the plumbing and the logic for a simple masked-bit propagation
(just enough to write a regression test). Future commits add more patterns
(and, correspondingly, more regression tests).
llvm-svn: 217342
2014-09-08 02:57:58 +08:00
|
|
|
((V1 == B &&
|
|
|
|
MaskedValueIsZero(V2, ~C1->getValue(), 0, &I)) || // (V|N)
|
|
|
|
(V2 == B &&
|
|
|
|
MaskedValueIsZero(V1, ~C1->getValue(), 0, &I)))) // (N|V)
|
2010-01-05 15:50:36 +08:00
|
|
|
return BinaryOperator::CreateAnd(A,
|
2013-06-06 08:37:23 +08:00
|
|
|
Builder->getInt(C1->getValue()|C2->getValue()));
|
2010-01-05 15:50:36 +08:00
|
|
|
// Or commutes, try both ways.
|
|
|
|
if (match(B, m_Or(m_Value(V1), m_Value(V2))) &&
|
Make use of @llvm.assume in ValueTracking (computeKnownBits, etc.)
This change, which allows @llvm.assume to be used from within computeKnownBits
(and other associated functions in ValueTracking), adds some (optional)
parameters to computeKnownBits and friends. These functions now (optionally)
take a "context" instruction pointer, an AssumptionTracker pointer, and also a
DomTree pointer, and most of the changes are just to pass this new information
when it is easily available from InstSimplify, InstCombine, etc.
As explained below, the significant conceptual change is that known properties
of a value might depend on the control-flow location of the use (because we
care that the @llvm.assume dominates the use because assumptions have
control-flow dependencies). This means that, when we ask if bits are known in a
value, we might get different answers for different uses.
The significant changes are all in ValueTracking. Two main changes: First, as
with the rest of the code, new parameters need to be passed around. To make
this easier, I grouped them into a structure, and I made internal static
versions of the relevant functions that take this structure as a parameter. The
new code does as you might expect, it looks for @llvm.assume calls that make
use of the value we're trying to learn something about (often indirectly),
attempts to pattern match that expression, and uses the result if successful.
By making use of the AssumptionTracker, the process of finding @llvm.assume
calls is not expensive.
Part of the structure being passed around inside ValueTracking is a set of
already-considered @llvm.assume calls. This is to prevent a query using, for
example, the assume(a == b), to recurse on itself. The context and DT params
are used to find applicable assumptions. An assumption needs to dominate the
context instruction, or come after it deterministically. In this latter case we
only handle the specific case where both the assumption and the context
instruction are in the same block, and we need to exclude assumptions from
being used to simplify their own ephemeral values (those which contribute only
to the assumption) because otherwise the assumption would prove its feeding
comparison trivial and would be removed.
This commit adds the plumbing and the logic for a simple masked-bit propagation
(just enough to write a regression test). Future commits add more patterns
(and, correspondingly, more regression tests).
llvm-svn: 217342
2014-09-08 02:57:58 +08:00
|
|
|
((V1 == A &&
|
|
|
|
MaskedValueIsZero(V2, ~C2->getValue(), 0, &I)) || // (V|N)
|
|
|
|
(V2 == A &&
|
|
|
|
MaskedValueIsZero(V1, ~C2->getValue(), 0, &I)))) // (N|V)
|
2010-01-05 15:50:36 +08:00
|
|
|
return BinaryOperator::CreateAnd(B,
|
2013-06-06 08:37:23 +08:00
|
|
|
Builder->getInt(C1->getValue()|C2->getValue()));
|
2012-12-20 15:09:41 +08:00
|
|
|
|
add one more bitfield optimization, allowing clang to generate
good code on PR4216:
_test_bitfield: ## @test_bitfield
orl $32962, %edi
movl $4294941946, %eax
andq %rdi, %rax
ret
instead of:
_test_bitfield:
movl $4294941696, %ecx
movl %edi, %eax
orl $194, %edi
orl $32768, %eax
andq $250, %rdi
andq %rax, %rcx
movq %rdi, %rax
orq %rcx, %rax
ret
Evan is looking into the remaining andq+imm -> andl optimization.
llvm-svn: 93147
2010-01-11 14:55:24 +08:00
|
|
|
// ((V|C3)&C1) | ((V|C4)&C2) --> (V|C3|C4)&(C1|C2)
|
2012-09-27 18:14:43 +08:00
|
|
|
// iff (C1&C2) == 0 and (C3&~C1) == 0 and (C4&~C2) == 0.
|
2014-04-25 13:29:35 +08:00
|
|
|
ConstantInt *C3 = nullptr, *C4 = nullptr;
|
add one more bitfield optimization, allowing clang to generate
good code on PR4216:
_test_bitfield: ## @test_bitfield
orl $32962, %edi
movl $4294941946, %eax
andq %rdi, %rax
ret
instead of:
_test_bitfield:
movl $4294941696, %ecx
movl %edi, %eax
orl $194, %edi
orl $32768, %eax
andq $250, %rdi
andq %rax, %rcx
movq %rdi, %rax
orq %rcx, %rax
ret
Evan is looking into the remaining andq+imm -> andl optimization.
llvm-svn: 93147
2010-01-11 14:55:24 +08:00
|
|
|
if (match(A, m_Or(m_Value(V1), m_ConstantInt(C3))) &&
|
|
|
|
(C3->getValue() & ~C1->getValue()) == 0 &&
|
|
|
|
match(B, m_Or(m_Specific(V1), m_ConstantInt(C4))) &&
|
|
|
|
(C4->getValue() & ~C2->getValue()) == 0) {
|
|
|
|
V2 = Builder->CreateOr(V1, ConstantExpr::getOr(C3, C4), "bitfield");
|
|
|
|
return BinaryOperator::CreateAnd(V2,
|
2013-06-06 08:37:23 +08:00
|
|
|
Builder->getInt(C1->getValue()|C2->getValue()));
|
add one more bitfield optimization, allowing clang to generate
good code on PR4216:
_test_bitfield: ## @test_bitfield
orl $32962, %edi
movl $4294941946, %eax
andq %rdi, %rax
ret
instead of:
_test_bitfield:
movl $4294941696, %ecx
movl %edi, %eax
orl $194, %edi
orl $32768, %eax
andq $250, %rdi
andq %rax, %rcx
movq %rdi, %rax
orq %rcx, %rax
ret
Evan is looking into the remaining andq+imm -> andl optimization.
llvm-svn: 93147
2010-01-11 14:55:24 +08:00
|
|
|
}
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-06-25 02:26:02 +08:00
|
|
|
// (Cond & C) | (~Cond & D) -> Cond ? C : D, and commuted variants.
|
2016-06-25 02:55:27 +08:00
|
|
|
if (Value *V = matchSelectFromAndOr(A, C, B, D, *Builder))
|
|
|
|
return replaceInstUsesWith(I, V);
|
|
|
|
if (Value *V = matchSelectFromAndOr(A, C, D, B, *Builder))
|
|
|
|
return replaceInstUsesWith(I, V);
|
|
|
|
if (Value *V = matchSelectFromAndOr(C, A, B, D, *Builder))
|
|
|
|
return replaceInstUsesWith(I, V);
|
|
|
|
if (Value *V = matchSelectFromAndOr(C, A, D, B, *Builder))
|
|
|
|
return replaceInstUsesWith(I, V);
|
|
|
|
if (Value *V = matchSelectFromAndOr(B, D, A, C, *Builder))
|
|
|
|
return replaceInstUsesWith(I, V);
|
|
|
|
if (Value *V = matchSelectFromAndOr(B, D, C, A, *Builder))
|
|
|
|
return replaceInstUsesWith(I, V);
|
|
|
|
if (Value *V = matchSelectFromAndOr(D, B, A, C, *Builder))
|
|
|
|
return replaceInstUsesWith(I, V);
|
|
|
|
if (Value *V = matchSelectFromAndOr(D, B, C, A, *Builder))
|
|
|
|
return replaceInstUsesWith(I, V);
|
2010-01-05 15:50:36 +08:00
|
|
|
|
|
|
|
// ((A&~B)|(~A&B)) -> A^B
|
|
|
|
if ((match(C, m_Not(m_Specific(D))) &&
|
|
|
|
match(B, m_Not(m_Specific(A)))))
|
|
|
|
return BinaryOperator::CreateXor(A, D);
|
|
|
|
// ((~B&A)|(~A&B)) -> A^B
|
|
|
|
if ((match(A, m_Not(m_Specific(D))) &&
|
|
|
|
match(B, m_Not(m_Specific(C)))))
|
|
|
|
return BinaryOperator::CreateXor(C, D);
|
|
|
|
// ((A&~B)|(B&~A)) -> A^B
|
|
|
|
if ((match(C, m_Not(m_Specific(B))) &&
|
|
|
|
match(D, m_Not(m_Specific(A)))))
|
|
|
|
return BinaryOperator::CreateXor(A, B);
|
|
|
|
// ((~B&A)|(B&~A)) -> A^B
|
|
|
|
if ((match(A, m_Not(m_Specific(B))) &&
|
|
|
|
match(D, m_Not(m_Specific(C)))))
|
|
|
|
return BinaryOperator::CreateXor(C, B);
|
2010-07-12 21:34:22 +08:00
|
|
|
|
|
|
|
// ((A|B)&1)|(B&-2) -> (A&1) | B
|
|
|
|
if (match(A, m_Or(m_Value(V1), m_Specific(B))) ||
|
|
|
|
match(A, m_Or(m_Specific(B), m_Value(V1)))) {
|
|
|
|
Instruction *Ret = FoldOrWithConstants(I, Op1, V1, B, C);
|
|
|
|
if (Ret) return Ret;
|
|
|
|
}
|
|
|
|
// (B&-2)|((A|B)&1) -> (A&1) | B
|
|
|
|
if (match(B, m_Or(m_Specific(A), m_Value(V1))) ||
|
|
|
|
match(B, m_Or(m_Value(V1), m_Specific(A)))) {
|
|
|
|
Instruction *Ret = FoldOrWithConstants(I, Op0, A, V1, D);
|
|
|
|
if (Ret) return Ret;
|
|
|
|
}
|
2014-08-21 13:14:48 +08:00
|
|
|
// ((A^B)&1)|(B&-2) -> (A&1) ^ B
|
|
|
|
if (match(A, m_Xor(m_Value(V1), m_Specific(B))) ||
|
|
|
|
match(A, m_Xor(m_Specific(B), m_Value(V1)))) {
|
|
|
|
Instruction *Ret = FoldXorWithConstants(I, Op1, V1, B, C);
|
|
|
|
if (Ret) return Ret;
|
|
|
|
}
|
|
|
|
// (B&-2)|((A^B)&1) -> (A&1) ^ B
|
|
|
|
if (match(B, m_Xor(m_Specific(A), m_Value(V1))) ||
|
|
|
|
match(B, m_Xor(m_Value(V1), m_Specific(A)))) {
|
|
|
|
Instruction *Ret = FoldXorWithConstants(I, Op0, A, V1, D);
|
|
|
|
if (Ret) return Ret;
|
|
|
|
}
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
InstCombine: Simplify (A ^ B) or/and (A ^ B ^ C)
While we can already transform A | (A ^ B) into A | B, things get bad
once we have (A ^ B) | (A ^ B ^ Cst) because reassociation will morph
this into (A ^ B) | ((A ^ Cst) ^ B). Our existing patterns fail once
this happens.
To fix this, we add a new pattern which looks through the tree of xor
binary operators to see that, in fact, there exists a redundant xor
operation.
What follows below is a correctness proof of the transform using CVC3.
$ cat t.cvc
A, B, C : BITVECTOR(64);
QUERY BVXOR(A, B) | BVXOR(BVXOR(B, C), A) = BVXOR(A, B) | C;
QUERY BVXOR(BVXOR(A, C), B) | BVXOR(A, B) = BVXOR(A, B) | C;
QUERY BVXOR(A, B) & BVXOR(BVXOR(B, C), A) = BVXOR(A, B) & ~C;
QUERY BVXOR(BVXOR(A, C), B) & BVXOR(A, B) = BVXOR(A, B) & ~C;
$ cvc3 < t.cvc
Valid.
Valid.
Valid.
Valid.
llvm-svn: 214342
2014-07-31 05:26:37 +08:00
|
|
|
// (A ^ B) | ((B ^ C) ^ A) -> (A ^ B) | C
|
|
|
|
if (match(Op0, m_Xor(m_Value(A), m_Value(B))))
|
|
|
|
if (match(Op1, m_Xor(m_Xor(m_Specific(B), m_Value(C)), m_Specific(A))))
|
|
|
|
if (Op1->hasOneUse() || cast<BinaryOperator>(Op1)->hasOneUse())
|
|
|
|
return BinaryOperator::CreateOr(Op0, C);
|
|
|
|
|
|
|
|
// ((A ^ C) ^ B) | (B ^ A) -> (B ^ A) | C
|
|
|
|
if (match(Op0, m_Xor(m_Xor(m_Value(A), m_Value(C)), m_Value(B))))
|
|
|
|
if (match(Op1, m_Xor(m_Specific(B), m_Specific(A))))
|
|
|
|
if (Op0->hasOneUse() || cast<BinaryOperator>(Op0)->hasOneUse())
|
|
|
|
return BinaryOperator::CreateOr(Op1, C);
|
|
|
|
|
2014-08-14 14:41:38 +08:00
|
|
|
// ((B | C) & A) | B -> B | (A & C)
|
|
|
|
if (match(Op0, m_And(m_Or(m_Specific(Op1), m_Value(C)), m_Value(A))))
|
|
|
|
return BinaryOperator::CreateOr(Op1, Builder->CreateAnd(A, C));
|
|
|
|
|
2015-09-09 04:14:13 +08:00
|
|
|
if (Instruction *DeMorgan = matchDeMorgansLaws(I, Builder))
|
|
|
|
return DeMorgan;
|
2010-01-05 15:50:36 +08:00
|
|
|
|
2011-02-20 21:23:43 +08:00
|
|
|
// Canonicalize xor to the RHS.
|
2012-03-16 08:52:42 +08:00
|
|
|
bool SwappedForXor = false;
|
|
|
|
if (match(Op0, m_Xor(m_Value(), m_Value()))) {
|
2011-02-20 21:23:43 +08:00
|
|
|
std::swap(Op0, Op1);
|
2012-03-16 08:52:42 +08:00
|
|
|
SwappedForXor = true;
|
|
|
|
}
|
2011-02-20 21:23:43 +08:00
|
|
|
|
|
|
|
// A | ( A ^ B) -> A | B
|
|
|
|
// A | (~A ^ B) -> A | ~B
|
2012-04-27 07:29:14 +08:00
|
|
|
// (A & B) | (A ^ B)
|
2011-02-20 21:23:43 +08:00
|
|
|
if (match(Op1, m_Xor(m_Value(A), m_Value(B)))) {
|
|
|
|
if (Op0 == A || Op0 == B)
|
|
|
|
return BinaryOperator::CreateOr(A, B);
|
|
|
|
|
2012-04-27 07:29:14 +08:00
|
|
|
if (match(Op0, m_And(m_Specific(A), m_Specific(B))) ||
|
|
|
|
match(Op0, m_And(m_Specific(B), m_Specific(A))))
|
|
|
|
return BinaryOperator::CreateOr(A, B);
|
|
|
|
|
2011-02-20 21:23:43 +08:00
|
|
|
if (Op1->hasOneUse() && match(A, m_Not(m_Specific(Op0)))) {
|
|
|
|
Value *Not = Builder->CreateNot(B, B->getName()+".not");
|
|
|
|
return BinaryOperator::CreateOr(Not, Op0);
|
|
|
|
}
|
|
|
|
if (Op1->hasOneUse() && match(B, m_Not(m_Specific(Op0)))) {
|
|
|
|
Value *Not = Builder->CreateNot(A, A->getName()+".not");
|
|
|
|
return BinaryOperator::CreateOr(Not, Op0);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// A | ~(A | B) -> A | ~B
|
|
|
|
// A | ~(A ^ B) -> A | ~B
|
|
|
|
if (match(Op1, m_Not(m_Value(A))))
|
|
|
|
if (BinaryOperator *B = dyn_cast<BinaryOperator>(A))
|
2011-02-20 23:20:01 +08:00
|
|
|
if ((Op0 == B->getOperand(0) || Op0 == B->getOperand(1)) &&
|
|
|
|
Op1->hasOneUse() && (B->getOpcode() == Instruction::Or ||
|
|
|
|
B->getOpcode() == Instruction::Xor)) {
|
|
|
|
Value *NotOp = Op0 == B->getOperand(0) ? B->getOperand(1) :
|
|
|
|
B->getOperand(0);
|
|
|
|
Value *Not = Builder->CreateNot(NotOp, NotOp->getName()+".not");
|
|
|
|
return BinaryOperator::CreateOr(Not, Op0);
|
|
|
|
}
|
2011-02-20 21:23:43 +08:00
|
|
|
|
2014-08-01 12:41:43 +08:00
|
|
|
// (A & B) | ((~A) ^ B) -> (~A ^ B)
|
|
|
|
if (match(Op0, m_And(m_Value(A), m_Value(B))) &&
|
|
|
|
match(Op1, m_Xor(m_Not(m_Specific(A)), m_Specific(B))))
|
|
|
|
return BinaryOperator::CreateXor(Builder->CreateNot(A), B);
|
|
|
|
|
|
|
|
// ((~A) ^ B) | (A & B) -> (~A ^ B)
|
|
|
|
if (match(Op0, m_Xor(m_Not(m_Value(A)), m_Value(B))) &&
|
|
|
|
match(Op1, m_And(m_Specific(A), m_Specific(B))))
|
|
|
|
return BinaryOperator::CreateXor(Builder->CreateNot(A), B);
|
|
|
|
|
2012-03-16 08:52:42 +08:00
|
|
|
if (SwappedForXor)
|
|
|
|
std::swap(Op0, Op1);
|
|
|
|
|
2014-11-29 03:58:29 +08:00
|
|
|
{
|
|
|
|
ICmpInst *LHS = dyn_cast<ICmpInst>(Op0);
|
|
|
|
ICmpInst *RHS = dyn_cast<ICmpInst>(Op1);
|
|
|
|
if (LHS && RHS)
|
Make use of @llvm.assume in ValueTracking (computeKnownBits, etc.)
This change, which allows @llvm.assume to be used from within computeKnownBits
(and other associated functions in ValueTracking), adds some (optional)
parameters to computeKnownBits and friends. These functions now (optionally)
take a "context" instruction pointer, an AssumptionTracker pointer, and also a
DomTree pointer, and most of the changes are just to pass this new information
when it is easily available from InstSimplify, InstCombine, etc.
As explained below, the significant conceptual change is that known properties
of a value might depend on the control-flow location of the use (because we
care that the @llvm.assume dominates the use because assumptions have
control-flow dependencies). This means that, when we ask if bits are known in a
value, we might get different answers for different uses.
The significant changes are all in ValueTracking. Two main changes: First, as
with the rest of the code, new parameters need to be passed around. To make
this easier, I grouped them into a structure, and I made internal static
versions of the relevant functions that take this structure as a parameter. The
new code does as you might expect, it looks for @llvm.assume calls that make
use of the value we're trying to learn something about (often indirectly),
attempts to pattern match that expression, and uses the result if successful.
By making use of the AssumptionTracker, the process of finding @llvm.assume
calls is not expensive.
Part of the structure being passed around inside ValueTracking is a set of
already-considered @llvm.assume calls. This is to prevent a query using, for
example, the assume(a == b), to recurse on itself. The context and DT params
are used to find applicable assumptions. An assumption needs to dominate the
context instruction, or come after it deterministically. In this latter case we
only handle the specific case where both the assumption and the context
instruction are in the same block, and we need to exclude assumptions from
being used to simplify their own ephemeral values (those which contribute only
to the assumption) because otherwise the assumption would prove its feeding
comparison trivial and would be removed.
This commit adds the plumbing and the logic for a simple masked-bit propagation
(just enough to write a regression test). Future commits add more patterns
(and, correspondingly, more regression tests).
llvm-svn: 217342
2014-09-08 02:57:58 +08:00
|
|
|
if (Value *Res = FoldOrOfICmps(LHS, RHS, &I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, Res);
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2014-11-29 03:58:29 +08:00
|
|
|
// TODO: Make this recursive; it's a little tricky because an arbitrary
|
|
|
|
// number of 'or' instructions might have to be created.
|
|
|
|
Value *X, *Y;
|
|
|
|
if (LHS && match(Op1, m_OneUse(m_Or(m_Value(X), m_Value(Y))))) {
|
|
|
|
if (auto *Cmp = dyn_cast<ICmpInst>(X))
|
|
|
|
if (Value *Res = FoldOrOfICmps(LHS, Cmp, &I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, Builder->CreateOr(Res, Y));
|
2014-11-29 03:58:29 +08:00
|
|
|
if (auto *Cmp = dyn_cast<ICmpInst>(Y))
|
|
|
|
if (Value *Res = FoldOrOfICmps(LHS, Cmp, &I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, Builder->CreateOr(Res, X));
|
2014-11-29 03:58:29 +08:00
|
|
|
}
|
|
|
|
if (RHS && match(Op0, m_OneUse(m_Or(m_Value(X), m_Value(Y))))) {
|
|
|
|
if (auto *Cmp = dyn_cast<ICmpInst>(X))
|
|
|
|
if (Value *Res = FoldOrOfICmps(Cmp, RHS, &I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, Builder->CreateOr(Res, Y));
|
2014-11-29 03:58:29 +08:00
|
|
|
if (auto *Cmp = dyn_cast<ICmpInst>(Y))
|
|
|
|
if (Value *Res = FoldOrOfICmps(Cmp, RHS, &I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, Builder->CreateOr(Res, X));
|
2014-11-29 03:58:29 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2010-02-11 14:26:33 +08:00
|
|
|
// (fcmp uno x, c) | (fcmp uno y, c) -> (fcmp uno x, y)
|
|
|
|
if (FCmpInst *LHS = dyn_cast<FCmpInst>(I.getOperand(0)))
|
|
|
|
if (FCmpInst *RHS = dyn_cast<FCmpInst>(I.getOperand(1)))
|
2010-03-05 16:46:26 +08:00
|
|
|
if (Value *Res = FoldOrOfFCmps(LHS, RHS))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, Res);
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2016-02-24 07:56:23 +08:00
|
|
|
if (Instruction *CastedOr = foldCastedBitwiseLogic(I))
|
|
|
|
return CastedOr;
|
2011-04-15 06:41:27 +08:00
|
|
|
|
|
|
|
// or(sext(A), B) -> A ? -1 : B where A is an i1
|
|
|
|
// or(A, sext(B)) -> B ? -1 : A where B is an i1
|
|
|
|
if (match(Op0, m_SExt(m_Value(A))) && A->getType()->isIntegerTy(1))
|
|
|
|
return SelectInst::Create(A, ConstantInt::getSigned(I.getType(), -1), Op1);
|
|
|
|
if (match(Op1, m_SExt(m_Value(A))) && A->getType()->isIntegerTy(1))
|
|
|
|
return SelectInst::Create(A, ConstantInt::getSigned(I.getType(), -1), Op0);
|
|
|
|
|
2010-09-14 01:59:27 +08:00
|
|
|
// Note: If we've gotten to the point of visiting the outer OR, then the
|
|
|
|
// inner one couldn't be simplified. If it was a constant, then it won't
|
|
|
|
// be simplified by a later pass either, so we try swapping the inner/outer
|
|
|
|
// ORs in the hopes that we'll be able to simplify it this way.
|
|
|
|
// (X|C) | V --> (X|V) | C
|
|
|
|
if (Op0->hasOneUse() && !isa<ConstantInt>(Op1) &&
|
|
|
|
match(Op0, m_Or(m_Value(A), m_ConstantInt(C1)))) {
|
|
|
|
Value *Inner = Builder->CreateOr(A, Op1);
|
|
|
|
Inner->takeName(Op0);
|
|
|
|
return BinaryOperator::CreateOr(Inner, C1);
|
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2013-02-17 07:41:36 +08:00
|
|
|
// Change (or (bool?A:B),(bool?C:D)) --> (bool?(or A,C):(or B,D))
|
|
|
|
// Since this OR statement hasn't been optimized further yet, we hope
|
|
|
|
// that this transformation will allow the new ORs to be optimized.
|
|
|
|
{
|
2014-04-25 13:29:35 +08:00
|
|
|
Value *X = nullptr, *Y = nullptr;
|
2013-02-17 07:41:36 +08:00
|
|
|
if (Op0->hasOneUse() && Op1->hasOneUse() &&
|
|
|
|
match(Op0, m_Select(m_Value(X), m_Value(A), m_Value(B))) &&
|
|
|
|
match(Op1, m_Select(m_Value(Y), m_Value(C), m_Value(D))) && X == Y) {
|
|
|
|
Value *orTrue = Builder->CreateOr(A, C);
|
|
|
|
Value *orFalse = Builder->CreateOr(B, D);
|
|
|
|
return SelectInst::Create(X, orTrue, orFalse);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-04-25 13:29:35 +08:00
|
|
|
return Changed ? &I : nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
Instruction *InstCombiner::visitXor(BinaryOperator &I) {
|
2010-11-13 23:10:37 +08:00
|
|
|
bool Changed = SimplifyAssociativeOrCommutative(I);
|
2010-01-05 15:50:36 +08:00
|
|
|
Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
|
|
|
|
|
2014-05-11 16:46:12 +08:00
|
|
|
if (Value *V = SimplifyVectorOp(I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, V);
|
2014-05-11 16:46:12 +08:00
|
|
|
|
2015-01-04 20:03:27 +08:00
|
|
|
if (Value *V = SimplifyXorInst(Op0, Op1, DL, TLI, DT, AC))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, V);
|
2010-01-05 15:50:36 +08:00
|
|
|
|
2010-12-22 21:36:08 +08:00
|
|
|
// (A&B)^(A&C) -> A&(B^C) etc
|
|
|
|
if (Value *V = SimplifyUsingDistributiveLaws(I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, V);
|
2010-11-23 22:23:47 +08:00
|
|
|
|
2012-12-20 15:09:41 +08:00
|
|
|
// See if we can simplify any instructions used by the instruction whose sole
|
2010-01-05 15:50:36 +08:00
|
|
|
// purpose is to compute bits we don't care about.
|
|
|
|
if (SimplifyDemandedInstructionBits(I))
|
|
|
|
return &I;
|
|
|
|
|
2014-12-04 17:44:01 +08:00
|
|
|
if (Value *V = SimplifyBSwap(I))
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I, V);
|
2014-12-04 17:44:01 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// Is this a ~ operation?
|
|
|
|
if (Value *NotOp = dyn_castNotVal(&I)) {
|
|
|
|
if (BinaryOperator *Op0I = dyn_cast<BinaryOperator>(NotOp)) {
|
2012-12-20 15:09:41 +08:00
|
|
|
if (Op0I->getOpcode() == Instruction::And ||
|
2010-01-05 15:50:36 +08:00
|
|
|
Op0I->getOpcode() == Instruction::Or) {
|
|
|
|
// ~(~X & Y) --> (X | ~Y) - De Morgan's Law
|
|
|
|
// ~(~X | Y) === (X & ~Y) - De Morgan's Law
|
|
|
|
if (dyn_castNotVal(Op0I->getOperand(1)))
|
|
|
|
Op0I->swapOperands();
|
|
|
|
if (Value *Op0NotVal = dyn_castNotVal(Op0I->getOperand(0))) {
|
|
|
|
Value *NotY =
|
|
|
|
Builder->CreateNot(Op0I->getOperand(1),
|
|
|
|
Op0I->getOperand(1)->getName()+".not");
|
|
|
|
if (Op0I->getOpcode() == Instruction::And)
|
|
|
|
return BinaryOperator::CreateOr(Op0NotVal, NotY);
|
|
|
|
return BinaryOperator::CreateAnd(Op0NotVal, NotY);
|
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// ~(X & Y) --> (~X | ~Y) - De Morgan's Law
|
|
|
|
// ~(X | Y) === (~X & ~Y) - De Morgan's Law
|
2015-02-24 08:08:41 +08:00
|
|
|
if (IsFreeToInvert(Op0I->getOperand(0),
|
|
|
|
Op0I->getOperand(0)->hasOneUse()) &&
|
|
|
|
IsFreeToInvert(Op0I->getOperand(1),
|
|
|
|
Op0I->getOperand(1)->hasOneUse())) {
|
2010-01-05 15:50:36 +08:00
|
|
|
Value *NotX =
|
|
|
|
Builder->CreateNot(Op0I->getOperand(0), "notlhs");
|
|
|
|
Value *NotY =
|
|
|
|
Builder->CreateNot(Op0I->getOperand(1), "notrhs");
|
|
|
|
if (Op0I->getOpcode() == Instruction::And)
|
|
|
|
return BinaryOperator::CreateOr(NotX, NotY);
|
|
|
|
return BinaryOperator::CreateAnd(NotX, NotY);
|
|
|
|
}
|
2010-01-20 02:16:19 +08:00
|
|
|
|
|
|
|
} else if (Op0I->getOpcode() == Instruction::AShr) {
|
|
|
|
// ~(~X >>s Y) --> (X >>s Y)
|
|
|
|
if (Value *Op0NotVal = dyn_castNotVal(Op0I->getOperand(0)))
|
|
|
|
return BinaryOperator::CreateAShr(Op0NotVal, Op0I->getOperand(1));
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2015-02-13 04:26:46 +08:00
|
|
|
if (Constant *RHS = dyn_cast<Constant>(Op1)) {
|
|
|
|
if (RHS->isAllOnesValue() && Op0->hasOneUse())
|
2010-01-05 15:50:36 +08:00
|
|
|
// xor (cmp A, B), true = not (cmp A, B) = !cmp A, B
|
2010-04-09 22:53:59 +08:00
|
|
|
if (CmpInst *CI = dyn_cast<CmpInst>(Op0))
|
|
|
|
return CmpInst::Create(CI->getOpcode(),
|
|
|
|
CI->getInversePredicate(),
|
|
|
|
CI->getOperand(0), CI->getOperand(1));
|
2015-02-13 04:26:46 +08:00
|
|
|
}
|
2010-01-05 15:50:36 +08:00
|
|
|
|
2015-02-13 04:26:46 +08:00
|
|
|
if (ConstantInt *RHS = dyn_cast<ConstantInt>(Op1)) {
|
2010-01-05 15:50:36 +08:00
|
|
|
// fold (xor(zext(cmp)), 1) and (xor(sext(cmp)), -1) to ext(!cmp).
|
|
|
|
if (CastInst *Op0C = dyn_cast<CastInst>(Op0)) {
|
|
|
|
if (CmpInst *CI = dyn_cast<CmpInst>(Op0C->getOperand(0))) {
|
|
|
|
if (CI->hasOneUse() && Op0C->hasOneUse()) {
|
|
|
|
Instruction::CastOps Opcode = Op0C->getOpcode();
|
|
|
|
if ((Opcode == Instruction::ZExt || Opcode == Instruction::SExt) &&
|
2013-06-06 08:37:23 +08:00
|
|
|
(RHS == ConstantExpr::getCast(Opcode, Builder->getTrue(),
|
2010-01-05 15:50:36 +08:00
|
|
|
Op0C->getDestTy()))) {
|
|
|
|
CI->setPredicate(CI->getInversePredicate());
|
|
|
|
return CastInst::Create(Opcode, CI, Op0C->getType());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (BinaryOperator *Op0I = dyn_cast<BinaryOperator>(Op0)) {
|
|
|
|
// ~(c-X) == X-c-1 == X+(-c-1)
|
|
|
|
if (Op0I->getOpcode() == Instruction::Sub && RHS->isAllOnesValue())
|
|
|
|
if (Constant *Op0I0C = dyn_cast<Constant>(Op0I->getOperand(0))) {
|
|
|
|
Constant *NegOp0I0C = ConstantExpr::getNeg(Op0I0C);
|
|
|
|
Constant *ConstantRHS = ConstantExpr::getSub(NegOp0I0C,
|
|
|
|
ConstantInt::get(I.getType(), 1));
|
|
|
|
return BinaryOperator::CreateAdd(Op0I->getOperand(1), ConstantRHS);
|
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (ConstantInt *Op0CI = dyn_cast<ConstantInt>(Op0I->getOperand(1))) {
|
|
|
|
if (Op0I->getOpcode() == Instruction::Add) {
|
|
|
|
// ~(X-c) --> (-c-1)-X
|
|
|
|
if (RHS->isAllOnesValue()) {
|
|
|
|
Constant *NegOp0CI = ConstantExpr::getNeg(Op0CI);
|
|
|
|
return BinaryOperator::CreateSub(
|
|
|
|
ConstantExpr::getSub(NegOp0CI,
|
|
|
|
ConstantInt::get(I.getType(), 1)),
|
|
|
|
Op0I->getOperand(0));
|
|
|
|
} else if (RHS->getValue().isSignBit()) {
|
|
|
|
// (X + C) ^ signbit -> (X + C + signbit)
|
2013-06-06 08:37:23 +08:00
|
|
|
Constant *C = Builder->getInt(RHS->getValue() + Op0CI->getValue());
|
2010-01-05 15:50:36 +08:00
|
|
|
return BinaryOperator::CreateAdd(Op0I->getOperand(0), C);
|
|
|
|
|
|
|
|
}
|
|
|
|
} else if (Op0I->getOpcode() == Instruction::Or) {
|
2012-09-27 18:14:43 +08:00
|
|
|
// (X|C1)^C2 -> X^(C1|C2) iff X&~C1 == 0
|
Make use of @llvm.assume in ValueTracking (computeKnownBits, etc.)
This change, which allows @llvm.assume to be used from within computeKnownBits
(and other associated functions in ValueTracking), adds some (optional)
parameters to computeKnownBits and friends. These functions now (optionally)
take a "context" instruction pointer, an AssumptionTracker pointer, and also a
DomTree pointer, and most of the changes are just to pass this new information
when it is easily available from InstSimplify, InstCombine, etc.
As explained below, the significant conceptual change is that known properties
of a value might depend on the control-flow location of the use (because we
care that the @llvm.assume dominates the use because assumptions have
control-flow dependencies). This means that, when we ask if bits are known in a
value, we might get different answers for different uses.
The significant changes are all in ValueTracking. Two main changes: First, as
with the rest of the code, new parameters need to be passed around. To make
this easier, I grouped them into a structure, and I made internal static
versions of the relevant functions that take this structure as a parameter. The
new code does as you might expect, it looks for @llvm.assume calls that make
use of the value we're trying to learn something about (often indirectly),
attempts to pattern match that expression, and uses the result if successful.
By making use of the AssumptionTracker, the process of finding @llvm.assume
calls is not expensive.
Part of the structure being passed around inside ValueTracking is a set of
already-considered @llvm.assume calls. This is to prevent a query using, for
example, the assume(a == b), to recurse on itself. The context and DT params
are used to find applicable assumptions. An assumption needs to dominate the
context instruction, or come after it deterministically. In this latter case we
only handle the specific case where both the assumption and the context
instruction are in the same block, and we need to exclude assumptions from
being used to simplify their own ephemeral values (those which contribute only
to the assumption) because otherwise the assumption would prove its feeding
comparison trivial and would be removed.
This commit adds the plumbing and the logic for a simple masked-bit propagation
(just enough to write a regression test). Future commits add more patterns
(and, correspondingly, more regression tests).
llvm-svn: 217342
2014-09-08 02:57:58 +08:00
|
|
|
if (MaskedValueIsZero(Op0I->getOperand(0), Op0CI->getValue(),
|
|
|
|
0, &I)) {
|
2010-01-05 15:50:36 +08:00
|
|
|
Constant *NewRHS = ConstantExpr::getOr(Op0CI, RHS);
|
|
|
|
// Anything in both C1 and C2 is known to be zero, remove it from
|
|
|
|
// NewRHS.
|
|
|
|
Constant *CommonBits = ConstantExpr::getAnd(Op0CI, RHS);
|
2012-12-20 15:09:41 +08:00
|
|
|
NewRHS = ConstantExpr::getAnd(NewRHS,
|
2010-01-05 15:50:36 +08:00
|
|
|
ConstantExpr::getNot(CommonBits));
|
|
|
|
Worklist.Add(Op0I);
|
|
|
|
I.setOperand(0, Op0I->getOperand(0));
|
|
|
|
I.setOperand(1, NewRHS);
|
|
|
|
return &I;
|
|
|
|
}
|
2012-11-27 05:44:25 +08:00
|
|
|
} else if (Op0I->getOpcode() == Instruction::LShr) {
|
|
|
|
// ((X^C1) >> C2) ^ C3 -> (X>>C2) ^ ((C1>>C2)^C3)
|
|
|
|
// E1 = "X ^ C1"
|
2012-12-20 15:09:41 +08:00
|
|
|
BinaryOperator *E1;
|
2012-11-27 05:44:25 +08:00
|
|
|
ConstantInt *C1;
|
|
|
|
if (Op0I->hasOneUse() &&
|
|
|
|
(E1 = dyn_cast<BinaryOperator>(Op0I->getOperand(0))) &&
|
|
|
|
E1->getOpcode() == Instruction::Xor &&
|
|
|
|
(C1 = dyn_cast<ConstantInt>(E1->getOperand(1)))) {
|
|
|
|
// fold (C1 >> C2) ^ C3
|
|
|
|
ConstantInt *C2 = Op0CI, *C3 = RHS;
|
|
|
|
APInt FoldConst = C1->getValue().lshr(C2->getValue());
|
|
|
|
FoldConst ^= C3->getValue();
|
|
|
|
// Prepare the two operands.
|
|
|
|
Value *Opnd0 = Builder->CreateLShr(E1->getOperand(0), C2);
|
|
|
|
Opnd0->takeName(Op0I);
|
|
|
|
cast<Instruction>(Opnd0)->setDebugLoc(I.getDebugLoc());
|
|
|
|
Value *FoldVal = ConstantInt::get(Opnd0->getType(), FoldConst);
|
|
|
|
|
|
|
|
return BinaryOperator::CreateXor(Opnd0, FoldVal);
|
|
|
|
}
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Try to fold constant and into select arguments.
|
|
|
|
if (SelectInst *SI = dyn_cast<SelectInst>(Op0))
|
|
|
|
if (Instruction *R = FoldOpIntoSelect(I, SI))
|
|
|
|
return R;
|
|
|
|
if (isa<PHINode>(Op0))
|
|
|
|
if (Instruction *NV = FoldOpIntoPhi(I))
|
|
|
|
return NV;
|
|
|
|
}
|
|
|
|
|
|
|
|
BinaryOperator *Op1I = dyn_cast<BinaryOperator>(Op1);
|
|
|
|
if (Op1I) {
|
|
|
|
Value *A, *B;
|
|
|
|
if (match(Op1I, m_Or(m_Value(A), m_Value(B)))) {
|
|
|
|
if (A == Op0) { // B^(B|A) == (A|B)^B
|
|
|
|
Op1I->swapOperands();
|
|
|
|
I.swapOperands();
|
|
|
|
std::swap(Op0, Op1);
|
|
|
|
} else if (B == Op0) { // B^(A|B) == (A|B)^B
|
|
|
|
I.swapOperands(); // Simplified below.
|
|
|
|
std::swap(Op0, Op1);
|
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
} else if (match(Op1I, m_And(m_Value(A), m_Value(B))) &&
|
2010-01-05 15:50:36 +08:00
|
|
|
Op1I->hasOneUse()){
|
|
|
|
if (A == Op0) { // A^(A&B) -> A^(B&A)
|
|
|
|
Op1I->swapOperands();
|
|
|
|
std::swap(A, B);
|
|
|
|
}
|
|
|
|
if (B == Op0) { // A^(B&A) -> (B&A)^A
|
|
|
|
I.swapOperands(); // Simplified below.
|
|
|
|
std::swap(Op0, Op1);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
BinaryOperator *Op0I = dyn_cast<BinaryOperator>(Op0);
|
|
|
|
if (Op0I) {
|
|
|
|
Value *A, *B;
|
|
|
|
if (match(Op0I, m_Or(m_Value(A), m_Value(B))) &&
|
|
|
|
Op0I->hasOneUse()) {
|
|
|
|
if (A == Op1) // (B|A)^B == (A|B)^B
|
|
|
|
std::swap(A, B);
|
|
|
|
if (B == Op1) // (A|B)^B == A & ~B
|
2011-09-28 04:39:19 +08:00
|
|
|
return BinaryOperator::CreateAnd(A, Builder->CreateNot(Op1));
|
2012-12-20 15:09:41 +08:00
|
|
|
} else if (match(Op0I, m_And(m_Value(A), m_Value(B))) &&
|
2010-01-05 15:50:36 +08:00
|
|
|
Op0I->hasOneUse()){
|
|
|
|
if (A == Op1) // (A&B)^A -> (B&A)^A
|
|
|
|
std::swap(A, B);
|
|
|
|
if (B == Op1 && // (B&A)^A == ~B & A
|
|
|
|
!isa<ConstantInt>(Op1)) { // Canonical form is (B&C)^C
|
2011-09-28 04:39:19 +08:00
|
|
|
return BinaryOperator::CreateAnd(Builder->CreateNot(A), Op1);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2012-12-20 15:09:41 +08:00
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
if (Op0I && Op1I) {
|
|
|
|
Value *A, *B, *C, *D;
|
|
|
|
// (A & B)^(A | B) -> A ^ B
|
|
|
|
if (match(Op0I, m_And(m_Value(A), m_Value(B))) &&
|
|
|
|
match(Op1I, m_Or(m_Value(C), m_Value(D)))) {
|
2012-12-20 15:09:41 +08:00
|
|
|
if ((A == C && B == D) || (A == D && B == C))
|
2010-01-05 15:50:36 +08:00
|
|
|
return BinaryOperator::CreateXor(A, B);
|
|
|
|
}
|
|
|
|
// (A | B)^(A & B) -> A ^ B
|
|
|
|
if (match(Op0I, m_Or(m_Value(A), m_Value(B))) &&
|
|
|
|
match(Op1I, m_And(m_Value(C), m_Value(D)))) {
|
2012-12-20 15:09:41 +08:00
|
|
|
if ((A == C && B == D) || (A == D && B == C))
|
2010-01-05 15:50:36 +08:00
|
|
|
return BinaryOperator::CreateXor(A, B);
|
|
|
|
}
|
2014-08-14 14:46:25 +08:00
|
|
|
// (A | ~B) ^ (~A | B) -> A ^ B
|
|
|
|
if (match(Op0I, m_Or(m_Value(A), m_Not(m_Value(B)))) &&
|
|
|
|
match(Op1I, m_Or(m_Not(m_Specific(A)), m_Specific(B)))) {
|
|
|
|
return BinaryOperator::CreateXor(A, B);
|
|
|
|
}
|
|
|
|
// (~A | B) ^ (A | ~B) -> A ^ B
|
|
|
|
if (match(Op0I, m_Or(m_Not(m_Value(A)), m_Value(B))) &&
|
|
|
|
match(Op1I, m_Or(m_Specific(A), m_Not(m_Specific(B))))) {
|
|
|
|
return BinaryOperator::CreateXor(A, B);
|
|
|
|
}
|
2014-08-19 16:19:19 +08:00
|
|
|
// (A & ~B) ^ (~A & B) -> A ^ B
|
|
|
|
if (match(Op0I, m_And(m_Value(A), m_Not(m_Value(B)))) &&
|
|
|
|
match(Op1I, m_And(m_Not(m_Specific(A)), m_Specific(B)))) {
|
|
|
|
return BinaryOperator::CreateXor(A, B);
|
|
|
|
}
|
|
|
|
// (~A & B) ^ (A & ~B) -> A ^ B
|
|
|
|
if (match(Op0I, m_And(m_Not(m_Value(A)), m_Value(B))) &&
|
|
|
|
match(Op1I, m_And(m_Specific(A), m_Not(m_Specific(B))))) {
|
|
|
|
return BinaryOperator::CreateXor(A, B);
|
|
|
|
}
|
2014-09-05 14:09:24 +08:00
|
|
|
// (A ^ C)^(A | B) -> ((~A) & B) ^ C
|
|
|
|
if (match(Op0I, m_Xor(m_Value(D), m_Value(C))) &&
|
|
|
|
match(Op1I, m_Or(m_Value(A), m_Value(B)))) {
|
|
|
|
if (D == A)
|
|
|
|
return BinaryOperator::CreateXor(
|
|
|
|
Builder->CreateAnd(Builder->CreateNot(A), B), C);
|
|
|
|
if (D == B)
|
|
|
|
return BinaryOperator::CreateXor(
|
|
|
|
Builder->CreateAnd(Builder->CreateNot(B), A), C);
|
|
|
|
}
|
|
|
|
// (A | B)^(A ^ C) -> ((~A) & B) ^ C
|
2014-08-13 13:13:14 +08:00
|
|
|
if (match(Op0I, m_Or(m_Value(A), m_Value(B))) &&
|
2014-09-05 14:09:24 +08:00
|
|
|
match(Op1I, m_Xor(m_Value(D), m_Value(C)))) {
|
|
|
|
if (D == A)
|
|
|
|
return BinaryOperator::CreateXor(
|
|
|
|
Builder->CreateAnd(Builder->CreateNot(A), B), C);
|
|
|
|
if (D == B)
|
|
|
|
return BinaryOperator::CreateXor(
|
|
|
|
Builder->CreateAnd(Builder->CreateNot(B), A), C);
|
2014-08-13 13:13:14 +08:00
|
|
|
}
|
2014-07-23 02:30:54 +08:00
|
|
|
// (A & B) ^ (A ^ B) -> (A | B)
|
|
|
|
if (match(Op0I, m_And(m_Value(A), m_Value(B))) &&
|
|
|
|
match(Op1I, m_Xor(m_Specific(A), m_Specific(B))))
|
|
|
|
return BinaryOperator::CreateOr(A, B);
|
|
|
|
// (A ^ B) ^ (A & B) -> (A | B)
|
|
|
|
if (match(Op0I, m_Xor(m_Value(A), m_Value(B))) &&
|
|
|
|
match(Op1I, m_And(m_Specific(A), m_Specific(B))))
|
|
|
|
return BinaryOperator::CreateOr(A, B);
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
2010-11-23 22:23:47 +08:00
|
|
|
|
2014-07-22 23:37:39 +08:00
|
|
|
Value *A = nullptr, *B = nullptr;
|
2014-08-01 13:07:20 +08:00
|
|
|
// (A & ~B) ^ (~A) -> ~(A & B)
|
|
|
|
if (match(Op0, m_And(m_Value(A), m_Not(m_Value(B)))) &&
|
|
|
|
match(Op1, m_Not(m_Specific(A))))
|
|
|
|
return BinaryOperator::CreateNot(Builder->CreateAnd(A, B));
|
|
|
|
|
2010-01-05 15:50:36 +08:00
|
|
|
// (icmp1 A, B) ^ (icmp2 A, B) --> (icmp3 A, B)
|
|
|
|
if (ICmpInst *RHS = dyn_cast<ICmpInst>(I.getOperand(1)))
|
|
|
|
if (ICmpInst *LHS = dyn_cast<ICmpInst>(I.getOperand(0)))
|
|
|
|
if (PredicatesFoldable(LHS->getPredicate(), RHS->getPredicate())) {
|
|
|
|
if (LHS->getOperand(0) == RHS->getOperand(1) &&
|
|
|
|
LHS->getOperand(1) == RHS->getOperand(0))
|
|
|
|
LHS->swapOperands();
|
|
|
|
if (LHS->getOperand(0) == RHS->getOperand(0) &&
|
|
|
|
LHS->getOperand(1) == RHS->getOperand(1)) {
|
|
|
|
Value *Op0 = LHS->getOperand(0), *Op1 = LHS->getOperand(1);
|
|
|
|
unsigned Code = getICmpCode(LHS) ^ getICmpCode(RHS);
|
|
|
|
bool isSigned = LHS->isSigned() || RHS->isSigned();
|
2016-02-02 06:23:39 +08:00
|
|
|
return replaceInstUsesWith(I,
|
2011-12-17 09:20:32 +08:00
|
|
|
getNewICmpValue(isSigned, Code, Op0, Op1,
|
|
|
|
Builder));
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-02-25 01:00:34 +08:00
|
|
|
if (Instruction *CastedXor = foldCastedBitwiseLogic(I))
|
|
|
|
return CastedXor;
|
2010-01-05 15:50:36 +08:00
|
|
|
|
2014-04-25 13:29:35 +08:00
|
|
|
return Changed ? &I : nullptr;
|
2010-01-05 15:50:36 +08:00
|
|
|
}
|