llvm-project/llvm/lib/CodeGen/GlobalISel/IRTranslator.cpp

//===- llvm/CodeGen/GlobalISel/IRTranslator.cpp - IRTranslator ---*- C++ -*-==//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
/// \file
/// This file implements the IRTranslator class.
//===----------------------------------------------------------------------===//

#include "llvm/CodeGen/GlobalISel/IRTranslator.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/ADT/ScopeExit.h"
#include "llvm/ADT/SmallSet.h"
#include "llvm/ADT/SmallVector.h"
#include "llvm/Analysis/OptimizationDiagnosticInfo.h"
#include "llvm/CodeGen/Analysis.h"
#include "llvm/CodeGen/GlobalISel/CallLowering.h"
#include "llvm/CodeGen/LowLevelType.h"
#include "llvm/CodeGen/MachineBasicBlock.h"
#include "llvm/CodeGen/MachineFrameInfo.h"
#include "llvm/CodeGen/MachineFunction.h"
#include "llvm/CodeGen/MachineInstrBuilder.h"
#include "llvm/CodeGen/MachineMemOperand.h"
#include "llvm/CodeGen/MachineOperand.h"
#include "llvm/CodeGen/MachineRegisterInfo.h"
#include "llvm/CodeGen/TargetPassConfig.h"
#include "llvm/IR/BasicBlock.h"
#include "llvm/IR/Constant.h"
#include "llvm/IR/Constants.h"
#include "llvm/IR/DataLayout.h"
#include "llvm/IR/DebugInfo.h"
#include "llvm/IR/DerivedTypes.h"
#include "llvm/IR/Function.h"
#include "llvm/IR/GetElementPtrTypeIterator.h"
#include "llvm/IR/InlineAsm.h"
#include "llvm/IR/InstrTypes.h"
#include "llvm/IR/Instructions.h"
#include "llvm/IR/IntrinsicInst.h"
#include "llvm/IR/Intrinsics.h"
#include "llvm/IR/LLVMContext.h"
#include "llvm/IR/Metadata.h"
#include "llvm/IR/Type.h"
#include "llvm/IR/User.h"
#include "llvm/IR/Value.h"
#include "llvm/MC/MCContext.h"
#include "llvm/Pass.h"
#include "llvm/Support/Casting.h"
#include "llvm/Support/CodeGen.h"
#include "llvm/Support/Debug.h"
#include "llvm/Support/ErrorHandling.h"
#include "llvm/Support/LowLevelTypeImpl.h"
#include "llvm/Support/MathExtras.h"
#include "llvm/Support/raw_ostream.h"
#include "llvm/Target/TargetFrameLowering.h"
#include "llvm/Target/TargetIntrinsicInfo.h"
#include "llvm/Target/TargetLowering.h"
#include "llvm/Target/TargetMachine.h"
#include "llvm/Target/TargetRegisterInfo.h"
#include "llvm/Target/TargetSubtargetInfo.h"
#include <algorithm>
#include <cassert>
#include <cstdint>
#include <iterator>
#include <string>
#include <utility>
#include <vector>

#define DEBUG_TYPE "irtranslator"

using namespace llvm;

// Pass identifier; it is handed to the MachineFunctionPass base class by the
// IRTranslator constructor.
char IRTranslator::ID = 0;

// Register the pass under the DEBUG_TYPE name and declare TargetPassConfig as
// a pass it depends on.
INITIALIZE_PASS_BEGIN(IRTranslator, DEBUG_TYPE, "IRTranslator LLVM IR -> MI",
                false, false)
INITIALIZE_PASS_DEPENDENCY(TargetPassConfig)
INITIALIZE_PASS_END(IRTranslator, DEBUG_TYPE, "IRTranslator LLVM IR -> MI",
                false, false)

/// Mark \p MF as having failed instruction selection and report remark \p R.
///
/// When the pass configuration asks GlobalISel to abort on failure, the
/// remark's message is raised as a fatal error; otherwise the remark is
/// emitted through \p ORE.
static void reportTranslationError(MachineFunction &MF,
                                   const TargetPassConfig &TPC,
                                   OptimizationRemarkEmitter &ORE,
                                   OptimizationRemarkMissed &R) {
  MF.getProperties().set(MachineFunctionProperties::Property::FailedISel);

  const bool AbortOnFailure = TPC.isGlobalISelAbortEnabled();

  // Name the function in the message when there is no usable debug location
  // (the diagnostic would otherwise be hard to place) or when the message is
  // about to be raised as a raw error.
  if (AbortOnFailure || !R.getLocation().isValid())
    R << (" (in function: " + MF.getName() + ")").str();

  if (!AbortOnFailure) {
    ORE.emit(R);
    return;
  }
  report_fatal_error(R.getMsg());
}

/// Construct the pass and make sure it is registered with the global
/// PassRegistry.
IRTranslator::IRTranslator() : MachineFunctionPass(ID) {
  PassRegistry &Registry = *PassRegistry::getPassRegistry();
  initializeIRTranslatorPass(Registry);
}

/// Declare the analyses this pass needs: TargetPassConfig is required, and
/// the remaining requirements are whatever MachineFunctionPass adds.
void IRTranslator::getAnalysisUsage(AnalysisUsage &AU) const {
  AU.addRequired<TargetPassConfig>();
  MachineFunctionPass::getAnalysisUsage(AU);
}

unsigned IRTranslator::getOrCreateVReg(const Value &Val) {
  unsigned &ValReg = ValToVReg[&Val];

  if (ValReg)
    return ValReg;

  // Fill ValRegsSequence with the sequence of registers
  // we need to concat together to produce the value.
  assert(Val.getType()->isSized() &&
         "Don't know how to create an empty vreg");
  unsigned VReg =
      MRI->createGenericVirtualRegister(getLLTForType(*Val.getType(), *DL));
  ValReg = VReg;

  if (auto CV = dyn_cast<Constant>(&Val)) {
    bool Success = translate(*CV, VReg);
    if (!Success) {
      OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
                                 MF->getFunction()->getSubprogram(),
                                 &MF->getFunction()->getEntryBlock());
      R << "unable to translate constant: " << ore::NV("Type", Val.getType());
      reportTranslationError(*MF, *TPC, *ORE, R);
      return VReg;
    }
  }

  return VReg;
}

/// Return the frame index of the stack object backing \p AI, creating the
/// stack object the first time \p AI is seen.
///
/// The array size of \p AI must be a ConstantInt (enforced by cast<>). The
/// object size is the allocation size of the element type (so consecutive
/// array elements are correctly spaced) times the array size, computed in 64
/// bits so large allocas are not truncated, and is never less than one byte.
/// The alignment is the alloca's explicit alignment, or the ABI alignment of
/// the allocated type when none is given.
int IRTranslator::getOrCreateFrameIndex(const AllocaInst &AI) {
  auto Known = FrameIndices.find(&AI);
  if (Known != FrameIndices.end())
    return Known->second;

  uint64_t ElementSize = DL->getTypeAllocSize(AI.getAllocatedType());
  uint64_t Size =
      ElementSize * cast<ConstantInt>(AI.getArraySize())->getZExtValue();

  // Always allocate at least one byte.
  Size = std::max<uint64_t>(Size, 1);

  unsigned Alignment = AI.getAlignment();
  if (!Alignment)
    Alignment = DL->getABITypeAlignment(AI.getAllocatedType());

  int &FI = FrameIndices[&AI];
  FI = MF->getFrameInfo().CreateStackObject(Size, Alignment, false, &AI);
  return FI;
}

unsigned IRTranslator::getMemOpAlignment(const Instruction &I) {
  unsigned Alignment = 0;
  Type *ValTy = nullptr;
  if (const StoreInst *SI = dyn_cast<StoreInst>(&I)) {
    Alignment = SI->getAlignment();
    ValTy = SI->getValueOperand()->getType();
  } else if (const LoadInst *LI = dyn_cast<LoadInst>(&I)) {
    Alignment = LI->getAlignment();
    ValTy = LI->getType();
  } else {
    OptimizationRemarkMissed R("gisel-irtranslator", "", &I);
    R << "unable to translate memop: " << ore::NV("Opcode", &I);
    reportTranslationError(*MF, *TPC, *ORE, R);
    return 1;
  }

  return Alignment ? Alignment : DL->getABITypeAlignment(ValTy);
}

/// Return the MachineBasicBlock recorded for \p BB in BBToMBB. Asserts that
/// one has been recorded.
MachineBasicBlock &IRTranslator::getMBB(const BasicBlock &BB) {
  MachineBasicBlock *Found = BBToMBB[&BB];
  assert(Found && "BasicBlock was not encountered before");
  return *Found;
}

/// Append \p NewPred to the list of machine-level predecessors recorded for
/// the IR CFG edge \p Edge. \p NewPred must not be null.
void IRTranslator::addMachineCFGPred(CFGEdge Edge, MachineBasicBlock *NewPred) {
  assert(NewPred && "new predecessor must be a real MachineBasicBlock");
  auto &PredsForEdge = MachinePreds[Edge];
  PredsForEdge.push_back(NewPred);
}

/// Emit the two-operand generic instruction \p Opcode for \p U: one def (the
/// vreg of \p U) and two uses (the vregs of operands 0 and 1). Always
/// succeeds.
bool IRTranslator::translateBinaryOp(unsigned Opcode, const User &U,
                                     MachineIRBuilder &MIRBuilder) {
  // FIXME: handle signed/unsigned wrapping flags.

  // Every value gets a virtual register (created on demand); constants are
  // materialized by getOrCreateVReg as well.
  const unsigned LHSReg = getOrCreateVReg(*U.getOperand(0));
  const unsigned RHSReg = getOrCreateVReg(*U.getOperand(1));
  const unsigned DstReg = getOrCreateVReg(U);

  auto MIB = MIRBuilder.buildInstr(Opcode);
  MIB.addDef(DstReg);
  MIB.addUse(LHSReg);
  MIB.addUse(RHSReg);
  return true;
}

bool IRTranslator::translateFSub(const User &U, MachineIRBuilder &MIRBuilder) {
  // -0.0 - X --> G_FNEG
  if (isa<Constant>(U.getOperand(0)) &&
      U.getOperand(0) == ConstantFP::getZeroValueForNegation(U.getType())) {
    MIRBuilder.buildInstr(TargetOpcode::G_FNEG)
        .addDef(getOrCreateVReg(U))
        .addUse(getOrCreateVReg(*U.getOperand(1)));
    return true;
  }
  return translateBinaryOp(TargetOpcode::G_FSUB, U, MIRBuilder);
}

bool IRTranslator::translateCompare(const User &U,
                                    MachineIRBuilder &MIRBuilder) {
  const CmpInst *CI = dyn_cast<CmpInst>(&U);
  unsigned Op0 = getOrCreateVReg(*U.getOperand(0));
  unsigned Op1 = getOrCreateVReg(*U.getOperand(1));
  unsigned Res = getOrCreateVReg(U);
  CmpInst::Predicate Pred =
      CI ? CI->getPredicate() : static_cast<CmpInst::Predicate>(
                                    cast<ConstantExpr>(U).getPredicate());
  if (CmpInst::isIntPredicate(Pred))
    MIRBuilder.buildICmp(Pred, Res, Op0, Op1);
  else if (Pred == CmpInst::FCMP_FALSE)
    MIRBuilder.buildCopy(
        Res, getOrCreateVReg(*Constant::getNullValue(CI->getType())));
  else if (Pred == CmpInst::FCMP_TRUE)
    MIRBuilder.buildCopy(
        Res, getOrCreateVReg(*Constant::getAllOnesValue(CI->getType())));
  else
    MIRBuilder.buildFCmp(Pred, Res, Op0, Op1);

  return true;
}

bool IRTranslator::translateRet(const User &U, MachineIRBuilder &MIRBuilder) {
  const ReturnInst &RI = cast<ReturnInst>(U);
  const Value *Ret = RI.getReturnValue();
  // The target may mess up with the insertion point, but
  // this is not important as a return is the last instruction
  // of the block anyway.
  return CLI->lowerReturn(MIRBuilder, Ret, !Ret ? 0 : getOrCreateVReg(*Ret));
}

bool IRTranslator::translateBr(const User &U, MachineIRBuilder &MIRBuilder) {
  const BranchInst &BrInst = cast<BranchInst>(U);
  unsigned Succ = 0;
  if (!BrInst.isUnconditional()) {
    // We want a G_BRCOND to the true BB followed by an unconditional branch.
    unsigned Tst = getOrCreateVReg(*BrInst.getCondition());
    const BasicBlock &TrueTgt = *cast<BasicBlock>(BrInst.getSuccessor(Succ++));
    MachineBasicBlock &TrueBB = getMBB(TrueTgt);
    MIRBuilder.buildBrCond(Tst, TrueBB);
  }

  const BasicBlock &BrTgt = *cast<BasicBlock>(BrInst.getSuccessor(Succ));
  MachineBasicBlock &TgtBB = getMBB(BrTgt);
  MachineBasicBlock &CurBB = MIRBuilder.getMBB();

  // If the unconditional target is the layout successor, fallthrough.
  if (!CurBB.isLayoutSuccessor(&TgtBB))
    MIRBuilder.buildBr(TgtBB);

  // Link successors.
  for (const BasicBlock *Succ : BrInst.successors())
    CurBB.addSuccessor(&getMBB(*Succ));
  return true;
}

bool IRTranslator::translateSwitch(const User &U,
                                   MachineIRBuilder &MIRBuilder) {
  // For now, just translate as a chain of conditional branches.
  // FIXME: could we share most of the logic/code in
  // SelectionDAGBuilder::visitSwitch between SelectionDAG and GlobalISel?
  // At first sight, it seems most of the logic in there is independent of
  // SelectionDAG-specifics and a lot of work went in to optimize switch
  // lowering in there.

  const SwitchInst &SwInst = cast<SwitchInst>(U);
  const unsigned SwCondValue = getOrCreateVReg(*SwInst.getCondition());
  const BasicBlock *OrigBB = SwInst.getParent();

  LLT LLTi1 = getLLTForType(*Type::getInt1Ty(U.getContext()), *DL);
  for (auto &CaseIt : SwInst.cases()) {
    const unsigned CaseValueReg = getOrCreateVReg(*CaseIt.getCaseValue());
    const unsigned Tst = MRI->createGenericVirtualRegister(LLTi1);
    MIRBuilder.buildICmp(CmpInst::ICMP_EQ, Tst, CaseValueReg, SwCondValue);
    MachineBasicBlock &CurMBB = MIRBuilder.getMBB();
    const BasicBlock *TrueBB = CaseIt.getCaseSuccessor();
    MachineBasicBlock &TrueMBB = getMBB(*TrueBB);

    MIRBuilder.buildBrCond(Tst, TrueMBB);
    CurMBB.addSuccessor(&TrueMBB);
    addMachineCFGPred({OrigBB, TrueBB}, &CurMBB);

    MachineBasicBlock *FalseMBB =
        MF->CreateMachineBasicBlock(SwInst.getParent());
    // Insert the comparison blocks one after the other.
    MF->insert(std::next(CurMBB.getIterator()), FalseMBB);
    MIRBuilder.buildBr(*FalseMBB);
    CurMBB.addSuccessor(FalseMBB);

    MIRBuilder.setMBB(*FalseMBB);
  }
  // handle default case
  const BasicBlock *DefaultBB = SwInst.getDefaultDest();
  MachineBasicBlock &DefaultMBB = getMBB(*DefaultBB);
  MIRBuilder.buildBr(DefaultMBB);
  MachineBasicBlock &CurMBB = MIRBuilder.getMBB();
  CurMBB.addSuccessor(&DefaultMBB);
  addMachineCFGPred({OrigBB, DefaultBB}, &CurMBB);

  return true;
}

bool IRTranslator::translateIndirectBr(const User &U,
                                       MachineIRBuilder &MIRBuilder) {
  const IndirectBrInst &BrInst = cast<IndirectBrInst>(U);

  const unsigned Tgt = getOrCreateVReg(*BrInst.getAddress());
  MIRBuilder.buildBrIndirect(Tgt);

  // Link successors.
  MachineBasicBlock &CurBB = MIRBuilder.getMBB();
  for (const BasicBlock *Succ : BrInst.successors())
    CurBB.addSuccessor(&getMBB(*Succ));

  return true;
}

bool IRTranslator::translateLoad(const User &U, MachineIRBuilder &MIRBuilder) {
  const LoadInst &LI = cast<LoadInst>(U);

  auto Flags = LI.isVolatile() ? MachineMemOperand::MOVolatile
                               : MachineMemOperand::MONone;
  Flags |= MachineMemOperand::MOLoad;

  unsigned Res = getOrCreateVReg(LI);
  unsigned Addr = getOrCreateVReg(*LI.getPointerOperand());

  MIRBuilder.buildLoad(
      Res, Addr,
      *MF->getMachineMemOperand(MachinePointerInfo(LI.getPointerOperand()),
                                Flags, DL->getTypeStoreSize(LI.getType()),
                                getMemOpAlignment(LI), AAMDNodes(), nullptr,
                                LI.getSynchScope(), LI.getOrdering()));
  return true;
}

bool IRTranslator::translateStore(const User &U, MachineIRBuilder &MIRBuilder) {
  const StoreInst &SI = cast<StoreInst>(U);
  auto Flags = SI.isVolatile() ? MachineMemOperand::MOVolatile
                               : MachineMemOperand::MONone;
  Flags |= MachineMemOperand::MOStore;

  unsigned Val = getOrCreateVReg(*SI.getValueOperand());
  unsigned Addr = getOrCreateVReg(*SI.getPointerOperand());

  MIRBuilder.buildStore(
      Val, Addr,
      *MF->getMachineMemOperand(
          MachinePointerInfo(SI.getPointerOperand()), Flags,
          DL->getTypeStoreSize(SI.getValueOperand()->getType()),
          getMemOpAlignment(SI), AAMDNodes(), nullptr, SI.getSynchScope(),
          SI.getOrdering()));
  return true;
}

bool IRTranslator::translateExtractValue(const User &U,
                                         MachineIRBuilder &MIRBuilder) {
  const Value *Src = U.getOperand(0);
  Type *Int32Ty = Type::getInt32Ty(U.getContext());
  SmallVector<Value *, 1> Indices;

  // If Src is a single element ConstantStruct, translate extractvalue
  // to that element to avoid inserting a cast instruction.
  if (auto CS = dyn_cast<ConstantStruct>(Src))
    if (CS->getNumOperands() == 1) {
      unsigned Res = getOrCreateVReg(*CS->getOperand(0));
      ValToVReg[&U] = Res;
      return true;
    }

  // getIndexedOffsetInType is designed for GEPs, so the first index is the
  // usual array element rather than looking into the actual aggregate.
  Indices.push_back(ConstantInt::get(Int32Ty, 0));

  if (const ExtractValueInst *EVI = dyn_cast<ExtractValueInst>(&U)) {
    for (auto Idx : EVI->indices())
      Indices.push_back(ConstantInt::get(Int32Ty, Idx));
  } else {
    for (unsigned i = 1; i < U.getNumOperands(); ++i)
      Indices.push_back(U.getOperand(i));
  }

  uint64_t Offset = 8 * DL->getIndexedOffsetInType(Src->getType(), Indices);

  unsigned Res = getOrCreateVReg(U);
  MIRBuilder.buildExtract(Res, getOrCreateVReg(*Src), Offset);

  return true;
}

bool IRTranslator::translateInsertValue(const User &U,
                                        MachineIRBuilder &MIRBuilder) {
  const Value *Src = U.getOperand(0);
  Type *Int32Ty = Type::getInt32Ty(U.getContext());
  SmallVector<Value *, 1> Indices;

  // getIndexedOffsetInType is designed for GEPs, so the first index is the
  // usual array element rather than looking into the actual aggregate.
  Indices.push_back(ConstantInt::get(Int32Ty, 0));

  if (const InsertValueInst *IVI = dyn_cast<InsertValueInst>(&U)) {
    for (auto Idx : IVI->indices())
      Indices.push_back(ConstantInt::get(Int32Ty, Idx));
  } else {
    for (unsigned i = 2; i < U.getNumOperands(); ++i)
      Indices.push_back(U.getOperand(i));
  }

  uint64_t Offset = 8 * DL->getIndexedOffsetInType(Src->getType(), Indices);

  unsigned Res = getOrCreateVReg(U);
  unsigned Inserted = getOrCreateVReg(*U.getOperand(1));
  MIRBuilder.buildInsert(Res, getOrCreateVReg(*Src), Inserted, Offset);

  return true;
}

/// Translate a select: operand 0 is the condition, operands 1 and 2 are the
/// two candidate values. Always succeeds.
bool IRTranslator::translateSelect(const User &U,
                                   MachineIRBuilder &MIRBuilder) {
  const unsigned DstReg = getOrCreateVReg(U);
  const unsigned CondReg = getOrCreateVReg(*U.getOperand(0));
  const unsigned TrueReg = getOrCreateVReg(*U.getOperand(1));
  const unsigned FalseReg = getOrCreateVReg(*U.getOperand(2));
  MIRBuilder.buildSelect(DstReg, CondReg, TrueReg, FalseReg);
  return true;
}

bool IRTranslator::translateBitCast(const User &U,
                                    MachineIRBuilder &MIRBuilder) {
  // If we're bitcasting to the source type, we can reuse the source vreg.
  if (getLLTForType(*U.getOperand(0)->getType(), *DL) ==
      getLLTForType(*U.getType(), *DL)) {
    // Get the source vreg now, to avoid invalidating ValToVReg.
    unsigned SrcReg = getOrCreateVReg(*U.getOperand(0));
    unsigned &Reg = ValToVReg[&U];
    // If we already assigned a vreg for this bitcast, we can't change that.
    // Emit a copy to satisfy the users we already emitted.
    if (Reg)
      MIRBuilder.buildCopy(Reg, SrcReg);
    else
      Reg = SrcReg;
    return true;
  }
  return translateCast(TargetOpcode::G_BITCAST, U, MIRBuilder);
}

/// Emit the single-operand generic instruction \p Opcode for \p U: it defines
/// the vreg of \p U and uses the vreg of operand 0. Always succeeds.
bool IRTranslator::translateCast(unsigned Opcode, const User &U,
                                 MachineIRBuilder &MIRBuilder) {
  const unsigned SrcReg = getOrCreateVReg(*U.getOperand(0));
  const unsigned DstReg = getOrCreateVReg(U);

  auto MIB = MIRBuilder.buildInstr(Opcode);
  MIB.addDef(DstReg);
  MIB.addUse(SrcReg);
  return true;
}

/// Translate a getelementptr into a sequence of pointer additions.
///
/// Struct field offsets and ConstantInt indices are folded into a running
/// constant byte offset. For any other index, the pending constant offset (if
/// any) is first added to the base pointer, then "index * element size" is
/// computed in the pointer-sized integer type and added as well. Whatever
/// constant offset remains at the end is applied with a final G_GEP; if there
/// is none, the result is a copy of the current base.
///
/// \returns false for GEPs producing a vector type (unsupported), true
/// otherwise.
bool IRTranslator::translateGetElementPtr(const User &U,
                                          MachineIRBuilder &MIRBuilder) {
  // FIXME: support vector GEPs.
  if (U.getType()->isVectorTy())
    return false;

  Value &Op0 = *U.getOperand(0);
  unsigned BaseReg = getOrCreateVReg(Op0);
  Type *PtrIRTy = Op0.getType();
  LLT PtrTy = getLLTForType(*PtrIRTy, *DL);
  // Offsets are computed in the integer type matching the pointer width.
  Type *OffsetIRTy = DL->getIntPtrType(PtrIRTy);
  LLT OffsetTy = getLLTForType(*OffsetIRTy, *DL);

  // Constant byte offset accumulated so far and not yet applied to BaseReg.
  int64_t Offset = 0;
  for (gep_type_iterator GTI = gep_type_begin(&U), E = gep_type_end(&U);
       GTI != E; ++GTI) {
    const Value *Idx = GTI.getOperand();
    if (StructType *StTy = GTI.getStructTypeOrNull()) {
      // Struct member: the index is a constant field number, so the offset
      // comes straight from the struct layout.
      unsigned Field = cast<Constant>(Idx)->getUniqueInteger().getZExtValue();
      Offset += DL->getStructLayout(StTy)->getElementOffset(Field);
      continue;
    } else {
      uint64_t ElementSize = DL->getTypeAllocSize(GTI.getIndexedType());

      // If this is a scalar constant, handle it quickly by folding it into
      // the running offset. (Only ConstantInt indices take this path.)
      if (const auto *CI = dyn_cast<ConstantInt>(Idx)) {
        Offset += ElementSize * CI->getSExtValue();
        continue;
      }

      // Variable index: flush the pending constant offset into the base
      // pointer before adding the variable part.
      if (Offset != 0) {
        unsigned NewBaseReg = MRI->createGenericVirtualRegister(PtrTy);
        unsigned OffsetReg =
            getOrCreateVReg(*ConstantInt::get(OffsetIRTy, Offset));
        MIRBuilder.buildGEP(NewBaseReg, BaseReg, OffsetReg);

        BaseReg = NewBaseReg;
        Offset = 0;
      }

      // N = N + Idx * ElementSize;
      unsigned ElementSizeReg =
          getOrCreateVReg(*ConstantInt::get(OffsetIRTy, ElementSize));

      // Bring the index to the offset type (sign-extend or truncate).
      unsigned IdxReg = getOrCreateVReg(*Idx);
      if (MRI->getType(IdxReg) != OffsetTy) {
        unsigned NewIdxReg = MRI->createGenericVirtualRegister(OffsetTy);
        MIRBuilder.buildSExtOrTrunc(NewIdxReg, IdxReg);
        IdxReg = NewIdxReg;
      }

      unsigned OffsetReg = MRI->createGenericVirtualRegister(OffsetTy);
      MIRBuilder.buildMul(OffsetReg, ElementSizeReg, IdxReg);

      unsigned NewBaseReg = MRI->createGenericVirtualRegister(PtrTy);
      MIRBuilder.buildGEP(NewBaseReg, BaseReg, OffsetReg);
      BaseReg = NewBaseReg;
    }
  }

  // Apply whatever constant offset is still pending; this defines the result.
  if (Offset != 0) {
    unsigned OffsetReg = getOrCreateVReg(*ConstantInt::get(OffsetIRTy, Offset));
    MIRBuilder.buildGEP(getOrCreateVReg(U), BaseReg, OffsetReg);
    return true;
  }

  // Nothing left to add: the result is just the current base pointer.
  MIRBuilder.buildCopy(getOrCreateVReg(U), BaseReg);
  return true;
}

bool IRTranslator::translateMemfunc(const CallInst &CI,
                                    MachineIRBuilder &MIRBuilder,
                                    unsigned ID) {
  LLT SizeTy = getLLTForType(*CI.getArgOperand(2)->getType(), *DL);
  Type *DstTy = CI.getArgOperand(0)->getType();
  if (cast<PointerType>(DstTy)->getAddressSpace() != 0 ||
      SizeTy.getSizeInBits() != DL->getPointerSizeInBits(0))
    return false;

  SmallVector<CallLowering::ArgInfo, 8> Args;
  for (int i = 0; i < 3; ++i) {
    const auto &Arg = CI.getArgOperand(i);
    Args.emplace_back(getOrCreateVReg(*Arg), Arg->getType());
  }

  const char *Callee;
  switch (ID) {
  case Intrinsic::memmove:
  case Intrinsic::memcpy: {
    Type *SrcTy = CI.getArgOperand(1)->getType();
    if(cast<PointerType>(SrcTy)->getAddressSpace() != 0)
      return false;
    Callee = ID == Intrinsic::memcpy ? "memcpy" : "memmove";
    break;
  }
  case Intrinsic::memset:
    Callee = "memset";
    break;
  default:
    return false;
  }

  return CLI->lowerCall(MIRBuilder, CI.getCallingConv(),
                        MachineOperand::CreateES(Callee),
                        CallLowering::ArgInfo(0, CI.getType()), Args);
}

void IRTranslator::getStackGuard(unsigned DstReg,
                                 MachineIRBuilder &MIRBuilder) {
  const TargetRegisterInfo *TRI = MF->getSubtarget().getRegisterInfo();
  MRI->setRegClass(DstReg, TRI->getPointerRegClass(*MF));
  auto MIB = MIRBuilder.buildInstr(TargetOpcode::LOAD_STACK_GUARD);
  MIB.addDef(DstReg);

  auto &TLI = *MF->getSubtarget().getTargetLowering();
  Value *Global = TLI.getSDagStackGuard(*MF->getFunction()->getParent());
  if (!Global)
    return;

  MachinePointerInfo MPInfo(Global);
  MachineInstr::mmo_iterator MemRefs = MF->allocateMemRefsArray(1);
  auto Flags = MachineMemOperand::MOLoad | MachineMemOperand::MOInvariant |
               MachineMemOperand::MODereferenceable;
  *MemRefs =
      MF->getMachineMemOperand(MPInfo, Flags, DL->getPointerSizeInBits() / 8,
                               DL->getPointerABIAlignment());
  MIB.setMemRefs(MemRefs, MemRefs + 1);
}

bool IRTranslator::translateOverflowIntrinsic(const CallInst &CI, unsigned Op,
                                              MachineIRBuilder &MIRBuilder) {
  LLT Ty = getLLTForType(*CI.getOperand(0)->getType(), *DL);
  LLT s1 = LLT::scalar(1);
  unsigned Width = Ty.getSizeInBits();
  unsigned Res = MRI->createGenericVirtualRegister(Ty);
  unsigned Overflow = MRI->createGenericVirtualRegister(s1);
  auto MIB = MIRBuilder.buildInstr(Op)
                 .addDef(Res)
                 .addDef(Overflow)
                 .addUse(getOrCreateVReg(*CI.getOperand(0)))
                 .addUse(getOrCreateVReg(*CI.getOperand(1)));

  if (Op == TargetOpcode::G_UADDE || Op == TargetOpcode::G_USUBE) {
    unsigned Zero = getOrCreateVReg(
        *Constant::getNullValue(Type::getInt1Ty(CI.getContext())));
    MIB.addUse(Zero);
  }

  MIRBuilder.buildSequence(getOrCreateVReg(CI), {Res, Overflow}, {0, Width});
  return true;
}

/// Translate the call \p CI to the target-independent intrinsic \p ID when it
/// is one this function handles specially.
///
/// \returns true if the intrinsic was handled here (which for some of them
/// means deliberately emitting nothing), false if the intrinsic is not
/// handled here or its translation failed.
bool IRTranslator::translateKnownIntrinsic(const CallInst &CI, Intrinsic::ID ID,
                                           MachineIRBuilder &MIRBuilder) {
  switch (ID) {
  default:
    // Not handled here; falls out of the switch and returns false.
    break;
  case Intrinsic::lifetime_start:
  case Intrinsic::lifetime_end:
    // Stack coloring is not enabled in O0 (which we care about now) so we can
    // drop these. Make sure someone notices when we start compiling at higher
    // opts though.
    if (MF->getTarget().getOptLevel() != CodeGenOpt::None)
      return false;
    return true;
  case Intrinsic::dbg_declare: {
    const DbgDeclareInst &DI = cast<DbgDeclareInst>(CI);
    assert(DI.getVariable() && "Missing variable");

    // Without a usable address there is nothing to describe; drop the
    // declaration.
    const Value *Address = DI.getAddress();
    if (!Address || isa<UndefValue>(Address)) {
      DEBUG(dbgs() << "Dropping debug info for " << DI << "\n");
      return true;
    }

    assert(DI.getVariable()->isValidLocationForIntrinsic(
               MIRBuilder.getDebugLoc()) &&
           "Expected inlined-at fields to agree");
    auto AI = dyn_cast<AllocaInst>(Address);
    if (AI && AI->isStaticAlloca()) {
      // Static allocas are tracked at the MF level, no need for DBG_VALUE
      // instructions (in fact, they get ignored if they *do* exist).
      MF->setVariableDbgInfo(DI.getVariable(), DI.getExpression(),
                             getOrCreateFrameIndex(*AI), DI.getDebugLoc());
    } else
      MIRBuilder.buildDirectDbgValue(getOrCreateVReg(*Address),
                                     DI.getVariable(), DI.getExpression());
    return true;
  }
  case Intrinsic::vaend:
    // No target I know of cares about va_end. Certainly no in-tree target
    // does. Simplest intrinsic ever!
    return true;
  case Intrinsic::vastart: {
    auto &TLI = *MF->getSubtarget().getTargetLowering();
    Value *Ptr = CI.getArgOperand(0);
    // Size in bytes of the va_list object written through Ptr.
    unsigned ListSize = TLI.getVaListSizeInBits(*DL) / 8;

    MIRBuilder.buildInstr(TargetOpcode::G_VASTART)
        .addUse(getOrCreateVReg(*Ptr))
        .addMemOperand(MF->getMachineMemOperand(
            MachinePointerInfo(Ptr), MachineMemOperand::MOStore, ListSize, 0));
    return true;
  }
  case Intrinsic::dbg_value: {
    // This form of DBG_VALUE is target-independent.
    const DbgValueInst &DI = cast<DbgValueInst>(CI);
    const Value *V = DI.getValue();
    assert(DI.getVariable()->isValidLocationForIntrinsic(
               MIRBuilder.getDebugLoc()) &&
           "Expected inlined-at fields to agree");
    if (!V) {
      // Currently the optimizer can produce this; insert an undef to
      // help debugging.  Probably the optimizer should not do this.
      MIRBuilder.buildIndirectDbgValue(0, DI.getOffset(), DI.getVariable(),
                                       DI.getExpression());
    } else if (const auto *CI = dyn_cast<Constant>(V)) {
      // Note: this CI (the constant value) shadows the CallInst parameter
      // within this branch.
      MIRBuilder.buildConstDbgValue(*CI, DI.getOffset(), DI.getVariable(),
                                    DI.getExpression());
    } else {
      unsigned Reg = getOrCreateVReg(*V);
      // FIXME: This does not handle register-indirect values at offset 0. The
      // direct/indirect thing shouldn't really be handled by something as
      // implicit as reg+noreg vs reg+imm in the first place, but it seems
      // pretty baked in right now.
      if (DI.getOffset() != 0)
        MIRBuilder.buildIndirectDbgValue(Reg, DI.getOffset(), DI.getVariable(),
                                         DI.getExpression());
      else
        MIRBuilder.buildDirectDbgValue(Reg, DI.getVariable(),
                                       DI.getExpression());
    }
    return true;
  }
  // Arithmetic-with-overflow intrinsics: each maps onto one generic opcode.
  case Intrinsic::uadd_with_overflow:
    return translateOverflowIntrinsic(CI, TargetOpcode::G_UADDE, MIRBuilder);
  case Intrinsic::sadd_with_overflow:
    return translateOverflowIntrinsic(CI, TargetOpcode::G_SADDO, MIRBuilder);
  case Intrinsic::usub_with_overflow:
    return translateOverflowIntrinsic(CI, TargetOpcode::G_USUBE, MIRBuilder);
  case Intrinsic::ssub_with_overflow:
    return translateOverflowIntrinsic(CI, TargetOpcode::G_SSUBO, MIRBuilder);
  case Intrinsic::umul_with_overflow:
    return translateOverflowIntrinsic(CI, TargetOpcode::G_UMULO, MIRBuilder);
  case Intrinsic::smul_with_overflow:
    return translateOverflowIntrinsic(CI, TargetOpcode::G_SMULO, MIRBuilder);
  // Floating-point intrinsics with a directly corresponding generic opcode.
  case Intrinsic::pow:
    MIRBuilder.buildInstr(TargetOpcode::G_FPOW)
        .addDef(getOrCreateVReg(CI))
        .addUse(getOrCreateVReg(*CI.getArgOperand(0)))
        .addUse(getOrCreateVReg(*CI.getArgOperand(1)));
    return true;
  case Intrinsic::exp:
    MIRBuilder.buildInstr(TargetOpcode::G_FEXP)
        .addDef(getOrCreateVReg(CI))
        .addUse(getOrCreateVReg(*CI.getArgOperand(0)));
    return true;
  case Intrinsic::exp2:
    MIRBuilder.buildInstr(TargetOpcode::G_FEXP2)
        .addDef(getOrCreateVReg(CI))
        .addUse(getOrCreateVReg(*CI.getArgOperand(0)));
    return true;
  case Intrinsic::fma:
    MIRBuilder.buildInstr(TargetOpcode::G_FMA)
        .addDef(getOrCreateVReg(CI))
        .addUse(getOrCreateVReg(*CI.getArgOperand(0)))
        .addUse(getOrCreateVReg(*CI.getArgOperand(1)))
        .addUse(getOrCreateVReg(*CI.getArgOperand(2)));
    return true;
  case Intrinsic::memcpy:
  case Intrinsic::memmove:
  case Intrinsic::memset:
    return translateMemfunc(CI, MIRBuilder, ID);
  case Intrinsic::eh_typeid_for: {
    // The result is the constant type id the MachineFunction assigns to the
    // type info global.
    GlobalValue *GV = ExtractTypeInfo(CI.getArgOperand(0));
    unsigned Reg = getOrCreateVReg(CI);
    unsigned TypeID = MF->getTypeIDFor(GV);
    MIRBuilder.buildConstant(Reg, TypeID);
    return true;
  }
  case Intrinsic::objectsize: {
    // If we don't know by now, we're never going to know.
    const ConstantInt *Min = cast<ConstantInt>(CI.getArgOperand(1));

    // Unknown size: all-ones when the second argument is zero, else zero.
    MIRBuilder.buildConstant(getOrCreateVReg(CI), Min->isZero() ? -1ULL : 0);
    return true;
  }
  case Intrinsic::stackguard:
    getStackGuard(getOrCreateVReg(CI), MIRBuilder);
    return true;
  case Intrinsic::stackprotector: {
    // Load the guard value into a fresh pointer-typed vreg, then store it to
    // the stack slot given as the second argument.
    LLT PtrTy = getLLTForType(*CI.getArgOperand(0)->getType(), *DL);
    unsigned GuardVal = MRI->createGenericVirtualRegister(PtrTy);
    getStackGuard(GuardVal, MIRBuilder);

    AllocaInst *Slot = cast<AllocaInst>(CI.getArgOperand(1));
    // NOTE(review): the trailing 8 is presumably the alignment of the store
    // and is hard-coded rather than derived from the slot -- confirm.
    MIRBuilder.buildStore(
        GuardVal, getOrCreateVReg(*Slot),
        *MF->getMachineMemOperand(
            MachinePointerInfo::getFixedStack(*MF,
                                              getOrCreateFrameIndex(*Slot)),
            MachineMemOperand::MOStore | MachineMemOperand::MOVolatile,
            PtrTy.getSizeInBits() / 8, 8));
    return true;
  }
  }
  return false;
}

bool IRTranslator::translateInlineAsm(const CallInst &CI,
                                      MachineIRBuilder &MIRBuilder) {
  const InlineAsm &IA = cast<InlineAsm>(*CI.getCalledValue());
  if (!IA.getConstraintString().empty())
    return false;

  unsigned ExtraInfo = 0;
  if (IA.hasSideEffects())
    ExtraInfo |= InlineAsm::Extra_HasSideEffects;
  if (IA.getDialect() == InlineAsm::AD_Intel)
    ExtraInfo |= InlineAsm::Extra_AsmDialect;

  MIRBuilder.buildInstr(TargetOpcode::INLINEASM)
    .addExternalSymbol(IA.getAsmString().c_str())
    .addImm(ExtraInfo);

  return true;
}

bool IRTranslator::translateCall(const User &U, MachineIRBuilder &MIRBuilder) {
  const CallInst &CI = cast<CallInst>(U);
  auto TII = MF->getTarget().getIntrinsicInfo();
  const Function *F = CI.getCalledFunction();

  if (CI.isInlineAsm())
    return translateInlineAsm(CI, MIRBuilder);

  if (!F || !F->isIntrinsic()) {
    unsigned Res = CI.getType()->isVoidTy() ? 0 : getOrCreateVReg(CI);
    SmallVector<unsigned, 8> Args;
    for (auto &Arg: CI.arg_operands())
      Args.push_back(getOrCreateVReg(*Arg));

    MF->getFrameInfo().setHasCalls(true);
    return CLI->lowerCall(MIRBuilder, &CI, Res, Args, [&]() {
      return getOrCreateVReg(*CI.getCalledValue());
    });
  }

  Intrinsic::ID ID = F->getIntrinsicID();
  if (TII && ID == Intrinsic::not_intrinsic)
    ID = static_cast<Intrinsic::ID>(TII->getIntrinsicID(F));

  assert(ID != Intrinsic::not_intrinsic && "unknown intrinsic");

  if (translateKnownIntrinsic(CI, ID, MIRBuilder))
    return true;

  unsigned Res = CI.getType()->isVoidTy() ? 0 : getOrCreateVReg(CI);
  MachineInstrBuilder MIB =
      MIRBuilder.buildIntrinsic(ID, Res, !CI.doesNotAccessMemory());

  for (auto &Arg : CI.arg_operands()) {
    // Some intrinsics take metadata parameters. Reject them.
    if (isa<MetadataAsValue>(Arg))
      return false;
    MIB.addUse(getOrCreateVReg(*Arg));
  }

  // Add a MachineMemOperand if it is a target mem intrinsic.
  const TargetLowering &TLI = *MF->getSubtarget().getTargetLowering();
  TargetLowering::IntrinsicInfo Info;
  // TODO: Add a GlobalISel version of getTgtMemIntrinsic.
  if (TLI.getTgtMemIntrinsic(Info, CI, ID)) {
    MachineMemOperand::Flags Flags =
        Info.vol ? MachineMemOperand::MOVolatile : MachineMemOperand::MONone;
    Flags |=
        Info.readMem ? MachineMemOperand::MOLoad : MachineMemOperand::MOStore;
    uint64_t Size = Info.memVT.getSizeInBits() >> 3;
    MIB.addMemOperand(MF->getMachineMemOperand(MachinePointerInfo(Info.ptrVal),
                                               Flags, Size, Info.align));
  }

  return true;
}

bool IRTranslator::translateInvoke(const User &U,
                                   MachineIRBuilder &MIRBuilder) {
  const InvokeInst &I = cast<InvokeInst>(U);
  MCContext &Context = MF->getContext();

  const BasicBlock *ReturnBB = I.getSuccessor(0);
  const BasicBlock *EHPadBB = I.getSuccessor(1);

  const Value *Callee = I.getCalledValue();
  const Function *Fn = dyn_cast<Function>(Callee);
  if (isa<InlineAsm>(Callee))
    return false;

  // FIXME: support invoking patchpoint and statepoint intrinsics.
  if (Fn && Fn->isIntrinsic())
    return false;

  // FIXME: support whatever these are.
  if (I.countOperandBundlesOfType(LLVMContext::OB_deopt))
    return false;

  // FIXME: support Windows exception handling.
  if (!isa<LandingPadInst>(EHPadBB->front()))
    return false;

  // Emit the actual call, bracketed by EH_LABELs so that the MF knows about
  // the region covered by the try.
  MCSymbol *BeginSymbol = Context.createTempSymbol();
  MIRBuilder.buildInstr(TargetOpcode::EH_LABEL).addSym(BeginSymbol);

  unsigned Res = I.getType()->isVoidTy() ? 0 : getOrCreateVReg(I);
  SmallVector<unsigned, 8> Args;
  for (auto &Arg: I.arg_operands())
    Args.push_back(getOrCreateVReg(*Arg));

  if (!CLI->lowerCall(MIRBuilder, &I, Res, Args,
                      [&]() { return getOrCreateVReg(*I.getCalledValue()); }))
    return false;

  MCSymbol *EndSymbol = Context.createTempSymbol();
  MIRBuilder.buildInstr(TargetOpcode::EH_LABEL).addSym(EndSymbol);

  // FIXME: track probabilities.
  MachineBasicBlock &EHPadMBB = getMBB(*EHPadBB),
                    &ReturnMBB = getMBB(*ReturnBB);
  MF->addInvoke(&EHPadMBB, BeginSymbol, EndSymbol);
  MIRBuilder.getMBB().addSuccessor(&ReturnMBB);
  MIRBuilder.getMBB().addSuccessor(&EHPadMBB);
  MIRBuilder.buildBr(ReturnMBB);

  return true;
}

/// Translate a landingpad instruction.
///
/// Marks the current machine block as an EH pad, records the landingpad's
/// information through addLandingPadInfo, and builds the landingpad's
/// two-element aggregate result out of the target's exception pointer and
/// exception selector registers.
///
/// \returns true on success, including the early exits where no value is
/// produced (neither exception register exists, or the landingpad has token
/// type); false if exactly one of the two exception registers is missing.
bool IRTranslator::translateLandingPad(const User &U,
                                       MachineIRBuilder &MIRBuilder) {
  const LandingPadInst &LP = cast<LandingPadInst>(U);

  MachineBasicBlock &MBB = MIRBuilder.getMBB();
  addLandingPadInfo(LP, MBB);

  MBB.setIsEHPad();

  // If there aren't registers to copy the values into (e.g., during SjLj
  // exceptions), then don't bother.
  auto &TLI = *MF->getSubtarget().getTargetLowering();
  const Constant *PersonalityFn = MF->getFunction()->getPersonalityFn();
  if (TLI.getExceptionPointerRegister(PersonalityFn) == 0 &&
      TLI.getExceptionSelectorRegister(PersonalityFn) == 0)
    return true;

  // If landingpad's return type is token type, we don't create DAG nodes
  // for its exception pointer and selector value. The extraction of exception
  // pointer or selector value from token type landingpads is not currently
  // supported.
  if (LP.getType()->isTokenTy())
    return true;

  // Add a label to mark the beginning of the landing pad.  Deletion of the
  // landing pad can thus be detected via the MachineModuleInfo.
  MIRBuilder.buildInstr(TargetOpcode::EH_LABEL)
    .addSym(MF->addLandingPad(&MBB));

  // Start from an undef value of the full aggregate type; the two fields are
  // inserted into it below.
  LLT Ty = getLLTForType(*LP.getType(), *DL);
  unsigned Undef = MRI->createGenericVirtualRegister(Ty);
  MIRBuilder.buildUndef(Undef);

  // Low-level types of the individual struct fields. Note that the loop
  // variable shadows the aggregate type `Ty` declared above.
  SmallVector<LLT, 2> Tys;
  for (Type *Ty : cast<StructType>(LP.getType())->elements())
    Tys.push_back(getLLTForType(*Ty, *DL));
  assert(Tys.size() == 2 && "Only two-valued landingpads are supported");

  // Mark exception register as live in.
  unsigned ExceptionReg = TLI.getExceptionPointerRegister(PersonalityFn);
  if (!ExceptionReg)
    return false;

  // Field 0: copy the exception pointer out of its physical register and
  // insert it at bit offset 0 of the aggregate.
  MBB.addLiveIn(ExceptionReg);
  unsigned VReg = MRI->createGenericVirtualRegister(Tys[0]),
           Tmp = MRI->createGenericVirtualRegister(Ty);
  MIRBuilder.buildCopy(VReg, ExceptionReg);
  MIRBuilder.buildInsert(Tmp, Undef, VReg, 0);

  unsigned SelectorReg = TLI.getExceptionSelectorRegister(PersonalityFn);
  if (!SelectorReg)
    return false;

  MBB.addLiveIn(SelectorReg);

  // N.b. the exception selector register always has pointer type and may not
  // match the actual IR-level type in the landingpad so an extra cast is
  // needed.
  unsigned PtrVReg = MRI->createGenericVirtualRegister(Tys[0]);
  MIRBuilder.buildCopy(PtrVReg, SelectorReg);

  // Field 1: the selector, converted to the field's type and inserted right
  // after field 0 (at a bit offset equal to field 0's size). This final
  // insert defines the landingpad's own vreg.
  VReg = MRI->createGenericVirtualRegister(Tys[1]);
  MIRBuilder.buildInstr(TargetOpcode::G_PTRTOINT).addDef(VReg).addUse(PtrVReg);
  MIRBuilder.buildInsert(getOrCreateVReg(LP), Tmp, VReg,
                         Tys[0].getSizeInBits());
  return true;
}

/// Translate an alloca instruction.
///
/// A static alloca becomes a G_FRAME_INDEX of its frame object. A dynamic
/// alloca is expanded inline: the allocation size is computed, the stack
/// pointer register is copied out, adjusted (and realigned if necessary),
/// written back, and the resulting pointer is the alloca's value. A
/// variable-sized object is also registered with the MachineFrameInfo.
///
/// \returns true; no failure path exists in this function.
bool IRTranslator::translateAlloca(const User &U,
                                   MachineIRBuilder &MIRBuilder) {
  auto &AI = cast<AllocaInst>(U);

  if (AI.isStaticAlloca()) {
    unsigned Res = getOrCreateVReg(AI);
    int FI = getOrCreateFrameIndex(AI);
    MIRBuilder.buildFrameIndex(Res, FI);
    return true;
  }

  // Now we're in the harder dynamic case.
  // Use the larger of the type's preferred alignment and the alignment
  // requested on the alloca itself.
  Type *Ty = AI.getAllocatedType();
  unsigned Align =
      std::max((unsigned)DL->getPrefTypeAlignment(Ty), AI.getAlignment());

  unsigned NumElts = getOrCreateVReg(*AI.getArraySize());

  // The element count is brought to pointer width (zero-extended or
  // truncated) before it is multiplied.
  Type *IntPtrIRTy = DL->getIntPtrType(AI.getType());
  LLT IntPtrTy = getLLTForType(*IntPtrIRTy, *DL);
  if (MRI->getType(NumElts) != IntPtrTy) {
    unsigned ExtElts = MRI->createGenericVirtualRegister(IntPtrTy);
    MIRBuilder.buildZExtOrTrunc(ExtElts, NumElts);
    NumElts = ExtElts;
  }

  // AllocSize = NumElts * -(alloc size of Ty). The element size is negated,
  // so the G_GEP below moves the pointer to a lower address.
  // NOTE(review): presumably this relies on a downward-growing stack.
  unsigned AllocSize = MRI->createGenericVirtualRegister(IntPtrTy);
  unsigned TySize =
      getOrCreateVReg(*ConstantInt::get(IntPtrIRTy, -DL->getTypeAllocSize(Ty)));
  MIRBuilder.buildMul(AllocSize, NumElts, TySize);

  LLT PtrTy = getLLTForType(*AI.getType(), *DL);
  auto &TLI = *MF->getSubtarget().getTargetLowering();
  unsigned SPReg = TLI.getStackPointerRegisterToSaveRestore();

  // Read the current stack pointer into a vreg and offset it by AllocSize.
  unsigned SPTmp = MRI->createGenericVirtualRegister(PtrTy);
  MIRBuilder.buildCopy(SPTmp, SPReg);

  unsigned AllocTmp = MRI->createGenericVirtualRegister(PtrTy);
  MIRBuilder.buildGEP(AllocTmp, SPTmp, AllocSize);

  // Handle alignment. We have to realign if the allocation granule was smaller
  // than stack alignment, or the specific alloca requires more than stack
  // alignment.
  unsigned StackAlign =
      MF->getSubtarget().getFrameLowering()->getStackAlignment();
  Align = std::max(Align, StackAlign);
  if (Align > StackAlign || DL->getTypeAllocSize(Ty) % StackAlign != 0) {
    // Round the size of the allocation up to the stack alignment size
    // by add SA-1 to the size. This doesn't overflow because we're computing
    // an address inside an alloca.
    // NOTE(review): the code below does not add SA-1; it applies buildPtrMask
    // to the adjusted pointer with Log2_32(Align) — presumably the number of
    // low bits to clear. Confirm against MachineIRBuilder.
    unsigned AlignedAlloc = MRI->createGenericVirtualRegister(PtrTy);
    MIRBuilder.buildPtrMask(AlignedAlloc, AllocTmp, Log2_32(Align));
    AllocTmp = AlignedAlloc;
  }

  // Publish the new stack pointer, and use the same address as the result of
  // the alloca.
  MIRBuilder.buildCopy(SPReg, AllocTmp);
  MIRBuilder.buildCopy(getOrCreateVReg(AI), AllocTmp);

  // Record the dynamic allocation in the frame info; an alignment of 0 is
  // passed on as 1.
  MF->getFrameInfo().CreateVariableSizedObject(Align ? Align : 1, &AI);
  assert(MF->getFrameInfo().hasVarSizedObjects());
  return true;
}

bool IRTranslator::translateVAArg(const User &U, MachineIRBuilder &MIRBuilder) {
  // FIXME: We may need more info about the type. Because of how LLT works,
  // we're completely discarding the i64/double distinction here (amongst
  // others). Fortunately the ABIs I know of where that matters don't use va_arg
  // anyway but that's not guaranteed.
  MIRBuilder.buildInstr(TargetOpcode::G_VAARG)
    .addDef(getOrCreateVReg(U))
    .addUse(getOrCreateVReg(*U.getOperand(0)))
    .addImm(DL->getABITypeAlignment(U.getType()));
  return true;
}

/// Translate an insertelement instruction.
///
/// For a single-element result vector no instruction is emitted: the vreg of
/// the inserted scalar is recorded as the value of \p U. Otherwise a
/// G_INSERT_VECTOR_ELT-style instruction is built from the vector, element
/// and index operands.
///
/// \returns true always.
bool IRTranslator::translateInsertElement(const User &U,
                                          MachineIRBuilder &MIRBuilder) {
  const bool IsSingleEltVector = U.getType()->getVectorNumElements() == 1;
  if (IsSingleEltVector) {
    // A <1 x Ty> vector is not a legal vector type in LLT, so the scalar
    // stands in for it. The vreg is fetched into a local first so that the
    // map slot is only looked up after getOrCreateVReg has finished.
    const unsigned ScalarReg = getOrCreateVReg(*U.getOperand(1));
    ValToVReg[&U] = ScalarReg;
    return true;
  }

  // Registers are requested in result, vector, element, index order.
  const unsigned DstReg = getOrCreateVReg(U);
  const unsigned VecReg = getOrCreateVReg(*U.getOperand(0));
  const unsigned ScalarReg = getOrCreateVReg(*U.getOperand(1));
  const unsigned IndexReg = getOrCreateVReg(*U.getOperand(2));
  MIRBuilder.buildInsertVectorElement(DstReg, VecReg, ScalarReg, IndexReg);
  return true;
}

bool IRTranslator::translateExtractElement(const User &U,
                                           MachineIRBuilder &MIRBuilder) {
  // If it is a <1 x Ty> vector, use the scalar as it is
  // not a legal vector type in LLT.
  if (U.getOperand(0)->getType()->getVectorNumElements() == 1) {
    unsigned Elt = getOrCreateVReg(*U.getOperand(0));
    ValToVReg[&U] = Elt;
    return true;
  }
  unsigned Res = getOrCreateVReg(U);
  unsigned Val = getOrCreateVReg(*U.getOperand(0));
  unsigned Idx = getOrCreateVReg(*U.getOperand(1));
  MIRBuilder.buildExtractVectorElement(Res, Val, Idx);
  return true;
}

bool IRTranslator::translateShuffleVector(const User &U,
                                          MachineIRBuilder &MIRBuilder) {
  MIRBuilder.buildInstr(TargetOpcode::G_SHUFFLE_VECTOR)
      .addDef(getOrCreateVReg(U))
      .addUse(getOrCreateVReg(*U.getOperand(0)))
      .addUse(getOrCreateVReg(*U.getOperand(1)))
      .addUse(getOrCreateVReg(*U.getOperand(2)));
  return true;
}

bool IRTranslator::translatePHI(const User &U, MachineIRBuilder &MIRBuilder) {
  const PHINode &PI = cast<PHINode>(U);
  auto MIB = MIRBuilder.buildInstr(TargetOpcode::PHI);
  MIB.addDef(getOrCreateVReg(PI));

  PendingPHIs.emplace_back(&PI, MIB.getInstr());
  return true;
}

void IRTranslator::finishPendingPhis() {
  for (std::pair<const PHINode *, MachineInstr *> &Phi : PendingPHIs) {
    const PHINode *PI = Phi.first;
    MachineInstrBuilder MIB(*MF, Phi.second);

    // All MachineBasicBlocks exist, add them to the PHI. We assume IRTranslator
    // won't create extra control flow here, otherwise we need to find the
    // dominating predecessor here (or perhaps force the weirder IRTranslators
    // to provide a simple boundary).
    SmallSet<const BasicBlock *, 4> HandledPreds;

    for (unsigned i = 0; i < PI->getNumIncomingValues(); ++i) {
      auto IRPred = PI->getIncomingBlock(i);
      if (HandledPreds.count(IRPred))
        continue;

      HandledPreds.insert(IRPred);
      unsigned ValReg = getOrCreateVReg(*PI->getIncomingValue(i));
      for (auto Pred : getMachinePredBBs({IRPred, PI->getParent()})) {
        assert(Pred->isSuccessor(MIB->getParent()) &&
               "incorrect CFG at MachineBasicBlock level");
        MIB.addUse(ValReg);
        MIB.addMBB(Pred);
      }
    }
  }
}

/// Translate a single IR instruction using CurBuilder.
///
/// The builder's debug location is set from \p Inst, then the instruction is
/// dispatched on its opcode to the matching translate<Opcode> member. The
/// case list is generated from llvm/IR/Instruction.def through HANDLE_INST.
///
/// \returns the result of the selected translate<Opcode> call, or false for
/// an opcode that has no case.
bool IRTranslator::translate(const Instruction &Inst) {
  CurBuilder.setDebugLoc(Inst.getDebugLoc());
  switch(Inst.getOpcode()) {
#define HANDLE_INST(NUM, OPCODE, CLASS) \
    case Instruction::OPCODE: return translate##OPCODE(Inst, CurBuilder);
#include "llvm/IR/Instruction.def"
  default:
    return false;
  }
}

/// Materialise the constant \p C into the virtual register \p Reg.
///
/// Every instruction is emitted through EntryBuilder. Handled kinds are:
/// integer and floating-point constants, undef, null pointers (built as the
/// constant 0), global values, vector zero-initialisers, constant data
/// vectors, constant expressions (dispatched on opcode like instructions),
/// constant structs and constant vectors.
///
/// \returns true if the constant was emitted; false for a non-vector
/// ConstantAggregateZero, a constant expression whose opcode has no case, or
/// any other kind of constant.
bool IRTranslator::translate(const Constant &C, unsigned Reg) {
  if (auto CI = dyn_cast<ConstantInt>(&C))
    EntryBuilder.buildConstant(Reg, *CI);
  else if (auto CF = dyn_cast<ConstantFP>(&C))
    EntryBuilder.buildFConstant(Reg, *CF);
  else if (isa<UndefValue>(C))
    EntryBuilder.buildUndef(Reg);
  else if (isa<ConstantPointerNull>(C))
    EntryBuilder.buildConstant(Reg, 0);
  else if (auto GV = dyn_cast<GlobalValue>(&C))
    EntryBuilder.buildGlobalValue(Reg, GV);
  else if (auto CAZ = dyn_cast<ConstantAggregateZero>(&C)) {
    // Only vector zero-initialisers are handled here.
    if (!CAZ->getType()->isVectorTy())
      return false;
    // Return the scalar if it is a <1 x Ty> vector.
    if (CAZ->getNumElements() == 1)
      return translate(*CAZ->getElementValue(0u), Reg);
    // Otherwise merge the vregs of the individual elements into Reg.
    std::vector<unsigned> Ops;
    for (unsigned i = 0; i < CAZ->getNumElements(); ++i) {
      Constant &Elt = *CAZ->getElementValue(i);
      Ops.push_back(getOrCreateVReg(Elt));
    }
    EntryBuilder.buildMerge(Reg, Ops);
  } else if (auto CV = dyn_cast<ConstantDataVector>(&C)) {
    // Return the scalar if it is a <1 x Ty> vector.
    if (CV->getNumElements() == 1)
      return translate(*CV->getElementAsConstant(0), Reg);
    // Otherwise merge the vregs of the individual elements into Reg.
    std::vector<unsigned> Ops;
    for (unsigned i = 0; i < CV->getNumElements(); ++i) {
      Constant &Elt = *CV->getElementAsConstant(i);
      Ops.push_back(getOrCreateVReg(Elt));
    }
    EntryBuilder.buildMerge(Reg, Ops);
  } else if (auto CE = dyn_cast<ConstantExpr>(&C)) {
    // Constant expressions reuse the per-opcode instruction translators, but
    // emit through EntryBuilder.
    switch(CE->getOpcode()) {
#define HANDLE_INST(NUM, OPCODE, CLASS)                         \
      case Instruction::OPCODE: return translate##OPCODE(*CE, EntryBuilder);
#include "llvm/IR/Instruction.def"
    default:
      return false;
    }
  } else if (auto CS = dyn_cast<ConstantStruct>(&C)) {
    // Return the element if it is a single element ConstantStruct.
    if (CS->getNumOperands() == 1) {
      unsigned EltReg = getOrCreateVReg(*CS->getOperand(0));
      EntryBuilder.buildCast(Reg, EltReg);
      return true;
    }
    // Place each field at a running bit offset equal to the sum of the sizes
    // of the preceding fields' vreg types.
    SmallVector<unsigned, 4> Ops;
    SmallVector<uint64_t, 4> Indices;
    uint64_t Offset = 0;
    for (unsigned i = 0; i < CS->getNumOperands(); ++i) {
      unsigned OpReg = getOrCreateVReg(*CS->getOperand(i));
      Ops.push_back(OpReg);
      Indices.push_back(Offset);
      Offset += MRI->getType(OpReg).getSizeInBits();
    }
    EntryBuilder.buildSequence(Reg, Ops, Indices);
  } else if (auto CV = dyn_cast<ConstantVector>(&C)) {
    // A single-operand vector is translated as its only element.
    if (CV->getNumOperands() == 1)
      return translate(*CV->getOperand(0), Reg);
    SmallVector<unsigned, 4> Ops;
    for (unsigned i = 0; i < CV->getNumOperands(); ++i) {
      Ops.push_back(getOrCreateVReg(*CV->getOperand(i)));
    }
    EntryBuilder.buildMerge(Reg, Ops);
  } else
    return false;

  return true;
}

void IRTranslator::finalizeFunction() {
  // Release the memory used by the different maps we
  // needed during the translation.
  PendingPHIs.clear();
  ValToVReg.clear();
  FrameIndices.clear();
  MachinePreds.clear();
  // MachineIRBuilder::DebugLoc can outlive the DILocation it holds. Clear it
  // to avoid accessing free’d memory (in runOnMachineFunction) and to avoid
  // destroying it twice (in ~IRTranslator() and ~LLVMContext())
  EntryBuilder = MachineIRBuilder();
  CurBuilder = MachineIRBuilder();
}

/// Translate the IR function behind \p CurMF into generic machine IR.
///
/// Steps, in order:
///  1. Set up the per-function members (builders, MRI, DL, TPC, ORE, CLI).
///  2. Create a temporary entry block for arguments and constants, followed by
///     one MachineBasicBlock per IR basic block in IR order.
///  3. Lower the formal arguments through CallLowering.
///  4. Translate every instruction of every block, then complete the PHIs.
///  5. Splice the temporary entry block into the IR entry block's machine
///     block and delete it.
///
/// A failure in step 3 or 4 is reported through reportTranslationError with a
/// missed-optimization remark and ends the translation early.
///
/// \returns false on every path visible here, including the failure paths.
bool IRTranslator::runOnMachineFunction(MachineFunction &CurMF) {
  MF = &CurMF;
  const Function &F = *MF->getFunction();
  // Nothing to translate for a function without a body.
  if (F.empty())
    return false;
  CLI = MF->getSubtarget().getCallLowering();
  CurBuilder.setMF(*MF);
  EntryBuilder.setMF(*MF);
  MRI = &MF->getRegInfo();
  DL = &F.getParent()->getDataLayout();
  TPC = &getAnalysis<TargetPassConfig>();
  ORE = llvm::make_unique<OptimizationRemarkEmitter>(&F);

  assert(PendingPHIs.empty() && "stale PHIs");

  // Release the per-function state when we return, whether we succeeded or not.
  auto FinalizeOnReturn = make_scope_exit([this]() { finalizeFunction(); });

  // Setup a separate basic-block for the arguments and constants
  MachineBasicBlock *EntryBB = MF->CreateMachineBasicBlock();
  MF->push_back(EntryBB);
  EntryBuilder.setMBB(*EntryBB);

  // Create all blocks, in IR order, to preserve the layout.
  for (const BasicBlock &BB: F) {
    auto *&MBB = BBToMBB[&BB];

    MBB = MF->CreateMachineBasicBlock(&BB);
    MF->push_back(MBB);

    // Carry the address-taken property over to the machine block.
    if (BB.hasAddressTaken())
      MBB->setHasAddressTaken();
  }

  // Make our arguments/constants entry block fallthrough to the IR entry block.
  EntryBB->addSuccessor(&getMBB(F.front()));

  // Lower the actual args into this basic block.
  SmallVector<unsigned, 8> VRegArgs;
  for (const Argument &Arg: F.args())
    VRegArgs.push_back(getOrCreateVReg(Arg));
  if (!CLI->lowerFormalArguments(EntryBuilder, F, VRegArgs)) {
    OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
                               MF->getFunction()->getSubprogram(),
                               &MF->getFunction()->getEntryBlock());
    R << "unable to lower arguments: " << ore::NV("Prototype", F.getType());
    reportTranslationError(*MF, *TPC, *ORE, R);
    return false;
  }

  // And translate the function!
  for (const BasicBlock &BB: F) {
    MachineBasicBlock &MBB = getMBB(BB);
    // Set the insertion point of all the following translations to
    // the end of this basic block.
    CurBuilder.setMBB(MBB);

    for (const Instruction &Inst: BB) {
      if (translate(Inst))
        continue;

      // Translation failed: emit a remark that includes the printed
      // instruction, then give up on this function.
      std::string InstStrStorage;
      raw_string_ostream InstStr(InstStrStorage);
      InstStr << Inst;

      OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
                                 Inst.getDebugLoc(), &BB);
      R << "unable to translate instruction: " << ore::NV("Opcode", &Inst)
        << ": '" << InstStr.str() << "'";
      reportTranslationError(*MF, *TPC, *ORE, R);
      return false;
    }
  }

  // All machine blocks now exist, so the queued PHIs can receive their
  // incoming operands.
  finishPendingPhis();

  // Merge the argument lowering and constants block with its single
  // successor, the LLVM-IR entry block.  We want the basic block to
  // be maximal.
  assert(EntryBB->succ_size() == 1 &&
         "Custom BB used for lowering should have only one successor");
  // Get the successor of the current entry block.
  MachineBasicBlock &NewEntryBB = **EntryBB->succ_begin();
  assert(NewEntryBB.pred_size() == 1 &&
         "LLVM-IR entry block has a predecessor!?");
  // Move all the instruction from the current entry block to the
  // new entry block.
  NewEntryBB.splice(NewEntryBB.begin(), EntryBB, EntryBB->begin(),
                    EntryBB->end());

  // Update the live-in information for the new entry block.
  for (const MachineBasicBlock::RegisterMaskPair &LiveIn : EntryBB->liveins())
    NewEntryBB.addLiveIn(LiveIn);
  NewEntryBB.sortUniqueLiveIns();

  // Get rid of the now empty basic block.
  EntryBB->removeSuccessor(&NewEntryBB);
  MF->remove(EntryBB);
  MF->DeleteMachineBasicBlock(EntryBB);

  assert(&MF->front() == &NewEntryBB &&
         "New entry wasn't next in the list of basic block!");

  return false;
}
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								//===- llvm/CodeGen/GlobalISel/IRTranslator.cpp - IRTranslator ---*- C++ -*-==//
-												[GlobalISel] Add the proper cmake plumbing.

This patch adds the necessary plumbing to cmake to build the sources related to
GlobalISel.

To build the sources related to GlobalISel, we need to add -DBUILD_GLOBAL_ISEL=ON.
By default, this is OFF, thus GlobalISel sources will not impact people that do
not explicitly opt-in.

Differential Revision: http://reviews.llvm.org/D15983

llvm-svn: 258344

											
										
										
											2016-01-21 04:58:56 +08:00
+								//
 								//                     The LLVM Compiler Infrastructure
 								//
 								// This file is distributed under the University of Illinois Open Source
 								// License. See LICENSE.TXT for details.
 								//
 								//===----------------------------------------------------------------------===//
 								/// \file
 								/// This file implements the IRTranslator class.
 								//===----------------------------------------------------------------------===//
 								#include "llvm/CodeGen/GlobalISel/IRTranslator.h"
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								#include "llvm/ADT/STLExtras.h"
-												[GlobalISel] Finalize translated function on scope exit. NFC.

This is the compromise between having a per-function IRTranslator
and manually managing the per-function state.

llvm-svn: 296046

											
										
										
											2017-02-24 07:57:28 +08:00
+								#include "llvm/ADT/ScopeExit.h"
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								#include "llvm/ADT/SmallSet.h"
-												[GlobalISel] Add the necessary plumbing to lower formal arguments.

llvm-svn: 260579

											
										
										
											2016-02-12 03:59:41 +08:00
+								#include "llvm/ADT/SmallVector.h"
-												[GlobalISel] Emit opt remarks on isel fallbacks.

Having more fine-grained information on the specific construct that
caused us to fall back is valuable for large-scale data collection.

We still have the fallback warning, that's also used for FastISel.
We still need to remove the fallback warning, and teach FastISel to also
emit remarks (it currently has a combination of the warning, stats, and
debug prints: the remarks could unify all three).

The abort-on-fallback path could also be better handled using remarks:
one could imagine a "-Rpass-error", analogous to "-Werror", which would
promote missed/failed remarks to errors.  It's not clear whether that
would be useful for other remarks though, so we're not there yet.

llvm-svn: 296013

											
										
										
											2017-02-24 05:05:42 +08:00
+								#include "llvm/Analysis/OptimizationDiagnosticInfo.h"
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								#include "llvm/CodeGen/Analysis.h"
-												Sort the remaining #include lines in include/... and lib/....

I did this a long time ago with a janky python script, but now
clang-format has built-in support for this. I fed clang-format every
line with a #include and let it re-sort things according to the precise
LLVM rules for include ordering baked into clang-format these days.

I've reverted a number of files where the results of sorting includes
isn't healthy. Either places where we have legacy code relying on
particular include ordering (where possible, I'll fix these separately)
or where we have particular formatting around #include lines that
I didn't want to disturb in this patch.

This patch is *entirely* mechanical. If you get merge conflicts or
anything, just ignore the changes in this patch and run clang-format
over your #include lines in the files.

Sorry for any noise here, but it is important to keep these things
stable. I was seeing an increasing number of patches with irrelevant
re-ordering of #include lines because clang-format was used. This patch
at least isolates that churn, makes it easy to skip when resolving
conflicts, and gets us to a clean baseline (again).

llvm-svn: 304787

											
										
										
											2017-06-06 19:49:48 +08:00
+								#include "llvm/CodeGen/GlobalISel/CallLowering.h"
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								#include "llvm/CodeGen/LowLevelType.h"
 								#include "llvm/CodeGen/MachineBasicBlock.h"
-												GlobalISel: implement alloca instruction

llvm-svn: 276433

											
										
										
											2016-07-23 00:59:52 +08:00
+								#include "llvm/CodeGen/MachineFrameInfo.h"
-												Sort the remaining #include lines in include/... and lib/....

I did this a long time ago with a janky python script, but now
clang-format has built-in support for this. I fed clang-format every
line with a #include and let it re-sort things according to the precise
LLVM rules for include ordering baked into clang-format these days.

I've reverted a number of files where the results of sorting includes
isn't healthy. Either places where we have legacy code relying on
particular include ordering (where possible, I'll fix these separately)
or where we have particular formatting around #include lines that
I didn't want to disturb in this patch.

This patch is *entirely* mechanical. If you get merge conflicts or
anything, just ignore the changes in this patch and run clang-format
over your #include lines in the files.

Sorry for any noise here, but it is important to keep these things
stable. I was seeing an increasing number of patches with irrelevant
re-ordering of #include lines because clang-format was used. This patch
at least isolates that churn, makes it easy to skip when resolving
conflicts, and gets us to a clean baseline (again).

llvm-svn: 304787

											
										
										
											2017-06-06 19:49:48 +08:00
+								#include "llvm/CodeGen/MachineFunction.h"
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								#include "llvm/CodeGen/MachineInstrBuilder.h"
 								#include "llvm/CodeGen/MachineMemOperand.h"
 								#include "llvm/CodeGen/MachineOperand.h"
-												[GlobalISel][IRTranslator] Teach the pass how to translate Add instructions.

llvm-svn: 260549

											
										
										
											2016-02-12 01:51:31 +08:00
+								#include "llvm/CodeGen/MachineRegisterInfo.h"
-												[IRTranslator] Do not abort when the target wants to fall back.

Every pass in the GlobalISel pipeline will need to do something similar.

llvm-svn: 279886

											
										
										
											2016-08-27 07:49:05 +08:00
+								#include "llvm/CodeGen/TargetPassConfig.h"
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								#include "llvm/IR/BasicBlock.h"
-												[GlobalISel][IRTranslator] Teach the pass how to translate Add instructions.

llvm-svn: 260549

											
										
										
											2016-02-12 01:51:31 +08:00
+								#include "llvm/IR/Constant.h"
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								#include "llvm/IR/Constants.h"
 								#include "llvm/IR/DataLayout.h"
-												GlobalISel: support debug intrinsics.

The translation scheme is mostly cribbed from FastISel, and it's not entirely
convincing semantically. But it does seem to work in the common cases and allow
variables to be printed so it can't be all wrong.

llvm-svn: 293228

											
										
										
											2017-01-27 07:39:14 +08:00
+								#include "llvm/IR/DebugInfo.h"
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								#include "llvm/IR/DerivedTypes.h"
-												[GlobalISel] More detailed skeleton for the IRTranslator.

llvm-svn: 260456

											
										
										
											2016-02-11 06:59:27 +08:00
+								#include "llvm/IR/Function.h"
-												GlobalISel: translate GEP instructions.

Unlike SDag, we use a separate G_GEP instruction (much simplified, only taking
a single byte offset) to preserve the pointer type information through
selection.

llvm-svn: 281205

											
										
										
											2016-09-12 19:20:22 +08:00
+								#include "llvm/IR/GetElementPtrTypeIterator.h"
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								#include "llvm/IR/InlineAsm.h"
 								#include "llvm/IR/InstrTypes.h"
 								#include "llvm/IR/Instructions.h"
-												GlobalISel: support translation of intrinsic calls.

These come in two variants for now: G_INTRINSIC and G_INTRINSIC_W_SIDE_EFFECTS.
We may decide to split the latter up with finer-grained restrictions later, if
necessary.

llvm-svn: 277224

											
										
										
											2016-07-30 06:32:36 +08:00
+								#include "llvm/IR/IntrinsicInst.h"
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								#include "llvm/IR/Intrinsics.h"
 								#include "llvm/IR/LLVMContext.h"
 								#include "llvm/IR/Metadata.h"
-												[GlobalISel][IRTranslator] Teach the pass how to translate Add instructions.

llvm-svn: 260549

											
										
										
											2016-02-12 01:51:31 +08:00
+								#include "llvm/IR/Type.h"
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								#include "llvm/IR/User.h"
-												[GlobalISel][IRTranslator] Teach the pass how to translate Add instructions.

llvm-svn: 260549

											
										
										
											2016-02-12 01:51:31 +08:00
+								#include "llvm/IR/Value.h"
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								#include "llvm/MC/MCContext.h"
 								#include "llvm/Pass.h"
 								#include "llvm/Support/Casting.h"
 								#include "llvm/Support/CodeGen.h"
 								#include "llvm/Support/Debug.h"
 								#include "llvm/Support/ErrorHandling.h"
 								#include "llvm/Support/LowLevelTypeImpl.h"
 								#include "llvm/Support/MathExtras.h"
 								#include "llvm/Support/raw_ostream.h"
-												GlobalISel: translate dynamic alloca instructions.

llvm-svn: 294022

											
										
										
											2017-02-04 02:22:45 +08:00
+								#include "llvm/Target/TargetFrameLowering.h"
-												GlobalISel: support translation of intrinsic calls.

These come in two variants for now: G_INTRINSIC and G_INTRINSIC_W_SIDE_EFFECTS.
We may decide to split the latter up with finer-grained restrictions later, if
necessary.

llvm-svn: 277224

											
										
										
											2016-07-30 06:32:36 +08:00
+								#include "llvm/Target/TargetIntrinsicInfo.h"
-												[GlobalISel] Teach the IRTranslator how to lower returns.

llvm-svn: 260562

											
										
										
											2016-02-12 02:53:28 +08:00
+								#include "llvm/Target/TargetLowering.h"
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								#include "llvm/Target/TargetMachine.h"
 								#include "llvm/Target/TargetRegisterInfo.h"
 								#include "llvm/Target/TargetSubtargetInfo.h"
 								#include <algorithm>
 								#include <cassert>
 								#include <cstdint>
 								#include <iterator>
 								#include <string>
 								#include <utility>
 								#include <vector>
-												[GlobalISel] More detailed skeleton for the IRTranslator.

llvm-svn: 260456

											
										
										
											2016-02-11 06:59:27 +08:00
 								#define DEBUG_TYPE "irtranslator"
-												[GlobalISel] Add the proper cmake plumbing.

This patch adds the necessary plumbing to cmake to build the sources related to
GlobalISel.

To build the sources related to GlobalISel, we need to add -DBUILD_GLOBAL_ISEL=ON.
By default, this is OFF, thus GlobalISel sources will not impact people that do
not explicitly opt-in.

Differential Revision: http://reviews.llvm.org/D15983

llvm-svn: 258344

											
										
										
											2016-01-21 04:58:56 +08:00
+								using namespace llvm;
 								char IRTranslator::ID = 0;
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
-												[IRTranslator] Do not abort when the target wants to fall back.

Every pass in the GlobalISel pipeline will need to do something similar.

llvm-svn: 279886

											
										
										
											2016-08-27 07:49:05 +08:00
+								INITIALIZE_PASS_BEGIN(IRTranslator, DEBUG_TYPE, "IRTranslator LLVM IR -> MI",
 								                false, false)
 								INITIALIZE_PASS_DEPENDENCY(TargetPassConfig)
 								INITIALIZE_PASS_END(IRTranslator, DEBUG_TYPE, "IRTranslator LLVM IR -> MI",
-												GlobalISel: remove redundant ';'s. NFC

llvm-svn: 276723

											
										
										
											2016-07-26 11:29:18 +08:00
+								                false, false)
-												[GlobalISel] Add the proper cmake plumbing.

This patch adds the necessary plumbing to cmake to build the sources related to
GlobalISel.

To build the sources related to GlobalISel, we need to add -DBUILD_GLOBAL_ISEL=ON.
By default, this is OFF, thus GlobalISel sources will not impact people that do
not explicitly opt-in.

Differential Revision: http://reviews.llvm.org/D15983

llvm-svn: 258344

											
										
										
											2016-01-21 04:58:56 +08:00
-												[GlobalISel] Emit opt remarks on isel fallbacks.

Having more fine-grained information on the specific construct that
caused us to fallback is valuable for large-scale data collection.

We still have the fallback warning, that's also used for FastISel.
We still need to remove the fallback warning, and teach FastISel to also
emit remarks (it currently has a combination of the warning, stats, and
debug prints: the remarks could unify all three).

The abort-on-fallback path could also be better handled using remarks:
one could imagine a "-Rpass-error", analogous to "-Werror", which would
promote missed/failed remarks to errors.  It's not clear whether that
would be useful for other remarks though, so we're not there yet.

llvm-svn: 296013

											
										
										
											2017-02-24 05:05:42 +08:00
+								static void reportTranslationError(MachineFunction &MF,
 								                                   const TargetPassConfig &TPC,
 								                                   OptimizationRemarkEmitter &ORE,
 								                                   OptimizationRemarkMissed &R) {
 								  MF.getProperties().set(MachineFunctionProperties::Property::FailedISel);
 								  // Print the function name explicitly if we don't have a debug location (which
 								  // makes the diagnostic less useful) or if we're going to emit a raw error.
 								  if (!R.getLocation().isValid() || TPC.isGlobalISelAbortEnabled())
 								    R << (" (in function: " + MF.getName() + ")").str();
 								  if (TPC.isGlobalISelAbortEnabled())
 								    report_fatal_error(R.getMsg());
 								  else
 								    ORE.emit(R);
-												GlobalISel: improve error diagnostics when IRTranslation fails.

llvm-svn: 286190

											
										
										
											2016-11-08 09:12:17 +08:00
+								}
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								IRTranslator::IRTranslator() : MachineFunctionPass(ID) {
-												[GlobalISel] Introduce initializer method to support start/stop-after features.

llvm-svn: 262896

											
										
										
											2016-03-08 09:38:55 +08:00
+								  initializeIRTranslatorPass(*PassRegistry::getPassRegistry());
-												[GlobalISel][IRTranslator] Change the ownership of the MIRBuilder field.

llvm-svn: 260551

											
										
										
											2016-02-12 01:53:23 +08:00
+								}
-												[IRTranslator] Do not abort when the target wants to fall back.

Every pass in the GlobalISel pipeline will need to do something similar.

llvm-svn: 279886

											
										
										
											2016-08-27 07:49:05 +08:00
+								void IRTranslator::getAnalysisUsage(AnalysisUsage &AU) const {
 								  AU.addRequired<TargetPassConfig>();
 								  MachineFunctionPass::getAnalysisUsage(AU);
 								}
-												[IRTranslator] Update getOrCreateVReg API to use references.
A value that we want to keep in a virtual register cannot be null.
Reflect that in the API.

llvm-svn: 263263

											
										
										
											2016-03-12 01:27:54 +08:00
+								unsigned IRTranslator::getOrCreateVReg(const Value &Val) {
 								  unsigned &ValReg = ValToVReg[&Val];
-												GlobalISel: rework getOrCreateVReg to avoid double lookup. NFC.

Thanks to Quentin for suggesting the refactoring.

llvm-svn: 293087

											
										
										
											2017-01-26 04:58:22 +08:00
 								  if (ValReg)
 								    return ValReg;
 								  // Fill ValRegsSequence with the sequence of registers
 								  // we need to concat together to produce the value.
 								  assert(Val.getType()->isSized() &&
 								         "Don't know how to create an empty vreg");
-												Recommit: [globalisel] Change LLT constructor string into an LLT-based object that knows how to generate it.

Summary:
This will allow future patches to inspect the details of the LLT. The implementation is now split between
the Support and CodeGen libraries to allow TableGen to use this class without introducing layering concerns.

Thanks to Ahmed Bougacha for finding a reasonable way to avoid the layering issue and providing the version of this patch without that problem.

The problem with the previous commit appears to have been that TableGen was including CodeGen/LowLevelType.h instead of Support/LowLevelTypeImpl.h.

Reviewers: t.p.northover, qcolombet, rovka, aditya_nandakumar, ab, javed.absar

Subscribers: arsenm, nhaehnle, mgorny, dberris, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30046

llvm-svn: 297241

											
										
										
											2017-03-08 07:20:35 +08:00
+								  unsigned VReg =
 								      MRI->createGenericVirtualRegister(getLLTForType(*Val.getType(), *DL));
-												GlobalISel: rework getOrCreateVReg to avoid double lookup. NFC.

Thanks to Quentin for suggesting the refactoring.

llvm-svn: 293087

											
										
										
											2017-01-26 04:58:22 +08:00
+								  ValReg = VReg;
 								  if (auto CV = dyn_cast<Constant>(&Val)) {
 								    bool Success = translate(*CV, VReg);
 								    if (!Success) {
-												[GlobalISel] Emit opt remarks on isel fallbacks.

Having more fine-grained information on the specific construct that
caused us to fallback is valuable for large-scale data collection.

We still have the fallback warning, that's also used for FastISel.
We still need to remove the fallback warning, and teach FastISel to also
emit remarks (it currently has a combination of the warning, stats, and
debug prints: the remarks could unify all three).

The abort-on-fallback path could also be better handled using remarks:
one could imagine a "-Rpass-error", analoguous to "-Werror", which would
promote missed/failed remarks to errors.  It's not clear whether that
would be useful for other remarks though, so we're not there yet.

llvm-svn: 296013

											
										
										
											2017-02-24 05:05:42 +08:00
+								      OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
-												[GlobalISel] Use the DISubprogram for translation failure remarks.

Justin added support for DISubprogram locs in r295531 and r296052.
Use that instead of no-loc for constants and arguments.

llvm-svn: 296058

											
										
										
											2017-02-24 08:34:44 +08:00
+								                                 MF->getFunction()->getSubprogram(),
-												[GlobalISel] Emit opt remarks on isel fallbacks.

Having more fine-grained information on the specific construct that
caused us to fallback is valuable for large-scale data collection.

We still have the fallback warning, that's also used for FastISel.
We still need to remove the fallback warning, and teach FastISel to also
emit remarks (it currently has a combination of the warning, stats, and
debug prints: the remarks could unify all three).

The abort-on-fallback path could also be better handled using remarks:
one could imagine a "-Rpass-error", analoguous to "-Werror", which would
promote missed/failed remarks to errors.  It's not clear whether that
would be useful for other remarks though, so we're not there yet.

llvm-svn: 296013

											
										
										
											2017-02-24 05:05:42 +08:00
+								                                 &MF->getFunction()->getEntryBlock());
 								      R << "unable to translate constant: " << ore::NV("Type", Val.getType());
 								      reportTranslationError(*MF, *TPC, *ORE, R);
 								      return VReg;
-												GlobalISel: first translation support for Constants.

For now put them all in the entry block. This should be correct but may give
poor runtime performance. Hopefully MachineSinking combined with
isReMaterializable can solve those issues, but if not the interface is sound
enough to support alternatives.

llvm-svn: 278168

											
										
										
											2016-08-10 05:28:04 +08:00
+								    }
-												[GlobalISel][IRTranslator] Teach the pass how to translate Add instructions.

llvm-svn: 260549

											
										
										
											2016-02-12 01:51:31 +08:00
+								  }
-												GlobalISel: prevent heap use-after-free when looking up VReg.

Translating the constant can create more VRegs, which can invalidate the
reference into the DenseMap. So we have to look up the value again after all
that's happened.

llvm-svn: 292675

											
										
										
											2017-01-21 07:25:17 +08:00
-												GlobalISel: rework getOrCreateVReg to avoid double lookup. NFC.

Thanks to Quentin for suggesting the refactoring.

llvm-svn: 293087

											
										
										
											2017-01-26 04:58:22 +08:00
+								  return VReg;
-												[GlobalISel][IRTranslator] Teach the pass how to translate Add instructions.

llvm-svn: 260549

											
										
										
											2016-02-12 01:51:31 +08:00
+								}
-												GlobalISel: translate stack protector intrinsics

llvm-svn: 285614

											
										
										
											2016-11-01 02:30:59 +08:00
+								int IRTranslator::getOrCreateFrameIndex(const AllocaInst &AI) {
 								  if (FrameIndices.find(&AI) != FrameIndices.end())
 								    return FrameIndices[&AI];
 								  unsigned ElementSize = DL->getTypeStoreSize(AI.getAllocatedType());
 								  unsigned Size =
 								      ElementSize * cast<ConstantInt>(AI.getArraySize())->getZExtValue();
 								  // Always allocate at least one byte.
 								  Size = std::max(Size, 1u);
 								  unsigned Alignment = AI.getAlignment();
 								  if (!Alignment)
 								    Alignment = DL->getABITypeAlignment(AI.getAllocatedType());
 								  int &FI = FrameIndices[&AI];
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								  FI = MF->getFrameInfo().CreateStackObject(Size, Alignment, false, &AI);
-												GlobalISel: translate stack protector intrinsics

llvm-svn: 285614

											
										
										
											2016-11-01 02:30:59 +08:00
+								  return FI;
 								}
-												GlobalISel: add generic load and store instructions.

Pretty straightforward, the only oddity is the MachineMemOperand (which it's
surprisingly difficult to share code for).

llvm-svn: 276799

											
										
										
											2016-07-27 04:23:26 +08:00
+								unsigned IRTranslator::getMemOpAlignment(const Instruction &I) {
 								  unsigned Alignment = 0;
 								  Type *ValTy = nullptr;
 								  if (const StoreInst *SI = dyn_cast<StoreInst>(&I)) {
 								    Alignment = SI->getAlignment();
 								    ValTy = SI->getValueOperand()->getType();
 								  } else if (const LoadInst *LI = dyn_cast<LoadInst>(&I)) {
 								    Alignment = LI->getAlignment();
 								    ValTy = LI->getType();
-												[GlobalISel] Emit opt remarks on isel fallbacks.

Having more fine-grained information on the specific construct that
caused us to fallback is valuable for large-scale data collection.

We still have the fallback warning, that's also used for FastISel.
We still need to remove the fallback warning, and teach FastISel to also
emit remarks (it currently has a combination of the warning, stats, and
debug prints: the remarks could unify all three).

The abort-on-fallback path could also be better handled using remarks:
one could imagine a "-Rpass-error", analoguous to "-Werror", which would
promote missed/failed remarks to errors.  It's not clear whether that
would be useful for other remarks though, so we're not there yet.

llvm-svn: 296013

											
										
										
											2017-02-24 05:05:42 +08:00
+								  } else {
 								    OptimizationRemarkMissed R("gisel-irtranslator", "", &I);
 								    R << "unable to translate memop: " << ore::NV("Opcode", &I);
 								    reportTranslationError(*MF, *TPC, *ORE, R);
-												[IRTranslator] Do not abort when the target wants to fall back.

Every pass in the GlobalISel pipeline will need to do something similar.

llvm-svn: 279886

											
										
										
											2016-08-27 07:49:05 +08:00
+								    return 1;
-												[GlobalISel] Emit opt remarks on isel fallbacks.

Having more fine-grained information on the specific construct that
caused us to fallback is valuable for large-scale data collection.

We still have the fallback warning, that's also used for FastISel.
We still need to remove the fallback warning, and teach FastISel to also
emit remarks (it currently has a combination of the warning, stats, and
debug prints: the remarks could unify all three).

The abort-on-fallback path could also be better handled using remarks:
one could imagine a "-Rpass-error", analoguous to "-Werror", which would
promote missed/failed remarks to errors.  It's not clear whether that
would be useful for other remarks though, so we're not there yet.

llvm-svn: 296013

											
										
										
											2017-02-24 05:05:42 +08:00
+								  }
-												GlobalISel: add generic load and store instructions.

Pretty straightforward, the only oddity is the MachineMemOperand (which it's
surprisingly difficult to share code for).

llvm-svn: 276799

											
										
										
											2016-07-27 04:23:26 +08:00
 								  return Alignment ? Alignment : DL->getABITypeAlignment(ValTy);
 								}
-												[GlobalISel] Preserve IR block layout.

It makes the output function layout more predictable;  the layout has
an effect on performance, we don't want it to be at the mercy of the
translator's visitation order and such.
The predictable output is also easier to digest.

getOrCreateBB isn't appropriately named anymore, as it never needs to
create anything.  Rename it and extract the MBB creation logic out of it.

A couple tests were sensitive to the order. Update them.

llvm-svn: 297868

											
										
										
											2017-03-16 02:22:33 +08:00
+								MachineBasicBlock &IRTranslator::getMBB(const BasicBlock &BB) {
-												[IRTranslator] Update getOrCreateBB API to use references.
A null basic block is invalid, so just pass a reference.

llvm-svn: 263260

											
										
										
											2016-03-12 01:27:43 +08:00
+								  MachineBasicBlock *&MBB = BBToMBB[&BB];
-												[GlobalISel] Preserve IR block layout.

It makes the output function layout more predictable;  the layout has
an effect on performance, we don't want it to be at the mercy of the
translator's visitation order and such.
The predictable output is also easier to digest.

getOrCreateBB isn't appropriately named anymore, as it never needs to
create anything.  Rename it and extract the MBB creation logic out of it.

A couple tests were sensitive to the order. Update them.

llvm-svn: 297868

											
										
										
											2017-03-16 02:22:33 +08:00
+								  assert(MBB && "BasicBlock was not encountered before");
-												[GlobalISel][IRTranslator] Teach the pass how to translate Add instructions.

llvm-svn: 260549

											
										
										
											2016-02-12 01:51:31 +08:00
+								  return *MBB;
 								}
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								void IRTranslator::addMachineCFGPred(CFGEdge Edge, MachineBasicBlock *NewPred) {
 								  assert(NewPred && "new predecessor must be a real MachineBasicBlock");
 								  MachinePreds[Edge].push_back(NewPred);
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateBinaryOp(unsigned Opcode, const User &U,
 								                                     MachineIRBuilder &MIRBuilder) {
-												GlobalISel: make translate* functions take the most specialized class possible.

NFC.

llvm-svn: 277188

											
										
										
											2016-07-30 02:11:21 +08:00
+								  // FIXME: handle signed/unsigned wrapping flags.
-												[GlobalISel] More detailed skeleton for the IRTranslator.

llvm-svn: 260456

											
										
										
											2016-02-11 06:59:27 +08:00
+								  // Get or create a virtual register for each value.
 								  // Unless the value is a Constant => loadimm cst?
 								  // or inline constant each time?
 								  // Creation of a virtual register needs to have a size.
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								  unsigned Op0 = getOrCreateVReg(*U.getOperand(0));
 								  unsigned Op1 = getOrCreateVReg(*U.getOperand(1));
 								  unsigned Res = getOrCreateVReg(U);
-												GlobalISel: move type information to MachineRegisterInfo.

We want each register to have a canonical type, which means the best place to
store this is in MachineRegisterInfo rather than on every MachineInstr that
happens to use or define that register.

Most changes following from this are pretty simple (you need an MRI anyway if
you're going to be doing any transformations, so just check the type there).
But legalization doesn't really want to check redundant operands (when, for
example, a G_ADD only ever has one type) so I've made use of MCInstrDesc's
operand type field to encode these constraints and limit legalization's work.

As an added bonus, more validation is possible, both in MachineVerifier and
MachineIRBuilder (coming soon).

llvm-svn: 281035

											
										
										
											2016-09-09 19:46:34 +08:00
+								  MIRBuilder.buildInstr(Opcode).addDef(Res).addUse(Op0).addUse(Op1);
-												[GlobalISel][IRTranslator] Teach the pass how to translate Add instructions.

llvm-svn: 260549

											
										
										
											2016-02-12 01:51:31 +08:00
+								  return true;
-												[GlobalISel] Add the proper cmake plumbing.

This patch adds the necessary plumbing to cmake to build the sources related to
GlobalISel.

To build the sources related to GlobalISel, we need to add -DBUILD_GLOBAL_ISEL=ON.
By default, this is OFF, thus GlobalISel sources will not impact people that do
not explicitly opt-in.

Differential Revision: http://reviews.llvm.org/D15983

llvm-svn: 258344

											
										
										
											2016-01-21 04:58:56 +08:00
+								}
-												[GlobalISel] Translate floating-point negation

Reviewers: qcolombet, javed.absar, aditya_nandakumar, dsanders, t.p.northover, ab

Reviewed By: qcolombet

Subscribers: dberris, rovka, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30671

llvm-svn: 297171

											
										
										
											2017-03-08 02:03:28 +08:00
+								bool IRTranslator::translateFSub(const User &U, MachineIRBuilder &MIRBuilder) {
 								  // -0.0 - X --> G_FNEG
 								  if (isa<Constant>(U.getOperand(0)) &&
 								      U.getOperand(0) == ConstantFP::getZeroValueForNegation(U.getType())) {
 								    MIRBuilder.buildInstr(TargetOpcode::G_FNEG)
 								        .addDef(getOrCreateVReg(U))
 								        .addUse(getOrCreateVReg(*U.getOperand(1)));
 								    return true;
 								  }
 								  return translateBinaryOp(TargetOpcode::G_FSUB, U, MIRBuilder);
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateCompare(const User &U,
 								                                    MachineIRBuilder &MIRBuilder) {
-												GlobalISel: translate floating-point comparisons

llvm-svn: 279319

											
										
										
											2016-08-20 04:48:16 +08:00
+								  const CmpInst *CI = dyn_cast<CmpInst>(&U);
 								  unsigned Op0 = getOrCreateVReg(*U.getOperand(0));
 								  unsigned Op1 = getOrCreateVReg(*U.getOperand(1));
 								  unsigned Res = getOrCreateVReg(U);
 								  CmpInst::Predicate Pred =
 								      CI ? CI->getPredicate() : static_cast<CmpInst::Predicate>(
 								                                    cast<ConstantExpr>(U).getPredicate());
 								  if (CmpInst::isIntPredicate(Pred))
-												GlobalISel: move type information to MachineRegisterInfo.

We want each register to have a canonical type, which means the best place to
store this is in MachineRegisterInfo rather than on every MachineInstr that
happens to use or define that register.

Most changes following from this are pretty simple (you need an MRI anyway if
you're going to be doing any transformations, so just check the type there).
But legalization doesn't really want to check redundant operands (when, for
example, a G_ADD only ever has one type) so I've made use of MCInstrDesc's
operand type field to encode these constraints and limit legalization's work.

As an added bonus, more validation is possible, both in MachineVerifier and
MachineIRBuilder (coming soon).

llvm-svn: 281035

											
										
										
											2016-09-09 19:46:34 +08:00
+								    MIRBuilder.buildICmp(Pred, Res, Op0, Op1);
-												GlobalISel: correctly handle trivial fcmp predicates.

It makes sense to only do them once in IRTranslator rather than making everyone
deal with them.

llvm-svn: 297304

											
										
										
											2017-03-09 02:49:54 +08:00
+								  else if (Pred == CmpInst::FCMP_FALSE)
-												[GlobalISel] Avoid translating synthetic constants to new G_CONSTANTS.

Currently, we create a G_CONSTANT for every "synthetic" integer
constant operand (for instance, for the G_GEP offset).
Instead, share the G_CONSTANTs we might have created by going through
the ValueToVReg machinery.

When we're emitting synthetic constants, we do need to get Constants from
the context.  One could argue that we shouldn't modify the context at
all (for instance, this means that we're going to use a tad more memory
if the constant wasn't used elsewhere), but constants are mostly
harmless.  We currently do this for extractvalue and all.

For constant fcmp, this does mean we'll emit an extra COPY, which is not
necessarily more optimal than an extra materialized constant.
But that preserves the current intended design of uniqued G_CONSTANTs,
and the rematerialization problem exists elsewhere and should be
resolved with a single coherent solution.

llvm-svn: 297875

											
										
										
											2017-03-16 03:21:11 +08:00
+								    MIRBuilder.buildCopy(
 								        Res, getOrCreateVReg(*Constant::getNullValue(CI->getType())));
 								  else if (Pred == CmpInst::FCMP_TRUE)
 								    MIRBuilder.buildCopy(
 								        Res, getOrCreateVReg(*Constant::getAllOnesValue(CI->getType())));
-												GlobalISel: translate floating-point comparisons

llvm-svn: 279319

											
										
										
											2016-08-20 04:48:16 +08:00
+								  else
-												GlobalISel: move type information to MachineRegisterInfo.

We want each register to have a canonical type, which means the best place to
store this is in MachineRegisterInfo rather than on every MachineInstr that
happens to use or define that register.

Most changes following from this are pretty simple (you need an MRI anyway if
you're going to be doing any transformations, so just check the type there).
But legalization doesn't really want to check redundant operands (when, for
example, a G_ADD only ever has one type) so I've made use of MCInstrDesc's
operand type field to encode these constraints and limit legalization's work.

As an added bonus, more validation is possible, both in MachineVerifier and
MachineIRBuilder (coming soon).

llvm-svn: 281035

											
										
										
											2016-09-09 19:46:34 +08:00
+								    MIRBuilder.buildFCmp(Pred, Res, Op0, Op1);
-												GlobalISel: translate floating-point comparisons

llvm-svn: 279319

											
										
										
											2016-08-20 04:48:16 +08:00
-												GlobalISel: support irtranslation of icmp instructions.

llvm-svn: 278969

											
										
										
											2016-08-18 04:25:25 +08:00
+								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateRet(const User &U, MachineIRBuilder &MIRBuilder) {
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								  const ReturnInst &RI = cast<ReturnInst>(U);
-												GlobalISel: make translate* functions take the most specialized class possible.

NFC.

llvm-svn: 277188

											
										
										
											2016-07-30 02:11:21 +08:00
+								  const Value *Ret = RI.getReturnValue();
-												[GlobalISel] Teach the IRTranslator how to lower returns.

llvm-svn: 260562

											
										
										
											2016-02-12 02:53:28 +08:00
+								  // The target may mess up with the insertion point, but
 								  // this is not important as a return is the last instruction
 								  // of the block anyway.
-												[GlobalISel] Coding style and whitespace fixes

Reviewers: qcolombet

Subscribers: joker.eph, llvm-commits, vkalintiris

Differential Revision: http://reviews.llvm.org/D19119

llvm-svn: 266342

											
										
										
											2016-04-15 01:23:33 +08:00
+								  return CLI->lowerReturn(MIRBuilder, Ret, !Ret ? 0 : getOrCreateVReg(*Ret));
-												[GlobalISel] Teach the IRTranslator how to lower returns.

llvm-svn: 260562

											
										
										
											2016-02-12 02:53:28 +08:00
+								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateBr(const User &U, MachineIRBuilder &MIRBuilder) {
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								  const BranchInst &BrInst = cast<BranchInst>(U);
-												GlobalISel: add generic conditional branch.

Just the basic equivalent to DAG's condbr for now, we'll get to things like
br_cc when we start doing more legalization.

llvm-svn: 277184

											
										
										
											2016-07-30 01:58:00 +08:00
+								  unsigned Succ = 0;
 								  if (!BrInst.isUnconditional()) {
 								    // We want a G_BRCOND to the true BB followed by an unconditional branch.
 								    unsigned Tst = getOrCreateVReg(*BrInst.getCondition());
 								    const BasicBlock &TrueTgt = *cast<BasicBlock>(BrInst.getSuccessor(Succ++));
-												[GlobalISel] Preserve IR block layout.

It makes the output function layout more predictable;  the layout has
an effect on performance, we don't want it to be at the mercy of the
translator's visitation order and such.
The predictable output is also easier to digest.

getOrCreateBB isn't appropriately named anymore, as it never needs to
create anything.  Rename it and extract the MBB creation logic out of it.

A couple tests were sensitive to the order. Update them.

llvm-svn: 297868

											
										
										
											2017-03-16 02:22:33 +08:00
+								    MachineBasicBlock &TrueBB = getMBB(TrueTgt);
-												GlobalISel: move type information to MachineRegisterInfo.

We want each register to have a canonical type, which means the best place to
store this is in MachineRegisterInfo rather than on every MachineInstr that
happens to use or define that register.

Most changes following from this are pretty simple (you need an MRI anyway if
you're going to be doing any transformations, so just check the type there).
But legalization doesn't really want to check redundant operands (when, for
example, a G_ADD only ever has one type) so I've made use of MCInstrDesc's
operand type field to encode these constraints and limit legalization's work.

As an added bonus, more validation is possible, both in MachineVerifier and
MachineIRBuilder (coming soon).

llvm-svn: 281035

											
										
										
											2016-09-09 19:46:34 +08:00
+								    MIRBuilder.buildBrCond(Tst, TrueBB);
-												[IRTranslator] Translate unconditional branches.

llvm-svn: 263265

											
										
										
											2016-03-12 01:28:03 +08:00
+								  }
-												GlobalISel: add generic conditional branch.

Just the basic equivalent to DAG's condbr for now, we'll get to things like
br_cc when we start doing more legalization.

llvm-svn: 277184

											
										
										
											2016-07-30 01:58:00 +08:00
 								  const BasicBlock &BrTgt = *cast<BasicBlock>(BrInst.getSuccessor(Succ));
-												[GlobalISel] Preserve IR block layout.

It makes the output function layout more predictable;  the layout has
an effect on performance, we don't want it to be at the mercy of the
translator's visitation order and such.
The predictable output is also easier to digest.

getOrCreateBB isn't appropriately named anymore, as it never needs to
create anything.  Rename it and extract the MBB creation logic out of it.

A couple tests were sensitive to the order. Update them.

llvm-svn: 297868

											
										
										
											2017-03-16 02:22:33 +08:00
+								  MachineBasicBlock &TgtBB = getMBB(BrTgt);
-												[GlobalISel] Don't translate br to layout successor.

MI can represent fallthrough to layout successor blocks, and our
post-isel representation uses that extensively.

We might as well use it too, to avoid translating and carrying along
unnecessary branches.

llvm-svn: 298459

											
										
										
											2017-03-22 07:42:50 +08:00
+								  MachineBasicBlock &CurBB = MIRBuilder.getMBB();
 								  // If the unconditional target is the layout successor, fallthrough.
 								  if (!CurBB.isLayoutSuccessor(&TgtBB))
 								    MIRBuilder.buildBr(TgtBB);
-												GlobalISel: add generic conditional branch.

Just the basic equivalent to DAG's condbr for now, we'll get to things like
br_cc when we start doing more legalization.

llvm-svn: 277184

											
										
										
											2016-07-30 01:58:00 +08:00
-												[IRTranslator] Translate unconditional branches.

llvm-svn: 263265

											
										
										
											2016-03-12 01:28:03 +08:00
+								  // Link successors.
 								  for (const BasicBlock *Succ : BrInst.successors())
-												[GlobalISel] Preserve IR block layout.

It makes the output function layout more predictable;  the layout has
an effect on performance, we don't want it to be at the mercy of the
translator's visitation order and such.
The predictable output is also easier to digest.

getOrCreateBB isn't appropriately named anymore, as it never needs to
create anything.  Rename it and extract the MBB creation logic out of it.

A couple tests were sensitive to the order. Update them.

llvm-svn: 297868

											
										
										
											2017-03-16 02:22:33 +08:00
+								    CurBB.addSuccessor(&getMBB(*Succ));
-												[IRTranslator] Translate unconditional branches.

llvm-svn: 263265

											
										
										
											2016-03-12 01:28:03 +08:00
+								  return true;
 								}
-												[GlobalISel] Add support for switch statements

This commit does this using a trivial chain of conditional branches.  In the
future, we probably want to reuse the optimized switch lowering used in
SelectionDAG.

Differential Revision: https://reviews.llvm.org/D28176

llvm-svn: 291099

											
										
										
											2017-01-05 19:28:51 +08:00
+								bool IRTranslator::translateSwitch(const User &U,
 								                                   MachineIRBuilder &MIRBuilder) {
 								  // For now, just translate as a chain of conditional branches.
 								  // FIXME: could we share most of the logic/code in
 								  // SelectionDAGBuilder::visitSwitch between SelectionDAG and GlobalISel?
 								  // At first sight, it seems most of the logic in there is independent of
 								  // SelectionDAG-specifics and a lot of work went in to optimize switch
 								  // lowering in there.
 								  const SwitchInst &SwInst = cast<SwitchInst>(U);
 								  const unsigned SwCondValue = getOrCreateVReg(*SwInst.getCondition());
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								  const BasicBlock *OrigBB = SwInst.getParent();
-												[GlobalISel] Add support for switch statements

This commit does this using a trivial chain of conditional branches.  In the
future, we probably want to reuse the optimized switch lowering used in
SelectionDAG.

Differential Revision: https://reviews.llvm.org/D28176

llvm-svn: 291099

											
										
										
											2017-01-05 19:28:51 +08:00
-												Recommit: [globalisel] Change LLT constructor string into an LLT-based object that knows how to generate it.

Summary:
This will allow future patches to inspect the details of the LLT. The implementation is now split between
the Support and CodeGen libraries to allow TableGen to use this class without introducing layering concerns.

Thanks to Ahmed Bougacha for finding a reasonable way to avoid the layering issue and providing the version of this patch without that problem.

The problem with the previous commit appears to have been that TableGen was including CodeGen/LowLevelType.h instead of Support/LowLevelTypeImpl.h.

Reviewers: t.p.northover, qcolombet, rovka, aditya_nandakumar, ab, javed.absar

Subscribers: arsenm, nhaehnle, mgorny, dberris, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30046

llvm-svn: 297241

											
										
										
											2017-03-08 07:20:35 +08:00
+								  LLT LLTi1 = getLLTForType(*Type::getInt1Ty(U.getContext()), *DL);
-												[GlobalISel] Add support for switch statements

This commit does this using a trivial chain of conditional branches.  In the
future, we probably want to reuse the optimized switch lowering used in
SelectionDAG.

Differential Revision: https://reviews.llvm.org/D28176

llvm-svn: 291099

											
										
										
											2017-01-05 19:28:51 +08:00
+								  for (auto &CaseIt : SwInst.cases()) {
 								    const unsigned CaseValueReg = getOrCreateVReg(*CaseIt.getCaseValue());
 								    const unsigned Tst = MRI->createGenericVirtualRegister(LLTi1);
 								    MIRBuilder.buildICmp(CmpInst::ICMP_EQ, Tst, CaseValueReg, SwCondValue);
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								    MachineBasicBlock &CurMBB = MIRBuilder.getMBB();
 								    const BasicBlock *TrueBB = CaseIt.getCaseSuccessor();
-												[GlobalISel] Preserve IR block layout.

It makes the output function layout more predictable;  the layout has
an effect on performance, we don't want it to be at the mercy of the
translator's visitation order and such.
The predictable output is also easier to digest.

getOrCreateBB isn't appropriately named anymore, as it never needs to
create anything.  Rename it and extract the MBB creation logic out of it.

A couple tests were sensitive to the order. Update them.

llvm-svn: 297868

											
										
										
											2017-03-16 02:22:33 +08:00
+								    MachineBasicBlock &TrueMBB = getMBB(*TrueBB);
-												[GlobalISel] Add support for switch statements

This commit does this using a trivial chain of conditional branches.  In the
future, we probably want to reuse the optimized switch lowering used in
SelectionDAG.

Differential Revision: https://reviews.llvm.org/D28176

llvm-svn: 291099

											
										
										
											2017-01-05 19:28:51 +08:00
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								    MIRBuilder.buildBrCond(Tst, TrueMBB);
 								    CurMBB.addSuccessor(&TrueMBB);
 								    addMachineCFGPred({OrigBB, TrueBB}, &CurMBB);
-												[GlobalISel] Add support for switch statements

This commit does this using a trivial chain of conditional branches.  In the
future, we probably want to reuse the optimized switch lowering used in
SelectionDAG.

Differential Revision: https://reviews.llvm.org/D28176

llvm-svn: 291099

											
										
										
											2017-01-05 19:28:51 +08:00
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								    MachineBasicBlock *FalseMBB =
-												[GlobalISel] Add support for switch statements

This commit does this using a trivial chain of conditional branches.  In the
future, we probably want to reuse the optimized switch lowering used in
SelectionDAG.

Differential Revision: https://reviews.llvm.org/D28176

llvm-svn: 291099

											
										
										
											2017-01-05 19:28:51 +08:00
+								        MF->CreateMachineBasicBlock(SwInst.getParent());
-												[GlobalISel] Insert translated switch icmp blocks after switch parent.

Now that we preserve the IR layout, we would end up with all the newly
synthesized switch comparison blocks at the end of the function.
Instead, use a hopefully more reasonable layout, with the comparison
blocks immediately following the switch comparison blocks.

llvm-svn: 297869

											
										
										
											2017-03-16 02:22:37 +08:00
+								    // Insert the comparison blocks one after the other.
 								    MF->insert(std::next(CurMBB.getIterator()), FalseMBB);
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								    MIRBuilder.buildBr(*FalseMBB);
 								    CurMBB.addSuccessor(FalseMBB);
-												[GlobalISel] Add support for switch statements

This commit does this using a trivial chain of conditional branches.  In the
future, we probably want to reuse the optimized switch lowering used in
SelectionDAG.

Differential Revision: https://reviews.llvm.org/D28176

llvm-svn: 291099

											
										
										
											2017-01-05 19:28:51 +08:00
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								    MIRBuilder.setMBB(*FalseMBB);
-												[GlobalISel] Add support for switch statements

This commit does this using a trivial chain of conditional branches.  In the
future, we probably want to reuse the optimized switch lowering used in
SelectionDAG.

Differential Revision: https://reviews.llvm.org/D28176

llvm-svn: 291099

											
										
										
											2017-01-05 19:28:51 +08:00
+								  }
 								  // handle default case
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								  const BasicBlock *DefaultBB = SwInst.getDefaultDest();
-												[GlobalISel] Preserve IR block layout.

It makes the output function layout more predictable;  the layout has
an effect on performance, we don't want it to be at the mercy of the
translator's visitation order and such.
The predictable output is also easier to digest.

getOrCreateBB isn't appropriately named anymore, as it never needs to
create anything.  Rename it and extract the MBB creation logic out of it.

A couple tests were sensitive to the order. Update them.

llvm-svn: 297868

											
										
										
											2017-03-16 02:22:33 +08:00
+								  MachineBasicBlock &DefaultMBB = getMBB(*DefaultBB);
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								  MIRBuilder.buildBr(DefaultMBB);
 								  MachineBasicBlock &CurMBB = MIRBuilder.getMBB();
 								  CurMBB.addSuccessor(&DefaultMBB);
 								  addMachineCFGPred({OrigBB, DefaultBB}, &CurMBB);
-												[GlobalISel] Add support for switch statements

This commit does this using a trivial chain of conditional branches.  In the
future, we probably want to reuse the optimized switch lowering used in
SelectionDAG.

Differential Revision: https://reviews.llvm.org/D28176

llvm-svn: 291099

											
										
										
											2017-01-05 19:28:51 +08:00
 								  return true;
 								}
-												[GlobalISel] Add support for indirectbr

Differential Revision: https://reviews.llvm.org/D28079

llvm-svn: 293470

											
										
										
											2017-01-30 17:13:18 +08:00
+								bool IRTranslator::translateIndirectBr(const User &U,
 								                                       MachineIRBuilder &MIRBuilder) {
 								  const IndirectBrInst &BrInst = cast<IndirectBrInst>(U);
 								  const unsigned Tgt = getOrCreateVReg(*BrInst.getAddress());
 								  MIRBuilder.buildBrIndirect(Tgt);
 								  // Link successors.
 								  MachineBasicBlock &CurBB = MIRBuilder.getMBB();
 								  for (const BasicBlock *Succ : BrInst.successors())
-												[GlobalISel] Preserve IR block layout.

It makes the output function layout more predictable;  the layout has
an effect on performance, we don't want it to be at the mercy of the
translator's visitation order and such.
The predictable output is also easier to digest.

getOrCreateBB isn't appropriately named anymore, as it never needs to
create anything.  Rename it and extract the MBB creation logic out of it.

A couple tests were sensitive to the order. Update them.

llvm-svn: 297868

											
										
										
											2017-03-16 02:22:33 +08:00
+								    CurBB.addSuccessor(&getMBB(*Succ));
-												[GlobalISel] Add support for indirectbr

Differential Revision: https://reviews.llvm.org/D28079

llvm-svn: 293470

											
										
										
											2017-01-30 17:13:18 +08:00
 								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateLoad(const User &U, MachineIRBuilder &MIRBuilder) {
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								  const LoadInst &LI = cast<LoadInst>(U);
-												[IRTranslator] Do not abort when the target wants to fall back.

Every pass in the GlobalISel pipeline will need to do something similar.

llvm-svn: 279886

											
										
										
											2016-08-27 07:49:05 +08:00
-												GlobalISel: support translating volatile loads and stores.

llvm-svn: 284603

											
										
										
											2016-10-19 23:55:06 +08:00
+								  auto Flags = LI.isVolatile() ? MachineMemOperand::MOVolatile
 								                               : MachineMemOperand::MONone;
 								  Flags |= MachineMemOperand::MOLoad;
-												GlobalISel: add generic load and store instructions.

Pretty straightforward, the only oddity is the MachineMemOperand (which it's
surprisingly difficult to share code for).

llvm-svn: 276799

											
										
										
											2016-07-27 04:23:26 +08:00
 								  unsigned Res = getOrCreateVReg(LI);
 								  unsigned Addr = getOrCreateVReg(*LI.getPointerOperand());
-												Recommit: [globalisel] Change LLT constructor string into an LLT-based object that knows how to generate it.

Summary:
This will allow future patches to inspect the details of the LLT. The implementation is now split between
the Support and CodeGen libraries to allow TableGen to use this class without introducing layering concerns.

Thanks to Ahmed Bougacha for finding a reasonable way to avoid the layering issue and providing the version of this patch without that problem.

The problem with the previous commit appears to have been that TableGen was including CodeGen/LowLevelType.h instead of Support/LowLevelTypeImpl.h.

Reviewers: t.p.northover, qcolombet, rovka, aditya_nandakumar, ab, javed.absar

Subscribers: arsenm, nhaehnle, mgorny, dberris, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30046

llvm-svn: 297241

											
										
										
											2017-03-08 07:20:35 +08:00
-												GlobalISel: add generic load and store instructions.

Pretty straightforward, the only oddity is the MachineMemOperand (which it's
surprisingly difficult to share code for).

llvm-svn: 276799

											
										
										
											2016-07-27 04:23:26 +08:00
+								  MIRBuilder.buildLoad(
-												GlobalISel: move type information to MachineRegisterInfo.

We want each register to have a canonical type, which means the best place to
store this is in MachineRegisterInfo rather than on every MachineInstr that
happens to use or define that register.

Most changes following from this are pretty simple (you need an MRI anyway if
you're going to be doing any transformations, so just check the type there).
But legalization doesn't really want to check redundant operands (when, for
example, a G_ADD only ever has one type) so I've made use of MCInstrDesc's
operand type field to encode these constraints and limit legalization's work.

As an added bonus, more validation is possible, both in MachineVerifier and
MachineIRBuilder (coming soon).

llvm-svn: 281035

											
										
										
											2016-09-09 19:46:34 +08:00
+								      Res, Addr,
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								      *MF->getMachineMemOperand(MachinePointerInfo(LI.getPointerOperand()),
 								                                Flags, DL->getTypeStoreSize(LI.getType()),
-												GlobalISel: represent atomic loads & stores via the MachineMemOperand.

Also make sure the AArch64 backend doesn't try to convert them into normal
loads and stores.

llvm-svn: 294993

											
										
										
											2017-02-14 06:14:16 +08:00
+								                                getMemOpAlignment(LI), AAMDNodes(), nullptr,
 								                                LI.getSynchScope(), LI.getOrdering()));
-												GlobalISel: add generic load and store instructions.

Pretty straightforward, the only oddity is the MachineMemOperand (which it's
surprisingly difficult to share code for).

llvm-svn: 276799

											
										
										
											2016-07-27 04:23:26 +08:00
+								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateStore(const User &U, MachineIRBuilder &MIRBuilder) {
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								  const StoreInst &SI = cast<StoreInst>(U);
-												GlobalISel: support translating volatile loads and stores.

llvm-svn: 284603

											
										
										
											2016-10-19 23:55:06 +08:00
+								  auto Flags = SI.isVolatile() ? MachineMemOperand::MOVolatile
 								                               : MachineMemOperand::MONone;
 								  Flags |= MachineMemOperand::MOStore;
-												GlobalISel: add generic load and store instructions.

Pretty straightforward, the only oddity is the MachineMemOperand (which it's
surprisingly difficult to share code for).

llvm-svn: 276799

											
										
										
											2016-07-27 04:23:26 +08:00
 								  unsigned Val = getOrCreateVReg(*SI.getValueOperand());
 								  unsigned Addr = getOrCreateVReg(*SI.getPointerOperand());
 								  MIRBuilder.buildStore(
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								      Val, Addr,
 								      *MF->getMachineMemOperand(
 								          MachinePointerInfo(SI.getPointerOperand()), Flags,
 								          DL->getTypeStoreSize(SI.getValueOperand()->getType()),
-												GlobalISel: represent atomic loads & stores via the MachineMemOperand.

Also make sure the AArch64 backend doesn't try to convert them into normal
loads and stores.

llvm-svn: 294993

											
										
										
											2017-02-14 06:14:16 +08:00
+								          getMemOpAlignment(SI), AAMDNodes(), nullptr, SI.getSynchScope(),
 								          SI.getOrdering()));
-												GlobalISel: add generic load and store instructions.

Pretty straightforward, the only oddity is the MachineMemOperand (which it's
surprisingly difficult to share code for).

llvm-svn: 276799

											
										
										
											2016-07-27 04:23:26 +08:00
+								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateExtractValue(const User &U,
 								                                         MachineIRBuilder &MIRBuilder) {
-												GlobalISel: fix insert/extract to work on ConstantExprs too.

No tests yet unfortunately (ConstantFolding reduces all supported constants to
ConstantInts before we get to translation). Soon.

llvm-svn: 279308

											
										
										
											2016-08-20 04:09:03 +08:00
+								  const Value *Src = U.getOperand(0);
 								  Type *Int32Ty = Type::getInt32Ty(U.getContext());
-												GlobalISel: support translation of extractvalue instructions.

llvm-svn: 279285

											
										
										
											2016-08-20 01:47:05 +08:00
+								  SmallVector<Value *, 1> Indices;
-												[GlobalISel] IRTranslator: Translate ConstantStruct

Reviewers: qcolombet, ab, t.p.northover, aditya_nandakumar, dsanders

Reviewed By: qcolombet

Subscribers: rovka, kristof.beyls, javed.absar, igorb, llvm-commits

Differential Revision: https://reviews.llvm.org/D33317

llvm-svn: 303412

											
										
										
											2017-05-19 17:47:02 +08:00
+								  // If Src is a single element ConstantStruct, translate extractvalue
 								  // to that element to avoid inserting a cast instruction.
 								  if (auto CS = dyn_cast<ConstantStruct>(Src))
 								    if (CS->getNumOperands() == 1) {
 								      unsigned Res = getOrCreateVReg(*CS->getOperand(0));
 								      ValToVReg[&U] = Res;
 								      return true;
 								    }
-												GlobalISel: support translation of extractvalue instructions.

llvm-svn: 279285

											
										
										
											2016-08-20 01:47:05 +08:00
+								  // getIndexedOffsetInType is designed for GEPs, so the first index is the
 								  // usual array element rather than looking into the actual aggregate.
 								  Indices.push_back(ConstantInt::get(Int32Ty, 0));
-												GlobalISel: fix insert/extract to work on ConstantExprs too.

No tests yet unfortunately (ConstantFolding reduces all supported constants to
ConstantInts before we get to translation). Soon.

llvm-svn: 279308

											
										
										
											2016-08-20 04:09:03 +08:00
 								  if (const ExtractValueInst *EVI = dyn_cast<ExtractValueInst>(&U)) {
 								    for (auto Idx : EVI->indices())
 								      Indices.push_back(ConstantInt::get(Int32Ty, Idx));
 								  } else {
 								    for (unsigned i = 1; i < U.getNumOperands(); ++i)
 								      Indices.push_back(U.getOperand(i));
 								  }
-												GlobalISel: support translation of extractvalue instructions.

llvm-svn: 279285

											
										
										
											2016-08-20 01:47:05 +08:00
 								  uint64_t Offset = 8 * DL->getIndexedOffsetInType(Src->getType(), Indices);
-												GlobalISel: fix insert/extract to work on ConstantExprs too.

No tests yet unfortunately (ConstantFolding reduces all supported constants to
ConstantInts before we get to translation). Soon.

llvm-svn: 279308

											
										
										
											2016-08-20 04:09:03 +08:00
+								  unsigned Res = getOrCreateVReg(U);
-												GlobalISel: restrict G_EXTRACT instruction to just one operand.

A bit more painful than G_INSERT because it was more widely used, but this
should simplify the handling of extract operations in most locations.

llvm-svn: 297100

											
										
										
											2017-03-07 07:50:28 +08:00
+								  MIRBuilder.buildExtract(Res, getOrCreateVReg(*Src), Offset);
-												GlobalISel: support translation of extractvalue instructions.

llvm-svn: 279285

											
										
										
											2016-08-20 01:47:05 +08:00
 								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateInsertValue(const User &U,
 								                                        MachineIRBuilder &MIRBuilder) {
-												GlobalISel: fix insert/extract to work on ConstantExprs too.

No tests yet unfortunately (ConstantFolding reduces all supported constants to
ConstantInts before we get to translation). Soon.

llvm-svn: 279308

											
										
										
											2016-08-20 04:09:03 +08:00
+								  const Value *Src = U.getOperand(0);
 								  Type *Int32Ty = Type::getInt32Ty(U.getContext());
-												GlobalISel: translate insertvalue instructions.

This adds a G_INSERT instruction, which technically makes G_SEQUENCE redundant
(it's equivalent to a G_INSERT into an IMPLICIT_DEF). We'll leave G_SEQUENCE
for now though: it's likely to be far more common as it's a fundamental part of
legalization, so avoiding the mess and bloat of the extra IMPLICIT_DEFs is
probably worthwhile.

llvm-svn: 279306

											
										
										
											2016-08-20 04:08:55 +08:00
+								  SmallVector<Value *, 1> Indices;
 								  // getIndexedOffsetInType is designed for GEPs, so the first index is the
 								  // usual array element rather than looking into the actual aggregate.
 								  Indices.push_back(ConstantInt::get(Int32Ty, 0));
-												GlobalISel: fix insert/extract to work on ConstantExprs too.

No tests yet unfortunately (ConstantFolding reduces all supported constants to
ConstantInts before we get to translation). Soon.

llvm-svn: 279308

											
										
										
											2016-08-20 04:09:03 +08:00
 								  if (const InsertValueInst *IVI = dyn_cast<InsertValueInst>(&U)) {
 								    for (auto Idx : IVI->indices())
 								      Indices.push_back(ConstantInt::get(Int32Ty, Idx));
 								  } else {
 								    for (unsigned i = 2; i < U.getNumOperands(); ++i)
 								      Indices.push_back(U.getOperand(i));
 								  }
-												GlobalISel: translate insertvalue instructions.

This adds a G_INSERT instruction, which technically makes G_SEQUENCE redundant
(it's equivalent to a G_INSERT into an IMPLICIT_DEF). We'll leave G_SEQUENCE
for now though: it's likely to be far more common as it's a fundamental part of
legalization, so avoiding the mess and bloat of the extra IMPLICIT_DEFs is
probably worthwhile.

llvm-svn: 279306

											
										
										
											2016-08-20 04:08:55 +08:00
 								  uint64_t Offset = 8 * DL->getIndexedOffsetInType(Src->getType(), Indices);
-												GlobalISel: fix insert/extract to work on ConstantExprs too.

No tests yet unfortunately (ConstantFolding reduces all supported constants to
ConstantInts before we get to translation). Soon.

llvm-svn: 279308

											
										
										
											2016-08-20 04:09:03 +08:00
+								  unsigned Res = getOrCreateVReg(U);
-												[GlobalISel] Remove non-determinism from IRTranslator.

This showed up in r300535/r300537, which were reverted in r300538 due to
some of the introduced tests in there failing on some bots, due to the
non-determinism fixed in this commit.

Re-committing r300535/r300537 will add 2 tests for the change in this
commit.

llvm-svn: 300663

											
										
										
											2017-04-19 14:38:37 +08:00
+								  unsigned Inserted = getOrCreateVReg(*U.getOperand(1));
 								  MIRBuilder.buildInsert(Res, getOrCreateVReg(*Src), Inserted, Offset);
-												GlobalISel: translate insertvalue instructions.

This adds a G_INSERT instruction, which technically makes G_SEQUENCE redundant
(it's equivalent to a G_INSERT into an IMPLICIT_DEF). We'll leave G_SEQUENCE
for now though: it's likely to be far more common as it's a fundamental part of
legalization, so avoiding the mess and bloat of the extra IMPLICIT_DEFs is
probably worthwhile.

llvm-svn: 279306

											
										
										
											2016-08-20 04:08:55 +08:00
 								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateSelect(const User &U,
 								                                   MachineIRBuilder &MIRBuilder) {
-												[GlobalISel] Remove non-determinism from IRTranslator.

This showed up in r300535/r300537, which were reverted in r300538 due to
some of the introduced tests in there failing on some bots, due to the
non-determinism fixed in this commit.

Re-committing r300535/r300537 will add 2 tests for the change in this
commit.

llvm-svn: 300663

											
										
										
											2017-04-19 14:38:37 +08:00
+								  unsigned Res = getOrCreateVReg(U);
 								  unsigned Tst = getOrCreateVReg(*U.getOperand(0));
 								  unsigned Op0 = getOrCreateVReg(*U.getOperand(1));
 								  unsigned Op1 = getOrCreateVReg(*U.getOperand(2));
 								  MIRBuilder.buildSelect(Res, Tst, Op0, Op1);
-												GlobalISel: support translating select instructions.

llvm-svn: 279309

											
										
										
											2016-08-20 04:09:07 +08:00
+								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateBitCast(const User &U,
 								                                    MachineIRBuilder &MIRBuilder) {
-												[GlobalISel] Avoid invalidating ValToVReg when translating no-op bitcast.

When we translate a no-op (same type) bitcast, we try to be clever and
only emit a COPY if we already assigned a vreg to the defined value.
However, when we didn't, we tried to assign to a reference into the
ValToVReg DenseMap, even though the RHS of the assignment
(getOrCreateVReg) could potentially grow that DenseMap, invalidating the
reference.

Avoid that by getting the source vreg first.
I audited the rest of the translator; this is the only tricky case.

The test is quite unwieldy, as the problem is caused by the DenseMap
growing, which happens after the 47th mapped value.

llvm-svn: 297208

											
										
										
											2017-03-08 04:53:06 +08:00
+								  // If we're bitcasting to the source type, we can reuse the source vreg.
-												Recommit: [globalisel] Change LLT constructor string into an LLT-based object that knows how to generate it.

Summary:
This will allow future patches to inspect the details of the LLT. The implementation is now split between
the Support and CodeGen libraries to allow TableGen to use this class without introducing layering concerns.

Thanks to Ahmed Bougacha for finding a reasonable way to avoid the layering issue and providing the version of this patch without that problem.

The problem with the previous commit appears to have been that TableGen was including CodeGen/LowLevelType.h instead of Support/LowLevelTypeImpl.h.

Reviewers: t.p.northover, qcolombet, rovka, aditya_nandakumar, ab, javed.absar

Subscribers: arsenm, nhaehnle, mgorny, dberris, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30046

llvm-svn: 297241

											
										
										
											2017-03-08 07:20:35 +08:00
+								  if (getLLTForType(*U.getOperand(0)->getType(), *DL) ==
 								      getLLTForType(*U.getType(), *DL)) {
-												[GlobalISel] Avoid invalidating ValToVReg when translating no-op bitcast.

When we translate a no-op (same type) bitcast, we try to be clever and
only emit a COPY if we already assigned a vreg to the defined value.
However, when we didn't, we tried to assign to a reference into the
ValToVReg DenseMap, even though the RHS of the assignment
(getOrCreateVReg) could potentially grow that DenseMap, invalidating the
reference.

Avoid that by getting the source vreg first.
I audited the rest of the translator; this is the only tricky case.

The test is quite unwieldy, as the problem is caused by the DenseMap
growing, which happens after the 47th mapped value.

llvm-svn: 297208

											
										
										
											2017-03-08 04:53:06 +08:00
+								    // Get the source vreg now, to avoid invalidating ValToVReg.
 								    unsigned SrcReg = getOrCreateVReg(*U.getOperand(0));
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								    unsigned &Reg = ValToVReg[&U];
-												[GlobalISel] Avoid invalidating ValToVReg when translating no-op bitcast.

When we translate a no-op (same type) bitcast, we try to be clever and
only emit a COPY if we already assigned a vreg to the defined value.
However, when we didn't, we tried to assign to a reference into the
ValToVReg DenseMap, even though the RHS of the assignment
(getOrCreateVReg) could potentially grow that DenseMap, invalidating the
reference.

Avoid that by getting the source vreg first.
I audited the rest of the translator; this is the only tricky case.

The test is quite unwieldy, as the problem is caused by the DenseMap
growing, which happens after the 47th mapped value.

llvm-svn: 297208

											
										
										
											2017-03-08 04:53:06 +08:00
+								    // If we already assigned a vreg for this bitcast, we can't change that.
 								    // Emit a copy to satisfy the users we already emitted.
-												GlobalISel: avoid inserting redundant COPYs for bitcasts.

If the value produced by the bitcast hasn't been referenced yet, we can simply
reuse the input register avoiding an unnecessary COPY instruction.

llvm-svn: 278245

											
										
										
											2016-08-11 00:51:14 +08:00
+								    if (Reg)
-												[GlobalISel] Avoid invalidating ValToVReg when translating no-op bitcast.

When we translate a no-op (same type) bitcast, we try to be clever and
only emit a COPY if we already assigned a vreg to the defined value.
However, when we didn't, we tried to assign to a reference into the
ValToVReg DenseMap, even though the RHS of the assignment
(getOrCreateVReg) could potentially grow that DenseMap, invalidating the
reference.

Avoid that by getting the source vreg first.
I audited the rest of the translator; this is the only tricky case.

The test is quite unwieldy, as the problem is caused by the DenseMap
growing, which happens after the 47th mapped value.

llvm-svn: 297208

											
										
										
											2017-03-08 04:53:06 +08:00
+								      MIRBuilder.buildCopy(Reg, SrcReg);
-												GlobalISel: avoid inserting redundant COPYs for bitcasts.

If the value produced by the bitcast hasn't been referenced yet, we can simply
reuse the input register avoiding an unnecessary COPY instruction.

llvm-svn: 278245

											
										
										
											2016-08-11 00:51:14 +08:00
+								    else
-												[GlobalISel] Avoid invalidating ValToVReg when translating no-op bitcast.

When we translate a no-op (same type) bitcast, we try to be clever and
only emit a COPY if we already assigned a vreg to the defined value.
However, when we didn't, we tried to assign to a reference into the
ValToVReg DenseMap, even though the RHS of the assignment
(getOrCreateVReg) could potentially grow that DenseMap, invalidating the
reference.

Avoid that by getting the source vreg first.
I audited the rest of the translator; this is the only tricky case.

The test is quite unwieldy, as the problem is caused by the DenseMap
growing, which happens after the 47th mapped value.

llvm-svn: 297208

											
										
										
											2017-03-08 04:53:06 +08:00
+								      Reg = SrcReg;
-												GlobalISel: add generic casts to IRTranslator

This adds LLVM's 3 main cast instructions (inttoptr, ptrtoint, bitcast) to the
IRTranslator. The first two are direct translations (with 2 MachineInstr types
each). Since LLT discards information, a bitcast might become trivial and we
emit a COPY in those cases instead.

llvm-svn: 276690

											
										
										
											2016-07-26 05:01:29 +08:00
+								    return true;
 								  }
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								  return translateCast(TargetOpcode::G_BITCAST, U, MIRBuilder);
-												GlobalISel: add generic casts to IRTranslator

This adds LLVM's 3 main cast instructions (inttoptr, ptrtoint, bitcast) to the
IRTranslator. The first two are direct translations (with 2 MachineInstr types
each). Since LLT discards information, a bitcast might become trivial and we
emit a COPY in those cases instead.

llvm-svn: 276690

											
										
										
											2016-07-26 05:01:29 +08:00
+								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateCast(unsigned Opcode, const User &U,
 								                                 MachineIRBuilder &MIRBuilder) {
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								  unsigned Op = getOrCreateVReg(*U.getOperand(0));
 								  unsigned Res = getOrCreateVReg(U);
-												GlobalISel: move type information to MachineRegisterInfo.

We want each register to have a canonical type, which means the best place to
store this is in MachineRegisterInfo rather than on every MachineInstr that
happens to use or define that register.

Most changes following from this are pretty simple (you need an MRI anyway if
you're going to be doing any transformations, so just check the type there).
But legalization doesn't really want to check redundant operands (when, for
example, a G_ADD only ever has one type) so I've made use of MCInstrDesc's
operand type field to encode these constraints and limit legalization's work.

As an added bonus, more validation is possible, both in MachineVerifier and
MachineIRBuilder (coming soon).

llvm-svn: 281035

											
										
										
											2016-09-09 19:46:34 +08:00
+								  MIRBuilder.buildInstr(Opcode).addDef(Res).addUse(Op);
-												GlobalISel: add generic casts to IRTranslator

This adds LLVM's 3 main cast instructions (inttoptr, ptrtoint, bitcast) to the
IRTranslator. The first two are direct translations (with 2 MachineInstr types
each). Since LLT discards information, a bitcast might become trivial and we
emit a COPY in those cases instead.

llvm-svn: 276690

											
										
										
											2016-07-26 05:01:29 +08:00
+								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateGetElementPtr(const User &U,
 								                                          MachineIRBuilder &MIRBuilder) {
-												GlobalISel: translate GEP instructions.

Unlike SDag, we use a separate G_GEP instruction (much simplified, only taking
a single byte offset) to preserve the pointer type information through
selection.

llvm-svn: 281205

											
										
										
											2016-09-12 19:20:22 +08:00
+								  // FIXME: support vector GEPs.
 								  if (U.getType()->isVectorTy())
 								    return false;
 								  Value &Op0 = *U.getOperand(0);
 								  unsigned BaseReg = getOrCreateVReg(Op0);
-												[GlobalISel] Avoid translating synthetic constants to new G_CONSTANTS.

Currently, we create a G_CONSTANT for every "synthetic" integer
constant operand (for instance, for the G_GEP offset).
Instead, share the G_CONSTANTs we might have created by going through
the ValueToVReg machinery.

When we're emitting synthetic constants, we do need to get Constants from
the context.  One could argue that we shouldn't modify the context at
all (for instance, this means that we're going to use a tad more memory
if the constant wasn't used elsewhere), but constants are mostly
harmless.  We currently do this for extractvalue and all.

For constant fcmp, this does mean we'll emit an extra COPY, which is not
necessarily more optimal than an extra materialized constant.
But that preserves the current intended design of uniqued G_CONSTANTs,
and the rematerialization problem exists elsewhere and should be
resolved with a single coherent solution.

llvm-svn: 297875

											
										
										
											2017-03-16 03:21:11 +08:00
+								  Type *PtrIRTy = Op0.getType();
 								  LLT PtrTy = getLLTForType(*PtrIRTy, *DL);
 								  Type *OffsetIRTy = DL->getIntPtrType(PtrIRTy);
 								  LLT OffsetTy = getLLTForType(*OffsetIRTy, *DL);
-												GlobalISel: translate GEP instructions.

Unlike SDag, we use a separate G_GEP instruction (much simplified, only taking
a single byte offset) to preserve the pointer type information through
selection.

llvm-svn: 281205

											
										
										
											2016-09-12 19:20:22 +08:00
 								  int64_t Offset = 0;
 								  for (gep_type_iterator GTI = gep_type_begin(&U), E = gep_type_end(&U);
 								       GTI != E; ++GTI) {
 								    const Value *Idx = GTI.getOperand();
-												Fix GlobalISel build.

llvm-svn: 288460

											
										
										
											2016-12-02 10:55:30 +08:00
+								    if (StructType *StTy = GTI.getStructTypeOrNull()) {
-												GlobalISel: translate GEP instructions.

Unlike SDag, we use a separate G_GEP instruction (much simplified, only taking
a single byte offset) to preserve the pointer type information through
selection.

llvm-svn: 281205

											
										
										
											2016-09-12 19:20:22 +08:00
+								      unsigned Field = cast<Constant>(Idx)->getUniqueInteger().getZExtValue();
 								      Offset += DL->getStructLayout(StTy)->getElementOffset(Field);
 								      continue;
 								    } else {
 								      uint64_t ElementSize = DL->getTypeAllocSize(GTI.getIndexedType());
 								      // If this is a scalar constant or a splat vector of constants,
 								      // handle it quickly.
 								      if (const auto *CI = dyn_cast<ConstantInt>(Idx)) {
 								        Offset += ElementSize * CI->getSExtValue();
 								        continue;
 								      }
 								      if (Offset != 0) {
 								        unsigned NewBaseReg = MRI->createGenericVirtualRegister(PtrTy);
-												[GlobalISel] Avoid translating synthetic constants to new G_CONSTANTS.

Currently, we create a G_CONSTANT for every "synthetic" integer
constant operand (for instance, for the G_GEP offset).
Instead, share the G_CONSTANTs we might have created by going through
the ValueToVReg machinery.

When we're emitting synthetic constants, we do need to get Constants from
the context.  One could argue that we shouldn't modify the context at
all (for instance, this means that we're going to use a tad more memory
if the constant wasn't used elsewhere), but constants are mostly
harmless.  We currently do this for extractvalue and all.

For constant fcmp, this does mean we'll emit an extra COPY, which is not
necessarily more optimal than an extra materialized constant.
But that preserves the current intended design of uniqued G_CONSTANTs,
and the rematerialization problem exists elsewhere and should be
resolved with a single coherent solution.

llvm-svn: 297875

											
										
										
											2017-03-16 03:21:11 +08:00
+								        unsigned OffsetReg =
 								            getOrCreateVReg(*ConstantInt::get(OffsetIRTy, Offset));
-												GlobalISel: translate GEP instructions.

Unlike SDag, we use a separate G_GEP instruction (much simplified, only taking
a single byte offset) to preserve the pointer type information through
selection.

llvm-svn: 281205

											
										
										
											2016-09-12 19:20:22 +08:00
+								        MIRBuilder.buildGEP(NewBaseReg, BaseReg, OffsetReg);
 								        BaseReg = NewBaseReg;
 								        Offset = 0;
 								      }
 								      // N = N + Idx * ElementSize;
-												[GlobalISel] Avoid translating synthetic constants to new G_CONSTANTS.

Currently, we create a G_CONSTANT for every "synthetic" integer
constant operand (for instance, for the G_GEP offset).
Instead, share the G_CONSTANTs we might have created by going through
the ValueToVReg machinery.

When we're emitting synthetic constants, we do need to get Constants from
the context.  One could argue that we shouldn't modify the context at
all (for instance, this means that we're going to use a tad more memory
if the constant wasn't used elsewhere), but constants are mostly
harmless.  We currently do this for extractvalue and all.

For constant fcmp, this does mean we'll emit an extra COPY, which is not
necessarily more optimal than an extra materialized constant.
But that preserves the current intended design of uniqued G_CONSTANTs,
and the rematerialization problem exists elsewhere and should be
resolved with a single coherent solution.

llvm-svn: 297875

											
										
										
											2017-03-16 03:21:11 +08:00
+								      unsigned ElementSizeReg =
 								          getOrCreateVReg(*ConstantInt::get(OffsetIRTy, ElementSize));
-												GlobalISel: translate GEP instructions.

Unlike SDag, we use a separate G_GEP instruction (much simplified, only taking
a single byte offset) to preserve the pointer type information through
selection.

llvm-svn: 281205

											
										
										
											2016-09-12 19:20:22 +08:00
 								      unsigned IdxReg = getOrCreateVReg(*Idx);
 								      if (MRI->getType(IdxReg) != OffsetTy) {
 								        unsigned NewIdxReg = MRI->createGenericVirtualRegister(OffsetTy);
 								        MIRBuilder.buildSExtOrTrunc(NewIdxReg, IdxReg);
 								        IdxReg = NewIdxReg;
 								      }
 								      unsigned OffsetReg = MRI->createGenericVirtualRegister(OffsetTy);
 								      MIRBuilder.buildMul(OffsetReg, ElementSizeReg, IdxReg);
 								      unsigned NewBaseReg = MRI->createGenericVirtualRegister(PtrTy);
 								      MIRBuilder.buildGEP(NewBaseReg, BaseReg, OffsetReg);
 								      BaseReg = NewBaseReg;
 								    }
 								  }
 								  if (Offset != 0) {
-												[GlobalISel] Avoid translating synthetic constants to new G_CONSTANTS.

Currently, we create a G_CONSTANT for every "synthetic" integer
constant operand (for instance, for the G_GEP offset).
Instead, share the G_CONSTANTs we might have created by going through
the ValueToVReg machinery.

When we're emitting synthetic constants, we do need to get Constants from
the context.  One could argue that we shouldn't modify the context at
all (for instance, this means that we're going to use a tad more memory
if the constant wasn't used elsewhere), but constants are mostly
harmless.  We currently do this for extractvalue and all.

For constant fcmp, this does mean we'll emit an extra COPY, which is not
necessarily more optimal than an extra materialized constant.
But that preserves the current intended design of uniqued G_CONSTANTs,
and the rematerialization problem exists elsewhere and should be
resolved with a single coherent solution.

llvm-svn: 297875

											
										
										
											2017-03-16 03:21:11 +08:00
+								    unsigned OffsetReg = getOrCreateVReg(*ConstantInt::get(OffsetIRTy, Offset));
-												GlobalISel: translate GEP instructions.

Unlike SDag, we use a separate G_GEP instruction (much simplified, only taking
a single byte offset) to preserve the pointer type information through
selection.

llvm-svn: 281205

											
										
										
											2016-09-12 19:20:22 +08:00
+								    MIRBuilder.buildGEP(getOrCreateVReg(U), BaseReg, OffsetReg);
 								    return true;
 								  }
 								  MIRBuilder.buildCopy(getOrCreateVReg(U), BaseReg);
 								  return true;
 								}
-												GlobalISel: translate memset & memmove.

llvm-svn: 293541

											
										
										
											2017-01-31 03:33:07 +08:00
+								bool IRTranslator::translateMemfunc(const CallInst &CI,
 								                                    MachineIRBuilder &MIRBuilder,
 								                                    unsigned ID) {
-												Recommit: [globalisel] Change LLT constructor string into an LLT-based object that knows how to generate it.

Summary:
This will allow future patches to inspect the details of the LLT. The implementation is now split between
the Support and CodeGen libraries to allow TableGen to use this class without introducing layering concerns.

Thanks to Ahmed Bougacha for finding a reasonable way to avoid the layering issue and providing the version of this patch without that problem.

The problem with the previous commit appears to have been that TableGen was including CodeGen/LowLevelType.h instead of Support/LowLevelTypeImpl.h.

Reviewers: t.p.northover, qcolombet, rovka, aditya_nandakumar, ab, javed.absar

Subscribers: arsenm, nhaehnle, mgorny, dberris, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30046

llvm-svn: 297241

											
										
										
											2017-03-08 07:20:35 +08:00
+								  LLT SizeTy = getLLTForType(*CI.getArgOperand(2)->getType(), *DL);
-												GlobalISel: translate memset & memmove.

llvm-svn: 293541

											
										
										
											2017-01-31 03:33:07 +08:00
+								  Type *DstTy = CI.getArgOperand(0)->getType();
 								  if (cast<PointerType>(DstTy)->getAddressSpace() != 0 ||
-												GlobalISel: translate memcpy intrinsics.

llvm-svn: 284525

											
										
										
											2016-10-19 04:03:45 +08:00
+								      SizeTy.getSizeInBits() != DL->getPointerSizeInBits(0))
 								    return false;
 								  SmallVector<CallLowering::ArgInfo, 8> Args;
 								  for (int i = 0; i < 3; ++i) {
 								    const auto &Arg = CI.getArgOperand(i);
 								    Args.emplace_back(getOrCreateVReg(*Arg), Arg->getType());
 								  }
-												GlobalISel: translate memset & memmove.

llvm-svn: 293541

											
										
										
											2017-01-31 03:33:07 +08:00
+								  const char *Callee;
 								  switch (ID) {
 								  case Intrinsic::memmove:
 								  case Intrinsic::memcpy: {
 								    Type *SrcTy = CI.getArgOperand(1)->getType();
 								    if(cast<PointerType>(SrcTy)->getAddressSpace() != 0)
 								      return false;
 								    Callee = ID == Intrinsic::memcpy ? "memcpy" : "memmove";
 								    break;
 								  }
 								  case Intrinsic::memset:
 								    Callee = "memset";
 								    break;
 								  default:
 								    return false;
 								  }
-												GlobalISel: translate memcpy intrinsics.

llvm-svn: 284525

											
										
										
											2016-10-19 04:03:45 +08:00
-												[GlobalISel] Use the correct calling conv for calls

This commit adds a parameter that lets us pass in the calling convention
of the call to CallLowering::lowerCall. This allows us to handle
situations where the calling convetion of the callee is different from
that of the caller.

Differential Revision: https://reviews.llvm.org/D31039

llvm-svn: 298254

											
										
										
											2017-03-20 22:40:18 +08:00
+								  return CLI->lowerCall(MIRBuilder, CI.getCallingConv(),
 								                        MachineOperand::CreateES(Callee),
-												GlobalISel: translate memcpy intrinsics.

llvm-svn: 284525

											
										
										
											2016-10-19 04:03:45 +08:00
+								                        CallLowering::ArgInfo(0, CI.getType()), Args);
 								}
-												GlobalISel: translate GEP instructions.

Unlike SDag, we use a separate G_GEP instruction (much simplified, only taking
a single byte offset) to preserve the pointer type information through
selection.

llvm-svn: 281205

											
										
										
											2016-09-12 19:20:22 +08:00
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								void IRTranslator::getStackGuard(unsigned DstReg,
 								                                 MachineIRBuilder &MIRBuilder) {
-												GlobalISel: set correct regclass for LOAD_STACK_GUARD.

Since it's not actually a generic MI, its register operands need a RegClass,
which is conveniently the target's pointer RegClass.

llvm-svn: 293335

											
										
										
											2017-01-28 05:31:24 +08:00
+								  const TargetRegisterInfo *TRI = MF->getSubtarget().getRegisterInfo();
 								  MRI->setRegClass(DstReg, TRI->getPointerRegClass(*MF));
-												GlobalISel: translate stack protector intrinsics

llvm-svn: 285614

											
										
										
											2016-11-01 02:30:59 +08:00
+								  auto MIB = MIRBuilder.buildInstr(TargetOpcode::LOAD_STACK_GUARD);
 								  MIB.addDef(DstReg);
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								  auto &TLI = *MF->getSubtarget().getTargetLowering();
 								  Value *Global = TLI.getSDagStackGuard(*MF->getFunction()->getParent());
-												GlobalISel: translate stack protector intrinsics

llvm-svn: 285614

											
										
										
											2016-11-01 02:30:59 +08:00
+								  if (!Global)
 								    return;
 								  MachinePointerInfo MPInfo(Global);
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								  MachineInstr::mmo_iterator MemRefs = MF->allocateMemRefsArray(1);
-												GlobalISel: translate stack protector intrinsics

llvm-svn: 285614

											
										
										
											2016-11-01 02:30:59 +08:00
+								  auto Flags = MachineMemOperand::MOLoad | MachineMemOperand::MOInvariant |
 								               MachineMemOperand::MODereferenceable;
 								  *MemRefs =
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								      MF->getMachineMemOperand(MPInfo, Flags, DL->getPointerSizeInBits() / 8,
 								                               DL->getPointerABIAlignment());
-												GlobalISel: translate stack protector intrinsics

llvm-svn: 285614

											
										
										
											2016-11-01 02:30:59 +08:00
+								  MIB.setMemRefs(MemRefs, MemRefs + 1);
 								}
-												GlobalISel: factor overflow handling into separate function. NFC.

llvm-svn: 289149

											
										
										
											2016-12-09 06:44:00 +08:00
 								/// Translate an arithmetic-with-overflow intrinsic call \p CI into a single
 								/// generic instruction with opcode \p Op.
 								///
 								/// The instruction defines two registers: a result typed like the call's first
 								/// operand and a 1-bit overflow flag. Both are then packed into the virtual
 								/// register that represents \p CI. Always returns true.
+								bool IRTranslator::translateOverflowIntrinsic(const CallInst &CI, unsigned Op,
 								                                              MachineIRBuilder &MIRBuilder) {
-												Recommit: [globalisel] Change LLT constructor string into an LLT-based object that knows how to generate it.

Summary:
This will allow future patches to inspect the details of the LLT. The implementation is now split between
the Support and CodeGen libraries to allow TableGen to use this class without introducing layering concerns.

Thanks to Ahmed Bougacha for finding a reasonable way to avoid the layering issue and providing the version of this patch without that problem.

The problem with the previous commit appears to have been that TableGen was including CodeGen/LowLevelType.h instead of Support/LowLevelTypeImpl.h.

Reviewers: t.p.northover, qcolombet, rovka, aditya_nandakumar, ab, javed.absar

Subscribers: arsenm, nhaehnle, mgorny, dberris, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30046

llvm-svn: 297241

											
										
										
											2017-03-08 07:20:35 +08:00
+								  LLT Ty = getLLTForType(*CI.getOperand(0)->getType(), *DL);
-												GlobalISel: factor overflow handling into separate function. NFC.

llvm-svn: 289149

											
										
										
											2016-12-09 06:44:00 +08:00
+								  LLT s1 = LLT::scalar(1);
 								  unsigned Width = Ty.getSizeInBits();
 								  unsigned Res = MRI->createGenericVirtualRegister(Ty);
 								  unsigned Overflow = MRI->createGenericVirtualRegister(s1);
 								  auto MIB = MIRBuilder.buildInstr(Op)
 								                 .addDef(Res)
 								                 .addDef(Overflow)
 								                 .addUse(getOrCreateVReg(*CI.getOperand(0)))
 								                 .addUse(getOrCreateVReg(*CI.getOperand(1)));
 								  // G_UADDE and G_USUBE take one extra use operand; it is fed an i1 zero
 								  // constant here (presumably the incoming carry -- confirm against the
 								  // opcode definitions).
 								  if (Op == TargetOpcode::G_UADDE || Op == TargetOpcode::G_USUBE) {
-												[GlobalISel] Avoid translating synthetic constants to new G_CONSTANTS.

Currently, we create a G_CONSTANT for every "synthetic" integer
constant operand (for instance, for the G_GEP offset).
Instead, share the G_CONSTANTs we might have created by going through
the ValueToVReg machinery.

When we're emitting synthetic constants, we do need to get Constants from
the context.  One could argue that we shouldn't modify the context at
all (for instance, this means that we're going to use a tad more memory
if the constant wasn't used elsewhere), but constants are mostly
harmless.  We currently do this for extractvalue and all.

For constant fcmp, this does mean we'll emit an extra COPY, which is not
necessarily more optimal than an extra materialized constant.
But that preserves the current intended design of uniqued G_CONSTANTs,
and the rematerialization problem exists elsewhere and should be
resolved with a single coherent solution.

llvm-svn: 297875

											
										
										
											2017-03-16 03:21:11 +08:00
+								    unsigned Zero = getOrCreateVReg(
 								        *Constant::getNullValue(Type::getInt1Ty(CI.getContext())));
-												GlobalISel: factor overflow handling into separate function. NFC.

llvm-svn: 289149

											
										
										
											2016-12-09 06:44:00 +08:00
+								    MIB.addUse(Zero);
 								  }
-												GlobalISel: convert buildSequence to use non-deprecated instructions.

G_SEQUENCE is going away soon so as a first step the MachineIRBuilder needs to
be taught how to emulate it with alternatives. We use G_MERGE_VALUES where
possible, and a sequence of G_INSERTs if not.

llvm-svn: 306119

											
										
										
											2017-06-24 00:15:37 +08:00
 								  // Pack both outputs into the call's register: the arithmetic result at bit
 								  // offset 0 and the overflow flag at bit offset Width.
+								  MIRBuilder.buildSequence(getOrCreateVReg(CI), {Res, Overflow}, {0, Width});
-												GlobalISel: factor overflow handling into separate function. NFC.

llvm-svn: 289149

											
										
										
											2016-12-09 06:44:00 +08:00
+								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
 								/// Translate the intrinsic call \p CI with id \p ID if it is one of the
 								/// intrinsics special-cased in the switch below.
 								///
 								/// \returns true when the call was handled here (including the cases that are
 								/// deliberately dropped without emitting anything), false when \p ID has no
 								/// dedicated case or the case declined to handle it.
+								bool IRTranslator::translateKnownIntrinsic(const CallInst &CI, Intrinsic::ID ID,
 								                                           MachineIRBuilder &MIRBuilder) {
-												GlobalISel: support overflow arithmetic intrinsics.

Unsigned addition and subtraction can reuse the instructions created to
legalize large width operations (i.e. both produce and consume a carry flag).
Signed operations and multiplies get a dedicated op-with-overflow instruction.

Once this is produced the two values are combined into a struct register (which
will almost always be merged with a corresponding G_EXTRACT as part of
legalization).

llvm-svn: 279278

											
										
										
											2016-08-20 01:17:06 +08:00
+								  switch (ID) {
-												GlobalISel: factor overflow handling into separate function. NFC.

llvm-svn: 289149

											
										
										
											2016-12-09 06:44:00 +08:00
+								  default:
 								    // No dedicated handling: leave the switch and return false below.
 								    break;
-												GlobalISel: drop lifetime intrinsics during translation.

We don't use them yet and they just cause problems.

llvm-svn: 294770

											
										
										
											2017-02-11 03:10:38 +08:00
+								  case Intrinsic::lifetime_start:
 								  case Intrinsic::lifetime_end:
 								    // Stack coloring is not enabled in O0 (which we care about now) so we can
 								    // drop these. Make sure someone notices when we start compiling at higher
 								    // opts though.
 								    if (MF->getTarget().getOptLevel() != CodeGenOpt::None)
 								      return false;
 								    return true;
-												GlobalISel: support debug intrinsics.

The translation scheme is mostly cribbed from FastISel, and it's not entirely
convincing semantically. But it does seem to work in the common cases and allow
variables to be printed so it can't be all wrong.

llvm-svn: 293228

											
										
										
											2017-01-27 07:39:14 +08:00
+								  case Intrinsic::dbg_declare: {
 								    const DbgDeclareInst &DI = cast<DbgDeclareInst>(CI);
 								    assert(DI.getVariable() && "Missing variable");
 								    const Value *Address = DI.getAddress();
 								    // A missing or undef address gives nothing to describe; the intrinsic is
 								    // dropped but still counts as handled.
 								    if (!Address || isa<UndefValue>(Address)) {
 								      DEBUG(dbgs() << "Dropping debug info for " << DI << "\n");
 								      return true;
 								    }
 								    assert(DI.getVariable()->isValidLocationForIntrinsic(
 								               MIRBuilder.getDebugLoc()) &&
 								           "Expected inlined-at fields to agree");
-												GlobalISel: put debug info for static allocas in the MachineFunction.

The good reason to do this is that static allocas are pretty simple to handle
(especially at -O0) and avoiding tracking DBG_VALUEs throughout the pipeline
should give some kind of performance benefit.

The bad reason is that the debug pipeline is an unholy mess of implicit
contracts, where determining whether "DBG_VALUE %reg, imm" actually implies a
load or not involves the services of at least 3 soothsayers and the sacrifice
of at least one chicken.  And it still gets it wrong if the variable is at SP
directly.

llvm-svn: 297410

											
										
										
											2017-03-10 05:12:06 +08:00
+								    auto AI = dyn_cast<AllocaInst>(Address);
 								    if (AI && AI->isStaticAlloca()) {
 								      // Static allocas are tracked at the MF level, no need for DBG_VALUE
 								      // instructions (in fact, they get ignored if they *do* exist).
 								      MF->setVariableDbgInfo(DI.getVariable(), DI.getExpression(),
 								                             getOrCreateFrameIndex(*AI), DI.getDebugLoc());
-												GlobalISel: support debug intrinsics.

The translation scheme is mostly cribbed from FastISel, and it's not entirely
convincing semantically. But it does seem to work in the common cases and allow
variables to be printed so it can't be all wrong.

llvm-svn: 293228

											
										
										
											2017-01-27 07:39:14 +08:00
+								    } else
-												GlobalISel: put debug info for static allocas in the MachineFunction.

The good reason to do this is that static allocas are pretty simple to handle
(especially at -O0) and avoiding tracking DBG_VALUEs throughout the pipeline
should give some kind of performance benefit.

The bad reason is that the debug pipeline is an unholy mess of implicit
contracts, where determining whether "DBG_VALUE %reg, imm" actually implies a
load or not involves the services of at least 3 soothsayers and the sacrifice
of at least one chicken.  And it still gets it wrong if the variable is at SP
directly.

llvm-svn: 297410

											
										
										
											2017-03-10 05:12:06 +08:00
+								      MIRBuilder.buildDirectDbgValue(getOrCreateVReg(*Address),
 								                                     DI.getVariable(), DI.getExpression());
-												GlobalISel: fall back gracefully for debug intrinsics.

Supporting them properly is a reasonably complex chunk of work, so to allow bot
testing before then we should at least be able to fall back to DAG ISel.

llvm-svn: 289150

											
										
										
											2016-12-09 06:44:13 +08:00
+								    return true;
-												GlobalISel: support debug intrinsics.

The translation scheme is mostly cribbed from FastISel, and it's not entirely
convincing semantically. But it does seem to work in the common cases and allow
variables to be printed so it can't be all wrong.

llvm-svn: 293228

											
										
										
											2017-01-27 07:39:14 +08:00
+								  }
-												GlobalISel: translate @llvm.va_end intrinsic.

Turns out no-one actually cares about this one (at least) in tree so we can
just drop it entirely.

llvm-svn: 294345

											
										
										
											2017-02-08 04:08:59 +08:00
+								  case Intrinsic::vaend:
 								    // No target I know of cares about va_end. Certainly no in-tree target
 								    // does. Simplest intrinsic ever!
 								    return true;
-												GlobalISel: translate @llvm.va_start intrinsic.

Because we need to preserve the memory access being performed we need a
separate instruction to represent this.

llvm-svn: 294492

											
										
										
											2017-02-09 01:57:20 +08:00
+								  case Intrinsic::vastart: {
 								    auto &TLI = *MF->getSubtarget().getTargetLowering();
 								    Value *Ptr = CI.getArgOperand(0);
 								    // The target reports the va_list size in bits; the memory operand below
 								    // is given the size divided by 8.
 								    unsigned ListSize = TLI.getVaListSizeInBits(*DL) / 8;
 								    MIRBuilder.buildInstr(TargetOpcode::G_VASTART)
 								        .addUse(getOrCreateVReg(*Ptr))
 								        .addMemOperand(MF->getMachineMemOperand(
 								            MachinePointerInfo(Ptr), MachineMemOperand::MOStore, ListSize, 0));
 								    return true;
 								  }
-												GlobalISel: support debug intrinsics.

The translation scheme is mostly cribbed from FastISel, and it's not entirely
convincing semantically. But it does seem to work in the common cases and allow
variables to be printed so it can't be all wrong.

llvm-svn: 293228

											
										
										
											2017-01-27 07:39:14 +08:00
+								  case Intrinsic::dbg_value: {
 								    // This form of DBG_VALUE is target-independent.
 								    const DbgValueInst &DI = cast<DbgValueInst>(CI);
 								    const Value *V = DI.getValue();
 								    assert(DI.getVariable()->isValidLocationForIntrinsic(
 								               MIRBuilder.getDebugLoc()) &&
 								           "Expected inlined-at fields to agree");
 								    if (!V) {
 								      // Currently the optimizer can produce this; insert an undef to
 								      // help debugging.  Probably the optimizer should not do this.
 								      MIRBuilder.buildIndirectDbgValue(0, DI.getOffset(), DI.getVariable(),
 								                                       DI.getExpression());
 								    // NOTE(review): the local `CI` declared in the next condition shadows the
 								    // CallInst parameter of the same name within that branch.
 								    } else if (const auto *CI = dyn_cast<Constant>(V)) {
 								      MIRBuilder.buildConstDbgValue(*CI, DI.getOffset(), DI.getVariable(),
 								                                    DI.getExpression());
 								    } else {
 								      unsigned Reg = getOrCreateVReg(*V);
 								      // FIXME: This does not handle register-indirect values at offset 0. The
 								      // direct/indirect thing shouldn't really be handled by something as
 								      // implicit as reg+noreg vs reg+imm in the first place, but it seems
 								      // pretty baked in right now.
 								      if (DI.getOffset() != 0)
 								        MIRBuilder.buildIndirectDbgValue(Reg, DI.getOffset(), DI.getVariable(),
 								                                         DI.getExpression());
 								      else
 								        MIRBuilder.buildDirectDbgValue(Reg, DI.getVariable(),
 								                                       DI.getExpression());
 								    }
 								    return true;
 								  }
-												GlobalISel: factor overflow handling into separate function. NFC.

llvm-svn: 289149

											
										
										
											2016-12-09 06:44:00 +08:00
 								  // Each *_with_overflow intrinsic maps onto one generic opcode; the shared
 								  // helper emits the instruction and packs its two results.
+								  case Intrinsic::uadd_with_overflow:
 								    return translateOverflowIntrinsic(CI, TargetOpcode::G_UADDE, MIRBuilder);
 								  case Intrinsic::sadd_with_overflow:
 								    return translateOverflowIntrinsic(CI, TargetOpcode::G_SADDO, MIRBuilder);
 								  case Intrinsic::usub_with_overflow:
 								    return translateOverflowIntrinsic(CI, TargetOpcode::G_USUBE, MIRBuilder);
 								  case Intrinsic::ssub_with_overflow:
 								    return translateOverflowIntrinsic(CI, TargetOpcode::G_SSUBO, MIRBuilder);
 								  case Intrinsic::umul_with_overflow:
 								    return translateOverflowIntrinsic(CI, TargetOpcode::G_UMULO, MIRBuilder);
 								  case Intrinsic::smul_with_overflow:
 								    return translateOverflowIntrinsic(CI, TargetOpcode::G_SMULO, MIRBuilder);
-												GlobalISel: translate @llvm.pow intrinsic to G_FPOW.

It'll usually be immediately legalized back to a libcall, but occasionally
something can be done with it so we'd just as well enable that flexibility from
the start.

llvm-svn: 294530

											
										
										
											2017-02-09 07:23:32 +08:00
+								  case Intrinsic::pow:
 								    MIRBuilder.buildInstr(TargetOpcode::G_FPOW)
 								        .addDef(getOrCreateVReg(CI))
 								        .addUse(getOrCreateVReg(*CI.getArgOperand(0)))
 								        .addUse(getOrCreateVReg(*CI.getArgOperand(1)));
 								    return true;
-												[GISel]: Add G_FEXP, G_FEXP2 opcodes

Also add IRTranslator support.
https://reviews.llvm.org/D34710

llvm-svn: 306475

											
										
										
											2017-06-28 06:19:32 +08:00
+								  case Intrinsic::exp:
 								    MIRBuilder.buildInstr(TargetOpcode::G_FEXP)
 								        .addDef(getOrCreateVReg(CI))
 								        .addUse(getOrCreateVReg(*CI.getArgOperand(0)));
 								    return true;
 								  case Intrinsic::exp2:
 								    MIRBuilder.buildInstr(TargetOpcode::G_FEXP2)
 								        .addDef(getOrCreateVReg(CI))
 								        .addUse(getOrCreateVReg(*CI.getArgOperand(0)));
 								    return true;
-												[GISel]: Add G_FMA opcode for fused multiply adds

https://reviews.llvm.org/D34372

Reviewed by dsanders

llvm-svn: 305824

											
										
										
											2017-06-21 03:25:23 +08:00
+								  case Intrinsic::fma:
 								    MIRBuilder.buildInstr(TargetOpcode::G_FMA)
 								        .addDef(getOrCreateVReg(CI))
 								        .addUse(getOrCreateVReg(*CI.getArgOperand(0)))
 								        .addUse(getOrCreateVReg(*CI.getArgOperand(1)))
 								        .addUse(getOrCreateVReg(*CI.getArgOperand(2)));
 								    return true;
-												GlobalISel: translate memcpy intrinsics.

llvm-svn: 284525

											
										
										
											2016-10-19 04:03:45 +08:00
+								  case Intrinsic::memcpy:
-												GlobalISel: translate memset & memmove.

llvm-svn: 293541

											
										
										
											2017-01-31 03:33:07 +08:00
+								  case Intrinsic::memmove:
 								  case Intrinsic::memset:
 								    return translateMemfunc(CI, MIRBuilder, ID);
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								  case Intrinsic::eh_typeid_for: {
 								    // The result is a constant: the type id the MachineFunction assigns to
 								    // the type-info global extracted from the first argument.
 								    GlobalValue *GV = ExtractTypeInfo(CI.getArgOperand(0));
 								    unsigned Reg = getOrCreateVReg(CI);
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								    unsigned TypeID = MF->getTypeIDFor(GV);
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								    MIRBuilder.buildConstant(Reg, TypeID);
 								    return true;
 								  }
-												GlobalISel: translate the @llvm.objectsize intrinsic.

llvm-svn: 284527

											
										
										
											2016-10-19 04:03:51 +08:00
+								  case Intrinsic::objectsize: {
 								    // If we don't know by now, we're never going to know.
 								    const ConstantInt *Min = cast<ConstantInt>(CI.getArgOperand(1));
 								    // Fold to a constant: all-ones when the second argument is zero,
 								    // otherwise 0.
 								    MIRBuilder.buildConstant(getOrCreateVReg(CI), Min->isZero() ? -1ULL : 0);
 								    return true;
 								  }
-												GlobalISel: translate stack protector intrinsics

llvm-svn: 285614

											
										
										
											2016-11-01 02:30:59 +08:00
+								  case Intrinsic::stackguard:
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								    getStackGuard(getOrCreateVReg(CI), MIRBuilder);
-												GlobalISel: translate stack protector intrinsics

llvm-svn: 285614

											
										
										
											2016-11-01 02:30:59 +08:00
+								    return true;
 								  case Intrinsic::stackprotector: {
-												Recommit: [globalisel] Change LLT constructor string into an LLT-based object that knows how to generate it.

Summary:
This will allow future patches to inspect the details of the LLT. The implementation is now split between
the Support and CodeGen libraries to allow TableGen to use this class without introducing layering concerns.

Thanks to Ahmed Bougacha for finding a reasonable way to avoid the layering issue and providing the version of this patch without that problem.

The problem with the previous commit appears to have been that TableGen was including CodeGen/LowLevelType.h instead of Support/LowLevelTypeImpl.h.

Reviewers: t.p.northover, qcolombet, rovka, aditya_nandakumar, ab, javed.absar

Subscribers: arsenm, nhaehnle, mgorny, dberris, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30046

llvm-svn: 297241

											
										
										
											2017-03-08 07:20:35 +08:00
 								    // Fetch the guard into a fresh vreg typed like the first argument, then
 								    // store it (volatile) into the frame slot of the alloca passed as the
 								    // second argument.
+								    LLT PtrTy = getLLTForType(*CI.getArgOperand(0)->getType(), *DL);
-												GlobalISel: translate stack protector intrinsics

llvm-svn: 285614

											
										
										
											2016-11-01 02:30:59 +08:00
+								    unsigned GuardVal = MRI->createGenericVirtualRegister(PtrTy);
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								    getStackGuard(GuardVal, MIRBuilder);
-												GlobalISel: translate stack protector intrinsics

llvm-svn: 285614

											
										
										
											2016-11-01 02:30:59 +08:00
 								    AllocaInst *Slot = cast<AllocaInst>(CI.getArgOperand(1));
 								    MIRBuilder.buildStore(
 								        GuardVal, getOrCreateVReg(*Slot),
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								        *MF->getMachineMemOperand(
 								            MachinePointerInfo::getFixedStack(*MF,
 								                                              getOrCreateFrameIndex(*Slot)),
-												GlobalISel: translate stack protector intrinsics

llvm-svn: 285614

											
										
										
											2016-11-01 02:30:59 +08:00
+								            MachineMemOperand::MOStore | MachineMemOperand::MOVolatile,
 								            // NOTE(review): the final argument is a hard-coded 8 regardless
 								            // of the pointer size -- confirm it suits all targets.
 								            PtrTy.getSizeInBits() / 8, 8));
 								    return true;
 								  }
-												GlobalISel: support overflow arithmetic intrinsics.

Unsigned addition and subtraction can reuse the instructions created to
legalize large width operations (i.e. both produce and consume a carry flag).
Signed operations and multiplies get a dedicated op-with-overflow instruction.

Once this is produced the two values are combined into a struct register (which
will almost always be merged with a corresponding G_EXTRACT as part of
legalization).

llvm-svn: 279278

											
										
										
											2016-08-20 01:17:06 +08:00
+								  }
-												GlobalISel: factor overflow handling into separate function. NFC.

llvm-svn: 289149

											
										
										
											2016-12-09 06:44:00 +08:00
+								  return false;
-												GlobalISel: support overflow arithmetic intrinsics.

Unsigned addition and subtraction can reuse the instructions created to
legalize large width operations (i.e. both produce and consume a carry flag).
Signed operations and multiplies get a dedicated op-with-overflow instruction.

Once this is produced the two values are combined into a struct register (which
will almost always be merged with a corresponding G_EXTRACT as part of
legalization).

llvm-svn: 279278

											
										
										
											2016-08-20 01:17:06 +08:00
+								}
-												GlobalISel: support trivial inlineasm calls.

They're used for nefarious purposes by ObjC.

llvm-svn: 297422

											
										
										
											2017-03-10 07:36:26 +08:00
+								bool IRTranslator::translateInlineAsm(const CallInst &CI,
 								                                      MachineIRBuilder &MIRBuilder) {
 								  const InlineAsm &IA = cast<InlineAsm>(*CI.getCalledValue());
 								  if (!IA.getConstraintString().empty())
 								    return false;
 								  unsigned ExtraInfo = 0;
 								  if (IA.hasSideEffects())
 								    ExtraInfo |= InlineAsm::Extra_HasSideEffects;
 								  if (IA.getDialect() == InlineAsm::AD_Intel)
 								    ExtraInfo |= InlineAsm::Extra_AsmDialect;
 								  MIRBuilder.buildInstr(TargetOpcode::INLINEASM)
 								    .addExternalSymbol(IA.getAsmString().c_str())
 								    .addImm(ExtraInfo);
 								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
 								/// Translate the call instruction \p U.
 								///
 								/// Inline asm is forwarded to translateInlineAsm. Calls with no statically
 								/// known callee, or whose callee is not an intrinsic, are handed to the
 								/// target's CallLowering. Intrinsics are first offered to
 								/// translateKnownIntrinsic; if that declines, a generic intrinsic instruction
 								/// is built with one use operand per call argument.
 								///
 								/// \returns true on success, false if the call could not be translated.
+								bool IRTranslator::translateCall(const User &U, MachineIRBuilder &MIRBuilder) {
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								  const CallInst &CI = cast<CallInst>(U);
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								  auto TII = MF->getTarget().getIntrinsicInfo();
-												GlobalISel: implement simple function calls on AArch64.

We're still limited in the arguments we support, but this at least handles the
basic cases.

llvm-svn: 278293

											
										
										
											2016-08-11 05:44:01 +08:00
+								  const Function *F = CI.getCalledFunction();
-												AArch64: fall back to DAG ISel for inline assembly.

We can't currently handle "calls" to inlineasm strings so it's better to let
the DAG handle it than generate rubbish.

llvm-svn: 292540

											
										
										
											2017-01-20 07:59:35 +08:00
+								  if (CI.isInlineAsm())
-												GlobalISel: support trivial inlineasm calls.

They're used for nefarious purposes by ObjC.

llvm-svn: 297422

											
										
										
											2017-03-10 07:36:26 +08:00
+								    return translateInlineAsm(CI, MIRBuilder);
-												AArch64: fall back to DAG ISel for inline assembly.

We can't currently handle "calls" to inlineasm strings so it's better to let
the DAG handle it than generate rubbish.

llvm-svn: 292540

											
										
										
											2017-01-20 07:59:35 +08:00
-												GlobalISel: implement simple function calls on AArch64.

We're still limited in the arguments we support, but this at least handles the
basic cases.

llvm-svn: 278293

											
										
										
											2016-08-11 05:44:01 +08:00
 								  // Ordinary call (no known callee, or callee is not an intrinsic): collect
 								  // the argument vregs and let the target's CallLowering emit it. Res is 0
 								  // for calls returning void.
+								  if (!F || !F->isIntrinsic()) {
 								    unsigned Res = CI.getType()->isVoidTy() ? 0 : getOrCreateVReg(CI);
 								    SmallVector<unsigned, 8> Args;
 								    for (auto &Arg: CI.arg_operands())
 								      Args.push_back(getOrCreateVReg(*Arg));
-												GlobalISel: inform FrameLowering when we emit a function call.

Amongst other things (I expect) this is necessary to ensure decent backtraces
when an "unreachable" is involved.

llvm-svn: 297413

											
										
										
											2017-03-10 06:00:39 +08:00
+								    MF->getFrameInfo().setHasCalls(true);
-												[GlobalISel] Use ImmutableCallSite instead of templates. NFC.

ImmutableCallSite abstracts away CallInst and InvokeInst. Use it!

llvm-svn: 297426

											
										
										
											2017-03-10 08:25:44 +08:00
 								    // The callback supplies the callee's vreg if the lowering asks for it.
+								    return CLI->lowerCall(MIRBuilder, &CI, Res, Args, [&]() {
-												GlobalISel: rework CallLowering so that it can be used for libcalls too.

There should be no functional change here, I'm just making the implementation
of "frem" (to libcall) legalization easier for a followup.

llvm-svn: 279987

											
										
										
											2016-08-30 03:07:08 +08:00
+								      return getOrCreateVReg(*CI.getCalledValue());
 								    });
-												GlobalISel: implement simple function calls on AArch64.

We're still limited in the arguments we support, but this at least handles the
basic cases.

llvm-svn: 278293

											
										
										
											2016-08-11 05:44:01 +08:00
+								  }
 								  Intrinsic::ID ID = F->getIntrinsicID();
-												GlobalISel: support translation of intrinsic calls.

These come in two variants for now: G_INTRINSIC and G_INTRINSIC_W_SIDE_EFFECTS.
We may decide to split the latter up with finer-grained restrictions later, if
necessary.

llvm-svn: 277224

											
										
										
											2016-07-30 06:32:36 +08:00
 								  // If the generic lookup did not recognise the function, ask the target's
 								  // intrinsic info (when the target provides one).
+								  if (TII && ID == Intrinsic::not_intrinsic)
-												GlobalISel: implement simple function calls on AArch64.

We're still limited in the arguments we support, but this at least handles the
basic cases.

llvm-svn: 278293

											
										
										
											2016-08-11 05:44:01 +08:00
+								    ID = static_cast<Intrinsic::ID>(TII->getIntrinsicID(F));
-												GlobalISel: support translation of intrinsic calls.

These come in two variants for now: G_INTRINSIC and G_INTRINSIC_W_SIDE_EFFECTS.
We may decide to split the latter up with finer-grained restrictions later, if
necessary.

llvm-svn: 277224

											
										
										
											2016-07-30 06:32:36 +08:00
-												GlobalISel: implement simple function calls on AArch64.

We're still limited in the arguments we support, but this at least handles the
basic cases.

llvm-svn: 278293

											
										
										
											2016-08-11 05:44:01 +08:00
+								  assert(ID != Intrinsic::not_intrinsic && "unknown intrinsic");
-												GlobalISel: support translation of intrinsic calls.

These come in two variants for now: G_INTRINSIC and G_INTRINSIC_W_SIDE_EFFECTS.
We may decide to split the latter up with finer-grained restrictions later, if
necessary.

llvm-svn: 277224

											
										
										
											2016-07-30 06:32:36 +08:00
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
 								  // Intrinsics with a dedicated translation are finished here.
+								  if (translateKnownIntrinsic(CI, ID, MIRBuilder))
-												GlobalISel: support overflow arithmetic intrinsics.

Unsigned addition and subtraction can reuse the instructions created to
legalize large width operations (i.e. both produce and consume a carry flag).
Signed operations and multiplies get a dedicated op-with-overflow instruction.

Once this is produced the two values are combined into a struct register (which
will almost always be merged with a corresponding G_EXTRACT as part of
legalization).

llvm-svn: 279278

											
										
										
											2016-08-20 01:17:06 +08:00
+								    return true;
-												GlobalISel: support translation of intrinsic calls.

These come in two variants for now: G_INTRINSIC and G_INTRINSIC_W_SIDE_EFFECTS.
We may decide to split the latter up with finer-grained restrictions later, if
necessary.

llvm-svn: 277224

											
										
										
											2016-07-30 06:32:36 +08:00
 								  // Generic path: build an intrinsic instruction. The last argument tells
 								  // the builder whether the call may access memory.
+								  unsigned Res = CI.getType()->isVoidTy() ? 0 : getOrCreateVReg(CI);
 								  MachineInstrBuilder MIB =
-												GlobalISel: move type information to MachineRegisterInfo.

We want each register to have a canonical type, which means the best place to
store this is in MachineRegisterInfo rather than on every MachineInstr that
happens to use or define that register.

Most changes following from this are pretty simple (you need an MRI anyway if
you're going to be doing any transformations, so just check the type there).
But legalization doesn't really want to check redundant operands (when, for
example, a G_ADD only ever has one type) so I've made use of MCInstrDesc's
operand type field to encode these constraints and limit legalization's work.

As an added bonus, more validation is possible, both in MachineVerifier and
MachineIRBuilder (coming soon).

llvm-svn: 281035

											
										
										
											2016-09-09 19:46:34 +08:00
+								      MIRBuilder.buildIntrinsic(ID, Res, !CI.doesNotAccessMemory());
-												GlobalISel: support translation of intrinsic calls.

These come in two variants for now: G_INTRINSIC and G_INTRINSIC_W_SIDE_EFFECTS.
We may decide to split the latter up with finer-grained restrictions later, if
necessary.

llvm-svn: 277224

											
										
										
											2016-07-30 06:32:36 +08:00
 								  // NOTE(review): the metadata bail-out below returns false after the
 								  // intrinsic instruction above has already been created.
 								  for (auto &Arg : CI.arg_operands()) {
-												[GlobalISel] Don't translate intrinsics with metadata parameters.

Some intrinsics take metadata parameters.  These all need custom
handling of some form, and cannot possibly be lowered generically to
G_INTRINSIC calls with vreg operands.
Reject them, instead of hitting an assert later in getOrCreateVReg.

llvm-svn: 297209

											
										
										
											2017-03-08 04:53:09 +08:00
+								    // Some intrinsics take metadata parameters. Reject them.
 								    if (isa<MetadataAsValue>(Arg))
 								      return false;
-												[GlobalISel]: Create VREGs for ConstantInt args

This patch changes the behavior of IRTranslating intrinsics where we
now create VREG + G_CONSTANT for ConstantInt values. We already do this
for FloatingPoint values. This makes it easier for the backends to
select code and it won't have to de-duplicate creation+selection of
constants.

Reviewed by: ab

llvm-svn: 298473

											
										
										
											2017-03-22 09:16:39 +08:00
+								    MIB.addUse(getOrCreateVReg(*Arg));
-												GlobalISel: support translation of intrinsic calls.

These come in two variants for now: G_INTRINSIC and G_INTRINSIC_W_SIDE_EFFECTS.
We may decide to split the latter up with finer-grained restrictions later, if
necessary.

llvm-svn: 277224

											
										
										
											2016-07-30 06:32:36 +08:00
+								  }
-												[GlobalISel] IRTranslator: Add MachineMemOperand to target memory intrinsics

Reviewers: qcolombet, ab, t.p.northover, aditya_nandakumar, dsanders

Reviewed By: qcolombet

Subscribers: rovka, kristof.beyls, javed.absar, igorb, llvm-commits

Differential Revision: https://reviews.llvm.org/D33724

llvm-svn: 304743

											
										
										
											2017-06-06 06:17:17 +08:00
 								  // Add a MachineMemOperand if it is a target mem intrinsic.
 								  const TargetLowering &TLI = *MF->getSubtarget().getTargetLowering();
 								  TargetLowering::IntrinsicInfo Info;
 								  // TODO: Add a GlobalISel version of getTgtMemIntrinsic.
 								  if (TLI.getTgtMemIntrinsic(Info, CI, ID)) {
 								    MachineMemOperand::Flags Flags =
 								        Info.vol ? MachineMemOperand::MOVolatile : MachineMemOperand::MONone;
 								    // The operand is flagged as either a load or a store, chosen solely by
 								    // Info.readMem.
 								    Flags |=
 								        Info.readMem ? MachineMemOperand::MOLoad : MachineMemOperand::MOStore;
 								    // memVT's size is in bits; shift right by 3 to get bytes.
 								    uint64_t Size = Info.memVT.getSizeInBits() >> 3;
 								    MIB.addMemOperand(MF->getMachineMemOperand(MachinePointerInfo(Info.ptrVal),
 								                                               Flags, Size, Info.align));
 								  }
-												GlobalISel: support translation of intrinsic calls.

These come in two variants for now: G_INTRINSIC and G_INTRINSIC_W_SIDE_EFFECTS.
We may decide to split the latter up with finer-grained restrictions later, if
necessary.

llvm-svn: 277224

											
										
										
											2016-07-30 06:32:36 +08:00
+								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateInvoke(const User &U,
 								                                   MachineIRBuilder &MIRBuilder) {
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								  const InvokeInst &I = cast<InvokeInst>(U);
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								  MCContext &Context = MF->getContext();
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
 								  const BasicBlock *ReturnBB = I.getSuccessor(0);
 								  const BasicBlock *EHPadBB = I.getSuccessor(1);
-												[GlobalISel] Fallback when failing to translate invoke.

We unintentionally stopped falling back in r293670.

While there, change an unusual construct.

llvm-svn: 297425

											
										
										
											2017-03-10 08:25:35 +08:00
+								  const Value *Callee = I.getCalledValue();
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								  const Function *Fn = dyn_cast<Function>(Callee);
 								  if (isa<InlineAsm>(Callee))
 								    return false;
 								  // FIXME: support invoking patchpoint and statepoint intrinsics.
 								  if (Fn && Fn->isIntrinsic())
 								    return false;
 								  // FIXME: support whatever these are.
 								  if (I.countOperandBundlesOfType(LLVMContext::OB_deopt))
 								    return false;
 								  // FIXME: support Windows exception handling.
 								  if (!isa<LandingPadInst>(EHPadBB->front()))
 								    return false;
-												Move most EH from MachineModuleInfo to MachineFunction

Recommitting r288293 with some extra fixes for GlobalISel code.

Most of the exception handling members in MachineModuleInfo is actually
per function data (talks about the "current function") so it is better
to keep it at the function instead of the module.

This is a necessary step to have machine module passes work properly.

Also:
- Rename TidyLandingPads() to tidyLandingPads()
- Use doxygen member groups instead of "//===- EH ---"... so it is clear
  where a group ends.
- I had to add an ugly const_cast at two places in the AsmPrinter
  because the available MachineFunction pointers are const, but the code
  wants to call tidyLandingPads() in between
  (markFunctionEnd()/endFunction()).

Differential Revision: https://reviews.llvm.org/D27227

llvm-svn: 288405

											
										
										
											2016-12-02 03:32:15 +08:00
+								  // Emit the actual call, bracketed by EH_LABELs so that the MF knows about
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								  // the region covered by the try.
-												Move most EH from MachineModuleInfo to MachineFunction

Recommitting r288293 with some extra fixes for GlobalISel code.

Most of the exception handling members in MachineModuleInfo is actually
per function data (talks about the "current function") so it is better
to keep it at the function instead of the module.

This is a necessary step to have machine module passes work properly.

Also:
- Rename TidyLandingPads() to tidyLandingPads()
- Use doxygen member groups instead of "//===- EH ---"... so it is clear
  where a group ends.
- I had to add an ugly const_cast at two places in the AsmPrinter
  because the available MachineFunction pointers are const, but the code
  wants to call tidyLandingPads() in between
  (markFunctionEnd()/endFunction()).

Differential Revision: https://reviews.llvm.org/D27227

llvm-svn: 288405

											
										
										
											2016-12-02 03:32:15 +08:00
+								  MCSymbol *BeginSymbol = Context.createTempSymbol();
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								  MIRBuilder.buildInstr(TargetOpcode::EH_LABEL).addSym(BeginSymbol);
 								  unsigned Res = I.getType()->isVoidTy() ? 0 : getOrCreateVReg(I);
-												GlobalISel: merge invoke and call translation paths.

Well, sort of. But the lower-level code that invoke used to be using completely
botched the handling of varargs functions, which hopefully won't be possible if
they're using the same code.

llvm-svn: 293670

											
										
										
											2017-02-01 02:36:11 +08:00
+								  SmallVector<unsigned, 8> Args;
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								  for (auto &Arg: I.arg_operands())
-												GlobalISel: merge invoke and call translation paths.

Well, sort of. But the lower-level code that invoke used to be using completely
botched the handling of varargs functions, which hopefully won't be possible if
they're using the same code.

llvm-svn: 293670

											
										
										
											2017-02-01 02:36:11 +08:00
+								    Args.push_back(getOrCreateVReg(*Arg));
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
-												[GlobalISel] Use ImmutableCallSite instead of templates. NFC.

ImmutableCallSite abstracts away CallInst and InvokeInst. Use it!

llvm-svn: 297426

											
										
										
											2017-03-10 08:25:44 +08:00
+								  if (!CLI->lowerCall(MIRBuilder, &I, Res, Args,
-												[GlobalISel] Fallback when failing to translate invoke.

We unintentionally stopped falling back in r293670.

While there, change an unusual construct.

llvm-svn: 297425

											
										
										
											2017-03-10 08:25:35 +08:00
+								                      [&]() { return getOrCreateVReg(*I.getCalledValue()); }))
 								    return false;
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
-												Move most EH from MachineModuleInfo to MachineFunction

Recommitting r288293 with some extra fixes for GlobalISel code.

Most of the exception handling members in MachineModuleInfo is actually
per function data (talks about the "current function") so it is better
to keep it at the function instead of the module.

This is a necessary step to have machine module passes work properly.

Also:
- Rename TidyLandingPads() to tidyLandingPads()
- Use doxygen member groups instead of "//===- EH ---"... so it is clear
  where a group ends.
- I had to add an ugly const_cast at two places in the AsmPrinter
  because the available MachineFunction pointers are const, but the code
  wants to call tidyLandingPads() in between
  (markFunctionEnd()/endFunction()).

Differential Revision: https://reviews.llvm.org/D27227

llvm-svn: 288405

											
										
										
											2016-12-02 03:32:15 +08:00
+								  MCSymbol *EndSymbol = Context.createTempSymbol();
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								  MIRBuilder.buildInstr(TargetOpcode::EH_LABEL).addSym(EndSymbol);
 								  // FIXME: track probabilities.
-												[GlobalISel] Preserve IR block layout.

It makes the output function layout more predictable;  the layout has
an effect on performance, we don't want it to be at the mercy of the
translator's visitation order and such.
The predictable output is also easier to digest.

getOrCreateBB isn't appropriately named anymore, as it never needs to
create anything.  Rename it and extract the MBB creation logic out of it.

A couple tests were sensitive to the order. Update them.

llvm-svn: 297868

											
										
										
											2017-03-16 02:22:33 +08:00
+								  MachineBasicBlock &EHPadMBB = getMBB(*EHPadBB),
 								                    &ReturnMBB = getMBB(*ReturnBB);
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								  MF->addInvoke(&EHPadMBB, BeginSymbol, EndSymbol);
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								  MIRBuilder.getMBB().addSuccessor(&ReturnMBB);
 								  MIRBuilder.getMBB().addSuccessor(&EHPadMBB);
-												GlobalISel: the translation of an invoke must branch to the good block.

Otherwise bad things happen if the basic block order isn't trivial after an
invoke.

llvm-svn: 293679

											
										
										
											2017-02-01 04:12:18 +08:00
+								  MIRBuilder.buildBr(ReturnMBB);
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
 								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translateLandingPad(const User &U,
 								                                       MachineIRBuilder &MIRBuilder) {
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								  const LandingPadInst &LP = cast<LandingPadInst>(U);
 								  MachineBasicBlock &MBB = MIRBuilder.getMBB();
-												Move most EH from MachineModuleInfo to MachineFunction

Recommitting r288293 with some extra fixes for GlobalISel code.

Most of the exception handling members in MachineModuleInfo is actually
per function data (talks about the "current function") so it is better
to keep it at the function instead of the module.

This is a necessary step to have machine module passes work properly.

Also:
- Rename TidyLandingPads() to tidyLandingPads()
- Use doxygen member groups instead of "//===- EH ---"... so it is clear
  where a group ends.
- I had to add an ugly const_cast at two places in the AsmPrinter
  because the available MachineFunction pointers are const, but the code
  wants to call tidyLandingPads() in between
  (markFunctionEnd()/endFunction()).

Differential Revision: https://reviews.llvm.org/D27227

llvm-svn: 288405

											
										
										
											2016-12-02 03:32:15 +08:00
+								  addLandingPadInfo(LP, MBB);
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
 								  MBB.setIsEHPad();
 								  // If there aren't registers to copy the values into (e.g., during SjLj
 								  // exceptions), then don't bother.
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								  auto &TLI = *MF->getSubtarget().getTargetLowering();
 								  const Constant *PersonalityFn = MF->getFunction()->getPersonalityFn();
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								  if (TLI.getExceptionPointerRegister(PersonalityFn) == 0 &&
 								      TLI.getExceptionSelectorRegister(PersonalityFn) == 0)
 								    return true;
 								  // If landingpad's return type is token type, we don't create DAG nodes
 								  // for its exception pointer and selector value. The extraction of exception
 								  // pointer or selector value from token type landingpads is not currently
 								  // supported.
 								  if (LP.getType()->isTokenTy())
 								    return true;
 								  // Add a label to mark the beginning of the landing pad.  Deletion of the
 								  // landing pad can thus be detected via the MachineModuleInfo.
 								  MIRBuilder.buildInstr(TargetOpcode::EH_LABEL)
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								    .addSym(MF->addLandingPad(&MBB));
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
-												Fix additional constructor call missed by r297241.

It was added between my build+test and my commit.

llvm-svn: 297244

											
										
										
											2017-03-08 07:32:10 +08:00
+								  LLT Ty = getLLTForType(*LP.getType(), *DL);
-												GlobalISel: use inserts for landingpad instead of sequences.

llvm-svn: 297237

											
										
										
											2017-03-08 07:04:06 +08:00
+								  unsigned Undef = MRI->createGenericVirtualRegister(Ty);
 								  MIRBuilder.buildUndef(Undef);
-												GlobalISel: Use the correct types when translating landingpad instructions

There was a bug here where we were using p0 instead of s32 for the
selector type in the landingpad. Instead of hardcoding these types we
should get the types from the landingpad instruction directly.

Note that we replicate an assert from SDAG here to only support
two-valued landingpads.

llvm-svn: 292995

											
										
										
											2017-01-25 08:16:53 +08:00
+								  SmallVector<LLT, 2> Tys;
 								  for (Type *Ty : cast<StructType>(LP.getType())->elements())
-												Recommit: [globalisel] Change LLT constructor string into an LLT-based object that knows how to generate it.

Summary:
This will allow future patches to inspect the details of the LLT. The implementation is now split between
the Support and CodeGen libraries to allow TableGen to use this class without introducing layering concerns.

Thanks to Ahmed Bougacha for finding a reasonable way to avoid the layering issue and providing the version of this patch without that problem.

The problem with the previous commit appears to have been that TableGen was including CodeGen/LowLevelType.h instead of Support/LowLevelTypeImpl.h.

Reviewers: t.p.northover, qcolombet, rovka, aditya_nandakumar, ab, javed.absar

Subscribers: arsenm, nhaehnle, mgorny, dberris, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30046

llvm-svn: 297241

											
										
										
											2017-03-08 07:20:35 +08:00
+								    Tys.push_back(getLLTForType(*Ty, *DL));
-												GlobalISel: Use the correct types when translating landingpad instructions

There was a bug here where we were using p0 instead of s32 for the
selector type in the landingpad. Instead of hardcoding these types we
should get the types from the landingpad instruction directly.

Note that we replicate an assert from SDAG here to only support
two-valued landingpads.

llvm-svn: 292995

											
										
										
											2017-01-25 08:16:53 +08:00
+								  assert(Tys.size() == 2 && "Only two-valued landingpads are supported");
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								  // Mark exception register as live in.
-												GlobalISel: use inserts for landingpad instead of sequences.

llvm-svn: 297237

											
										
										
											2017-03-08 07:04:06 +08:00
+								  unsigned ExceptionReg = TLI.getExceptionPointerRegister(PersonalityFn);
 								  if (!ExceptionReg)
 								    return false;
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
-												GlobalISel: use inserts for landingpad instead of sequences.

llvm-svn: 297237

											
										
										
											2017-03-08 07:04:06 +08:00
+								  MBB.addLiveIn(ExceptionReg);
 								  unsigned VReg = MRI->createGenericVirtualRegister(Tys[0]),
 								           Tmp = MRI->createGenericVirtualRegister(Ty);
 								  MIRBuilder.buildCopy(VReg, ExceptionReg);
 								  MIRBuilder.buildInsert(Tmp, Undef, VReg, 0);
 								  unsigned SelectorReg = TLI.getExceptionSelectorRegister(PersonalityFn);
 								  if (!SelectorReg)
 								    return false;
 								  MBB.addLiveIn(SelectorReg);
 								  // N.b. the exception selector register always has pointer type and may not
 								  // match the actual IR-level type in the landingpad so an extra cast is
 								  // needed.
 								  unsigned PtrVReg = MRI->createGenericVirtualRegister(Tys[0]);
 								  MIRBuilder.buildCopy(PtrVReg, SelectorReg);
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
-												GlobalISel: use inserts for landingpad instead of sequences.

llvm-svn: 297237

											
										
										
											2017-03-08 07:04:06 +08:00
+								  VReg = MRI->createGenericVirtualRegister(Tys[1]);
 								  MIRBuilder.buildInstr(TargetOpcode::G_PTRTOINT).addDef(VReg).addUse(PtrVReg);
 								  MIRBuilder.buildInsert(getOrCreateVReg(LP), Tmp, VReg,
 								                         Tys[0].getSizeInBits());
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
+								  return true;
 								}
-												GlobalISel: translate dynamic alloca instructions.

llvm-svn: 294022

											
										
										
											2017-02-04 02:22:45 +08:00
+								bool IRTranslator::translateAlloca(const User &U,
 								                                   MachineIRBuilder &MIRBuilder) {
 								  auto &AI = cast<AllocaInst>(U);
 								  if (AI.isStaticAlloca()) {
 								    unsigned Res = getOrCreateVReg(AI);
 								    int FI = getOrCreateFrameIndex(AI);
 								    MIRBuilder.buildFrameIndex(Res, FI);
 								    return true;
 								  }
 								  // Now we're in the harder dynamic case.
 								  Type *Ty = AI.getAllocatedType();
 								  unsigned Align =
 								      std::max((unsigned)DL->getPrefTypeAlignment(Ty), AI.getAlignment());
 								  unsigned NumElts = getOrCreateVReg(*AI.getArraySize());
-												[GlobalISel] Avoid translating synthetic constants to new G_CONSTANTS.

Currently, we create a G_CONSTANT for every "synthetic" integer
constant operand (for instance, for the G_GEP offset).
Instead, share the G_CONSTANTs we might have created by going through
the ValueToVReg machinery.

When we're emitting synthetic constants, we do need to get Constants from
the context.  One could argue that we shouldn't modify the context at
all (for instance, this means that we're going to use a tad more memory
if the constant wasn't used elsewhere), but constants are mostly
harmless.  We currently do this for extractvalue and all.

For constant fcmp, this does mean we'll emit an extra COPY, which is not
necessarily more optimal than an extra materialized constant.
But that preserves the current intended design of uniqued G_CONSTANTs,
and the rematerialization problem exists elsewhere and should be
resolved with a single coherent solution.

llvm-svn: 297875

											
										
										
											2017-03-16 03:21:11 +08:00
+								  Type *IntPtrIRTy = DL->getIntPtrType(AI.getType());
 								  LLT IntPtrTy = getLLTForType(*IntPtrIRTy, *DL);
-												GlobalISel: translate dynamic alloca instructions.

llvm-svn: 294022

											
										
										
											2017-02-04 02:22:45 +08:00
+								  if (MRI->getType(NumElts) != IntPtrTy) {
 								    unsigned ExtElts = MRI->createGenericVirtualRegister(IntPtrTy);
 								    MIRBuilder.buildZExtOrTrunc(ExtElts, NumElts);
 								    NumElts = ExtElts;
 								  }
 								  unsigned AllocSize = MRI->createGenericVirtualRegister(IntPtrTy);
-												[GlobalISel] Avoid translating synthetic constants to new G_CONSTANTS.

Currently, we create a G_CONSTANT for every "synthetic" integer
constant operand (for instance, for the G_GEP offset).
Instead, share the G_CONSTANTs we might have created by going through
the ValueToVReg machinery.

When we're emitting synthetic constants, we do need to get Constants from
the context.  One could argue that we shouldn't modify the context at
all (for instance, this means that we're going to use a tad more memory
if the constant wasn't used elsewhere), but constants are mostly
harmless.  We currently do this for extractvalue and all.

For constant fcmp, this does mean we'll emit an extra COPY, which is not
necessarily more optimal than an extra materialized constant.
But that preserves the current intended design of uniqued G_CONSTANTs,
and the rematerialization problem exists elsewhere and should be
resolved with a single coherent solution.

llvm-svn: 297875

											
										
										
											2017-03-16 03:21:11 +08:00
+								  unsigned TySize =
 								      getOrCreateVReg(*ConstantInt::get(IntPtrIRTy, -DL->getTypeAllocSize(Ty)));
-												GlobalISel: translate dynamic alloca instructions.

llvm-svn: 294022

											
										
										
											2017-02-04 02:22:45 +08:00
+								  MIRBuilder.buildMul(AllocSize, NumElts, TySize);
-												Recommit: [globalisel] Change LLT constructor string into an LLT-based object that knows how to generate it.

Summary:
This will allow future patches to inspect the details of the LLT. The implementation is now split between
the Support and CodeGen libraries to allow TableGen to use this class without introducing layering concerns.

Thanks to Ahmed Bougacha for finding a reasonable way to avoid the layering issue and providing the version of this patch without that problem.

The problem with the previous commit appears to have been that TableGen was including CodeGen/LowLevelType.h instead of Support/LowLevelTypeImpl.h.

Reviewers: t.p.northover, qcolombet, rovka, aditya_nandakumar, ab, javed.absar

Subscribers: arsenm, nhaehnle, mgorny, dberris, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30046

llvm-svn: 297241

											
										
										
											2017-03-08 07:20:35 +08:00
+								  LLT PtrTy = getLLTForType(*AI.getType(), *DL);
-												GlobalISel: translate dynamic alloca instructions.

llvm-svn: 294022

											
										
										
											2017-02-04 02:22:45 +08:00
+								  auto &TLI = *MF->getSubtarget().getTargetLowering();
 								  unsigned SPReg = TLI.getStackPointerRegisterToSaveRestore();
 								  unsigned SPTmp = MRI->createGenericVirtualRegister(PtrTy);
 								  MIRBuilder.buildCopy(SPTmp, SPReg);
-												GlobalISel: introduce G_PTR_MASK to simplify alloca handling.

This instruction clears the low bits of a pointer without requiring (possibly
dodgy if pointers aren't ints) conversions to and from an integer. Since (as
far as I'm aware) all masks are statically known, the instruction takes an
immediate operand rather than a register to specify the mask.

llvm-svn: 295103

											
										
										
											2017-02-15 04:56:18 +08:00
+								  unsigned AllocTmp = MRI->createGenericVirtualRegister(PtrTy);
 								  MIRBuilder.buildGEP(AllocTmp, SPTmp, AllocSize);
-												GlobalISel: translate dynamic alloca instructions.

llvm-svn: 294022

											
										
										
											2017-02-04 02:22:45 +08:00
 								  // Handle alignment. We have to realign if the allocation granule was smaller
 								  // than stack alignment, or the specific alloca requires more than stack
 								  // alignment.
 								  unsigned StackAlign =
 								      MF->getSubtarget().getFrameLowering()->getStackAlignment();
 								  Align = std::max(Align, StackAlign);
 								  if (Align > StackAlign || DL->getTypeAllocSize(Ty) % StackAlign != 0) {
 								    // Round the size of the allocation up to the stack alignment size
 								    // by add SA-1 to the size. This doesn't overflow because we're computing
 								    // an address inside an alloca.
-												GlobalISel: introduce G_PTR_MASK to simplify alloca handling.

This instruction clears the low bits of a pointer without requiring (possibly
dodgy if pointers aren't ints) conversions to and from an integer. Since (as
far as I'm aware) all masks are statically known, the instruction takes an
immediate operand rather than a register to specify the mask.

llvm-svn: 295103

											
										
										
											2017-02-15 04:56:18 +08:00
+								    unsigned AlignedAlloc = MRI->createGenericVirtualRegister(PtrTy);
 								    MIRBuilder.buildPtrMask(AlignedAlloc, AllocTmp, Log2_32(Align));
 								    AllocTmp = AlignedAlloc;
-												GlobalISel: translate dynamic alloca instructions.

llvm-svn: 294022

											
										
										
											2017-02-04 02:22:45 +08:00
+								  }
-												GlobalISel: introduce G_PTR_MASK to simplify alloca handling.

This instruction clears the low bits of a pointer without requiring (possibly
dodgy if pointers aren't ints) conversions to and from an integer. Since (as
far as I'm aware) all masks are statically known, the instruction takes an
immediate operand rather than a register to specify the mask.

llvm-svn: 295103

											
										
										
											2017-02-15 04:56:18 +08:00
+								  MIRBuilder.buildCopy(SPReg, AllocTmp);
 								  MIRBuilder.buildCopy(getOrCreateVReg(AI), AllocTmp);
-												[IRTranslator] Do not abort when the target wants to fall back.

Every pass in the GlobalISel pipeline will need to do something similar.

llvm-svn: 279886

											
										
										
											2016-08-27 07:49:05 +08:00
-												GlobalISel: translate dynamic alloca instructions.

llvm-svn: 294022

											
										
										
											2017-02-04 02:22:45 +08:00
+								  MF->getFrameInfo().CreateVariableSizedObject(Align ? Align : 1, &AI);
 								  assert(MF->getFrameInfo().hasVarSizedObjects());
-												GlobalISel: implement alloca instruction

llvm-svn: 276433

											
										
										
											2016-07-23 00:59:52 +08:00
+								  return true;
 								}
-												GlobalISel: support translating va_arg

Since (say) i128 and [16 x i8] map to the same type in generic MIR, we also
need to attach the required alignment info.

llvm-svn: 295254

											
										
										
											2017-02-16 07:22:33 +08:00
+								bool IRTranslator::translateVAArg(const User &U, MachineIRBuilder &MIRBuilder) {
 								  // FIXME: We may need more info about the type. Because of how LLT works,
 								  // we're completely discarding the i64/double distinction here (amongst
 								  // others). Fortunately the ABIs I know of where that matters don't use va_arg
 								  // anyway but that's not guaranteed.
 								  MIRBuilder.buildInstr(TargetOpcode::G_VAARG)
 								    .addDef(getOrCreateVReg(U))
 								    .addUse(getOrCreateVReg(*U.getOperand(0)))
 								    .addImm(DL->getABITypeAlignment(U.getType()));
 								  return true;
 								}
-												[GlobalISel] Translate insertelement and extractelement

Reviewers: qcolombet, aditya_nandakumar, dsanders, ab, t.p.northover, javed.absar

Reviewed By: qcolombet

Subscribers: dberris, rovka, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30761

llvm-svn: 297495

											
										
										
											2017-03-11 03:08:28 +08:00
+								bool IRTranslator::translateInsertElement(const User &U,
 								                                          MachineIRBuilder &MIRBuilder) {
 								  // If it is a <1 x Ty> vector, use the scalar as it is
 								  // not a legal vector type in LLT.
 								  if (U.getType()->getVectorNumElements() == 1) {
 								    unsigned Elt = getOrCreateVReg(*U.getOperand(1));
 								    ValToVReg[&U] = Elt;
 								    return true;
 								  }
-												[GlobalISel] Remove non-determinism from IRTranslator.

This showed up in r300535/r300537, which were reverted in r300538 due to
some of the introduced tests in there failing on some bots, due to the
non-determinism fixed in this commit.

Re-committing r300535/r300537 will add 2 tests for the change in this
commit.

llvm-svn: 300663

											
										
										
											2017-04-19 14:38:37 +08:00
+								  unsigned Res = getOrCreateVReg(U);
 								  unsigned Val = getOrCreateVReg(*U.getOperand(0));
 								  unsigned Elt = getOrCreateVReg(*U.getOperand(1));
 								  unsigned Idx = getOrCreateVReg(*U.getOperand(2));
 								  MIRBuilder.buildInsertVectorElement(Res, Val, Elt, Idx);
-												[GlobalISel] Translate insertelement and extractelement

Reviewers: qcolombet, aditya_nandakumar, dsanders, ab, t.p.northover, javed.absar

Reviewed By: qcolombet

Subscribers: dberris, rovka, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30761

llvm-svn: 297495

											
										
										
											2017-03-11 03:08:28 +08:00
+								  return true;
 								}
 								// Translate an IR extractelement. For a single-element source vector no
 								// instruction is emitted; otherwise an extract-vector-element instruction is
 								// built through MIRBuilder. Always returns true.
 								bool IRTranslator::translateExtractElement(const User &U,
 								                                           MachineIRBuilder &MIRBuilder) {
 								  // <1 x Ty> is not a legal vector type in LLT, so the source "vector"
 								  // (operand 0) already is the scalar: map the result straight to its vreg.
 								  const bool IsSingleElement =
 								      U.getOperand(0)->getType()->getVectorNumElements() == 1;
 								  if (IsSingleElement) {
 								    unsigned ScalarReg = getOrCreateVReg(*U.getOperand(0));
 								    ValToVReg[&U] = ScalarReg;
 								    return true;
 								  }
 								  // One statement per vreg, result first, so the creation order is fixed.
 								  unsigned DstReg = getOrCreateVReg(U);
 								  unsigned VecReg = getOrCreateVReg(*U.getOperand(0));
 								  unsigned IndexReg = getOrCreateVReg(*U.getOperand(1));
 								  MIRBuilder.buildExtractVectorElement(DstReg, VecReg, IndexReg);
 								  return true;
 								}
-												[GlobalISel] Translate shufflevector

Reviewers: qcolombet, aditya_nandakumar, t.p.northover, javed.absar, ab, dsanders

Reviewed By: javed.absar

Subscribers: dberris, rovka, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30962

llvm-svn: 298347

											
										
										
											2017-03-21 16:44:13 +08:00
+								bool IRTranslator::translateShuffleVector(const User &U,
 								                                          MachineIRBuilder &MIRBuilder) {
 								  MIRBuilder.buildInstr(TargetOpcode::G_SHUFFLE_VECTOR)
 								      .addDef(getOrCreateVReg(U))
 								      .addUse(getOrCreateVReg(*U.getOperand(0)))
 								      .addUse(getOrCreateVReg(*U.getOperand(1)))
 								      .addUse(getOrCreateVReg(*U.getOperand(2)));
 								  return true;
 								}
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								bool IRTranslator::translatePHI(const User &U, MachineIRBuilder &MIRBuilder) {
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								  const PHINode &PI = cast<PHINode>(U);
-												GlobalISel: remove G_TYPE and G_PHI

These instructions were only necessary when type information was stored in the
MachineInstr (because only generic MachineInstrs possessed a type). Now that
it's in MachineRegisterInfo, COPY and PHI work fine.

llvm-svn: 281037

											
										
										
											2016-09-09 19:47:31 +08:00
+								  auto MIB = MIRBuilder.buildInstr(TargetOpcode::PHI);
-												GlobalISel: IRTranslate PHI instructions

llvm-svn: 277835

											
										
										
											2016-08-06 01:16:40 +08:00
+								  MIB.addDef(getOrCreateVReg(PI));
 								  PendingPHIs.emplace_back(&PI, MIB.getInstr());
 								  return true;
 								}
 								void IRTranslator::finishPendingPhis() {
 								  for (std::pair<const PHINode *, MachineInstr *> &Phi : PendingPHIs) {
 								    const PHINode *PI = Phi.first;
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								    MachineInstrBuilder MIB(*MF, Phi.second);
-												GlobalISel: IRTranslate PHI instructions

llvm-svn: 277835

											
										
										
											2016-08-06 01:16:40 +08:00
 								    // All MachineBasicBlocks exist, add them to the PHI. We assume IRTranslator
 								    // won't create extra control flow here, otherwise we need to find the
 								    // dominating predecessor here (or perhaps force the weirder IRTranslators
 								    // to provide a simple boundary).
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								    SmallSet<const BasicBlock *, 4> HandledPreds;
-												GlobalISel: IRTranslate PHI instructions

llvm-svn: 277835

											
										
										
											2016-08-06 01:16:40 +08:00
+								    for (unsigned i = 0; i < PI->getNumIncomingValues(); ++i) {
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								      auto IRPred = PI->getIncomingBlock(i);
 								      if (HandledPreds.count(IRPred))
 								        continue;
 								      HandledPreds.insert(IRPred);
 								      unsigned ValReg = getOrCreateVReg(*PI->getIncomingValue(i));
 								      for (auto Pred : getMachinePredBBs({IRPred, PI->getParent()})) {
 								        assert(Pred->isSuccessor(MIB->getParent()) &&
 								               "incorrect CFG at MachineBasicBlock level");
 								        MIB.addUse(ValReg);
 								        MIB.addMBB(Pred);
 								      }
-												GlobalISel: IRTranslate PHI instructions

llvm-svn: 277835

											
										
										
											2016-08-06 01:16:40 +08:00
+								    }
 								  }
 								}
-												[GlobalISel] More detailed skeleton for the IRTranslator.

llvm-svn: 260456

											
										
										
											2016-02-11 06:59:27 +08:00
+								bool IRTranslator::translate(const Instruction &Inst) {
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								  CurBuilder.setDebugLoc(Inst.getDebugLoc());
-												[GlobalISel] More detailed skeleton for the IRTranslator.

llvm-svn: 260456

											
										
										
											2016-02-11 06:59:27 +08:00
+								  switch(Inst.getOpcode()) {
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								#define HANDLE_INST(NUM, OPCODE, CLASS) \
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								    case Instruction::OPCODE: return translate##OPCODE(Inst, CurBuilder);
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								#include "llvm/IR/Instruction.def"
-												[GlobalISel] Teach the IRTranslator how to lower returns.

llvm-svn: 260562

											
										
										
											2016-02-12 02:53:28 +08:00
+								  default:
-												[IRTranslator] Simplify error handling for translating constants. NFC.

We don't need to check whether the fallback path is enabled to return
false. Just do that all the time on error cases, the caller knows (or
at least should know!) how to handle the failing case.

llvm-svn: 297535

											
										
										
											2017-03-11 08:28:33 +08:00
+								    return false;
-												[GlobalISel] More detailed skeleton for the IRTranslator.

llvm-svn: 260456

											
										
										
											2016-02-11 06:59:27 +08:00
+								  }
-												[GlobalISel] Add the proper cmake plumbing.

This patch adds the necessary plumbing to cmake to build the sources related to
GlobalISel.

To build the sources related to GlobalISel, we need to add -DBUILD_GLOBAL_ISEL=ON.
By default, this is OFF, thus GlobalISel sources will not impact people that do
not explicitly opt-in.

Differential Revision: http://reviews.llvm.org/D15983

llvm-svn: 258344

											
										
										
											2016-01-21 04:58:56 +08:00
+								}
-												GlobalISel: first translation support for Constants.

For now put them all in the entry block. This should be correct but may give
poor runtime performance. Hopefully MachineSinking combined with
isReMaterializable can solve those issues, but if not the interface is sound
enough to support alternatives.

llvm-svn: 278168

											
										
										
											2016-08-10 05:28:04 +08:00
+								bool IRTranslator::translate(const Constant &C, unsigned Reg) {
-												GlobalISel: support 'undef' constant.

llvm-svn: 278174

											
										
										
											2016-08-10 07:01:30 +08:00
+								  if (auto CI = dyn_cast<ConstantInt>(&C))
-												GlobalISel: translate constants larger than 64 bits.

llvm-svn: 288713

											
										
										
											2016-12-06 05:54:17 +08:00
+								    EntryBuilder.buildConstant(Reg, *CI);
-												GlobalISel: translate floating-point constants

llvm-svn: 279311

											
										
										
											2016-08-20 04:09:15 +08:00
+								  else if (auto CF = dyn_cast<ConstantFP>(&C))
-												GlobalISel: move type information to MachineRegisterInfo.

We want each register to have a canonical type, which means the best place to
store this is in MachineRegisterInfo rather than on every MachineInstr that
happens to use or define that register.

Most changes following from this are pretty simple (you need an MRI anyway if
you're going to be doing any transformations, so just check the type there).
But legalization doesn't really want to check redundant operands (when, for
example, a G_ADD only ever has one type) so I've made use of MCInstrDesc's
operand type field to encode these constraints and limit legalization's work.

As an added bonus, more validation is possible, both in MachineVerifier and
MachineIRBuilder (coming soon).

llvm-svn: 281035

											
										
										
											2016-09-09 19:46:34 +08:00
+								    EntryBuilder.buildFConstant(Reg, *CF);
-												GlobalISel: support 'undef' constant.

llvm-svn: 278174

											
										
										
											2016-08-10 07:01:30 +08:00
+								  else if (isa<UndefValue>(C))
-												GlobalISel: add buildUndef method to MachineIRBuilder. NFC.

llvm-svn: 297044

											
										
										
											2017-03-07 02:36:40 +08:00
+								    EntryBuilder.buildUndef(Reg);
-												GlobalISel: support 'null' constant in translation.

It's sharing the integer G_CONSTANT for now since I don't *think* it creates
any ambiguity (even on weird archs). If that turns out wrong we can create a
G_PTRCONSTANT or something.

llvm-svn: 278423

											
										
										
											2016-08-12 05:40:55 +08:00
+								  else if (isa<ConstantPointerNull>(C))
-												GlobalISel: make G_CONSTANT take a ConstantInt rather than int64_t.

This makes it more similar to the floating-point constant, and also allows for
larger constants to be translated later. There's no real functional change in
this patch though, just syntax updates.

llvm-svn: 288712

											
										
										
											2016-12-06 05:47:07 +08:00
+								    EntryBuilder.buildConstant(Reg, 0);
-												GlobalISel: support translation of global addresses.

llvm-svn: 281207

											
										
										
											2016-09-12 20:10:41 +08:00
+								  else if (auto GV = dyn_cast<GlobalValue>(&C))
 								    EntryBuilder.buildGlobalValue(Reg, GV);
-												GlobalISel: Translate ConstantAggregateZero vectors

Reviewers: qcolombet, aditya_nandakumar, dsanders, ab, t.p.northover, javed.absar

Reviewed By: qcolombet

Subscribers: dberris, rovka, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30259

llvm-svn: 297509

											
										
										
											2017-03-11 05:23:13 +08:00
+								  else if (auto CAZ = dyn_cast<ConstantAggregateZero>(&C)) {
 								    if (!CAZ->getType()->isVectorTy())
 								      return false;
-												[GlobalISel] IRTranslator: Return the scalar for <1 x Ty> constant vectors

Summary:
<1 x Ty> is not a legal vector type in LLT, we shouldn’t build G_MERGE_VALUES
instruction for them.

Reviewers: qcolombet, aditya_nandakumar, dsanders, t.p.northover, ab, javed.absar

Reviewed By: qcolombet

Subscribers: dberris, rovka, kristof.beyls, llvm-commits

Differential Revision: https://reviews.llvm.org/D30948

llvm-svn: 297792

											
										
										
											2017-03-15 07:45:06 +08:00
+								    // Return the scalar if it is a <1 x Ty> vector.
 								    if (CAZ->getNumElements() == 1)
 								      return translate(*CAZ->getElementValue(0u), Reg);
-												GlobalISel: Translate ConstantAggregateZero vectors

Reviewers: qcolombet, aditya_nandakumar, dsanders, ab, t.p.northover, javed.absar

Reviewed By: qcolombet

Subscribers: dberris, rovka, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30259

llvm-svn: 297509

											
										
										
											2017-03-11 05:23:13 +08:00
+								    std::vector<unsigned> Ops;
 								    for (unsigned i = 0; i < CAZ->getNumElements(); ++i) {
 								      Constant &Elt = *CAZ->getElementValue(i);
 								      Ops.push_back(getOrCreateVReg(Elt));
 								    }
 								    EntryBuilder.buildMerge(Reg, Ops);
-												GlobalISel: Translate ConstantDataVector

Reviewers: qcolombet, aditya_nandakumar, dsanders, t.p.northover, javed.absar, ab

Reviewed By: qcolombet, dsanders, ab

Subscribers: dberris, rovka, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30216

llvm-svn: 297670

											
										
										
											2017-03-14 05:36:19 +08:00
+								  } else if (auto CV = dyn_cast<ConstantDataVector>(&C)) {
-												[GlobalISel] IRTranslator: Return the scalar for <1 x Ty> constant vectors

Summary:
<1 x Ty> is not a legal vector type in LLT, we shouldn’t build G_MERGE_VALUES
instruction for them.

Reviewers: qcolombet, aditya_nandakumar, dsanders, t.p.northover, ab, javed.absar

Reviewed By: qcolombet

Subscribers: dberris, rovka, kristof.beyls, llvm-commits

Differential Revision: https://reviews.llvm.org/D30948

llvm-svn: 297792

											
										
										
											2017-03-15 07:45:06 +08:00
+								    // Return the scalar if it is a <1 x Ty> vector.
 								    if (CV->getNumElements() == 1)
 								      return translate(*CV->getElementAsConstant(0), Reg);
-												GlobalISel: Translate ConstantDataVector

Reviewers: qcolombet, aditya_nandakumar, dsanders, t.p.northover, javed.absar, ab

Reviewed By: qcolombet, dsanders, ab

Subscribers: dberris, rovka, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30216

llvm-svn: 297670

											
										
										
											2017-03-14 05:36:19 +08:00
+								    std::vector<unsigned> Ops;
 								    for (unsigned i = 0; i < CV->getNumElements(); ++i) {
 								      Constant &Elt = *CV->getElementAsConstant(i);
 								      Ops.push_back(getOrCreateVReg(Elt));
 								    }
 								    EntryBuilder.buildMerge(Reg, Ops);
-												GlobalISel: Translate ConstantAggregateZero vectors

Reviewers: qcolombet, aditya_nandakumar, dsanders, ab, t.p.northover, javed.absar

Reviewed By: qcolombet

Subscribers: dberris, rovka, llvm-commits, kristof.beyls

Differential Revision: https://reviews.llvm.org/D30259

llvm-svn: 297509

											
										
										
											2017-03-11 05:23:13 +08:00
+								  } else if (auto CE = dyn_cast<ConstantExpr>(&C)) {
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								    switch(CE->getOpcode()) {
 								#define HANDLE_INST(NUM, OPCODE, CLASS)                         \
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								      case Instruction::OPCODE: return translate##OPCODE(*CE, EntryBuilder);
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								#include "llvm/IR/Instruction.def"
 								    default:
-												[IRTranslator] Simplify error handling for translating constants. NFC.

We don't need to check whether the fallback path is enabled to return
false. Just do that all the time on error cases, the caller knows (or
at least should know!) how to handle the failing case.

llvm-svn: 297535

											
										
										
											2017-03-11 08:28:33 +08:00
+								      return false;
-												GlobalISel: support same ConstantExprs as Instructions.

It's more than just inttoptr, but the others can't be tested until we have
support for non-trivial constants (they currently get unavoidably folded to a
ConstantInt).

llvm-svn: 278303

											
										
										
											2016-08-11 07:02:41 +08:00
+								    }
-												[GlobalISel] IRTranslator: Translate ConstantStruct

Reviewers: qcolombet, ab, t.p.northover, aditya_nandakumar, dsanders

Reviewed By: qcolombet

Subscribers: rovka, kristof.beyls, javed.absar, igorb, llvm-commits

Differential Revision: https://reviews.llvm.org/D33317

llvm-svn: 303412

											
										
										
											2017-05-19 17:47:02 +08:00
+								  } else if (auto CS = dyn_cast<ConstantStruct>(&C)) {
 								    // Return the element if it is a single element ConstantStruct.
 								    if (CS->getNumOperands() == 1) {
 								      unsigned EltReg = getOrCreateVReg(*CS->getOperand(0));
 								      EntryBuilder.buildCast(Reg, EltReg);
 								      return true;
 								    }
 								    SmallVector<unsigned, 4> Ops;
 								    SmallVector<uint64_t, 4> Indices;
 								    uint64_t Offset = 0;
 								    for (unsigned i = 0; i < CS->getNumOperands(); ++i) {
 								      unsigned OpReg = getOrCreateVReg(*CS->getOperand(i));
 								      Ops.push_back(OpReg);
 								      Indices.push_back(Offset);
 								      Offset += MRI->getType(OpReg).getSizeInBits();
 								    }
 								    EntryBuilder.buildSequence(Reg, Ops, Indices);
-												[GISel]: Add support to translate ConstantVectors

Reviewed by Quentin
https://reviews.llvm.org/D32814

llvm-svn: 302196

											
										
										
											2017-05-05 05:43:12 +08:00
+								  } else if (auto CV = dyn_cast<ConstantVector>(&C)) {
 								    if (CV->getNumOperands() == 1)
 								      return translate(*CV->getOperand(0), Reg);
 								    SmallVector<unsigned, 4> Ops;
 								    for (unsigned i = 0; i < CV->getNumOperands(); ++i) {
 								      Ops.push_back(getOrCreateVReg(*CV->getOperand(i)));
 								    }
 								    EntryBuilder.buildMerge(Reg, Ops);
-												[IRTranslator] Simplify error handling for translating constants. NFC.

We don't need to check whether the fallback path is enabled to return
false. Just do that all the time on error cases, the caller knows (or
at least should know!) how to handle the failing case.

llvm-svn: 297535

											
										
										
											2017-03-11 08:28:33 +08:00
+								  } else
-												[IRTranslator] Do not abort when the target wants to fall back.

Every pass in the GlobalISel pipeline will need to do something similar.

llvm-svn: 279886

											
										
										
											2016-08-27 07:49:05 +08:00
+								    return false;
-												GlobalISel: first translation support for Constants.

For now put them all in the entry block. This should be correct but may give
poor runtime performance. Hopefully MachineSinking combined with
isReMaterializable can solve those issues, but if not the interface is sound
enough to support alternatives.

llvm-svn: 278168

											
										
										
											2016-08-10 05:28:04 +08:00
-												GlobalISel: support 'undef' constant.

llvm-svn: 278174

											
										
										
											2016-08-10 07:01:30 +08:00
+								  return true;
-												GlobalISel: first translation support for Constants.

For now put them all in the entry block. This should be correct but may give
poor runtime performance. Hopefully MachineSinking combined with
isReMaterializable can solve those issues, but if not the interface is sound
enough to support alternatives.

llvm-svn: 278168

											
										
										
											2016-08-10 05:28:04 +08:00
+								}
-												GlobalISel: clear vreg mapping after translating each function

Otherwise we only materialize (shared) constants in the first function they
appear in. This doesn't go well.

llvm-svn: 278351

											
										
										
											2016-08-12 00:21:29 +08:00
+								void IRTranslator::finalizeFunction() {
-												[GlobalISel] More detailed skeleton for the IRTranslator.

llvm-svn: 260456

											
										
										
											2016-02-11 06:59:27 +08:00
+								  // Release the memory used by the different maps we
 								  // needed during the translation.
-												GlobalISel: avoid looking too closely at PHIs when we bail.

The function used to finish off PHIs by adding the relevant basic blocks can
fail if we're aborting and still don't actually have the needed
MachineBasicBlocks. So avoid trying in that case.

llvm-svn: 288727

											
										
										
											2016-12-06 07:10:19 +08:00
+								  PendingPHIs.clear();
-												[IRTranslator] Use a single virtual register to represent any Value.
PR26161.

llvm-svn: 260602

											
										
										
											2016-02-12 05:48:32 +08:00
+								  ValToVReg.clear();
-												GlobalISel: translate stack protector intrinsics

llvm-svn: 285614

											
										
										
											2016-11-01 02:30:59 +08:00
+								  FrameIndices.clear();
-												[GlobalISel] track predecessor mapping during switch lowering.

Correctly populating Machine PHIs relies on knowing exactly how the IR level
CFG was lowered to MachineIR. This needs to be tracked by any translation
phases that meddle (currently only SwitchInst handling).

This reapplies r291973 which was reverted because of testing failures. Fixes:

 + Don't return an ArrayRef to a local temporary.
 + Incorporate Kristof's suggested comment improvements.

llvm-svn: 292278

											
										
										
											2017-01-18 06:13:50 +08:00
+								  MachinePreds.clear();
-												[GISel]: Fix undefined behavior in IRTranslator

Make sure IRTranslator->MachineIRBuilder->DebugLoc doesn't
outlive the DILocation. Clear it at the end of
IRTranslator::runOnMachineFunction

llvm-svn: 303277

											
										
										
											2017-05-18 01:41:55 +08:00
+								  // MachineIRBuilder::DebugLoc can outlive the DILocation it holds. Clear it
 								  // to avoid accessing free’d memory (in runOnMachineFunction) and to avoid
 								  // destroying it twice (in ~IRTranslator() and ~LLVMContext())
 								  EntryBuilder = MachineIRBuilder();
 								  CurBuilder = MachineIRBuilder();
-												[GlobalISel] Add the proper cmake plumbing.

This patch adds the necessary plumbing to cmake to build the sources related to
GlobalISel.

To build the sources related to GlobalISel, we need to add -DBUILD_GLOBAL_ISEL=ON.
By default, this is OFF, thus GlobalISel sources will not impact people that do
not explicitly opt-in.

Differential Revision: http://reviews.llvm.org/D15983

llvm-svn: 258344

											
										
										
											2016-01-21 04:58:56 +08:00
+								}
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								bool IRTranslator::runOnMachineFunction(MachineFunction &CurMF) {
 								  MF = &CurMF;
 								  const Function &F = *MF->getFunction();
-												[GlobalISel] Add the necessary plumbing to lower formal arguments.

llvm-svn: 260579

											
										
										
											2016-02-12 03:59:41 +08:00
+								  if (F.empty())
 								    return false;
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								  CLI = MF->getSubtarget().getCallLowering();
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								  CurBuilder.setMF(*MF);
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								  EntryBuilder.setMF(*MF);
 								  MRI = &MF->getRegInfo();
-												GlobalISel: implement alloca instruction

llvm-svn: 276433

											
										
										
											2016-07-23 00:59:52 +08:00
+								  DL = &F.getParent()->getDataLayout();
-												[IRTranslator] Do not abort when the target wants to fall back.

Every pass in the GlobalISel pipeline will need to do something similar.

llvm-svn: 279886

											
										
										
											2016-08-27 07:49:05 +08:00
+								  TPC = &getAnalysis<TargetPassConfig>();
-												[CodeGen] Fix some Clang-tidy modernize-use-using and Include What You Use warnings; other minor fixes (NFC).

llvm-svn: 306341

											
										
										
											2017-06-27 06:44:03 +08:00
+								  ORE = llvm::make_unique<OptimizationRemarkEmitter>(&F);
-												GlobalISel: implement alloca instruction

llvm-svn: 276433

											
										
										
											2016-07-23 00:59:52 +08:00
-												GlobalISel: clear pending phis after MachineFunction translated

Test is just reordering the existing functions (it would trigger for any
function after one with a phi).

llvm-svn: 277841

											
										
										
											2016-08-06 01:50:36 +08:00
+								  assert(PendingPHIs.empty() && "stale PHIs");
-												[GlobalISel] Finalize translated function on scope exit. NFC.

This is the compromise between having a per-function IRTranslator
and manually managing the per-function state.

llvm-svn: 296046

											
										
										
											2017-02-24 07:57:28 +08:00
+								  // Release the per-function state when we return, whether we succeeded or not.
 								  auto FinalizeOnReturn = make_scope_exit([this]() { finalizeFunction(); });
-												[GlobalISel] Preserve IR block layout.

It makes the output function layout more predictable;  the layout has
an effect on performance, we don't want it to be at the mercy of the
translator's visitation order and such.
The predictable output is also easier to digest.

getOrCreateBB isn't appropriately named anymore, as it never needs to
create anything.  Rename it and extract the MBB creation logic out of it.

A couple tests were sensitive to the order. Update them.

llvm-svn: 297868

											
										
										
											2017-03-16 02:22:33 +08:00
+								  // Setup a separate basic-block for the arguments and constants
-												GlobalISel: store the current MachineFunction as direct state. NFC.

Having to ask the MIRBuilder for the current function is a little awkward, and
I'm intending to improve how that's threaded through anyway.

llvm-svn: 288983

											
										
										
											2016-12-08 05:17:47 +08:00
+								  MachineBasicBlock *EntryBB = MF->CreateMachineBasicBlock();
 								  MF->push_back(EntryBB);
-												GlobalISel: simplify MachineIRBuilder interface.

MachineIRBuilder had weird before/after and beginning/end flags for the insert
point. Unfortunately the non-default means that instructions will be inserted
in reverse order which is almost never what anyone wants.

Really, I think we just want (like IRBuilder has) the ability to insert at any
C++ iterator-style point (i.e. before any instruction or before MBB.end()). So
this fixes MIRBuilders to behave like IRBuilders in this respect.

llvm-svn: 288980

											
										
										
											2016-12-08 05:05:38 +08:00
+								  EntryBuilder.setMBB(*EntryBB);
-												[GlobalISel] Preserve IR block layout.

It makes the output function layout more predictable;  the layout has
an effect on performance, we don't want it to be at the mercy of the
translator's visitation order and such.
The predictable output is also easier to digest.

getOrCreateBB isn't appropriately named anymore, as it never needs to
create anything.  Rename it and extract the MBB creation logic out of it.

A couple tests were sensitive to the order. Update them.

llvm-svn: 297868

											
										
										
											2017-03-16 02:22:33 +08:00
+								  // Create all blocks, in IR order, to preserve the layout.
 								  for (const BasicBlock &BB: F) {
 								    auto *&MBB = BBToMBB[&BB];
 								    MBB = MF->CreateMachineBasicBlock(&BB);
 								    MF->push_back(MBB);
 								    if (BB.hasAddressTaken())
 								      MBB->setHasAddressTaken();
 								  }
 								  // Make our arguments/constants entry block fallthrough to the IR entry block.
 								  EntryBB->addSuccessor(&getMBB(F.front()));
-												GlobalISel: simplify MachineIRBuilder interface.

MachineIRBuilder had weird before/after and beginning/end flags for the insert
point. Unfortunately the non-default means that instructions will be inserted
in reverse order which is almost never what anyone wants.

Really, I think we just want (like IRBuilder has) the ability to insert at any
C++ iterator-style point (i.e. before any instruction or before MBB.end()). So
this fixes MIRBuilders to behave like IRBuilders in this respect.

llvm-svn: 288980

											
										
										
											2016-12-08 05:05:38 +08:00
+								  // Lower the actual args into this basic block.
-												[GlobalISel] Add the necessary plumbing to lower formal arguments.

llvm-svn: 260579

											
										
										
											2016-02-12 03:59:41 +08:00
+								  SmallVector<unsigned, 8> VRegArgs;
 								  for (const Argument &Arg: F.args())
-												[IRTranslator] Update getOrCreateVReg API to use references.
A value that we want to keep in a virtual register cannot be null.
Reflect that in the API.

llvm-svn: 263263

											
										
										
											2016-03-12 01:27:54 +08:00
+								    VRegArgs.push_back(getOrCreateVReg(Arg));
-												[GlobalISel] Remove now-unnecessary variable. NFC.

Since r296047, we're able to return early on failures.
Don't track whether we succeeded.

llvm-svn: 296057

											
										
										
											2017-02-24 08:34:41 +08:00
+								  if (!CLI->lowerFormalArguments(EntryBuilder, F, VRegArgs)) {
-												[GlobalISel] Use the DISubprogram for translation failure remarks.

Justin added support for DISubprogram locs in r295531 and r296052.
Use that instead of no-loc for constants and arguments.

llvm-svn: 296058

											
										
										
											2017-02-24 08:34:44 +08:00
+								    OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
 								                               MF->getFunction()->getSubprogram(),
-												[GlobalISel] Emit opt remarks on isel fallbacks.

Having more fine-grained information on the specific construct that
caused us to fallback is valuable for large-scale data collection.

We still have the fallback warning, that's also used for FastISel.
We still need to remove the fallback warning, and teach FastISel to also
emit remarks (it currently has a combination of the warning, stats, and
debug prints: the remarks could unify all three).

The abort-on-fallback path could also be better handled using remarks:
one could imagine a "-Rpass-error", analogous to "-Werror", which would
promote missed/failed remarks to errors.  It's not clear whether that
would be useful for other remarks though, so we're not there yet.

llvm-svn: 296013

											
										
										
											2017-02-24 05:05:42 +08:00
+								                               &MF->getFunction()->getEntryBlock());
 								    R << "unable to lower arguments: " << ore::NV("Prototype", F.getType());
 								    reportTranslationError(*MF, *TPC, *ORE, R);
 								    return false;
-												[IRTranslator] Do not abort when the target wants to fall back.

Every pass in the GlobalISel pipeline will need to do something similar.

llvm-svn: 279886

											
										
										
											2016-08-27 07:49:05 +08:00
+								  }
-												[GlobalISel] Add the necessary plumbing to lower formal arguments.

llvm-svn: 260579

											
										
										
											2016-02-12 03:59:41 +08:00
-												GlobalISel: simplify MachineIRBuilder interface.

MachineIRBuilder had weird before/after and beginning/end flags for the insert
point. Unfortunately the non-default means that instructions will be inserted
in reverse order which is almost never what anyone wants.

Really, I think we just want (like IRBuilder has) the ability to insert at any
C++ iterator-style point (i.e. before any instruction or before MBB.end()). So
this fixes MIRBuilders to behave like IRBuilders in this respect.

llvm-svn: 288980

											
										
										
											2016-12-08 05:05:38 +08:00
+								  // And translate the function!
-												[GlobalISel] More detailed skeleton for the IRTranslator.

llvm-svn: 260456

											
										
										
											2016-02-11 06:59:27 +08:00
+								  for (const BasicBlock &BB: F) {
-												[GlobalISel] Preserve IR block layout.

It makes the output function layout more predictable;  the layout has
an effect on performance, we don't want it to be at the mercy of the
translator's visitation order and such.
The predictable output is also easier to digest.

getOrCreateBB isn't appropriately named anymore, as it never needs to
create anything.  Rename it and extract the MBB creation logic out of it.

A couple tests were sensitive to the order. Update them.

llvm-svn: 297868

											
										
										
											2017-03-16 02:22:33 +08:00
+								    MachineBasicBlock &MBB = getMBB(BB);
-												[MachineIRBuilder] Rename the setter for MBB for consistency with the getter.

llvm-svn: 263261

											
										
										
											2016-03-12 01:27:47 +08:00
+								    // Set the insertion point of all the following translations to
 								    // the end of this basic block.
-												GlobalISel: use correct builder for ConstantExprs.

ConstantExpr instances were emitting code into the current block rather than
the entry block. This meant they didn't necessarily dominate all uses, which is
clearly wrong.

llvm-svn: 288985

											
										
										
											2016-12-08 05:29:15 +08:00
+								    CurBuilder.setMBB(MBB);
-												GlobalISel: translate invoke and landingpad instructions

Pretty bare-bones support for exception handling (no weird MSVC stuff, no SjLj
etc), but it should get things going.

llvm-svn: 286407

											
										
										
											2016-11-10 06:39:54 +08:00
-												[GlobalISel] More detailed skeleton for the IRTranslator.

llvm-svn: 260456

											
										
										
											2016-02-11 06:59:27 +08:00
+								    for (const Instruction &Inst: BB) {
-												[GlobalISel] Remove now-unnecessary variable. NFC.

Since r296047, we're able to return early on failures.
Don't track whether we succeeded.

llvm-svn: 296057

											
										
										
											2017-02-24 08:34:41 +08:00
+								      if (translate(Inst))
 								        continue;
 								      std::string InstStrStorage;
 								      raw_string_ostream InstStr(InstStrStorage);
 								      InstStr << Inst;
-												[GlobalISel] Use the same name for all remarks.

While there, switch to the explicit ctor.

llvm-svn: 296059

											
										
										
											2017-02-24 08:34:47 +08:00
+								      OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
 								                                 Inst.getDebugLoc(), &BB);
-												[GlobalISel] Remove now-unnecessary variable. NFC.

Since r296047, we're able to return early on failures.
Don't track whether we succeeded.

llvm-svn: 296057

											
										
										
											2017-02-24 08:34:41 +08:00
+								      R << "unable to translate instruction: " << ore::NV("Opcode", &Inst)
 								        << ": '" << InstStr.str() << "'";
 								      reportTranslationError(*MF, *TPC, *ORE, R);
 								      return false;
-												[GlobalISel] More detailed skeleton for the IRTranslator.

llvm-svn: 260456

											
										
										
											2016-02-11 06:59:27 +08:00
+								    }
 								  }
-												GlobalISel: freeze reserved regs after IRTranslator.

We can freeze the registers after the MachineFrameInfo has been configured (by
telling it about calls, inline asm, ...). This doesn't happen at all yet, but
will be part of IR translation.

Fixes -verify-machineinstrs assertion.

llvm-svn: 275221

											
										
										
											2016-07-13 06:23:42 +08:00
-												[GlobalISel] Don't translate other blocks when one failed.

We were stopping the translation of the parent block when the
translation of an instruction failed, but we were still trying to
translate the other blocks of the parent function.

Don't do that.

llvm-svn: 296047

											
										
										
											2017-02-24 07:57:36 +08:00
+								  finishPendingPhis();
 								  // Merge the argument lowering and constants block with its single
 								  // successor, the LLVM-IR entry block.  We want the basic block to
 								  // be maximal.
 								  assert(EntryBB->succ_size() == 1 &&
 								         "Custom BB used for lowering should have only one successor");
 								  // Get the successor of the current entry block.
 								  MachineBasicBlock &NewEntryBB = **EntryBB->succ_begin();
 								  assert(NewEntryBB.pred_size() == 1 &&
 								         "LLVM-IR entry block has a predecessor!?");
 								  // Move all the instruction from the current entry block to the
 								  // new entry block.
 								  NewEntryBB.splice(NewEntryBB.begin(), EntryBB, EntryBB->begin(),
 								                    EntryBB->end());
 								  // Update the live-in information for the new entry block.
 								  for (const MachineBasicBlock::RegisterMaskPair &LiveIn : EntryBB->liveins())
 								    NewEntryBB.addLiveIn(LiveIn);
 								  NewEntryBB.sortUniqueLiveIns();
 								  // Get rid of the now empty basic block.
 								  EntryBB->removeSuccessor(&NewEntryBB);
 								  MF->remove(EntryBB);
 								  MF->DeleteMachineBasicBlock(EntryBB);
 								  assert(&MF->front() == &NewEntryBB &&
 								         "New entry wasn't next in the list of basic block!");
-												GlobalISel: IRTranslate PHI instructions

llvm-svn: 277835

											
										
										
											2016-08-06 01:16:40 +08:00
-												[GlobalISel] Add the proper cmake plumbing.

This patch adds the necessary plumbing to cmake to build the sources related to
GlobalISel.

To build the sources related to GlobalISel, we need to add -DBUILD_GLOBAL_ISEL=ON.
By default, this is OFF, thus GlobalISel sources will not impact people that do
not explicitly opt-in.

Differential Revision: http://reviews.llvm.org/D15983

llvm-svn: 258344

											
										
										
											2016-01-21 04:58:56 +08:00
+								  return false;
 								}