//===-- NVPTXAsmPrinter.cpp - NVPTX LLVM assembly writer ------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file contains a printer that converts from our internal representation
// of machine-dependent LLVM code to NVPTX assembly language.
//
//===----------------------------------------------------------------------===//
|
|
|
|
|
2012-06-28 08:05:13 +08:00
|
|
|
#include "NVPTXAsmPrinter.h"
|
2014-01-07 19:48:04 +08:00
|
|
|
#include "InstPrinter/NVPTXInstPrinter.h"
|
2012-12-04 00:50:05 +08:00
|
|
|
#include "MCTargetDesc/NVPTXMCAsmInfo.h"
|
2012-05-05 04:18:50 +08:00
|
|
|
#include "NVPTX.h"
|
|
|
|
#include "NVPTXInstrInfo.h"
|
2013-08-06 22:13:27 +08:00
|
|
|
#include "NVPTXMCExpr.h"
|
2015-01-14 19:23:27 +08:00
|
|
|
#include "NVPTXMachineFunctionInfo.h"
|
2012-05-05 04:18:50 +08:00
|
|
|
#include "NVPTXRegisterInfo.h"
|
2012-12-04 00:50:05 +08:00
|
|
|
#include "NVPTXTargetMachine.h"
|
2012-06-28 08:05:13 +08:00
|
|
|
#include "NVPTXUtilities.h"
|
2012-12-04 00:50:05 +08:00
|
|
|
#include "cl_common_defines.h"
|
2012-05-05 04:18:50 +08:00
|
|
|
#include "llvm/ADT/StringExtras.h"
|
2012-12-04 00:50:05 +08:00
|
|
|
#include "llvm/Analysis/ConstantFolding.h"
|
2012-05-05 04:18:50 +08:00
|
|
|
#include "llvm/CodeGen/Analysis.h"
|
|
|
|
#include "llvm/CodeGen/MachineFrameInfo.h"
|
2015-02-01 10:27:45 +08:00
|
|
|
#include "llvm/CodeGen/MachineLoopInfo.h"
|
2012-05-05 04:18:50 +08:00
|
|
|
#include "llvm/CodeGen/MachineModuleInfo.h"
|
2012-12-04 00:50:05 +08:00
|
|
|
#include "llvm/CodeGen/MachineRegisterInfo.h"
|
2014-03-06 08:46:21 +08:00
|
|
|
#include "llvm/IR/DebugInfo.h"
|
2013-01-02 19:36:10 +08:00
|
|
|
#include "llvm/IR/DerivedTypes.h"
|
|
|
|
#include "llvm/IR/Function.h"
|
|
|
|
#include "llvm/IR/GlobalVariable.h"
|
2014-01-08 05:19:40 +08:00
|
|
|
#include "llvm/IR/Mangler.h"
|
2013-01-02 19:36:10 +08:00
|
|
|
#include "llvm/IR/Module.h"
|
|
|
|
#include "llvm/IR/Operator.h"
|
2012-05-05 04:18:50 +08:00
|
|
|
#include "llvm/MC/MCStreamer.h"
|
|
|
|
#include "llvm/MC/MCSymbol.h"
|
2012-12-04 00:50:05 +08:00
|
|
|
#include "llvm/Support/CommandLine.h"
|
2012-05-05 04:18:50 +08:00
|
|
|
#include "llvm/Support/ErrorHandling.h"
|
|
|
|
#include "llvm/Support/FormattedStream.h"
|
|
|
|
#include "llvm/Support/Path.h"
|
2012-12-04 00:50:05 +08:00
|
|
|
#include "llvm/Support/TargetRegistry.h"
|
|
|
|
#include "llvm/Support/TimeValue.h"
|
|
|
|
#include "llvm/Target/TargetLoweringObjectFile.h"
|
2015-02-01 10:27:45 +08:00
|
|
|
#include "llvm/Transforms/Utils/UnrollLoop.h"
|
2012-06-28 08:05:13 +08:00
|
|
|
#include <sstream>
|
2012-05-05 04:18:50 +08:00
|
|
|
using namespace llvm;
|
|
|
|
|
|
|
|
#define DEPOTNAME "__local_depot"
|
|
|
|
|
|
|
|
// Hidden command-line switch, on by default. When it is off,
// emitLineNumberAsDotLoc() returns without emitting anything.
static cl::opt<bool> EmitLineNumbers(
    "nvptx-emit-line-numbers", cl::Hidden,
    cl::desc("NVPTX Specific: Emit Line numbers even without -G"),
    cl::init(true));
|
|
|
|
|
2013-10-27 19:31:46 +08:00
|
|
|
// Hidden command-line switch, off by default. When it is on,
// emitLineNumberAsDotLoc() also calls emitSrcInText() for the current
// file/line before writing the .loc directive.
static cl::opt<bool> InterleaveSrc(
    "nvptx-emit-src", cl::ZeroOrMore, cl::Hidden,
    cl::desc("NVPTX Specific: Emit source line in ptx file"),
    cl::init(false));
|
2012-05-05 04:18:50 +08:00
|
|
|
|
2012-11-17 05:03:51 +08:00
|
|
|
namespace {
|
|
|
|
/// DiscoverDependentGlobals - Return a set of GlobalVariables on which \p V
|
|
|
|
/// depends.
|
2013-05-20 20:13:32 +08:00
|
|
|
void DiscoverDependentGlobals(const Value *V,
|
|
|
|
DenseSet<const GlobalVariable *> &Globals) {
|
|
|
|
if (const GlobalVariable *GV = dyn_cast<GlobalVariable>(V))
|
2012-11-17 05:03:51 +08:00
|
|
|
Globals.insert(GV);
|
|
|
|
else {
|
2013-05-20 20:13:32 +08:00
|
|
|
if (const User *U = dyn_cast<User>(V)) {
|
2012-11-17 05:03:51 +08:00
|
|
|
for (unsigned i = 0, e = U->getNumOperands(); i != e; ++i) {
|
|
|
|
DiscoverDependentGlobals(U->getOperand(i), Globals);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2012-05-05 04:18:50 +08:00
|
|
|
|
2012-11-17 05:03:51 +08:00
|
|
|
/// VisitGlobalVariableForEmission - Add \p GV to the list of GlobalVariable
|
|
|
|
/// instances to be emitted, but only after any dependents have been added
|
|
|
|
/// first.
|
2013-03-30 22:29:21 +08:00
|
|
|
void VisitGlobalVariableForEmission(
|
2013-05-20 20:13:32 +08:00
|
|
|
const GlobalVariable *GV, SmallVectorImpl<const GlobalVariable *> &Order,
|
|
|
|
DenseSet<const GlobalVariable *> &Visited,
|
|
|
|
DenseSet<const GlobalVariable *> &Visiting) {
|
2012-11-17 05:03:51 +08:00
|
|
|
// Have we already visited this one?
|
2013-03-30 22:29:21 +08:00
|
|
|
if (Visited.count(GV))
|
|
|
|
return;
|
2012-11-17 05:03:51 +08:00
|
|
|
|
|
|
|
// Do we have a circular dependency?
|
2014-10-10 23:32:50 +08:00
|
|
|
if (!Visiting.insert(GV).second)
|
2012-11-17 05:03:51 +08:00
|
|
|
report_fatal_error("Circular dependency found in global variable set");
|
|
|
|
|
|
|
|
// Make sure we visit all dependents first
|
2013-05-20 20:13:32 +08:00
|
|
|
DenseSet<const GlobalVariable *> Others;
|
2012-11-17 05:03:51 +08:00
|
|
|
for (unsigned i = 0, e = GV->getNumOperands(); i != e; ++i)
|
|
|
|
DiscoverDependentGlobals(GV->getOperand(i), Others);
|
2013-03-30 22:29:21 +08:00
|
|
|
|
2013-05-20 20:13:32 +08:00
|
|
|
for (DenseSet<const GlobalVariable *>::iterator I = Others.begin(),
|
|
|
|
E = Others.end();
|
2013-03-30 22:29:21 +08:00
|
|
|
I != E; ++I)
|
2012-11-17 05:03:51 +08:00
|
|
|
VisitGlobalVariableForEmission(*I, Order, Visited, Visiting);
|
|
|
|
|
|
|
|
// Now we can visit ourself
|
|
|
|
Order.push_back(GV);
|
|
|
|
Visited.insert(GV);
|
|
|
|
Visiting.erase(GV);
|
|
|
|
}
|
|
|
|
}
|
2012-05-05 04:18:50 +08:00
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
void NVPTXAsmPrinter::emitLineNumberAsDotLoc(const MachineInstr &MI) {
|
2012-05-05 04:18:50 +08:00
|
|
|
if (!EmitLineNumbers)
|
|
|
|
return;
|
|
|
|
if (ignoreLoc(MI))
|
|
|
|
return;
|
|
|
|
|
|
|
|
DebugLoc curLoc = MI.getDebugLoc();
|
|
|
|
|
2015-03-31 03:14:47 +08:00
|
|
|
if (!prevDebugLoc && !curLoc)
|
2012-05-05 04:18:50 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
if (prevDebugLoc == curLoc)
|
|
|
|
return;
|
|
|
|
|
|
|
|
prevDebugLoc = curLoc;
|
|
|
|
|
2015-03-31 03:14:47 +08:00
|
|
|
if (!curLoc)
|
2012-05-05 04:18:50 +08:00
|
|
|
return;
|
|
|
|
|
2015-04-16 09:37:00 +08:00
|
|
|
auto *Scope = cast_or_null<MDScope>(curLoc.getScope());
|
2013-06-28 13:43:10 +08:00
|
|
|
if (!Scope)
|
|
|
|
return;
|
2012-05-05 04:18:50 +08:00
|
|
|
|
2015-04-16 09:37:00 +08:00
|
|
|
StringRef fileName(Scope->getFilename());
|
|
|
|
StringRef dirName(Scope->getDirectory());
|
2012-05-05 04:18:50 +08:00
|
|
|
SmallString<128> FullPathName = dirName;
|
|
|
|
if (!dirName.empty() && !sys::path::is_absolute(fileName)) {
|
|
|
|
sys::path::append(FullPathName, fileName);
|
2015-03-30 23:42:36 +08:00
|
|
|
fileName = FullPathName;
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
2015-03-30 23:42:36 +08:00
|
|
|
if (filenameMap.find(fileName) == filenameMap.end())
|
2012-05-05 04:18:50 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
// Emit the line from the source file.
|
2013-10-27 19:31:46 +08:00
|
|
|
if (InterleaveSrc)
|
2015-03-30 23:42:36 +08:00
|
|
|
this->emitSrcInText(fileName, curLoc.getLine());
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
std::stringstream temp;
|
2015-03-30 23:42:36 +08:00
|
|
|
temp << "\t.loc " << filenameMap[fileName] << " " << curLoc.getLine()
|
2013-03-30 22:29:21 +08:00
|
|
|
<< " " << curLoc.getCol();
|
2015-04-25 03:11:51 +08:00
|
|
|
OutStreamer->EmitRawText(temp.str());
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::EmitInstruction(const MachineInstr *MI) {
|
|
|
|
SmallString<128> Str;
|
|
|
|
raw_svector_ostream OS(Str);
|
2015-02-19 08:08:23 +08:00
|
|
|
if (static_cast<NVPTXTargetMachine &>(TM).getDrvInterface() == NVPTX::CUDA)
|
2012-05-05 04:18:50 +08:00
|
|
|
emitLineNumberAsDotLoc(*MI);
|
2013-08-06 22:13:27 +08:00
|
|
|
|
|
|
|
MCInst Inst;
|
|
|
|
lowerToMCInst(MI, Inst);
|
2015-04-25 03:11:51 +08:00
|
|
|
EmitToStreamer(*OutStreamer, Inst);
|
2013-08-06 22:13:27 +08:00
|
|
|
}
|
|
|
|
|
2014-04-09 23:39:15 +08:00
|
|
|
// Handle symbol backtracking for targets that do not support image handles
|
|
|
|
bool NVPTXAsmPrinter::lowerImageHandleOperand(const MachineInstr *MI,
|
|
|
|
unsigned OpNo, MCOperand &MCOp) {
|
|
|
|
const MachineOperand &MO = MI->getOperand(OpNo);
|
2014-07-17 19:59:04 +08:00
|
|
|
const MCInstrDesc &MCID = MI->getDesc();
|
2014-04-09 23:39:15 +08:00
|
|
|
|
2014-07-17 19:59:04 +08:00
|
|
|
if (MCID.TSFlags & NVPTXII::IsTexFlag) {
|
2014-04-09 23:39:15 +08:00
|
|
|
// This is a texture fetch, so operand 4 is a texref and operand 5 is
|
|
|
|
// a samplerref
|
2014-07-17 19:59:04 +08:00
|
|
|
if (OpNo == 4 && MO.isImm()) {
|
2014-04-09 23:39:15 +08:00
|
|
|
lowerImageHandleSymbol(MO.getImm(), MCOp);
|
|
|
|
return true;
|
|
|
|
}
|
2014-07-17 19:59:04 +08:00
|
|
|
if (OpNo == 5 && MO.isImm() && !(MCID.TSFlags & NVPTXII::IsTexModeUnifiedFlag)) {
|
2014-04-09 23:39:15 +08:00
|
|
|
lowerImageHandleSymbol(MO.getImm(), MCOp);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
2014-07-17 19:59:04 +08:00
|
|
|
} else if (MCID.TSFlags & NVPTXII::IsSuldMask) {
|
|
|
|
unsigned VecSize =
|
|
|
|
1 << (((MCID.TSFlags & NVPTXII::IsSuldMask) >> NVPTXII::IsSuldShift) - 1);
|
2014-04-09 23:39:15 +08:00
|
|
|
|
2014-07-17 19:59:04 +08:00
|
|
|
// For a surface load of vector size N, the Nth operand will be the surfref
|
|
|
|
if (OpNo == VecSize && MO.isImm()) {
|
2014-04-09 23:39:15 +08:00
|
|
|
lowerImageHandleSymbol(MO.getImm(), MCOp);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
2014-07-17 19:59:04 +08:00
|
|
|
} else if (MCID.TSFlags & NVPTXII::IsSustFlag) {
|
2014-04-09 23:39:15 +08:00
|
|
|
// This is a surface store, so operand 0 is a surfref
|
2014-07-17 19:59:04 +08:00
|
|
|
if (OpNo == 0 && MO.isImm()) {
|
2014-04-09 23:39:15 +08:00
|
|
|
lowerImageHandleSymbol(MO.getImm(), MCOp);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
2014-07-17 19:59:04 +08:00
|
|
|
} else if (MCID.TSFlags & NVPTXII::IsSurfTexQueryFlag) {
|
2014-04-09 23:39:15 +08:00
|
|
|
// This is a query, so operand 1 is a surfref/texref
|
2014-07-17 19:59:04 +08:00
|
|
|
if (OpNo == 1 && MO.isImm()) {
|
2014-04-09 23:39:15 +08:00
|
|
|
lowerImageHandleSymbol(MO.getImm(), MCOp);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
2014-07-17 19:59:04 +08:00
|
|
|
|
|
|
|
return false;
|
2014-04-09 23:39:15 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::lowerImageHandleSymbol(unsigned Index, MCOperand &MCOp) {
|
|
|
|
// Ewwww
|
|
|
|
TargetMachine &TM = const_cast<TargetMachine&>(MF->getTarget());
|
|
|
|
NVPTXTargetMachine &nvTM = static_cast<NVPTXTargetMachine&>(TM);
|
|
|
|
const NVPTXMachineFunctionInfo *MFI = MF->getInfo<NVPTXMachineFunctionInfo>();
|
|
|
|
const char *Sym = MFI->getImageHandleSymbol(Index);
|
|
|
|
std::string *SymNamePtr =
|
|
|
|
nvTM.getManagedStrPool()->getManagedString(Sym);
|
|
|
|
MCOp = GetSymbolRef(OutContext.GetOrCreateSymbol(
|
|
|
|
StringRef(SymNamePtr->c_str())));
|
|
|
|
}
|
|
|
|
|
2013-08-06 22:13:27 +08:00
|
|
|
void NVPTXAsmPrinter::lowerToMCInst(const MachineInstr *MI, MCInst &OutMI) {
|
|
|
|
OutMI.setOpcode(MI->getOpcode());
|
2013-11-15 20:30:04 +08:00
|
|
|
// Special: Do not mangle symbol operand of CALL_PROTOTYPE
|
|
|
|
if (MI->getOpcode() == NVPTX::CALL_PROTOTYPE) {
|
|
|
|
const MachineOperand &MO = MI->getOperand(0);
|
2014-04-09 23:39:15 +08:00
|
|
|
OutMI.addOperand(GetSymbolRef(
|
2013-11-15 20:30:04 +08:00
|
|
|
OutContext.GetOrCreateSymbol(Twine(MO.getSymbolName()))));
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2013-08-06 22:13:27 +08:00
|
|
|
for (unsigned i = 0, e = MI->getNumOperands(); i != e; ++i) {
|
|
|
|
const MachineOperand &MO = MI->getOperand(i);
|
|
|
|
|
|
|
|
MCOperand MCOp;
|
2015-02-19 08:08:14 +08:00
|
|
|
if (!nvptxSubtarget->hasImageHandles()) {
|
2014-04-09 23:39:15 +08:00
|
|
|
if (lowerImageHandleOperand(MI, i, MCOp)) {
|
|
|
|
OutMI.addOperand(MCOp);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-08-06 22:13:27 +08:00
|
|
|
if (lowerOperand(MO, MCOp))
|
|
|
|
OutMI.addOperand(MCOp);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
bool NVPTXAsmPrinter::lowerOperand(const MachineOperand &MO,
|
|
|
|
MCOperand &MCOp) {
|
|
|
|
switch (MO.getType()) {
|
|
|
|
default: llvm_unreachable("unknown operand type");
|
|
|
|
case MachineOperand::MO_Register:
|
|
|
|
MCOp = MCOperand::CreateReg(encodeVirtualRegister(MO.getReg()));
|
|
|
|
break;
|
|
|
|
case MachineOperand::MO_Immediate:
|
|
|
|
MCOp = MCOperand::CreateImm(MO.getImm());
|
|
|
|
break;
|
|
|
|
case MachineOperand::MO_MachineBasicBlock:
|
|
|
|
MCOp = MCOperand::CreateExpr(MCSymbolRefExpr::Create(
|
|
|
|
MO.getMBB()->getSymbol(), OutContext));
|
|
|
|
break;
|
|
|
|
case MachineOperand::MO_ExternalSymbol:
|
2014-04-09 23:39:15 +08:00
|
|
|
MCOp = GetSymbolRef(GetExternalSymbolSymbol(MO.getSymbolName()));
|
2013-08-06 22:13:27 +08:00
|
|
|
break;
|
|
|
|
case MachineOperand::MO_GlobalAddress:
|
2014-04-09 23:39:15 +08:00
|
|
|
MCOp = GetSymbolRef(getSymbol(MO.getGlobal()));
|
2013-08-06 22:13:27 +08:00
|
|
|
break;
|
|
|
|
case MachineOperand::MO_FPImmediate: {
|
|
|
|
const ConstantFP *Cnt = MO.getFPImm();
|
|
|
|
APFloat Val = Cnt->getValueAPF();
|
|
|
|
|
|
|
|
switch (Cnt->getType()->getTypeID()) {
|
|
|
|
default: report_fatal_error("Unsupported FP type"); break;
|
|
|
|
case Type::FloatTyID:
|
|
|
|
MCOp = MCOperand::CreateExpr(
|
|
|
|
NVPTXFloatMCExpr::CreateConstantFPSingle(Val, OutContext));
|
|
|
|
break;
|
|
|
|
case Type::DoubleTyID:
|
|
|
|
MCOp = MCOperand::CreateExpr(
|
|
|
|
NVPTXFloatMCExpr::CreateConstantFPDouble(Val, OutContext));
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
unsigned NVPTXAsmPrinter::encodeVirtualRegister(unsigned Reg) {
|
2013-08-06 22:13:31 +08:00
|
|
|
if (TargetRegisterInfo::isVirtualRegister(Reg)) {
|
|
|
|
const TargetRegisterClass *RC = MRI->getRegClass(Reg);
|
|
|
|
|
|
|
|
DenseMap<unsigned, unsigned> &RegMap = VRegMapping[RC];
|
|
|
|
unsigned RegNum = RegMap[Reg];
|
|
|
|
|
|
|
|
// Encode the register class in the upper 4 bits
|
|
|
|
// Must be kept in sync with NVPTXInstPrinter::printRegName
|
|
|
|
unsigned Ret = 0;
|
|
|
|
if (RC == &NVPTX::Int1RegsRegClass) {
|
|
|
|
Ret = (1 << 28);
|
|
|
|
} else if (RC == &NVPTX::Int16RegsRegClass) {
|
|
|
|
Ret = (2 << 28);
|
|
|
|
} else if (RC == &NVPTX::Int32RegsRegClass) {
|
|
|
|
Ret = (3 << 28);
|
|
|
|
} else if (RC == &NVPTX::Int64RegsRegClass) {
|
|
|
|
Ret = (4 << 28);
|
|
|
|
} else if (RC == &NVPTX::Float32RegsRegClass) {
|
|
|
|
Ret = (5 << 28);
|
|
|
|
} else if (RC == &NVPTX::Float64RegsRegClass) {
|
|
|
|
Ret = (6 << 28);
|
|
|
|
} else {
|
|
|
|
report_fatal_error("Bad register class");
|
|
|
|
}
|
|
|
|
|
|
|
|
// Insert the vreg number
|
|
|
|
Ret |= (RegNum & 0x0FFFFFFF);
|
|
|
|
return Ret;
|
2013-08-06 22:13:27 +08:00
|
|
|
} else {
|
2013-08-06 22:13:31 +08:00
|
|
|
// Some special-use registers are actually physical registers.
|
|
|
|
// Encode this as the register class ID of 0 and the real register ID.
|
|
|
|
return Reg & 0x0FFFFFFF;
|
2013-08-06 22:13:27 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-04-09 23:39:15 +08:00
|
|
|
/// Wrap \p Symbol in a plain (VK_None) symbol-reference expression and
/// return it as an expression operand.
MCOperand NVPTXAsmPrinter::GetSymbolRef(const MCSymbol *Symbol) {
  const MCExpr *SymExpr =
      MCSymbolRefExpr::Create(Symbol, MCSymbolRefExpr::VK_None, OutContext);
  return MCOperand::CreateExpr(SymExpr);
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
void NVPTXAsmPrinter::printReturnValStr(const Function *F, raw_ostream &O) {
|
2015-01-27 03:03:15 +08:00
|
|
|
const DataLayout *TD = TM.getDataLayout();
|
2015-02-19 08:08:14 +08:00
|
|
|
const TargetLowering *TLI = nvptxSubtarget->getTargetLowering();
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
Type *Ty = F->getReturnType();
|
|
|
|
|
2015-02-19 08:08:14 +08:00
|
|
|
bool isABI = (nvptxSubtarget->getSmVersion() >= 20);
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
if (Ty->getTypeID() == Type::VoidTyID)
|
|
|
|
return;
|
|
|
|
|
|
|
|
O << " (";
|
|
|
|
|
|
|
|
if (isABI) {
|
2013-12-08 03:34:20 +08:00
|
|
|
if (Ty->isFloatingPointTy() || Ty->isIntegerTy()) {
|
2012-05-05 04:18:50 +08:00
|
|
|
unsigned size = 0;
|
|
|
|
if (const IntegerType *ITy = dyn_cast<IntegerType>(Ty)) {
|
|
|
|
size = ITy->getBitWidth();
|
2013-03-30 22:29:21 +08:00
|
|
|
if (size < 32)
|
|
|
|
size = 32;
|
2012-05-05 04:18:50 +08:00
|
|
|
} else {
|
2013-03-30 22:29:21 +08:00
|
|
|
assert(Ty->isFloatingPointTy() && "Floating point type expected here");
|
2012-05-05 04:18:50 +08:00
|
|
|
size = Ty->getPrimitiveSizeInBits();
|
|
|
|
}
|
|
|
|
|
|
|
|
O << ".param .b" << size << " func_retval0";
|
2013-03-30 22:29:21 +08:00
|
|
|
} else if (isa<PointerType>(Ty)) {
|
2012-05-05 04:18:50 +08:00
|
|
|
O << ".param .b" << TLI->getPointerTy().getSizeInBits()
|
2013-03-30 22:29:21 +08:00
|
|
|
<< " func_retval0";
|
2015-01-05 18:15:49 +08:00
|
|
|
} else if ((Ty->getTypeID() == Type::StructTyID) || isa<VectorType>(Ty)) {
|
|
|
|
unsigned totalsz = TD->getTypeAllocSize(Ty);
|
|
|
|
unsigned retAlignment = 0;
|
|
|
|
if (!llvm::getAlign(*F, 0, retAlignment))
|
|
|
|
retAlignment = TD->getABITypeAlignment(Ty);
|
|
|
|
O << ".param .align " << retAlignment << " .b8 func_retval0[" << totalsz
|
|
|
|
<< "]";
|
|
|
|
} else
|
|
|
|
llvm_unreachable("Unknown return type");
|
2012-05-05 04:18:50 +08:00
|
|
|
} else {
|
|
|
|
SmallVector<EVT, 16> vtparts;
|
|
|
|
ComputeValueVTs(*TLI, Ty, vtparts);
|
|
|
|
unsigned idx = 0;
|
2013-03-30 22:29:21 +08:00
|
|
|
for (unsigned i = 0, e = vtparts.size(); i != e; ++i) {
|
2012-05-05 04:18:50 +08:00
|
|
|
unsigned elems = 1;
|
|
|
|
EVT elemtype = vtparts[i];
|
|
|
|
if (vtparts[i].isVector()) {
|
|
|
|
elems = vtparts[i].getVectorNumElements();
|
|
|
|
elemtype = vtparts[i].getVectorElementType();
|
|
|
|
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
for (unsigned j = 0, je = elems; j != je; ++j) {
|
2012-05-05 04:18:50 +08:00
|
|
|
unsigned sz = elemtype.getSizeInBits();
|
2013-03-30 22:29:21 +08:00
|
|
|
if (elemtype.isInteger() && (sz < 32))
|
|
|
|
sz = 32;
|
2012-05-05 04:18:50 +08:00
|
|
|
O << ".reg .b" << sz << " func_retval" << idx;
|
2013-03-30 22:29:21 +08:00
|
|
|
if (j < je - 1)
|
|
|
|
O << ", ";
|
2012-05-05 04:18:50 +08:00
|
|
|
++idx;
|
|
|
|
}
|
2013-03-30 22:29:21 +08:00
|
|
|
if (i < e - 1)
|
2012-05-05 04:18:50 +08:00
|
|
|
O << ", ";
|
|
|
|
}
|
|
|
|
}
|
|
|
|
O << ") ";
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::printReturnValStr(const MachineFunction &MF,
|
|
|
|
raw_ostream &O) {
|
|
|
|
const Function *F = MF.getFunction();
|
|
|
|
printReturnValStr(F, O);
|
|
|
|
}
|
|
|
|
|
2015-02-01 10:27:45 +08:00
|
|
|
// Return true if MBB is the header of a loop marked with
|
|
|
|
// llvm.loop.unroll.disable.
|
2015-02-04 01:57:38 +08:00
|
|
|
// TODO: consider "#pragma unroll 1" which is equivalent to "#pragma nounroll".
|
2015-02-01 10:27:45 +08:00
|
|
|
bool NVPTXAsmPrinter::isLoopHeaderOfNoUnroll(
|
|
|
|
const MachineBasicBlock &MBB) const {
|
|
|
|
MachineLoopInfo &LI = getAnalysis<MachineLoopInfo>();
|
2015-02-04 01:57:38 +08:00
|
|
|
// TODO: isLoopHeader() should take "const MachineBasicBlock *".
|
2015-02-01 10:27:45 +08:00
|
|
|
// We insert .pragma "nounroll" only to the loop header.
|
|
|
|
if (!LI.isLoopHeader(const_cast<MachineBasicBlock *>(&MBB)))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
// llvm.loop.unroll.disable is marked on the back edges of a loop. Therefore,
|
|
|
|
// we iterate through each back edge of the loop with header MBB, and check
|
|
|
|
// whether its metadata contains llvm.loop.unroll.disable.
|
|
|
|
for (auto I = MBB.pred_begin(); I != MBB.pred_end(); ++I) {
|
|
|
|
const MachineBasicBlock *PMBB = *I;
|
|
|
|
if (LI.getLoopFor(PMBB) != LI.getLoopFor(&MBB)) {
|
|
|
|
// Edges from other loops to MBB are not back edges.
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
if (const BasicBlock *PBB = PMBB->getBasicBlock()) {
|
2015-02-03 04:41:11 +08:00
|
|
|
if (MDNode *LoopID = PBB->getTerminator()->getMetadata("llvm.loop")) {
|
2015-02-01 10:27:45 +08:00
|
|
|
if (GetUnrollMetadata(LoopID, "llvm.loop.unroll.disable"))
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::EmitBasicBlockStart(const MachineBasicBlock &MBB) const {
|
|
|
|
AsmPrinter::EmitBasicBlockStart(MBB);
|
|
|
|
if (isLoopHeaderOfNoUnroll(MBB))
|
2015-04-25 03:11:51 +08:00
|
|
|
OutStreamer->EmitRawText(StringRef("\t.pragma \"nounroll\";\n"));
|
2015-02-01 10:27:45 +08:00
|
|
|
}
|
|
|
|
|
2012-05-05 04:18:50 +08:00
|
|
|
void NVPTXAsmPrinter::EmitFunctionEntryLabel() {
|
|
|
|
SmallString<128> Str;
|
|
|
|
raw_svector_ostream O(Str);
|
|
|
|
|
2013-05-20 20:13:32 +08:00
|
|
|
if (!GlobalsEmitted) {
|
|
|
|
emitGlobals(*MF->getFunction()->getParent());
|
|
|
|
GlobalsEmitted = true;
|
|
|
|
}
|
|
|
|
|
2012-05-05 04:18:50 +08:00
|
|
|
// Set up
|
|
|
|
MRI = &MF->getRegInfo();
|
|
|
|
F = MF->getFunction();
|
2013-03-30 22:29:21 +08:00
|
|
|
emitLinkageDirective(F, O);
|
2012-05-05 04:18:50 +08:00
|
|
|
if (llvm::isKernelFunction(*F))
|
|
|
|
O << ".entry ";
|
|
|
|
else {
|
|
|
|
O << ".func ";
|
|
|
|
printReturnValStr(*MF, O);
|
|
|
|
}
|
|
|
|
|
|
|
|
O << *CurrentFnSym;
|
|
|
|
|
|
|
|
emitFunctionParamList(*MF, O);
|
|
|
|
|
|
|
|
if (llvm::isKernelFunction(*F))
|
|
|
|
emitKernelFunctionDirectives(*F, O);
|
|
|
|
|
2015-04-25 03:11:51 +08:00
|
|
|
OutStreamer->EmitRawText(O.str());
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
prevDebugLoc = DebugLoc();
|
|
|
|
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::EmitFunctionBodyStart() {
|
2013-05-31 20:14:49 +08:00
|
|
|
VRegMapping.clear();
|
2015-04-25 03:11:51 +08:00
|
|
|
OutStreamer->EmitRawText(StringRef("{\n"));
|
2012-05-05 04:18:50 +08:00
|
|
|
setAndEmitFunctionVirtualRegisters(*MF);
|
|
|
|
|
|
|
|
SmallString<128> Str;
|
|
|
|
raw_svector_ostream O(Str);
|
|
|
|
emitDemotedVars(MF->getFunction(), O);
|
2015-04-25 03:11:51 +08:00
|
|
|
OutStreamer->EmitRawText(O.str());
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::EmitFunctionBodyEnd() {
|
2015-04-25 03:11:51 +08:00
|
|
|
OutStreamer->EmitRawText(StringRef("}\n"));
|
2013-05-31 20:14:49 +08:00
|
|
|
VRegMapping.clear();
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
2013-10-11 20:39:36 +08:00
|
|
|
void NVPTXAsmPrinter::emitImplicitDef(const MachineInstr *MI) const {
|
|
|
|
unsigned RegNo = MI->getOperand(0).getReg();
|
2015-03-25 07:37:10 +08:00
|
|
|
if (TargetRegisterInfo::isVirtualRegister(RegNo)) {
|
2015-04-25 03:11:51 +08:00
|
|
|
OutStreamer->AddComment(Twine("implicit-def: ") +
|
|
|
|
getVirtualRegisterName(RegNo));
|
2013-10-11 20:39:36 +08:00
|
|
|
} else {
|
2015-04-25 03:11:51 +08:00
|
|
|
OutStreamer->AddComment(Twine("implicit-def: ") +
|
|
|
|
nvptxSubtarget->getRegisterInfo()->getName(RegNo));
|
2013-10-11 20:39:36 +08:00
|
|
|
}
|
2015-04-25 03:11:51 +08:00
|
|
|
OutStreamer->AddBlankLine();
|
2013-10-11 20:39:36 +08:00
|
|
|
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
void NVPTXAsmPrinter::emitKernelFunctionDirectives(const Function &F,
|
|
|
|
raw_ostream &O) const {
|
2012-05-05 04:18:50 +08:00
|
|
|
// If the NVVM IR has some of reqntid* specified, then output
|
|
|
|
// the reqntid directive, and set the unspecified ones to 1.
|
|
|
|
// If none of reqntid* is specified, don't output reqntid directive.
|
|
|
|
unsigned reqntidx, reqntidy, reqntidz;
|
|
|
|
bool specified = false;
|
2015-03-24 00:26:23 +08:00
|
|
|
if (!llvm::getReqNTIDx(F, reqntidx))
|
2013-03-30 22:29:21 +08:00
|
|
|
reqntidx = 1;
|
|
|
|
else
|
|
|
|
specified = true;
|
2015-03-24 00:26:23 +08:00
|
|
|
if (!llvm::getReqNTIDy(F, reqntidy))
|
2013-03-30 22:29:21 +08:00
|
|
|
reqntidy = 1;
|
|
|
|
else
|
|
|
|
specified = true;
|
2015-03-24 00:26:23 +08:00
|
|
|
if (!llvm::getReqNTIDz(F, reqntidz))
|
2013-03-30 22:29:21 +08:00
|
|
|
reqntidz = 1;
|
|
|
|
else
|
|
|
|
specified = true;
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
if (specified)
|
2013-03-30 22:29:21 +08:00
|
|
|
O << ".reqntid " << reqntidx << ", " << reqntidy << ", " << reqntidz
|
|
|
|
<< "\n";
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
// If the NVVM IR has some of maxntid* specified, then output
|
|
|
|
// the maxntid directive, and set the unspecified ones to 1.
|
|
|
|
// If none of maxntid* is specified, don't output maxntid directive.
|
|
|
|
unsigned maxntidx, maxntidy, maxntidz;
|
|
|
|
specified = false;
|
2015-03-24 00:26:23 +08:00
|
|
|
if (!llvm::getMaxNTIDx(F, maxntidx))
|
2013-03-30 22:29:21 +08:00
|
|
|
maxntidx = 1;
|
|
|
|
else
|
|
|
|
specified = true;
|
2015-03-24 00:26:23 +08:00
|
|
|
if (!llvm::getMaxNTIDy(F, maxntidy))
|
2013-03-30 22:29:21 +08:00
|
|
|
maxntidy = 1;
|
|
|
|
else
|
|
|
|
specified = true;
|
2015-03-24 00:26:23 +08:00
|
|
|
if (!llvm::getMaxNTIDz(F, maxntidz))
|
2013-03-30 22:29:21 +08:00
|
|
|
maxntidz = 1;
|
|
|
|
else
|
|
|
|
specified = true;
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
if (specified)
|
2013-03-30 22:29:21 +08:00
|
|
|
O << ".maxntid " << maxntidx << ", " << maxntidy << ", " << maxntidz
|
|
|
|
<< "\n";
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
unsigned mincta;
|
|
|
|
if (llvm::getMinCTASm(F, mincta))
|
|
|
|
O << ".minnctapersm " << mincta << "\n";
|
|
|
|
}
|
|
|
|
|
2013-10-11 20:39:36 +08:00
|
|
|
std::string
|
|
|
|
NVPTXAsmPrinter::getVirtualRegisterName(unsigned Reg) const {
|
|
|
|
const TargetRegisterClass *RC = MRI->getRegClass(Reg);
|
|
|
|
|
|
|
|
std::string Name;
|
|
|
|
raw_string_ostream NameStr(Name);
|
2012-05-05 04:18:50 +08:00
|
|
|
|
2013-10-11 20:39:36 +08:00
|
|
|
VRegRCMap::const_iterator I = VRegMapping.find(RC);
|
|
|
|
assert(I != VRegMapping.end() && "Bad register class");
|
|
|
|
const DenseMap<unsigned, unsigned> &RegMap = I->second;
|
2012-05-05 04:18:50 +08:00
|
|
|
|
2013-10-11 20:39:36 +08:00
|
|
|
VRegMap::const_iterator VI = RegMap.find(Reg);
|
|
|
|
assert(VI != RegMap.end() && "Bad virtual register");
|
|
|
|
unsigned MappedVR = VI->second;
|
|
|
|
|
|
|
|
NameStr << getNVPTXRegClassStr(RC) << MappedVR;
|
|
|
|
|
|
|
|
NameStr.flush();
|
|
|
|
return Name;
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
2013-10-11 20:39:36 +08:00
|
|
|
void NVPTXAsmPrinter::emitVirtualRegister(unsigned int vr,
|
2013-03-30 22:29:21 +08:00
|
|
|
raw_ostream &O) {
|
2013-10-11 20:39:36 +08:00
|
|
|
O << getVirtualRegisterName(vr);
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
void NVPTXAsmPrinter::printVecModifiedImmediate(
|
|
|
|
const MachineOperand &MO, const char *Modifier, raw_ostream &O) {
|
|
|
|
static const char vecelem[] = { '0', '1', '2', '3', '0', '1', '2', '3' };
|
|
|
|
int Imm = (int) MO.getImm();
|
|
|
|
if (0 == strcmp(Modifier, "vecelem"))
|
2012-05-05 04:18:50 +08:00
|
|
|
O << "_" << vecelem[Imm];
|
2013-03-30 22:29:21 +08:00
|
|
|
else if (0 == strcmp(Modifier, "vecv4comm1")) {
|
|
|
|
if ((Imm < 0) || (Imm > 3))
|
2012-05-05 04:18:50 +08:00
|
|
|
O << "//";
|
2013-03-30 22:29:21 +08:00
|
|
|
} else if (0 == strcmp(Modifier, "vecv4comm2")) {
|
|
|
|
if ((Imm < 4) || (Imm > 7))
|
2012-05-05 04:18:50 +08:00
|
|
|
O << "//";
|
2013-03-30 22:29:21 +08:00
|
|
|
} else if (0 == strcmp(Modifier, "vecv4pos")) {
|
|
|
|
if (Imm < 0)
|
|
|
|
Imm = 0;
|
|
|
|
O << "_" << vecelem[Imm % 4];
|
|
|
|
} else if (0 == strcmp(Modifier, "vecv2comm1")) {
|
|
|
|
if ((Imm < 0) || (Imm > 1))
|
2012-05-05 04:18:50 +08:00
|
|
|
O << "//";
|
2013-03-30 22:29:21 +08:00
|
|
|
} else if (0 == strcmp(Modifier, "vecv2comm2")) {
|
|
|
|
if ((Imm < 2) || (Imm > 3))
|
2012-05-05 04:18:50 +08:00
|
|
|
O << "//";
|
2013-03-30 22:29:21 +08:00
|
|
|
} else if (0 == strcmp(Modifier, "vecv2pos")) {
|
|
|
|
if (Imm < 0)
|
|
|
|
Imm = 0;
|
|
|
|
O << "_" << vecelem[Imm % 2];
|
|
|
|
} else
|
2012-05-24 15:02:50 +08:00
|
|
|
llvm_unreachable("Unknown Modifier on immediate operand");
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
2013-06-29 01:58:04 +08:00
|
|
|
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
void NVPTXAsmPrinter::emitDeclaration(const Function *F, raw_ostream &O) {
|
2012-05-05 04:18:50 +08:00
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
emitLinkageDirective(F, O);
|
2012-05-05 04:18:50 +08:00
|
|
|
if (llvm::isKernelFunction(*F))
|
|
|
|
O << ".entry ";
|
|
|
|
else
|
|
|
|
O << ".func ";
|
|
|
|
printReturnValStr(F, O);
|
2014-04-01 00:11:57 +08:00
|
|
|
O << *getSymbol(F) << "\n";
|
2012-05-05 04:18:50 +08:00
|
|
|
emitFunctionParamList(F, O);
|
|
|
|
O << ";\n";
|
|
|
|
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
static bool usedInGlobalVarDef(const Constant *C) {
|
2012-05-05 04:18:50 +08:00
|
|
|
if (!C)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (const GlobalVariable *GV = dyn_cast<GlobalVariable>(C)) {
|
2015-03-30 23:42:36 +08:00
|
|
|
if (GV->getName() == "llvm.used")
|
2012-05-05 04:18:50 +08:00
|
|
|
return false;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2014-03-09 11:16:01 +08:00
|
|
|
for (const User *U : C->users())
|
|
|
|
if (const Constant *C = dyn_cast<Constant>(U))
|
|
|
|
if (usedInGlobalVarDef(C))
|
|
|
|
return true;
|
|
|
|
|
2012-05-05 04:18:50 +08:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
static bool usedInOneFunc(const User *U, Function const *&oneFunc) {
|
2012-05-05 04:18:50 +08:00
|
|
|
if (const GlobalVariable *othergv = dyn_cast<GlobalVariable>(U)) {
|
2015-03-30 23:42:36 +08:00
|
|
|
if (othergv->getName() == "llvm.used")
|
2012-05-05 04:18:50 +08:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (const Instruction *instr = dyn_cast<Instruction>(U)) {
|
|
|
|
if (instr->getParent() && instr->getParent()->getParent()) {
|
|
|
|
const Function *curFunc = instr->getParent()->getParent();
|
|
|
|
if (oneFunc && (curFunc != oneFunc))
|
|
|
|
return false;
|
|
|
|
oneFunc = curFunc;
|
|
|
|
return true;
|
2013-03-30 22:29:21 +08:00
|
|
|
} else
|
2012-05-05 04:18:50 +08:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2014-03-09 11:16:01 +08:00
|
|
|
for (const User *UU : U->users())
|
2015-03-24 00:26:23 +08:00
|
|
|
if (!usedInOneFunc(UU, oneFunc))
|
2012-05-05 04:18:50 +08:00
|
|
|
return false;
|
2014-03-09 11:16:01 +08:00
|
|
|
|
2012-05-05 04:18:50 +08:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Find out if a global variable can be demoted to local scope.
|
|
|
|
* Currently, this is valid for CUDA shared variables, which have local
|
|
|
|
* scope and global lifetime. So the conditions to check are :
|
|
|
|
* 1. Is the global variable in shared address space?
|
|
|
|
* 2. Does it have internal linkage?
|
|
|
|
* 3. Is the global variable referenced only in one function?
|
|
|
|
*/
|
|
|
|
static bool canDemoteGlobalVar(const GlobalVariable *gv, Function const *&f) {
|
2015-03-24 00:26:23 +08:00
|
|
|
if (!gv->hasInternalLinkage())
|
2012-05-05 04:18:50 +08:00
|
|
|
return false;
|
|
|
|
const PointerType *Pty = gv->getType();
|
|
|
|
if (Pty->getAddressSpace() != llvm::ADDRESS_SPACE_SHARED)
|
|
|
|
return false;
|
|
|
|
|
2014-04-25 13:30:21 +08:00
|
|
|
const Function *oneFunc = nullptr;
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
bool flag = usedInOneFunc(gv, oneFunc);
|
2015-03-24 00:26:23 +08:00
|
|
|
if (!flag)
|
2012-05-05 04:18:50 +08:00
|
|
|
return false;
|
|
|
|
if (!oneFunc)
|
|
|
|
return false;
|
|
|
|
f = oneFunc;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool useFuncSeen(const Constant *C,
|
|
|
|
llvm::DenseMap<const Function *, bool> &seenMap) {
|
2014-03-09 11:16:01 +08:00
|
|
|
for (const User *U : C->users()) {
|
|
|
|
if (const Constant *cu = dyn_cast<Constant>(U)) {
|
2012-05-05 04:18:50 +08:00
|
|
|
if (useFuncSeen(cu, seenMap))
|
|
|
|
return true;
|
2014-03-09 11:16:01 +08:00
|
|
|
} else if (const Instruction *I = dyn_cast<Instruction>(U)) {
|
2012-05-05 04:18:50 +08:00
|
|
|
const BasicBlock *bb = I->getParent();
|
2013-03-30 22:29:21 +08:00
|
|
|
if (!bb)
|
|
|
|
continue;
|
2012-05-05 04:18:50 +08:00
|
|
|
const Function *caller = bb->getParent();
|
2013-03-30 22:29:21 +08:00
|
|
|
if (!caller)
|
|
|
|
continue;
|
2012-05-05 04:18:50 +08:00
|
|
|
if (seenMap.find(caller) != seenMap.end())
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2013-05-20 20:13:32 +08:00
|
|
|
void NVPTXAsmPrinter::emitDeclarations(const Module &M, raw_ostream &O) {
|
2012-05-05 04:18:50 +08:00
|
|
|
llvm::DenseMap<const Function *, bool> seenMap;
|
2013-03-30 22:29:21 +08:00
|
|
|
for (Module::const_iterator FI = M.begin(), FE = M.end(); FI != FE; ++FI) {
|
2012-05-05 04:18:50 +08:00
|
|
|
const Function *F = FI;
|
|
|
|
|
|
|
|
if (F->isDeclaration()) {
|
|
|
|
if (F->use_empty())
|
|
|
|
continue;
|
|
|
|
if (F->getIntrinsicID())
|
|
|
|
continue;
|
|
|
|
emitDeclaration(F, O);
|
|
|
|
continue;
|
|
|
|
}
|
2014-03-09 11:16:01 +08:00
|
|
|
for (const User *U : F->users()) {
|
|
|
|
if (const Constant *C = dyn_cast<Constant>(U)) {
|
2012-05-05 04:18:50 +08:00
|
|
|
if (usedInGlobalVarDef(C)) {
|
|
|
|
// The use is in the initialization of a global variable
|
|
|
|
// that is a function pointer, so print a declaration
|
|
|
|
// for the original function
|
|
|
|
emitDeclaration(F, O);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
// Emit a declaration of this function if the function that
|
|
|
|
// uses this constant expr has already been seen.
|
|
|
|
if (useFuncSeen(C, seenMap)) {
|
|
|
|
emitDeclaration(F, O);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-03-09 11:16:01 +08:00
|
|
|
if (!isa<Instruction>(U))
|
2013-03-30 22:29:21 +08:00
|
|
|
continue;
|
2014-03-09 11:16:01 +08:00
|
|
|
const Instruction *instr = cast<Instruction>(U);
|
2012-05-05 04:18:50 +08:00
|
|
|
const BasicBlock *bb = instr->getParent();
|
2013-03-30 22:29:21 +08:00
|
|
|
if (!bb)
|
|
|
|
continue;
|
2012-05-05 04:18:50 +08:00
|
|
|
const Function *caller = bb->getParent();
|
2013-03-30 22:29:21 +08:00
|
|
|
if (!caller)
|
|
|
|
continue;
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
// If a caller has already been seen, then the caller is
|
|
|
|
// appearing in the module before the callee. so print out
|
|
|
|
// a declaration for the callee.
|
|
|
|
if (seenMap.find(caller) != seenMap.end()) {
|
|
|
|
emitDeclaration(F, O);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
seenMap[F] = true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Assign a 1-based index to every distinct source file named by the module's
// debug info and remember it in filenameMap. Files coming from compile units
// additionally get a dwarf file directive; files that are only reached via
// subprograms are recorded but no directive is emitted for them.
void NVPTXAsmPrinter::recordAndEmitFilenames(Module &M) {
  DebugInfoFinder DbgFinder;
  DbgFinder.processModule(M);

  unsigned NextIndex = 1;

  // Shared worker for both loops below: resolve the path, skip it if it is
  // already known, otherwise record it under the next free index.
  auto recordFile = [&](StringRef Filename, StringRef Dirname,
                        bool EmitDirective) {
    // A relative file name is resolved against its directory when one is
    // given. FullPathName backs Filename for the remainder of this call.
    SmallString<128> FullPathName = Dirname;
    if (!Dirname.empty() && !sys::path::is_absolute(Filename)) {
      sys::path::append(FullPathName, Filename);
      Filename = FullPathName;
    }

    if (filenameMap.find(Filename) != filenameMap.end())
      return;

    filenameMap[Filename] = NextIndex;
    if (EmitDirective)
      OutStreamer->EmitDwarfFileDirective(NextIndex, "", Filename);
    ++NextIndex;
  };

  for (const MDCompileUnit *DIUnit : DbgFinder.compile_units())
    recordFile(DIUnit->getFilename(), DIUnit->getDirectory(), true);

  for (MDSubprogram *SP : DbgFinder.subprograms())
    recordFile(SP->getFilename(), SP->getDirectory(), false);
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
// Module-level set-up for the NVPTX printer: emits the PTX header, any
// module-level inline asm and (for non-NVCL targets) the file name table.
// Always returns false, which signals success.
//
// Note that AsmPrinter::doInitialization(M) is deliberately not called here;
// the pieces this printer needs (MachineModuleInfo, the object file lowering
// and the Mangler) are set up by hand below.
bool NVPTXAsmPrinter::doInitialization(Module &M) {
  // Construct a default subtarget off of the TargetMachine defaults. The
  // rest of NVPTX isn't friendly to change subtargets per function and
  // so the default TargetMachine will have all of the options.
  const NVPTXTargetMachine &NTM = static_cast<const NVPTXTargetMachine &>(TM);
  StringRef TT = TM.getTargetTriple();
  StringRef CPU = TM.getTargetCPU();
  StringRef FS = TM.getTargetFeatureString();
  const NVPTXSubtarget STI(TT, CPU, FS, NTM);

  MMI = getAnalysisIfAvailable<MachineModuleInfo>();
  MMI->AnalyzeModule(M);

  // Initialize TargetLoweringObjectFile.
  const_cast<TargetLoweringObjectFile &>(getObjFileLowering())
      .Initialize(OutContext, TM);

  Mang = new Mangler(TM.getDataLayout());

  // Emit header before any dwarf directives are emitted below.
  SmallString<128> HeaderText;
  raw_svector_ostream HeaderOS(HeaderText);
  emitHeader(M, HeaderOS, STI);
  OutStreamer->EmitRawText(HeaderOS.str());

  // Emit module-level inline asm if it exists.
  StringRef InlineAsm(M.getModuleInlineAsm());
  if (!InlineAsm.empty()) {
    OutStreamer->AddComment("Start of file scope inline assembly");
    OutStreamer->AddBlankLine();
    OutStreamer->EmitRawText(InlineAsm);
    OutStreamer->AddBlankLine();
    OutStreamer->AddComment("End of file scope inline assembly");
    OutStreamer->AddBlankLine();
  }

  // If we're not NVCL we're CUDA, go ahead and emit filenames.
  const bool IsNVCL = Triple(TT).getOS() == Triple::NVCL;
  if (!IsNVCL)
    recordAndEmitFilenames(M);

  GlobalsEmitted = false;

  return false; // success
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::emitGlobals(const Module &M) {
|
2012-05-05 04:18:50 +08:00
|
|
|
SmallString<128> Str2;
|
|
|
|
raw_svector_ostream OS2(Str2);
|
|
|
|
|
|
|
|
emitDeclarations(M, OS2);
|
|
|
|
|
2012-11-17 05:03:51 +08:00
|
|
|
// As ptxas does not support forward references of globals, we need to first
|
|
|
|
// sort the list of module-level globals in def-use order. We visit each
|
|
|
|
// global variable in order, and ensure that we emit it *after* its dependent
|
|
|
|
// globals. We use a little extra memory maintaining both a set and a list to
|
|
|
|
// have fast searches while maintaining a strict ordering.
|
2013-05-20 20:13:32 +08:00
|
|
|
SmallVector<const GlobalVariable *, 8> Globals;
|
|
|
|
DenseSet<const GlobalVariable *> GVVisited;
|
|
|
|
DenseSet<const GlobalVariable *> GVVisiting;
|
2012-11-17 05:03:51 +08:00
|
|
|
|
|
|
|
// Visit each global variable, in order
|
2013-05-20 20:13:32 +08:00
|
|
|
for (Module::const_global_iterator I = M.global_begin(), E = M.global_end();
|
|
|
|
I != E; ++I)
|
2012-11-17 05:03:51 +08:00
|
|
|
VisitGlobalVariableForEmission(I, Globals, GVVisited, GVVisiting);
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
assert(GVVisited.size() == M.getGlobalList().size() &&
|
2012-11-17 05:03:51 +08:00
|
|
|
"Missed a global variable");
|
|
|
|
assert(GVVisiting.size() == 0 && "Did not fully process a global variable");
|
|
|
|
|
|
|
|
// Print out module-level global variables in proper order
|
|
|
|
for (unsigned i = 0, e = Globals.size(); i != e; ++i)
|
|
|
|
printModuleLevelGV(Globals[i], OS2);
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
OS2 << '\n';
|
|
|
|
|
2015-04-25 03:11:51 +08:00
|
|
|
OutStreamer->EmitRawText(OS2.str());
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
2015-02-19 08:08:14 +08:00
|
|
|
// Write the PTX module preamble to O: a banner comment, then the .version,
// .target and .address_size directives derived from the subtarget STI and
// the target machine.
void NVPTXAsmPrinter::emitHeader(Module &M, raw_ostream &O,
                                 const NVPTXSubtarget &STI) {
  O << "//\n"
    << "// Generated by LLVM NVPTX Back-End\n"
    << "//\n"
    << "\n";

  // getPTXVersion() packs major and minor as major * 10 + minor.
  const unsigned PTXVersion = STI.getPTXVersion();
  O << ".version " << (PTXVersion / 10) << "." << (PTXVersion % 10) << "\n";

  O << ".target " << STI.getTargetName();

  // Optional, comma separated .target modifiers.
  const NVPTXTargetMachine &NTM = static_cast<const NVPTXTargetMachine &>(TM);
  if (NTM.getDrvInterface() == NVPTX::NVCL)
    O << ", texmode_independent";
  else if (!STI.hasDouble())
    O << ", map_f64_to_f32";

  if (MAI->doesSupportDebugInformation())
    O << ", debug";

  O << "\n";

  O << ".address_size " << (NTM.is64Bit() ? "64" : "32") << "\n";

  O << "\n";
}
|
|
|
|
|
|
|
|
// Finish printing module M.
//
// Global variables are emitted by this printer itself (see emitGlobals), so
// they are temporarily unlinked from the module while the generic
// AsmPrinter::doFinalization runs; otherwise it would emit them a second
// time. They are re-inserted, in their original order, before returning.
//
// Returns whatever AsmPrinter::doFinalization returned.
//
// NOTE: an alternative would be to clone the parent's doFinalization and
// customize it here instead of hiding the globals from it; the same applies
// to doInitialization.
bool NVPTXAsmPrinter::doFinalization(Module &M) {
  // If we did not emit any functions, then the global declarations have not
  // yet been emitted.
  if (!GlobalsEmitted) {
    emitGlobals(M);
    GlobalsEmitted = true;
  }

  // XXX Temporarily remove global variables so that doFinalization() will not
  // emit them again (global variables are emitted at beginning).
  Module::GlobalListType &global_list = M.getGlobalList();

  // First, back up the GlobalVariable pointers. A SmallVector owns the
  // storage, so there is no manual new[]/delete[] pairing to keep in sync.
  SmallVector<GlobalVariable *, 16> SavedGlobals;
  SavedGlobals.reserve(global_list.size());
  for (Module::global_iterator I = global_list.begin(), E = global_list.end();
       I != E; ++I)
    SavedGlobals.push_back(&*I);

  // Second, empty global_list. remove() only unlinks a node; the variables
  // themselves stay alive and are still referenced from SavedGlobals.
  while (!global_list.empty())
    global_list.remove(global_list.begin());

  // Call the generic doFinalization on the now global-free module.
  bool ret = AsmPrinter::doFinalization(M);

  // Now we restore the global variables in their original order.
  for (GlobalVariable *GV : SavedGlobals)
    global_list.insert(global_list.end(), GV);

  clearAnnotationCache(&M);

  return ret;
}
|
|
|
|
|
|
|
|
// This function emits appropriate linkage directives for
|
|
|
|
// functions and global variables.
|
|
|
|
//
|
|
|
|
// extern function declaration -> .extern
|
|
|
|
// extern function definition -> .visible
|
|
|
|
// external global variable with init -> .visible
|
|
|
|
// external without init -> .extern
|
|
|
|
// appending -> not allowed, assert.
|
2014-06-28 02:35:10 +08:00
|
|
|
// for any linkage other than
|
|
|
|
// internal, private, linker_private,
|
|
|
|
// linker_private_weak, linker_private_weak_def_auto,
|
|
|
|
// we emit -> .weak.
|
2012-05-05 04:18:50 +08:00
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
void NVPTXAsmPrinter::emitLinkageDirective(const GlobalValue *V,
|
|
|
|
raw_ostream &O) {
|
2015-02-19 08:08:23 +08:00
|
|
|
if (static_cast<NVPTXTargetMachine &>(TM).getDrvInterface() == NVPTX::CUDA) {
|
2012-05-05 04:18:50 +08:00
|
|
|
if (V->hasExternalLinkage()) {
|
|
|
|
if (isa<GlobalVariable>(V)) {
|
|
|
|
const GlobalVariable *GVar = cast<GlobalVariable>(V);
|
|
|
|
if (GVar) {
|
|
|
|
if (GVar->hasInitializer())
|
|
|
|
O << ".visible ";
|
|
|
|
else
|
|
|
|
O << ".extern ";
|
|
|
|
}
|
|
|
|
} else if (V->isDeclaration())
|
|
|
|
O << ".extern ";
|
|
|
|
else
|
|
|
|
O << ".visible ";
|
|
|
|
} else if (V->hasAppendingLinkage()) {
|
|
|
|
std::string msg;
|
|
|
|
msg.append("Error: ");
|
|
|
|
msg.append("Symbol ");
|
|
|
|
if (V->hasName())
|
2015-03-30 23:42:36 +08:00
|
|
|
msg.append(V->getName());
|
2012-05-05 04:18:50 +08:00
|
|
|
msg.append("has unsupported appending linkage type");
|
|
|
|
llvm_unreachable(msg.c_str());
|
2014-06-28 02:35:10 +08:00
|
|
|
} else if (!V->hasInternalLinkage() &&
|
|
|
|
!V->hasPrivateLinkage()) {
|
|
|
|
O << ".weak ";
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-05-20 20:13:32 +08:00
|
|
|
void NVPTXAsmPrinter::printModuleLevelGV(const GlobalVariable *GVar,
|
|
|
|
raw_ostream &O,
|
2012-05-05 04:18:50 +08:00
|
|
|
bool processDemoted) {
|
|
|
|
|
|
|
|
// Skip meta data
|
|
|
|
if (GVar->hasSection()) {
|
2014-06-03 10:41:57 +08:00
|
|
|
if (GVar->getSection() == StringRef("llvm.metadata"))
|
2012-05-05 04:18:50 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2014-06-28 02:35:53 +08:00
|
|
|
// Skip LLVM intrinsic global variables
|
|
|
|
if (GVar->getName().startswith("llvm.") ||
|
|
|
|
GVar->getName().startswith("nvvm."))
|
|
|
|
return;
|
|
|
|
|
2015-01-27 03:03:15 +08:00
|
|
|
const DataLayout *TD = TM.getDataLayout();
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
// GlobalVariables are always constant pointers themselves.
|
|
|
|
const PointerType *PTy = GVar->getType();
|
|
|
|
Type *ETy = PTy->getElementType();
|
|
|
|
|
|
|
|
if (GVar->hasExternalLinkage()) {
|
|
|
|
if (GVar->hasInitializer())
|
|
|
|
O << ".visible ";
|
|
|
|
else
|
|
|
|
O << ".extern ";
|
2014-06-28 02:35:56 +08:00
|
|
|
} else if (GVar->hasLinkOnceLinkage() || GVar->hasWeakLinkage() ||
|
|
|
|
GVar->hasAvailableExternallyLinkage() ||
|
|
|
|
GVar->hasCommonLinkage()) {
|
|
|
|
O << ".weak ";
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if (llvm::isTexture(*GVar)) {
|
|
|
|
O << ".global .texref " << llvm::getTextureName(*GVar) << ";\n";
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (llvm::isSurface(*GVar)) {
|
|
|
|
O << ".global .surfref " << llvm::getSurfaceName(*GVar) << ";\n";
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (GVar->isDeclaration()) {
|
|
|
|
// (extern) declarations, no definition or initializer
|
|
|
|
// Currently the only known declaration is for an automatic __local
|
|
|
|
// (.shared) promoted to global.
|
|
|
|
emitPTXGlobalVariable(GVar, O);
|
|
|
|
O << ";\n";
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (llvm::isSampler(*GVar)) {
|
|
|
|
O << ".global .samplerref " << llvm::getSamplerName(*GVar);
|
|
|
|
|
2014-04-25 13:30:21 +08:00
|
|
|
const Constant *Initializer = nullptr;
|
2012-05-05 04:18:50 +08:00
|
|
|
if (GVar->hasInitializer())
|
|
|
|
Initializer = GVar->getInitializer();
|
2014-04-25 13:30:21 +08:00
|
|
|
const ConstantInt *CI = nullptr;
|
2012-05-05 04:18:50 +08:00
|
|
|
if (Initializer)
|
|
|
|
CI = dyn_cast<ConstantInt>(Initializer);
|
|
|
|
if (CI) {
|
2013-03-30 22:29:21 +08:00
|
|
|
unsigned sample = CI->getZExtValue();
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
O << " = { ";
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
for (int i = 0,
|
|
|
|
addr = ((sample & __CLK_ADDRESS_MASK) >> __CLK_ADDRESS_BASE);
|
|
|
|
i < 3; i++) {
|
2012-05-05 04:18:50 +08:00
|
|
|
O << "addr_mode_" << i << " = ";
|
|
|
|
switch (addr) {
|
2013-03-30 22:29:21 +08:00
|
|
|
case 0:
|
|
|
|
O << "wrap";
|
|
|
|
break;
|
|
|
|
case 1:
|
|
|
|
O << "clamp_to_border";
|
|
|
|
break;
|
|
|
|
case 2:
|
|
|
|
O << "clamp_to_edge";
|
|
|
|
break;
|
|
|
|
case 3:
|
|
|
|
O << "wrap";
|
|
|
|
break;
|
|
|
|
case 4:
|
|
|
|
O << "mirror";
|
|
|
|
break;
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
2013-03-30 22:29:21 +08:00
|
|
|
O << ", ";
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
O << "filter_mode = ";
|
2013-03-30 22:29:21 +08:00
|
|
|
switch ((sample & __CLK_FILTER_MASK) >> __CLK_FILTER_BASE) {
|
|
|
|
case 0:
|
|
|
|
O << "nearest";
|
|
|
|
break;
|
|
|
|
case 1:
|
|
|
|
O << "linear";
|
|
|
|
break;
|
|
|
|
case 2:
|
2014-06-18 13:05:13 +08:00
|
|
|
llvm_unreachable("Anisotropic filtering is not supported");
|
2013-03-30 22:29:21 +08:00
|
|
|
default:
|
|
|
|
O << "nearest";
|
|
|
|
break;
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
2013-03-30 22:29:21 +08:00
|
|
|
if (!((sample & __CLK_NORMALIZED_MASK) >> __CLK_NORMALIZED_BASE)) {
|
2012-05-05 04:18:50 +08:00
|
|
|
O << ", force_unnormalized_coords = 1";
|
|
|
|
}
|
|
|
|
O << " }";
|
|
|
|
}
|
|
|
|
|
|
|
|
O << ";\n";
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (GVar->hasPrivateLinkage()) {
|
|
|
|
|
|
|
|
if (!strncmp(GVar->getName().data(), "unrollpragma", 12))
|
|
|
|
return;
|
|
|
|
|
|
|
|
// FIXME - need better way (e.g. Metadata) to avoid generating this global
|
|
|
|
if (!strncmp(GVar->getName().data(), "filename", 8))
|
|
|
|
return;
|
|
|
|
if (GVar->use_empty())
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2014-04-25 13:30:21 +08:00
|
|
|
const Function *demotedFunc = nullptr;
|
2012-05-05 04:18:50 +08:00
|
|
|
if (!processDemoted && canDemoteGlobalVar(GVar, demotedFunc)) {
|
2015-03-30 23:42:36 +08:00
|
|
|
O << "// " << GVar->getName() << " has been demoted\n";
|
2012-05-05 04:18:50 +08:00
|
|
|
if (localDecls.find(demotedFunc) != localDecls.end())
|
|
|
|
localDecls[demotedFunc].push_back(GVar);
|
|
|
|
else {
|
2013-05-20 20:13:32 +08:00
|
|
|
std::vector<const GlobalVariable *> temp;
|
2012-05-05 04:18:50 +08:00
|
|
|
temp.push_back(GVar);
|
|
|
|
localDecls[demotedFunc] = temp;
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
O << ".";
|
|
|
|
emitPTXAddressSpace(PTy->getAddressSpace(), O);
|
2014-06-28 02:35:58 +08:00
|
|
|
|
|
|
|
if (isManaged(*GVar)) {
|
|
|
|
O << " .attribute(.managed)";
|
|
|
|
}
|
|
|
|
|
2012-05-05 04:18:50 +08:00
|
|
|
if (GVar->getAlignment() == 0)
|
|
|
|
O << " .align " << (int) TD->getPrefTypeAlignment(ETy);
|
|
|
|
else
|
|
|
|
O << " .align " << GVar->getAlignment();
|
|
|
|
|
2014-12-18 01:59:04 +08:00
|
|
|
if (ETy->isFloatingPointTy() || ETy->isIntegerTy() || ETy->isPointerTy()) {
|
2012-05-05 04:18:50 +08:00
|
|
|
O << " .";
|
2013-05-20 20:13:28 +08:00
|
|
|
// Special case: ABI requires that we use .u8 for predicates
|
|
|
|
if (ETy->isIntegerTy(1))
|
|
|
|
O << "u8";
|
|
|
|
else
|
|
|
|
O << getPTXFundamentalTypeStr(ETy, false);
|
2012-05-05 04:18:50 +08:00
|
|
|
O << " ";
|
2014-04-01 00:11:57 +08:00
|
|
|
O << *getSymbol(GVar);
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
// Ptx allows variable initilization only for constant and global state
|
|
|
|
// spaces.
|
2014-06-28 02:36:01 +08:00
|
|
|
if (GVar->hasInitializer()) {
|
|
|
|
if ((PTy->getAddressSpace() == llvm::ADDRESS_SPACE_GLOBAL) ||
|
|
|
|
(PTy->getAddressSpace() == llvm::ADDRESS_SPACE_CONST)) {
|
|
|
|
const Constant *Initializer = GVar->getInitializer();
|
2015-04-24 10:57:30 +08:00
|
|
|
// 'undef' is treated as there is no value specified.
|
2014-06-28 02:36:01 +08:00
|
|
|
if (!Initializer->isNullValue() && !isa<UndefValue>(Initializer)) {
|
|
|
|
O << " = ";
|
|
|
|
printScalarConstant(Initializer, O);
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
// The frontend adds zero-initializer to variables that don't have an
|
|
|
|
// initial value, so skip warning for this case.
|
|
|
|
if (!GVar->getInitializer()->isNullValue()) {
|
2015-03-30 23:42:36 +08:00
|
|
|
std::string warnMsg =
|
|
|
|
("initial value of '" + GVar->getName() +
|
|
|
|
"' is not allowed in addrspace(" +
|
|
|
|
Twine(llvm::utostr_32(PTy->getAddressSpace())) + ")").str();
|
2014-06-28 02:36:01 +08:00
|
|
|
report_fatal_error(warnMsg.c_str());
|
|
|
|
}
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
} else {
|
2013-03-30 22:29:21 +08:00
|
|
|
unsigned int ElementSize = 0;
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
// Although PTX has direct support for struct type and array type and
|
|
|
|
// LLVM IR is very similar to PTX, the LLVM CodeGen does not support for
|
|
|
|
// targets that support these high level field accesses. Structs, arrays
|
|
|
|
// and vectors are lowered into arrays of bytes.
|
|
|
|
switch (ETy->getTypeID()) {
|
|
|
|
case Type::StructTyID:
|
|
|
|
case Type::ArrayTyID:
|
|
|
|
case Type::VectorTyID:
|
|
|
|
ElementSize = TD->getTypeStoreSize(ETy);
|
|
|
|
// Ptx allows variable initilization only for constant and
|
|
|
|
// global state spaces.
|
|
|
|
if (((PTy->getAddressSpace() == llvm::ADDRESS_SPACE_GLOBAL) ||
|
2013-03-30 22:29:21 +08:00
|
|
|
(PTy->getAddressSpace() == llvm::ADDRESS_SPACE_CONST)) &&
|
|
|
|
GVar->hasInitializer()) {
|
2013-05-20 20:13:32 +08:00
|
|
|
const Constant *Initializer = GVar->getInitializer();
|
2013-03-30 22:29:21 +08:00
|
|
|
if (!isa<UndefValue>(Initializer) && !Initializer->isNullValue()) {
|
2012-05-05 04:18:50 +08:00
|
|
|
AggBuffer aggBuffer(ElementSize, O, *this);
|
|
|
|
bufferAggregateConstant(Initializer, &aggBuffer);
|
|
|
|
if (aggBuffer.numSymbols) {
|
2015-02-19 08:08:14 +08:00
|
|
|
if (static_cast<const NVPTXTargetMachine &>(TM).is64Bit()) {
|
2014-04-01 00:11:57 +08:00
|
|
|
O << " .u64 " << *getSymbol(GVar) << "[";
|
2013-03-30 22:29:21 +08:00
|
|
|
O << ElementSize / 8;
|
|
|
|
} else {
|
2014-04-01 00:11:57 +08:00
|
|
|
O << " .u32 " << *getSymbol(GVar) << "[";
|
2013-03-30 22:29:21 +08:00
|
|
|
O << ElementSize / 4;
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
O << "]";
|
2013-03-30 22:29:21 +08:00
|
|
|
} else {
|
2014-04-01 00:11:57 +08:00
|
|
|
O << " .b8 " << *getSymbol(GVar) << "[";
|
2012-05-05 04:18:50 +08:00
|
|
|
O << ElementSize;
|
|
|
|
O << "]";
|
|
|
|
}
|
2013-03-30 22:29:21 +08:00
|
|
|
O << " = {";
|
2012-05-05 04:18:50 +08:00
|
|
|
aggBuffer.print();
|
|
|
|
O << "}";
|
2013-03-30 22:29:21 +08:00
|
|
|
} else {
|
2014-04-01 00:11:57 +08:00
|
|
|
O << " .b8 " << *getSymbol(GVar);
|
2012-05-05 04:18:50 +08:00
|
|
|
if (ElementSize) {
|
2013-03-30 22:29:21 +08:00
|
|
|
O << "[";
|
2012-05-05 04:18:50 +08:00
|
|
|
O << ElementSize;
|
|
|
|
O << "]";
|
|
|
|
}
|
|
|
|
}
|
2013-03-30 22:29:21 +08:00
|
|
|
} else {
|
2014-04-01 00:11:57 +08:00
|
|
|
O << " .b8 " << *getSymbol(GVar);
|
2012-05-05 04:18:50 +08:00
|
|
|
if (ElementSize) {
|
2013-03-30 22:29:21 +08:00
|
|
|
O << "[";
|
2012-05-05 04:18:50 +08:00
|
|
|
O << ElementSize;
|
|
|
|
O << "]";
|
|
|
|
}
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
default:
|
2014-06-18 13:05:13 +08:00
|
|
|
llvm_unreachable("type not supported yet");
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
O << ";\n";
|
|
|
|
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::emitDemotedVars(const Function *f, raw_ostream &O) {
|
|
|
|
if (localDecls.find(f) == localDecls.end())
|
|
|
|
return;
|
|
|
|
|
2013-05-20 20:13:32 +08:00
|
|
|
std::vector<const GlobalVariable *> &gvars = localDecls[f];
|
2012-05-05 04:18:50 +08:00
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
for (unsigned i = 0, e = gvars.size(); i != e; ++i) {
|
2012-05-05 04:18:50 +08:00
|
|
|
O << "\t// demoted variable\n\t";
|
|
|
|
printModuleLevelGV(gvars[i], O, true);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::emitPTXAddressSpace(unsigned int AddressSpace,
|
|
|
|
raw_ostream &O) const {
|
|
|
|
switch (AddressSpace) {
|
|
|
|
case llvm::ADDRESS_SPACE_LOCAL:
|
2013-03-30 22:29:21 +08:00
|
|
|
O << "local";
|
2012-05-05 04:18:50 +08:00
|
|
|
break;
|
|
|
|
case llvm::ADDRESS_SPACE_GLOBAL:
|
2013-03-30 22:29:21 +08:00
|
|
|
O << "global";
|
2012-05-05 04:18:50 +08:00
|
|
|
break;
|
|
|
|
case llvm::ADDRESS_SPACE_CONST:
|
2013-03-30 22:29:21 +08:00
|
|
|
O << "const";
|
2012-05-05 04:18:50 +08:00
|
|
|
break;
|
|
|
|
case llvm::ADDRESS_SPACE_SHARED:
|
2013-03-30 22:29:21 +08:00
|
|
|
O << "shared";
|
2012-05-05 04:18:50 +08:00
|
|
|
break;
|
|
|
|
default:
|
2013-02-09 21:34:15 +08:00
|
|
|
report_fatal_error("Bad address space found while emitting PTX");
|
|
|
|
break;
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
std::string
|
|
|
|
NVPTXAsmPrinter::getPTXFundamentalTypeStr(const Type *Ty, bool useB4PTR) const {
|
2012-05-05 04:18:50 +08:00
|
|
|
switch (Ty->getTypeID()) {
|
|
|
|
default:
|
|
|
|
llvm_unreachable("unexpected type");
|
|
|
|
break;
|
|
|
|
case Type::IntegerTyID: {
|
|
|
|
unsigned NumBits = cast<IntegerType>(Ty)->getBitWidth();
|
|
|
|
if (NumBits == 1)
|
|
|
|
return "pred";
|
|
|
|
else if (NumBits <= 64) {
|
|
|
|
std::string name = "u";
|
|
|
|
return name + utostr(NumBits);
|
|
|
|
} else {
|
|
|
|
llvm_unreachable("Integer too large");
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case Type::FloatTyID:
|
|
|
|
return "f32";
|
|
|
|
case Type::DoubleTyID:
|
|
|
|
return "f64";
|
|
|
|
case Type::PointerTyID:
|
2015-02-19 08:08:14 +08:00
|
|
|
if (static_cast<const NVPTXTargetMachine &>(TM).is64Bit())
|
2013-03-30 22:29:21 +08:00
|
|
|
if (useB4PTR)
|
|
|
|
return "b64";
|
|
|
|
else
|
|
|
|
return "u64";
|
|
|
|
else if (useB4PTR)
|
|
|
|
return "b32";
|
2012-05-05 04:18:50 +08:00
|
|
|
else
|
2013-03-30 22:29:21 +08:00
|
|
|
return "u32";
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
llvm_unreachable("unexpected type");
|
2014-04-25 13:30:21 +08:00
|
|
|
return nullptr;
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
void NVPTXAsmPrinter::emitPTXGlobalVariable(const GlobalVariable *GVar,
|
2012-05-05 04:18:50 +08:00
|
|
|
raw_ostream &O) {
|
|
|
|
|
2015-01-27 03:03:15 +08:00
|
|
|
const DataLayout *TD = TM.getDataLayout();
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
// GlobalVariables are always constant pointers themselves.
|
|
|
|
const PointerType *PTy = GVar->getType();
|
|
|
|
Type *ETy = PTy->getElementType();
|
|
|
|
|
|
|
|
O << ".";
|
|
|
|
emitPTXAddressSpace(PTy->getAddressSpace(), O);
|
|
|
|
if (GVar->getAlignment() == 0)
|
|
|
|
O << " .align " << (int) TD->getPrefTypeAlignment(ETy);
|
|
|
|
else
|
|
|
|
O << " .align " << GVar->getAlignment();
|
|
|
|
|
2014-12-18 01:59:04 +08:00
|
|
|
if (ETy->isFloatingPointTy() || ETy->isIntegerTy() || ETy->isPointerTy()) {
|
2012-05-05 04:18:50 +08:00
|
|
|
O << " .";
|
|
|
|
O << getPTXFundamentalTypeStr(ETy);
|
|
|
|
O << " ";
|
2014-04-01 00:11:57 +08:00
|
|
|
O << *getSymbol(GVar);
|
2012-05-05 04:18:50 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
int64_t ElementSize = 0;
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
// Although PTX has direct support for struct type and array type and LLVM IR
|
|
|
|
// is very similar to PTX, the LLVM CodeGen does not support for targets that
|
|
|
|
// support these high level field accesses. Structs and arrays are lowered
|
|
|
|
// into arrays of bytes.
|
|
|
|
switch (ETy->getTypeID()) {
|
|
|
|
case Type::StructTyID:
|
|
|
|
case Type::ArrayTyID:
|
|
|
|
case Type::VectorTyID:
|
|
|
|
ElementSize = TD->getTypeStoreSize(ETy);
|
2014-04-01 00:11:57 +08:00
|
|
|
O << " .b8 " << *getSymbol(GVar) << "[";
|
2012-05-05 04:18:50 +08:00
|
|
|
if (ElementSize) {
|
2013-03-30 22:29:21 +08:00
|
|
|
O << itostr(ElementSize);
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
O << "]";
|
|
|
|
break;
|
|
|
|
default:
|
2014-06-18 13:05:13 +08:00
|
|
|
llvm_unreachable("type not supported yet");
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
2013-03-30 22:29:21 +08:00
|
|
|
return;
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
static unsigned int getOpenCLAlignment(const DataLayout *TD, Type *Ty) {
|
2013-12-08 03:34:20 +08:00
|
|
|
if (Ty->isSingleValueType())
|
2012-05-05 04:18:50 +08:00
|
|
|
return TD->getPrefTypeAlignment(Ty);
|
|
|
|
|
|
|
|
const ArrayType *ATy = dyn_cast<ArrayType>(Ty);
|
|
|
|
if (ATy)
|
|
|
|
return getOpenCLAlignment(TD, ATy->getElementType());
|
|
|
|
|
|
|
|
const StructType *STy = dyn_cast<StructType>(Ty);
|
|
|
|
if (STy) {
|
|
|
|
unsigned int alignStruct = 1;
|
|
|
|
// Go through each element of the struct and find the
|
|
|
|
// largest alignment.
|
2013-03-30 22:29:21 +08:00
|
|
|
for (unsigned i = 0, e = STy->getNumElements(); i != e; i++) {
|
2012-05-05 04:18:50 +08:00
|
|
|
Type *ETy = STy->getElementType(i);
|
|
|
|
unsigned int align = getOpenCLAlignment(TD, ETy);
|
|
|
|
if (align > alignStruct)
|
|
|
|
alignStruct = align;
|
|
|
|
}
|
|
|
|
return alignStruct;
|
|
|
|
}
|
|
|
|
|
|
|
|
const FunctionType *FTy = dyn_cast<FunctionType>(Ty);
|
|
|
|
if (FTy)
|
Revert the majority of the next patch in the address space series:
r165941: Resubmit the changes to llvm core to update the functions to
support different pointer sizes on a per address space basis.
Despite this commit log, this change primarily changed stuff outside of
VMCore, and those changes do not carry any tests for correctness (or
even plausibility), and we have consistently found questionable or flat
out incorrect cases in these changes. Most of them are probably correct,
but we need to devise a system that makes it more clear when we have
handled the address space concerns correctly, and ideally each pass that
gets updated would receive an accompanying test case that exercises that
pass specificaly w.r.t. alternate address spaces.
However, from this commit, I have retained the new C API entry points.
Those were an orthogonal change that probably should have been split
apart, but they seem entirely good.
In several places the changes were very obvious cleanups with no actual
multiple address space code added; these I have not reverted when
I spotted them.
In a few other places there were merge conflicts due to a cleaner
solution being implemented later, often not using address spaces at all.
In those cases, I've preserved the new code which isn't address space
dependent.
This is part of my ongoing effort to clean out the partial address space
code which carries high risk and low test coverage, and not likely to be
finished before the 3.2 release looms closer. Duncan and I would both
like to see the above issues addressed before we return to these
changes.
llvm-svn: 167222
2012-11-01 17:14:31 +08:00
|
|
|
return TD->getPointerPrefAlignment();
|
2012-05-05 04:18:50 +08:00
|
|
|
return TD->getPrefTypeAlignment(Ty);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Print the PTX name of the parameter with index paramIndex of the function
// that owns argument I, in the form "<function symbol>_param_<index>".
void NVPTXAsmPrinter::printParamName(Function::const_arg_iterator I,
                                     int paramIndex, raw_ostream &O) {
  const Function *Owner = I->getParent();
  O << *getSymbol(Owner);
  O << "_param_" << paramIndex;
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::printParamName(int paramIndex, raw_ostream &O) {
|
2015-02-19 08:08:23 +08:00
|
|
|
O << *CurrentFnSym << "_param_" << paramIndex;
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
void NVPTXAsmPrinter::emitFunctionParamList(const Function *F, raw_ostream &O) {
|
2015-01-27 03:03:15 +08:00
|
|
|
const DataLayout *TD = TM.getDataLayout();
|
2012-12-08 07:16:57 +08:00
|
|
|
const AttributeSet &PAL = F->getAttributes();
|
2015-02-19 08:08:14 +08:00
|
|
|
const TargetLowering *TLI = nvptxSubtarget->getTargetLowering();
|
2012-05-05 04:18:50 +08:00
|
|
|
Function::const_arg_iterator I, E;
|
|
|
|
unsigned paramIndex = 0;
|
|
|
|
bool first = true;
|
|
|
|
bool isKernelFunc = llvm::isKernelFunction(*F);
|
2015-02-19 08:08:14 +08:00
|
|
|
bool isABI = (nvptxSubtarget->getSmVersion() >= 20);
|
2012-05-05 04:18:50 +08:00
|
|
|
MVT thePointerTy = TLI->getPointerTy();
|
|
|
|
|
|
|
|
O << "(\n";
|
|
|
|
|
|
|
|
for (I = F->arg_begin(), E = F->arg_end(); I != E; ++I, paramIndex++) {
|
2013-03-25 05:17:47 +08:00
|
|
|
Type *Ty = I->getType();
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
if (!first)
|
|
|
|
O << ",\n";
|
|
|
|
|
|
|
|
first = false;
|
|
|
|
|
|
|
|
// Handle image/sampler parameters
|
2014-04-09 23:39:15 +08:00
|
|
|
if (isKernelFunction(*F)) {
|
|
|
|
if (isSampler(*I) || isImage(*I)) {
|
|
|
|
if (isImage(*I)) {
|
|
|
|
std::string sname = I->getName();
|
|
|
|
if (isImageWriteOnly(*I) || isImageReadWrite(*I)) {
|
2015-02-19 08:08:14 +08:00
|
|
|
if (nvptxSubtarget->hasImageHandles())
|
2014-04-09 23:39:15 +08:00
|
|
|
O << "\t.param .u64 .ptr .surfref ";
|
|
|
|
else
|
|
|
|
O << "\t.param .surfref ";
|
|
|
|
O << *CurrentFnSym << "_param_" << paramIndex;
|
|
|
|
}
|
|
|
|
else { // Default image is read_only
|
2015-02-19 08:08:14 +08:00
|
|
|
if (nvptxSubtarget->hasImageHandles())
|
2014-04-09 23:39:15 +08:00
|
|
|
O << "\t.param .u64 .ptr .texref ";
|
|
|
|
else
|
|
|
|
O << "\t.param .texref ";
|
|
|
|
O << *CurrentFnSym << "_param_" << paramIndex;
|
|
|
|
}
|
|
|
|
} else {
|
2015-02-19 08:08:14 +08:00
|
|
|
if (nvptxSubtarget->hasImageHandles())
|
2014-04-09 23:39:15 +08:00
|
|
|
O << "\t.param .u64 .ptr .samplerref ";
|
|
|
|
else
|
|
|
|
O << "\t.param .samplerref ";
|
|
|
|
O << *CurrentFnSym << "_param_" << paramIndex;
|
|
|
|
}
|
|
|
|
continue;
|
|
|
|
}
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
2015-03-24 00:26:23 +08:00
|
|
|
if (!PAL.hasAttribute(paramIndex + 1, Attribute::ByVal)) {
|
2014-01-29 02:35:29 +08:00
|
|
|
if (Ty->isAggregateType() || Ty->isVectorTy()) {
|
|
|
|
// Just print .param .align <a> .b8 .param[size];
|
2013-03-25 05:17:47 +08:00
|
|
|
// <a> = PAL.getparamalignment
|
|
|
|
// size = typeallocsize of element type
|
2013-03-30 22:29:21 +08:00
|
|
|
unsigned align = PAL.getParamAlignment(paramIndex + 1);
|
2013-03-25 05:17:47 +08:00
|
|
|
if (align == 0)
|
|
|
|
align = TD->getABITypeAlignment(Ty);
|
|
|
|
|
|
|
|
unsigned sz = TD->getTypeAllocSize(Ty);
|
2013-03-30 22:29:21 +08:00
|
|
|
O << "\t.param .align " << align << " .b8 ";
|
2013-03-25 05:17:47 +08:00
|
|
|
printParamName(I, paramIndex, O);
|
|
|
|
O << "[" << sz << "]";
|
|
|
|
|
|
|
|
continue;
|
|
|
|
}
|
2012-05-05 04:18:50 +08:00
|
|
|
// Just a scalar
|
|
|
|
const PointerType *PTy = dyn_cast<PointerType>(Ty);
|
|
|
|
if (isKernelFunc) {
|
|
|
|
if (PTy) {
|
|
|
|
// Special handling for pointer arguments to kernel
|
|
|
|
O << "\t.param .u" << thePointerTy.getSizeInBits() << " ";
|
|
|
|
|
2015-02-19 08:08:23 +08:00
|
|
|
if (static_cast<NVPTXTargetMachine &>(TM).getDrvInterface() !=
|
|
|
|
NVPTX::CUDA) {
|
2012-05-05 04:18:50 +08:00
|
|
|
Type *ETy = PTy->getElementType();
|
|
|
|
int addrSpace = PTy->getAddressSpace();
|
2013-03-30 22:29:21 +08:00
|
|
|
switch (addrSpace) {
|
2012-05-05 04:18:50 +08:00
|
|
|
default:
|
|
|
|
O << ".ptr ";
|
|
|
|
break;
|
2013-06-10 21:29:47 +08:00
|
|
|
case llvm::ADDRESS_SPACE_CONST:
|
2012-05-05 04:18:50 +08:00
|
|
|
O << ".ptr .const ";
|
|
|
|
break;
|
|
|
|
case llvm::ADDRESS_SPACE_SHARED:
|
|
|
|
O << ".ptr .shared ";
|
|
|
|
break;
|
|
|
|
case llvm::ADDRESS_SPACE_GLOBAL:
|
|
|
|
O << ".ptr .global ";
|
|
|
|
break;
|
|
|
|
}
|
2013-03-30 22:29:21 +08:00
|
|
|
O << ".align " << (int) getOpenCLAlignment(TD, ETy) << " ";
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
printParamName(I, paramIndex, O);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
// non-pointer scalar to kernel func
|
2013-05-20 20:13:28 +08:00
|
|
|
O << "\t.param .";
|
|
|
|
// Special case: predicate operands become .u8 types
|
|
|
|
if (Ty->isIntegerTy(1))
|
|
|
|
O << "u8";
|
|
|
|
else
|
|
|
|
O << getPTXFundamentalTypeStr(Ty);
|
|
|
|
O << " ";
|
2012-05-05 04:18:50 +08:00
|
|
|
printParamName(I, paramIndex, O);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
// Non-kernel function, just print .param .b<size> for ABI
|
2013-12-05 13:44:44 +08:00
|
|
|
// and .reg .b<size> for non-ABI
|
2012-05-05 04:18:50 +08:00
|
|
|
unsigned sz = 0;
|
|
|
|
if (isa<IntegerType>(Ty)) {
|
|
|
|
sz = cast<IntegerType>(Ty)->getBitWidth();
|
2013-03-30 22:29:21 +08:00
|
|
|
if (sz < 32)
|
|
|
|
sz = 32;
|
|
|
|
} else if (isa<PointerType>(Ty))
|
2012-05-05 04:18:50 +08:00
|
|
|
sz = thePointerTy.getSizeInBits();
|
|
|
|
else
|
|
|
|
sz = Ty->getPrimitiveSizeInBits();
|
|
|
|
if (isABI)
|
|
|
|
O << "\t.param .b" << sz << " ";
|
|
|
|
else
|
|
|
|
O << "\t.reg .b" << sz << " ";
|
|
|
|
printParamName(I, paramIndex, O);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
// param has byVal attribute. So should be a pointer
|
|
|
|
const PointerType *PTy = dyn_cast<PointerType>(Ty);
|
2013-03-30 22:29:21 +08:00
|
|
|
assert(PTy && "Param with byval attribute should be a pointer type");
|
2012-05-05 04:18:50 +08:00
|
|
|
Type *ETy = PTy->getElementType();
|
|
|
|
|
|
|
|
if (isABI || isKernelFunc) {
|
2014-01-29 02:35:29 +08:00
|
|
|
// Just print .param .align <a> .b8 .param[size];
|
2012-05-05 04:18:50 +08:00
|
|
|
// <a> = PAL.getparamalignment
|
|
|
|
// size = typeallocsize of element type
|
2013-03-30 22:29:21 +08:00
|
|
|
unsigned align = PAL.getParamAlignment(paramIndex + 1);
|
2012-11-10 07:50:24 +08:00
|
|
|
if (align == 0)
|
|
|
|
align = TD->getABITypeAlignment(ETy);
|
|
|
|
|
2012-05-05 04:18:50 +08:00
|
|
|
unsigned sz = TD->getTypeAllocSize(ETy);
|
2013-03-30 22:29:21 +08:00
|
|
|
O << "\t.param .align " << align << " .b8 ";
|
2012-05-05 04:18:50 +08:00
|
|
|
printParamName(I, paramIndex, O);
|
|
|
|
O << "[" << sz << "]";
|
|
|
|
continue;
|
|
|
|
} else {
|
|
|
|
// Split the ETy into constituent parts and
|
|
|
|
// print .param .b<size> <name> for each part.
|
|
|
|
// Further, if a part is vector, print the above for
|
|
|
|
// each vector element.
|
|
|
|
SmallVector<EVT, 16> vtparts;
|
|
|
|
ComputeValueVTs(*TLI, ETy, vtparts);
|
2013-03-30 22:29:21 +08:00
|
|
|
for (unsigned i = 0, e = vtparts.size(); i != e; ++i) {
|
2012-05-05 04:18:50 +08:00
|
|
|
unsigned elems = 1;
|
|
|
|
EVT elemtype = vtparts[i];
|
|
|
|
if (vtparts[i].isVector()) {
|
|
|
|
elems = vtparts[i].getVectorNumElements();
|
|
|
|
elemtype = vtparts[i].getVectorElementType();
|
|
|
|
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
for (unsigned j = 0, je = elems; j != je; ++j) {
|
2012-05-05 04:18:50 +08:00
|
|
|
unsigned sz = elemtype.getSizeInBits();
|
2013-03-30 22:29:21 +08:00
|
|
|
if (elemtype.isInteger() && (sz < 32))
|
|
|
|
sz = 32;
|
2012-05-05 04:18:50 +08:00
|
|
|
O << "\t.reg .b" << sz << " ";
|
|
|
|
printParamName(I, paramIndex, O);
|
2013-03-30 22:29:21 +08:00
|
|
|
if (j < je - 1)
|
|
|
|
O << ",\n";
|
2012-05-05 04:18:50 +08:00
|
|
|
++paramIndex;
|
|
|
|
}
|
2013-03-30 22:29:21 +08:00
|
|
|
if (i < e - 1)
|
2012-05-05 04:18:50 +08:00
|
|
|
O << ",\n";
|
|
|
|
}
|
|
|
|
--paramIndex;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
O << "\n)\n";
|
|
|
|
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::emitFunctionParamList(const MachineFunction &MF,
|
|
|
|
raw_ostream &O) {
|
|
|
|
const Function *F = MF.getFunction();
|
|
|
|
emitFunctionParamList(F, O);
|
|
|
|
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
void NVPTXAsmPrinter::setAndEmitFunctionVirtualRegisters(
|
|
|
|
const MachineFunction &MF) {
|
2012-05-05 04:18:50 +08:00
|
|
|
SmallString<128> Str;
|
|
|
|
raw_svector_ostream O(Str);
|
|
|
|
|
|
|
|
// Map the global virtual register number to a register class specific
|
|
|
|
// virtual register number starting from 1 with that class.
|
2014-08-05 10:39:49 +08:00
|
|
|
const TargetRegisterInfo *TRI = MF.getSubtarget().getRegisterInfo();
|
2012-05-05 04:18:50 +08:00
|
|
|
//unsigned numRegClasses = TRI->getNumRegClasses();
|
|
|
|
|
|
|
|
// Emit the Fake Stack Object
|
|
|
|
const MachineFrameInfo *MFI = MF.getFrameInfo();
|
|
|
|
int NumBytes = (int) MFI->getStackSize();
|
|
|
|
if (NumBytes) {
|
2013-03-30 22:29:21 +08:00
|
|
|
O << "\t.local .align " << MFI->getMaxAlignment() << " .b8 \t" << DEPOTNAME
|
|
|
|
<< getFunctionNumber() << "[" << NumBytes << "];\n";
|
2015-02-19 08:08:27 +08:00
|
|
|
if (static_cast<const NVPTXTargetMachine &>(MF.getTarget()).is64Bit()) {
|
2012-05-05 04:18:50 +08:00
|
|
|
O << "\t.reg .b64 \t%SP;\n";
|
|
|
|
O << "\t.reg .b64 \t%SPL;\n";
|
2013-03-30 22:29:21 +08:00
|
|
|
} else {
|
2012-05-05 04:18:50 +08:00
|
|
|
O << "\t.reg .b32 \t%SP;\n";
|
|
|
|
O << "\t.reg .b32 \t%SPL;\n";
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Go through all virtual registers to establish the mapping between the
|
|
|
|
// global virtual
|
|
|
|
// register number and the per class virtual register number.
|
|
|
|
// We use the per class virtual register number in the ptx output.
|
|
|
|
unsigned int numVRs = MRI->getNumVirtRegs();
|
2013-03-30 22:29:21 +08:00
|
|
|
for (unsigned i = 0; i < numVRs; i++) {
|
2012-05-05 04:18:50 +08:00
|
|
|
unsigned int vr = TRI->index2VirtReg(i);
|
|
|
|
const TargetRegisterClass *RC = MRI->getRegClass(vr);
|
2013-05-31 20:14:49 +08:00
|
|
|
DenseMap<unsigned, unsigned> ®map = VRegMapping[RC];
|
2012-05-05 04:18:50 +08:00
|
|
|
int n = regmap.size();
|
2013-03-30 22:29:21 +08:00
|
|
|
regmap.insert(std::make_pair(vr, n + 1));
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Emit register declarations
|
|
|
|
// @TODO: Extract out the real register usage
|
2013-05-31 20:14:49 +08:00
|
|
|
// O << "\t.reg .pred %p<" << NVPTXNumRegisters << ">;\n";
|
|
|
|
// O << "\t.reg .s16 %rc<" << NVPTXNumRegisters << ">;\n";
|
|
|
|
// O << "\t.reg .s16 %rs<" << NVPTXNumRegisters << ">;\n";
|
|
|
|
// O << "\t.reg .s32 %r<" << NVPTXNumRegisters << ">;\n";
|
2014-07-17 00:26:58 +08:00
|
|
|
// O << "\t.reg .s64 %rd<" << NVPTXNumRegisters << ">;\n";
|
2013-05-31 20:14:49 +08:00
|
|
|
// O << "\t.reg .f32 %f<" << NVPTXNumRegisters << ">;\n";
|
2014-07-17 00:26:58 +08:00
|
|
|
// O << "\t.reg .f64 %fd<" << NVPTXNumRegisters << ">;\n";
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
// Emit declaration of the virtual registers or 'physical' registers for
|
|
|
|
// each register class
|
2013-05-31 20:14:49 +08:00
|
|
|
for (unsigned i=0; i< TRI->getNumRegClasses(); i++) {
|
|
|
|
const TargetRegisterClass *RC = TRI->getRegClass(i);
|
|
|
|
DenseMap<unsigned, unsigned> ®map = VRegMapping[RC];
|
|
|
|
std::string rcname = getNVPTXRegClassName(RC);
|
|
|
|
std::string rcStr = getNVPTXRegClassStr(RC);
|
|
|
|
int n = regmap.size();
|
|
|
|
|
|
|
|
// Only declare those registers that may be used.
|
|
|
|
if (n) {
|
|
|
|
O << "\t.reg " << rcname << " \t" << rcStr << "<" << (n+1)
|
|
|
|
<< ">;\n";
|
|
|
|
}
|
|
|
|
}
|
2012-05-05 04:18:50 +08:00
|
|
|
|
2015-04-25 03:11:51 +08:00
|
|
|
OutStreamer->EmitRawText(O.str());
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::printFPConstant(const ConstantFP *Fp, raw_ostream &O) {
|
2013-03-30 22:29:21 +08:00
|
|
|
APFloat APF = APFloat(Fp->getValueAPF()); // make a copy
|
2012-05-05 04:18:50 +08:00
|
|
|
bool ignored;
|
|
|
|
unsigned int numHex;
|
|
|
|
const char *lead;
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
if (Fp->getType()->getTypeID() == Type::FloatTyID) {
|
2012-05-05 04:18:50 +08:00
|
|
|
numHex = 8;
|
|
|
|
lead = "0f";
|
2013-03-30 22:29:21 +08:00
|
|
|
APF.convert(APFloat::IEEEsingle, APFloat::rmNearestTiesToEven, &ignored);
|
2012-05-05 04:18:50 +08:00
|
|
|
} else if (Fp->getType()->getTypeID() == Type::DoubleTyID) {
|
|
|
|
numHex = 16;
|
|
|
|
lead = "0d";
|
2013-03-30 22:29:21 +08:00
|
|
|
APF.convert(APFloat::IEEEdouble, APFloat::rmNearestTiesToEven, &ignored);
|
2012-05-05 04:18:50 +08:00
|
|
|
} else
|
|
|
|
llvm_unreachable("unsupported fp type");
|
|
|
|
|
|
|
|
APInt API = APF.bitcastToAPInt();
|
|
|
|
std::string hexstr(utohexstr(API.getZExtValue()));
|
|
|
|
O << lead;
|
|
|
|
if (hexstr.length() < numHex)
|
|
|
|
O << std::string(numHex - hexstr.length(), '0');
|
|
|
|
O << utohexstr(API.getZExtValue());
|
|
|
|
}
|
|
|
|
|
2013-05-20 20:13:32 +08:00
|
|
|
void NVPTXAsmPrinter::printScalarConstant(const Constant *CPV, raw_ostream &O) {
|
|
|
|
if (const ConstantInt *CI = dyn_cast<ConstantInt>(CPV)) {
|
2012-05-05 04:18:50 +08:00
|
|
|
O << CI->getValue();
|
|
|
|
return;
|
|
|
|
}
|
2013-05-20 20:13:32 +08:00
|
|
|
if (const ConstantFP *CFP = dyn_cast<ConstantFP>(CPV)) {
|
2012-05-05 04:18:50 +08:00
|
|
|
printFPConstant(CFP, O);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (isa<ConstantPointerNull>(CPV)) {
|
|
|
|
O << "0";
|
|
|
|
return;
|
|
|
|
}
|
2013-05-20 20:13:32 +08:00
|
|
|
if (const GlobalValue *GVar = dyn_cast<GlobalValue>(CPV)) {
|
2014-04-09 23:39:11 +08:00
|
|
|
PointerType *PTy = dyn_cast<PointerType>(GVar->getType());
|
|
|
|
bool IsNonGenericPointer = false;
|
|
|
|
if (PTy && PTy->getAddressSpace() != 0) {
|
|
|
|
IsNonGenericPointer = true;
|
|
|
|
}
|
|
|
|
if (EmitGeneric && !isa<Function>(CPV) && !IsNonGenericPointer) {
|
|
|
|
O << "generic(";
|
|
|
|
O << *getSymbol(GVar);
|
|
|
|
O << ")";
|
|
|
|
} else {
|
|
|
|
O << *getSymbol(GVar);
|
|
|
|
}
|
2012-05-05 04:18:50 +08:00
|
|
|
return;
|
|
|
|
}
|
2013-05-20 20:13:32 +08:00
|
|
|
if (const ConstantExpr *Cexpr = dyn_cast<ConstantExpr>(CPV)) {
|
|
|
|
const Value *v = Cexpr->stripPointerCasts();
|
2014-04-09 23:39:11 +08:00
|
|
|
PointerType *PTy = dyn_cast<PointerType>(Cexpr->getType());
|
|
|
|
bool IsNonGenericPointer = false;
|
|
|
|
if (PTy && PTy->getAddressSpace() != 0) {
|
|
|
|
IsNonGenericPointer = true;
|
|
|
|
}
|
2013-05-20 20:13:32 +08:00
|
|
|
if (const GlobalValue *GVar = dyn_cast<GlobalValue>(v)) {
|
2014-04-09 23:39:11 +08:00
|
|
|
if (EmitGeneric && !isa<Function>(v) && !IsNonGenericPointer) {
|
|
|
|
O << "generic(";
|
|
|
|
O << *getSymbol(GVar);
|
|
|
|
O << ")";
|
|
|
|
} else {
|
|
|
|
O << *getSymbol(GVar);
|
|
|
|
}
|
2012-05-05 04:18:50 +08:00
|
|
|
return;
|
|
|
|
} else {
|
2014-12-17 03:16:17 +08:00
|
|
|
O << *lowerConstant(CPV);
|
2012-05-05 04:18:50 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
llvm_unreachable("Not scalar type found in printScalarConstant()");
|
|
|
|
}
|
|
|
|
|
2013-05-20 20:13:32 +08:00
|
|
|
void NVPTXAsmPrinter::bufferLEByte(const Constant *CPV, int Bytes,
|
2012-05-05 04:18:50 +08:00
|
|
|
AggBuffer *aggBuffer) {
|
|
|
|
|
2015-01-27 03:03:15 +08:00
|
|
|
const DataLayout *TD = TM.getDataLayout();
|
2012-05-05 04:18:50 +08:00
|
|
|
|
|
|
|
if (isa<UndefValue>(CPV) || CPV->isNullValue()) {
|
|
|
|
int s = TD->getTypeAllocSize(CPV->getType());
|
2013-03-30 22:29:21 +08:00
|
|
|
if (s < Bytes)
|
2012-05-05 04:18:50 +08:00
|
|
|
s = Bytes;
|
|
|
|
aggBuffer->addZeros(s);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
unsigned char *ptr;
|
|
|
|
switch (CPV->getType()->getTypeID()) {
|
|
|
|
|
|
|
|
case Type::IntegerTyID: {
|
|
|
|
const Type *ETy = CPV->getType();
|
2013-03-30 22:29:21 +08:00
|
|
|
if (ETy == Type::getInt8Ty(CPV->getContext())) {
|
2015-04-10 19:24:51 +08:00
|
|
|
unsigned char c = (unsigned char)cast<ConstantInt>(CPV)->getZExtValue();
|
2012-05-05 04:18:50 +08:00
|
|
|
ptr = &c;
|
|
|
|
aggBuffer->addBytes(ptr, 1, Bytes);
|
2013-03-30 22:29:21 +08:00
|
|
|
} else if (ETy == Type::getInt16Ty(CPV->getContext())) {
|
2015-04-10 19:24:51 +08:00
|
|
|
short int16 = (short)cast<ConstantInt>(CPV)->getZExtValue();
|
2013-03-30 22:29:21 +08:00
|
|
|
ptr = (unsigned char *)&int16;
|
2012-05-05 04:18:50 +08:00
|
|
|
aggBuffer->addBytes(ptr, 2, Bytes);
|
2013-03-30 22:29:21 +08:00
|
|
|
} else if (ETy == Type::getInt32Ty(CPV->getContext())) {
|
2013-05-20 20:13:32 +08:00
|
|
|
if (const ConstantInt *constInt = dyn_cast<ConstantInt>(CPV)) {
|
2013-03-30 22:29:21 +08:00
|
|
|
int int32 = (int)(constInt->getZExtValue());
|
|
|
|
ptr = (unsigned char *)&int32;
|
2012-05-05 04:18:50 +08:00
|
|
|
aggBuffer->addBytes(ptr, 4, Bytes);
|
|
|
|
break;
|
2013-05-20 20:13:32 +08:00
|
|
|
} else if (const ConstantExpr *Cexpr = dyn_cast<ConstantExpr>(CPV)) {
|
|
|
|
if (const ConstantInt *constInt = dyn_cast<ConstantInt>(
|
2015-03-10 10:37:25 +08:00
|
|
|
ConstantFoldConstantExpression(Cexpr, *TD))) {
|
2013-03-30 22:29:21 +08:00
|
|
|
int int32 = (int)(constInt->getZExtValue());
|
|
|
|
ptr = (unsigned char *)&int32;
|
2012-05-05 04:18:50 +08:00
|
|
|
aggBuffer->addBytes(ptr, 4, Bytes);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
if (Cexpr->getOpcode() == Instruction::PtrToInt) {
|
|
|
|
Value *v = Cexpr->getOperand(0)->stripPointerCasts();
|
2015-04-24 10:57:30 +08:00
|
|
|
aggBuffer->addSymbol(v, Cexpr->getOperand(0));
|
2012-05-05 04:18:50 +08:00
|
|
|
aggBuffer->addZeros(4);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2012-05-24 15:02:50 +08:00
|
|
|
llvm_unreachable("unsupported integer const type");
|
2013-03-30 22:29:21 +08:00
|
|
|
} else if (ETy == Type::getInt64Ty(CPV->getContext())) {
|
2013-05-20 20:13:32 +08:00
|
|
|
if (const ConstantInt *constInt = dyn_cast<ConstantInt>(CPV)) {
|
2013-03-30 22:29:21 +08:00
|
|
|
long long int64 = (long long)(constInt->getZExtValue());
|
|
|
|
ptr = (unsigned char *)&int64;
|
2012-05-05 04:18:50 +08:00
|
|
|
aggBuffer->addBytes(ptr, 8, Bytes);
|
|
|
|
break;
|
2013-05-20 20:13:32 +08:00
|
|
|
} else if (const ConstantExpr *Cexpr = dyn_cast<ConstantExpr>(CPV)) {
|
|
|
|
if (const ConstantInt *constInt = dyn_cast<ConstantInt>(
|
2015-03-10 10:37:25 +08:00
|
|
|
ConstantFoldConstantExpression(Cexpr, *TD))) {
|
2013-03-30 22:29:21 +08:00
|
|
|
long long int64 = (long long)(constInt->getZExtValue());
|
|
|
|
ptr = (unsigned char *)&int64;
|
2012-05-05 04:18:50 +08:00
|
|
|
aggBuffer->addBytes(ptr, 8, Bytes);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
if (Cexpr->getOpcode() == Instruction::PtrToInt) {
|
|
|
|
Value *v = Cexpr->getOperand(0)->stripPointerCasts();
|
2015-04-24 10:57:30 +08:00
|
|
|
aggBuffer->addSymbol(v, Cexpr->getOperand(0));
|
2012-05-05 04:18:50 +08:00
|
|
|
aggBuffer->addZeros(8);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
llvm_unreachable("unsupported integer const type");
|
2012-05-24 15:02:50 +08:00
|
|
|
} else
|
2012-05-05 04:18:50 +08:00
|
|
|
llvm_unreachable("unsupported integer const type");
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case Type::FloatTyID:
|
|
|
|
case Type::DoubleTyID: {
|
2013-05-20 20:13:32 +08:00
|
|
|
const ConstantFP *CFP = dyn_cast<ConstantFP>(CPV);
|
2013-03-30 22:29:21 +08:00
|
|
|
const Type *Ty = CFP->getType();
|
2012-05-05 04:18:50 +08:00
|
|
|
if (Ty == Type::getFloatTy(CPV->getContext())) {
|
2013-03-30 22:29:21 +08:00
|
|
|
float float32 = (float) CFP->getValueAPF().convertToFloat();
|
|
|
|
ptr = (unsigned char *)&float32;
|
2012-05-05 04:18:50 +08:00
|
|
|
aggBuffer->addBytes(ptr, 4, Bytes);
|
|
|
|
} else if (Ty == Type::getDoubleTy(CPV->getContext())) {
|
|
|
|
double float64 = CFP->getValueAPF().convertToDouble();
|
2013-03-30 22:29:21 +08:00
|
|
|
ptr = (unsigned char *)&float64;
|
2012-05-05 04:18:50 +08:00
|
|
|
aggBuffer->addBytes(ptr, 8, Bytes);
|
2013-03-30 22:29:21 +08:00
|
|
|
} else {
|
2012-05-05 04:18:50 +08:00
|
|
|
llvm_unreachable("unsupported fp const type");
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case Type::PointerTyID: {
|
2013-05-20 20:13:32 +08:00
|
|
|
if (const GlobalValue *GVar = dyn_cast<GlobalValue>(CPV)) {
|
2015-04-24 10:57:30 +08:00
|
|
|
aggBuffer->addSymbol(GVar, GVar);
|
2013-05-20 20:13:32 +08:00
|
|
|
} else if (const ConstantExpr *Cexpr = dyn_cast<ConstantExpr>(CPV)) {
|
|
|
|
const Value *v = Cexpr->stripPointerCasts();
|
2015-04-24 10:57:30 +08:00
|
|
|
aggBuffer->addSymbol(v, Cexpr);
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
unsigned int s = TD->getTypeAllocSize(CPV->getType());
|
|
|
|
aggBuffer->addZeros(s);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
case Type::ArrayTyID:
|
|
|
|
case Type::VectorTyID:
|
|
|
|
case Type::StructTyID: {
|
|
|
|
if (isa<ConstantArray>(CPV) || isa<ConstantVector>(CPV) ||
|
2013-09-19 20:51:46 +08:00
|
|
|
isa<ConstantStruct>(CPV) || isa<ConstantDataSequential>(CPV)) {
|
2012-05-05 04:18:50 +08:00
|
|
|
int ElementSize = TD->getTypeAllocSize(CPV->getType());
|
|
|
|
bufferAggregateConstant(CPV, aggBuffer);
|
2013-03-30 22:29:21 +08:00
|
|
|
if (Bytes > ElementSize)
|
|
|
|
aggBuffer->addZeros(Bytes - ElementSize);
|
|
|
|
} else if (isa<ConstantAggregateZero>(CPV))
|
2012-05-05 04:18:50 +08:00
|
|
|
aggBuffer->addZeros(Bytes);
|
|
|
|
else
|
|
|
|
llvm_unreachable("Unexpected Constant type");
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
default:
|
|
|
|
llvm_unreachable("unsupported type");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-05-20 20:13:32 +08:00
|
|
|
void NVPTXAsmPrinter::bufferAggregateConstant(const Constant *CPV,
|
2012-05-05 04:18:50 +08:00
|
|
|
AggBuffer *aggBuffer) {
|
2015-01-27 03:03:15 +08:00
|
|
|
const DataLayout *TD = TM.getDataLayout();
|
2012-05-05 04:18:50 +08:00
|
|
|
int Bytes;
|
|
|
|
|
|
|
|
// Old constants
|
|
|
|
if (isa<ConstantArray>(CPV) || isa<ConstantVector>(CPV)) {
|
|
|
|
if (CPV->getNumOperands())
|
|
|
|
for (unsigned i = 0, e = CPV->getNumOperands(); i != e; ++i)
|
|
|
|
bufferLEByte(cast<Constant>(CPV->getOperand(i)), 0, aggBuffer);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (const ConstantDataSequential *CDS =
|
2013-03-30 22:29:21 +08:00
|
|
|
dyn_cast<ConstantDataSequential>(CPV)) {
|
2012-05-05 04:18:50 +08:00
|
|
|
if (CDS->getNumElements())
|
|
|
|
for (unsigned i = 0; i < CDS->getNumElements(); ++i)
|
|
|
|
bufferLEByte(cast<Constant>(CDS->getElementAsConstant(i)), 0,
|
|
|
|
aggBuffer);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (isa<ConstantStruct>(CPV)) {
|
|
|
|
if (CPV->getNumOperands()) {
|
|
|
|
StructType *ST = cast<StructType>(CPV->getType());
|
|
|
|
for (unsigned i = 0, e = CPV->getNumOperands(); i != e; ++i) {
|
2013-03-30 22:29:21 +08:00
|
|
|
if (i == (e - 1))
|
2012-05-05 04:18:50 +08:00
|
|
|
Bytes = TD->getStructLayout(ST)->getElementOffset(0) +
|
2013-03-30 22:29:21 +08:00
|
|
|
TD->getTypeAllocSize(ST) -
|
|
|
|
TD->getStructLayout(ST)->getElementOffset(i);
|
2012-05-05 04:18:50 +08:00
|
|
|
else
|
2013-03-30 22:29:21 +08:00
|
|
|
Bytes = TD->getStructLayout(ST)->getElementOffset(i + 1) -
|
|
|
|
TD->getStructLayout(ST)->getElementOffset(i);
|
|
|
|
bufferLEByte(cast<Constant>(CPV->getOperand(i)), Bytes, aggBuffer);
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
}
|
2012-05-24 15:02:50 +08:00
|
|
|
llvm_unreachable("unsupported constant type in printAggregateConstant()");
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// buildTypeNameMap - Run through symbol table looking for type names.
|
|
|
|
//
|
|
|
|
|
|
|
|
bool NVPTXAsmPrinter::isImageType(const Type *Ty) {
|
|
|
|
|
|
|
|
std::map<const Type *, std::string>::iterator PI = TypeNameMap.find(Ty);
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
if (PI != TypeNameMap.end() && (!PI->second.compare("struct._image1d_t") ||
|
|
|
|
!PI->second.compare("struct._image2d_t") ||
|
|
|
|
!PI->second.compare("struct._image3d_t")))
|
2012-05-05 04:18:50 +08:00
|
|
|
return true;
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
bool NVPTXAsmPrinter::ignoreLoc(const MachineInstr &MI) {
|
|
|
|
switch (MI.getOpcode()) {
|
2012-05-05 04:18:50 +08:00
|
|
|
default:
|
|
|
|
return false;
|
2013-03-30 22:29:21 +08:00
|
|
|
case NVPTX::CallArgBeginInst:
|
|
|
|
case NVPTX::CallArgEndInst0:
|
|
|
|
case NVPTX::CallArgEndInst1:
|
|
|
|
case NVPTX::CallArgF32:
|
|
|
|
case NVPTX::CallArgF64:
|
|
|
|
case NVPTX::CallArgI16:
|
|
|
|
case NVPTX::CallArgI32:
|
|
|
|
case NVPTX::CallArgI32imm:
|
|
|
|
case NVPTX::CallArgI64:
|
|
|
|
case NVPTX::CallArgParam:
|
|
|
|
case NVPTX::CallVoidInst:
|
|
|
|
case NVPTX::CallVoidInstReg:
|
|
|
|
case NVPTX::Callseq_End:
|
2012-05-05 04:18:50 +08:00
|
|
|
case NVPTX::CallVoidInstReg64:
|
2013-03-30 22:29:21 +08:00
|
|
|
case NVPTX::DeclareParamInst:
|
|
|
|
case NVPTX::DeclareRetMemInst:
|
|
|
|
case NVPTX::DeclareRetRegInst:
|
|
|
|
case NVPTX::DeclareRetScalarInst:
|
|
|
|
case NVPTX::DeclareScalarParamInst:
|
|
|
|
case NVPTX::DeclareScalarRegInst:
|
|
|
|
case NVPTX::StoreParamF32:
|
|
|
|
case NVPTX::StoreParamF64:
|
|
|
|
case NVPTX::StoreParamI16:
|
|
|
|
case NVPTX::StoreParamI32:
|
|
|
|
case NVPTX::StoreParamI64:
|
|
|
|
case NVPTX::StoreParamI8:
|
|
|
|
case NVPTX::StoreRetvalF32:
|
|
|
|
case NVPTX::StoreRetvalF64:
|
|
|
|
case NVPTX::StoreRetvalI16:
|
|
|
|
case NVPTX::StoreRetvalI32:
|
|
|
|
case NVPTX::StoreRetvalI64:
|
|
|
|
case NVPTX::StoreRetvalI8:
|
|
|
|
case NVPTX::LastCallArgF32:
|
|
|
|
case NVPTX::LastCallArgF64:
|
|
|
|
case NVPTX::LastCallArgI16:
|
|
|
|
case NVPTX::LastCallArgI32:
|
|
|
|
case NVPTX::LastCallArgI32imm:
|
|
|
|
case NVPTX::LastCallArgI64:
|
|
|
|
case NVPTX::LastCallArgParam:
|
|
|
|
case NVPTX::LoadParamMemF32:
|
|
|
|
case NVPTX::LoadParamMemF64:
|
|
|
|
case NVPTX::LoadParamMemI16:
|
|
|
|
case NVPTX::LoadParamMemI32:
|
|
|
|
case NVPTX::LoadParamMemI64:
|
|
|
|
case NVPTX::LoadParamMemI8:
|
|
|
|
case NVPTX::PrototypeInst:
|
|
|
|
case NVPTX::DBG_VALUE:
|
2012-05-05 04:18:50 +08:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2013-08-24 09:17:23 +08:00
|
|
|
/// PrintAsmOperand - Print out an operand for an inline asm expression.
|
|
|
|
///
|
|
|
|
bool NVPTXAsmPrinter::PrintAsmOperand(const MachineInstr *MI, unsigned OpNo,
|
|
|
|
unsigned AsmVariant,
|
|
|
|
const char *ExtraCode, raw_ostream &O) {
|
|
|
|
if (ExtraCode && ExtraCode[0]) {
|
|
|
|
if (ExtraCode[1] != 0)
|
|
|
|
return true; // Unknown modifier.
|
|
|
|
|
|
|
|
switch (ExtraCode[0]) {
|
|
|
|
default:
|
|
|
|
// See if this is a generic print operand
|
|
|
|
return AsmPrinter::PrintAsmOperand(MI, OpNo, AsmVariant, ExtraCode, O);
|
|
|
|
case 'r':
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
printOperand(MI, OpNo, O);
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool NVPTXAsmPrinter::PrintAsmMemoryOperand(
|
|
|
|
const MachineInstr *MI, unsigned OpNo, unsigned AsmVariant,
|
|
|
|
const char *ExtraCode, raw_ostream &O) {
|
|
|
|
if (ExtraCode && ExtraCode[0])
|
|
|
|
return true; // Unknown modifier
|
|
|
|
|
|
|
|
O << '[';
|
|
|
|
printMemOperand(MI, OpNo, O);
|
|
|
|
O << ']';
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::printOperand(const MachineInstr *MI, int opNum,
|
|
|
|
raw_ostream &O, const char *Modifier) {
|
|
|
|
const MachineOperand &MO = MI->getOperand(opNum);
|
|
|
|
switch (MO.getType()) {
|
|
|
|
case MachineOperand::MO_Register:
|
|
|
|
if (TargetRegisterInfo::isPhysicalRegister(MO.getReg())) {
|
|
|
|
if (MO.getReg() == NVPTX::VRDepot)
|
|
|
|
O << DEPOTNAME << getFunctionNumber();
|
|
|
|
else
|
|
|
|
O << NVPTXInstPrinter::getRegisterName(MO.getReg());
|
|
|
|
} else {
|
2013-10-11 20:39:36 +08:00
|
|
|
emitVirtualRegister(MO.getReg(), O);
|
2013-08-24 09:17:23 +08:00
|
|
|
}
|
|
|
|
return;
|
|
|
|
|
|
|
|
case MachineOperand::MO_Immediate:
|
|
|
|
if (!Modifier)
|
|
|
|
O << MO.getImm();
|
|
|
|
else if (strstr(Modifier, "vec") == Modifier)
|
|
|
|
printVecModifiedImmediate(MO, Modifier, O);
|
|
|
|
else
|
|
|
|
llvm_unreachable(
|
|
|
|
"Don't know how to handle modifier on immediate operand");
|
|
|
|
return;
|
|
|
|
|
|
|
|
case MachineOperand::MO_FPImmediate:
|
|
|
|
printFPConstant(MO.getFPImm(), O);
|
|
|
|
break;
|
|
|
|
|
|
|
|
case MachineOperand::MO_GlobalAddress:
|
2014-04-01 00:11:57 +08:00
|
|
|
O << *getSymbol(MO.getGlobal());
|
2013-08-24 09:17:23 +08:00
|
|
|
break;
|
|
|
|
|
|
|
|
case MachineOperand::MO_MachineBasicBlock:
|
|
|
|
O << *MO.getMBB()->getSymbol();
|
|
|
|
return;
|
|
|
|
|
|
|
|
default:
|
|
|
|
llvm_unreachable("Operand type not supported.");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void NVPTXAsmPrinter::printMemOperand(const MachineInstr *MI, int opNum,
|
|
|
|
raw_ostream &O, const char *Modifier) {
|
|
|
|
printOperand(MI, opNum, O);
|
|
|
|
|
|
|
|
if (Modifier && !strcmp(Modifier, "add")) {
|
|
|
|
O << ", ";
|
|
|
|
printOperand(MI, opNum + 1, O);
|
|
|
|
} else {
|
|
|
|
if (MI->getOperand(opNum + 1).isImm() &&
|
|
|
|
MI->getOperand(opNum + 1).getImm() == 0)
|
|
|
|
return; // don't print ',0' or '+0'
|
|
|
|
O << "+";
|
|
|
|
printOperand(MI, opNum + 1, O);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2012-05-05 04:18:50 +08:00
|
|
|
/// Emit a comment of the form "\n//<filename>:<line> <source text>\n" as raw
/// text, where the source text is line \p line of \p filename as returned by
/// the cached LineReader.
void NVPTXAsmPrinter::emitSrcInText(StringRef filename, unsigned line) {
  std::stringstream Comment;
  LineReader *SrcReader = this->getReader(filename);

  Comment << "\n//" << filename.str() << ":" << line << " ";
  Comment << SrcReader->readLine(line);
  Comment << "\n";

  this->OutStreamer->EmitRawText(Comment.str());
}
|
|
|
|
|
|
|
|
/// Return the cached LineReader for \p filename. A reader is created when
/// none exists yet, and the cached one is deleted and replaced when it
/// reports a different file name.
LineReader *NVPTXAsmPrinter::getReader(std::string filename) {
  // Create the initial reader on first use.
  if (reader == nullptr)
    reader = new LineReader(filename);

  // Keep the current reader only while it still serves the requested file.
  if (reader->fileName() == filename)
    return reader;

  delete reader;
  reader = new LineReader(filename);
  return reader;
}
|
|
|
|
|
2013-03-30 22:29:21 +08:00
|
|
|
std::string LineReader::readLine(unsigned lineNum) {
|
2012-05-05 04:18:50 +08:00
|
|
|
if (lineNum < theCurLine) {
|
|
|
|
theCurLine = 0;
|
2013-03-30 22:29:21 +08:00
|
|
|
fstr.seekg(0, std::ios::beg);
|
2012-05-05 04:18:50 +08:00
|
|
|
}
|
|
|
|
while (theCurLine < lineNum) {
|
2013-03-30 22:29:21 +08:00
|
|
|
fstr.getline(buff, 500);
|
2012-05-05 04:18:50 +08:00
|
|
|
theCurLine++;
|
|
|
|
}
|
|
|
|
return buff;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Force static initialization.
|
|
|
|
extern "C" void LLVMInitializeNVPTXAsmPrinter() {
|
|
|
|
RegisterAsmPrinter<NVPTXAsmPrinter> X(TheNVPTXTarget32);
|
|
|
|
RegisterAsmPrinter<NVPTXAsmPrinter> Y(TheNVPTXTarget64);
|
|
|
|
}
|