llvm-project/llvm/lib/Target/NVPTX/NVPTXISelDAGToDAG.h

//===-- NVPTXISelDAGToDAG.h - A dag to dag inst selector for NVPTX --------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file defines an instruction selector for the NVPTX target.
//
//===----------------------------------------------------------------------===//

#define DEBUG_TYPE "nvptx-isel"

#include "NVPTX.h"
#include "NVPTXISelLowering.h"
#include "NVPTXRegisterInfo.h"
#include "NVPTXTargetMachine.h"
#include "llvm/CodeGen/SelectionDAGISel.h"
#include "llvm/IR/Intrinsics.h"
#include "llvm/Support/Compiler.h"
using namespace llvm;

// NOTE(review): this is an anonymous namespace inside a header, so every
// translation unit that includes this file gets its own distinct copy of the
// class. Presumably the header is only meant to be included by the matching
// .cpp file -- confirm before including it anywhere else.
namespace {

// DAG-to-DAG instruction selector for the NVPTX target. It derives from
// SelectionDAGISel and combines the selector pieces pulled in from
// NVPTXGenDAGISel.inc with the hand-written Select* / SelectADDR* helpers
// declared below. Only declarations are visible here; the constructor and
// the helper bodies are defined elsewhere.
class LLVM_LIBRARY_VISIBILITY NVPTXDAGToDAGISel : public SelectionDAGISel {

  // If true, generate corresponding FPCONTRACT. This is
  // language dependent (i.e. CUDA and OpenCL work differently).
  // NOTE(review): judging by the names only, these look like per-type
  // (f32 / f64) and "aggressive" (AGG) variants of the FMA contraction
  // switch -- confirm against the constructor that initializes them.
  bool doFMADF32;
  bool doFMAF64;
  bool doFMAF32;
  bool doFMAF64AGG;
  bool doFMAF32AGG;
  bool allowFMA;

  // Selects the precision of f32 division:
  // 0: use div.approx
  // 1: use div.full
  // 2: For sm_20 and later, ieee-compliant div.rnd.f32 can be generated;
  //    Otherwise, use div.full
  int do_DIVF32_PREC;

  // If true, generate sqrt.rn, else generate sqrt.approx. If FTZ
  // is true, then generate the corresponding FTZ version.
  bool do_SQRTF32_PREC;

  // If true, add .ftz to f32 instructions.
  // This is only meaningful for sm_20 and later, as the default
  // is not ftz.
  // For sm earlier than sm_20, f32 denorms are always ftz by the
  // hardware.
  // We always add the .ftz modifier regardless of the sm value
  // when UseF32FTZ is true.
  bool UseF32FTZ;

  // If true, generate mul.wide from sext and mul
  bool doMulWide;

public:
  // Constructs the selector for the given target machine and optimization
  // level. The definition is not in this header.
  explicit NVPTXDAGToDAGISel(NVPTXTargetMachine &tm,
                             CodeGenOpt::Level OptLevel);

  // Pass Name: returns the fixed, human-readable name of this pass.
  virtual const char *getPassName() const {
    return "NVPTX DAG->DAG Pattern Instruction Selection";
  }

  // Subtarget description used by the selector. Being a reference member it
  // must be bound in the constructor's initializer list; it is declared
  // after the flags above, so it is initialized after them.
  const NVPTXSubtarget &Subtarget;

  // Handles a memory operand of an inline-asm statement; results are written
  // to OutOps.
  // NOTE(review): presumably overrides the SelectionDAGISel hook of the same
  // name -- the base declaration and the return-value convention are not
  // visible here; confirm.
  virtual bool SelectInlineAsmMemoryOperand(
      const SDValue &Op, char ConstraintCode, std::vector<SDValue> &OutOps);
private:
// Include the pieces autogenerated from the target description.
// The include sits inside the class body on purpose: whatever the generated
// file declares becomes part of this class's private section.
#include "NVPTXGenDAGISel.inc"

  // Hand-written selection routines, one per node category. Each takes the
  // node to select and returns an SDNode pointer.
  // NOTE(review): presumably a null result means "not handled here" -- confirm
  // against the definitions in the .cpp file.
  SDNode *Select(SDNode *N);
  SDNode *SelectLoad(SDNode *N);
  SDNode *SelectLoadVector(SDNode *N);
  SDNode *SelectLDGLDUVector(SDNode *N);
  SDNode *SelectStore(SDNode *N);
  SDNode *SelectStoreVector(SDNode *N);
  SDNode *SelectLoadParam(SDNode *N);
  SDNode *SelectStoreRetval(SDNode *N);
  SDNode *SelectStoreParam(SDNode *N);
        
  // Convenience helper: wraps Imm as an i32 target constant in the DAG
  // currently being selected (CurDAG).
  inline SDValue getI32Imm(unsigned Imm) {
    return CurDAG->getTargetConstant(Imm, MVT::i32);
  }

  // Match direct address complex pattern.
  bool SelectDirectAddr(SDValue N, SDValue &Address);

  // Address matchers for the "ri" form. Base and Offset are passed by
  // non-const reference.
  // NOTE(review): presumably they are out-parameters filled in on a
  // successful match, and the _imp variant (which takes the extra MVT) is the
  // shared implementation behind the plain and the 64 wrappers -- confirm.
  bool SelectADDRri_imp(SDNode *OpNode, SDValue Addr, SDValue &Base,
                        SDValue &Offset, MVT mvt);
  bool SelectADDRri(SDNode *OpNode, SDValue Addr, SDValue &Base,
                    SDValue &Offset);
  bool SelectADDRri64(SDNode *OpNode, SDValue Addr, SDValue &Base,
                      SDValue &Offset);

  // Address matchers for the "si" form; same signature layout as the "ri"
  // group above.
  bool SelectADDRsi_imp(SDNode *OpNode, SDValue Addr, SDValue &Base,
                        SDValue &Offset, MVT mvt);
  bool SelectADDRsi(SDNode *OpNode, SDValue Addr, SDValue &Base,
                    SDValue &Offset);
  bool SelectADDRsi64(SDNode *OpNode, SDValue Addr, SDValue &Base,
                      SDValue &Offset);

  // Const query on node N against the address-space number spN.
  // NOTE(review): presumably returns true when N's memory operand lives in
  // address space spN -- confirm in the definition.
  bool ChkMemSDNodeAddressSpace(SDNode *N, unsigned int spN) const;

  // NOTE(review): judging by the name, matches N when it is undef or an
  // immediate and reports the result through Retval -- confirm in the
  // definition.
  bool UndefOrImm(SDValue Op, SDValue N, SDValue &Retval);

};
}
This patch adds a new NVPTX back-end to LLVM which supports code generation for NVIDIA PTX 3.0. This back-end will (eventually) replace the current PTX back-end, while maintaining compatibility with it. The new target machines are: nvptx (old ptx32) => 32-bit PTX nvptx64 (old ptx64) => 64-bit PTX The sources are based on the internal NVIDIA NVPTX back-end, and contain more functionality than the current PTX back-end currently provides. NV_CONTRIB llvm-svn: 156196 2012-05-05 04:18:50 +08:00			`//===-- NVPTXISelDAGToDAG.h - A dag to dag inst selector for NVPTX --------===//`
			`//`
			`// The LLVM Compiler Infrastructure`
			`//`
			`// This file is distributed under the University of Illinois Open Source`
			`// License. See LICENSE.TXT for details.`
			`//`
			`//===----------------------------------------------------------------------===//`
			`//`
			`// This file defines an instruction selector for the NVPTX target.`
			`//`
			`//===----------------------------------------------------------------------===//`

			`#define DEBUG_TYPE "nvptx-isel"`

			`#include "NVPTX.h"`
			`#include "NVPTXISelLowering.h"`
			`#include "NVPTXRegisterInfo.h"`
			`#include "NVPTXTargetMachine.h"`
			`#include "llvm/CodeGen/SelectionDAGISel.h"`
Move all of the header files which are involved in modelling the LLVM IR into their new header subdirectory: include/llvm/IR. This matches the directory structure of lib, and begins to correct a long standing point of file layout clutter in LLVM. There are still more header files to move here, but I wanted to handle them in separate commits to make tracking what files make sense at each layer easier. The only really questionable files here are the target intrinsic tablegen files. But that's a battle I'd rather not fight today. I've updated both CMake and Makefile build systems (I think, and my tests think, but I may have missed something). I've also re-sorted the includes throughout the project. I'll be committing updates to Clang, DragonEgg, and Polly momentarily. llvm-svn: 171366 2013-01-02 19:36:10 +08:00			`#include "llvm/IR/Intrinsics.h"`
Use the new script to sort the includes of every file under lib. Sooooo many of these had incorrect or strange main module includes. I have manually inspected all of these, and fixed the main module include to be the nearest plausible thing I could find. If you own or care about any of these source files, I encourage you to take some time and check that these edits were sensible. I can't have broken anything (I strictly added headers, and reordered them, never removed), but they may not be the headers you'd really like to identify as containing the API being implemented. Many forward declarations and missing includes were added to a header files to allow them to parse cleanly when included first. The main module rule does in fact have its merits. =] llvm-svn: 169131 2012-12-04 00:50:05 +08:00			`#include "llvm/Support/Compiler.h"`
This patch adds a new NVPTX back-end to LLVM which supports code generation for NVIDIA PTX 3.0. This back-end will (eventually) replace the current PTX back-end, while maintaining compatibility with it. The new target machines are: nvptx (old ptx32) => 32-bit PTX nvptx64 (old ptx64) => 64-bit PTX The sources are based on the internal NVIDIA NVPTX back-end, and contain more functionality than the current PTX back-end currently provides. NV_CONTRIB llvm-svn: 156196 2012-05-05 04:18:50 +08:00			`using namespace llvm;`

			`namespace {`

			`class LLVM_LIBRARY_VISIBILITY NVPTXDAGToDAGISel : public SelectionDAGISel {`

			`// If true, generate corresponding FPCONTRACT. This is`
			`// language dependent (i.e. CUDA and OpenCL works differently).`
			`bool doFMADF32;`
			`bool doFMAF64;`
			`bool doFMAF32;`
			`bool doFMAF64AGG;`
			`bool doFMAF32AGG;`
			`bool allowFMA;`

			`// 0: use div.approx`
			`// 1: use div.full`
			`// 2: For sm_20 and later, ieee-compliant div.rnd.f32 can be generated;`
			`// Otherwise, use div.full`
			`int do_DIVF32_PREC;`

[NVPTX] Add @llvm.nvvm.sqrt.f() intrinsic llvm-svn: 182394 2013-05-22 00:51:30 +08:00			`// If true, generate sqrt.rn, else generate sqrt.approx. If FTZ`
			`// is true, then generate the corresponding FTZ version.`
			`bool do_SQRTF32_PREC;`

This patch adds a new NVPTX back-end to LLVM which supports code generation for NVIDIA PTX 3.0. This back-end will (eventually) replace the current PTX back-end, while maintaining compatibility with it. The new target machines are: nvptx (old ptx32) => 32-bit PTX nvptx64 (old ptx64) => 64-bit PTX The sources are based on the internal NVIDIA NVPTX back-end, and contain more functionality than the current PTX back-end currently provides. NV_CONTRIB llvm-svn: 156196 2012-05-05 04:18:50 +08:00			`// If true, add .ftz to f32 instructions.`
			`// This is only meaningful for sm_20 and later, as the default`
			`// is not ftz.`
			`// For sm earlier than sm_20, f32 denorms are always ftz by the`
			`// hardware.`
			`// We always add the .ftz modifier regardless of the sm value`
			`// when Use32FTZ is true.`
			`bool UseF32FTZ;`

			`// If true, generate mul.wide from sext and mul`
			`bool doMulWide;`

			`public:`
			`explicit NVPTXDAGToDAGISel(NVPTXTargetMachine &tm,`
			`CodeGenOpt::Level OptLevel);`

			`// Pass Name`
			`virtual const char *getPassName() const {`
			`return "NVPTX DAG->DAG Pattern Instruction Selection";`
			`}`

			`const NVPTXSubtarget &Subtarget;`

[NVPTX] Run clang-format on all NVPTX sources. Hopefully this resolves any outstanding style issues and gives us an automated way of ensuring we conform to the style guidelines. llvm-svn: 178415 2013-03-30 22:29:21 +08:00			`virtual bool SelectInlineAsmMemoryOperand(`
			`const SDValue &Op, char ConstraintCode, std::vector<SDValue> &OutOps);`
This patch adds a new NVPTX back-end to LLVM which supports code generation for NVIDIA PTX 3.0. This back-end will (eventually) replace the current PTX back-end, while maintaining compatibility with it. The new target machines are: nvptx (old ptx32) => 32-bit PTX nvptx64 (old ptx64) => 64-bit PTX The sources are based on the internal NVIDIA NVPTX back-end, and contain more functionality than the current PTX back-end currently provides. NV_CONTRIB llvm-svn: 156196 2012-05-05 04:18:50 +08:00			`private:`
[NVPTX] Run clang-format on all NVPTX sources. Hopefully this resolves any outstanding style issues and gives us an automated way of ensuring we conform to the style guidelines. llvm-svn: 178415 2013-03-30 22:29:21 +08:00			`// Include the pieces autogenerated from the target description.`
This patch adds a new NVPTX back-end to LLVM which supports code generation for NVIDIA PTX 3.0. This back-end will (eventually) replace the current PTX back-end, while maintaining compatibility with it. The new target machines are: nvptx (old ptx32) => 32-bit PTX nvptx64 (old ptx64) => 64-bit PTX The sources are based on the internal NVIDIA NVPTX back-end, and contain more functionality than the current PTX back-end currently provides. NV_CONTRIB llvm-svn: 156196 2012-05-05 04:18:50 +08:00			`#include "NVPTXGenDAGISel.inc"`

			`SDNode *Select(SDNode *N);`
[NVPTX] Disable vector registers Vectors were being manually scalarized by the backend. Instead, let the target-independent code do all of the work. The manual scalarization was from a time before good target-independent support for scalarization in LLVM. However, this forces us to specially-handle vector loads and stores, which we can turn into PTX instructions that produce/consume multiple operands. llvm-svn: 174968 2013-02-12 22:18:49 +08:00			`SDNode *SelectLoad(SDNode *N);`
			`SDNode *SelectLoadVector(SDNode *N);`
			`SDNode *SelectLDGLDUVector(SDNode *N);`
			`SDNode *SelectStore(SDNode *N);`
			`SDNode *SelectStoreVector(SDNode *N);`
[NVPTX] Remove i8 register class. PTX support for i8 (.b8, .u8, .s8) is rather poor and we're better off just ignoring it and letting LLVM expand all i8 ops out to i16. llvm-svn: 185174 2013-06-29 01:57:59 +08:00			`SDNode *SelectLoadParam(SDNode *N);`
			`SDNode *SelectStoreRetval(SDNode *N);`
			`SDNode *SelectStoreParam(SDNode *N);`

This patch adds a new NVPTX back-end to LLVM which supports code generation for NVIDIA PTX 3.0. This back-end will (eventually) replace the current PTX back-end, while maintaining compatibility with it. The new target machines are: nvptx (old ptx32) => 32-bit PTX nvptx64 (old ptx64) => 64-bit PTX The sources are based on the internal NVIDIA NVPTX back-end, and contain more functionality than the current PTX back-end currently provides. NV_CONTRIB llvm-svn: 156196 2012-05-05 04:18:50 +08:00			`inline SDValue getI32Imm(unsigned Imm) {`
			`return CurDAG->getTargetConstant(Imm, MVT::i32);`
			`}`

			`// Match direct address complex pattern.`
			`bool SelectDirectAddr(SDValue N, SDValue &Address);`

			`bool SelectADDRri_imp(SDNode *OpNode, SDValue Addr, SDValue &Base,`
			`SDValue &Offset, MVT mvt);`
			`bool SelectADDRri(SDNode *OpNode, SDValue Addr, SDValue &Base,`
			`SDValue &Offset);`
			`bool SelectADDRri64(SDNode *OpNode, SDValue Addr, SDValue &Base,`
			`SDValue &Offset);`

			`bool SelectADDRsi_imp(SDNode *OpNode, SDValue Addr, SDValue &Base,`
			`SDValue &Offset, MVT mvt);`
			`bool SelectADDRsi(SDNode *OpNode, SDValue Addr, SDValue &Base,`
			`SDValue &Offset);`
			`bool SelectADDRsi64(SDNode *OpNode, SDValue Addr, SDValue &Base,`
			`SDValue &Offset);`

			`bool ChkMemSDNodeAddressSpace(SDNode *N, unsigned int spN) const;`

			`bool UndefOrImm(SDValue Op, SDValue N, SDValue &Retval);`

			`};`
			`}`