llvm-project/llvm/lib/Target/AMDGPU/R600TargetTransformInfo.h

//===- R600TargetTransformInfo.h - R600 specific TTI --------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
/// \file
/// This file a TargetTransformInfo::Concept conforming object specific to the
/// R600 target machine. It uses the target's detailed information to
/// provide more precise answers to certain TTI queries, while letting the
/// target independent and default TTI implementations handle the rest.
//
//===----------------------------------------------------------------------===//

#ifndef LLVM_LIB_TARGET_AMDGPU_R600TARGETTRANSFORMINFO_H
#define LLVM_LIB_TARGET_AMDGPU_R600TARGETTRANSFORMINFO_H

#include "AMDGPUTargetTransformInfo.h"
#include "llvm/CodeGen/BasicTTIImpl.h"

namespace llvm {

class R600Subtarget;
class AMDGPUTargetLowering;

class R600TTIImpl final : public BasicTTIImplBase<R600TTIImpl> {
  using BaseT = BasicTTIImplBase<R600TTIImpl>;
  using TTI = TargetTransformInfo;

  friend BaseT;

  const R600Subtarget *ST;
  const AMDGPUTargetLowering *TLI;
  AMDGPUTTIImpl CommonTTI;

public:
  explicit R600TTIImpl(const AMDGPUTargetMachine *TM, const Function &F);

  const R600Subtarget *getST() const { return ST; }
  const AMDGPUTargetLowering *getTLI() const { return TLI; }

  void getUnrollingPreferences(Loop *L, ScalarEvolution &SE,
                               TTI::UnrollingPreferences &UP,
                               OptimizationRemarkEmitter *ORE);
  void getPeelingPreferences(Loop *L, ScalarEvolution &SE,
                             TTI::PeelingPreferences &PP);
  unsigned getHardwareNumberOfRegisters(bool Vec) const;
  unsigned getNumberOfRegisters(bool Vec) const;
  TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind Vector) const;
  unsigned getMinVectorRegisterBitWidth() const;
  unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace) const;
  bool isLegalToVectorizeMemChain(unsigned ChainSizeInBytes, Align Alignment,
                                  unsigned AddrSpace) const;
  bool isLegalToVectorizeLoadChain(unsigned ChainSizeInBytes, Align Alignment,
                                   unsigned AddrSpace) const;
  bool isLegalToVectorizeStoreChain(unsigned ChainSizeInBytes, Align Alignment,
                                    unsigned AddrSpace) const;
  unsigned getMaxInterleaveFactor(unsigned VF);
  InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind,
                                 const Instruction *I = nullptr);
  InstructionCost getVectorInstrCost(unsigned Opcode, Type *ValTy,
                                     unsigned Index);
};

} // end namespace llvm

#endif // LLVM_LIB_TARGET_AMDGPU_R600TARGETTRANSFORMINFO_H
[NFC][AMDGPU] Reduce includes dependencies. 1. Splitted out some parts of R600 target to separate modules/headers. 2. Reduced some include lists in headers. 3. Found and fixed issue with override `GCNTargetMachine::getSubtargetImpl()` and `R600TargetMachine::getSubtargetImpl()` had different return value type than base class. 4. Minor forward declarations cleanup. Reviewed By: foad Differential Revision: https://reviews.llvm.org/D108596 2021-08-24 04:50:19 +08:00			`//===- R600TargetTransformInfo.h - R600 specific TTI --------- C++ --===//`
			`//`
			`// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.`
			`// See https://llvm.org/LICENSE.txt for license information.`
			`// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception`
			`//`
			`//===----------------------------------------------------------------------===//`
			`//`
			`/// \file`
			`/// This file a TargetTransformInfo::Concept conforming object specific to the`
			`/// R600 target machine. It uses the target's detailed information to`
			`/// provide more precise answers to certain TTI queries, while letting the`
			`/// target independent and default TTI implementations handle the rest.`
			`//`
			`//===----------------------------------------------------------------------===//`

			`#ifndef LLVM_LIB_TARGET_AMDGPU_R600TARGETTRANSFORMINFO_H`
			`#define LLVM_LIB_TARGET_AMDGPU_R600TARGETTRANSFORMINFO_H`

			`#include "AMDGPUTargetTransformInfo.h"`
			`#include "llvm/CodeGen/BasicTTIImpl.h"`

			`namespace llvm {`

			`class R600Subtarget;`
			`class AMDGPUTargetLowering;`

			`class R600TTIImpl final : public BasicTTIImplBase<R600TTIImpl> {`
			`using BaseT = BasicTTIImplBase<R600TTIImpl>;`
			`using TTI = TargetTransformInfo;`

			`friend BaseT;`

			`const R600Subtarget *ST;`
			`const AMDGPUTargetLowering *TLI;`
			`AMDGPUTTIImpl CommonTTI;`

			`public:`
			`explicit R600TTIImpl(const AMDGPUTargetMachine *TM, const Function &F);`

			`const R600Subtarget *getST() const { return ST; }`
			`const AMDGPUTargetLowering *getTLI() const { return TLI; }`

			`void getUnrollingPreferences(Loop *L, ScalarEvolution &SE,`
			`TTI::UnrollingPreferences &UP,`
			`OptimizationRemarkEmitter *ORE);`
			`void getPeelingPreferences(Loop *L, ScalarEvolution &SE,`
			`TTI::PeelingPreferences &PP);`
			`unsigned getHardwareNumberOfRegisters(bool Vec) const;`
			`unsigned getNumberOfRegisters(bool Vec) const;`
			`TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind Vector) const;`
			`unsigned getMinVectorRegisterBitWidth() const;`
			`unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace) const;`
			`bool isLegalToVectorizeMemChain(unsigned ChainSizeInBytes, Align Alignment,`
			`unsigned AddrSpace) const;`
			`bool isLegalToVectorizeLoadChain(unsigned ChainSizeInBytes, Align Alignment,`
			`unsigned AddrSpace) const;`
			`bool isLegalToVectorizeStoreChain(unsigned ChainSizeInBytes, Align Alignment,`
			`unsigned AddrSpace) const;`
			`unsigned getMaxInterleaveFactor(unsigned VF);`
			`InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind,`
			`const Instruction *I = nullptr);`
			`InstructionCost getVectorInstrCost(unsigned Opcode, Type *ValTy,`
			`unsigned Index);`
			`};`

			`} // end namespace llvm`

			`#endif // LLVM_LIB_TARGET_AMDGPU_R600TARGETTRANSFORMINFO_H`