forked from OSchip/llvm-project
70 lines
2.8 KiB
C
70 lines
2.8 KiB
C
|
//===- R600TargetTransformInfo.h - R600 specific TTI --------*- C++ -*-===//
|
||
|
//
|
||
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||
|
// See https://llvm.org/LICENSE.txt for license information.
|
||
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||
|
//
|
||
|
//===----------------------------------------------------------------------===//
|
||
|
//
|
||
|
/// \file
|
||
|
/// This file a TargetTransformInfo::Concept conforming object specific to the
|
||
|
/// R600 target machine. It uses the target's detailed information to
|
||
|
/// provide more precise answers to certain TTI queries, while letting the
|
||
|
/// target independent and default TTI implementations handle the rest.
|
||
|
//
|
||
|
//===----------------------------------------------------------------------===//
|
||
|
|
||
|
#ifndef LLVM_LIB_TARGET_AMDGPU_R600TARGETTRANSFORMINFO_H
|
||
|
#define LLVM_LIB_TARGET_AMDGPU_R600TARGETTRANSFORMINFO_H
|
||
|
|
||
|
#include "AMDGPUTargetTransformInfo.h"
|
||
|
#include "llvm/CodeGen/BasicTTIImpl.h"
|
||
|
|
||
|
namespace llvm {
|
||
|
|
||
|
class R600Subtarget;
|
||
|
class AMDGPUTargetLowering;
|
||
|
|
||
|
class R600TTIImpl final : public BasicTTIImplBase<R600TTIImpl> {
|
||
|
using BaseT = BasicTTIImplBase<R600TTIImpl>;
|
||
|
using TTI = TargetTransformInfo;
|
||
|
|
||
|
friend BaseT;
|
||
|
|
||
|
const R600Subtarget *ST;
|
||
|
const AMDGPUTargetLowering *TLI;
|
||
|
AMDGPUTTIImpl CommonTTI;
|
||
|
|
||
|
public:
|
||
|
explicit R600TTIImpl(const AMDGPUTargetMachine *TM, const Function &F);
|
||
|
|
||
|
const R600Subtarget *getST() const { return ST; }
|
||
|
const AMDGPUTargetLowering *getTLI() const { return TLI; }
|
||
|
|
||
|
void getUnrollingPreferences(Loop *L, ScalarEvolution &SE,
|
||
|
TTI::UnrollingPreferences &UP,
|
||
|
OptimizationRemarkEmitter *ORE);
|
||
|
void getPeelingPreferences(Loop *L, ScalarEvolution &SE,
|
||
|
TTI::PeelingPreferences &PP);
|
||
|
unsigned getHardwareNumberOfRegisters(bool Vec) const;
|
||
|
unsigned getNumberOfRegisters(bool Vec) const;
|
||
|
TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind Vector) const;
|
||
|
unsigned getMinVectorRegisterBitWidth() const;
|
||
|
unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace) const;
|
||
|
bool isLegalToVectorizeMemChain(unsigned ChainSizeInBytes, Align Alignment,
|
||
|
unsigned AddrSpace) const;
|
||
|
bool isLegalToVectorizeLoadChain(unsigned ChainSizeInBytes, Align Alignment,
|
||
|
unsigned AddrSpace) const;
|
||
|
bool isLegalToVectorizeStoreChain(unsigned ChainSizeInBytes, Align Alignment,
|
||
|
unsigned AddrSpace) const;
|
||
|
unsigned getMaxInterleaveFactor(unsigned VF);
|
||
|
InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind,
|
||
|
const Instruction *I = nullptr);
|
||
|
InstructionCost getVectorInstrCost(unsigned Opcode, Type *ValTy,
|
||
|
unsigned Index);
|
||
|
};
|
||
|
|
||
|
} // end namespace llvm
|
||
|
|
||
|
#endif // LLVM_LIB_TARGET_AMDGPU_R600TARGETTRANSFORMINFO_H
|