1//===-- AMDGPUTargetTransformInfo.h - AMDGPU specific TTI -------*- C++ -*-===// 2// 3// The LLVM Compiler Infrastructure 4// 5// This file is distributed under the University of Illinois Open Source 6// License. See LICENSE.TXT for details. 7// 8//===----------------------------------------------------------------------===// 9/// \file 10/// This file a TargetTransformInfo::Concept conforming object specific to the 11/// AMDGPU target machine. It uses the target's detailed information to 12/// provide more precise answers to certain TTI queries, while letting the 13/// target independent and default TTI implementations handle the rest. 14/// 15//===----------------------------------------------------------------------===// 16 17#ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETTRANSFORMINFO_H 18#define LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETTRANSFORMINFO_H 19 20#include "AMDGPU.h" 21#include "AMDGPUTargetMachine.h" 22#include "llvm/Analysis/TargetTransformInfo.h" 23#include "llvm/CodeGen/BasicTTIImpl.h" 24 25namespace llvm { 26class AMDGPUTargetLowering; 27 28class AMDGPUTTIImpl final : public BasicTTIImplBase<AMDGPUTTIImpl> { 29 typedef BasicTTIImplBase<AMDGPUTTIImpl> BaseT; 30 typedef TargetTransformInfo TTI; 31 friend BaseT; 32 33 const AMDGPUSubtarget *ST; 34 const AMDGPUTargetLowering *TLI; 35 36 const AMDGPUSubtarget *getST() const { return ST; } 37 const AMDGPUTargetLowering *getTLI() const { return TLI; } 38 39 40 static inline int getFullRateInstrCost() { 41 return TargetTransformInfo::TCC_Basic; 42 } 43 44 static inline int getHalfRateInstrCost() { 45 return 2 * TargetTransformInfo::TCC_Basic; 46 } 47 48 // TODO: The size is usually 8 bytes, but takes 4x as many cycles. Maybe 49 // should be 2 or 4. 50 static inline int getQuarterRateInstrCost() { 51 return 3 * TargetTransformInfo::TCC_Basic; 52 } 53 54 // On some parts, normal fp64 operations are half rate, and others 55 // quarter. This also applies to some integer operations. 56 inline int get64BitInstrCost() const { 57 return ST->hasHalfRate64Ops() ? 58 getHalfRateInstrCost() : getQuarterRateInstrCost(); 59 } 60 61public: 62 explicit AMDGPUTTIImpl(const AMDGPUTargetMachine *TM, const Function &F) 63 : BaseT(TM, F.getParent()->getDataLayout()), 64 ST(TM->getSubtargetImpl(F)), 65 TLI(ST->getTargetLowering()) {} 66 67 // Provide value semantics. MSVC requires that we spell all of these out. 68 AMDGPUTTIImpl(const AMDGPUTTIImpl &Arg) 69 : BaseT(static_cast<const BaseT &>(Arg)), ST(Arg.ST), TLI(Arg.TLI) {} 70 AMDGPUTTIImpl(AMDGPUTTIImpl &&Arg) 71 : BaseT(std::move(static_cast<BaseT &>(Arg))), ST(std::move(Arg.ST)), 72 TLI(std::move(Arg.TLI)) {} 73 74 bool hasBranchDivergence() { return true; } 75 76 void getUnrollingPreferences(Loop *L, TTI::UnrollingPreferences &UP); 77 78 TTI::PopcntSupportKind getPopcntSupport(unsigned TyWidth) { 79 assert(isPowerOf2_32(TyWidth) && "Ty width must be power of 2"); 80 return TTI::PSK_FastHardware; 81 } 82 83 unsigned getNumberOfRegisters(bool Vector); 84 unsigned getRegisterBitWidth(bool Vector); 85 unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace); 86 unsigned getMaxInterleaveFactor(unsigned VF); 87 88 int getArithmeticInstrCost( 89 unsigned Opcode, Type *Ty, 90 TTI::OperandValueKind Opd1Info = TTI::OK_AnyValue, 91 TTI::OperandValueKind Opd2Info = TTI::OK_AnyValue, 92 TTI::OperandValueProperties Opd1PropInfo = TTI::OP_None, 93 TTI::OperandValueProperties Opd2PropInfo = TTI::OP_None); 94 95 unsigned getCFInstrCost(unsigned Opcode); 96 97 int getVectorInstrCost(unsigned Opcode, Type *ValTy, unsigned Index); 98 bool isSourceOfDivergence(const Value *V) const; 99 100 unsigned getVectorSplitCost() { return 0; } 101}; 102 103} // end namespace llvm 104 105#endif 106