1 //===-- AMDGPUTargetTransformInfo.h - AMDGPU specific TTI -------*- C++ -*-===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 /// \file 10 /// This file a TargetTransformInfo::Concept conforming object specific to the 11 /// AMDGPU target machine. It uses the target's detailed information to 12 /// provide more precise answers to certain TTI queries, while letting the 13 /// target independent and default TTI implementations handle the rest. 14 /// 15 //===----------------------------------------------------------------------===// 16 17 #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETTRANSFORMINFO_H 18 #define LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETTRANSFORMINFO_H 19 20 #include "AMDGPU.h" 21 #include "AMDGPUTargetMachine.h" 22 #include "llvm/Analysis/TargetTransformInfo.h" 23 #include "llvm/CodeGen/BasicTTIImpl.h" 24 25 namespace llvm { 26 class AMDGPUTargetLowering; 27 28 class AMDGPUTTIImpl final : public BasicTTIImplBase<AMDGPUTTIImpl> { 29 typedef BasicTTIImplBase<AMDGPUTTIImpl> BaseT; 30 typedef TargetTransformInfo TTI; 31 friend BaseT; 32 33 const AMDGPUSubtarget *ST; 34 const AMDGPUTargetLowering *TLI; 35 getST()36 const AMDGPUSubtarget *getST() const { return ST; } getTLI()37 const AMDGPUTargetLowering *getTLI() const { return TLI; } 38 39 getFullRateInstrCost()40 static inline int getFullRateInstrCost() { 41 return TargetTransformInfo::TCC_Basic; 42 } 43 getHalfRateInstrCost()44 static inline int getHalfRateInstrCost() { 45 return 2 * TargetTransformInfo::TCC_Basic; 46 } 47 48 // TODO: The size is usually 8 bytes, but takes 4x as many cycles. Maybe 49 // should be 2 or 4. getQuarterRateInstrCost()50 static inline int getQuarterRateInstrCost() { 51 return 3 * TargetTransformInfo::TCC_Basic; 52 } 53 54 // On some parts, normal fp64 operations are half rate, and others 55 // quarter. This also applies to some integer operations. get64BitInstrCost()56 inline int get64BitInstrCost() const { 57 return ST->hasHalfRate64Ops() ? 58 getHalfRateInstrCost() : getQuarterRateInstrCost(); 59 } 60 61 public: AMDGPUTTIImpl(const AMDGPUTargetMachine * TM,const Function & F)62 explicit AMDGPUTTIImpl(const AMDGPUTargetMachine *TM, const Function &F) 63 : BaseT(TM, F.getParent()->getDataLayout()), 64 ST(TM->getSubtargetImpl(F)), 65 TLI(ST->getTargetLowering()) {} 66 67 // Provide value semantics. MSVC requires that we spell all of these out. AMDGPUTTIImpl(const AMDGPUTTIImpl & Arg)68 AMDGPUTTIImpl(const AMDGPUTTIImpl &Arg) 69 : BaseT(static_cast<const BaseT &>(Arg)), ST(Arg.ST), TLI(Arg.TLI) {} AMDGPUTTIImpl(AMDGPUTTIImpl && Arg)70 AMDGPUTTIImpl(AMDGPUTTIImpl &&Arg) 71 : BaseT(std::move(static_cast<BaseT &>(Arg))), ST(std::move(Arg.ST)), 72 TLI(std::move(Arg.TLI)) {} 73 hasBranchDivergence()74 bool hasBranchDivergence() { return true; } 75 76 void getUnrollingPreferences(Loop *L, TTI::UnrollingPreferences &UP); 77 getPopcntSupport(unsigned TyWidth)78 TTI::PopcntSupportKind getPopcntSupport(unsigned TyWidth) { 79 assert(isPowerOf2_32(TyWidth) && "Ty width must be power of 2"); 80 return TTI::PSK_FastHardware; 81 } 82 83 unsigned getNumberOfRegisters(bool Vector); 84 unsigned getRegisterBitWidth(bool Vector); 85 unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace); 86 unsigned getMaxInterleaveFactor(unsigned VF); 87 88 int getArithmeticInstrCost( 89 unsigned Opcode, Type *Ty, 90 TTI::OperandValueKind Opd1Info = TTI::OK_AnyValue, 91 TTI::OperandValueKind Opd2Info = TTI::OK_AnyValue, 92 TTI::OperandValueProperties Opd1PropInfo = TTI::OP_None, 93 TTI::OperandValueProperties Opd2PropInfo = TTI::OP_None); 94 95 unsigned getCFInstrCost(unsigned Opcode); 96 97 int getVectorInstrCost(unsigned Opcode, Type *ValTy, unsigned Index); 98 bool isSourceOfDivergence(const Value *V) const; 99 getVectorSplitCost()100 unsigned getVectorSplitCost() { return 0; } 101 }; 102 103 } // end namespace llvm 104 105 #endif 106