1 //===-- NVPTXISelLowering.h - NVPTX DAG Lowering Interface ------*- C++ -*-===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This file defines the interfaces that NVPTX uses to lower LLVM code into a 11 // selection DAG. 12 // 13 //===----------------------------------------------------------------------===// 14 15 #ifndef NVPTXISELLOWERING_H 16 #define NVPTXISELLOWERING_H 17 18 #include "NVPTX.h" 19 #include "llvm/CodeGen/SelectionDAG.h" 20 #include "llvm/Target/TargetLowering.h" 21 22 namespace llvm { 23 namespace NVPTXISD { 24 enum NodeType { 25 // Start the numbering from where ISD NodeType finishes. 26 FIRST_NUMBER = ISD::BUILTIN_OP_END, 27 Wrapper, 28 CALL, 29 RET_FLAG, 30 LOAD_PARAM, 31 DeclareParam, 32 DeclareScalarParam, 33 DeclareRetParam, 34 DeclareRet, 35 DeclareScalarRet, 36 PrintCall, 37 PrintCallUni, 38 CallArgBegin, 39 CallArg, 40 LastCallArg, 41 CallArgEnd, 42 CallVoid, 43 CallVal, 44 CallSymbol, 45 Prototype, 46 MoveParam, 47 PseudoUseParam, 48 RETURN, 49 CallSeqBegin, 50 CallSeqEnd, 51 CallPrototype, 52 FUN_SHFL_CLAMP, 53 FUN_SHFR_CLAMP, 54 MUL_WIDE_SIGNED, 55 MUL_WIDE_UNSIGNED, 56 IMAD, 57 Dummy, 58 59 LoadV2 = ISD::FIRST_TARGET_MEMORY_OPCODE, 60 LoadV4, 61 LDGV2, // LDG.v2 62 LDGV4, // LDG.v4 63 LDUV2, // LDU.v2 64 LDUV4, // LDU.v4 65 StoreV2, 66 StoreV4, 67 LoadParam, 68 LoadParamV2, 69 LoadParamV4, 70 StoreParam, 71 StoreParamV2, 72 StoreParamV4, 73 StoreParamS32, // to sext and store a <32bit value, not used currently 74 StoreParamU32, // to zext and store a <32bit value, not used currently 75 StoreRetval, 76 StoreRetvalV2, 77 StoreRetvalV4, 78 79 // Texture intrinsics 80 Tex1DFloatI32, 81 Tex1DFloatFloat, 82 Tex1DFloatFloatLevel, 83 Tex1DFloatFloatGrad, 84 Tex1DI32I32, 85 Tex1DI32Float, 86 Tex1DI32FloatLevel, 87 Tex1DI32FloatGrad, 88 Tex1DArrayFloatI32, 89 Tex1DArrayFloatFloat, 90 Tex1DArrayFloatFloatLevel, 91 Tex1DArrayFloatFloatGrad, 92 Tex1DArrayI32I32, 93 Tex1DArrayI32Float, 94 Tex1DArrayI32FloatLevel, 95 Tex1DArrayI32FloatGrad, 96 Tex2DFloatI32, 97 Tex2DFloatFloat, 98 Tex2DFloatFloatLevel, 99 Tex2DFloatFloatGrad, 100 Tex2DI32I32, 101 Tex2DI32Float, 102 Tex2DI32FloatLevel, 103 Tex2DI32FloatGrad, 104 Tex2DArrayFloatI32, 105 Tex2DArrayFloatFloat, 106 Tex2DArrayFloatFloatLevel, 107 Tex2DArrayFloatFloatGrad, 108 Tex2DArrayI32I32, 109 Tex2DArrayI32Float, 110 Tex2DArrayI32FloatLevel, 111 Tex2DArrayI32FloatGrad, 112 Tex3DFloatI32, 113 Tex3DFloatFloat, 114 Tex3DFloatFloatLevel, 115 Tex3DFloatFloatGrad, 116 Tex3DI32I32, 117 Tex3DI32Float, 118 Tex3DI32FloatLevel, 119 Tex3DI32FloatGrad, 120 121 // Surface intrinsics 122 Suld1DI8Trap, 123 Suld1DI16Trap, 124 Suld1DI32Trap, 125 Suld1DV2I8Trap, 126 Suld1DV2I16Trap, 127 Suld1DV2I32Trap, 128 Suld1DV4I8Trap, 129 Suld1DV4I16Trap, 130 Suld1DV4I32Trap, 131 132 Suld1DArrayI8Trap, 133 Suld1DArrayI16Trap, 134 Suld1DArrayI32Trap, 135 Suld1DArrayV2I8Trap, 136 Suld1DArrayV2I16Trap, 137 Suld1DArrayV2I32Trap, 138 Suld1DArrayV4I8Trap, 139 Suld1DArrayV4I16Trap, 140 Suld1DArrayV4I32Trap, 141 142 Suld2DI8Trap, 143 Suld2DI16Trap, 144 Suld2DI32Trap, 145 Suld2DV2I8Trap, 146 Suld2DV2I16Trap, 147 Suld2DV2I32Trap, 148 Suld2DV4I8Trap, 149 Suld2DV4I16Trap, 150 Suld2DV4I32Trap, 151 152 Suld2DArrayI8Trap, 153 Suld2DArrayI16Trap, 154 Suld2DArrayI32Trap, 155 Suld2DArrayV2I8Trap, 156 Suld2DArrayV2I16Trap, 157 Suld2DArrayV2I32Trap, 158 Suld2DArrayV4I8Trap, 159 Suld2DArrayV4I16Trap, 160 Suld2DArrayV4I32Trap, 161 162 Suld3DI8Trap, 163 Suld3DI16Trap, 164 Suld3DI32Trap, 165 Suld3DV2I8Trap, 166 Suld3DV2I16Trap, 167 Suld3DV2I32Trap, 168 Suld3DV4I8Trap, 169 Suld3DV4I16Trap, 170 Suld3DV4I32Trap 171 }; 172 } 173 174 class NVPTXSubtarget; 175 176 //===--------------------------------------------------------------------===// 177 // TargetLowering Implementation 178 //===--------------------------------------------------------------------===// 179 class NVPTXTargetLowering : public TargetLowering { 180 public: 181 explicit NVPTXTargetLowering(NVPTXTargetMachine &TM); 182 SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override; 183 184 SDValue LowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const; 185 SDValue LowerGlobalAddress(const GlobalValue *GV, int64_t Offset, 186 SelectionDAG &DAG) const; 187 188 const char *getTargetNodeName(unsigned Opcode) const override; 189 190 bool isTypeSupportedInIntrinsic(MVT VT) const; 191 192 bool getTgtMemIntrinsic(IntrinsicInfo &Info, const CallInst &I, 193 unsigned Intrinsic) const override; 194 195 /// isLegalAddressingMode - Return true if the addressing mode represented 196 /// by AM is legal for this target, for a load/store of the specified type 197 /// Used to guide target specific optimizations, like loop strength 198 /// reduction (LoopStrengthReduce.cpp) and memory optimization for 199 /// address mode (CodeGenPrepare.cpp) 200 bool isLegalAddressingMode(const AddrMode &AM, Type *Ty) const override; 201 202 /// getFunctionAlignment - Return the Log2 alignment of this function. 203 unsigned getFunctionAlignment(const Function *F) const; 204 getSetCCResultType(LLVMContext & Ctx,EVT VT)205 EVT getSetCCResultType(LLVMContext &Ctx, EVT VT) const override { 206 if (VT.isVector()) 207 return EVT::getVectorVT(Ctx, MVT::i1, VT.getVectorNumElements()); 208 return MVT::i1; 209 } 210 211 ConstraintType 212 getConstraintType(const std::string &Constraint) const override; 213 std::pair<unsigned, const TargetRegisterClass *> 214 getRegForInlineAsmConstraint(const std::string &Constraint, 215 MVT VT) const override; 216 217 SDValue LowerFormalArguments( 218 SDValue Chain, CallingConv::ID CallConv, bool isVarArg, 219 const SmallVectorImpl<ISD::InputArg> &Ins, SDLoc dl, SelectionDAG &DAG, 220 SmallVectorImpl<SDValue> &InVals) const override; 221 222 SDValue LowerCall(CallLoweringInfo &CLI, 223 SmallVectorImpl<SDValue> &InVals) const override; 224 225 std::string getPrototype(Type *, const ArgListTy &, 226 const SmallVectorImpl<ISD::OutputArg> &, 227 unsigned retAlignment, 228 const ImmutableCallSite *CS) const; 229 230 SDValue 231 LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg, 232 const SmallVectorImpl<ISD::OutputArg> &Outs, 233 const SmallVectorImpl<SDValue> &OutVals, SDLoc dl, 234 SelectionDAG &DAG) const override; 235 236 void LowerAsmOperandForConstraint(SDValue Op, std::string &Constraint, 237 std::vector<SDValue> &Ops, 238 SelectionDAG &DAG) const override; 239 240 NVPTXTargetMachine *nvTM; 241 242 // PTX always uses 32-bit shift amounts getScalarShiftAmountTy(EVT LHSTy)243 MVT getScalarShiftAmountTy(EVT LHSTy) const override { return MVT::i32; } 244 245 TargetLoweringBase::LegalizeTypeAction 246 getPreferredVectorAction(EVT VT) const override; 247 248 private: 249 const NVPTXSubtarget &nvptxSubtarget; // cache the subtarget here 250 251 SDValue getExtSymb(SelectionDAG &DAG, const char *name, int idx, 252 EVT = MVT::i32) const; 253 SDValue getParamSymbol(SelectionDAG &DAG, int idx, EVT) const; 254 SDValue getParamHelpSymbol(SelectionDAG &DAG, int idx); 255 256 SDValue LowerCONCAT_VECTORS(SDValue Op, SelectionDAG &DAG) const; 257 258 SDValue LowerLOAD(SDValue Op, SelectionDAG &DAG) const; 259 SDValue LowerLOADi1(SDValue Op, SelectionDAG &DAG) const; 260 261 SDValue LowerSTORE(SDValue Op, SelectionDAG &DAG) const; 262 SDValue LowerSTOREi1(SDValue Op, SelectionDAG &DAG) const; 263 SDValue LowerSTOREVector(SDValue Op, SelectionDAG &DAG) const; 264 265 SDValue LowerShiftRightParts(SDValue Op, SelectionDAG &DAG) const; 266 SDValue LowerShiftLeftParts(SDValue Op, SelectionDAG &DAG) const; 267 268 void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue> &Results, 269 SelectionDAG &DAG) const override; 270 SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override; 271 272 unsigned getArgumentAlignment(SDValue Callee, const ImmutableCallSite *CS, 273 Type *Ty, unsigned Idx) const; 274 }; 275 } // namespace llvm 276 277 #endif // NVPTXISELLOWERING_H 278