• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 //===- NVPTXUtilities.cpp - Utility Functions -----------------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file contains miscellaneous utility functions
11 //===----------------------------------------------------------------------===//
12 
13 #include "NVPTXUtilities.h"
14 #include "NVPTX.h"
15 #include "llvm/IR/Constants.h"
16 #include "llvm/IR/Function.h"
17 #include "llvm/IR/GlobalVariable.h"
18 #include "llvm/IR/InstIterator.h"
19 #include "llvm/IR/Module.h"
20 #include "llvm/IR/Operator.h"
21 #include "llvm/Support/ManagedStatic.h"
22 #include "llvm/Support/MutexGuard.h"
23 #include <algorithm>
24 #include <cstring>
25 #include <map>
26 #include <string>
27 #include <vector>
28 
29 using namespace llvm;
30 
31 typedef std::map<std::string, std::vector<unsigned> > key_val_pair_t;
32 typedef std::map<const GlobalValue *, key_val_pair_t> global_val_annot_t;
33 typedef std::map<const Module *, global_val_annot_t> per_module_annot_t;
34 
35 ManagedStatic<per_module_annot_t> annotationCache;
36 static sys::Mutex Lock;
37 
clearAnnotationCache(const llvm::Module * Mod)38 void llvm::clearAnnotationCache(const llvm::Module *Mod) {
39   MutexGuard Guard(Lock);
40   annotationCache->erase(Mod);
41 }
42 
cacheAnnotationFromMD(const MDNode * md,key_val_pair_t & retval)43 static void cacheAnnotationFromMD(const MDNode *md, key_val_pair_t &retval) {
44   MutexGuard Guard(Lock);
45   assert(md && "Invalid mdnode for annotation");
46   assert((md->getNumOperands() % 2) == 1 && "Invalid number of operands");
47   // start index = 1, to skip the global variable key
48   // increment = 2, to skip the value for each property-value pairs
49   for (unsigned i = 1, e = md->getNumOperands(); i != e; i += 2) {
50     // property
51     const MDString *prop = dyn_cast<MDString>(md->getOperand(i));
52     assert(prop && "Annotation property not a string");
53 
54     // value
55     ConstantInt *Val = mdconst::dyn_extract<ConstantInt>(md->getOperand(i + 1));
56     assert(Val && "Value operand not a constant int");
57 
58     std::string keyname = prop->getString().str();
59     if (retval.find(keyname) != retval.end())
60       retval[keyname].push_back(Val->getZExtValue());
61     else {
62       std::vector<unsigned> tmp;
63       tmp.push_back(Val->getZExtValue());
64       retval[keyname] = tmp;
65     }
66   }
67 }
68 
cacheAnnotationFromMD(const Module * m,const GlobalValue * gv)69 static void cacheAnnotationFromMD(const Module *m, const GlobalValue *gv) {
70   MutexGuard Guard(Lock);
71   NamedMDNode *NMD = m->getNamedMetadata(llvm::NamedMDForAnnotations);
72   if (!NMD)
73     return;
74   key_val_pair_t tmp;
75   for (unsigned i = 0, e = NMD->getNumOperands(); i != e; ++i) {
76     const MDNode *elem = NMD->getOperand(i);
77 
78     GlobalValue *entity =
79         mdconst::dyn_extract_or_null<GlobalValue>(elem->getOperand(0));
80     // entity may be null due to DCE
81     if (!entity)
82       continue;
83     if (entity != gv)
84       continue;
85 
86     // accumulate annotations for entity in tmp
87     cacheAnnotationFromMD(elem, tmp);
88   }
89 
90   if (tmp.empty()) // no annotations for this gv
91     return;
92 
93   if ((*annotationCache).find(m) != (*annotationCache).end())
94     (*annotationCache)[m][gv] = std::move(tmp);
95   else {
96     global_val_annot_t tmp1;
97     tmp1[gv] = std::move(tmp);
98     (*annotationCache)[m] = std::move(tmp1);
99   }
100 }
101 
findOneNVVMAnnotation(const GlobalValue * gv,std::string prop,unsigned & retval)102 bool llvm::findOneNVVMAnnotation(const GlobalValue *gv, std::string prop,
103                                  unsigned &retval) {
104   MutexGuard Guard(Lock);
105   const Module *m = gv->getParent();
106   if ((*annotationCache).find(m) == (*annotationCache).end())
107     cacheAnnotationFromMD(m, gv);
108   else if ((*annotationCache)[m].find(gv) == (*annotationCache)[m].end())
109     cacheAnnotationFromMD(m, gv);
110   if ((*annotationCache)[m][gv].find(prop) == (*annotationCache)[m][gv].end())
111     return false;
112   retval = (*annotationCache)[m][gv][prop][0];
113   return true;
114 }
115 
findAllNVVMAnnotation(const GlobalValue * gv,std::string prop,std::vector<unsigned> & retval)116 bool llvm::findAllNVVMAnnotation(const GlobalValue *gv, std::string prop,
117                                  std::vector<unsigned> &retval) {
118   MutexGuard Guard(Lock);
119   const Module *m = gv->getParent();
120   if ((*annotationCache).find(m) == (*annotationCache).end())
121     cacheAnnotationFromMD(m, gv);
122   else if ((*annotationCache)[m].find(gv) == (*annotationCache)[m].end())
123     cacheAnnotationFromMD(m, gv);
124   if ((*annotationCache)[m][gv].find(prop) == (*annotationCache)[m][gv].end())
125     return false;
126   retval = (*annotationCache)[m][gv][prop];
127   return true;
128 }
129 
isTexture(const llvm::Value & val)130 bool llvm::isTexture(const llvm::Value &val) {
131   if (const GlobalValue *gv = dyn_cast<GlobalValue>(&val)) {
132     unsigned annot;
133     if (llvm::findOneNVVMAnnotation(
134             gv, llvm::PropertyAnnotationNames[llvm::PROPERTY_ISTEXTURE],
135             annot)) {
136       assert((annot == 1) && "Unexpected annotation on a texture symbol");
137       return true;
138     }
139   }
140   return false;
141 }
142 
isSurface(const llvm::Value & val)143 bool llvm::isSurface(const llvm::Value &val) {
144   if (const GlobalValue *gv = dyn_cast<GlobalValue>(&val)) {
145     unsigned annot;
146     if (llvm::findOneNVVMAnnotation(
147             gv, llvm::PropertyAnnotationNames[llvm::PROPERTY_ISSURFACE],
148             annot)) {
149       assert((annot == 1) && "Unexpected annotation on a surface symbol");
150       return true;
151     }
152   }
153   return false;
154 }
155 
isSampler(const llvm::Value & val)156 bool llvm::isSampler(const llvm::Value &val) {
157   if (const GlobalValue *gv = dyn_cast<GlobalValue>(&val)) {
158     unsigned annot;
159     if (llvm::findOneNVVMAnnotation(
160             gv, llvm::PropertyAnnotationNames[llvm::PROPERTY_ISSAMPLER],
161             annot)) {
162       assert((annot == 1) && "Unexpected annotation on a sampler symbol");
163       return true;
164     }
165   }
166   if (const Argument *arg = dyn_cast<Argument>(&val)) {
167     const Function *func = arg->getParent();
168     std::vector<unsigned> annot;
169     if (llvm::findAllNVVMAnnotation(
170             func, llvm::PropertyAnnotationNames[llvm::PROPERTY_ISSAMPLER],
171             annot)) {
172       if (std::find(annot.begin(), annot.end(), arg->getArgNo()) != annot.end())
173         return true;
174     }
175   }
176   return false;
177 }
178 
isImageReadOnly(const llvm::Value & val)179 bool llvm::isImageReadOnly(const llvm::Value &val) {
180   if (const Argument *arg = dyn_cast<Argument>(&val)) {
181     const Function *func = arg->getParent();
182     std::vector<unsigned> annot;
183     if (llvm::findAllNVVMAnnotation(func,
184                                     llvm::PropertyAnnotationNames[
185                                         llvm::PROPERTY_ISREADONLY_IMAGE_PARAM],
186                                     annot)) {
187       if (std::find(annot.begin(), annot.end(), arg->getArgNo()) != annot.end())
188         return true;
189     }
190   }
191   return false;
192 }
193 
isImageWriteOnly(const llvm::Value & val)194 bool llvm::isImageWriteOnly(const llvm::Value &val) {
195   if (const Argument *arg = dyn_cast<Argument>(&val)) {
196     const Function *func = arg->getParent();
197     std::vector<unsigned> annot;
198     if (llvm::findAllNVVMAnnotation(func,
199                                     llvm::PropertyAnnotationNames[
200                                         llvm::PROPERTY_ISWRITEONLY_IMAGE_PARAM],
201                                     annot)) {
202       if (std::find(annot.begin(), annot.end(), arg->getArgNo()) != annot.end())
203         return true;
204     }
205   }
206   return false;
207 }
208 
isImageReadWrite(const llvm::Value & val)209 bool llvm::isImageReadWrite(const llvm::Value &val) {
210   if (const Argument *arg = dyn_cast<Argument>(&val)) {
211     const Function *func = arg->getParent();
212     std::vector<unsigned> annot;
213     if (llvm::findAllNVVMAnnotation(func,
214                                     llvm::PropertyAnnotationNames[
215                                         llvm::PROPERTY_ISREADWRITE_IMAGE_PARAM],
216                                     annot)) {
217       if (std::find(annot.begin(), annot.end(), arg->getArgNo()) != annot.end())
218         return true;
219     }
220   }
221   return false;
222 }
223 
isImage(const llvm::Value & val)224 bool llvm::isImage(const llvm::Value &val) {
225   return llvm::isImageReadOnly(val) || llvm::isImageWriteOnly(val) ||
226          llvm::isImageReadWrite(val);
227 }
228 
isManaged(const llvm::Value & val)229 bool llvm::isManaged(const llvm::Value &val) {
230   if(const GlobalValue *gv = dyn_cast<GlobalValue>(&val)) {
231     unsigned annot;
232     if(llvm::findOneNVVMAnnotation(gv,
233                           llvm::PropertyAnnotationNames[llvm::PROPERTY_MANAGED],
234                                    annot)) {
235       assert((annot == 1) && "Unexpected annotation on a managed symbol");
236       return true;
237     }
238   }
239   return false;
240 }
241 
getTextureName(const llvm::Value & val)242 std::string llvm::getTextureName(const llvm::Value &val) {
243   assert(val.hasName() && "Found texture variable with no name");
244   return val.getName();
245 }
246 
getSurfaceName(const llvm::Value & val)247 std::string llvm::getSurfaceName(const llvm::Value &val) {
248   assert(val.hasName() && "Found surface variable with no name");
249   return val.getName();
250 }
251 
getSamplerName(const llvm::Value & val)252 std::string llvm::getSamplerName(const llvm::Value &val) {
253   assert(val.hasName() && "Found sampler variable with no name");
254   return val.getName();
255 }
256 
getMaxNTIDx(const Function & F,unsigned & x)257 bool llvm::getMaxNTIDx(const Function &F, unsigned &x) {
258   return (llvm::findOneNVVMAnnotation(
259       &F, llvm::PropertyAnnotationNames[llvm::PROPERTY_MAXNTID_X], x));
260 }
261 
getMaxNTIDy(const Function & F,unsigned & y)262 bool llvm::getMaxNTIDy(const Function &F, unsigned &y) {
263   return (llvm::findOneNVVMAnnotation(
264       &F, llvm::PropertyAnnotationNames[llvm::PROPERTY_MAXNTID_Y], y));
265 }
266 
getMaxNTIDz(const Function & F,unsigned & z)267 bool llvm::getMaxNTIDz(const Function &F, unsigned &z) {
268   return (llvm::findOneNVVMAnnotation(
269       &F, llvm::PropertyAnnotationNames[llvm::PROPERTY_MAXNTID_Z], z));
270 }
271 
getReqNTIDx(const Function & F,unsigned & x)272 bool llvm::getReqNTIDx(const Function &F, unsigned &x) {
273   return (llvm::findOneNVVMAnnotation(
274       &F, llvm::PropertyAnnotationNames[llvm::PROPERTY_REQNTID_X], x));
275 }
276 
getReqNTIDy(const Function & F,unsigned & y)277 bool llvm::getReqNTIDy(const Function &F, unsigned &y) {
278   return (llvm::findOneNVVMAnnotation(
279       &F, llvm::PropertyAnnotationNames[llvm::PROPERTY_REQNTID_Y], y));
280 }
281 
getReqNTIDz(const Function & F,unsigned & z)282 bool llvm::getReqNTIDz(const Function &F, unsigned &z) {
283   return (llvm::findOneNVVMAnnotation(
284       &F, llvm::PropertyAnnotationNames[llvm::PROPERTY_REQNTID_Z], z));
285 }
286 
getMinCTASm(const Function & F,unsigned & x)287 bool llvm::getMinCTASm(const Function &F, unsigned &x) {
288   return (llvm::findOneNVVMAnnotation(
289       &F, llvm::PropertyAnnotationNames[llvm::PROPERTY_MINNCTAPERSM], x));
290 }
291 
isKernelFunction(const Function & F)292 bool llvm::isKernelFunction(const Function &F) {
293   unsigned x = 0;
294   bool retval = llvm::findOneNVVMAnnotation(
295       &F, llvm::PropertyAnnotationNames[llvm::PROPERTY_ISKERNEL_FUNCTION], x);
296   if (!retval) {
297     // There is no NVVM metadata, check the calling convention
298     return F.getCallingConv() == llvm::CallingConv::PTX_Kernel;
299   }
300   return (x == 1);
301 }
302 
getAlign(const Function & F,unsigned index,unsigned & align)303 bool llvm::getAlign(const Function &F, unsigned index, unsigned &align) {
304   std::vector<unsigned> Vs;
305   bool retval = llvm::findAllNVVMAnnotation(
306       &F, llvm::PropertyAnnotationNames[llvm::PROPERTY_ALIGN], Vs);
307   if (!retval)
308     return false;
309   for (int i = 0, e = Vs.size(); i < e; i++) {
310     unsigned v = Vs[i];
311     if ((v >> 16) == index) {
312       align = v & 0xFFFF;
313       return true;
314     }
315   }
316   return false;
317 }
318 
getAlign(const CallInst & I,unsigned index,unsigned & align)319 bool llvm::getAlign(const CallInst &I, unsigned index, unsigned &align) {
320   if (MDNode *alignNode = I.getMetadata("callalign")) {
321     for (int i = 0, n = alignNode->getNumOperands(); i < n; i++) {
322       if (const ConstantInt *CI =
323               mdconst::dyn_extract<ConstantInt>(alignNode->getOperand(i))) {
324         unsigned v = CI->getZExtValue();
325         if ((v >> 16) == index) {
326           align = v & 0xFFFF;
327           return true;
328         }
329         if ((v >> 16) > index) {
330           return false;
331         }
332       }
333     }
334   }
335   return false;
336 }
337 
isBarrierIntrinsic(Intrinsic::ID id)338 bool llvm::isBarrierIntrinsic(Intrinsic::ID id) {
339   if ((id == Intrinsic::nvvm_barrier0) ||
340       (id == Intrinsic::nvvm_barrier0_popc) ||
341       (id == Intrinsic::nvvm_barrier0_and) ||
342       (id == Intrinsic::nvvm_barrier0_or) ||
343       (id == Intrinsic::cuda_syncthreads))
344     return true;
345   return false;
346 }
347 
348 // Interface for checking all memory space transfer related intrinsics
isMemorySpaceTransferIntrinsic(Intrinsic::ID id)349 bool llvm::isMemorySpaceTransferIntrinsic(Intrinsic::ID id) {
350   if (id == Intrinsic::nvvm_ptr_local_to_gen ||
351       id == Intrinsic::nvvm_ptr_shared_to_gen ||
352       id == Intrinsic::nvvm_ptr_global_to_gen ||
353       id == Intrinsic::nvvm_ptr_constant_to_gen ||
354       id == Intrinsic::nvvm_ptr_gen_to_global ||
355       id == Intrinsic::nvvm_ptr_gen_to_shared ||
356       id == Intrinsic::nvvm_ptr_gen_to_local ||
357       id == Intrinsic::nvvm_ptr_gen_to_constant ||
358       id == Intrinsic::nvvm_ptr_gen_to_param) {
359     return true;
360   }
361 
362   return false;
363 }
364 
365 // consider several special intrinsics in striping pointer casts, and
366 // provide an option to ignore GEP indicies for find out the base address only
367 // which could be used in simple alias disambigurate.
368 const Value *
skipPointerTransfer(const Value * V,bool ignore_GEP_indices)369 llvm::skipPointerTransfer(const Value *V, bool ignore_GEP_indices) {
370   V = V->stripPointerCasts();
371   while (true) {
372     if (const IntrinsicInst *IS = dyn_cast<IntrinsicInst>(V)) {
373       if (isMemorySpaceTransferIntrinsic(IS->getIntrinsicID())) {
374         V = IS->getArgOperand(0)->stripPointerCasts();
375         continue;
376       }
377     } else if (ignore_GEP_indices)
378       if (const GEPOperator *GEP = dyn_cast<GEPOperator>(V)) {
379         V = GEP->getPointerOperand()->stripPointerCasts();
380         continue;
381       }
382     break;
383   }
384   return V;
385 }
386 
387 // consider several special intrinsics in striping pointer casts, and
388 // - ignore GEP indicies for find out the base address only, and
389 // - tracking PHINode
390 // which could be used in simple alias disambigurate.
391 const Value *
skipPointerTransfer(const Value * V,std::set<const Value * > & processed)392 llvm::skipPointerTransfer(const Value *V, std::set<const Value *> &processed) {
393   if (processed.find(V) != processed.end())
394     return nullptr;
395   processed.insert(V);
396 
397   const Value *V2 = V->stripPointerCasts();
398   if (V2 != V && processed.find(V2) != processed.end())
399     return nullptr;
400   processed.insert(V2);
401 
402   V = V2;
403 
404   while (true) {
405     if (const IntrinsicInst *IS = dyn_cast<IntrinsicInst>(V)) {
406       if (isMemorySpaceTransferIntrinsic(IS->getIntrinsicID())) {
407         V = IS->getArgOperand(0)->stripPointerCasts();
408         continue;
409       }
410     } else if (const GEPOperator *GEP = dyn_cast<GEPOperator>(V)) {
411       V = GEP->getPointerOperand()->stripPointerCasts();
412       continue;
413     } else if (const PHINode *PN = dyn_cast<PHINode>(V)) {
414       if (V != V2 && processed.find(V) != processed.end())
415         return nullptr;
416       processed.insert(PN);
417       const Value *common = nullptr;
418       for (unsigned i = 0; i != PN->getNumIncomingValues(); ++i) {
419         const Value *pv = PN->getIncomingValue(i);
420         const Value *base = skipPointerTransfer(pv, processed);
421         if (base) {
422           if (!common)
423             common = base;
424           else if (common != base)
425             return PN;
426         }
427       }
428       if (!common)
429         return PN;
430       V = common;
431     }
432     break;
433   }
434   return V;
435 }
436 
// The following are some useful utilities for debugging
438 
getParentBlock(Value * v)439 BasicBlock *llvm::getParentBlock(Value *v) {
440   if (BasicBlock *B = dyn_cast<BasicBlock>(v))
441     return B;
442 
443   if (Instruction *I = dyn_cast<Instruction>(v))
444     return I->getParent();
445 
446   return nullptr;
447 }
448 
getParentFunction(Value * v)449 Function *llvm::getParentFunction(Value *v) {
450   if (Function *F = dyn_cast<Function>(v))
451     return F;
452 
453   if (Instruction *I = dyn_cast<Instruction>(v))
454     return I->getParent()->getParent();
455 
456   if (BasicBlock *B = dyn_cast<BasicBlock>(v))
457     return B->getParent();
458 
459   return nullptr;
460 }
461 
462 // Dump a block by name
dumpBlock(Value * v,char * blockName)463 void llvm::dumpBlock(Value *v, char *blockName) {
464   Function *F = getParentFunction(v);
465   if (!F)
466     return;
467 
468   for (Function::iterator it = F->begin(), ie = F->end(); it != ie; ++it) {
469     BasicBlock *B = it;
470     if (strcmp(B->getName().data(), blockName) == 0) {
471       B->dump();
472       return;
473     }
474   }
475 }
476 
477 // Find an instruction by name
getInst(Value * base,char * instName)478 Instruction *llvm::getInst(Value *base, char *instName) {
479   Function *F = getParentFunction(base);
480   if (!F)
481     return nullptr;
482 
483   for (inst_iterator it = inst_begin(F), ie = inst_end(F); it != ie; ++it) {
484     Instruction *I = &*it;
485     if (strcmp(I->getName().data(), instName) == 0) {
486       return I;
487     }
488   }
489 
490   return nullptr;
491 }
492 
493 // Dump an instruction by nane
dumpInst(Value * base,char * instName)494 void llvm::dumpInst(Value *base, char *instName) {
495   Instruction *I = getInst(base, instName);
496   if (I)
497     I->dump();
498 }
499 
500 // Dump an instruction and all dependent instructions
dumpInstRec(Value * v,std::set<Instruction * > * visited)501 void llvm::dumpInstRec(Value *v, std::set<Instruction *> *visited) {
502   if (Instruction *I = dyn_cast<Instruction>(v)) {
503 
504     if (visited->find(I) != visited->end())
505       return;
506 
507     visited->insert(I);
508 
509     for (unsigned i = 0, e = I->getNumOperands(); i != e; ++i)
510       dumpInstRec(I->getOperand(i), visited);
511 
512     I->dump();
513   }
514 }
515 
516 // Dump an instruction and all dependent instructions
dumpInstRec(Value * v)517 void llvm::dumpInstRec(Value *v) {
518   std::set<Instruction *> visited;
519 
520   //BasicBlock *B = getParentBlock(v);
521 
522   dumpInstRec(v, &visited);
523 }
524 
525 // Dump the parent for Instruction, block or function
dumpParent(Value * v)526 void llvm::dumpParent(Value *v) {
527   if (Instruction *I = dyn_cast<Instruction>(v)) {
528     I->getParent()->dump();
529     return;
530   }
531 
532   if (BasicBlock *B = dyn_cast<BasicBlock>(v)) {
533     B->getParent()->dump();
534     return;
535   }
536 
537   if (Function *F = dyn_cast<Function>(v)) {
538     F->getParent()->dump();
539     return;
540   }
541 }
542