xref: /freebsd/contrib/llvm-project/llvm/lib/Target/NVPTX/NVPTXUtilities.cpp (revision 0fca6ea1d4eea4c934cfff25ac9ee8ad6fe95583)
10b57cec5SDimitry Andric //===- NVPTXUtilities.cpp - Utility Functions -----------------------------===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric //
90b57cec5SDimitry Andric // This file contains miscellaneous utility functions
100b57cec5SDimitry Andric //
110b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
120b57cec5SDimitry Andric 
130b57cec5SDimitry Andric #include "NVPTXUtilities.h"
140b57cec5SDimitry Andric #include "NVPTX.h"
15bdd1243dSDimitry Andric #include "NVPTXTargetMachine.h"
160b57cec5SDimitry Andric #include "llvm/IR/Constants.h"
170b57cec5SDimitry Andric #include "llvm/IR/Function.h"
180b57cec5SDimitry Andric #include "llvm/IR/GlobalVariable.h"
190b57cec5SDimitry Andric #include "llvm/IR/InstIterator.h"
200b57cec5SDimitry Andric #include "llvm/IR/Module.h"
210b57cec5SDimitry Andric #include "llvm/IR/Operator.h"
22*0fca6ea1SDimitry Andric #include "llvm/Support/Alignment.h"
238bcb0991SDimitry Andric #include "llvm/Support/Mutex.h"
240b57cec5SDimitry Andric #include <algorithm>
250b57cec5SDimitry Andric #include <cstring>
260b57cec5SDimitry Andric #include <map>
278bcb0991SDimitry Andric #include <mutex>
28*0fca6ea1SDimitry Andric #include <optional>
290b57cec5SDimitry Andric #include <string>
300b57cec5SDimitry Andric #include <vector>
310b57cec5SDimitry Andric 
320b57cec5SDimitry Andric namespace llvm {
330b57cec5SDimitry Andric 
340b57cec5SDimitry Andric namespace {
350b57cec5SDimitry Andric typedef std::map<std::string, std::vector<unsigned> > key_val_pair_t;
360b57cec5SDimitry Andric typedef std::map<const GlobalValue *, key_val_pair_t> global_val_annot_t;
37753f127fSDimitry Andric 
38753f127fSDimitry Andric struct AnnotationCache {
39753f127fSDimitry Andric   sys::Mutex Lock;
40753f127fSDimitry Andric   std::map<const Module *, global_val_annot_t> Cache;
41753f127fSDimitry Andric };
42753f127fSDimitry Andric 
getAnnotationCache()43753f127fSDimitry Andric AnnotationCache &getAnnotationCache() {
44753f127fSDimitry Andric   static AnnotationCache AC;
45753f127fSDimitry Andric   return AC;
46753f127fSDimitry Andric }
470b57cec5SDimitry Andric } // anonymous namespace
480b57cec5SDimitry Andric 
clearAnnotationCache(const Module * Mod)490b57cec5SDimitry Andric void clearAnnotationCache(const Module *Mod) {
50753f127fSDimitry Andric   auto &AC = getAnnotationCache();
51753f127fSDimitry Andric   std::lock_guard<sys::Mutex> Guard(AC.Lock);
52753f127fSDimitry Andric   AC.Cache.erase(Mod);
530b57cec5SDimitry Andric }
540b57cec5SDimitry Andric 
readIntVecFromMDNode(const MDNode * MetadataNode,std::vector<unsigned> & Vec)55*0fca6ea1SDimitry Andric static void readIntVecFromMDNode(const MDNode *MetadataNode,
56*0fca6ea1SDimitry Andric                                  std::vector<unsigned> &Vec) {
57*0fca6ea1SDimitry Andric   for (unsigned i = 0, e = MetadataNode->getNumOperands(); i != e; ++i) {
58*0fca6ea1SDimitry Andric     ConstantInt *Val =
59*0fca6ea1SDimitry Andric         mdconst::extract<ConstantInt>(MetadataNode->getOperand(i));
60*0fca6ea1SDimitry Andric     Vec.push_back(Val->getZExtValue());
61*0fca6ea1SDimitry Andric   }
62*0fca6ea1SDimitry Andric }
63*0fca6ea1SDimitry Andric 
cacheAnnotationFromMD(const MDNode * MetadataNode,key_val_pair_t & retval)64*0fca6ea1SDimitry Andric static void cacheAnnotationFromMD(const MDNode *MetadataNode,
65*0fca6ea1SDimitry Andric                                   key_val_pair_t &retval) {
66753f127fSDimitry Andric   auto &AC = getAnnotationCache();
67753f127fSDimitry Andric   std::lock_guard<sys::Mutex> Guard(AC.Lock);
68*0fca6ea1SDimitry Andric   assert(MetadataNode && "Invalid mdnode for annotation");
69*0fca6ea1SDimitry Andric   assert((MetadataNode->getNumOperands() % 2) == 1 &&
70*0fca6ea1SDimitry Andric          "Invalid number of operands");
710b57cec5SDimitry Andric   // start index = 1, to skip the global variable key
720b57cec5SDimitry Andric   // increment = 2, to skip the value for each property-value pairs
73*0fca6ea1SDimitry Andric   for (unsigned i = 1, e = MetadataNode->getNumOperands(); i != e; i += 2) {
740b57cec5SDimitry Andric     // property
75*0fca6ea1SDimitry Andric     const MDString *prop = dyn_cast<MDString>(MetadataNode->getOperand(i));
760b57cec5SDimitry Andric     assert(prop && "Annotation property not a string");
77*0fca6ea1SDimitry Andric     std::string Key = prop->getString().str();
780b57cec5SDimitry Andric 
790b57cec5SDimitry Andric     // value
80*0fca6ea1SDimitry Andric     if (ConstantInt *Val = mdconst::dyn_extract<ConstantInt>(
81*0fca6ea1SDimitry Andric             MetadataNode->getOperand(i + 1))) {
82*0fca6ea1SDimitry Andric       retval[Key].push_back(Val->getZExtValue());
83*0fca6ea1SDimitry Andric     } else if (MDNode *VecMd =
84*0fca6ea1SDimitry Andric                    dyn_cast<MDNode>(MetadataNode->getOperand(i + 1))) {
85*0fca6ea1SDimitry Andric       // note: only "grid_constant" annotations support vector MDNodes.
86*0fca6ea1SDimitry Andric       // assert: there can only exist one unique key value pair of
87*0fca6ea1SDimitry Andric       // the form (string key, MDNode node). Operands of such a node
88*0fca6ea1SDimitry Andric       // shall always be unsigned ints.
89*0fca6ea1SDimitry Andric       if (retval.find(Key) == retval.end()) {
90*0fca6ea1SDimitry Andric         readIntVecFromMDNode(VecMd, retval[Key]);
91*0fca6ea1SDimitry Andric         continue;
92*0fca6ea1SDimitry Andric       }
93*0fca6ea1SDimitry Andric     } else {
94*0fca6ea1SDimitry Andric       llvm_unreachable("Value operand not a constant int or an mdnode");
950b57cec5SDimitry Andric     }
960b57cec5SDimitry Andric   }
970b57cec5SDimitry Andric }
980b57cec5SDimitry Andric 
cacheAnnotationFromMD(const Module * m,const GlobalValue * gv)990b57cec5SDimitry Andric static void cacheAnnotationFromMD(const Module *m, const GlobalValue *gv) {
100753f127fSDimitry Andric   auto &AC = getAnnotationCache();
101753f127fSDimitry Andric   std::lock_guard<sys::Mutex> Guard(AC.Lock);
1020b57cec5SDimitry Andric   NamedMDNode *NMD = m->getNamedMetadata("nvvm.annotations");
1030b57cec5SDimitry Andric   if (!NMD)
1040b57cec5SDimitry Andric     return;
1050b57cec5SDimitry Andric   key_val_pair_t tmp;
1060b57cec5SDimitry Andric   for (unsigned i = 0, e = NMD->getNumOperands(); i != e; ++i) {
1070b57cec5SDimitry Andric     const MDNode *elem = NMD->getOperand(i);
1080b57cec5SDimitry Andric 
1090b57cec5SDimitry Andric     GlobalValue *entity =
1100b57cec5SDimitry Andric         mdconst::dyn_extract_or_null<GlobalValue>(elem->getOperand(0));
1110b57cec5SDimitry Andric     // entity may be null due to DCE
1120b57cec5SDimitry Andric     if (!entity)
1130b57cec5SDimitry Andric       continue;
1140b57cec5SDimitry Andric     if (entity != gv)
1150b57cec5SDimitry Andric       continue;
1160b57cec5SDimitry Andric 
1170b57cec5SDimitry Andric     // accumulate annotations for entity in tmp
1180b57cec5SDimitry Andric     cacheAnnotationFromMD(elem, tmp);
1190b57cec5SDimitry Andric   }
1200b57cec5SDimitry Andric 
1210b57cec5SDimitry Andric   if (tmp.empty()) // no annotations for this gv
1220b57cec5SDimitry Andric     return;
1230b57cec5SDimitry Andric 
124753f127fSDimitry Andric   if (AC.Cache.find(m) != AC.Cache.end())
125753f127fSDimitry Andric     AC.Cache[m][gv] = std::move(tmp);
1260b57cec5SDimitry Andric   else {
1270b57cec5SDimitry Andric     global_val_annot_t tmp1;
1280b57cec5SDimitry Andric     tmp1[gv] = std::move(tmp);
129753f127fSDimitry Andric     AC.Cache[m] = std::move(tmp1);
1300b57cec5SDimitry Andric   }
1310b57cec5SDimitry Andric }
1320b57cec5SDimitry Andric 
findOneNVVMAnnotation(const GlobalValue * gv,const std::string & prop,unsigned & retval)1330b57cec5SDimitry Andric bool findOneNVVMAnnotation(const GlobalValue *gv, const std::string &prop,
1340b57cec5SDimitry Andric                            unsigned &retval) {
135753f127fSDimitry Andric   auto &AC = getAnnotationCache();
136753f127fSDimitry Andric   std::lock_guard<sys::Mutex> Guard(AC.Lock);
1370b57cec5SDimitry Andric   const Module *m = gv->getParent();
138753f127fSDimitry Andric   if (AC.Cache.find(m) == AC.Cache.end())
1390b57cec5SDimitry Andric     cacheAnnotationFromMD(m, gv);
140753f127fSDimitry Andric   else if (AC.Cache[m].find(gv) == AC.Cache[m].end())
1410b57cec5SDimitry Andric     cacheAnnotationFromMD(m, gv);
142753f127fSDimitry Andric   if (AC.Cache[m][gv].find(prop) == AC.Cache[m][gv].end())
1430b57cec5SDimitry Andric     return false;
144753f127fSDimitry Andric   retval = AC.Cache[m][gv][prop][0];
1450b57cec5SDimitry Andric   return true;
1460b57cec5SDimitry Andric }
1470b57cec5SDimitry Andric 
148*0fca6ea1SDimitry Andric static std::optional<unsigned>
findOneNVVMAnnotation(const GlobalValue & GV,const std::string & PropName)149*0fca6ea1SDimitry Andric findOneNVVMAnnotation(const GlobalValue &GV, const std::string &PropName) {
150*0fca6ea1SDimitry Andric   unsigned RetVal;
151*0fca6ea1SDimitry Andric   if (findOneNVVMAnnotation(&GV, PropName, RetVal))
152*0fca6ea1SDimitry Andric     return RetVal;
153*0fca6ea1SDimitry Andric   return std::nullopt;
154*0fca6ea1SDimitry Andric }
155*0fca6ea1SDimitry Andric 
findAllNVVMAnnotation(const GlobalValue * gv,const std::string & prop,std::vector<unsigned> & retval)1560b57cec5SDimitry Andric bool findAllNVVMAnnotation(const GlobalValue *gv, const std::string &prop,
1570b57cec5SDimitry Andric                            std::vector<unsigned> &retval) {
158753f127fSDimitry Andric   auto &AC = getAnnotationCache();
159753f127fSDimitry Andric   std::lock_guard<sys::Mutex> Guard(AC.Lock);
1600b57cec5SDimitry Andric   const Module *m = gv->getParent();
161753f127fSDimitry Andric   if (AC.Cache.find(m) == AC.Cache.end())
1620b57cec5SDimitry Andric     cacheAnnotationFromMD(m, gv);
163753f127fSDimitry Andric   else if (AC.Cache[m].find(gv) == AC.Cache[m].end())
1640b57cec5SDimitry Andric     cacheAnnotationFromMD(m, gv);
165753f127fSDimitry Andric   if (AC.Cache[m][gv].find(prop) == AC.Cache[m][gv].end())
1660b57cec5SDimitry Andric     return false;
167753f127fSDimitry Andric   retval = AC.Cache[m][gv][prop];
1680b57cec5SDimitry Andric   return true;
1690b57cec5SDimitry Andric }
1700b57cec5SDimitry Andric 
isTexture(const Value & val)1710b57cec5SDimitry Andric bool isTexture(const Value &val) {
1720b57cec5SDimitry Andric   if (const GlobalValue *gv = dyn_cast<GlobalValue>(&val)) {
173*0fca6ea1SDimitry Andric     unsigned Annot;
174*0fca6ea1SDimitry Andric     if (findOneNVVMAnnotation(gv, "texture", Annot)) {
175*0fca6ea1SDimitry Andric       assert((Annot == 1) && "Unexpected annotation on a texture symbol");
1760b57cec5SDimitry Andric       return true;
1770b57cec5SDimitry Andric     }
1780b57cec5SDimitry Andric   }
1790b57cec5SDimitry Andric   return false;
1800b57cec5SDimitry Andric }
1810b57cec5SDimitry Andric 
isSurface(const Value & val)1820b57cec5SDimitry Andric bool isSurface(const Value &val) {
1830b57cec5SDimitry Andric   if (const GlobalValue *gv = dyn_cast<GlobalValue>(&val)) {
184*0fca6ea1SDimitry Andric     unsigned Annot;
185*0fca6ea1SDimitry Andric     if (findOneNVVMAnnotation(gv, "surface", Annot)) {
186*0fca6ea1SDimitry Andric       assert((Annot == 1) && "Unexpected annotation on a surface symbol");
187*0fca6ea1SDimitry Andric       return true;
188*0fca6ea1SDimitry Andric     }
189*0fca6ea1SDimitry Andric   }
190*0fca6ea1SDimitry Andric   return false;
191*0fca6ea1SDimitry Andric }
192*0fca6ea1SDimitry Andric 
argHasNVVMAnnotation(const Value & Val,const std::string & Annotation,const bool StartArgIndexAtOne=false)193*0fca6ea1SDimitry Andric static bool argHasNVVMAnnotation(const Value &Val,
194*0fca6ea1SDimitry Andric                                  const std::string &Annotation,
195*0fca6ea1SDimitry Andric                                  const bool StartArgIndexAtOne = false) {
196*0fca6ea1SDimitry Andric   if (const Argument *Arg = dyn_cast<Argument>(&Val)) {
197*0fca6ea1SDimitry Andric     const Function *Func = Arg->getParent();
198*0fca6ea1SDimitry Andric     std::vector<unsigned> Annot;
199*0fca6ea1SDimitry Andric     if (findAllNVVMAnnotation(Func, Annotation, Annot)) {
200*0fca6ea1SDimitry Andric       const unsigned BaseOffset = StartArgIndexAtOne ? 1 : 0;
201*0fca6ea1SDimitry Andric       if (is_contained(Annot, BaseOffset + Arg->getArgNo())) {
202*0fca6ea1SDimitry Andric         return true;
203*0fca6ea1SDimitry Andric       }
204*0fca6ea1SDimitry Andric     }
205*0fca6ea1SDimitry Andric   }
206*0fca6ea1SDimitry Andric   return false;
207*0fca6ea1SDimitry Andric }
208*0fca6ea1SDimitry Andric 
isParamGridConstant(const Value & V)209*0fca6ea1SDimitry Andric bool isParamGridConstant(const Value &V) {
210*0fca6ea1SDimitry Andric   if (const Argument *Arg = dyn_cast<Argument>(&V)) {
211*0fca6ea1SDimitry Andric     // "grid_constant" counts argument indices starting from 1
212*0fca6ea1SDimitry Andric     if (Arg->hasByValAttr() &&
213*0fca6ea1SDimitry Andric         argHasNVVMAnnotation(*Arg, "grid_constant",
214*0fca6ea1SDimitry Andric                              /*StartArgIndexAtOne*/ true)) {
215*0fca6ea1SDimitry Andric       assert(isKernelFunction(*Arg->getParent()) &&
216*0fca6ea1SDimitry Andric              "only kernel arguments can be grid_constant");
2170b57cec5SDimitry Andric       return true;
2180b57cec5SDimitry Andric     }
2190b57cec5SDimitry Andric   }
2200b57cec5SDimitry Andric   return false;
2210b57cec5SDimitry Andric }
2220b57cec5SDimitry Andric 
isSampler(const Value & val)2230b57cec5SDimitry Andric bool isSampler(const Value &val) {
2240b57cec5SDimitry Andric   const char *AnnotationName = "sampler";
2250b57cec5SDimitry Andric 
2260b57cec5SDimitry Andric   if (const GlobalValue *gv = dyn_cast<GlobalValue>(&val)) {
227*0fca6ea1SDimitry Andric     unsigned Annot;
228*0fca6ea1SDimitry Andric     if (findOneNVVMAnnotation(gv, AnnotationName, Annot)) {
229*0fca6ea1SDimitry Andric       assert((Annot == 1) && "Unexpected annotation on a sampler symbol");
2300b57cec5SDimitry Andric       return true;
2310b57cec5SDimitry Andric     }
2320b57cec5SDimitry Andric   }
233*0fca6ea1SDimitry Andric   return argHasNVVMAnnotation(val, AnnotationName);
2340b57cec5SDimitry Andric }
2350b57cec5SDimitry Andric 
isImageReadOnly(const Value & val)2360b57cec5SDimitry Andric bool isImageReadOnly(const Value &val) {
237*0fca6ea1SDimitry Andric   return argHasNVVMAnnotation(val, "rdoimage");
2380b57cec5SDimitry Andric }
2390b57cec5SDimitry Andric 
isImageWriteOnly(const Value & val)2400b57cec5SDimitry Andric bool isImageWriteOnly(const Value &val) {
241*0fca6ea1SDimitry Andric   return argHasNVVMAnnotation(val, "wroimage");
2420b57cec5SDimitry Andric }
2430b57cec5SDimitry Andric 
isImageReadWrite(const Value & val)2440b57cec5SDimitry Andric bool isImageReadWrite(const Value &val) {
245*0fca6ea1SDimitry Andric   return argHasNVVMAnnotation(val, "rdwrimage");
2460b57cec5SDimitry Andric }
2470b57cec5SDimitry Andric 
isImage(const Value & val)2480b57cec5SDimitry Andric bool isImage(const Value &val) {
2490b57cec5SDimitry Andric   return isImageReadOnly(val) || isImageWriteOnly(val) || isImageReadWrite(val);
2500b57cec5SDimitry Andric }
2510b57cec5SDimitry Andric 
isManaged(const Value & val)2520b57cec5SDimitry Andric bool isManaged(const Value &val) {
2530b57cec5SDimitry Andric   if(const GlobalValue *gv = dyn_cast<GlobalValue>(&val)) {
254*0fca6ea1SDimitry Andric     unsigned Annot;
255*0fca6ea1SDimitry Andric     if (findOneNVVMAnnotation(gv, "managed", Annot)) {
256*0fca6ea1SDimitry Andric       assert((Annot == 1) && "Unexpected annotation on a managed symbol");
2570b57cec5SDimitry Andric       return true;
2580b57cec5SDimitry Andric     }
2590b57cec5SDimitry Andric   }
2600b57cec5SDimitry Andric   return false;
2610b57cec5SDimitry Andric }
2620b57cec5SDimitry Andric 
getTextureName(const Value & val)2630b57cec5SDimitry Andric std::string getTextureName(const Value &val) {
2640b57cec5SDimitry Andric   assert(val.hasName() && "Found texture variable with no name");
2655ffd83dbSDimitry Andric   return std::string(val.getName());
2660b57cec5SDimitry Andric }
2670b57cec5SDimitry Andric 
getSurfaceName(const Value & val)2680b57cec5SDimitry Andric std::string getSurfaceName(const Value &val) {
2690b57cec5SDimitry Andric   assert(val.hasName() && "Found surface variable with no name");
2705ffd83dbSDimitry Andric   return std::string(val.getName());
2710b57cec5SDimitry Andric }
2720b57cec5SDimitry Andric 
getSamplerName(const Value & val)2730b57cec5SDimitry Andric std::string getSamplerName(const Value &val) {
2740b57cec5SDimitry Andric   assert(val.hasName() && "Found sampler variable with no name");
2755ffd83dbSDimitry Andric   return std::string(val.getName());
2760b57cec5SDimitry Andric }
2770b57cec5SDimitry Andric 
getMaxNTIDx(const Function & F)278*0fca6ea1SDimitry Andric std::optional<unsigned> getMaxNTIDx(const Function &F) {
279*0fca6ea1SDimitry Andric   return findOneNVVMAnnotation(F, "maxntidx");
2800b57cec5SDimitry Andric }
2810b57cec5SDimitry Andric 
getMaxNTIDy(const Function & F)282*0fca6ea1SDimitry Andric std::optional<unsigned> getMaxNTIDy(const Function &F) {
283*0fca6ea1SDimitry Andric   return findOneNVVMAnnotation(F, "maxntidy");
2840b57cec5SDimitry Andric }
2850b57cec5SDimitry Andric 
getMaxNTIDz(const Function & F)286*0fca6ea1SDimitry Andric std::optional<unsigned> getMaxNTIDz(const Function &F) {
287*0fca6ea1SDimitry Andric   return findOneNVVMAnnotation(F, "maxntidz");
288*0fca6ea1SDimitry Andric }
289*0fca6ea1SDimitry Andric 
getMaxNTID(const Function & F)290*0fca6ea1SDimitry Andric std::optional<unsigned> getMaxNTID(const Function &F) {
291*0fca6ea1SDimitry Andric   // Note: The semantics here are a bit strange. The PTX ISA states the
292*0fca6ea1SDimitry Andric   // following (11.4.2. Performance-Tuning Directives: .maxntid):
293*0fca6ea1SDimitry Andric   //
294*0fca6ea1SDimitry Andric   //  Note that this directive guarantees that the total number of threads does
295*0fca6ea1SDimitry Andric   //  not exceed the maximum, but does not guarantee that the limit in any
296*0fca6ea1SDimitry Andric   //  particular dimension is not exceeded.
297*0fca6ea1SDimitry Andric   std::optional<unsigned> MaxNTIDx = getMaxNTIDx(F);
298*0fca6ea1SDimitry Andric   std::optional<unsigned> MaxNTIDy = getMaxNTIDy(F);
299*0fca6ea1SDimitry Andric   std::optional<unsigned> MaxNTIDz = getMaxNTIDz(F);
300*0fca6ea1SDimitry Andric   if (MaxNTIDx || MaxNTIDy || MaxNTIDz)
301*0fca6ea1SDimitry Andric     return MaxNTIDx.value_or(1) * MaxNTIDy.value_or(1) * MaxNTIDz.value_or(1);
302*0fca6ea1SDimitry Andric   return std::nullopt;
3030b57cec5SDimitry Andric }
3040b57cec5SDimitry Andric 
getMaxClusterRank(const Function & F,unsigned & x)3055f757f3fSDimitry Andric bool getMaxClusterRank(const Function &F, unsigned &x) {
3065f757f3fSDimitry Andric   return findOneNVVMAnnotation(&F, "maxclusterrank", x);
3075f757f3fSDimitry Andric }
3085f757f3fSDimitry Andric 
getReqNTIDx(const Function & F)309*0fca6ea1SDimitry Andric std::optional<unsigned> getReqNTIDx(const Function &F) {
310*0fca6ea1SDimitry Andric   return findOneNVVMAnnotation(F, "reqntidx");
3110b57cec5SDimitry Andric }
3120b57cec5SDimitry Andric 
getReqNTIDy(const Function & F)313*0fca6ea1SDimitry Andric std::optional<unsigned> getReqNTIDy(const Function &F) {
314*0fca6ea1SDimitry Andric   return findOneNVVMAnnotation(F, "reqntidy");
3150b57cec5SDimitry Andric }
3160b57cec5SDimitry Andric 
getReqNTIDz(const Function & F)317*0fca6ea1SDimitry Andric std::optional<unsigned> getReqNTIDz(const Function &F) {
318*0fca6ea1SDimitry Andric   return findOneNVVMAnnotation(F, "reqntidz");
319*0fca6ea1SDimitry Andric }
320*0fca6ea1SDimitry Andric 
getReqNTID(const Function & F)321*0fca6ea1SDimitry Andric std::optional<unsigned> getReqNTID(const Function &F) {
322*0fca6ea1SDimitry Andric   // Note: The semantics here are a bit strange. See getMaxNTID.
323*0fca6ea1SDimitry Andric   std::optional<unsigned> ReqNTIDx = getReqNTIDx(F);
324*0fca6ea1SDimitry Andric   std::optional<unsigned> ReqNTIDy = getReqNTIDy(F);
325*0fca6ea1SDimitry Andric   std::optional<unsigned> ReqNTIDz = getReqNTIDz(F);
326*0fca6ea1SDimitry Andric   if (ReqNTIDx || ReqNTIDy || ReqNTIDz)
327*0fca6ea1SDimitry Andric     return ReqNTIDx.value_or(1) * ReqNTIDy.value_or(1) * ReqNTIDz.value_or(1);
328*0fca6ea1SDimitry Andric   return std::nullopt;
3290b57cec5SDimitry Andric }
3300b57cec5SDimitry Andric 
getMinCTASm(const Function & F,unsigned & x)3310b57cec5SDimitry Andric bool getMinCTASm(const Function &F, unsigned &x) {
3320b57cec5SDimitry Andric   return findOneNVVMAnnotation(&F, "minctasm", x);
3330b57cec5SDimitry Andric }
3340b57cec5SDimitry Andric 
getMaxNReg(const Function & F,unsigned & x)3350b57cec5SDimitry Andric bool getMaxNReg(const Function &F, unsigned &x) {
3360b57cec5SDimitry Andric   return findOneNVVMAnnotation(&F, "maxnreg", x);
3370b57cec5SDimitry Andric }
3380b57cec5SDimitry Andric 
isKernelFunction(const Function & F)3390b57cec5SDimitry Andric bool isKernelFunction(const Function &F) {
3400b57cec5SDimitry Andric   unsigned x = 0;
341*0fca6ea1SDimitry Andric   if (!findOneNVVMAnnotation(&F, "kernel", x)) {
3420b57cec5SDimitry Andric     // There is no NVVM metadata, check the calling convention
3430b57cec5SDimitry Andric     return F.getCallingConv() == CallingConv::PTX_Kernel;
3440b57cec5SDimitry Andric   }
3450b57cec5SDimitry Andric   return (x == 1);
3460b57cec5SDimitry Andric }
3470b57cec5SDimitry Andric 
getAlign(const Function & F,unsigned Index)348*0fca6ea1SDimitry Andric MaybeAlign getAlign(const Function &F, unsigned Index) {
349*0fca6ea1SDimitry Andric   // First check the alignstack metadata
350*0fca6ea1SDimitry Andric   if (MaybeAlign StackAlign =
351*0fca6ea1SDimitry Andric           F.getAttributes().getAttributes(Index).getStackAlignment())
352*0fca6ea1SDimitry Andric     return StackAlign;
353*0fca6ea1SDimitry Andric 
354*0fca6ea1SDimitry Andric   // If that is missing, check the legacy nvvm metadata
3550b57cec5SDimitry Andric   std::vector<unsigned> Vs;
3560b57cec5SDimitry Andric   bool retval = findAllNVVMAnnotation(&F, "align", Vs);
3570b57cec5SDimitry Andric   if (!retval)
358*0fca6ea1SDimitry Andric     return std::nullopt;
359*0fca6ea1SDimitry Andric   for (unsigned V : Vs)
360*0fca6ea1SDimitry Andric     if ((V >> 16) == Index)
361*0fca6ea1SDimitry Andric       return Align(V & 0xFFFF);
362*0fca6ea1SDimitry Andric 
363*0fca6ea1SDimitry Andric   return std::nullopt;
3640b57cec5SDimitry Andric }
3650b57cec5SDimitry Andric 
getAlign(const CallInst & I,unsigned Index)366*0fca6ea1SDimitry Andric MaybeAlign getAlign(const CallInst &I, unsigned Index) {
367*0fca6ea1SDimitry Andric   // First check the alignstack metadata
368*0fca6ea1SDimitry Andric   if (MaybeAlign StackAlign =
369*0fca6ea1SDimitry Andric           I.getAttributes().getAttributes(Index).getStackAlignment())
370*0fca6ea1SDimitry Andric     return StackAlign;
371*0fca6ea1SDimitry Andric 
372*0fca6ea1SDimitry Andric   // If that is missing, check the legacy nvvm metadata
3730b57cec5SDimitry Andric   if (MDNode *alignNode = I.getMetadata("callalign")) {
3740b57cec5SDimitry Andric     for (int i = 0, n = alignNode->getNumOperands(); i < n; i++) {
3750b57cec5SDimitry Andric       if (const ConstantInt *CI =
3760b57cec5SDimitry Andric               mdconst::dyn_extract<ConstantInt>(alignNode->getOperand(i))) {
377*0fca6ea1SDimitry Andric         unsigned V = CI->getZExtValue();
378*0fca6ea1SDimitry Andric         if ((V >> 16) == Index)
379*0fca6ea1SDimitry Andric           return Align(V & 0xFFFF);
380*0fca6ea1SDimitry Andric         if ((V >> 16) > Index)
381*0fca6ea1SDimitry Andric           return std::nullopt;
3820b57cec5SDimitry Andric       }
3830b57cec5SDimitry Andric     }
3840b57cec5SDimitry Andric   }
385*0fca6ea1SDimitry Andric   return std::nullopt;
3860b57cec5SDimitry Andric }
3870b57cec5SDimitry Andric 
getMaybeBitcastedCallee(const CallBase * CB)388bdd1243dSDimitry Andric Function *getMaybeBitcastedCallee(const CallBase *CB) {
389bdd1243dSDimitry Andric   return dyn_cast<Function>(CB->getCalledOperand()->stripPointerCasts());
390bdd1243dSDimitry Andric }
391bdd1243dSDimitry Andric 
shouldEmitPTXNoReturn(const Value * V,const TargetMachine & TM)392bdd1243dSDimitry Andric bool shouldEmitPTXNoReturn(const Value *V, const TargetMachine &TM) {
393bdd1243dSDimitry Andric   const auto &ST =
394bdd1243dSDimitry Andric       *static_cast<const NVPTXTargetMachine &>(TM).getSubtargetImpl();
395bdd1243dSDimitry Andric   if (!ST.hasNoReturn())
396bdd1243dSDimitry Andric     return false;
397bdd1243dSDimitry Andric 
398bdd1243dSDimitry Andric   assert((isa<Function>(V) || isa<CallInst>(V)) &&
399bdd1243dSDimitry Andric          "Expect either a call instruction or a function");
400bdd1243dSDimitry Andric 
401bdd1243dSDimitry Andric   if (const CallInst *CallI = dyn_cast<CallInst>(V))
402bdd1243dSDimitry Andric     return CallI->doesNotReturn() &&
403bdd1243dSDimitry Andric            CallI->getFunctionType()->getReturnType()->isVoidTy();
404bdd1243dSDimitry Andric 
405bdd1243dSDimitry Andric   const Function *F = cast<Function>(V);
406bdd1243dSDimitry Andric   return F->doesNotReturn() &&
407bdd1243dSDimitry Andric          F->getFunctionType()->getReturnType()->isVoidTy() &&
408bdd1243dSDimitry Andric          !isKernelFunction(*F);
409bdd1243dSDimitry Andric }
410bdd1243dSDimitry Andric 
Isv2x16VT(EVT VT)4115f757f3fSDimitry Andric bool Isv2x16VT(EVT VT) {
4125f757f3fSDimitry Andric   return (VT == MVT::v2f16 || VT == MVT::v2bf16 || VT == MVT::v2i16);
4135f757f3fSDimitry Andric }
4145f757f3fSDimitry Andric 
4150b57cec5SDimitry Andric } // namespace llvm
416