xref: /freebsd/contrib/llvm-project/llvm/lib/Target/NVPTX/NVPTXSubtarget.cpp (revision 357378bbdedf24ce2b90e9bd831af4a9db3ec70a)
1 //===- NVPTXSubtarget.cpp - NVPTX Subtarget Information -------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements the NVPTX specific subclass of TargetSubtarget.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "NVPTXSubtarget.h"
14 #include "NVPTXTargetMachine.h"
15 
16 using namespace llvm;
17 
18 #define DEBUG_TYPE "nvptx-subtarget"
19 
20 #define GET_SUBTARGETINFO_ENUM
21 #define GET_SUBTARGETINFO_TARGET_DESC
22 #define GET_SUBTARGETINFO_CTOR
23 #include "NVPTXGenSubtargetInfo.inc"
24 
25 static cl::opt<bool>
26     NoF16Math("nvptx-no-f16-math", cl::Hidden,
27               cl::desc("NVPTX Specific: Disable generation of f16 math ops."),
28               cl::init(false));
29 // Pin the vtable to this file.
30 void NVPTXSubtarget::anchor() {}
31 
32 NVPTXSubtarget &NVPTXSubtarget::initializeSubtargetDependencies(StringRef CPU,
33                                                                 StringRef FS) {
34     // Provide the default CPU if we don't have one.
35     TargetName = std::string(CPU.empty() ? "sm_30" : CPU);
36 
37     ParseSubtargetFeatures(TargetName, /*TuneCPU*/ TargetName, FS);
38 
39     // Re-map SM version numbers, SmVersion carries the regular SMs which do
40     // have relative order, while FullSmVersion allows distinguishing sm_90 from
41     // sm_90a, which would *not* be a subset of sm_91.
42     SmVersion = getSmVersion();
43 
44     // Set default to PTX 6.0 (CUDA 9.0)
45     if (PTXVersion == 0) {
46       PTXVersion = 60;
47   }
48 
49   return *this;
50 }
51 
52 NVPTXSubtarget::NVPTXSubtarget(const Triple &TT, const std::string &CPU,
53                                const std::string &FS,
54                                const NVPTXTargetMachine &TM)
55     : NVPTXGenSubtargetInfo(TT, CPU, /*TuneCPU*/ CPU, FS), PTXVersion(0),
56       FullSmVersion(200), SmVersion(getSmVersion()), TM(TM),
57       TLInfo(TM, initializeSubtargetDependencies(CPU, FS)) {}
58 
59 bool NVPTXSubtarget::hasImageHandles() const {
60   // Enable handles for Kepler+, where CUDA supports indirect surfaces and
61   // textures
62   if (TM.getDrvInterface() == NVPTX::CUDA)
63     return (SmVersion >= 30);
64 
65   // Disabled, otherwise
66   return false;
67 }
68 
69 bool NVPTXSubtarget::allowFP16Math() const {
70   return hasFP16Math() && NoF16Math == false;
71 }
72