10b57cec5SDimitry Andric //===--- Cuda.h - Cuda ToolChain Implementations ----------------*- C++ -*-===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric 90b57cec5SDimitry Andric #ifndef LLVM_CLANG_LIB_DRIVER_TOOLCHAINS_CUDA_H 100b57cec5SDimitry Andric #define LLVM_CLANG_LIB_DRIVER_TOOLCHAINS_CUDA_H 110b57cec5SDimitry Andric 120b57cec5SDimitry Andric #include "clang/Basic/Cuda.h" 130b57cec5SDimitry Andric #include "clang/Driver/Action.h" 140b57cec5SDimitry Andric #include "clang/Driver/Multilib.h" 150b57cec5SDimitry Andric #include "clang/Driver/Tool.h" 160b57cec5SDimitry Andric #include "clang/Driver/ToolChain.h" 170b57cec5SDimitry Andric #include "llvm/Support/Compiler.h" 180b57cec5SDimitry Andric #include "llvm/Support/VersionTuple.h" 19e8d8bef9SDimitry Andric #include <bitset> 200b57cec5SDimitry Andric #include <set> 210b57cec5SDimitry Andric #include <vector> 220b57cec5SDimitry Andric 230b57cec5SDimitry Andric namespace clang { 240b57cec5SDimitry Andric namespace driver { 250b57cec5SDimitry Andric 260b57cec5SDimitry Andric /// A class to find a viable CUDA installation 270b57cec5SDimitry Andric class CudaInstallationDetector { 280b57cec5SDimitry Andric private: 290b57cec5SDimitry Andric const Driver &D; 300b57cec5SDimitry Andric bool IsValid = false; 310b57cec5SDimitry Andric CudaVersion Version = CudaVersion::UNKNOWN; 320b57cec5SDimitry Andric std::string InstallPath; 330b57cec5SDimitry Andric std::string BinPath; 340b57cec5SDimitry Andric std::string LibDevicePath; 350b57cec5SDimitry Andric std::string IncludePath; 360b57cec5SDimitry Andric llvm::StringMap<std::string> LibDeviceMap; 370b57cec5SDimitry Andric 380b57cec5SDimitry Andric // CUDA architectures for which we have raised an error in 390b57cec5SDimitry Andric // CheckCudaVersionSupportsArch. 40e8d8bef9SDimitry Andric mutable std::bitset<(int)CudaArch::LAST> ArchsWithBadVersion; 410b57cec5SDimitry Andric 420b57cec5SDimitry Andric public: 430b57cec5SDimitry Andric CudaInstallationDetector(const Driver &D, const llvm::Triple &HostTriple, 440b57cec5SDimitry Andric const llvm::opt::ArgList &Args); 450b57cec5SDimitry Andric 460b57cec5SDimitry Andric void AddCudaIncludeArgs(const llvm::opt::ArgList &DriverArgs, 470b57cec5SDimitry Andric llvm::opt::ArgStringList &CC1Args) const; 480b57cec5SDimitry Andric 490b57cec5SDimitry Andric /// Emit an error if Version does not support the given Arch. 500b57cec5SDimitry Andric /// 510b57cec5SDimitry Andric /// If either Version or Arch is unknown, does not emit an error. Emits at 520b57cec5SDimitry Andric /// most one error per Arch. 530b57cec5SDimitry Andric void CheckCudaVersionSupportsArch(CudaArch Arch) const; 540b57cec5SDimitry Andric 550b57cec5SDimitry Andric /// Check whether we detected a valid Cuda install. 560b57cec5SDimitry Andric bool isValid() const { return IsValid; } 570b57cec5SDimitry Andric /// Print information about the detected CUDA installation. 580b57cec5SDimitry Andric void print(raw_ostream &OS) const; 590b57cec5SDimitry Andric 600b57cec5SDimitry Andric /// Get the detected Cuda install's version. 61349cc55cSDimitry Andric CudaVersion version() const { 62349cc55cSDimitry Andric return Version == CudaVersion::NEW ? CudaVersion::PARTIALLY_SUPPORTED 63349cc55cSDimitry Andric : Version; 64349cc55cSDimitry Andric } 650b57cec5SDimitry Andric /// Get the detected Cuda installation path. 660b57cec5SDimitry Andric StringRef getInstallPath() const { return InstallPath; } 670b57cec5SDimitry Andric /// Get the detected path to Cuda's bin directory. 680b57cec5SDimitry Andric StringRef getBinPath() const { return BinPath; } 690b57cec5SDimitry Andric /// Get the detected Cuda Include path. 700b57cec5SDimitry Andric StringRef getIncludePath() const { return IncludePath; } 710b57cec5SDimitry Andric /// Get the detected Cuda device library path. 720b57cec5SDimitry Andric StringRef getLibDevicePath() const { return LibDevicePath; } 730b57cec5SDimitry Andric /// Get libdevice file for given architecture 740b57cec5SDimitry Andric std::string getLibDeviceFile(StringRef Gpu) const { 750b57cec5SDimitry Andric return LibDeviceMap.lookup(Gpu); 760b57cec5SDimitry Andric } 77aec4c088SDimitry Andric void WarnIfUnsupportedVersion(); 780b57cec5SDimitry Andric }; 790b57cec5SDimitry Andric 800b57cec5SDimitry Andric namespace tools { 810b57cec5SDimitry Andric namespace NVPTX { 820b57cec5SDimitry Andric 830b57cec5SDimitry Andric // Run ptxas, the NVPTX assembler. 840b57cec5SDimitry Andric class LLVM_LIBRARY_VISIBILITY Assembler : public Tool { 850b57cec5SDimitry Andric public: 865ffd83dbSDimitry Andric Assembler(const ToolChain &TC) : Tool("NVPTX::Assembler", "ptxas", TC) {} 870b57cec5SDimitry Andric 880b57cec5SDimitry Andric bool hasIntegratedCPP() const override { return false; } 890b57cec5SDimitry Andric 900b57cec5SDimitry Andric void ConstructJob(Compilation &C, const JobAction &JA, 910b57cec5SDimitry Andric const InputInfo &Output, const InputInfoList &Inputs, 920b57cec5SDimitry Andric const llvm::opt::ArgList &TCArgs, 930b57cec5SDimitry Andric const char *LinkingOutput) const override; 940b57cec5SDimitry Andric }; 950b57cec5SDimitry Andric 960b57cec5SDimitry Andric // Runs fatbinary, which combines GPU object files ("cubin" files) and/or PTX 970b57cec5SDimitry Andric // assembly into a single output file. 98*bdd1243dSDimitry Andric class LLVM_LIBRARY_VISIBILITY FatBinary : public Tool { 990b57cec5SDimitry Andric public: 100*bdd1243dSDimitry Andric FatBinary(const ToolChain &TC) : Tool("NVPTX::Linker", "fatbinary", TC) {} 1010b57cec5SDimitry Andric 1020b57cec5SDimitry Andric bool hasIntegratedCPP() const override { return false; } 1030b57cec5SDimitry Andric 1040b57cec5SDimitry Andric void ConstructJob(Compilation &C, const JobAction &JA, 1050b57cec5SDimitry Andric const InputInfo &Output, const InputInfoList &Inputs, 1060b57cec5SDimitry Andric const llvm::opt::ArgList &TCArgs, 1070b57cec5SDimitry Andric const char *LinkingOutput) const override; 1080b57cec5SDimitry Andric }; 1090b57cec5SDimitry Andric 110*bdd1243dSDimitry Andric // Runs nvlink, which links GPU object files ("cubin" files) into a single file. 111*bdd1243dSDimitry Andric class LLVM_LIBRARY_VISIBILITY Linker : public Tool { 1120b57cec5SDimitry Andric public: 113*bdd1243dSDimitry Andric Linker(const ToolChain &TC) : Tool("NVPTX::Linker", "fatbinary", TC) {} 1140b57cec5SDimitry Andric 1150b57cec5SDimitry Andric bool hasIntegratedCPP() const override { return false; } 1160b57cec5SDimitry Andric 1170b57cec5SDimitry Andric void ConstructJob(Compilation &C, const JobAction &JA, 1180b57cec5SDimitry Andric const InputInfo &Output, const InputInfoList &Inputs, 1190b57cec5SDimitry Andric const llvm::opt::ArgList &TCArgs, 1200b57cec5SDimitry Andric const char *LinkingOutput) const override; 1210b57cec5SDimitry Andric }; 1220b57cec5SDimitry Andric 12381ad6265SDimitry Andric void getNVPTXTargetFeatures(const Driver &D, const llvm::Triple &Triple, 12481ad6265SDimitry Andric const llvm::opt::ArgList &Args, 12581ad6265SDimitry Andric std::vector<StringRef> &Features); 12681ad6265SDimitry Andric 1270b57cec5SDimitry Andric } // end namespace NVPTX 1280b57cec5SDimitry Andric } // end namespace tools 1290b57cec5SDimitry Andric 1300b57cec5SDimitry Andric namespace toolchains { 1310b57cec5SDimitry Andric 132*bdd1243dSDimitry Andric class LLVM_LIBRARY_VISIBILITY NVPTXToolChain : public ToolChain { 1330b57cec5SDimitry Andric public: 134*bdd1243dSDimitry Andric NVPTXToolChain(const Driver &D, const llvm::Triple &Triple, 135*bdd1243dSDimitry Andric const llvm::Triple &HostTriple, 136*bdd1243dSDimitry Andric const llvm::opt::ArgList &Args); 1370b57cec5SDimitry Andric 138*bdd1243dSDimitry Andric NVPTXToolChain(const Driver &D, const llvm::Triple &Triple, 139*bdd1243dSDimitry Andric const llvm::opt::ArgList &Args); 1400b57cec5SDimitry Andric 1410b57cec5SDimitry Andric llvm::opt::DerivedArgList * 1420b57cec5SDimitry Andric TranslateArgs(const llvm::opt::DerivedArgList &Args, StringRef BoundArch, 1430b57cec5SDimitry Andric Action::OffloadKind DeviceOffloadKind) const override; 1445ffd83dbSDimitry Andric 1450b57cec5SDimitry Andric // Never try to use the integrated assembler with CUDA; always fork out to 1460b57cec5SDimitry Andric // ptxas. 1470b57cec5SDimitry Andric bool useIntegratedAs() const override { return false; } 1480b57cec5SDimitry Andric bool isCrossCompiling() const override { return true; } 1490b57cec5SDimitry Andric bool isPICDefault() const override { return false; } 150349cc55cSDimitry Andric bool isPIEDefault(const llvm::opt::ArgList &Args) const override { 151349cc55cSDimitry Andric return false; 152349cc55cSDimitry Andric } 1530b57cec5SDimitry Andric bool isPICDefaultForced() const override { return false; } 1540b57cec5SDimitry Andric bool SupportsProfiling() const override { return false; } 155*bdd1243dSDimitry Andric 156*bdd1243dSDimitry Andric bool IsMathErrnoDefault() const override { return false; } 157*bdd1243dSDimitry Andric 1580b57cec5SDimitry Andric bool supportsDebugInfoOption(const llvm::opt::Arg *A) const override; 1590b57cec5SDimitry Andric void adjustDebugInfoKind(codegenoptions::DebugInfoKind &DebugInfoKind, 1600b57cec5SDimitry Andric const llvm::opt::ArgList &Args) const override; 161*bdd1243dSDimitry Andric 162*bdd1243dSDimitry Andric // NVPTX supports only DWARF2. 163*bdd1243dSDimitry Andric unsigned GetDefaultDwarfVersion() const override { return 2; } 164*bdd1243dSDimitry Andric unsigned getMaxDwarfVersion() const override { return 2; } 165*bdd1243dSDimitry Andric 166*bdd1243dSDimitry Andric CudaInstallationDetector CudaInstallation; 167*bdd1243dSDimitry Andric 168*bdd1243dSDimitry Andric protected: 169*bdd1243dSDimitry Andric Tool *buildAssembler() const override; // ptxas. 170*bdd1243dSDimitry Andric Tool *buildLinker() const override; // nvlink. 171*bdd1243dSDimitry Andric }; 172*bdd1243dSDimitry Andric 173*bdd1243dSDimitry Andric class LLVM_LIBRARY_VISIBILITY CudaToolChain : public NVPTXToolChain { 174*bdd1243dSDimitry Andric public: 175*bdd1243dSDimitry Andric CudaToolChain(const Driver &D, const llvm::Triple &Triple, 176*bdd1243dSDimitry Andric const ToolChain &HostTC, const llvm::opt::ArgList &Args); 177*bdd1243dSDimitry Andric 178*bdd1243dSDimitry Andric const llvm::Triple *getAuxTriple() const override { 179*bdd1243dSDimitry Andric return &HostTC.getTriple(); 180*bdd1243dSDimitry Andric } 181*bdd1243dSDimitry Andric 182*bdd1243dSDimitry Andric std::string getInputFilename(const InputInfo &Input) const override; 183*bdd1243dSDimitry Andric 184*bdd1243dSDimitry Andric llvm::opt::DerivedArgList * 185*bdd1243dSDimitry Andric TranslateArgs(const llvm::opt::DerivedArgList &Args, StringRef BoundArch, 186*bdd1243dSDimitry Andric Action::OffloadKind DeviceOffloadKind) const override; 187*bdd1243dSDimitry Andric void 188*bdd1243dSDimitry Andric addClangTargetOptions(const llvm::opt::ArgList &DriverArgs, 189*bdd1243dSDimitry Andric llvm::opt::ArgStringList &CC1Args, 190*bdd1243dSDimitry Andric Action::OffloadKind DeviceOffloadKind) const override; 191*bdd1243dSDimitry Andric 192*bdd1243dSDimitry Andric llvm::DenormalMode getDefaultDenormalModeForType( 193*bdd1243dSDimitry Andric const llvm::opt::ArgList &DriverArgs, const JobAction &JA, 194*bdd1243dSDimitry Andric const llvm::fltSemantics *FPType = nullptr) const override; 1950b57cec5SDimitry Andric 1960b57cec5SDimitry Andric void AddCudaIncludeArgs(const llvm::opt::ArgList &DriverArgs, 1970b57cec5SDimitry Andric llvm::opt::ArgStringList &CC1Args) const override; 1980b57cec5SDimitry Andric 1990b57cec5SDimitry Andric void addClangWarningOptions(llvm::opt::ArgStringList &CC1Args) const override; 2000b57cec5SDimitry Andric CXXStdlibType GetCXXStdlibType(const llvm::opt::ArgList &Args) const override; 2010b57cec5SDimitry Andric void 2020b57cec5SDimitry Andric AddClangSystemIncludeArgs(const llvm::opt::ArgList &DriverArgs, 2030b57cec5SDimitry Andric llvm::opt::ArgStringList &CC1Args) const override; 2040b57cec5SDimitry Andric void AddClangCXXStdlibIncludeArgs( 2050b57cec5SDimitry Andric const llvm::opt::ArgList &Args, 2060b57cec5SDimitry Andric llvm::opt::ArgStringList &CC1Args) const override; 2070b57cec5SDimitry Andric void AddIAMCUIncludeArgs(const llvm::opt::ArgList &DriverArgs, 2080b57cec5SDimitry Andric llvm::opt::ArgStringList &CC1Args) const override; 2090b57cec5SDimitry Andric 2100b57cec5SDimitry Andric SanitizerMask getSupportedSanitizers() const override; 2110b57cec5SDimitry Andric 2120b57cec5SDimitry Andric VersionTuple 2130b57cec5SDimitry Andric computeMSVCVersion(const Driver *D, 2140b57cec5SDimitry Andric const llvm::opt::ArgList &Args) const override; 2150b57cec5SDimitry Andric 2160b57cec5SDimitry Andric const ToolChain &HostTC; 217*bdd1243dSDimitry Andric 218*bdd1243dSDimitry Andric /// Uses nvptx-arch tool to get arch of the system GPU. Will return error 219*bdd1243dSDimitry Andric /// if unable to find one. 220*bdd1243dSDimitry Andric virtual Expected<SmallVector<std::string>> 221*bdd1243dSDimitry Andric getSystemGPUArchs(const llvm::opt::ArgList &Args) const override; 2220b57cec5SDimitry Andric 2230b57cec5SDimitry Andric protected: 2240b57cec5SDimitry Andric Tool *buildAssembler() const override; // ptxas 2250b57cec5SDimitry Andric Tool *buildLinker() const override; // fatbinary (ok, not really a linker) 2260b57cec5SDimitry Andric }; 2270b57cec5SDimitry Andric 2280b57cec5SDimitry Andric } // end namespace toolchains 2290b57cec5SDimitry Andric } // end namespace driver 2300b57cec5SDimitry Andric } // end namespace clang 2310b57cec5SDimitry Andric 2320b57cec5SDimitry Andric #endif // LLVM_CLANG_LIB_DRIVER_TOOLCHAINS_CUDA_H 233