10b57cec5SDimitry Andric //===--- Cuda.h - Cuda ToolChain Implementations ----------------*- C++ -*-===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric 90b57cec5SDimitry Andric #ifndef LLVM_CLANG_LIB_DRIVER_TOOLCHAINS_CUDA_H 100b57cec5SDimitry Andric #define LLVM_CLANG_LIB_DRIVER_TOOLCHAINS_CUDA_H 110b57cec5SDimitry Andric 120b57cec5SDimitry Andric #include "clang/Basic/Cuda.h" 130b57cec5SDimitry Andric #include "clang/Driver/Action.h" 140b57cec5SDimitry Andric #include "clang/Driver/Multilib.h" 150b57cec5SDimitry Andric #include "clang/Driver/Tool.h" 160b57cec5SDimitry Andric #include "clang/Driver/ToolChain.h" 170b57cec5SDimitry Andric #include "llvm/Support/Compiler.h" 180b57cec5SDimitry Andric #include "llvm/Support/VersionTuple.h" 19e8d8bef9SDimitry Andric #include <bitset> 200b57cec5SDimitry Andric #include <set> 210b57cec5SDimitry Andric #include <vector> 220b57cec5SDimitry Andric 230b57cec5SDimitry Andric namespace clang { 240b57cec5SDimitry Andric namespace driver { 250b57cec5SDimitry Andric 260b57cec5SDimitry Andric /// A class to find a viable CUDA installation 270b57cec5SDimitry Andric class CudaInstallationDetector { 280b57cec5SDimitry Andric private: 290b57cec5SDimitry Andric const Driver &D; 300b57cec5SDimitry Andric bool IsValid = false; 310b57cec5SDimitry Andric CudaVersion Version = CudaVersion::UNKNOWN; 320b57cec5SDimitry Andric std::string InstallPath; 330b57cec5SDimitry Andric std::string BinPath; 340b57cec5SDimitry Andric std::string LibDevicePath; 350b57cec5SDimitry Andric std::string IncludePath; 360b57cec5SDimitry Andric llvm::StringMap<std::string> LibDeviceMap; 370b57cec5SDimitry Andric 380b57cec5SDimitry Andric // CUDA architectures for which we have raised an error in 390b57cec5SDimitry Andric // CheckCudaVersionSupportsArch. 40*0fca6ea1SDimitry Andric mutable std::bitset<(int)OffloadArch::LAST> ArchsWithBadVersion; 410b57cec5SDimitry Andric 420b57cec5SDimitry Andric public: 430b57cec5SDimitry Andric CudaInstallationDetector(const Driver &D, const llvm::Triple &HostTriple, 440b57cec5SDimitry Andric const llvm::opt::ArgList &Args); 450b57cec5SDimitry Andric 460b57cec5SDimitry Andric void AddCudaIncludeArgs(const llvm::opt::ArgList &DriverArgs, 470b57cec5SDimitry Andric llvm::opt::ArgStringList &CC1Args) const; 480b57cec5SDimitry Andric 490b57cec5SDimitry Andric /// Emit an error if Version does not support the given Arch. 500b57cec5SDimitry Andric /// 510b57cec5SDimitry Andric /// If either Version or Arch is unknown, does not emit an error. Emits at 520b57cec5SDimitry Andric /// most one error per Arch. 53*0fca6ea1SDimitry Andric void CheckCudaVersionSupportsArch(OffloadArch Arch) const; 540b57cec5SDimitry Andric 550b57cec5SDimitry Andric /// Check whether we detected a valid Cuda install. isValid()560b57cec5SDimitry Andric bool isValid() const { return IsValid; } 570b57cec5SDimitry Andric /// Print information about the detected CUDA installation. 580b57cec5SDimitry Andric void print(raw_ostream &OS) const; 590b57cec5SDimitry Andric 600b57cec5SDimitry Andric /// Get the detected Cuda install's version. version()61349cc55cSDimitry Andric CudaVersion version() const { 62349cc55cSDimitry Andric return Version == CudaVersion::NEW ? CudaVersion::PARTIALLY_SUPPORTED 63349cc55cSDimitry Andric : Version; 64349cc55cSDimitry Andric } 650b57cec5SDimitry Andric /// Get the detected Cuda installation path. getInstallPath()660b57cec5SDimitry Andric StringRef getInstallPath() const { return InstallPath; } 670b57cec5SDimitry Andric /// Get the detected path to Cuda's bin directory. getBinPath()680b57cec5SDimitry Andric StringRef getBinPath() const { return BinPath; } 690b57cec5SDimitry Andric /// Get the detected Cuda Include path. getIncludePath()700b57cec5SDimitry Andric StringRef getIncludePath() const { return IncludePath; } 710b57cec5SDimitry Andric /// Get the detected Cuda device library path. getLibDevicePath()720b57cec5SDimitry Andric StringRef getLibDevicePath() const { return LibDevicePath; } 730b57cec5SDimitry Andric /// Get libdevice file for given architecture getLibDeviceFile(StringRef Gpu)740b57cec5SDimitry Andric std::string getLibDeviceFile(StringRef Gpu) const { 750b57cec5SDimitry Andric return LibDeviceMap.lookup(Gpu); 760b57cec5SDimitry Andric } 77aec4c088SDimitry Andric void WarnIfUnsupportedVersion(); 780b57cec5SDimitry Andric }; 790b57cec5SDimitry Andric 800b57cec5SDimitry Andric namespace tools { 810b57cec5SDimitry Andric namespace NVPTX { 820b57cec5SDimitry Andric 830b57cec5SDimitry Andric // Run ptxas, the NVPTX assembler. 845f757f3fSDimitry Andric class LLVM_LIBRARY_VISIBILITY Assembler final : public Tool { 850b57cec5SDimitry Andric public: Assembler(const ToolChain & TC)865ffd83dbSDimitry Andric Assembler(const ToolChain &TC) : Tool("NVPTX::Assembler", "ptxas", TC) {} 870b57cec5SDimitry Andric hasIntegratedCPP()880b57cec5SDimitry Andric bool hasIntegratedCPP() const override { return false; } 890b57cec5SDimitry Andric 900b57cec5SDimitry Andric void ConstructJob(Compilation &C, const JobAction &JA, 910b57cec5SDimitry Andric const InputInfo &Output, const InputInfoList &Inputs, 920b57cec5SDimitry Andric const llvm::opt::ArgList &TCArgs, 930b57cec5SDimitry Andric const char *LinkingOutput) const override; 940b57cec5SDimitry Andric }; 950b57cec5SDimitry Andric 960b57cec5SDimitry Andric // Runs fatbinary, which combines GPU object files ("cubin" files) and/or PTX 970b57cec5SDimitry Andric // assembly into a single output file. 98bdd1243dSDimitry Andric class LLVM_LIBRARY_VISIBILITY FatBinary : public Tool { 990b57cec5SDimitry Andric public: FatBinary(const ToolChain & TC)100bdd1243dSDimitry Andric FatBinary(const ToolChain &TC) : Tool("NVPTX::Linker", "fatbinary", TC) {} 1010b57cec5SDimitry Andric hasIntegratedCPP()1020b57cec5SDimitry Andric bool hasIntegratedCPP() const override { return false; } 1030b57cec5SDimitry Andric 1040b57cec5SDimitry Andric void ConstructJob(Compilation &C, const JobAction &JA, 1050b57cec5SDimitry Andric const InputInfo &Output, const InputInfoList &Inputs, 1060b57cec5SDimitry Andric const llvm::opt::ArgList &TCArgs, 1070b57cec5SDimitry Andric const char *LinkingOutput) const override; 1080b57cec5SDimitry Andric }; 1090b57cec5SDimitry Andric 110bdd1243dSDimitry Andric // Runs nvlink, which links GPU object files ("cubin" files) into a single file. 1115f757f3fSDimitry Andric class LLVM_LIBRARY_VISIBILITY Linker final : public Tool { 1120b57cec5SDimitry Andric public: Linker(const ToolChain & TC)1135f757f3fSDimitry Andric Linker(const ToolChain &TC) : Tool("NVPTX::Linker", "nvlink", TC) {} 1140b57cec5SDimitry Andric hasIntegratedCPP()1150b57cec5SDimitry Andric bool hasIntegratedCPP() const override { return false; } 1160b57cec5SDimitry Andric 1170b57cec5SDimitry Andric void ConstructJob(Compilation &C, const JobAction &JA, 1180b57cec5SDimitry Andric const InputInfo &Output, const InputInfoList &Inputs, 1190b57cec5SDimitry Andric const llvm::opt::ArgList &TCArgs, 1200b57cec5SDimitry Andric const char *LinkingOutput) const override; 1210b57cec5SDimitry Andric }; 1220b57cec5SDimitry Andric 12381ad6265SDimitry Andric void getNVPTXTargetFeatures(const Driver &D, const llvm::Triple &Triple, 12481ad6265SDimitry Andric const llvm::opt::ArgList &Args, 12581ad6265SDimitry Andric std::vector<StringRef> &Features); 12681ad6265SDimitry Andric 1270b57cec5SDimitry Andric } // end namespace NVPTX 1280b57cec5SDimitry Andric } // end namespace tools 1290b57cec5SDimitry Andric 1300b57cec5SDimitry Andric namespace toolchains { 1310b57cec5SDimitry Andric 132bdd1243dSDimitry Andric class LLVM_LIBRARY_VISIBILITY NVPTXToolChain : public ToolChain { 1330b57cec5SDimitry Andric public: 134bdd1243dSDimitry Andric NVPTXToolChain(const Driver &D, const llvm::Triple &Triple, 13506c3fb27SDimitry Andric const llvm::Triple &HostTriple, const llvm::opt::ArgList &Args, 13606c3fb27SDimitry Andric bool Freestanding); 1370b57cec5SDimitry Andric 138bdd1243dSDimitry Andric NVPTXToolChain(const Driver &D, const llvm::Triple &Triple, 139bdd1243dSDimitry Andric const llvm::opt::ArgList &Args); 1400b57cec5SDimitry Andric 1410b57cec5SDimitry Andric llvm::opt::DerivedArgList * 1420b57cec5SDimitry Andric TranslateArgs(const llvm::opt::DerivedArgList &Args, StringRef BoundArch, 1430b57cec5SDimitry Andric Action::OffloadKind DeviceOffloadKind) const override; 1445ffd83dbSDimitry Andric 14506c3fb27SDimitry Andric void 14606c3fb27SDimitry Andric addClangTargetOptions(const llvm::opt::ArgList &DriverArgs, 14706c3fb27SDimitry Andric llvm::opt::ArgStringList &CC1Args, 14806c3fb27SDimitry Andric Action::OffloadKind DeviceOffloadKind) const override; 14906c3fb27SDimitry Andric 1500b57cec5SDimitry Andric // Never try to use the integrated assembler with CUDA; always fork out to 1510b57cec5SDimitry Andric // ptxas. useIntegratedAs()1520b57cec5SDimitry Andric bool useIntegratedAs() const override { return false; } isCrossCompiling()1530b57cec5SDimitry Andric bool isCrossCompiling() const override { return true; } isPICDefault()1540b57cec5SDimitry Andric bool isPICDefault() const override { return false; } isPIEDefault(const llvm::opt::ArgList & Args)155349cc55cSDimitry Andric bool isPIEDefault(const llvm::opt::ArgList &Args) const override { 156349cc55cSDimitry Andric return false; 157349cc55cSDimitry Andric } HasNativeLLVMSupport()158*0fca6ea1SDimitry Andric bool HasNativeLLVMSupport() const override { return true; } isPICDefaultForced()1590b57cec5SDimitry Andric bool isPICDefaultForced() const override { return false; } SupportsProfiling()1600b57cec5SDimitry Andric bool SupportsProfiling() const override { return false; } 161bdd1243dSDimitry Andric IsMathErrnoDefault()162bdd1243dSDimitry Andric bool IsMathErrnoDefault() const override { return false; } 163bdd1243dSDimitry Andric 1640b57cec5SDimitry Andric bool supportsDebugInfoOption(const llvm::opt::Arg *A) const override; 16506c3fb27SDimitry Andric void adjustDebugInfoKind(llvm::codegenoptions::DebugInfoKind &DebugInfoKind, 1660b57cec5SDimitry Andric const llvm::opt::ArgList &Args) const override; 167bdd1243dSDimitry Andric 168bdd1243dSDimitry Andric // NVPTX supports only DWARF2. GetDefaultDwarfVersion()169bdd1243dSDimitry Andric unsigned GetDefaultDwarfVersion() const override { return 2; } getMaxDwarfVersion()170bdd1243dSDimitry Andric unsigned getMaxDwarfVersion() const override { return 2; } 171bdd1243dSDimitry Andric 172*0fca6ea1SDimitry Andric /// Uses nvptx-arch tool to get arch of the system GPU. Will return error 173*0fca6ea1SDimitry Andric /// if unable to find one. 174*0fca6ea1SDimitry Andric virtual Expected<SmallVector<std::string>> 175*0fca6ea1SDimitry Andric getSystemGPUArchs(const llvm::opt::ArgList &Args) const override; 176*0fca6ea1SDimitry Andric 177bdd1243dSDimitry Andric CudaInstallationDetector CudaInstallation; 178bdd1243dSDimitry Andric 179bdd1243dSDimitry Andric protected: 180bdd1243dSDimitry Andric Tool *buildAssembler() const override; // ptxas. 181bdd1243dSDimitry Andric Tool *buildLinker() const override; // nvlink. 18206c3fb27SDimitry Andric 18306c3fb27SDimitry Andric private: 18406c3fb27SDimitry Andric bool Freestanding = false; 185bdd1243dSDimitry Andric }; 186bdd1243dSDimitry Andric 187bdd1243dSDimitry Andric class LLVM_LIBRARY_VISIBILITY CudaToolChain : public NVPTXToolChain { 188bdd1243dSDimitry Andric public: 189bdd1243dSDimitry Andric CudaToolChain(const Driver &D, const llvm::Triple &Triple, 190bdd1243dSDimitry Andric const ToolChain &HostTC, const llvm::opt::ArgList &Args); 191bdd1243dSDimitry Andric getAuxTriple()192bdd1243dSDimitry Andric const llvm::Triple *getAuxTriple() const override { 193bdd1243dSDimitry Andric return &HostTC.getTriple(); 194bdd1243dSDimitry Andric } 195bdd1243dSDimitry Andric HasNativeLLVMSupport()196*0fca6ea1SDimitry Andric bool HasNativeLLVMSupport() const override { return false; } 197*0fca6ea1SDimitry Andric 198bdd1243dSDimitry Andric std::string getInputFilename(const InputInfo &Input) const override; 199bdd1243dSDimitry Andric 200bdd1243dSDimitry Andric llvm::opt::DerivedArgList * 201bdd1243dSDimitry Andric TranslateArgs(const llvm::opt::DerivedArgList &Args, StringRef BoundArch, 202bdd1243dSDimitry Andric Action::OffloadKind DeviceOffloadKind) const override; 203bdd1243dSDimitry Andric void 204bdd1243dSDimitry Andric addClangTargetOptions(const llvm::opt::ArgList &DriverArgs, 205bdd1243dSDimitry Andric llvm::opt::ArgStringList &CC1Args, 206bdd1243dSDimitry Andric Action::OffloadKind DeviceOffloadKind) const override; 207bdd1243dSDimitry Andric 208bdd1243dSDimitry Andric llvm::DenormalMode getDefaultDenormalModeForType( 209bdd1243dSDimitry Andric const llvm::opt::ArgList &DriverArgs, const JobAction &JA, 210bdd1243dSDimitry Andric const llvm::fltSemantics *FPType = nullptr) const override; 2110b57cec5SDimitry Andric 2120b57cec5SDimitry Andric void AddCudaIncludeArgs(const llvm::opt::ArgList &DriverArgs, 2130b57cec5SDimitry Andric llvm::opt::ArgStringList &CC1Args) const override; 2140b57cec5SDimitry Andric 2150b57cec5SDimitry Andric void addClangWarningOptions(llvm::opt::ArgStringList &CC1Args) const override; 2160b57cec5SDimitry Andric CXXStdlibType GetCXXStdlibType(const llvm::opt::ArgList &Args) const override; 2170b57cec5SDimitry Andric void 2180b57cec5SDimitry Andric AddClangSystemIncludeArgs(const llvm::opt::ArgList &DriverArgs, 2190b57cec5SDimitry Andric llvm::opt::ArgStringList &CC1Args) const override; 2200b57cec5SDimitry Andric void AddClangCXXStdlibIncludeArgs( 2210b57cec5SDimitry Andric const llvm::opt::ArgList &Args, 2220b57cec5SDimitry Andric llvm::opt::ArgStringList &CC1Args) const override; 2230b57cec5SDimitry Andric void AddIAMCUIncludeArgs(const llvm::opt::ArgList &DriverArgs, 2240b57cec5SDimitry Andric llvm::opt::ArgStringList &CC1Args) const override; 2250b57cec5SDimitry Andric 2260b57cec5SDimitry Andric SanitizerMask getSupportedSanitizers() const override; 2270b57cec5SDimitry Andric 2280b57cec5SDimitry Andric VersionTuple 2290b57cec5SDimitry Andric computeMSVCVersion(const Driver *D, 2300b57cec5SDimitry Andric const llvm::opt::ArgList &Args) const override; 2310b57cec5SDimitry Andric 2320b57cec5SDimitry Andric const ToolChain &HostTC; 233bdd1243dSDimitry Andric 2340b57cec5SDimitry Andric protected: 2350b57cec5SDimitry Andric Tool *buildAssembler() const override; // ptxas 2360b57cec5SDimitry Andric Tool *buildLinker() const override; // fatbinary (ok, not really a linker) 2370b57cec5SDimitry Andric }; 2380b57cec5SDimitry Andric 2390b57cec5SDimitry Andric } // end namespace toolchains 2400b57cec5SDimitry Andric } // end namespace driver 2410b57cec5SDimitry Andric } // end namespace clang 2420b57cec5SDimitry Andric 2430b57cec5SDimitry Andric #endif // LLVM_CLANG_LIB_DRIVER_TOOLCHAINS_CUDA_H 244