1 //===--- Cuda.h - Cuda ToolChain Implementations ----------------*- C++ -*-===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #ifndef LLVM_CLANG_LIB_DRIVER_TOOLCHAINS_CUDA_H
10 #define LLVM_CLANG_LIB_DRIVER_TOOLCHAINS_CUDA_H
12 #include "clang/Basic/Cuda.h"
13 #include "clang/Driver/Action.h"
14 #include "clang/Driver/Multilib.h"
15 #include "clang/Driver/Tool.h"
16 #include "clang/Driver/ToolChain.h"
17 #include "llvm/Support/Compiler.h"
18 #include "llvm/Support/VersionTuple.h"
26 /// A class to find a viable CUDA installation
27 class CudaInstallationDetector
{
31 CudaVersion Version
= CudaVersion::UNKNOWN
;
32 std::string InstallPath
;
34 std::string LibDevicePath
;
35 std::string IncludePath
;
36 llvm::StringMap
<std::string
> LibDeviceMap
;
38 // CUDA architectures for which we have raised an error in
39 // CheckCudaVersionSupportsArch.
40 mutable std::bitset
<(int)CudaArch::LAST
> ArchsWithBadVersion
;
43 CudaInstallationDetector(const Driver
&D
, const llvm::Triple
&HostTriple
,
44 const llvm::opt::ArgList
&Args
);
46 void AddCudaIncludeArgs(const llvm::opt::ArgList
&DriverArgs
,
47 llvm::opt::ArgStringList
&CC1Args
) const;
49 /// Emit an error if Version does not support the given Arch.
51 /// If either Version or Arch is unknown, does not emit an error. Emits at
52 /// most one error per Arch.
53 void CheckCudaVersionSupportsArch(CudaArch Arch
) const;
55 /// Check whether we detected a valid Cuda install.
56 bool isValid() const { return IsValid
; }
57 /// Print information about the detected CUDA installation.
58 void print(raw_ostream
&OS
) const;
60 /// Get the detected Cuda install's version.
61 CudaVersion
version() const {
62 return Version
== CudaVersion::NEW
? CudaVersion::PARTIALLY_SUPPORTED
65 /// Get the detected Cuda installation path.
66 StringRef
getInstallPath() const { return InstallPath
; }
67 /// Get the detected path to Cuda's bin directory.
68 StringRef
getBinPath() const { return BinPath
; }
69 /// Get the detected Cuda Include path.
70 StringRef
getIncludePath() const { return IncludePath
; }
71 /// Get the detected Cuda device library path.
72 StringRef
getLibDevicePath() const { return LibDevicePath
; }
73 /// Get libdevice file for given architecture
74 std::string
getLibDeviceFile(StringRef Gpu
) const {
75 return LibDeviceMap
.lookup(Gpu
);
77 void WarnIfUnsupportedVersion();
83 // Run ptxas, the NVPTX assembler.
84 class LLVM_LIBRARY_VISIBILITY Assembler final
: public Tool
{
86 Assembler(const ToolChain
&TC
) : Tool("NVPTX::Assembler", "ptxas", TC
) {}
88 bool hasIntegratedCPP() const override
{ return false; }
90 void ConstructJob(Compilation
&C
, const JobAction
&JA
,
91 const InputInfo
&Output
, const InputInfoList
&Inputs
,
92 const llvm::opt::ArgList
&TCArgs
,
93 const char *LinkingOutput
) const override
;
96 // Runs fatbinary, which combines GPU object files ("cubin" files) and/or PTX
97 // assembly into a single output file.
98 class LLVM_LIBRARY_VISIBILITY FatBinary
: public Tool
{
100 FatBinary(const ToolChain
&TC
) : Tool("NVPTX::Linker", "fatbinary", TC
) {}
102 bool hasIntegratedCPP() const override
{ return false; }
104 void ConstructJob(Compilation
&C
, const JobAction
&JA
,
105 const InputInfo
&Output
, const InputInfoList
&Inputs
,
106 const llvm::opt::ArgList
&TCArgs
,
107 const char *LinkingOutput
) const override
;
110 // Runs nvlink, which links GPU object files ("cubin" files) into a single file.
111 class LLVM_LIBRARY_VISIBILITY Linker final
: public Tool
{
113 Linker(const ToolChain
&TC
) : Tool("NVPTX::Linker", "nvlink", TC
) {}
115 bool hasIntegratedCPP() const override
{ return false; }
117 void ConstructJob(Compilation
&C
, const JobAction
&JA
,
118 const InputInfo
&Output
, const InputInfoList
&Inputs
,
119 const llvm::opt::ArgList
&TCArgs
,
120 const char *LinkingOutput
) const override
;
123 void getNVPTXTargetFeatures(const Driver
&D
, const llvm::Triple
&Triple
,
124 const llvm::opt::ArgList
&Args
,
125 std::vector
<StringRef
> &Features
);
127 } // end namespace NVPTX
128 } // end namespace tools
130 namespace toolchains
{
132 class LLVM_LIBRARY_VISIBILITY NVPTXToolChain
: public ToolChain
{
134 NVPTXToolChain(const Driver
&D
, const llvm::Triple
&Triple
,
135 const llvm::Triple
&HostTriple
, const llvm::opt::ArgList
&Args
,
138 NVPTXToolChain(const Driver
&D
, const llvm::Triple
&Triple
,
139 const llvm::opt::ArgList
&Args
);
141 llvm::opt::DerivedArgList
*
142 TranslateArgs(const llvm::opt::DerivedArgList
&Args
, StringRef BoundArch
,
143 Action::OffloadKind DeviceOffloadKind
) const override
;
146 addClangTargetOptions(const llvm::opt::ArgList
&DriverArgs
,
147 llvm::opt::ArgStringList
&CC1Args
,
148 Action::OffloadKind DeviceOffloadKind
) const override
;
150 // Never try to use the integrated assembler with CUDA; always fork out to
152 bool useIntegratedAs() const override
{ return false; }
153 bool isCrossCompiling() const override
{ return true; }
154 bool isPICDefault() const override
{ return false; }
155 bool isPIEDefault(const llvm::opt::ArgList
&Args
) const override
{
158 bool isPICDefaultForced() const override
{ return false; }
159 bool SupportsProfiling() const override
{ return false; }
161 bool IsMathErrnoDefault() const override
{ return false; }
163 bool supportsDebugInfoOption(const llvm::opt::Arg
*A
) const override
;
164 void adjustDebugInfoKind(llvm::codegenoptions::DebugInfoKind
&DebugInfoKind
,
165 const llvm::opt::ArgList
&Args
) const override
;
167 // NVPTX supports only DWARF2.
168 unsigned GetDefaultDwarfVersion() const override
{ return 2; }
169 unsigned getMaxDwarfVersion() const override
{ return 2; }
171 CudaInstallationDetector CudaInstallation
;
174 Tool
*buildAssembler() const override
; // ptxas.
175 Tool
*buildLinker() const override
; // nvlink.
178 bool Freestanding
= false;
181 class LLVM_LIBRARY_VISIBILITY CudaToolChain
: public NVPTXToolChain
{
183 CudaToolChain(const Driver
&D
, const llvm::Triple
&Triple
,
184 const ToolChain
&HostTC
, const llvm::opt::ArgList
&Args
);
186 const llvm::Triple
*getAuxTriple() const override
{
187 return &HostTC
.getTriple();
190 std::string
getInputFilename(const InputInfo
&Input
) const override
;
192 llvm::opt::DerivedArgList
*
193 TranslateArgs(const llvm::opt::DerivedArgList
&Args
, StringRef BoundArch
,
194 Action::OffloadKind DeviceOffloadKind
) const override
;
196 addClangTargetOptions(const llvm::opt::ArgList
&DriverArgs
,
197 llvm::opt::ArgStringList
&CC1Args
,
198 Action::OffloadKind DeviceOffloadKind
) const override
;
200 llvm::DenormalMode
getDefaultDenormalModeForType(
201 const llvm::opt::ArgList
&DriverArgs
, const JobAction
&JA
,
202 const llvm::fltSemantics
*FPType
= nullptr) const override
;
204 void AddCudaIncludeArgs(const llvm::opt::ArgList
&DriverArgs
,
205 llvm::opt::ArgStringList
&CC1Args
) const override
;
207 void addClangWarningOptions(llvm::opt::ArgStringList
&CC1Args
) const override
;
208 CXXStdlibType
GetCXXStdlibType(const llvm::opt::ArgList
&Args
) const override
;
210 AddClangSystemIncludeArgs(const llvm::opt::ArgList
&DriverArgs
,
211 llvm::opt::ArgStringList
&CC1Args
) const override
;
212 void AddClangCXXStdlibIncludeArgs(
213 const llvm::opt::ArgList
&Args
,
214 llvm::opt::ArgStringList
&CC1Args
) const override
;
215 void AddIAMCUIncludeArgs(const llvm::opt::ArgList
&DriverArgs
,
216 llvm::opt::ArgStringList
&CC1Args
) const override
;
218 SanitizerMask
getSupportedSanitizers() const override
;
221 computeMSVCVersion(const Driver
*D
,
222 const llvm::opt::ArgList
&Args
) const override
;
224 const ToolChain
&HostTC
;
226 /// Uses nvptx-arch tool to get arch of the system GPU. Will return error
227 /// if unable to find one.
228 virtual Expected
<SmallVector
<std::string
>>
229 getSystemGPUArchs(const llvm::opt::ArgList
&Args
) const override
;
232 Tool
*buildAssembler() const override
; // ptxas
233 Tool
*buildLinker() const override
; // fatbinary (ok, not really a linker)
236 } // end namespace toolchains
237 } // end namespace driver
238 } // end namespace clang
240 #endif // LLVM_CLANG_LIB_DRIVER_TOOLCHAINS_CUDA_H