clang 20.0.0git
Cuda.h
Go to the documentation of this file.
1//===--- Cuda.h - Cuda ToolChain Implementations ----------------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9#ifndef LLVM_CLANG_LIB_DRIVER_TOOLCHAINS_CUDA_H
10#define LLVM_CLANG_LIB_DRIVER_TOOLCHAINS_CUDA_H
11
12#include "clang/Basic/Cuda.h"
13#include "clang/Driver/Action.h"
15#include "clang/Driver/Tool.h"
17#include "llvm/Support/Compiler.h"
18#include "llvm/Support/VersionTuple.h"
19#include <bitset>
20#include <set>
21#include <vector>
22
23namespace clang {
24namespace driver {
25
26/// A class to find a viable CUDA installation
28private:
29 const Driver &D;
30 bool IsValid = false;
32 std::string InstallPath;
33 std::string BinPath;
34 std::string LibDevicePath;
35 std::string IncludePath;
36 llvm::StringMap<std::string> LibDeviceMap;
37
38 // CUDA architectures for which we have raised an error in
39 // CheckCudaVersionSupportsArch.
40 mutable std::bitset<(int)OffloadArch::LAST> ArchsWithBadVersion;
41
42public:
43 CudaInstallationDetector(const Driver &D, const llvm::Triple &HostTriple,
44 const llvm::opt::ArgList &Args);
45
46 void AddCudaIncludeArgs(const llvm::opt::ArgList &DriverArgs,
47 llvm::opt::ArgStringList &CC1Args) const;
48
49 /// Emit an error if Version does not support the given Arch.
50 ///
51 /// If either Version or Arch is unknown, does not emit an error. Emits at
52 /// most one error per Arch.
54
55 /// Check whether we detected a valid Cuda install.
56 bool isValid() const { return IsValid; }
57 /// Print information about the detected CUDA installation.
58 void print(raw_ostream &OS) const;
59
60 /// Get the detected Cuda install's version.
63 : Version;
64 }
65 /// Get the detected Cuda installation path.
66 StringRef getInstallPath() const { return InstallPath; }
67 /// Get the detected path to Cuda's bin directory.
68 StringRef getBinPath() const { return BinPath; }
69 /// Get the detected Cuda Include path.
70 StringRef getIncludePath() const { return IncludePath; }
71 /// Get the detected Cuda device library path.
72 StringRef getLibDevicePath() const { return LibDevicePath; }
73 /// Get libdevice file for given architecture
74 std::string getLibDeviceFile(StringRef Gpu) const {
75 return LibDeviceMap.lookup(Gpu);
76 }
78};
79
80namespace tools {
81namespace NVPTX {
82
83// Run ptxas, the NVPTX assembler.
84class LLVM_LIBRARY_VISIBILITY Assembler final : public Tool {
85public:
86 Assembler(const ToolChain &TC) : Tool("NVPTX::Assembler", "ptxas", TC) {}
87
88 bool hasIntegratedCPP() const override { return false; }
89
90 void ConstructJob(Compilation &C, const JobAction &JA,
91 const InputInfo &Output, const InputInfoList &Inputs,
92 const llvm::opt::ArgList &TCArgs,
93 const char *LinkingOutput) const override;
94};
95
96// Runs fatbinary, which combines GPU object files ("cubin" files) and/or PTX
97// assembly into a single output file.
98class LLVM_LIBRARY_VISIBILITY FatBinary : public Tool {
99public:
100 FatBinary(const ToolChain &TC) : Tool("NVPTX::Linker", "fatbinary", TC) {}
101
102 bool hasIntegratedCPP() const override { return false; }
103
104 void ConstructJob(Compilation &C, const JobAction &JA,
105 const InputInfo &Output, const InputInfoList &Inputs,
106 const llvm::opt::ArgList &TCArgs,
107 const char *LinkingOutput) const override;
108};
109
110// Runs nvlink, which links GPU object files ("cubin" files) into a single file.
111class LLVM_LIBRARY_VISIBILITY Linker final : public Tool {
112public:
113 Linker(const ToolChain &TC) : Tool("NVPTX::Linker", "nvlink", TC) {}
114
115 bool hasIntegratedCPP() const override { return false; }
116
117 void ConstructJob(Compilation &C, const JobAction &JA,
118 const InputInfo &Output, const InputInfoList &Inputs,
119 const llvm::opt::ArgList &TCArgs,
120 const char *LinkingOutput) const override;
121};
122
123void getNVPTXTargetFeatures(const Driver &D, const llvm::Triple &Triple,
124 const llvm::opt::ArgList &Args,
125 std::vector<StringRef> &Features);
126
127} // end namespace NVPTX
128} // end namespace tools
129
130namespace toolchains {
131
132class LLVM_LIBRARY_VISIBILITY NVPTXToolChain : public ToolChain {
133public:
134 NVPTXToolChain(const Driver &D, const llvm::Triple &Triple,
135 const llvm::Triple &HostTriple, const llvm::opt::ArgList &Args,
136 bool Freestanding);
137
138 NVPTXToolChain(const Driver &D, const llvm::Triple &Triple,
139 const llvm::opt::ArgList &Args);
140
141 llvm::opt::DerivedArgList *
142 TranslateArgs(const llvm::opt::DerivedArgList &Args, StringRef BoundArch,
143 Action::OffloadKind DeviceOffloadKind) const override;
144
145 void
146 addClangTargetOptions(const llvm::opt::ArgList &DriverArgs,
147 llvm::opt::ArgStringList &CC1Args,
148 Action::OffloadKind DeviceOffloadKind) const override;
149
150 // Never try to use the integrated assembler with CUDA; always fork out to
151 // ptxas.
152 bool useIntegratedAs() const override { return false; }
153 bool isCrossCompiling() const override { return true; }
154 bool isPICDefault() const override { return false; }
155 bool isPIEDefault(const llvm::opt::ArgList &Args) const override {
156 return false;
157 }
158 bool HasNativeLLVMSupport() const override { return true; }
159 bool isPICDefaultForced() const override { return false; }
160 bool SupportsProfiling() const override { return false; }
161
162 bool IsMathErrnoDefault() const override { return false; }
163
164 bool supportsDebugInfoOption(const llvm::opt::Arg *A) const override;
165 void adjustDebugInfoKind(llvm::codegenoptions::DebugInfoKind &DebugInfoKind,
166 const llvm::opt::ArgList &Args) const override;
167
168 // NVPTX supports only DWARF2.
169 unsigned GetDefaultDwarfVersion() const override { return 2; }
170 unsigned getMaxDwarfVersion() const override { return 2; }
171
172 /// Uses nvptx-arch tool to get arch of the system GPU. Will return error
173 /// if unable to find one.
175 getSystemGPUArchs(const llvm::opt::ArgList &Args) const override;
176
178
179protected:
180 Tool *buildAssembler() const override; // ptxas.
181 Tool *buildLinker() const override; // nvlink.
182
183private:
184 bool Freestanding = false;
185};
186
187class LLVM_LIBRARY_VISIBILITY CudaToolChain : public NVPTXToolChain {
188public:
189 CudaToolChain(const Driver &D, const llvm::Triple &Triple,
190 const ToolChain &HostTC, const llvm::opt::ArgList &Args);
191
192 const llvm::Triple *getAuxTriple() const override {
193 return &HostTC.getTriple();
194 }
195
196 bool HasNativeLLVMSupport() const override { return false; }
197
198 std::string getInputFilename(const InputInfo &Input) const override;
199
200 llvm::opt::DerivedArgList *
201 TranslateArgs(const llvm::opt::DerivedArgList &Args, StringRef BoundArch,
202 Action::OffloadKind DeviceOffloadKind) const override;
203 void
204 addClangTargetOptions(const llvm::opt::ArgList &DriverArgs,
205 llvm::opt::ArgStringList &CC1Args,
206 Action::OffloadKind DeviceOffloadKind) const override;
207
208 llvm::DenormalMode getDefaultDenormalModeForType(
209 const llvm::opt::ArgList &DriverArgs, const JobAction &JA,
210 const llvm::fltSemantics *FPType = nullptr) const override;
211
212 void AddCudaIncludeArgs(const llvm::opt::ArgList &DriverArgs,
213 llvm::opt::ArgStringList &CC1Args) const override;
214
215 void addClangWarningOptions(llvm::opt::ArgStringList &CC1Args) const override;
216 CXXStdlibType GetCXXStdlibType(const llvm::opt::ArgList &Args) const override;
217 void
218 AddClangSystemIncludeArgs(const llvm::opt::ArgList &DriverArgs,
219 llvm::opt::ArgStringList &CC1Args) const override;
220 void AddClangCXXStdlibIncludeArgs(
221 const llvm::opt::ArgList &Args,
222 llvm::opt::ArgStringList &CC1Args) const override;
223 void AddIAMCUIncludeArgs(const llvm::opt::ArgList &DriverArgs,
224 llvm::opt::ArgStringList &CC1Args) const override;
225
226 SanitizerMask getSupportedSanitizers() const override;
227
228 VersionTuple
229 computeMSVCVersion(const Driver *D,
230 const llvm::opt::ArgList &Args) const override;
231
233
234protected:
235 Tool *buildAssembler() const override; // ptxas
236 Tool *buildLinker() const override; // fatbinary (ok, not really a linker)
237};
238
239} // end namespace toolchains
240} // end namespace driver
241} // end namespace clang
242
243#endif // LLVM_CLANG_LIB_DRIVER_TOOLCHAINS_CUDA_H
const Decl * D
__device__ int
Compilation - A set of tasks to perform for a single driver invocation.
Definition: Compilation.h:45
A class to find a viable CUDA installation.
Definition: Cuda.h:27
void AddCudaIncludeArgs(const llvm::opt::ArgList &DriverArgs, llvm::opt::ArgStringList &CC1Args) const
Definition: Cuda.cpp:290
StringRef getLibDevicePath() const
Get the detected Cuda device library path.
Definition: Cuda.h:72
CudaVersion version() const
Get the detected Cuda install's version.
Definition: Cuda.h:61
StringRef getInstallPath() const
Get the detected Cuda installation path.
Definition: Cuda.h:66
std::string getLibDeviceFile(StringRef Gpu) const
Get libdevice file for given architecture.
Definition: Cuda.h:74
StringRef getBinPath() const
Get the detected path to Cuda's bin directory.
Definition: Cuda.h:68
void CheckCudaVersionSupportsArch(OffloadArch Arch) const
Emit an error if Version does not support the given Arch.
Definition: Cuda.cpp:314
void print(raw_ostream &OS) const
Print information about the detected CUDA installation.
Definition: Cuda.cpp:331
StringRef getIncludePath() const
Get the detected Cuda Include path.
Definition: Cuda.h:70
bool isValid() const
Check whether we detected a valid Cuda install.
Definition: Cuda.h:56
Driver - Encapsulate logic for constructing compilation processes from a set of gcc-driver-like comma...
Definition: Driver.h:77
InputInfo - Wrapper for information about an input source.
Definition: InputInfo.h:22
ToolChain - Access to tools for a single platform.
Definition: ToolChain.h:92
const llvm::Triple & getTriple() const
Definition: ToolChain.h:254
Tool - Information on a specific compilation tool.
Definition: Tool.h:32
const llvm::Triple * getAuxTriple() const override
Get the toolchain's aux triple, if it has one.
Definition: Cuda.h:192
bool HasNativeLLVMSupport() const override
HasNativeLTOLinker - Check whether the linker and related tools have native LLVM support.
Definition: Cuda.h:196
unsigned getMaxDwarfVersion() const override
Definition: Cuda.h:170
CudaInstallationDetector CudaInstallation
Definition: Cuda.h:177
bool isPICDefault() const override
Test whether this toolchain defaults to PIC.
Definition: Cuda.h:154
bool isCrossCompiling() const override
Returns true if the toolchain is targeting a non-native architecture.
Definition: Cuda.h:153
bool IsMathErrnoDefault() const override
IsMathErrnoDefault - Does this tool chain use -fmath-errno by default.
Definition: Cuda.h:162
bool HasNativeLLVMSupport() const override
HasNativeLTOLinker - Check whether the linker and related tools have native LLVM support.
Definition: Cuda.h:158
NVPTXToolChain(const Driver &D, const llvm::Triple &Triple, const llvm::opt::ArgList &Args)
bool SupportsProfiling() const override
SupportsProfiling - Does this tool chain support -pg.
Definition: Cuda.h:160
unsigned GetDefaultDwarfVersion() const override
Definition: Cuda.h:169
bool useIntegratedAs() const override
Check if the toolchain should use the integrated assembler.
Definition: Cuda.h:152
bool isPIEDefault(const llvm::opt::ArgList &Args) const override
Test whether this toolchain defaults to PIE.
Definition: Cuda.h:155
NVPTXToolChain(const Driver &D, const llvm::Triple &Triple, const llvm::Triple &HostTriple, const llvm::opt::ArgList &Args, bool Freestanding)
bool isPICDefaultForced() const override
Tests whether this toolchain forces its default for PIC, PIE or non-PIC.
Definition: Cuda.h:159
bool hasIntegratedCPP() const override
Definition: Cuda.h:88
Assembler(const ToolChain &TC)
Definition: Cuda.h:86
FatBinary(const ToolChain &TC)
Definition: Cuda.h:100
bool hasIntegratedCPP() const override
Definition: Cuda.h:102
Linker(const ToolChain &TC)
Definition: Cuda.h:113
bool hasIntegratedCPP() const override
Definition: Cuda.h:115
void getNVPTXTargetFeatures(const Driver &D, const llvm::Triple &Triple, const llvm::opt::ArgList &Args, std::vector< StringRef > &Features)
Definition: Cuda.cpp:653
The JSON file list parser is used to communicate input to InstallAPI.
OffloadArch
Definition: Cuda.h:55
CudaVersion
Definition: Cuda.h:20