//===--- HIP.cpp - HIP Tool and ToolChain Implementations -------*- C++ -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
9
10#include "HIP.h"
11#include "CommonArgs.h"
12#include "InputInfo.h"
13#include "clang/Basic/Cuda.h"
14#include "clang/Driver/Compilation.h"
15#include "clang/Driver/Driver.h"
16#include "clang/Driver/DriverDiagnostic.h"
17#include "clang/Driver/Options.h"
18#include "llvm/Support/FileSystem.h"
19#include "llvm/Support/Path.h"
20
21using namespace clang::driver;
22using namespace clang::driver::toolchains;
23using namespace clang::driver::tools;
24using namespace clang;
25using namespace llvm::opt;
26
27namespace {
28
29static void addBCLib(Compilation &C, const ArgList &Args,
30 ArgStringList &CmdArgs, ArgStringList LibraryPaths,
31 StringRef BCName) {
32 StringRef FullName;
33 for (std::string LibraryPath : LibraryPaths) {
34 SmallString<128> Path(LibraryPath);
35 llvm::sys::path::append(Path, BCName);
36 FullName = Path;
37 if (llvm::sys::fs::exists(FullName)) {
38 CmdArgs.push_back(Args.MakeArgString(FullName));
39 return;
40 }
41 }
42 C.getDriver().Diag(diag::err_drv_no_such_file) << BCName;
43}
44
45} // namespace
46
47const char *AMDGCN::Linker::constructLLVMLinkCommand(
48 Compilation &C, const JobAction &JA, const InputInfoList &Inputs,
49 const ArgList &Args, StringRef SubArchName,
50 StringRef OutputFilePrefix) const {
51 ArgStringList CmdArgs;
52 // Add the input bc's created by compile step.
53 for (const auto &II : Inputs)
54 CmdArgs.push_back(II.getFilename());
55
56 ArgStringList LibraryPaths;
57
58 // Find in --hip-device-lib-path and HIP_LIBRARY_PATH.
59 for (auto Path : Args.getAllArgValues(options::OPT_hip_device_lib_path_EQ))
60 LibraryPaths.push_back(Args.MakeArgString(Path));
61
62 addDirectoryList(Args, LibraryPaths, "-L", "HIP_DEVICE_LIB_PATH");
63
64 llvm::SmallVector<std::string, 10> BCLibs;
65
66 // Add bitcode library in --hip-device-lib.
67 for (auto Lib : Args.getAllArgValues(options::OPT_hip_device_lib_EQ)) {
68 BCLibs.push_back(Args.MakeArgString(Lib));
69 }
70
71 // If --hip-device-lib is not set, add the default bitcode libraries.
72 if (BCLibs.empty()) {
73 // Get the bc lib file name for ISA version. For example,
74 // gfx803 => oclc_isa_version_803.amdgcn.bc.
75 std::string ISAVerBC =
76 "oclc_isa_version_" + SubArchName.drop_front(3).str() + ".amdgcn.bc";
77
78 BCLibs.append({"hip.amdgcn.bc", "hc.amdgcn.bc", "opencl.amdgcn.bc",
79 "ockl.amdgcn.bc", "irif.amdgcn.bc", "ocml.amdgcn.bc",
80 "oclc_finite_only_off.amdgcn.bc",
81 "oclc_daz_opt_off.amdgcn.bc",
82 "oclc_correctly_rounded_sqrt_on.amdgcn.bc",
83 "oclc_unsafe_math_off.amdgcn.bc", "hc.amdgcn.bc", ISAVerBC});
84 }
85 for (auto Lib : BCLibs)
86 addBCLib(C, Args, CmdArgs, LibraryPaths, Lib);
87
88 // Add an intermediate output file.
89 CmdArgs.push_back("-o");
90 std::string TmpName =
91 C.getDriver().GetTemporaryPath(OutputFilePrefix.str() + "-linked", "bc");
92 const char *OutputFileName =
93 C.addTempFile(C.getArgs().MakeArgString(TmpName));
94 CmdArgs.push_back(OutputFileName);
95 SmallString<128> ExecPath(C.getDriver().Dir);
96 llvm::sys::path::append(ExecPath, "llvm-link");
97 const char *Exec = Args.MakeArgString(ExecPath);
98 C.addCommand(llvm::make_unique<Command>(JA, *this, Exec, CmdArgs, Inputs));
99 return OutputFileName;
100}
101
102const char *AMDGCN::Linker::constructOptCommand(
103 Compilation &C, const JobAction &JA, const InputInfoList &Inputs,
104 const llvm::opt::ArgList &Args, llvm::StringRef SubArchName,
105 llvm::StringRef OutputFilePrefix, const char *InputFileName) const {
106 // Construct opt command.
107 ArgStringList OptArgs;
108 // The input to opt is the output from llvm-link.
109 OptArgs.push_back(InputFileName);
110 // Pass optimization arg to opt.
111 if (Arg *A = Args.getLastArg(options::OPT_O_Group)) {
112 StringRef OOpt = "3";
113 if (A->getOption().matches(options::OPT_O4) ||
114 A->getOption().matches(options::OPT_Ofast))
115 OOpt = "3";
116 else if (A->getOption().matches(options::OPT_O0))
117 OOpt = "0";
118 else if (A->getOption().matches(options::OPT_O)) {
119 // -Os, -Oz, and -O(anything else) map to -O2
120 OOpt = llvm::StringSwitch<const char *>(A->getValue())
121 .Case("1", "1")
122 .Case("2", "2")
123 .Case("3", "3")
124 .Case("s", "2")
125 .Case("z", "2")
126 .Default("2");
127 }
128 OptArgs.push_back(Args.MakeArgString("-O" + OOpt));
129 }
130 OptArgs.push_back("-mtriple=amdgcn-amd-amdhsa");
131 OptArgs.push_back(Args.MakeArgString("-mcpu=" + SubArchName));
132 OptArgs.push_back("-o");
133 std::string TmpFileName = C.getDriver().GetTemporaryPath(
134 OutputFilePrefix.str() + "-optimized", "bc");
135 const char *OutputFileName =
136 C.addTempFile(C.getArgs().MakeArgString(TmpFileName));
137 OptArgs.push_back(OutputFileName);
138 SmallString<128> OptPath(C.getDriver().Dir);
139 llvm::sys::path::append(OptPath, "opt");
140 const char *OptExec = Args.MakeArgString(OptPath);
141 C.addCommand(llvm::make_unique<Command>(JA, *this, OptExec, OptArgs, Inputs));
142 return OutputFileName;
143}
144
145const char *AMDGCN::Linker::constructLlcCommand(
146 Compilation &C, const JobAction &JA, const InputInfoList &Inputs,
147 const llvm::opt::ArgList &Args, llvm::StringRef SubArchName,
148 llvm::StringRef OutputFilePrefix, const char *InputFileName) const {
149 // Construct llc command.
150 ArgStringList LlcArgs{InputFileName, "-mtriple=amdgcn-amd-amdhsa",
151 "-filetype=obj",
152 Args.MakeArgString("-mcpu=" + SubArchName), "-o"};
153 std::string LlcOutputFileName =
154 C.getDriver().GetTemporaryPath(OutputFilePrefix, "o");
155 const char *LlcOutputFile =
156 C.addTempFile(C.getArgs().MakeArgString(LlcOutputFileName));
157 LlcArgs.push_back(LlcOutputFile);
158 SmallString<128> LlcPath(C.getDriver().Dir);
159 llvm::sys::path::append(LlcPath, "llc");
160 const char *Llc = Args.MakeArgString(LlcPath);
161 C.addCommand(llvm::make_unique<Command>(JA, *this, Llc, LlcArgs, Inputs));
162 return LlcOutputFile;
163}
164
165void AMDGCN::Linker::constructLldCommand(Compilation &C, const JobAction &JA,
166 const InputInfoList &Inputs,
167 const InputInfo &Output,
168 const llvm::opt::ArgList &Args,
169 const char *InputFileName) const {
170 // Construct lld command.
171 // The output from ld.lld is an HSA code object file.
172 ArgStringList LldArgs{"-flavor", "gnu", "--no-undefined",
173 "-shared", "-o", Output.getFilename(),
174 InputFileName};
175 SmallString<128> LldPath(C.getDriver().Dir);
176 llvm::sys::path::append(LldPath, "lld");
177 const char *Lld = Args.MakeArgString(LldPath);
178 C.addCommand(llvm::make_unique<Command>(JA, *this, Lld, LldArgs, Inputs));
179}
180
181// For amdgcn the inputs of the linker job are device bitcode and output is
182// object file. It calls llvm-link, opt, llc, then lld steps.
183void AMDGCN::Linker::ConstructJob(Compilation &C, const JobAction &JA,
184 const InputInfo &Output,
185 const InputInfoList &Inputs,
186 const ArgList &Args,
187 const char *LinkingOutput) const {
188
189 const auto &TC =
190 static_cast<const toolchains::HIPToolChain &>(getToolChain());
191 assert(TC.getTriple().getArch() == llvm::Triple::amdgcn &&
192 "Unsupported target");
193
194 std::string SubArchName = JA.getOffloadingArch();
195 assert(StringRef(SubArchName).startswith("gfx") && "Unsupported sub arch");
196
197 // Prefix for temporary file name.
198 std::string Prefix =
199 llvm::sys::path::stem(Inputs[0].getFilename()).str() + "-" + SubArchName;
200
201 // Each command outputs different files.
202 const char *LLVMLinkCommand =
203 constructLLVMLinkCommand(C, JA, Inputs, Args, SubArchName, Prefix);
204 const char *OptCommand = constructOptCommand(C, JA, Inputs, Args, SubArchName,
205 Prefix, LLVMLinkCommand);
206 const char *LlcCommand =
207 constructLlcCommand(C, JA, Inputs, Args, SubArchName, Prefix, OptCommand);
208 constructLldCommand(C, JA, Inputs, Output, Args, LlcCommand);
209}
210
211HIPToolChain::HIPToolChain(const Driver &D, const llvm::Triple &Triple,
212 const ToolChain &HostTC, const ArgList &Args)
213 : ToolChain(D, Triple, Args), HostTC(HostTC) {
214 // Lookup binaries into the driver directory, this is used to
215 // discover the clang-offload-bundler executable.
216 getProgramPaths().push_back(getDriver().Dir);
217}
218
219void HIPToolChain::addClangTargetOptions(
220 const llvm::opt::ArgList &DriverArgs,
221 llvm::opt::ArgStringList &CC1Args,
222 Action::OffloadKind DeviceOffloadingKind) const {
223 HostTC.addClangTargetOptions(DriverArgs, CC1Args, DeviceOffloadingKind);
224
225 StringRef GpuArch = DriverArgs.getLastArgValue(options::OPT_march_EQ);
226 assert(!GpuArch.empty() && "Must have an explicit GPU arch.");
227 assert(DeviceOffloadingKind == Action::OFK_HIP &&
228 "Only HIP offloading kinds are supported for GPUs.");
229
230 CC1Args.push_back("-fcuda-is-device");
231
232 if (DriverArgs.hasFlag(options::OPT_fcuda_flush_denormals_to_zero,
233 options::OPT_fno_cuda_flush_denormals_to_zero, false))
234 CC1Args.push_back("-fcuda-flush-denormals-to-zero");
235
236 if (DriverArgs.hasFlag(options::OPT_fcuda_approx_transcendentals,
237 options::OPT_fno_cuda_approx_transcendentals, false))
238 CC1Args.push_back("-fcuda-approx-transcendentals");
239
240 if (DriverArgs.hasFlag(options::OPT_fcuda_rdc, options::OPT_fno_cuda_rdc,
241 false))
242 CC1Args.push_back("-fcuda-rdc");
243}
244
245llvm::opt::DerivedArgList *
246HIPToolChain::TranslateArgs(const llvm::opt::DerivedArgList &Args,
247 StringRef BoundArch,
248 Action::OffloadKind DeviceOffloadKind) const {
249 DerivedArgList *DAL =
250 HostTC.TranslateArgs(Args, BoundArch, DeviceOffloadKind);
251 if (!DAL)
252 DAL = new DerivedArgList(Args.getBaseArgs());
253
254 const OptTable &Opts = getDriver().getOpts();
255
256 for (Arg *A : Args) {
257 if (A->getOption().matches(options::OPT_Xarch__)) {
258 // Skip this argument unless the architecture matches BoundArch
259 if (BoundArch.empty() || A->getValue(0) != BoundArch)
260 continue;
261
262 unsigned Index = Args.getBaseArgs().MakeIndex(A->getValue(1));
263 unsigned Prev = Index;
264 std::unique_ptr<Arg> XarchArg(Opts.ParseOneArg(Args, Index));
265
266 // If the argument parsing failed or more than one argument was
267 // consumed, the -Xarch_ argument's parameter tried to consume
268 // extra arguments. Emit an error and ignore.
269 //
270 // We also want to disallow any options which would alter the
271 // driver behavior; that isn't going to work in our model. We
272 // use isDriverOption() as an approximation, although things
273 // like -O4 are going to slip through.
274 if (!XarchArg || Index > Prev + 1) {
275 getDriver().Diag(diag::err_drv_invalid_Xarch_argument_with_args)
276 << A->getAsString(Args);
277 continue;
278 } else if (XarchArg->getOption().hasFlag(options::DriverOption)) {
279 getDriver().Diag(diag::err_drv_invalid_Xarch_argument_isdriver)
280 << A->getAsString(Args);
281 continue;
282 }
283 XarchArg->setBaseArg(A);
284 A = XarchArg.release();
285 DAL->AddSynthesizedArg(A);
286 }
287 DAL->append(A);
288 }
289
290 if (!BoundArch.empty()) {
291 DAL->eraseArg(options::OPT_march_EQ);
292 DAL->AddJoinedArg(nullptr, Opts.getOption(options::OPT_march_EQ), BoundArch);
293 }
294
295 return DAL;
296}
297
298Tool *HIPToolChain::buildLinker() const {
299 assert(getTriple().getArch() == llvm::Triple::amdgcn);
300 return new tools::AMDGCN::Linker(*this);
301}
302
303void HIPToolChain::addClangWarningOptions(ArgStringList &CC1Args) const {
304 HostTC.addClangWarningOptions(CC1Args);
305}
306
307ToolChain::CXXStdlibType
308HIPToolChain::GetCXXStdlibType(const ArgList &Args) const {
309 return HostTC.GetCXXStdlibType(Args);
310}
311
312void HIPToolChain::AddClangSystemIncludeArgs(const ArgList &DriverArgs,
313 ArgStringList &CC1Args) const {
314 HostTC.AddClangSystemIncludeArgs(DriverArgs, CC1Args);
315}
316
317void HIPToolChain::AddClangCXXStdlibIncludeArgs(const ArgList &Args,
318 ArgStringList &CC1Args) const {
319 HostTC.AddClangCXXStdlibIncludeArgs(Args, CC1Args);
320}
321
322void HIPToolChain::AddIAMCUIncludeArgs(const ArgList &Args,
323 ArgStringList &CC1Args) const {
324 HostTC.AddIAMCUIncludeArgs(Args, CC1Args);
325}
326
327SanitizerMask HIPToolChain::getSupportedSanitizers() const {
328 // The HIPToolChain only supports sanitizers in the sense that it allows
329 // sanitizer arguments on the command line if they are supported by the host
330 // toolchain. The HIPToolChain will actually ignore any command line
331 // arguments for any of these "supported" sanitizers. That means that no
332 // sanitization of device code is actually supported at this time.
333 //
334 // This behavior is necessary because the host and device toolchains
335 // invocations often share the command line, so the device toolchain must
336 // tolerate flags meant only for the host toolchain.
337 return HostTC.getSupportedSanitizers();
338}
339
340VersionTuple HIPToolChain::computeMSVCVersion(const Driver *D,
341 const ArgList &Args) const {
342 return HostTC.computeMSVCVersion(D, Args);
343}