21 #include "llvm/Support/Alignment.h"
22 #include "llvm/Support/FileSystem.h"
23 #include "llvm/Support/Path.h"
24 #include "llvm/Support/TargetParser.h"
29 using namespace clang;
// NULL_FILE is defined as "nul" when _WIN32 or _WIN64 is defined.
// NOTE(review): the "/dev/null" definition presumably sits in an #else branch;
// the #else/#endif lines are not visible in this view.
32 #if defined(_WIN32) || defined(_WIN64)
33 #define NULL_FILE "nul"
35 #define NULL_FILE "/dev/null"
// NOTE(review): the head of this definition (return type, name and leading
// parameters) and several interior lines are not visible in this view; the
// comments below describe only the statements that are.
39 const llvm::opt::ArgList &DriverArgs,
41 const llvm::opt::Arg *A) {
// Test whether the option behind A matches options::OPT_fsanitize_EQ.
45 Option O = A->getOption();
46 if (!O.matches(options::OPT_fsanitize_EQ))
// Query the OPT_fgpu_sanitize / OPT_fno_gpu_sanitize pair; the trailing `true`
// is the value hasFlag yields when neither option is present.
49 if (!DriverArgs.hasFlag(options::OPT_fgpu_sanitize,
50 options::OPT_fno_gpu_sanitize,
true))
// Any sanitizer kind other than SanitizerKind::Address takes this branch.
57 if (K != SanitizerKind::Address)
60 llvm::StringMap<bool> FeatureMap;
// OptionalGpuArch is only inspected by the assert; the (void) cast presumably
// silences an unused-variable warning in builds where asserts are disabled.
63 assert(OptionalGpuArch &&
"Invalid Target ID");
64 (void)OptionalGpuArch;
// Look up the "xnack" entry of FeatureMap. A missing entry or a false value
// leads to the diagnostic below, which receives the option text, TargetID and
// the literal "xnack+".
65 auto Loc = FeatureMap.find(
"xnack");
66 if (Loc == FeatureMap.end() || !Loc->second) {
68 clang::diag::warn_drv_unsupported_option_for_offload_arch_req_feature)
69 << A->getAsString(DriverArgs) << TargetID <<
"xnack+";
// Assembles the argument list (LlvmLinkArgs) and program path for an
// "llvm-link" invocation over Inputs.
// NOTE(review): parts of the parameter list and body are not visible in this
// view, including how the output and TargetID are used.
75 void AMDGCN::Linker::constructLlvmLinkCommand(
Compilation &C,
79 const llvm::opt::ArgList &Args)
const {
82 ArgStringList LlvmLinkArgs;
// Callers must pass at least one input.
84 assert(!Inputs.empty() &&
"Must have at least one input.");
// Every input contributes its filename as an argument.
87 for (
auto Input : Inputs)
88 LlvmLinkArgs.push_back(Input.getFilename());
// TargetID is the value of the last options::OPT_mcpu_EQ argument.
92 auto TargetID = Args.getLastArgValue(options::OPT_mcpu_EQ);
// Resolve the "llvm-link" program path through the tool chain.
98 const char *LlvmLink =
99 Args.MakeArgString(getToolChain().GetProgramPath(
"llvm-link"));
101 LlvmLink, LlvmLinkArgs, Inputs,
// Assembles the argument list (LldArgs) and program path for an "lld"
// invocation over Inputs.
// NOTE(review): the head of this definition and several interior lines are
// not visible in this view; comments describe only the visible statements.
108 const llvm::opt::ArgList &Args)
const {
// Initial arguments start with "-flavor" and end with
// "-plugin-opt=-amdgpu-internalize-symbols"; the entries in between are not
// visible here.
111 ArgStringList LldArgs{
"-flavor",
117 "-plugin-opt=-amdgpu-internalize-symbols"};
119 auto &TC = getToolChain();
120 auto &D = TC.getDriver();
// Inputs[0] is read below, so at least one input is required.
121 assert(!Inputs.empty() &&
"Must have at least one input.");
// IsThinLTO is true when D.getLTOMode(true) reports LTOK_Thin.
122 bool IsThinLTO = D.getLTOMode(
true) ==
LTOK_Thin;
123 addLTOOptions(TC, Args, LldArgs, Output, Inputs[0], IsThinLTO);
126 std::vector<llvm::StringRef> Features;
// Each feature is appended to MAttrString, followed by "," unless it compares
// equal to Features.back().
// NOTE(review): the comparison is by value, so an earlier feature that equals
// the last one would also skip its separator — confirm features are unique.
132 MAttrString.append(Args.MakeArgString(OneFeature));
133 if (OneFeature != Features.back())
134 MAttrString.append(
",");
// MAttrString is only passed on when there is at least one feature.
136 if (!Features.empty())
137 LldArgs.push_back(Args.MakeArgString(MAttrString));
143 LldArgs.push_back(Args.MakeArgString(
"-plugin-opt=-force-import-all"));
// Forward every options::OPT_mllvm value, prefixed with "-plugin-opt=".
145 for (
const Arg *A : Args.filtered(options::OPT_mllvm)) {
147 Args.MakeArgString(Twine(
"-plugin-opt=") + A->getValue(0)));
// Add "-save-temps" when the driver has save-temps enabled.
150 if (
C.getDriver().isSaveTempsEnabled())
151 LldArgs.push_back(
"-save-temps");
// For each options::OPT_Xoffload_linker argument, forward the value at
// index 1 (its second value).
155 for (
auto *Arg : Args.filtered(options::OPT_Xoffload_linker))
156 LldArgs.push_back(Arg->getValue(1));
// Every input contributes its filename as an argument.
159 for (
auto Input : Inputs)
160 LldArgs.push_back(Input.getFilename());
// TargetID is the value of the last options::OPT_mcpu_EQ argument.
164 auto TargetID = Args.getLastArgValue(options::OPT_mcpu_EQ);
// Resolve the "lld" program path through the tool chain.
170 const char *Lld = Args.MakeArgString(getToolChain().GetProgramPath(
"lld"));
172 Lld, LldArgs, Inputs, Output));
// Dispatches on the input and job-action types.
// NOTE(review): the head of this definition and the bodies of the first two
// branches are not visible in this view.
182 const char *LinkingOutput)
const {
// Case 1: there is at least one input, the first input is types::TY_Image and
// the action produces types::TY_Object (branch body not visible).
183 if (Inputs.size() > 0 &&
184 Inputs[0].getType() == types::TY_Image &&
185 JA.
getType() == types::TY_Object)
// Case 2: the action produces types::TY_HIP_FATBIN (branch body not visible).
189 if (JA.
getType() == types::TY_HIP_FATBIN)
// Case 3: the action produces types::TY_LLVM_BC — use the llvm-link path.
193 if (JA.
getType() == types::TY_LLVM_BC)
194 return constructLlvmLinkCommand(C, JA, Inputs, Output, Args);
// Everything else goes through the lld path.
196 return constructLldCommand(C, JA, Inputs, Output, Args);
// NOTE(review): the head of this definition and several interior lines
// (including how K is computed) are not visible in this view.
200 const ToolChain &HostTC,
const ArgList &Args)
// Query the OPT_fgpu_sanitize / OPT_fno_gpu_sanitize pair (the default value
// passed to hasFlag is on a line not visible here).
207 if (!Args.hasFlag(options::OPT_fgpu_sanitize, options::OPT_fno_gpu_sanitize,
// Walk every options::OPT_fsanitize_EQ argument; a kind other than
// SanitizerKind::Address reports warn_drv_unsupported_option_for_target with
// the option text and the triple string.
210 for (
auto *A : Args.filtered(options::OPT_fsanitize_EQ)) {
212 if (K != SanitizerKind::Address)
213 D.
getDiags().
Report(clang::diag::warn_drv_unsupported_option_for_target)
214 << A->getAsString(Args) <<
getTriple().str();
// Appends device-side options to CC1Args.
// NOTE(review): the head of this definition and several interior lines are
// not visible in this view; comments describe only the visible statements.
219 const llvm::opt::ArgList &DriverArgs, llvm::opt::ArgStringList &CC1Args,
224 "Only HIP offloading kinds are supported for GPUs.");
226 CC1Args.push_back(
"-fcuda-is-device");
// "-fcuda-approx-transcendentals" is added only when the
// OPT_fcuda_approx_transcendentals / OPT_fno_cuda_approx_transcendentals pair
// resolves to true; the default passed to hasFlag is false.
228 if (DriverArgs.hasFlag(options::OPT_fcuda_approx_transcendentals,
229 options::OPT_fno_cuda_approx_transcendentals,
false))
230 CC1Args.push_back(
"-fcuda-approx-transcendentals");
// Query the OPT_fgpu_rdc / OPT_fno_gpu_rdc pair (the default value is on a
// line not visible here); the append below presumably forms the body of this
// negated condition.
232 if (!DriverArgs.hasFlag(options::OPT_fgpu_rdc, options::OPT_fno_gpu_rdc,
234 CC1Args.append({
"-mllvm",
"-amdgpu-internalize-symbols"});
// When options::OPT_gpu_max_threads_per_block_EQ has a non-empty value, pass
// it on as "--gpu-max-threads-per-block=<value>".
236 StringRef MaxThreadsPerBlock =
237 DriverArgs.getLastArgValue(options::OPT_gpu_max_threads_per_block_EQ);
238 if (!MaxThreadsPerBlock.empty()) {
240 (Twine(
"--gpu-max-threads-per-block=") + MaxThreadsPerBlock).str();
241 CC1Args.push_back(DriverArgs.MakeArgStringRef(ArgStr));
244 CC1Args.push_back(
"-fcuda-allow-variadic-functions");
// When neither options::OPT_fvisibility_EQ nor
// options::OPT_fvisibility_ms_compat is given, add "-fvisibility=hidden" and
// "-fapply-global-visibility-to-externs".
248 if (!DriverArgs.hasArg(options::OPT_fvisibility_EQ,
249 options::OPT_fvisibility_ms_compat)) {
250 CC1Args.append({
"-fvisibility=hidden"});
251 CC1Args.push_back(
"-fapply-global-visibility-to-externs");
// For a BCFile: "-mlink-builtin-bitcode" when ShouldInternalize is set,
// "-mlink-bitcode-file" otherwise, followed by the file's Path.
255 CC1Args.push_back(BCFile.ShouldInternalize ?
"-mlink-builtin-bitcode"
256 :
"-mlink-bitcode-file");
257 CC1Args.push_back(DriverArgs.MakeArgString(BCFile.Path));
// Produces a llvm::opt::DerivedArgList pointer derived from Args.
// NOTE(review): the function name, parameters and most of the body are not
// visible in this view.
261 llvm::opt::DerivedArgList *
265 DerivedArgList *DAL =
// NOTE(review): allocated with a raw `new`; who owns and frees the result is
// not visible here — presumably the caller, confirm.
268 DAL =
new DerivedArgList(Args.getBaseArgs());
272 for (Arg *A : Args) {
// With a non-empty BoundArch, any existing options::OPT_mcpu_EQ argument is
// erased and a joined OPT_mcpu_EQ argument carrying BoundArch is added.
278 if (!BoundArch.empty()) {
279 DAL->eraseArg(options::OPT_mcpu_EQ);
280 DAL->AddJoinedArg(
nullptr, Opts.getOption(options::OPT_mcpu_EQ), BoundArch);
302 ArgStringList &CC1Args)
const {
307 const ArgList &Args, ArgStringList &CC1Args)
const {
312 ArgStringList &CC1Args)
const {
317 ArgStringList &CC1Args)
const {
335 const ArgList &Args)
const {
// Collects device bitcode libraries into BCLibs.
// NOTE(review): the head of this definition and many interior lines are not
// visible in this view; comments describe only the visible statements.
// options::OPT_nogpulib is checked first (branch body not visible).
342 if (DriverArgs.hasArg(options::OPT_nogpulib))
344 ArgStringList LibraryPaths;
348 LibraryPaths.push_back(DriverArgs.MakeArgString(Path));
// For each options::OPT_hip_device_lib_EQ value, BCName is appended to Path
// inside a loop over LibraryPaths, and FullName is added to BCLibs if it
// exists on disk (how Path and FullName are derived is not visible here).
353 auto BCLibArgs = DriverArgs.getAllArgValues(options::OPT_hip_device_lib_EQ);
354 if (!BCLibArgs.empty()) {
355 llvm::for_each(BCLibArgs, [&](StringRef BCName) {
357 for (StringRef LibraryPath : LibraryPaths) {
359 llvm::sys::path::append(Path, BCName);
361 if (llvm::sys::fs::exists(FullName)) {
362 BCLibs.push_back(FullName);
// Past this point an explicit GPU architecture is required.
374 assert(!GpuArch.empty() &&
"Must have an explicit GPU arch.");
// Start of a condition on the OPT_fgpu_sanitize / OPT_fno_gpu_sanitize pair
// (default true); the rest of the condition is not visible here.
377 if (DriverArgs.hasFlag(options::OPT_fgpu_sanitize,
378 options::OPT_fno_gpu_sanitize,
true) &&
// An empty AsanRTL leads to the "asanrtl is not found" message below.
381 if (AsanRTL.empty()) {
384 "AMDGPU address sanitizer runtime library (asanrtl) is not found. "
385 "Please install ROCm device library which supports address "
// AsanRTL is added to BCLibs with `false` as the second constructor argument.
390 BCLibs.emplace_back(AsanRTL,
false);
398 BCLibs.emplace_back(N);
// The options::OPT_gpu_instrument_lib_EQ value is added only if InstLib
// exists on disk.
402 DriverArgs.getLastArgValue(options::OPT_gpu_instrument_lib_EQ);
405 if (llvm::sys::fs::exists(InstLib))
406 BCLibs.push_back(InstLib);
// NOTE(review): the head of this definition and the diagnostic being reported
// are not visible in this view.
415 const llvm::opt::ArgList &DriverArgs)
const {
// A target ID is present but no GPU architecture was obtained for it: the
// target ID string is streamed into a diagnostic.
417 if (PTID.OptionalTargetID && !PTID.OptionalGPUArch) {
419 << *PTID.OptionalTargetID;