[cuda] Driver changes to compile and stitch together host and device-side CUDA code.

- Changed driver pipeline to compile host and device side of CUDA files and incorporate results of device-side compilation into host object file. - Added a test for cuda pipeline creation in clang driver. New clang options: --cuda-host-only - Do host-side compilation only. --cuda-device-only - Do device-side compilation only. --cuda-gpu-arch=<ARCH> - specify GPU architecture for device-side compilation. E.g. sm_35, sm_30. Default is sm_20. May be used more than once in which case one device-compilation will be done per unique specified GPU architecture. Differential Revision: http://reviews.llvm.org/D9509 llvm-svn: 242058
author: Artem Belevich <tra@google.com> 2015-07-13 20:21:06 +0000
committer: Artem Belevich <tra@google.com> 2015-07-13 20:21:06 +0000
commit: cd42e7f77a788969bc9365b8b0b2f21e2308e04e (patch)
tree: 454855373f13ce3944547ca616219084bb0f4bbe /clang/lib/Driver/Tools.cpp
parent: 6145ad2d3654350110e25460d0fcd9656a46e36c (diff)
download: llvm-cd42e7f77a788969bc9365b8b0b2f21e2308e04e.zip
llvm-cd42e7f77a788969bc9365b8b0b2f21e2308e04e.tar.gz
llvm-cd42e7f77a788969bc9365b8b0b2f21e2308e04e.tar.bz2
1 files changed, 28 insertions, 8 deletions
diff --git a/clang/lib/Driver/Tools.cpp b/clang/lib/Driver/Tools.cpp
index 1805333..0757355 100644
--- a/clang/lib/Driver/Tools.cpp
+++ b/clang/lib/Driver/Tools.cpp
@@ -1488,6 +1488,12 @@ static std::string getCPUName(const ArgList &Args, const llvm::Triple &T) {
     return CPUName;
   }
 
+  case llvm::Triple::nvptx:
+  case llvm::Triple::nvptx64:
+    if (const Arg *A = Args.getLastArg(options::OPT_march_EQ))
+      return A->getValue();
+    return "";
+
   case llvm::Triple::ppc:
   case llvm::Triple::ppc64:
   case llvm::Triple::ppc64le: {
@@ -2826,8 +2832,14 @@ void Clang::ConstructJob(Compilation &C, const JobAction &JA,
       getToolChain().getTriple().isWindowsCygwinEnvironment();
   bool IsWindowsMSVC = getToolChain().getTriple().isWindowsMSVCEnvironment();
 
-  assert(Inputs.size() == 1 && "Unable to handle multiple inputs.");
+  // Check number of inputs for sanity. We need at least one input.
+  assert(Inputs.size() >= 1 && "Must have at least one input.");
   const InputInfo &Input = Inputs[0];
+  // CUDA compilation may have multiple inputs (source file + results of
+  // device-side compilations). All other jobs are expected to have exactly one
+  // input.
+  bool IsCuda = types::isCuda(Input.getType());
+  assert((IsCuda || Inputs.size() == 1) && "Unable to handle multiple inputs.");
 
   // Invoke ourselves in -cc1 mode.
   //
@@ -4802,14 +4814,12 @@ void Clang::ConstructJob(Compilation &C, const JobAction &JA,
     assert(Output.isNothing() && "Invalid output.");
   }
 
-  for (const auto &II : Inputs) {
-    addDashXForInput(Args, II, CmdArgs);
+  addDashXForInput(Args, Input, CmdArgs);
 
-    if (II.isFilename())
-      CmdArgs.push_back(II.getFilename());
-    else
-      II.getInputArg().renderAsInput(Args, CmdArgs);
-  }
+  if (Input.isFilename())
+    CmdArgs.push_back(Input.getFilename());
+  else
+    Input.getInputArg().renderAsInput(Args, CmdArgs);
 
   Args.AddAllArgs(CmdArgs, options::OPT_undef);
 
@@ -4847,6 +4857,16 @@ void Clang::ConstructJob(Compilation &C, const JobAction &JA,
     CmdArgs.push_back(SplitDwarfOut);
   }
 
+  // Host-side cuda compilation receives device-side outputs as Inputs[1...].
+  // Include them with -fcuda-include-gpubinary.
+  if (IsCuda && Inputs.size() > 1)
+    for (InputInfoList::const_iterator it = std::next(Inputs.begin()),
+                                       ie = Inputs.end();
+         it != ie; ++it) {
+      CmdArgs.push_back("-fcuda-include-gpubinary");
+      CmdArgs.push_back(it->getFilename());
+    }
+
   // Finally add the compile command to the compilation.
   if (Args.hasArg(options::OPT__SLASH_fallback) &&
       Output.getType() == types::TY_Object &&
author	Artem Belevich <tra@google.com>	2015-07-13 20:21:06 +0000
committer	Artem Belevich <tra@google.com>	2015-07-13 20:21:06 +0000
commit	cd42e7f77a788969bc9365b8b0b2f21e2308e04e (patch)
tree	454855373f13ce3944547ca616219084bb0f4bbe /clang/lib/Driver/Tools.cpp
parent	6145ad2d3654350110e25460d0fcd9656a46e36c (diff)
download	llvm-cd42e7f77a788969bc9365b8b0b2f21e2308e04e.zip llvm-cd42e7f77a788969bc9365b8b0b2f21e2308e04e.tar.gz llvm-cd42e7f77a788969bc9365b8b0b2f21e2308e04e.tar.bz2