[CMake][OpenMP] Customize default offloading arch

For the shuffle instructions in reductions we need at least sm_30, but the user may want to customize the default architecture.

Differential Revision: https://reviews.llvm.org/D38883
llvm-svn: 315996

commit: 30b4418e5ac6c7f4b6f88571c4fe0f2b7d6b37d7 [log] [tgz]
author: Jonas Hahnfeld <hahnjo@hahnjo.de> Tue Oct 17 13:37:36 2017 +0000
committer: Jonas Hahnfeld <hahnjo@hahnjo.de> Tue Oct 17 13:37:36 2017 +0000
tree: 4dd7d460770a8edc8cc3098c35a3ac576d9faf9a
parent: da0183947f9f4ca5a642a4abf2bfeb2a99e7430f [diff]
diff --git a/clang/lib/Driver/ToolChains/Cuda.cpp b/clang/lib/Driver/ToolChains/Cuda.cpp
index 4d040a2..4f740fc 100644
--- a/clang/lib/Driver/ToolChains/Cuda.cpp
+++ b/clang/lib/Driver/ToolChains/Cuda.cpp

@@ -542,9 +542,9 @@
   // flags are not duplicated.
   // Also append the compute capability.
   if (DeviceOffloadKind == Action::OFK_OpenMP) {
-    for (Arg *A : Args){
+    for (Arg *A : Args) {
       bool IsDuplicate = false;
-      for (Arg *DALArg : *DAL){
+      for (Arg *DALArg : *DAL) {
         if (A == DALArg) {
           IsDuplicate = true;
           break;
@@ -555,14 +555,9 @@
     }
 
     StringRef Arch = DAL->getLastArgValue(options::OPT_march_EQ);
-    if (Arch.empty()) {
-      // Default compute capability for CUDA toolchain is the
-      // lowest compute capability supported by the installed
-      // CUDA version.
-      DAL->AddJoinedArg(nullptr,
-          Opts.getOption(options::OPT_march_EQ),
-          CudaInstallation.getLowestExistingArch());
-    }
+    if (Arch.empty())
+      DAL->AddJoinedArg(nullptr, Opts.getOption(options::OPT_march_EQ),
+                        CLANG_OPENMP_NVPTX_DEFAULT_ARCH);
 
     return DAL;
   }

diff --git a/clang/lib/Driver/ToolChains/Cuda.h b/clang/lib/Driver/ToolChains/Cuda.h
index 5144f5b..1e30aa7 100644
--- a/clang/lib/Driver/ToolChains/Cuda.h
+++ b/clang/lib/Driver/ToolChains/Cuda.h

@@ -76,17 +76,6 @@
   std::string getLibDeviceFile(StringRef Gpu) const {
     return LibDeviceMap.lookup(Gpu);
   }
-  /// \brief Get lowest available compute capability
-  /// for which a libdevice library exists.
-  std::string getLowestExistingArch() const {
-    std::string LibDeviceFile;
-    for (auto key : LibDeviceMap.keys()) {
-      LibDeviceFile = LibDeviceMap.lookup(key);
-      if (!LibDeviceFile.empty())
-        return key;
-    }
-    return "sm_20";
-  }
 };
 
 namespace tools {
commit	30b4418e5ac6c7f4b6f88571c4fe0f2b7d6b37d7	[log] [tgz]
author	Jonas Hahnfeld <hahnjo@hahnjo.de>	Tue Oct 17 13:37:36 2017 +0000
committer	Jonas Hahnfeld <hahnjo@hahnjo.de>	Tue Oct 17 13:37:36 2017 +0000
tree	4dd7d460770a8edc8cc3098c35a3ac576d9faf9a
parent	da0183947f9f4ca5a642a4abf2bfeb2a99e7430f [diff]