[X86] Don't report gather as legal on Skylake CPUs when AVX2/AVX512 is disabled. Allow gather on SKX/CNL/ICL when AVX512 is disabled by using AVX2 instructions.

Summary: This adds a new fast gather feature bit to cover all CPUs that support fast gather, which we can use independently of whether the AVX512 feature is enabled. I'm only using this new bit to qualify AVX2 codegen. AVX512 still implicitly assumes fast gather, to keep tests working and to match the scatter behavior. Test command lines have been added for these two cases.

Reviewers: magabari, delena, RKSimon, zvi
Reviewed By: RKSimon
Subscribers: llvm-commits
Differential Revision: https://reviews.llvm.org/D40282
llvm-svn: 318983

commit: ea37e201ec2f9c3d8b2c9bb37ff48cacdd992f55 [log] [tgz]
author: Craig Topper <craig.topper@intel.com> Sat Nov 25 18:09:37 2017 +0000
committer: Craig Topper <craig.topper@intel.com> Sat Nov 25 18:09:37 2017 +0000
tree: 6bebfa5efe92abba04700e0a8ba456b2e9e7def6
parent: e7426556c16d86d52356b23538708dbea2008a76 [diff] [blame]
diff --git a/llvm/lib/Target/X86/X86Subtarget.h b/llvm/lib/Target/X86/X86Subtarget.h
index c7fc561..faf88ab 100644
--- a/llvm/lib/Target/X86/X86Subtarget.h
+++ b/llvm/lib/Target/X86/X86Subtarget.h

@@ -229,6 +229,10 @@
   /// of a YMM or ZMM register without clearing the upper part.
   bool HasFastPartialYMMorZMMWrite;
 
+  /// True if gather is reasonably fast. This is true for Skylake client and
+  /// all AVX-512 CPUs.
+  bool HasFastGather;
+
   /// True if hardware SQRTSS instruction is at least as fast (latency) as
   /// RSQRTSS followed by a Newton-Raphson iteration.
   bool HasFastScalarFSQRT;
@@ -514,6 +518,7 @@
   bool hasFastPartialYMMorZMMWrite() const {
     return HasFastPartialYMMorZMMWrite;
   }
+  bool hasFastGather() const { return HasFastGather; }
   bool hasFastScalarFSQRT() const { return HasFastScalarFSQRT; }
   bool hasFastVectorFSQRT() const { return HasFastVectorFSQRT; }
   bool hasFastLZCNT() const { return HasFastLZCNT; }
commit	ea37e201ec2f9c3d8b2c9bb37ff48cacdd992f55	[log] [tgz]
author	Craig Topper <craig.topper@intel.com>	Sat Nov 25 18:09:37 2017 +0000
committer	Craig Topper <craig.topper@intel.com>	Sat Nov 25 18:09:37 2017 +0000
tree	6bebfa5efe92abba04700e0a8ba456b2e9e7def6
parent	e7426556c16d86d52356b23538708dbea2008a76 [diff] [blame]