[X86] Add support for passing the 'prefer-vector-width' function attribute into X86Subtarget and exposing it via X86's getRegisterWidth TTI interface. This will cause the vectorizers to limit the vector widths they create. This is not a strict limit: there are cases I know of in which the loop vectorizer will still generate larger vectors. I've written this in such a way that the interface will only return a properly supported width (0/128/256/512) even if the attribute says something funny like 384 or 10. This has been split from D41895, with the remainder in a follow-up commit. llvm-svn: 323015

commit: 0d797a34d8be0707c4f17e88d7d22004d844fbf4 [log] [tgz]
author: Craig Topper <craig.topper@intel.com> Sat Jan 20 00:26:08 2018 +0000
committer: Craig Topper <craig.topper@intel.com> Sat Jan 20 00:26:08 2018 +0000
tree: e350faaa70f176cdc5da5f9d6826a26d54defdfc
parent: 2f8af79927c5902900a7ddeef2300ea92a9fcf22 [diff] [blame]
diff --git a/llvm/lib/Target/X86/X86TargetMachine.cpp b/llvm/lib/Target/X86/X86TargetMachine.cpp
index 48e2073..b3bf926 100644
--- a/llvm/lib/Target/X86/X86TargetMachine.cpp
+++ b/llvm/lib/Target/X86/X86TargetMachine.cpp

@@ -255,7 +255,24 @@
   if (SoftFloat)
     Key += FS.empty() ? "+soft-float" : ",+soft-float";
 
-  FS = Key.substr(CPU.size());
+  // Keep track of the key width after all features are added so we can extract
+  // the feature string out later.
+  unsigned CPUFSWidth = Key.size();
+
+  // Translate vector width function attribute into subtarget features. This
+  // overrides any CPU specific tuning parameter.
+  unsigned PreferVectorWidthOverride = 0;
+  if (F.hasFnAttribute("prefer-vector-width")) {
+    StringRef Val = F.getFnAttribute("prefer-vector-width").getValueAsString();
+    unsigned Width;
+    if (!Val.getAsInteger(0, Width)) {
+      Key += ",prefer-vector-width=";
+      Key += Val;
+      PreferVectorWidthOverride = Width;
+    }
+  }
+
+  FS = Key.slice(CPU.size(), CPUFSWidth);
 
   auto &I = SubtargetMap[Key];
   if (!I) {
@@ -264,7 +281,8 @@
     // function that reside in TargetOptions.
     resetTargetOptions(F);
     I = llvm::make_unique<X86Subtarget>(TargetTriple, CPU, FS, *this,
-                                        Options.StackAlignmentOverride);
+                                        Options.StackAlignmentOverride,
+                                        PreferVectorWidthOverride);
   }
   return I.get();
 }
commit	0d797a34d8be0707c4f17e88d7d22004d844fbf4	[log] [tgz]
author	Craig Topper <craig.topper@intel.com>	Sat Jan 20 00:26:08 2018 +0000
committer	Craig Topper <craig.topper@intel.com>	Sat Jan 20 00:26:08 2018 +0000
tree	e350faaa70f176cdc5da5f9d6826a26d54defdfc
parent	2f8af79927c5902900a7ddeef2300ea92a9fcf22 [diff] [blame]