AMDGPU: Restrict extract_vector_elt combine to loads

The intention is to enable the extract_vector_elt load combine, and doing this for other operations interferes with more useful optimizations on vectors. Handle any type of load, since in principle we should do the same combine for the various load intrinsics.

llvm-svn: 341219

commit: bf07a50a98b312c02e7c4c53c701884975d00147 [log] [tgz]
author: Matt Arsenault <Matthew.Arsenault@amd.com> Fri Aug 31 15:39:52 2018 +0000
committer: Matt Arsenault <Matthew.Arsenault@amd.com> Fri Aug 31 15:39:52 2018 +0000
tree: 3f1277382aad9673d9a66b80d2e4663359cbde19
parent: 6f35f0c212bae156de4d504b511f86aba71976da [diff] [blame]
diff --git a/llvm/lib/Target/AMDGPU/SIISelLowering.cpp b/llvm/lib/Target/AMDGPU/SIISelLowering.cpp
index f9f24c7..f89b741 100644
--- a/llvm/lib/Target/AMDGPU/SIISelLowering.cpp
+++ b/llvm/lib/Target/AMDGPU/SIISelLowering.cpp

@@ -7941,7 +7941,8 @@
   // elements. This exposes more load reduction opportunities by replacing
   // multiple small extract_vector_elements with a single 32-bit extract.
   auto *Idx = dyn_cast<ConstantSDNode>(N->getOperand(1));
-  if (EltSize <= 16 &&
+  if (isa<MemSDNode>(Vec) &&
+      EltSize <= 16 &&
       EltVT.isByteSized() &&
       VecSize > 32 &&
       VecSize % 32 == 0 &&
commit	bf07a50a98b312c02e7c4c53c701884975d00147	[log] [tgz]
author	Matt Arsenault <Matthew.Arsenault@amd.com>	Fri Aug 31 15:39:52 2018 +0000
committer	Matt Arsenault <Matthew.Arsenault@amd.com>	Fri Aug 31 15:39:52 2018 +0000
tree	3f1277382aad9673d9a66b80d2e4663359cbde19
parent	6f35f0c212bae156de4d504b511f86aba71976da [diff] [blame]