AMDGPU/GlobalISel: Select G_FABS/G_FNEG. f64 doesn't work yet because tablegen currently doesn't handle REG_SEQUENCE. This does regress some multi-use VALU fneg cases, since the immediate now remains in an SGPR and more moves are used for legalizing the xor. This is a SIFixSGPRCopies deficiency. llvm-svn: 371540

commit: e1895aba3da01df442253bf048e38371377db15e [log] [tgz]
author: Matt Arsenault <Matthew.Arsenault@amd.com> Tue Sep 10 17:19:46 2019 +0000
committer: Matt Arsenault <Matthew.Arsenault@amd.com> Tue Sep 10 17:19:46 2019 +0000
tree: a961bae49e9391414f9c3596d13e1dbb8d93d65b
parent: 7df5b3fd26243a80d97382fdc09ce0374ab98d87 [diff] [blame]
diff --git a/llvm/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp b/llvm/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp
index aa65fb6..9ea4a81 100644
--- a/llvm/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp
+++ b/llvm/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp

@@ -313,7 +313,7 @@
 
 
   auto &FPOpActions = getActionDefinitionsBuilder(
-    { G_FADD, G_FMUL, G_FNEG, G_FABS, G_FMA, G_FCANONICALIZE})
+    { G_FADD, G_FMUL, G_FMA, G_FCANONICALIZE})
     .legalFor({S32, S64});
   auto &TrigActions = getActionDefinitionsBuilder({G_FSIN, G_FCOS})
     .customFor({S32, S64});
@@ -345,9 +345,6 @@
       .scalarize(0);
   }
 
-  // TODO: Implement
-  getActionDefinitionsBuilder({G_FMINIMUM, G_FMAXIMUM}).lower();
-
   if (ST.hasVOP3PInsts())
     FPOpActions.clampMaxNumElements(0, S16, 2);
 
@@ -359,6 +356,15 @@
     .scalarize(0)
     .clampScalar(0, ST.has16BitInsts() ? S16 : S32, S64);
 
+  getActionDefinitionsBuilder({G_FNEG, G_FABS})
+    .legalFor(FPTypesPK16)
+    .clampMaxNumElements(0, S16, 2)
+    .scalarize(0)
+    .clampScalar(0, S16, S64);
+
+  // TODO: Implement
+  getActionDefinitionsBuilder({G_FMINIMUM, G_FMAXIMUM}).lower();
+
   if (ST.has16BitInsts()) {
     getActionDefinitionsBuilder(G_FSQRT)
       .legalFor({S32, S64, S16})
commit	e1895aba3da01df442253bf048e38371377db15e	[log] [tgz]
author	Matt Arsenault <Matthew.Arsenault@amd.com>	Tue Sep 10 17:19:46 2019 +0000
committer	Matt Arsenault <Matthew.Arsenault@amd.com>	Tue Sep 10 17:19:46 2019 +0000
tree	a961bae49e9391414f9c3596d13e1dbb8d93d65b
parent	7df5b3fd26243a80d97382fdc09ce0374ab98d87 [diff] [blame]