AMDGPU/SI: Select mad patterns to v_mac_f32 The two-address instruction pass will convert these back to v_mad_f32 if necessary. Differential Revision: http://reviews.llvm.org/D11060 llvm-svn: 242038

commit: db5a11f698cead8bd97b0942cadd29b001bcdf65 [log] [tgz]
author: Tom Stellard <thomas.stellard@amd.com> Mon Jul 13 15:47:57 2015 +0000
committer: Tom Stellard <thomas.stellard@amd.com> Mon Jul 13 15:47:57 2015 +0000
tree: f911d36fff459fbaa57c6568b244e02a03ed442f
parent: 0a43abc9f841246ba2974fe189628d7c45484cb6 [diff] [blame]
diff --git a/llvm/lib/Target/AMDGPU/SIInstructions.td b/llvm/lib/Target/AMDGPU/SIInstructions.td
index 8c8d836..1ee63c6 100644
--- a/llvm/lib/Target/AMDGPU/SIInstructions.td
+++ b/llvm/lib/Target/AMDGPU/SIInstructions.td

@@ -1488,7 +1488,10 @@
 defm V_OR_B32 : VOP2Inst <vop2<0x1c, 0x14>, "v_or_b32", VOP_I32_I32_I32>;
 defm V_XOR_B32 : VOP2Inst <vop2<0x1d, 0x15>, "v_xor_b32", VOP_I32_I32_I32>;
 
-defm V_MAC_F32 : VOP2Inst <vop2<0x1f, 0x16>, "v_mac_f32", VOP_F32_F32_F32>;
+let Constraints = "$dst = $src2", DisableEncoding="$src2",
+    isConvertibleToThreeAddress = 1 in {
+defm V_MAC_F32 : VOP2Inst <vop2<0x1f, 0x16>, "v_mac_f32", VOP_MAC>;
+}
 } // End isCommutable = 1
 
 defm V_MADMK_F32 : VOP2MADK <vop2<0x20, 0x17>, "v_madmk_f32">;
@@ -2206,6 +2209,15 @@
   (V_CNDMASK_B32_e64 $src2, $src1, $src0)
 >;
 
+// Pattern for V_MAC_F32
+def : Pat <
+  (fmad  (VOP3NoMods0 f32:$src0, i32:$src0_modifiers, i1:$clamp, i32:$omod),
+         (VOP3NoMods f32:$src1, i32:$src1_modifiers),
+         (VOP3NoMods f32:$src2, i32:$src2_modifiers)),
+  (V_MAC_F32_e64 $src0_modifiers, $src0, $src1_modifiers, $src1,
+                 $src2_modifiers, $src2, $clamp, $omod)
+>;
+
 /********** ======================= **********/
 /********** Image sampling patterns **********/
 /********** ======================= **********/
commit	db5a11f698cead8bd97b0942cadd29b001bcdf65	[log] [tgz]
author	Tom Stellard <thomas.stellard@amd.com>	Mon Jul 13 15:47:57 2015 +0000
committer	Tom Stellard <thomas.stellard@amd.com>	Mon Jul 13 15:47:57 2015 +0000
tree	f911d36fff459fbaa57c6568b244e02a03ed442f
parent	0a43abc9f841246ba2974fe189628d7c45484cb6 [diff] [blame]