[ARM] Add new target feature to fuse literal generation This feature enables the fusion of such operations on Cortex A57 and Cortex A72, as recommended in their Software Optimisation Guides, sections 4.14 and 4.11, respectively. Differential revision: https://reviews.llvm.org/D49563 llvm-svn: 338147

commit: fcca45f0ddb94947009615029bfd480e649abd64 [log] [tgz]
author: Evandro Menezes <e.menezes@samsung.com> Fri Jul 27 18:16:47 2018 +0000
committer: Evandro Menezes <e.menezes@samsung.com> Fri Jul 27 18:16:47 2018 +0000
tree: 36e6eed3a1a1369fc7f9647ccf9765636754a4f4
parent: cdaefac5bd3c6157445ae7a2ec198a9171083802 [diff] [blame]
diff --git a/llvm/lib/Target/ARM/ARMSubtarget.h b/llvm/lib/Target/ARM/ARMSubtarget.h
index 1650779..74aee9a 100644
--- a/llvm/lib/Target/ARM/ARMSubtarget.h
+++ b/llvm/lib/Target/ARM/ARMSubtarget.h

@@ -327,6 +327,10 @@
   /// pairs faster.
   bool HasFuseAES = false;
 
+  /// HasFuseLiterals - if true, processor executes back to back
+  /// bottom and top halves of literal generation faster.
+  bool HasFuseLiterals = false;
+
   /// If true, if conversion may decide to leave some instructions unpredicated.
   bool IsProfitableToUnpredicate = false;
 
@@ -616,8 +620,9 @@
   bool hasFullFP16() const { return HasFullFP16; }
 
   bool hasFuseAES() const { return HasFuseAES; }
+  bool hasFuseLiterals() const { return HasFuseLiterals; }
   /// Return true if the CPU supports any kind of instruction fusion.
-  bool hasFusion() const { return hasFuseAES(); }
+  bool hasFusion() const { return hasFuseAES() || hasFuseLiterals(); }
 
   const Triple &getTargetTriple() const { return TargetTriple; }
commit	fcca45f0ddb94947009615029bfd480e649abd64	[log] [tgz]
author	Evandro Menezes <e.menezes@samsung.com>	Fri Jul 27 18:16:47 2018 +0000
committer	Evandro Menezes <e.menezes@samsung.com>	Fri Jul 27 18:16:47 2018 +0000
tree	36e6eed3a1a1369fc7f9647ccf9765636754a4f4
parent	cdaefac5bd3c6157445ae7a2ec198a9171083802 [diff] [blame]