blob: a73ba8874131bd0c0f6a57c59b42ae072d52a46c [file] [log] [blame]
Tim Northover3b0846e2014-05-24 12:50:23 +00001//===--- AArch64Subtarget.h - Define Subtarget for the AArch64 -*- C++ -*--===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file declares the AArch64 specific subclass of TargetSubtarget.
11//
12//===----------------------------------------------------------------------===//
13
Benjamin Kramera7c40ef2014-08-13 16:26:38 +000014#ifndef LLVM_LIB_TARGET_AARCH64_AARCH64SUBTARGET_H
15#define LLVM_LIB_TARGET_AARCH64_AARCH64SUBTARGET_H
Tim Northover3b0846e2014-05-24 12:50:23 +000016
Eric Christopher29aab7b2014-06-10 17:44:12 +000017#include "AArch64FrameLowering.h"
Eric Christopher841da852014-06-10 23:26:45 +000018#include "AArch64ISelLowering.h"
Benjamin Kramer1f8930e2014-07-25 11:42:14 +000019#include "AArch64InstrInfo.h"
Tim Northover3b0846e2014-05-24 12:50:23 +000020#include "AArch64RegisterInfo.h"
Eric Christopherfcb06ca2014-06-10 18:21:53 +000021#include "AArch64SelectionDAGInfo.h"
Quentin Colombet61d71a12017-08-15 22:31:51 +000022#include "llvm/CodeGen/GlobalISel/CallLowering.h"
23#include "llvm/CodeGen/GlobalISel/InstructionSelector.h"
24#include "llvm/CodeGen/GlobalISel/LegalizerInfo.h"
25#include "llvm/CodeGen/GlobalISel/RegisterBankInfo.h"
David Blaikieb3bde2e2017-11-17 01:07:10 +000026#include "llvm/CodeGen/TargetSubtargetInfo.h"
Eric Christopher6f2a2032014-06-10 18:06:23 +000027#include "llvm/IR/DataLayout.h"
Tim Northover3b0846e2014-05-24 12:50:23 +000028#include <string>
29
30#define GET_SUBTARGETINFO_HEADER
31#include "AArch64GenSubtargetInfo.inc"
32
33namespace llvm {
34class GlobalValue;
35class StringRef;
Daniel Sandersa73f1fd2015-06-10 12:11:26 +000036class Triple;
Tim Northover3b0846e2014-05-24 12:50:23 +000037
Ahmed Bougacha5e402ee2016-07-27 14:31:46 +000038class AArch64Subtarget final : public AArch64GenSubtargetInfo {
Matthias Braun651cff42016-06-02 18:03:53 +000039public:
40 enum ARMProcFamilyEnum : uint8_t {
MinSeong Kima7385eb2016-01-05 12:51:59 +000041 Others,
42 CortexA35,
43 CortexA53,
Sam Parkerb252ffd2017-08-21 08:43:06 +000044 CortexA55,
MinSeong Kima7385eb2016-01-05 12:51:59 +000045 CortexA57,
Silviu Barangaaee40fc2016-06-21 15:53:54 +000046 CortexA72,
47 CortexA73,
Sam Parkerb252ffd2017-08-21 08:43:06 +000048 CortexA75,
MinSeong Kima7385eb2016-01-05 12:51:59 +000049 Cyclone,
Chad Rosiercd2be7f2016-02-12 15:51:51 +000050 ExynosM1,
Chad Rosier201fc1e2016-11-15 21:34:12 +000051 Falkor,
Pankaj Gode0aab2e32016-06-20 11:13:31 +000052 Kryo,
Chad Rosier71070852017-09-25 14:05:00 +000053 Saphira,
Joel Jones28520882017-03-07 19:42:40 +000054 ThunderX2T99,
Joel Jonesab0f3b42017-02-17 18:34:24 +000055 ThunderX,
56 ThunderXT81,
57 ThunderXT83,
58 ThunderXT88
MinSeong Kima7385eb2016-01-05 12:51:59 +000059 };
Tim Northover3b0846e2014-05-24 12:50:23 +000060
Matthias Braun651cff42016-06-02 18:03:53 +000061protected:
Tim Northover3b0846e2014-05-24 12:50:23 +000062 /// ARMProcFamily - ARM processor family: Cortex-A53, Cortex-A57, and others.
Matthias Braun27b66922016-05-27 22:14:09 +000063 ARMProcFamilyEnum ARMProcFamily = Others;
Tim Northover3b0846e2014-05-24 12:50:23 +000064
Matthias Braun27b66922016-05-27 22:14:09 +000065 bool HasV8_1aOps = false;
66 bool HasV8_2aOps = false;
Sam Parker9d957642017-08-10 09:41:00 +000067 bool HasV8_3aOps = false;
Vladimir Sukharev439328e2015-04-01 14:49:29 +000068
Matthias Braun27b66922016-05-27 22:14:09 +000069 bool HasFPARMv8 = false;
70 bool HasNEON = false;
71 bool HasCrypto = false;
Sjoerd Meijer79876332017-08-09 14:59:54 +000072 bool HasDotProd = false;
Matthias Braun27b66922016-05-27 22:14:09 +000073 bool HasCRC = false;
Joel Jones75818bc2016-11-30 22:25:24 +000074 bool HasLSE = false;
Sjoerd Meijerd906bf12016-06-03 14:03:27 +000075 bool HasRAS = false;
Chad Rosier58fb5f52017-01-16 16:28:43 +000076 bool HasRDM = false;
Matthias Braun27b66922016-05-27 22:14:09 +000077 bool HasPerfMon = false;
78 bool HasFullFP16 = false;
79 bool HasSPE = false;
Balaram Makam2aba753e2017-03-31 18:16:53 +000080 bool HasLSLFast = false;
Amara Emerson9f3a2452017-07-13 15:19:56 +000081 bool HasSVE = false;
Sam Parker71a474d2017-08-10 09:52:55 +000082 bool HasRCPC = false;
Tim Northover3b0846e2014-05-24 12:50:23 +000083
84 // HasZeroCycleRegMove - Has zero-cycle register mov instructions.
Matthias Braun27b66922016-05-27 22:14:09 +000085 bool HasZeroCycleRegMove = false;
Tim Northover3b0846e2014-05-24 12:50:23 +000086
87 // HasZeroCycleZeroing - Has zero-cycle zeroing instructions.
Matthias Braun27b66922016-05-27 22:14:09 +000088 bool HasZeroCycleZeroing = false;
Tim Northover3b0846e2014-05-24 12:50:23 +000089
Akira Hatanakaf53b0402015-07-29 14:17:26 +000090 // StrictAlign - Disallow unaligned memory accesses.
Matthias Braun27b66922016-05-27 22:14:09 +000091 bool StrictAlign = false;
Sanne Woudad4658ee2017-03-28 10:02:56 +000092
93 // NegativeImmediates - transform instructions with negative immediates
94 bool NegativeImmediates = true;
95
Adam Nemete29686e2017-05-15 21:15:01 +000096 // Enable 64-bit vectorization in SLP.
97 unsigned MinVectorRegisterBitWidth = 64;
98
Matthias Braun651cff42016-06-02 18:03:53 +000099 bool UseAA = false;
100 bool PredictableSelectIsExpensive = false;
101 bool BalanceFPOps = false;
102 bool CustomAsCheapAsMove = false;
103 bool UsePostRAScheduler = false;
104 bool Misaligned128StoreIsSlow = false;
Evandro Menezes7784cac2017-01-24 17:34:31 +0000105 bool Paired128IsSlow = false;
Geoff Berry40cdc0e2017-08-28 20:48:43 +0000106 bool STRQroIsSlow = false;
Matthias Braun651cff42016-06-02 18:03:53 +0000107 bool UseAlternateSExtLoadCVTF32Pattern = false;
Matthias Braun46a52382016-10-04 19:28:21 +0000108 bool HasArithmeticBccFusion = false;
109 bool HasArithmeticCbzFusion = false;
Evandro Menezesb21fb292017-02-01 02:54:39 +0000110 bool HasFuseAES = false;
Evandro Menezes455382e2017-02-01 02:54:42 +0000111 bool HasFuseLiterals = false;
Matthias Braun651cff42016-06-02 18:03:53 +0000112 bool DisableLatencySchedHeuristic = false;
Evandro Menezeseff2bd92016-10-24 16:14:58 +0000113 bool UseRSqrt = false;
Matthias Braun651cff42016-06-02 18:03:53 +0000114 uint8_t MaxInterleaveFactor = 2;
115 uint8_t VectorInsertExtractBaseCost = 3;
116 uint16_t CacheLineSize = 0;
117 uint16_t PrefetchDistance = 0;
118 uint16_t MinPrefetchStride = 1;
119 unsigned MaxPrefetchIterationsAhead = UINT_MAX;
Evandro Menezesa3a0a602016-06-10 16:00:18 +0000120 unsigned PrefFunctionAlignment = 0;
121 unsigned PrefLoopAlignment = 0;
Evandro Menezese45de8a2016-09-26 15:32:33 +0000122 unsigned MaxJumpTableSize = 0;
Matthew Simpson78fd46b2017-05-09 20:18:12 +0000123 unsigned WideningBaseCost = 0;
Akira Hatanakaf53b0402015-07-29 14:17:26 +0000124
Akira Hatanaka0d4c9ea2015-07-25 00:18:31 +0000125 // ReserveX18 - X18 is not available as a general purpose register.
126 bool ReserveX18;
127
Eric Christopher8b770652015-01-26 19:03:15 +0000128 bool IsLittle;
129
Tim Northover3b0846e2014-05-24 12:50:23 +0000130 /// TargetTriple - What processor and OS we're targeting.
131 Triple TargetTriple;
132
Eric Christopher29aab7b2014-06-10 17:44:12 +0000133 AArch64FrameLowering FrameLowering;
Eric Christopherf63bc642014-06-10 22:57:25 +0000134 AArch64InstrInfo InstrInfo;
Eric Christopherfcb06ca2014-06-10 18:21:53 +0000135 AArch64SelectionDAGInfo TSInfo;
Eric Christopher7c9d4e02014-06-11 00:46:34 +0000136 AArch64TargetLowering TLInfo;
Quentin Colombet61d71a12017-08-15 22:31:51 +0000137
138 /// GlobalISel related APIs.
139 std::unique_ptr<CallLowering> CallLoweringInfo;
140 std::unique_ptr<InstructionSelector> InstSelector;
141 std::unique_ptr<LegalizerInfo> Legalizer;
142 std::unique_ptr<RegisterBankInfo> RegBankInfo;
Quentin Colombetba2a0162016-02-16 19:26:02 +0000143
Eric Christopher7c9d4e02014-06-11 00:46:34 +0000144private:
145 /// initializeSubtargetDependencies - Initializes using CPUString and the
146 /// passed in feature string so that we can use initializer lists for
147 /// subtarget initialization.
Matthias Brauna827ed82016-10-03 20:17:02 +0000148 AArch64Subtarget &initializeSubtargetDependencies(StringRef FS,
149 StringRef CPUString);
Eric Christopher29aab7b2014-06-10 17:44:12 +0000150
Matthias Braun651cff42016-06-02 18:03:53 +0000151 /// Initialize properties based on the selected processor family.
152 void initializeProperties();
153
Tim Northover3b0846e2014-05-24 12:50:23 +0000154public:
155 /// This constructor initializes the data members to match that
156 /// of the specified triple.
Daniel Sandersa73f1fd2015-06-10 12:11:26 +0000157 AArch64Subtarget(const Triple &TT, const std::string &CPU,
Eric Christophera0de2532015-03-18 20:37:30 +0000158 const std::string &FS, const TargetMachine &TM,
Daniel Sandersa1b2db792017-05-19 11:08:33 +0000159 bool LittleEndian);
Tim Northover3b0846e2014-05-24 12:50:23 +0000160
Eric Christopherd9134482014-08-04 21:25:23 +0000161 const AArch64SelectionDAGInfo *getSelectionDAGInfo() const override {
162 return &TSInfo;
163 }
164 const AArch64FrameLowering *getFrameLowering() const override {
Eric Christopher29aab7b2014-06-10 17:44:12 +0000165 return &FrameLowering;
166 }
Eric Christopherd9134482014-08-04 21:25:23 +0000167 const AArch64TargetLowering *getTargetLowering() const override {
Eric Christopher7c9d4e02014-06-11 00:46:34 +0000168 return &TLInfo;
Eric Christopher841da852014-06-10 23:26:45 +0000169 }
Eric Christopherd9134482014-08-04 21:25:23 +0000170 const AArch64InstrInfo *getInstrInfo() const override { return &InstrInfo; }
Eric Christophera0de2532015-03-18 20:37:30 +0000171 const AArch64RegisterInfo *getRegisterInfo() const override {
172 return &getInstrInfo()->getRegisterInfo();
173 }
Quentin Colombetba2a0162016-02-16 19:26:02 +0000174 const CallLowering *getCallLowering() const override;
Ahmed Bougacha6756a2c2016-07-27 14:31:55 +0000175 const InstructionSelector *getInstructionSelector() const override;
Tim Northover69fa84a2016-10-14 22:18:18 +0000176 const LegalizerInfo *getLegalizerInfo() const override;
Quentin Colombetc17f7442016-04-06 17:26:03 +0000177 const RegisterBankInfo *getRegBankInfo() const override;
Eric Christopher09696d32015-03-12 02:04:46 +0000178 const Triple &getTargetTriple() const { return TargetTriple; }
Tim Northover3b0846e2014-05-24 12:50:23 +0000179 bool enableMachineScheduler() const override { return true; }
Matthias Braun39a2afc2015-06-13 03:42:16 +0000180 bool enablePostRAScheduler() const override {
Matthias Braun651cff42016-06-02 18:03:53 +0000181 return UsePostRAScheduler;
182 }
183
184 /// Returns ARM processor family.
185 /// Avoid this function! CPU specifics should be kept local to this class
186 /// and preferably modeled with SubtargetFeatures or properties in
187 /// initializeProperties().
188 ARMProcFamilyEnum getProcFamily() const {
189 return ARMProcFamily;
Chad Rosier486e0872014-09-12 17:40:39 +0000190 }
Tim Northover3b0846e2014-05-24 12:50:23 +0000191
Vladimir Sukharev439328e2015-04-01 14:49:29 +0000192 bool hasV8_1aOps() const { return HasV8_1aOps; }
Oliver Stannard7cc0c4e2015-11-26 15:23:32 +0000193 bool hasV8_2aOps() const { return HasV8_2aOps; }
Sam Parker9d957642017-08-10 09:41:00 +0000194 bool hasV8_3aOps() const { return HasV8_3aOps; }
Vladimir Sukharev439328e2015-04-01 14:49:29 +0000195
Tim Northover3b0846e2014-05-24 12:50:23 +0000196 bool hasZeroCycleRegMove() const { return HasZeroCycleRegMove; }
197
198 bool hasZeroCycleZeroing() const { return HasZeroCycleZeroing; }
199
Akira Hatanakaf53b0402015-07-29 14:17:26 +0000200 bool requiresStrictAlign() const { return StrictAlign; }
201
Dean Michael Berris3234d3a2016-11-17 05:15:37 +0000202 bool isXRaySupported() const override { return true; }
203
Adam Nemete29686e2017-05-15 21:15:01 +0000204 unsigned getMinVectorRegisterBitWidth() const {
205 return MinVectorRegisterBitWidth;
206 }
207
Akira Hatanaka0d4c9ea2015-07-25 00:18:31 +0000208 bool isX18Reserved() const { return ReserveX18; }
Tim Northover3b0846e2014-05-24 12:50:23 +0000209 bool hasFPARMv8() const { return HasFPARMv8; }
210 bool hasNEON() const { return HasNEON; }
211 bool hasCrypto() const { return HasCrypto; }
Sjoerd Meijer79876332017-08-09 14:59:54 +0000212 bool hasDotProd() const { return HasDotProd; }
Tim Northover3b0846e2014-05-24 12:50:23 +0000213 bool hasCRC() const { return HasCRC; }
Joel Jones75818bc2016-11-30 22:25:24 +0000214 bool hasLSE() const { return HasLSE; }
Sjoerd Meijerd906bf12016-06-03 14:03:27 +0000215 bool hasRAS() const { return HasRAS; }
Chad Rosier58fb5f52017-01-16 16:28:43 +0000216 bool hasRDM() const { return HasRDM; }
Matthias Braun651cff42016-06-02 18:03:53 +0000217 bool balanceFPOps() const { return BalanceFPOps; }
218 bool predictableSelectIsExpensive() const {
219 return PredictableSelectIsExpensive;
220 }
221 bool hasCustomCheapAsMoveHandling() const { return CustomAsCheapAsMove; }
222 bool isMisaligned128StoreSlow() const { return Misaligned128StoreIsSlow; }
Evandro Menezes7784cac2017-01-24 17:34:31 +0000223 bool isPaired128Slow() const { return Paired128IsSlow; }
Geoff Berry40cdc0e2017-08-28 20:48:43 +0000224 bool isSTRQroSlow() const { return STRQroIsSlow; }
Matthias Braun651cff42016-06-02 18:03:53 +0000225 bool useAlternateSExtLoadCVTF32Pattern() const {
226 return UseAlternateSExtLoadCVTF32Pattern;
227 }
Matthias Braun46a52382016-10-04 19:28:21 +0000228 bool hasArithmeticBccFusion() const { return HasArithmeticBccFusion; }
229 bool hasArithmeticCbzFusion() const { return HasArithmeticCbzFusion; }
Evandro Menezesb21fb292017-02-01 02:54:39 +0000230 bool hasFuseAES() const { return HasFuseAES; }
Evandro Menezes455382e2017-02-01 02:54:42 +0000231 bool hasFuseLiterals() const { return HasFuseLiterals; }
Florian Hahnf934add2017-07-12 20:53:22 +0000232
233 /// \brief Return true if the CPU supports any kind of instruction fusion.
234 bool hasFusion() const {
235 return hasArithmeticBccFusion() || hasArithmeticCbzFusion() ||
236 hasFuseAES() || hasFuseLiterals();
237 }
238
Evandro Menezeseff2bd92016-10-24 16:14:58 +0000239 bool useRSqrt() const { return UseRSqrt; }
Matthias Braun651cff42016-06-02 18:03:53 +0000240 unsigned getMaxInterleaveFactor() const { return MaxInterleaveFactor; }
241 unsigned getVectorInsertExtractBaseCost() const {
242 return VectorInsertExtractBaseCost;
243 }
244 unsigned getCacheLineSize() const { return CacheLineSize; }
245 unsigned getPrefetchDistance() const { return PrefetchDistance; }
246 unsigned getMinPrefetchStride() const { return MinPrefetchStride; }
247 unsigned getMaxPrefetchIterationsAhead() const {
248 return MaxPrefetchIterationsAhead;
249 }
Evandro Menezesa3a0a602016-06-10 16:00:18 +0000250 unsigned getPrefFunctionAlignment() const { return PrefFunctionAlignment; }
251 unsigned getPrefLoopAlignment() const { return PrefLoopAlignment; }
Matthias Braun651cff42016-06-02 18:03:53 +0000252
Evandro Menezese45de8a2016-09-26 15:32:33 +0000253 unsigned getMaximumJumpTableSize() const { return MaxJumpTableSize; }
254
Matthew Simpson78fd46b2017-05-09 20:18:12 +0000255 unsigned getWideningBaseCost() const { return WideningBaseCost; }
256
Tim Northover339c83e2015-11-10 00:44:23 +0000257 /// CPU has TBI (top byte of addresses is ignored during HW address
258 /// translation) and OS enables it.
259 bool supportsAddressTopByteIgnored() const;
260
Ahmed Bougachab0ff6432015-09-01 16:23:45 +0000261 bool hasPerfMon() const { return HasPerfMon; }
Oliver Stannard7cc0c4e2015-11-26 15:23:32 +0000262 bool hasFullFP16() const { return HasFullFP16; }
Oliver Stannarda34e4702015-12-01 10:48:51 +0000263 bool hasSPE() const { return HasSPE; }
Balaram Makam2aba753e2017-03-31 18:16:53 +0000264 bool hasLSLFast() const { return HasLSLFast; }
Amara Emerson9f3a2452017-07-13 15:19:56 +0000265 bool hasSVE() const { return HasSVE; }
Sam Parker71a474d2017-08-10 09:52:55 +0000266 bool hasRCPC() const { return HasRCPC; }
Tim Northover3b0846e2014-05-24 12:50:23 +0000267
Eric Christopher8b770652015-01-26 19:03:15 +0000268 bool isLittleEndian() const { return IsLittle; }
Tim Northover3b0846e2014-05-24 12:50:23 +0000269
270 bool isTargetDarwin() const { return TargetTriple.isOSDarwin(); }
Chad Rosierb481bdf2014-08-06 16:56:58 +0000271 bool isTargetIOS() const { return TargetTriple.isiOS(); }
272 bool isTargetLinux() const { return TargetTriple.isOSLinux(); }
273 bool isTargetWindows() const { return TargetTriple.isOSWindows(); }
Evgeniy Stepanov5fe279e2015-10-08 21:21:24 +0000274 bool isTargetAndroid() const { return TargetTriple.isAndroid(); }
Petr Hoseka7d59162017-02-24 03:10:10 +0000275 bool isTargetFuchsia() const { return TargetTriple.isOSFuchsia(); }
Tim Northover3b0846e2014-05-24 12:50:23 +0000276
Chad Rosierb481bdf2014-08-06 16:56:58 +0000277 bool isTargetCOFF() const { return TargetTriple.isOSBinFormatCOFF(); }
Tim Northover3b0846e2014-05-24 12:50:23 +0000278 bool isTargetELF() const { return TargetTriple.isOSBinFormatELF(); }
Tim Northover3b0846e2014-05-24 12:50:23 +0000279 bool isTargetMachO() const { return TargetTriple.isOSBinFormatMachO(); }
280
Matthias Braun651cff42016-06-02 18:03:53 +0000281 bool useAA() const override { return UseAA; }
Chad Rosierc9f94772014-09-08 14:31:49 +0000282
Petr Hosek9eb0a1e2017-04-04 19:51:53 +0000283 bool useSmallAddressing() const {
284 switch (TLInfo.getTargetMachine().getCodeModel()) {
285 case CodeModel::Kernel:
286 // Kernel is currently allowed only for Fuchsia targets,
287 // where it is the same as Small for almost all purposes.
288 case CodeModel::Small:
289 return true;
290 default:
291 return false;
292 }
293 }
294
Tim Northover3b0846e2014-05-24 12:50:23 +0000295 /// ParseSubtargetFeatures - Parses features string setting specified
296 /// subtarget options. Definition of function is auto generated by tblgen.
297 void ParseSubtargetFeatures(StringRef CPU, StringRef FS);
298
299 /// ClassifyGlobalReference - Find the target operand flags that describe
300 /// how a global value should be referenced for the current subtarget.
301 unsigned char ClassifyGlobalReference(const GlobalValue *GV,
302 const TargetMachine &TM) const;
303
Tim Northover879a0b22017-04-17 17:27:56 +0000304 unsigned char classifyGlobalFunctionReference(const GlobalValue *GV,
305 const TargetMachine &TM) const;
306
Tim Northover3b0846e2014-05-24 12:50:23 +0000307 /// This function returns the name of a function which has an interface
308 /// like the non-standard bzero function, if such a function exists on
309 /// the current subtarget and it is considered prefereable over
310 /// memset with zero passed as the second argument. Otherwise it
311 /// returns null.
312 const char *getBZeroEntry() const;
313
Duncan P. N. Exon Smith63298722016-07-01 00:23:27 +0000314 void overrideSchedPolicy(MachineSchedPolicy &Policy,
Tim Northover3b0846e2014-05-24 12:50:23 +0000315 unsigned NumRegionInstrs) const override;
316
317 bool enableEarlyIfConversion() const override;
Lang Hames8f31f442014-10-09 18:20:51 +0000318
319 std::unique_ptr<PBQPRAConstraint> getCustomPBQPConstraints() const override;
Martin Storsjo2f24e932017-07-17 20:05:19 +0000320
321 bool isCallingConvWin64(CallingConv::ID CC) const {
322 switch (CC) {
323 case CallingConv::C:
324 return isTargetWindows();
325 case CallingConv::Win64:
326 return true;
327 default:
328 return false;
329 }
330 }
Tim Northover3b0846e2014-05-24 12:50:23 +0000331};
Alexander Kornienkof00654e2015-06-23 09:49:53 +0000332} // End llvm namespace
Tim Northover3b0846e2014-05-24 12:50:23 +0000333
Benjamin Kramera7c40ef2014-08-13 16:26:38 +0000334#endif