Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 1 | //===-- AMDGPU.h - MachineFunction passes hw codegen --------------*- C++ -*-=// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | /// \file |
| 9 | //===----------------------------------------------------------------------===// |
| 10 | |
Matt Arsenault | 6b6a2c3 | 2016-03-11 08:00:27 +0000 | [diff] [blame] | 11 | #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPU_H |
| 12 | #define LLVM_LIB_TARGET_AMDGPU_AMDGPU_H |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 13 | |
Matt Arsenault | 678e111 | 2017-04-10 17:58:06 +0000 | [diff] [blame] | 14 | #include "MCTargetDesc/AMDGPUMCTargetDesc.h" |
Konstantin Zhuravlyov | 60a8373 | 2016-10-03 18:47:26 +0000 | [diff] [blame] | 15 | #include "llvm/Target/TargetMachine.h" |
| 16 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 17 | namespace llvm { |
| 18 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 19 | class AMDGPUTargetMachine; |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 20 | class FunctionPass; |
Matt Arsenault | a1fe17c | 2016-07-19 23:16:53 +0000 | [diff] [blame] | 21 | class GCNTargetMachine; |
Matt Arsenault | 2ffe8fd | 2016-08-11 19:18:50 +0000 | [diff] [blame] | 22 | class ModulePass; |
| 23 | class Pass; |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 24 | class Target; |
| 25 | class TargetMachine; |
Matt Arsenault | 2ffe8fd | 2016-08-11 19:18:50 +0000 | [diff] [blame] | 26 | class PassRegistry; |
Yaxun Liu | 1a14bfa | 2017-03-27 14:04:01 +0000 | [diff] [blame] | 27 | class Module; |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 28 | |
| 29 | // R600 Passes |
Francis Visoiu Mistrih | 8b61764 | 2017-05-18 17:21:13 +0000 | [diff] [blame] | 30 | FunctionPass *createR600VectorRegMerger(); |
| 31 | FunctionPass *createR600ExpandSpecialInstrsPass(); |
Tom Stellard | 1de5582 | 2013-12-11 17:51:41 +0000 | [diff] [blame] | 32 | FunctionPass *createR600EmitClauseMarkers(); |
Francis Visoiu Mistrih | 8b61764 | 2017-05-18 17:21:13 +0000 | [diff] [blame] | 33 | FunctionPass *createR600ClauseMergePass(); |
| 34 | FunctionPass *createR600Packetizer(); |
| 35 | FunctionPass *createR600ControlFlowFinalizer(); |
Tom Stellard | f2ba972 | 2013-12-11 17:51:47 +0000 | [diff] [blame] | 36 | FunctionPass *createAMDGPUCFGStructurizerPass(); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 37 | |
| 38 | // SI Passes |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 39 | FunctionPass *createSIAnnotateControlFlowPass(); |
Tom Stellard | 6596ba7 | 2014-11-21 22:06:37 +0000 | [diff] [blame] | 40 | FunctionPass *createSIFoldOperandsPass(); |
Sam Kolton | f60ad58 | 2017-03-21 12:51:34 +0000 | [diff] [blame] | 41 | FunctionPass *createSIPeepholeSDWAPass(); |
Tom Stellard | 1bd8072 | 2014-04-30 15:31:33 +0000 | [diff] [blame] | 42 | FunctionPass *createSILowerI1CopiesPass(); |
Tom Stellard | 1aaad69 | 2014-07-21 16:55:33 +0000 | [diff] [blame] | 43 | FunctionPass *createSIShrinkInstructionsPass(); |
Francis Visoiu Mistrih | 8b61764 | 2017-05-18 17:21:13 +0000 | [diff] [blame] | 44 | FunctionPass *createSILoadStoreOptimizerPass(); |
Nicolai Haehnle | 213e87f | 2016-03-21 20:28:33 +0000 | [diff] [blame] | 45 | FunctionPass *createSIWholeQuadModePass(); |
Tom Stellard | 28d13a4 | 2015-05-12 17:13:02 +0000 | [diff] [blame] | 46 | FunctionPass *createSIFixControlFlowLiveIntervalsPass(); |
Stanislav Mekhanoshin | 37e7f95 | 2017-08-01 23:14:32 +0000 | [diff] [blame] | 47 | FunctionPass *createSIOptimizeExecMaskingPreRAPass(); |
Matt Arsenault | 782c03b | 2015-11-03 22:30:13 +0000 | [diff] [blame] | 48 | FunctionPass *createSIFixSGPRCopiesPass(); |
Konstantin Zhuravlyov | e9a5a77 | 2017-07-21 21:19:23 +0000 | [diff] [blame] | 49 | FunctionPass *createSIMemoryLegalizerPass(); |
Konstantin Zhuravlyov | a791932 | 2016-05-10 18:33:41 +0000 | [diff] [blame] | 50 | FunctionPass *createSIDebuggerInsertNopsPass(); |
Tom Stellard | 6e1967e | 2016-02-05 17:42:38 +0000 | [diff] [blame] | 51 | FunctionPass *createSIInsertWaitsPass(); |
Kannan Narayanan | acb089e | 2017-04-12 03:25:12 +0000 | [diff] [blame] | 52 | FunctionPass *createSIInsertWaitcntsPass(); |
Francis Visoiu Mistrih | 8b61764 | 2017-05-18 17:21:13 +0000 | [diff] [blame] | 53 | FunctionPass *createAMDGPUCodeGenPreparePass(); |
Jan Sjodin | a06bfe0 | 2017-05-15 20:18:37 +0000 | [diff] [blame] | 54 | FunctionPass *createAMDGPUMachineCFGStructurizerPass(); |
Matt Arsenault | c06574f | 2017-07-28 18:40:05 +0000 | [diff] [blame] | 55 | FunctionPass *createAMDGPURewriteOutArgumentsPass(); |
Jan Sjodin | a06bfe0 | 2017-05-15 20:18:37 +0000 | [diff] [blame] | 56 | |
| 57 | void initializeAMDGPUMachineCFGStructurizerPass(PassRegistry&); |
| 58 | extern char &AMDGPUMachineCFGStructurizerID; |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 59 | |
Matt Arsenault | 746e065 | 2017-06-02 18:02:42 +0000 | [diff] [blame] | 60 | void initializeAMDGPUAlwaysInlinePass(PassRegistry&); |
| 61 | |
Matt Arsenault | 6b93046 | 2017-07-13 21:43:42 +0000 | [diff] [blame] | 62 | Pass *createAMDGPUAnnotateKernelFeaturesPass(); |
Matt Arsenault | 3931948 | 2015-11-06 18:01:57 +0000 | [diff] [blame] | 63 | void initializeAMDGPUAnnotateKernelFeaturesPass(PassRegistry &); |
| 64 | extern char &AMDGPUAnnotateKernelFeaturesID; |
| 65 | |
Francis Visoiu Mistrih | 8b61764 | 2017-05-18 17:21:13 +0000 | [diff] [blame] | 66 | ModulePass *createAMDGPULowerIntrinsicsPass(); |
Matt Arsenault | 0699ef3 | 2017-02-09 22:00:42 +0000 | [diff] [blame] | 67 | void initializeAMDGPULowerIntrinsicsPass(PassRegistry &); |
| 68 | extern char &AMDGPULowerIntrinsicsID; |
| 69 | |
Matt Arsenault | c06574f | 2017-07-28 18:40:05 +0000 | [diff] [blame] | 70 | void initializeAMDGPURewriteOutArgumentsPass(PassRegistry &); |
| 71 | extern char &AMDGPURewriteOutArgumentsID; |
| 72 | |
Tom Stellard | 6596ba7 | 2014-11-21 22:06:37 +0000 | [diff] [blame] | 73 | void initializeSIFoldOperandsPass(PassRegistry &); |
| 74 | extern char &SIFoldOperandsID; |
| 75 | |
Sam Kolton | f60ad58 | 2017-03-21 12:51:34 +0000 | [diff] [blame] | 76 | void initializeSIPeepholeSDWAPass(PassRegistry &); |
| 77 | extern char &SIPeepholeSDWAID; |
| 78 | |
Matt Arsenault | c3a01ec | 2016-06-09 23:18:47 +0000 | [diff] [blame] | 79 | void initializeSIShrinkInstructionsPass(PassRegistry&); |
| 80 | extern char &SIShrinkInstructionsID; |
| 81 | |
Matt Arsenault | 782c03b | 2015-11-03 22:30:13 +0000 | [diff] [blame] | 82 | void initializeSIFixSGPRCopiesPass(PassRegistry &); |
| 83 | extern char &SIFixSGPRCopiesID; |
| 84 | |
Stanislav Mekhanoshin | 22a56f2 | 2017-01-24 17:46:17 +0000 | [diff] [blame] | 85 | void initializeSIFixVGPRCopiesPass(PassRegistry &); |
| 86 | extern char &SIFixVGPRCopiesID; |
| 87 | |
Tom Stellard | 1bd8072 | 2014-04-30 15:31:33 +0000 | [diff] [blame] | 88 | void initializeSILowerI1CopiesPass(PassRegistry &); |
| 89 | extern char &SILowerI1CopiesID; |
| 90 | |
Matt Arsenault | 4103328 | 2014-10-10 22:01:59 +0000 | [diff] [blame] | 91 | void initializeSILoadStoreOptimizerPass(PassRegistry &); |
| 92 | extern char &SILoadStoreOptimizerID; |
| 93 | |
Nicolai Haehnle | 213e87f | 2016-03-21 20:28:33 +0000 | [diff] [blame] | 94 | void initializeSIWholeQuadModePass(PassRegistry &); |
| 95 | extern char &SIWholeQuadModeID; |
| 96 | |
Matt Arsenault | 55d49cf | 2016-02-12 02:16:10 +0000 | [diff] [blame] | 97 | void initializeSILowerControlFlowPass(PassRegistry &); |
Matt Arsenault | 78fc9da | 2016-08-22 19:33:16 +0000 | [diff] [blame] | 98 | extern char &SILowerControlFlowID; |
Matt Arsenault | 55d49cf | 2016-02-12 02:16:10 +0000 | [diff] [blame] | 99 | |
Matt Arsenault | 78fc9da | 2016-08-22 19:33:16 +0000 | [diff] [blame] | 100 | void initializeSIInsertSkipsPass(PassRegistry &); |
| 101 | extern char &SIInsertSkipsPassID; |
Matt Arsenault | 55d49cf | 2016-02-12 02:16:10 +0000 | [diff] [blame] | 102 | |
Matt Arsenault | e674075 | 2016-09-29 01:44:16 +0000 | [diff] [blame] | 103 | void initializeSIOptimizeExecMaskingPass(PassRegistry &); |
| 104 | extern char &SIOptimizeExecMaskingID; |
| 105 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 106 | // Passes common to R600 and SI |
Francis Visoiu Mistrih | 8b61764 | 2017-05-18 17:21:13 +0000 | [diff] [blame] | 107 | FunctionPass *createAMDGPUPromoteAlloca(); |
Matt Arsenault | e013246 | 2016-01-30 05:19:45 +0000 | [diff] [blame] | 108 | void initializeAMDGPUPromoteAllocaPass(PassRegistry&); |
| 109 | extern char &AMDGPUPromoteAllocaID; |
| 110 | |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 111 | Pass *createAMDGPUStructurizeCFGPass(); |
Konstantin Zhuravlyov | 60a8373 | 2016-10-03 18:47:26 +0000 | [diff] [blame] | 112 | FunctionPass *createAMDGPUISelDag(TargetMachine &TM, |
| 113 | CodeGenOpt::Level OptLevel); |
Stanislav Mekhanoshin | 89653df | 2017-03-30 20:16:02 +0000 | [diff] [blame] | 114 | ModulePass *createAMDGPUAlwaysInlinePass(bool GlobalOpt = true); |
Tom Stellard | fd25395 | 2015-08-07 23:19:30 +0000 | [diff] [blame] | 115 | ModulePass *createAMDGPUOpenCLImageTypeLoweringPass(); |
Tom Stellard | a6f24c6 | 2015-12-15 20:55:55 +0000 | [diff] [blame] | 116 | FunctionPass *createAMDGPUAnnotateUniformValues(); |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 117 | |
Stanislav Mekhanoshin | f6c1feb | 2017-01-27 16:38:10 +0000 | [diff] [blame] | 118 | ModulePass* createAMDGPUUnifyMetadataPass(); |
Stanislav Mekhanoshin | 50ea93a | 2016-12-08 19:46:04 +0000 | [diff] [blame] | 119 | void initializeAMDGPUUnifyMetadataPass(PassRegistry&); |
| 120 | extern char &AMDGPUUnifyMetadataID; |
| 121 | |
Tom Stellard | 28d13a4 | 2015-05-12 17:13:02 +0000 | [diff] [blame] | 122 | void initializeSIFixControlFlowLiveIntervalsPass(PassRegistry&); |
| 123 | extern char &SIFixControlFlowLiveIntervalsID; |
| 124 | |
Stanislav Mekhanoshin | 37e7f95 | 2017-08-01 23:14:32 +0000 | [diff] [blame] | 125 | void initializeSIOptimizeExecMaskingPreRAPass(PassRegistry&); |
| 126 | extern char &SIOptimizeExecMaskingPreRAID; |
| 127 | |
Tom Stellard | a6f24c6 | 2015-12-15 20:55:55 +0000 | [diff] [blame] | 128 | void initializeAMDGPUAnnotateUniformValuesPass(PassRegistry&); |
| 129 | extern char &AMDGPUAnnotateUniformValuesPassID; |
Tom Stellard | b2de94e | 2014-07-02 20:53:48 +0000 | [diff] [blame] | 130 | |
Matt Arsenault | 86de486 | 2016-06-24 07:07:55 +0000 | [diff] [blame] | 131 | void initializeAMDGPUCodeGenPreparePass(PassRegistry&); |
| 132 | extern char &AMDGPUCodeGenPrepareID; |
| 133 | |
Tom Stellard | 77a1777 | 2016-01-20 15:48:27 +0000 | [diff] [blame] | 134 | void initializeSIAnnotateControlFlowPass(PassRegistry&); |
| 135 | extern char &SIAnnotateControlFlowPassID; |
| 136 | |
Konstantin Zhuravlyov | e9a5a77 | 2017-07-21 21:19:23 +0000 | [diff] [blame] | 137 | void initializeSIMemoryLegalizerPass(PassRegistry&); |
| 138 | extern char &SIMemoryLegalizerID; |
| 139 | |
Konstantin Zhuravlyov | a791932 | 2016-05-10 18:33:41 +0000 | [diff] [blame] | 140 | void initializeSIDebuggerInsertNopsPass(PassRegistry&); |
| 141 | extern char &SIDebuggerInsertNopsID; |
Tom Stellard | cc7067a6 | 2016-03-03 03:53:29 +0000 | [diff] [blame] | 142 | |
Tom Stellard | 6e1967e | 2016-02-05 17:42:38 +0000 | [diff] [blame] | 143 | void initializeSIInsertWaitsPass(PassRegistry&); |
| 144 | extern char &SIInsertWaitsID; |
| 145 | |
Kannan Narayanan | acb089e | 2017-04-12 03:25:12 +0000 | [diff] [blame] | 146 | void initializeSIInsertWaitcntsPass(PassRegistry&); |
| 147 | extern char &SIInsertWaitcntsID; |
| 148 | |
Matt Arsenault | b8f8dbc | 2017-03-24 19:52:05 +0000 | [diff] [blame] | 149 | void initializeAMDGPUUnifyDivergentExitNodesPass(PassRegistry&); |
| 150 | extern char &AMDGPUUnifyDivergentExitNodesID; |
| 151 | |
Stanislav Mekhanoshin | 8e45acf | 2017-03-17 23:56:58 +0000 | [diff] [blame] | 152 | ImmutablePass *createAMDGPUAAWrapperPass(); |
| 153 | void initializeAMDGPUAAWrapperPassPass(PassRegistry&); |
| 154 | |
Mehdi Amini | f42454b | 2016-10-09 23:00:34 +0000 | [diff] [blame] | 155 | Target &getTheAMDGPUTarget(); |
| 156 | Target &getTheGCNTarget(); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 157 | |
Tom Stellard | 067c815 | 2014-07-21 14:01:14 +0000 | [diff] [blame] | 158 | namespace AMDGPU { |
| 159 | enum TargetIndex { |
Tom Stellard | 95292bb | 2015-01-20 17:49:47 +0000 | [diff] [blame] | 160 | TI_CONSTDATA_START, |
| 161 | TI_SCRATCH_RSRC_DWORD0, |
| 162 | TI_SCRATCH_RSRC_DWORD1, |
| 163 | TI_SCRATCH_RSRC_DWORD2, |
| 164 | TI_SCRATCH_RSRC_DWORD3 |
Tom Stellard | 067c815 | 2014-07-21 14:01:14 +0000 | [diff] [blame] | 165 | }; |
| 166 | } |
| 167 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 168 | } // End namespace llvm |
| 169 | |
/// OpenCL uses address spaces to differentiate between
/// various memory regions on the hardware. On the CPU
/// all of the address spaces point to the same memory,
/// however on the GPU, each address space points to
/// a separate piece of memory that is unique from other
/// memory locations.
///
/// This struct mixes two kinds of address-space numbers: three per-instance
/// fields whose values are filled in at run time, and a set of class-wide
/// constants whose values are fixed in this header.
struct AMDGPUAS {
  // Some places use this if the address space can't be determined.
  static const unsigned UNKNOWN_ADDRESS_SPACE = ~0u;

  // The following address space values depend on the triple environment.
  // They start out as UNKNOWN_ADDRESS_SPACE so that a default-constructed
  // AMDGPUAS never carries indeterminate values before they are assigned.
  // NOTE(review): under C++11 a default member initializer makes this a
  // non-aggregate; confirm no caller brace-initializes AMDGPUAS positionally.
  unsigned PRIVATE_ADDRESS = UNKNOWN_ADDRESS_SPACE; ///< Address space for private memory.
  unsigned FLAT_ADDRESS = UNKNOWN_ADDRESS_SPACE;    ///< Address space for flat memory.
  unsigned REGION_ADDRESS = UNKNOWN_ADDRESS_SPACE;  ///< Address space for region memory.

  // The maximum value for the common address spaces (described in the
  // original comment as flat, generic, local, private, constant and region).
  // The fixed GLOBAL, CONSTANT and LOCAL values below fall within this bound;
  // the PARAM_* and CONSTANT_BUFFER_* values lie above it.
  static const unsigned MAX_COMMON_ADDRESS = 5;

  static const unsigned GLOBAL_ADDRESS = 1;   ///< Address space for global memory (RAT0, VTX0).
  static const unsigned CONSTANT_ADDRESS = 2; ///< Address space for constant memory (VTX2).
  static const unsigned LOCAL_ADDRESS = 3;    ///< Address space for local memory.
  static const unsigned PARAM_D_ADDRESS = 6;  ///< Address space for directly addressable parameter memory (CONST0).
  static const unsigned PARAM_I_ADDRESS = 7;  ///< Address space for indirectly addressable parameter memory (VTX1).

  // Do not re-order or renumber the CONSTANT_BUFFER_* constants. Several
  // places depend on them being consecutive to be able to dynamically index a
  // constant buffer, for example:
  //
  // ConstantBufferAS = CONSTANT_BUFFER_0 + CBIdx

  static const unsigned CONSTANT_BUFFER_0 = 8;
  static const unsigned CONSTANT_BUFFER_1 = 9;
  static const unsigned CONSTANT_BUFFER_2 = 10;
  static const unsigned CONSTANT_BUFFER_3 = 11;
  static const unsigned CONSTANT_BUFFER_4 = 12;
  static const unsigned CONSTANT_BUFFER_5 = 13;
  static const unsigned CONSTANT_BUFFER_6 = 14;
  static const unsigned CONSTANT_BUFFER_7 = 15;
  static const unsigned CONSTANT_BUFFER_8 = 16;
  static const unsigned CONSTANT_BUFFER_9 = 17;
  static const unsigned CONSTANT_BUFFER_10 = 18;
  static const unsigned CONSTANT_BUFFER_11 = 19;
  static const unsigned CONSTANT_BUFFER_12 = 20;
  static const unsigned CONSTANT_BUFFER_13 = 21;
  static const unsigned CONSTANT_BUFFER_14 = 22;
  static const unsigned CONSTANT_BUFFER_15 = 23;
};
| 216 | |
Yaxun Liu | 1a14bfa | 2017-03-27 14:04:01 +0000 | [diff] [blame] | 217 | namespace llvm { |
| 218 | namespace AMDGPU { |
| 219 | AMDGPUAS getAMDGPUAS(const Module &M); |
| 220 | AMDGPUAS getAMDGPUAS(const TargetMachine &TM); |
| 221 | AMDGPUAS getAMDGPUAS(Triple T); |
| 222 | } // namespace AMDGPU |
| 223 | } // namespace llvm |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 224 | |
Benjamin Kramer | a7c40ef | 2014-08-13 16:26:38 +0000 | [diff] [blame] | 225 | #endif |