//===-- AMDGPU.h - MachineFunction passes hw codegen --------------*- C++ -*-=//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
/// \file
/// Declarations of the AMDGPU target's pass factory functions, pass
/// initializers and pass IDs, together with the AMDGPUAS address space
/// description.
//===----------------------------------------------------------------------===//
| 10 | |
Matt Arsenault | 6b6a2c3 | 2016-03-11 08:00:27 +0000 | [diff] [blame] | 11 | #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPU_H |
| 12 | #define LLVM_LIB_TARGET_AMDGPU_AMDGPU_H |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 13 | |
Matt Arsenault | 678e111 | 2017-04-10 17:58:06 +0000 | [diff] [blame^] | 14 | #include "MCTargetDesc/AMDGPUMCTargetDesc.h" |
Konstantin Zhuravlyov | 60a8373 | 2016-10-03 18:47:26 +0000 | [diff] [blame] | 15 | #include "llvm/Target/TargetMachine.h" |
| 16 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 17 | namespace llvm { |
| 18 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 19 | class AMDGPUTargetMachine; |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 20 | class FunctionPass; |
Matt Arsenault | a1fe17c | 2016-07-19 23:16:53 +0000 | [diff] [blame] | 21 | class GCNTargetMachine; |
Matt Arsenault | 2ffe8fd | 2016-08-11 19:18:50 +0000 | [diff] [blame] | 22 | class ModulePass; |
| 23 | class Pass; |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 24 | class Target; |
| 25 | class TargetMachine; |
Matt Arsenault | 2ffe8fd | 2016-08-11 19:18:50 +0000 | [diff] [blame] | 26 | class PassRegistry; |
Yaxun Liu | 1a14bfa | 2017-03-27 14:04:01 +0000 | [diff] [blame] | 27 | class Module; |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 28 | |
| 29 | // R600 Passes |
Vincent Lejeune | dec1875 | 2013-06-05 21:38:04 +0000 | [diff] [blame] | 30 | FunctionPass *createR600VectorRegMerger(TargetMachine &tm); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 31 | FunctionPass *createR600ExpandSpecialInstrsPass(TargetMachine &tm); |
Tom Stellard | 1de5582 | 2013-12-11 17:51:41 +0000 | [diff] [blame] | 32 | FunctionPass *createR600EmitClauseMarkers(); |
Vincent Lejeune | a4da6fb | 2013-10-01 19:32:58 +0000 | [diff] [blame] | 33 | FunctionPass *createR600ClauseMergePass(TargetMachine &tm); |
Vincent Lejeune | 147700b | 2013-04-30 00:14:27 +0000 | [diff] [blame] | 34 | FunctionPass *createR600Packetizer(TargetMachine &tm); |
Vincent Lejeune | bfaa63a6 | 2013-04-01 21:48:05 +0000 | [diff] [blame] | 35 | FunctionPass *createR600ControlFlowFinalizer(TargetMachine &tm); |
Tom Stellard | f2ba972 | 2013-12-11 17:51:47 +0000 | [diff] [blame] | 36 | FunctionPass *createAMDGPUCFGStructurizerPass(); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 37 | |
| 38 | // SI Passes |
Tom Stellard | 9fa1791 | 2013-08-14 23:24:45 +0000 | [diff] [blame] | 39 | FunctionPass *createSITypeRewriter(); |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 40 | FunctionPass *createSIAnnotateControlFlowPass(); |
Tom Stellard | 6596ba7 | 2014-11-21 22:06:37 +0000 | [diff] [blame] | 41 | FunctionPass *createSIFoldOperandsPass(); |
Sam Kolton | f60ad58 | 2017-03-21 12:51:34 +0000 | [diff] [blame] | 42 | FunctionPass *createSIPeepholeSDWAPass(); |
Tom Stellard | 1bd8072 | 2014-04-30 15:31:33 +0000 | [diff] [blame] | 43 | FunctionPass *createSILowerI1CopiesPass(); |
Tom Stellard | 1aaad69 | 2014-07-21 16:55:33 +0000 | [diff] [blame] | 44 | FunctionPass *createSIShrinkInstructionsPass(); |
Matt Arsenault | 4103328 | 2014-10-10 22:01:59 +0000 | [diff] [blame] | 45 | FunctionPass *createSILoadStoreOptimizerPass(TargetMachine &tm); |
Nicolai Haehnle | 213e87f | 2016-03-21 20:28:33 +0000 | [diff] [blame] | 46 | FunctionPass *createSIWholeQuadModePass(); |
Tom Stellard | 28d13a4 | 2015-05-12 17:13:02 +0000 | [diff] [blame] | 47 | FunctionPass *createSIFixControlFlowLiveIntervalsPass(); |
Matt Arsenault | 782c03b | 2015-11-03 22:30:13 +0000 | [diff] [blame] | 48 | FunctionPass *createSIFixSGPRCopiesPass(); |
Konstantin Zhuravlyov | a791932 | 2016-05-10 18:33:41 +0000 | [diff] [blame] | 49 | FunctionPass *createSIDebuggerInsertNopsPass(); |
Tom Stellard | 6e1967e | 2016-02-05 17:42:38 +0000 | [diff] [blame] | 50 | FunctionPass *createSIInsertWaitsPass(); |
Matt Arsenault | a1fe17c | 2016-07-19 23:16:53 +0000 | [diff] [blame] | 51 | FunctionPass *createAMDGPUCodeGenPreparePass(const GCNTargetMachine *TM = nullptr); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 52 | |
Matt Arsenault | e823d92 | 2017-02-18 18:29:53 +0000 | [diff] [blame] | 53 | ModulePass *createAMDGPUAnnotateKernelFeaturesPass(const TargetMachine *TM = nullptr); |
Matt Arsenault | 3931948 | 2015-11-06 18:01:57 +0000 | [diff] [blame] | 54 | void initializeAMDGPUAnnotateKernelFeaturesPass(PassRegistry &); |
| 55 | extern char &AMDGPUAnnotateKernelFeaturesID; |
| 56 | |
Matt Arsenault | 0699ef3 | 2017-02-09 22:00:42 +0000 | [diff] [blame] | 57 | ModulePass *createAMDGPULowerIntrinsicsPass(); |
| 58 | void initializeAMDGPULowerIntrinsicsPass(PassRegistry &); |
| 59 | extern char &AMDGPULowerIntrinsicsID; |
| 60 | |
Tom Stellard | 6596ba7 | 2014-11-21 22:06:37 +0000 | [diff] [blame] | 61 | void initializeSIFoldOperandsPass(PassRegistry &); |
| 62 | extern char &SIFoldOperandsID; |
| 63 | |
Sam Kolton | f60ad58 | 2017-03-21 12:51:34 +0000 | [diff] [blame] | 64 | void initializeSIPeepholeSDWAPass(PassRegistry &); |
| 65 | extern char &SIPeepholeSDWAID; |
| 66 | |
Matt Arsenault | c3a01ec | 2016-06-09 23:18:47 +0000 | [diff] [blame] | 67 | void initializeSIShrinkInstructionsPass(PassRegistry&); |
| 68 | extern char &SIShrinkInstructionsID; |
| 69 | |
Matt Arsenault | 782c03b | 2015-11-03 22:30:13 +0000 | [diff] [blame] | 70 | void initializeSIFixSGPRCopiesPass(PassRegistry &); |
| 71 | extern char &SIFixSGPRCopiesID; |
| 72 | |
Stanislav Mekhanoshin | 22a56f2 | 2017-01-24 17:46:17 +0000 | [diff] [blame] | 73 | void initializeSIFixVGPRCopiesPass(PassRegistry &); |
| 74 | extern char &SIFixVGPRCopiesID; |
| 75 | |
Tom Stellard | 1bd8072 | 2014-04-30 15:31:33 +0000 | [diff] [blame] | 76 | void initializeSILowerI1CopiesPass(PassRegistry &); |
| 77 | extern char &SILowerI1CopiesID; |
| 78 | |
Matt Arsenault | 4103328 | 2014-10-10 22:01:59 +0000 | [diff] [blame] | 79 | void initializeSILoadStoreOptimizerPass(PassRegistry &); |
| 80 | extern char &SILoadStoreOptimizerID; |
| 81 | |
Nicolai Haehnle | 213e87f | 2016-03-21 20:28:33 +0000 | [diff] [blame] | 82 | void initializeSIWholeQuadModePass(PassRegistry &); |
| 83 | extern char &SIWholeQuadModeID; |
| 84 | |
Matt Arsenault | 55d49cf | 2016-02-12 02:16:10 +0000 | [diff] [blame] | 85 | void initializeSILowerControlFlowPass(PassRegistry &); |
Matt Arsenault | 78fc9da | 2016-08-22 19:33:16 +0000 | [diff] [blame] | 86 | extern char &SILowerControlFlowID; |
Matt Arsenault | 55d49cf | 2016-02-12 02:16:10 +0000 | [diff] [blame] | 87 | |
Matt Arsenault | 78fc9da | 2016-08-22 19:33:16 +0000 | [diff] [blame] | 88 | void initializeSIInsertSkipsPass(PassRegistry &); |
| 89 | extern char &SIInsertSkipsPassID; |
Matt Arsenault | 55d49cf | 2016-02-12 02:16:10 +0000 | [diff] [blame] | 90 | |
Matt Arsenault | e674075 | 2016-09-29 01:44:16 +0000 | [diff] [blame] | 91 | void initializeSIOptimizeExecMaskingPass(PassRegistry &); |
| 92 | extern char &SIOptimizeExecMaskingID; |
| 93 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 94 | // Passes common to R600 and SI |
Matt Arsenault | e013246 | 2016-01-30 05:19:45 +0000 | [diff] [blame] | 95 | FunctionPass *createAMDGPUPromoteAlloca(const TargetMachine *TM = nullptr); |
| 96 | void initializeAMDGPUPromoteAllocaPass(PassRegistry&); |
| 97 | extern char &AMDGPUPromoteAllocaID; |
| 98 | |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 99 | Pass *createAMDGPUStructurizeCFGPass(); |
Konstantin Zhuravlyov | 60a8373 | 2016-10-03 18:47:26 +0000 | [diff] [blame] | 100 | FunctionPass *createAMDGPUISelDag(TargetMachine &TM, |
| 101 | CodeGenOpt::Level OptLevel); |
Stanislav Mekhanoshin | 89653df | 2017-03-30 20:16:02 +0000 | [diff] [blame] | 102 | ModulePass *createAMDGPUAlwaysInlinePass(bool GlobalOpt = true); |
Tom Stellard | fd25395 | 2015-08-07 23:19:30 +0000 | [diff] [blame] | 103 | ModulePass *createAMDGPUOpenCLImageTypeLoweringPass(); |
Tom Stellard | a6f24c6 | 2015-12-15 20:55:55 +0000 | [diff] [blame] | 104 | FunctionPass *createAMDGPUAnnotateUniformValues(); |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 105 | |
Stanislav Mekhanoshin | f6c1feb | 2017-01-27 16:38:10 +0000 | [diff] [blame] | 106 | ModulePass* createAMDGPUUnifyMetadataPass(); |
Stanislav Mekhanoshin | 50ea93a | 2016-12-08 19:46:04 +0000 | [diff] [blame] | 107 | void initializeAMDGPUUnifyMetadataPass(PassRegistry&); |
| 108 | extern char &AMDGPUUnifyMetadataID; |
| 109 | |
Tom Stellard | 28d13a4 | 2015-05-12 17:13:02 +0000 | [diff] [blame] | 110 | void initializeSIFixControlFlowLiveIntervalsPass(PassRegistry&); |
| 111 | extern char &SIFixControlFlowLiveIntervalsID; |
| 112 | |
Tom Stellard | a6f24c6 | 2015-12-15 20:55:55 +0000 | [diff] [blame] | 113 | void initializeAMDGPUAnnotateUniformValuesPass(PassRegistry&); |
| 114 | extern char &AMDGPUAnnotateUniformValuesPassID; |
Tom Stellard | b2de94e | 2014-07-02 20:53:48 +0000 | [diff] [blame] | 115 | |
Matt Arsenault | 86de486 | 2016-06-24 07:07:55 +0000 | [diff] [blame] | 116 | void initializeAMDGPUCodeGenPreparePass(PassRegistry&); |
| 117 | extern char &AMDGPUCodeGenPrepareID; |
| 118 | |
Tom Stellard | 77a1777 | 2016-01-20 15:48:27 +0000 | [diff] [blame] | 119 | void initializeSIAnnotateControlFlowPass(PassRegistry&); |
| 120 | extern char &SIAnnotateControlFlowPassID; |
| 121 | |
Konstantin Zhuravlyov | a791932 | 2016-05-10 18:33:41 +0000 | [diff] [blame] | 122 | void initializeSIDebuggerInsertNopsPass(PassRegistry&); |
| 123 | extern char &SIDebuggerInsertNopsID; |
Tom Stellard | cc7067a6 | 2016-03-03 03:53:29 +0000 | [diff] [blame] | 124 | |
Tom Stellard | 6e1967e | 2016-02-05 17:42:38 +0000 | [diff] [blame] | 125 | void initializeSIInsertWaitsPass(PassRegistry&); |
| 126 | extern char &SIInsertWaitsID; |
| 127 | |
Matt Arsenault | b8f8dbc | 2017-03-24 19:52:05 +0000 | [diff] [blame] | 128 | void initializeAMDGPUUnifyDivergentExitNodesPass(PassRegistry&); |
| 129 | extern char &AMDGPUUnifyDivergentExitNodesID; |
| 130 | |
Stanislav Mekhanoshin | 8e45acf | 2017-03-17 23:56:58 +0000 | [diff] [blame] | 131 | ImmutablePass *createAMDGPUAAWrapperPass(); |
| 132 | void initializeAMDGPUAAWrapperPassPass(PassRegistry&); |
| 133 | |
Mehdi Amini | f42454b | 2016-10-09 23:00:34 +0000 | [diff] [blame] | 134 | Target &getTheAMDGPUTarget(); |
| 135 | Target &getTheGCNTarget(); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 136 | |
Tom Stellard | 067c815 | 2014-07-21 14:01:14 +0000 | [diff] [blame] | 137 | namespace AMDGPU { |
| 138 | enum TargetIndex { |
Tom Stellard | 95292bb | 2015-01-20 17:49:47 +0000 | [diff] [blame] | 139 | TI_CONSTDATA_START, |
| 140 | TI_SCRATCH_RSRC_DWORD0, |
| 141 | TI_SCRATCH_RSRC_DWORD1, |
| 142 | TI_SCRATCH_RSRC_DWORD2, |
| 143 | TI_SCRATCH_RSRC_DWORD3 |
Tom Stellard | 067c815 | 2014-07-21 14:01:14 +0000 | [diff] [blame] | 144 | }; |
| 145 | } |
| 146 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 147 | } // End namespace llvm |
| 148 | |
/// OpenCL uses address spaces to differentiate between
/// various memory regions on the hardware. On the CPU
/// all of the address spaces point to the same memory,
/// however on the GPU, each address space points to
/// a separate piece of memory that is unique from other
/// memory locations.
///
/// The struct mixes two kinds of members: three per-instance address space
/// numbers whose values depend on the triple environment, and a set of
/// compile-time constants shared by every instance.
struct AMDGPUAS {
  // The following address space values depend on the triple environment.
  // They have no default member initializers, so a default-constructed
  // AMDGPUAS leaves them indeterminate.
  // NOTE(review): presumably filled in by llvm::AMDGPU::getAMDGPUAS — confirm.
  unsigned PRIVATE_ADDRESS; ///< Address space for private memory.
  unsigned FLAT_ADDRESS;    ///< Address space for flat memory.
  unsigned REGION_ADDRESS;  ///< Address space for region memory.

  // The constants below are `static constexpr` rather than `const static`:
  // the type (const unsigned) and values are unchanged, but under C++17 they
  // are implicitly inline, so ODR-using one (e.g. binding it to the
  // `const unsigned &` parameter of std::max) no longer requires an
  // out-of-class definition.

  // The maximum value for flat, generic, local, private, constant and region.
  static constexpr unsigned MAX_COMMON_ADDRESS = 5;

  /// Address space for global memory (RAT0, VTX0).
  static constexpr unsigned GLOBAL_ADDRESS = 1;
  /// Address space for constant memory (VTX2).
  static constexpr unsigned CONSTANT_ADDRESS = 2;
  /// Address space for local memory.
  static constexpr unsigned LOCAL_ADDRESS = 3;
  /// Address space for directly addressable parameter memory (CONST0).
  static constexpr unsigned PARAM_D_ADDRESS = 6;
  /// Address space for indirectly addressable parameter memory (VTX1).
  static constexpr unsigned PARAM_I_ADDRESS = 7;

  // Do not re-order the CONSTANT_BUFFER_* constants. Several places depend on
  // their values being consecutive to be able to dynamically index a constant
  // buffer, for example:
  //
  // ConstantBufferAS = CONSTANT_BUFFER_0 + CBIdx

  static constexpr unsigned CONSTANT_BUFFER_0 = 8;
  static constexpr unsigned CONSTANT_BUFFER_1 = 9;
  static constexpr unsigned CONSTANT_BUFFER_2 = 10;
  static constexpr unsigned CONSTANT_BUFFER_3 = 11;
  static constexpr unsigned CONSTANT_BUFFER_4 = 12;
  static constexpr unsigned CONSTANT_BUFFER_5 = 13;
  static constexpr unsigned CONSTANT_BUFFER_6 = 14;
  static constexpr unsigned CONSTANT_BUFFER_7 = 15;
  static constexpr unsigned CONSTANT_BUFFER_8 = 16;
  static constexpr unsigned CONSTANT_BUFFER_9 = 17;
  static constexpr unsigned CONSTANT_BUFFER_10 = 18;
  static constexpr unsigned CONSTANT_BUFFER_11 = 19;
  static constexpr unsigned CONSTANT_BUFFER_12 = 20;
  static constexpr unsigned CONSTANT_BUFFER_13 = 21;
  static constexpr unsigned CONSTANT_BUFFER_14 = 22;
  static constexpr unsigned CONSTANT_BUFFER_15 = 23;

  // Some places use this if the address space can't be determined.
  static constexpr unsigned UNKNOWN_ADDRESS_SPACE = ~0u;
};
| 195 | |
Yaxun Liu | 1a14bfa | 2017-03-27 14:04:01 +0000 | [diff] [blame] | 196 | namespace llvm { |
| 197 | namespace AMDGPU { |
| 198 | AMDGPUAS getAMDGPUAS(const Module &M); |
| 199 | AMDGPUAS getAMDGPUAS(const TargetMachine &TM); |
| 200 | AMDGPUAS getAMDGPUAS(Triple T); |
| 201 | } // namespace AMDGPU |
| 202 | } // namespace llvm |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 203 | |
Benjamin Kramer | a7c40ef | 2014-08-13 16:26:38 +0000 | [diff] [blame] | 204 | #endif |