Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 1 | //===-- RegAllocGreedy.cpp - greedy register allocator --------------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file defines the RAGreedy function pass for register allocation in |
| 11 | // optimized builds. |
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
| 15 | #define DEBUG_TYPE "regalloc" |
Jakob Stoklund Olesen | dd479e9 | 2010-12-10 22:21:05 +0000 | [diff] [blame] | 16 | #include "AllocationOrder.h" |
Jakob Stoklund Olesen | 5907d86 | 2011-04-02 06:03:35 +0000 | [diff] [blame] | 17 | #include "InterferenceCache.h" |
Jakob Stoklund Olesen | cfafc54 | 2011-04-05 21:40:37 +0000 | [diff] [blame] | 18 | #include "LiveDebugVariables.h" |
Jakob Stoklund Olesen | f428eb6 | 2010-12-17 23:16:32 +0000 | [diff] [blame] | 19 | #include "LiveRangeEdit.h" |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 20 | #include "RegAllocBase.h" |
| 21 | #include "Spiller.h" |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 22 | #include "SpillPlacement.h" |
Jakob Stoklund Olesen | d0bb5e2 | 2010-12-15 23:46:13 +0000 | [diff] [blame] | 23 | #include "SplitKit.h" |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 24 | #include "VirtRegMap.h" |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 25 | #include "llvm/ADT/SparseBitVector.h" |
Jakob Stoklund Olesen | 0db841f | 2011-02-17 22:53:48 +0000 | [diff] [blame] | 26 | #include "llvm/ADT/Statistic.h" |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 27 | #include "llvm/Analysis/AliasAnalysis.h" |
| 28 | #include "llvm/Function.h" |
| 29 | #include "llvm/PassAnalysisSupport.h" |
| 30 | #include "llvm/CodeGen/CalcSpillWeights.h" |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 31 | #include "llvm/CodeGen/EdgeBundles.h" |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 32 | #include "llvm/CodeGen/LiveIntervalAnalysis.h" |
| 33 | #include "llvm/CodeGen/LiveStackAnalysis.h" |
Jakob Stoklund Olesen | f428eb6 | 2010-12-17 23:16:32 +0000 | [diff] [blame] | 34 | #include "llvm/CodeGen/MachineDominators.h" |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 35 | #include "llvm/CodeGen/MachineFunctionPass.h" |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 36 | #include "llvm/CodeGen/MachineLoopInfo.h" |
Jakob Stoklund Olesen | d0bb5e2 | 2010-12-15 23:46:13 +0000 | [diff] [blame] | 37 | #include "llvm/CodeGen/MachineLoopRanges.h" |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 38 | #include "llvm/CodeGen/MachineRegisterInfo.h" |
| 39 | #include "llvm/CodeGen/Passes.h" |
| 40 | #include "llvm/CodeGen/RegAllocRegistry.h" |
| 41 | #include "llvm/CodeGen/RegisterCoalescer.h" |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 42 | #include "llvm/Target/TargetOptions.h" |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 43 | #include "llvm/Support/Debug.h" |
| 44 | #include "llvm/Support/ErrorHandling.h" |
| 45 | #include "llvm/Support/raw_ostream.h" |
Jakob Stoklund Olesen | 533f58e | 2010-12-11 00:19:56 +0000 | [diff] [blame] | 46 | #include "llvm/Support/Timer.h" |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 47 | |
Jakob Stoklund Olesen | 98d9648 | 2011-02-22 23:01:52 +0000 | [diff] [blame] | 48 | #include <queue> |
| 49 | |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 50 | using namespace llvm; |
| 51 | |
Jakob Stoklund Olesen | 0db841f | 2011-02-17 22:53:48 +0000 | [diff] [blame] | 52 | STATISTIC(NumGlobalSplits, "Number of split global live ranges"); |
| 53 | STATISTIC(NumLocalSplits, "Number of split local live ranges"); |
Jakob Stoklund Olesen | 0db841f | 2011-02-17 22:53:48 +0000 | [diff] [blame] | 54 | STATISTIC(NumEvicted, "Number of interferences evicted"); |
| 55 | |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 56 | static RegisterRegAlloc greedyRegAlloc("greedy", "greedy register allocator", |
| 57 | createGreedyRegisterAllocator); |
| 58 | |
| 59 | namespace { |
Jakob Stoklund Olesen | 92a55f4 | 2011-03-09 00:57:29 +0000 | [diff] [blame] | 60 | class RAGreedy : public MachineFunctionPass, |
| 61 | public RegAllocBase, |
| 62 | private LiveRangeEdit::Delegate { |
| 63 | |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 64 | // context |
| 65 | MachineFunction *MF; |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 66 | BitVector ReservedRegs; |
| 67 | |
| 68 | // analyses |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 69 | SlotIndexes *Indexes; |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 70 | LiveStacks *LS; |
Jakob Stoklund Olesen | f428eb6 | 2010-12-17 23:16:32 +0000 | [diff] [blame] | 71 | MachineDominatorTree *DomTree; |
Jakob Stoklund Olesen | d0bb5e2 | 2010-12-15 23:46:13 +0000 | [diff] [blame] | 72 | MachineLoopInfo *Loops; |
| 73 | MachineLoopRanges *LoopRanges; |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 74 | EdgeBundles *Bundles; |
| 75 | SpillPlacement *SpillPlacer; |
Jakob Stoklund Olesen | f428eb6 | 2010-12-17 23:16:32 +0000 | [diff] [blame] | 76 | |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 77 | // state |
| 78 | std::auto_ptr<Spiller> SpillerInstance; |
Jakob Stoklund Olesen | 98d9648 | 2011-02-22 23:01:52 +0000 | [diff] [blame] | 79 | std::priority_queue<std::pair<unsigned, unsigned> > Queue; |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 80 | |
| 81 | // Live ranges pass through a number of stages as we try to allocate them. |
| 82 | // Some of the stages may also create new live ranges: |
| 83 | // |
| 84 | // - Region splitting. |
| 85 | // - Per-block splitting. |
| 86 | // - Local splitting. |
| 87 | // - Spilling. |
| 88 | // |
| 89 | // Ranges produced by one of the stages skip the previous stages when they are |
| 90 | // dequeued. This improves performance because we can skip interference checks |
| 91 | // that are unlikely to give any results. It also guarantees that the live |
| 92 | // range splitting algorithm terminates, something that is otherwise hard to |
| 93 | // ensure. |
| 94 | enum LiveRangeStage { |
Jakob Stoklund Olesen | f22ca3f | 2011-03-30 02:52:39 +0000 | [diff] [blame] | 95 | RS_New, ///< Never seen before. |
| 96 | RS_First, ///< First time in the queue. |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 97 | RS_Second, ///< Second time in the queue. |
| 98 | RS_Region, ///< Produced by region splitting. |
| 99 | RS_Block, ///< Produced by per-block splitting. |
| 100 | RS_Local, ///< Produced by local splitting. |
| 101 | RS_Spill ///< Produced by spilling. |
| 102 | }; |
| 103 | |
| 104 | IndexedMap<unsigned char, VirtReg2IndexFunctor> LRStage; |
| 105 | |
| 106 | LiveRangeStage getStage(const LiveInterval &VirtReg) const { |
| 107 | return LiveRangeStage(LRStage[VirtReg.reg]); |
| 108 | } |
| 109 | |
| 110 | template<typename Iterator> |
| 111 | void setStage(Iterator Begin, Iterator End, LiveRangeStage NewStage) { |
| 112 | LRStage.resize(MRI->getNumVirtRegs()); |
Jakob Stoklund Olesen | f22ca3f | 2011-03-30 02:52:39 +0000 | [diff] [blame] | 113 | for (;Begin != End; ++Begin) { |
| 114 | unsigned Reg = (*Begin)->reg; |
| 115 | if (LRStage[Reg] == RS_New) |
| 116 | LRStage[Reg] = NewStage; |
| 117 | } |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 118 | } |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 119 | |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 120 | // splitting state. |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 121 | std::auto_ptr<SplitAnalysis> SA; |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 122 | std::auto_ptr<SplitEditor> SE; |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 123 | |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 124 | /// Cached per-block interference maps |
| 125 | InterferenceCache IntfCache; |
| 126 | |
Jakob Stoklund Olesen | 7b41fbe | 2011-04-07 17:27:46 +0000 | [diff] [blame] | 127 | /// All basic blocks where the current register has uses. |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 128 | SmallVector<SpillPlacement::BlockConstraint, 8> SplitConstraints; |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 129 | |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 130 | /// Live-through blocks that have already been added to SpillPlacer. |
| 131 | SparseBitVector<> ActiveThroughBlocks; |
Jakob Stoklund Olesen | 7b41fbe | 2011-04-07 17:27:46 +0000 | [diff] [blame] | 132 | |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 133 | /// Global live range splitting candidate info. |
| 134 | struct GlobalSplitCandidate { |
| 135 | unsigned PhysReg; |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 136 | BitVector LiveBundles; |
| 137 | }; |
| 138 | |
| 139 | /// Candidate info for for each PhysReg in AllocationOrder. |
| 140 | /// This vector never shrinks, but grows to the size of the largest register |
| 141 | /// class. |
| 142 | SmallVector<GlobalSplitCandidate, 32> GlobalCand; |
| 143 | |
Jakob Stoklund Olesen | 034a80d | 2011-02-17 19:13:53 +0000 | [diff] [blame] | 144 | /// For every instruction in SA->UseSlots, store the previous non-copy |
| 145 | /// instruction. |
| 146 | SmallVector<SlotIndex, 8> PrevSlot; |
| 147 | |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 148 | public: |
| 149 | RAGreedy(); |
| 150 | |
| 151 | /// Return the pass name. |
| 152 | virtual const char* getPassName() const { |
Jakob Stoklund Olesen | 533f58e | 2010-12-11 00:19:56 +0000 | [diff] [blame] | 153 | return "Greedy Register Allocator"; |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 154 | } |
| 155 | |
| 156 | /// RAGreedy analysis usage. |
| 157 | virtual void getAnalysisUsage(AnalysisUsage &AU) const; |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 158 | virtual void releaseMemory(); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 159 | virtual Spiller &spiller() { return *SpillerInstance; } |
Jakob Stoklund Olesen | 98d9648 | 2011-02-22 23:01:52 +0000 | [diff] [blame] | 160 | virtual void enqueue(LiveInterval *LI); |
| 161 | virtual LiveInterval *dequeue(); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 162 | virtual unsigned selectOrSplit(LiveInterval&, |
| 163 | SmallVectorImpl<LiveInterval*>&); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 164 | |
| 165 | /// Perform register allocation. |
| 166 | virtual bool runOnMachineFunction(MachineFunction &mf); |
| 167 | |
| 168 | static char ID; |
Andrew Trick | b853e6c | 2010-12-09 18:15:21 +0000 | [diff] [blame] | 169 | |
| 170 | private: |
Jakob Stoklund Olesen | 92a55f4 | 2011-03-09 00:57:29 +0000 | [diff] [blame] | 171 | void LRE_WillEraseInstruction(MachineInstr*); |
Jakob Stoklund Olesen | 7792e98 | 2011-03-13 01:23:11 +0000 | [diff] [blame] | 172 | bool LRE_CanEraseVirtReg(unsigned); |
Jakob Stoklund Olesen | 1d5b845 | 2011-03-16 22:56:16 +0000 | [diff] [blame] | 173 | void LRE_WillShrinkVirtReg(unsigned); |
Jakob Stoklund Olesen | f22ca3f | 2011-03-30 02:52:39 +0000 | [diff] [blame] | 174 | void LRE_DidCloneVirtReg(unsigned, unsigned); |
Jakob Stoklund Olesen | 92a55f4 | 2011-03-09 00:57:29 +0000 | [diff] [blame] | 175 | |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 176 | bool addSplitConstraints(InterferenceCache::Cursor, float&); |
| 177 | void addThroughConstraints(InterferenceCache::Cursor, ArrayRef<unsigned>); |
| 178 | void growRegion(InterferenceCache::Cursor); |
Jakob Stoklund Olesen | 9a54352 | 2011-04-06 21:32:41 +0000 | [diff] [blame] | 179 | float calcGlobalSplitCost(unsigned, const BitVector&); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 180 | void splitAroundRegion(LiveInterval&, unsigned, const BitVector&, |
| 181 | SmallVectorImpl<LiveInterval*>&); |
Jakob Stoklund Olesen | 034a80d | 2011-02-17 19:13:53 +0000 | [diff] [blame] | 182 | void calcGapWeights(unsigned, SmallVectorImpl<float>&); |
| 183 | SlotIndex getPrevMappedIndex(const MachineInstr*); |
| 184 | void calcPrevSlots(); |
| 185 | unsigned nextSplitPoint(unsigned); |
Jakob Stoklund Olesen | d17924b | 2011-03-04 21:32:50 +0000 | [diff] [blame] | 186 | bool canEvictInterference(LiveInterval&, unsigned, float&); |
Jakob Stoklund Olesen | b64d92e | 2010-12-14 00:37:44 +0000 | [diff] [blame] | 187 | |
Jakob Stoklund Olesen | 98c8141 | 2011-02-23 00:29:52 +0000 | [diff] [blame] | 188 | unsigned tryEvict(LiveInterval&, AllocationOrder&, |
| 189 | SmallVectorImpl<LiveInterval*>&); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 190 | unsigned tryRegionSplit(LiveInterval&, AllocationOrder&, |
| 191 | SmallVectorImpl<LiveInterval*>&); |
Jakob Stoklund Olesen | 034a80d | 2011-02-17 19:13:53 +0000 | [diff] [blame] | 192 | unsigned tryLocalSplit(LiveInterval&, AllocationOrder&, |
| 193 | SmallVectorImpl<LiveInterval*>&); |
Jakob Stoklund Olesen | b64d92e | 2010-12-14 00:37:44 +0000 | [diff] [blame] | 194 | unsigned trySplit(LiveInterval&, AllocationOrder&, |
| 195 | SmallVectorImpl<LiveInterval*>&); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 196 | }; |
| 197 | } // end anonymous namespace |
| 198 | |
| 199 | char RAGreedy::ID = 0; |
| 200 | |
| 201 | FunctionPass* llvm::createGreedyRegisterAllocator() { |
| 202 | return new RAGreedy(); |
| 203 | } |
| 204 | |
Jakob Stoklund Olesen | f22ca3f | 2011-03-30 02:52:39 +0000 | [diff] [blame] | 205 | RAGreedy::RAGreedy(): MachineFunctionPass(ID), LRStage(RS_New) { |
Jakob Stoklund Olesen | cfafc54 | 2011-04-05 21:40:37 +0000 | [diff] [blame] | 206 | initializeLiveDebugVariablesPass(*PassRegistry::getPassRegistry()); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 207 | initializeSlotIndexesPass(*PassRegistry::getPassRegistry()); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 208 | initializeLiveIntervalsPass(*PassRegistry::getPassRegistry()); |
| 209 | initializeSlotIndexesPass(*PassRegistry::getPassRegistry()); |
| 210 | initializeStrongPHIEliminationPass(*PassRegistry::getPassRegistry()); |
| 211 | initializeRegisterCoalescerAnalysisGroup(*PassRegistry::getPassRegistry()); |
| 212 | initializeCalculateSpillWeightsPass(*PassRegistry::getPassRegistry()); |
| 213 | initializeLiveStacksPass(*PassRegistry::getPassRegistry()); |
| 214 | initializeMachineDominatorTreePass(*PassRegistry::getPassRegistry()); |
| 215 | initializeMachineLoopInfoPass(*PassRegistry::getPassRegistry()); |
Jakob Stoklund Olesen | d0bb5e2 | 2010-12-15 23:46:13 +0000 | [diff] [blame] | 216 | initializeMachineLoopRangesPass(*PassRegistry::getPassRegistry()); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 217 | initializeVirtRegMapPass(*PassRegistry::getPassRegistry()); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 218 | initializeEdgeBundlesPass(*PassRegistry::getPassRegistry()); |
| 219 | initializeSpillPlacementPass(*PassRegistry::getPassRegistry()); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 220 | } |
| 221 | |
| 222 | void RAGreedy::getAnalysisUsage(AnalysisUsage &AU) const { |
| 223 | AU.setPreservesCFG(); |
| 224 | AU.addRequired<AliasAnalysis>(); |
| 225 | AU.addPreserved<AliasAnalysis>(); |
| 226 | AU.addRequired<LiveIntervals>(); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 227 | AU.addRequired<SlotIndexes>(); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 228 | AU.addPreserved<SlotIndexes>(); |
Jakob Stoklund Olesen | cfafc54 | 2011-04-05 21:40:37 +0000 | [diff] [blame] | 229 | AU.addRequired<LiveDebugVariables>(); |
| 230 | AU.addPreserved<LiveDebugVariables>(); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 231 | if (StrongPHIElim) |
| 232 | AU.addRequiredID(StrongPHIEliminationID); |
| 233 | AU.addRequiredTransitive<RegisterCoalescer>(); |
| 234 | AU.addRequired<CalculateSpillWeights>(); |
| 235 | AU.addRequired<LiveStacks>(); |
| 236 | AU.addPreserved<LiveStacks>(); |
Jakob Stoklund Olesen | f428eb6 | 2010-12-17 23:16:32 +0000 | [diff] [blame] | 237 | AU.addRequired<MachineDominatorTree>(); |
| 238 | AU.addPreserved<MachineDominatorTree>(); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 239 | AU.addRequired<MachineLoopInfo>(); |
| 240 | AU.addPreserved<MachineLoopInfo>(); |
Jakob Stoklund Olesen | d0bb5e2 | 2010-12-15 23:46:13 +0000 | [diff] [blame] | 241 | AU.addRequired<MachineLoopRanges>(); |
| 242 | AU.addPreserved<MachineLoopRanges>(); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 243 | AU.addRequired<VirtRegMap>(); |
| 244 | AU.addPreserved<VirtRegMap>(); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 245 | AU.addRequired<EdgeBundles>(); |
| 246 | AU.addRequired<SpillPlacement>(); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 247 | MachineFunctionPass::getAnalysisUsage(AU); |
| 248 | } |
| 249 | |
Jakob Stoklund Olesen | 92a55f4 | 2011-03-09 00:57:29 +0000 | [diff] [blame] | 250 | |
| 251 | //===----------------------------------------------------------------------===// |
| 252 | // LiveRangeEdit delegate methods |
| 253 | //===----------------------------------------------------------------------===// |
| 254 | |
| 255 | void RAGreedy::LRE_WillEraseInstruction(MachineInstr *MI) { |
| 256 | // LRE itself will remove from SlotIndexes and parent basic block. |
| 257 | VRM->RemoveMachineInstrFromMaps(MI); |
| 258 | } |
| 259 | |
Jakob Stoklund Olesen | 7792e98 | 2011-03-13 01:23:11 +0000 | [diff] [blame] | 260 | bool RAGreedy::LRE_CanEraseVirtReg(unsigned VirtReg) { |
| 261 | if (unsigned PhysReg = VRM->getPhys(VirtReg)) { |
| 262 | unassign(LIS->getInterval(VirtReg), PhysReg); |
| 263 | return true; |
| 264 | } |
| 265 | // Unassigned virtreg is probably in the priority queue. |
| 266 | // RegAllocBase will erase it after dequeueing. |
| 267 | return false; |
| 268 | } |
Jakob Stoklund Olesen | 92a55f4 | 2011-03-09 00:57:29 +0000 | [diff] [blame] | 269 | |
Jakob Stoklund Olesen | 1d5b845 | 2011-03-16 22:56:16 +0000 | [diff] [blame] | 270 | void RAGreedy::LRE_WillShrinkVirtReg(unsigned VirtReg) { |
| 271 | unsigned PhysReg = VRM->getPhys(VirtReg); |
| 272 | if (!PhysReg) |
| 273 | return; |
| 274 | |
| 275 | // Register is assigned, put it back on the queue for reassignment. |
| 276 | LiveInterval &LI = LIS->getInterval(VirtReg); |
| 277 | unassign(LI, PhysReg); |
| 278 | enqueue(&LI); |
| 279 | } |
| 280 | |
Jakob Stoklund Olesen | f22ca3f | 2011-03-30 02:52:39 +0000 | [diff] [blame] | 281 | void RAGreedy::LRE_DidCloneVirtReg(unsigned New, unsigned Old) { |
| 282 | // LRE may clone a virtual register because dead code elimination causes it to |
| 283 | // be split into connected components. Ensure that the new register gets the |
| 284 | // same stage as the parent. |
| 285 | LRStage.grow(New); |
| 286 | LRStage[New] = LRStage[Old]; |
| 287 | } |
| 288 | |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 289 | void RAGreedy::releaseMemory() { |
| 290 | SpillerInstance.reset(0); |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 291 | LRStage.clear(); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 292 | RegAllocBase::releaseMemory(); |
| 293 | } |
| 294 | |
Jakob Stoklund Olesen | 98d9648 | 2011-02-22 23:01:52 +0000 | [diff] [blame] | 295 | void RAGreedy::enqueue(LiveInterval *LI) { |
| 296 | // Prioritize live ranges by size, assigning larger ranges first. |
| 297 | // The queue holds (size, reg) pairs. |
Jakob Stoklund Olesen | 107d366 | 2011-02-24 23:21:36 +0000 | [diff] [blame] | 298 | const unsigned Size = LI->getSize(); |
| 299 | const unsigned Reg = LI->reg; |
Jakob Stoklund Olesen | 98d9648 | 2011-02-22 23:01:52 +0000 | [diff] [blame] | 300 | assert(TargetRegisterInfo::isVirtualRegister(Reg) && |
| 301 | "Can only enqueue virtual registers"); |
Jakob Stoklund Olesen | 107d366 | 2011-02-24 23:21:36 +0000 | [diff] [blame] | 302 | unsigned Prio; |
Jakob Stoklund Olesen | 90c1d7d | 2010-12-08 22:57:16 +0000 | [diff] [blame] | 303 | |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 304 | LRStage.grow(Reg); |
Jakob Stoklund Olesen | f22ca3f | 2011-03-30 02:52:39 +0000 | [diff] [blame] | 305 | if (LRStage[Reg] == RS_New) |
| 306 | LRStage[Reg] = RS_First; |
| 307 | |
Jakob Stoklund Olesen | eb29157 | 2011-03-27 22:49:21 +0000 | [diff] [blame] | 308 | if (LRStage[Reg] == RS_Second) |
| 309 | // Unsplit ranges that couldn't be allocated immediately are deferred until |
| 310 | // everything else has been allocated. Long ranges are allocated last so |
| 311 | // they are split against realistic interference. |
| 312 | Prio = (1u << 31) - Size; |
| 313 | else { |
| 314 | // Everything else is allocated in long->short order. Long ranges that don't |
| 315 | // fit should be spilled ASAP so they don't create interference. |
Jakob Stoklund Olesen | 107d366 | 2011-02-24 23:21:36 +0000 | [diff] [blame] | 316 | Prio = (1u << 31) + Size; |
Jakob Stoklund Olesen | d2a5073 | 2011-02-23 00:56:56 +0000 | [diff] [blame] | 317 | |
Jakob Stoklund Olesen | eb29157 | 2011-03-27 22:49:21 +0000 | [diff] [blame] | 318 | // Boost ranges that have a physical register hint. |
| 319 | if (TargetRegisterInfo::isPhysicalRegister(VRM->getRegAllocPref(Reg))) |
| 320 | Prio |= (1u << 30); |
| 321 | } |
Jakob Stoklund Olesen | 107d366 | 2011-02-24 23:21:36 +0000 | [diff] [blame] | 322 | |
| 323 | Queue.push(std::make_pair(Prio, Reg)); |
Jakob Stoklund Olesen | 90c1d7d | 2010-12-08 22:57:16 +0000 | [diff] [blame] | 324 | } |
| 325 | |
Jakob Stoklund Olesen | 98d9648 | 2011-02-22 23:01:52 +0000 | [diff] [blame] | 326 | LiveInterval *RAGreedy::dequeue() { |
| 327 | if (Queue.empty()) |
| 328 | return 0; |
| 329 | LiveInterval *LI = &LIS->getInterval(Queue.top().second); |
| 330 | Queue.pop(); |
| 331 | return LI; |
| 332 | } |
Jakob Stoklund Olesen | 770d42d | 2010-12-22 22:01:30 +0000 | [diff] [blame] | 333 | |
| 334 | //===----------------------------------------------------------------------===// |
Jakob Stoklund Olesen | 98c8141 | 2011-02-23 00:29:52 +0000 | [diff] [blame] | 335 | // Interference eviction |
| 336 | //===----------------------------------------------------------------------===// |
| 337 | |
| 338 | /// canEvict - Return true if all interferences between VirtReg and PhysReg can |
| 339 | /// be evicted. Set maxWeight to the maximal spill weight of an interference. |
| 340 | bool RAGreedy::canEvictInterference(LiveInterval &VirtReg, unsigned PhysReg, |
Jakob Stoklund Olesen | d17924b | 2011-03-04 21:32:50 +0000 | [diff] [blame] | 341 | float &MaxWeight) { |
Jakob Stoklund Olesen | 98c8141 | 2011-02-23 00:29:52 +0000 | [diff] [blame] | 342 | float Weight = 0; |
| 343 | for (const unsigned *AliasI = TRI->getOverlaps(PhysReg); *AliasI; ++AliasI) { |
| 344 | LiveIntervalUnion::Query &Q = query(VirtReg, *AliasI); |
| 345 | // If there is 10 or more interferences, chances are one is smaller. |
| 346 | if (Q.collectInterferingVRegs(10) >= 10) |
| 347 | return false; |
| 348 | |
Jakob Stoklund Olesen | d17924b | 2011-03-04 21:32:50 +0000 | [diff] [blame] | 349 | // Check if any interfering live range is heavier than VirtReg. |
Jakob Stoklund Olesen | 98c8141 | 2011-02-23 00:29:52 +0000 | [diff] [blame] | 350 | for (unsigned i = 0, e = Q.interferingVRegs().size(); i != e; ++i) { |
| 351 | LiveInterval *Intf = Q.interferingVRegs()[i]; |
| 352 | if (TargetRegisterInfo::isPhysicalRegister(Intf->reg)) |
| 353 | return false; |
Jakob Stoklund Olesen | d17924b | 2011-03-04 21:32:50 +0000 | [diff] [blame] | 354 | if (Intf->weight >= VirtReg.weight) |
Jakob Stoklund Olesen | 98c8141 | 2011-02-23 00:29:52 +0000 | [diff] [blame] | 355 | return false; |
| 356 | Weight = std::max(Weight, Intf->weight); |
Jakob Stoklund Olesen | 2710638 | 2011-02-09 01:14:03 +0000 | [diff] [blame] | 357 | } |
| 358 | } |
Jakob Stoklund Olesen | 98c8141 | 2011-02-23 00:29:52 +0000 | [diff] [blame] | 359 | MaxWeight = Weight; |
| 360 | return true; |
| 361 | } |
Jakob Stoklund Olesen | 2710638 | 2011-02-09 01:14:03 +0000 | [diff] [blame] | 362 | |
Jakob Stoklund Olesen | 98c8141 | 2011-02-23 00:29:52 +0000 | [diff] [blame] | 363 | /// tryEvict - Try to evict all interferences for a physreg. |
| 364 | /// @param VirtReg Currently unassigned virtual register. |
| 365 | /// @param Order Physregs to try. |
| 366 | /// @return Physreg to assign VirtReg, or 0. |
| 367 | unsigned RAGreedy::tryEvict(LiveInterval &VirtReg, |
| 368 | AllocationOrder &Order, |
| 369 | SmallVectorImpl<LiveInterval*> &NewVRegs){ |
| 370 | NamedRegionTimer T("Evict", TimerGroupName, TimePassesIsEnabled); |
| 371 | |
Jakob Stoklund Olesen | 98c8141 | 2011-02-23 00:29:52 +0000 | [diff] [blame] | 372 | // Keep track of the lightest single interference seen so far. |
| 373 | float BestWeight = 0; |
| 374 | unsigned BestPhys = 0; |
| 375 | |
| 376 | Order.rewind(); |
| 377 | while (unsigned PhysReg = Order.next()) { |
| 378 | float Weight = 0; |
Jakob Stoklund Olesen | d17924b | 2011-03-04 21:32:50 +0000 | [diff] [blame] | 379 | if (!canEvictInterference(VirtReg, PhysReg, Weight)) |
Jakob Stoklund Olesen | 98c8141 | 2011-02-23 00:29:52 +0000 | [diff] [blame] | 380 | continue; |
| 381 | |
| 382 | // This is an eviction candidate. |
| 383 | DEBUG(dbgs() << "max " << PrintReg(PhysReg, TRI) << " interference = " |
| 384 | << Weight << '\n'); |
| 385 | if (BestPhys && Weight >= BestWeight) |
| 386 | continue; |
| 387 | |
| 388 | // Best so far. |
| 389 | BestPhys = PhysReg; |
| 390 | BestWeight = Weight; |
Jakob Stoklund Olesen | 57f1e2c | 2011-02-25 01:04:22 +0000 | [diff] [blame] | 391 | // Stop if the hint can be used. |
| 392 | if (Order.isHint(PhysReg)) |
| 393 | break; |
Jakob Stoklund Olesen | 2710638 | 2011-02-09 01:14:03 +0000 | [diff] [blame] | 394 | } |
| 395 | |
Jakob Stoklund Olesen | 98c8141 | 2011-02-23 00:29:52 +0000 | [diff] [blame] | 396 | if (!BestPhys) |
| 397 | return 0; |
| 398 | |
| 399 | DEBUG(dbgs() << "evicting " << PrintReg(BestPhys, TRI) << " interference\n"); |
| 400 | for (const unsigned *AliasI = TRI->getOverlaps(BestPhys); *AliasI; ++AliasI) { |
| 401 | LiveIntervalUnion::Query &Q = query(VirtReg, *AliasI); |
| 402 | assert(Q.seenAllInterferences() && "Didn't check all interfererences."); |
| 403 | for (unsigned i = 0, e = Q.interferingVRegs().size(); i != e; ++i) { |
| 404 | LiveInterval *Intf = Q.interferingVRegs()[i]; |
| 405 | unassign(*Intf, VRM->getPhys(Intf->reg)); |
| 406 | ++NumEvicted; |
| 407 | NewVRegs.push_back(Intf); |
| 408 | } |
| 409 | } |
| 410 | return BestPhys; |
Andrew Trick | b853e6c | 2010-12-09 18:15:21 +0000 | [diff] [blame] | 411 | } |
| 412 | |
Jakob Stoklund Olesen | 770d42d | 2010-12-22 22:01:30 +0000 | [diff] [blame] | 413 | |
| 414 | //===----------------------------------------------------------------------===// |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 415 | // Region Splitting |
| 416 | //===----------------------------------------------------------------------===// |
| 417 | |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 418 | /// addSplitConstraints - Fill out the SplitConstraints vector based on the |
| 419 | /// interference pattern in Physreg and its aliases. Add the constraints to |
| 420 | /// SpillPlacement and return the static cost of this split in Cost, assuming |
| 421 | /// that all preferences in SplitConstraints are met. |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 422 | /// Return false if there are no bundles with positive bias. |
| 423 | bool RAGreedy::addSplitConstraints(InterferenceCache::Cursor Intf, |
| 424 | float &Cost) { |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 425 | ArrayRef<SplitAnalysis::BlockInfo> UseBlocks = SA->getUseBlocks(); |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 426 | |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 427 | // Reset interference dependent info. |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 428 | SplitConstraints.resize(UseBlocks.size()); |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 429 | float StaticCost = 0; |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 430 | for (unsigned i = 0; i != UseBlocks.size(); ++i) { |
| 431 | const SplitAnalysis::BlockInfo &BI = UseBlocks[i]; |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 432 | SpillPlacement::BlockConstraint &BC = SplitConstraints[i]; |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 433 | |
Jakob Stoklund Olesen | f0ac26c | 2011-02-09 22:50:26 +0000 | [diff] [blame] | 434 | BC.Number = BI.MBB->getNumber(); |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 435 | Intf.moveToBlock(BC.Number); |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 436 | BC.Entry = BI.LiveIn ? SpillPlacement::PrefReg : SpillPlacement::DontCare; |
| 437 | BC.Exit = BI.LiveOut ? SpillPlacement::PrefReg : SpillPlacement::DontCare; |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 438 | |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 439 | if (!Intf.hasInterference()) |
| 440 | continue; |
| 441 | |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 442 | // Number of spill code instructions to insert. |
| 443 | unsigned Ins = 0; |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 444 | |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 445 | // Interference for the live-in value. |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 446 | if (BI.LiveIn) { |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 447 | if (Intf.first() <= Indexes->getMBBStartIdx(BC.Number)) |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 448 | BC.Entry = SpillPlacement::MustSpill, ++Ins; |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 449 | else if (Intf.first() < BI.FirstUse) |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 450 | BC.Entry = SpillPlacement::PrefSpill, ++Ins; |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 451 | else if (Intf.first() < (BI.LiveThrough ? BI.LastUse : BI.Kill)) |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 452 | ++Ins; |
Jakob Stoklund Olesen | a50c539 | 2011-02-08 23:02:58 +0000 | [diff] [blame] | 453 | } |
| 454 | |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 455 | // Interference for the live-out value. |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 456 | if (BI.LiveOut) { |
Jakob Stoklund Olesen | 612f780 | 2011-04-05 04:20:29 +0000 | [diff] [blame] | 457 | if (Intf.last() >= SA->getLastSplitPoint(BC.Number)) |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 458 | BC.Exit = SpillPlacement::MustSpill, ++Ins; |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 459 | else if (Intf.last() > BI.LastUse) |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 460 | BC.Exit = SpillPlacement::PrefSpill, ++Ins; |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 461 | else if (Intf.last() > (BI.LiveThrough ? BI.FirstUse : BI.Def)) |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 462 | ++Ins; |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 463 | } |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 464 | |
| 465 | // Accumulate the total frequency of inserted spill code. |
| 466 | if (Ins) |
| 467 | StaticCost += Ins * SpillPlacer->getBlockFrequency(BC.Number); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 468 | } |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 469 | Cost = StaticCost; |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 470 | |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 471 | // Add constraints for use-blocks. Note that these are the only constraints |
| 472 | // that may add a positive bias, it is downhill from here. |
| 473 | SpillPlacer->addConstraints(SplitConstraints); |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 474 | return SpillPlacer->scanActiveBundles(); |
| 475 | } |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 476 | |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 477 | |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 478 | /// addThroughConstraints - Add constraints and links to SpillPlacer from the |
| 479 | /// live-through blocks in Blocks. |
| 480 | void RAGreedy::addThroughConstraints(InterferenceCache::Cursor Intf, |
| 481 | ArrayRef<unsigned> Blocks) { |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 482 | const unsigned GroupSize = 8; |
| 483 | SpillPlacement::BlockConstraint BCS[GroupSize]; |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 484 | unsigned TBS[GroupSize]; |
| 485 | unsigned B = 0, T = 0; |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 486 | |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 487 | for (unsigned i = 0; i != Blocks.size(); ++i) { |
| 488 | unsigned Number = Blocks[i]; |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 489 | Intf.moveToBlock(Number); |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 490 | |
Jakob Stoklund Olesen | 7b41fbe | 2011-04-07 17:27:46 +0000 | [diff] [blame] | 491 | if (!Intf.hasInterference()) { |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 492 | assert(T < GroupSize && "Array overflow"); |
| 493 | TBS[T] = Number; |
| 494 | if (++T == GroupSize) { |
| 495 | SpillPlacer->addLinks(ArrayRef<unsigned>(TBS, T)); |
| 496 | T = 0; |
| 497 | } |
Jakob Stoklund Olesen | 7b41fbe | 2011-04-07 17:27:46 +0000 | [diff] [blame] | 498 | continue; |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 499 | } |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 500 | |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 501 | assert(B < GroupSize && "Array overflow"); |
| 502 | BCS[B].Number = Number; |
| 503 | |
Jakob Stoklund Olesen | 7b41fbe | 2011-04-07 17:27:46 +0000 | [diff] [blame] | 504 | // Interference for the live-in value. |
| 505 | if (Intf.first() <= Indexes->getMBBStartIdx(Number)) |
| 506 | BCS[B].Entry = SpillPlacement::MustSpill; |
| 507 | else |
| 508 | BCS[B].Entry = SpillPlacement::PrefSpill; |
| 509 | |
| 510 | // Interference for the live-out value. |
| 511 | if (Intf.last() >= SA->getLastSplitPoint(Number)) |
| 512 | BCS[B].Exit = SpillPlacement::MustSpill; |
| 513 | else |
| 514 | BCS[B].Exit = SpillPlacement::PrefSpill; |
| 515 | |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 516 | if (++B == GroupSize) { |
| 517 | ArrayRef<SpillPlacement::BlockConstraint> Array(BCS, B); |
| 518 | SpillPlacer->addConstraints(Array); |
| 519 | B = 0; |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 520 | } |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 521 | } |
| 522 | |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 523 | ArrayRef<SpillPlacement::BlockConstraint> Array(BCS, B); |
| 524 | SpillPlacer->addConstraints(Array); |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 525 | SpillPlacer->addLinks(ArrayRef<unsigned>(TBS, T)); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 526 | } |
| 527 | |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 528 | void RAGreedy::growRegion(InterferenceCache::Cursor Intf) { |
| 529 | // Keep track of through blocks that have already been added to SpillPlacer. |
| 530 | SparseBitVector<> Added; |
| 531 | SmallVector<unsigned, 16> ThroughBlocks; |
| 532 | #ifndef NDEBUG |
| 533 | unsigned Visited = 0; |
| 534 | #endif |
| 535 | for (;;) { |
| 536 | ArrayRef<unsigned> NewBundles = SpillPlacer->getRecentPositive(); |
| 537 | if (NewBundles.empty()) |
| 538 | break; |
| 539 | // Find new through blocks in the periphery of PrefRegBundles. |
| 540 | for (int i = 0, e = NewBundles.size(); i != e; ++i) { |
| 541 | unsigned Bundle = NewBundles[i]; |
| 542 | // Look at all blocks connected to Bundle in the full graph. |
| 543 | ArrayRef<unsigned> Blocks = Bundles->getBlocks(Bundle); |
| 544 | for (ArrayRef<unsigned>::iterator I = Blocks.begin(), E = Blocks.end(); |
| 545 | I != E; ++I) { |
| 546 | unsigned Block = *I; |
| 547 | if (!SA->isThroughBlock(Block) || !Added.test_and_set(Block)) |
| 548 | continue; |
| 549 | // This is a new through block. Add it to SpillPlacer later. |
| 550 | ThroughBlocks.push_back(Block); |
| 551 | #ifndef NDEBUG |
| 552 | ++Visited; |
| 553 | #endif |
| 554 | } |
| 555 | } |
| 556 | // Any new blocks to add? |
| 557 | if (!ThroughBlocks.empty()) { |
| 558 | addThroughConstraints(Intf, ThroughBlocks); |
| 559 | ThroughBlocks.clear(); |
| 560 | } |
| 561 | // Perhaps iterating can enable more bundles? |
| 562 | SpillPlacer->iterate(); |
| 563 | } |
| 564 | |
| 565 | // Rememeber the relevant set of through blocks for splitAroundRegion(). |
| 566 | ActiveThroughBlocks |= Added; |
| 567 | DEBUG(dbgs() << ", v=" << Visited); |
| 568 | } |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 569 | |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 570 | /// calcGlobalSplitCost - Return the global split cost of following the split |
| 571 | /// pattern in LiveBundles. This cost should be added to the local cost of the |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 572 | /// interference pattern in SplitConstraints. |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 573 | /// |
Jakob Stoklund Olesen | 9a54352 | 2011-04-06 21:32:41 +0000 | [diff] [blame] | 574 | float RAGreedy::calcGlobalSplitCost(unsigned PhysReg, |
| 575 | const BitVector &LiveBundles) { |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 576 | float GlobalCost = 0; |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 577 | ArrayRef<SplitAnalysis::BlockInfo> UseBlocks = SA->getUseBlocks(); |
| 578 | for (unsigned i = 0; i != UseBlocks.size(); ++i) { |
| 579 | const SplitAnalysis::BlockInfo &BI = UseBlocks[i]; |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 580 | SpillPlacement::BlockConstraint &BC = SplitConstraints[i]; |
Jakob Stoklund Olesen | 874be74 | 2011-03-05 03:28:51 +0000 | [diff] [blame] | 581 | bool RegIn = LiveBundles[Bundles->getBundle(BC.Number, 0)]; |
| 582 | bool RegOut = LiveBundles[Bundles->getBundle(BC.Number, 1)]; |
| 583 | unsigned Ins = 0; |
| 584 | |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 585 | if (BI.LiveIn) |
| 586 | Ins += RegIn != (BC.Entry == SpillPlacement::PrefReg); |
| 587 | if (BI.LiveOut) |
| 588 | Ins += RegOut != (BC.Exit == SpillPlacement::PrefReg); |
Jakob Stoklund Olesen | 874be74 | 2011-03-05 03:28:51 +0000 | [diff] [blame] | 589 | if (Ins) |
| 590 | GlobalCost += Ins * SpillPlacer->getBlockFrequency(BC.Number); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 591 | } |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 592 | |
Jakob Stoklund Olesen | 9a54352 | 2011-04-06 21:32:41 +0000 | [diff] [blame] | 593 | InterferenceCache::Cursor Intf(IntfCache, PhysReg); |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 594 | for (SparseBitVector<>::iterator I = ActiveThroughBlocks.begin(), |
| 595 | E = ActiveThroughBlocks.end(); I != E; ++I) { |
| 596 | unsigned Number = *I; |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 597 | bool RegIn = LiveBundles[Bundles->getBundle(Number, 0)]; |
| 598 | bool RegOut = LiveBundles[Bundles->getBundle(Number, 1)]; |
Jakob Stoklund Olesen | 9a54352 | 2011-04-06 21:32:41 +0000 | [diff] [blame] | 599 | if (!RegIn && !RegOut) |
| 600 | continue; |
| 601 | if (RegIn && RegOut) { |
| 602 | // We need double spill code if this block has interference. |
| 603 | Intf.moveToBlock(Number); |
| 604 | if (Intf.hasInterference()) |
| 605 | GlobalCost += 2*SpillPlacer->getBlockFrequency(Number); |
| 606 | continue; |
| 607 | } |
| 608 | // live-in / stack-out or stack-in live-out. |
| 609 | GlobalCost += SpillPlacer->getBlockFrequency(Number); |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 610 | } |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 611 | return GlobalCost; |
| 612 | } |
| 613 | |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 614 | /// splitAroundRegion - Split VirtReg around the region determined by |
| 615 | /// LiveBundles. Make an effort to avoid interference from PhysReg. |
| 616 | /// |
| 617 | /// The 'register' interval is going to contain as many uses as possible while |
| 618 | /// avoiding interference. The 'stack' interval is the complement constructed by |
| 619 | /// SplitEditor. It will contain the rest. |
| 620 | /// |
| 621 | void RAGreedy::splitAroundRegion(LiveInterval &VirtReg, unsigned PhysReg, |
| 622 | const BitVector &LiveBundles, |
| 623 | SmallVectorImpl<LiveInterval*> &NewVRegs) { |
| 624 | DEBUG({ |
| 625 | dbgs() << "Splitting around region for " << PrintReg(PhysReg, TRI) |
| 626 | << " with bundles"; |
| 627 | for (int i = LiveBundles.find_first(); i>=0; i = LiveBundles.find_next(i)) |
| 628 | dbgs() << " EB#" << i; |
| 629 | dbgs() << ".\n"; |
| 630 | }); |
| 631 | |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 632 | InterferenceCache::Cursor Intf(IntfCache, PhysReg); |
Jakob Stoklund Olesen | 92a55f4 | 2011-03-09 00:57:29 +0000 | [diff] [blame] | 633 | LiveRangeEdit LREdit(VirtReg, NewVRegs, this); |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 634 | SE->reset(LREdit); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 635 | |
| 636 | // Create the main cross-block interval. |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 637 | SE->openIntv(); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 638 | |
| 639 | // First add all defs that are live out of a block. |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 640 | ArrayRef<SplitAnalysis::BlockInfo> UseBlocks = SA->getUseBlocks(); |
| 641 | for (unsigned i = 0; i != UseBlocks.size(); ++i) { |
| 642 | const SplitAnalysis::BlockInfo &BI = UseBlocks[i]; |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 643 | bool RegIn = LiveBundles[Bundles->getBundle(BI.MBB->getNumber(), 0)]; |
| 644 | bool RegOut = LiveBundles[Bundles->getBundle(BI.MBB->getNumber(), 1)]; |
| 645 | |
| 646 | // Should the register be live out? |
| 647 | if (!BI.LiveOut || !RegOut) |
| 648 | continue; |
| 649 | |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 650 | SlotIndex Start, Stop; |
| 651 | tie(Start, Stop) = Indexes->getMBBRange(BI.MBB); |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 652 | Intf.moveToBlock(BI.MBB->getNumber()); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 653 | DEBUG(dbgs() << "BB#" << BI.MBB->getNumber() << " -> EB#" |
Jakob Stoklund Olesen | 2dfbb3e | 2011-02-03 20:29:43 +0000 | [diff] [blame] | 654 | << Bundles->getBundle(BI.MBB->getNumber(), 1) |
Jakob Stoklund Olesen | 612f780 | 2011-04-05 04:20:29 +0000 | [diff] [blame] | 655 | << " [" << Start << ';' |
| 656 | << SA->getLastSplitPoint(BI.MBB->getNumber()) << '-' << Stop |
| 657 | << ") intf [" << Intf.first() << ';' << Intf.last() << ')'); |
Jakob Stoklund Olesen | 2dfbb3e | 2011-02-03 20:29:43 +0000 | [diff] [blame] | 658 | |
| 659 | // The interference interval should either be invalid or overlap MBB. |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 660 | assert((!Intf.hasInterference() || Intf.first() < Stop) |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 661 | && "Bad interference"); |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 662 | assert((!Intf.hasInterference() || Intf.last() > Start) |
Jakob Stoklund Olesen | 36d6186 | 2011-03-03 03:41:29 +0000 | [diff] [blame] | 663 | && "Bad interference"); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 664 | |
| 665 | // Check interference leaving the block. |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 666 | if (!Intf.hasInterference()) { |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 667 | // Block is interference-free. |
| 668 | DEBUG(dbgs() << ", no interference"); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 669 | if (!BI.LiveThrough) { |
| 670 | DEBUG(dbgs() << ", not live-through.\n"); |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 671 | SE->useIntv(SE->enterIntvBefore(BI.Def), Stop); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 672 | continue; |
| 673 | } |
| 674 | if (!RegIn) { |
| 675 | // Block is live-through, but entry bundle is on the stack. |
| 676 | // Reload just before the first use. |
| 677 | DEBUG(dbgs() << ", not live-in, enter before first use.\n"); |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 678 | SE->useIntv(SE->enterIntvBefore(BI.FirstUse), Stop); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 679 | continue; |
| 680 | } |
| 681 | DEBUG(dbgs() << ", live-through.\n"); |
| 682 | continue; |
| 683 | } |
| 684 | |
| 685 | // Block has interference. |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 686 | DEBUG(dbgs() << ", interference to " << Intf.last()); |
Jakob Stoklund Olesen | fe3f99f | 2011-02-05 01:06:39 +0000 | [diff] [blame] | 687 | |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 688 | if (!BI.LiveThrough && Intf.last() <= BI.Def) { |
Jakob Stoklund Olesen | fe3f99f | 2011-02-05 01:06:39 +0000 | [diff] [blame] | 689 | // The interference doesn't reach the outgoing segment. |
| 690 | DEBUG(dbgs() << " doesn't affect def from " << BI.Def << '\n'); |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 691 | SE->useIntv(BI.Def, Stop); |
Jakob Stoklund Olesen | fe3f99f | 2011-02-05 01:06:39 +0000 | [diff] [blame] | 692 | continue; |
| 693 | } |
| 694 | |
Jakob Stoklund Olesen | 612f780 | 2011-04-05 04:20:29 +0000 | [diff] [blame] | 695 | SlotIndex LastSplitPoint = SA->getLastSplitPoint(BI.MBB->getNumber()); |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 696 | if (Intf.last().getBoundaryIndex() < BI.LastUse) { |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 697 | // There are interference-free uses at the end of the block. |
| 698 | // Find the first use that can get the live-out register. |
Jakob Stoklund Olesen | c0de995 | 2011-01-20 17:45:23 +0000 | [diff] [blame] | 699 | SmallVectorImpl<SlotIndex>::const_iterator UI = |
Jakob Stoklund Olesen | fe3f99f | 2011-02-05 01:06:39 +0000 | [diff] [blame] | 700 | std::lower_bound(SA->UseSlots.begin(), SA->UseSlots.end(), |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 701 | Intf.last().getBoundaryIndex()); |
Jakob Stoklund Olesen | c0de995 | 2011-01-20 17:45:23 +0000 | [diff] [blame] | 702 | assert(UI != SA->UseSlots.end() && "Couldn't find last use"); |
| 703 | SlotIndex Use = *UI; |
Jakob Stoklund Olesen | c0de995 | 2011-01-20 17:45:23 +0000 | [diff] [blame] | 704 | assert(Use <= BI.LastUse && "Couldn't find last use"); |
Jakob Stoklund Olesen | 8a2bbde | 2011-02-08 23:26:48 +0000 | [diff] [blame] | 705 | // Only attempt a split befroe the last split point. |
Jakob Stoklund Olesen | 612f780 | 2011-04-05 04:20:29 +0000 | [diff] [blame] | 706 | if (Use.getBaseIndex() <= LastSplitPoint) { |
Jakob Stoklund Olesen | 8a2bbde | 2011-02-08 23:26:48 +0000 | [diff] [blame] | 707 | DEBUG(dbgs() << ", free use at " << Use << ".\n"); |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 708 | SlotIndex SegStart = SE->enterIntvBefore(Use); |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 709 | assert(SegStart >= Intf.last() && "Couldn't avoid interference"); |
Jakob Stoklund Olesen | 612f780 | 2011-04-05 04:20:29 +0000 | [diff] [blame] | 710 | assert(SegStart < LastSplitPoint && "Impossible split point"); |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 711 | SE->useIntv(SegStart, Stop); |
Jakob Stoklund Olesen | 8a2bbde | 2011-02-08 23:26:48 +0000 | [diff] [blame] | 712 | continue; |
| 713 | } |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 714 | } |
| 715 | |
| 716 | // Interference is after the last use. |
| 717 | DEBUG(dbgs() << " after last use.\n"); |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 718 | SlotIndex SegStart = SE->enterIntvAtEnd(*BI.MBB); |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 719 | assert(SegStart >= Intf.last() && "Couldn't avoid interference"); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 720 | } |
| 721 | |
| 722 | // Now all defs leading to live bundles are handled, do everything else. |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 723 | for (unsigned i = 0; i != UseBlocks.size(); ++i) { |
| 724 | const SplitAnalysis::BlockInfo &BI = UseBlocks[i]; |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 725 | bool RegIn = LiveBundles[Bundles->getBundle(BI.MBB->getNumber(), 0)]; |
| 726 | bool RegOut = LiveBundles[Bundles->getBundle(BI.MBB->getNumber(), 1)]; |
| 727 | |
| 728 | // Is the register live-in? |
| 729 | if (!BI.LiveIn || !RegIn) |
| 730 | continue; |
| 731 | |
| 732 | // We have an incoming register. Check for interference. |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 733 | SlotIndex Start, Stop; |
| 734 | tie(Start, Stop) = Indexes->getMBBRange(BI.MBB); |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 735 | Intf.moveToBlock(BI.MBB->getNumber()); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 736 | DEBUG(dbgs() << "EB#" << Bundles->getBundle(BI.MBB->getNumber(), 0) |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 737 | << " -> BB#" << BI.MBB->getNumber() << " [" << Start << ';' |
Jakob Stoklund Olesen | 612f780 | 2011-04-05 04:20:29 +0000 | [diff] [blame] | 738 | << SA->getLastSplitPoint(BI.MBB->getNumber()) << '-' << Stop |
| 739 | << ')'); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 740 | |
| 741 | // Check interference entering the block. |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 742 | if (!Intf.hasInterference()) { |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 743 | // Block is interference-free. |
| 744 | DEBUG(dbgs() << ", no interference"); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 745 | if (!BI.LiveThrough) { |
| 746 | DEBUG(dbgs() << ", killed in block.\n"); |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 747 | SE->useIntv(Start, SE->leaveIntvAfter(BI.Kill)); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 748 | continue; |
| 749 | } |
| 750 | if (!RegOut) { |
Jakob Stoklund Olesen | 612f780 | 2011-04-05 04:20:29 +0000 | [diff] [blame] | 751 | SlotIndex LastSplitPoint = SA->getLastSplitPoint(BI.MBB->getNumber()); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 752 | // Block is live-through, but exit bundle is on the stack. |
| 753 | // Spill immediately after the last use. |
Jakob Stoklund Olesen | 612f780 | 2011-04-05 04:20:29 +0000 | [diff] [blame] | 754 | if (BI.LastUse < LastSplitPoint) { |
Jakob Stoklund Olesen | 5c716bd | 2011-02-08 18:50:21 +0000 | [diff] [blame] | 755 | DEBUG(dbgs() << ", uses, stack-out.\n"); |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 756 | SE->useIntv(Start, SE->leaveIntvAfter(BI.LastUse)); |
Jakob Stoklund Olesen | 5c716bd | 2011-02-08 18:50:21 +0000 | [diff] [blame] | 757 | continue; |
| 758 | } |
| 759 | // The last use is after the last split point, it is probably an |
| 760 | // indirect jump. |
| 761 | DEBUG(dbgs() << ", uses at " << BI.LastUse << " after split point " |
Jakob Stoklund Olesen | 612f780 | 2011-04-05 04:20:29 +0000 | [diff] [blame] | 762 | << LastSplitPoint << ", stack-out.\n"); |
| 763 | SlotIndex SegEnd = SE->leaveIntvBefore(LastSplitPoint); |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 764 | SE->useIntv(Start, SegEnd); |
Jakob Stoklund Olesen | 5c716bd | 2011-02-08 18:50:21 +0000 | [diff] [blame] | 765 | // Run a double interval from the split to the last use. |
| 766 | // This makes it possible to spill the complement without affecting the |
| 767 | // indirect branch. |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 768 | SE->overlapIntv(SegEnd, BI.LastUse); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 769 | continue; |
| 770 | } |
| 771 | // Register is live-through. |
| 772 | DEBUG(dbgs() << ", uses, live-through.\n"); |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 773 | SE->useIntv(Start, Stop); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 774 | continue; |
| 775 | } |
| 776 | |
| 777 | // Block has interference. |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 778 | DEBUG(dbgs() << ", interference from " << Intf.first()); |
Jakob Stoklund Olesen | fe3f99f | 2011-02-05 01:06:39 +0000 | [diff] [blame] | 779 | |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 780 | if (!BI.LiveThrough && Intf.first() >= BI.Kill) { |
Jakob Stoklund Olesen | fe3f99f | 2011-02-05 01:06:39 +0000 | [diff] [blame] | 781 | // The interference doesn't reach the outgoing segment. |
| 782 | DEBUG(dbgs() << " doesn't affect kill at " << BI.Kill << '\n'); |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 783 | SE->useIntv(Start, BI.Kill); |
Jakob Stoklund Olesen | fe3f99f | 2011-02-05 01:06:39 +0000 | [diff] [blame] | 784 | continue; |
| 785 | } |
| 786 | |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 787 | if (Intf.first().getBaseIndex() > BI.FirstUse) { |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 788 | // There are interference-free uses at the beginning of the block. |
| 789 | // Find the last use that can get the register. |
Jakob Stoklund Olesen | c0de995 | 2011-01-20 17:45:23 +0000 | [diff] [blame] | 790 | SmallVectorImpl<SlotIndex>::const_iterator UI = |
Jakob Stoklund Olesen | fe3f99f | 2011-02-05 01:06:39 +0000 | [diff] [blame] | 791 | std::lower_bound(SA->UseSlots.begin(), SA->UseSlots.end(), |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 792 | Intf.first().getBaseIndex()); |
Jakob Stoklund Olesen | c0de995 | 2011-01-20 17:45:23 +0000 | [diff] [blame] | 793 | assert(UI != SA->UseSlots.begin() && "Couldn't find first use"); |
| 794 | SlotIndex Use = (--UI)->getBoundaryIndex(); |
| 795 | DEBUG(dbgs() << ", free use at " << *UI << ".\n"); |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 796 | SlotIndex SegEnd = SE->leaveIntvAfter(Use); |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 797 | assert(SegEnd <= Intf.first() && "Couldn't avoid interference"); |
Jakob Stoklund Olesen | 6c8afd7 | 2011-04-04 15:32:15 +0000 | [diff] [blame] | 798 | SE->useIntv(Start, SegEnd); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 799 | continue; |
| 800 | } |
| 801 | |
| 802 | // Interference is before the first use. |
| 803 | DEBUG(dbgs() << " before first use.\n"); |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 804 | SlotIndex SegEnd = SE->leaveIntvAtTop(*BI.MBB); |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 805 | assert(SegEnd <= Intf.first() && "Couldn't avoid interference"); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 806 | } |
| 807 | |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 808 | // Handle live-through blocks. |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 809 | for (SparseBitVector<>::iterator I = ActiveThroughBlocks.begin(), |
| 810 | E = ActiveThroughBlocks.end(); I != E; ++I) { |
| 811 | unsigned Number = *I; |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 812 | bool RegIn = LiveBundles[Bundles->getBundle(Number, 0)]; |
| 813 | bool RegOut = LiveBundles[Bundles->getBundle(Number, 1)]; |
| 814 | DEBUG(dbgs() << "Live through BB#" << Number << '\n'); |
| 815 | if (RegIn && RegOut) { |
| 816 | Intf.moveToBlock(Number); |
| 817 | if (!Intf.hasInterference()) { |
| 818 | SE->useIntv(Indexes->getMBBStartIdx(Number), |
| 819 | Indexes->getMBBEndIdx(Number)); |
| 820 | continue; |
| 821 | } |
| 822 | } |
| 823 | MachineBasicBlock *MBB = MF->getBlockNumbered(Number); |
| 824 | if (RegIn) |
| 825 | SE->leaveIntvAtTop(*MBB); |
| 826 | if (RegOut) |
| 827 | SE->enterIntvAtEnd(*MBB); |
| 828 | } |
| 829 | |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 830 | SE->closeIntv(); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 831 | |
| 832 | // FIXME: Should we be more aggressive about splitting the stack region into |
| 833 | // per-block segments? The current approach allows the stack region to |
| 834 | // separate into connected components. Some components may be allocatable. |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 835 | SE->finish(); |
Jakob Stoklund Olesen | 0db841f | 2011-02-17 22:53:48 +0000 | [diff] [blame] | 836 | ++NumGlobalSplits; |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 837 | |
Jakob Stoklund Olesen | eb29157 | 2011-03-27 22:49:21 +0000 | [diff] [blame] | 838 | if (VerifyEnabled) |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 839 | MF->verify(this, "After splitting live range around region"); |
| 840 | } |
| 841 | |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 842 | unsigned RAGreedy::tryRegionSplit(LiveInterval &VirtReg, AllocationOrder &Order, |
| 843 | SmallVectorImpl<LiveInterval*> &NewVRegs) { |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 844 | BitVector LiveBundles, BestBundles; |
| 845 | float BestCost = 0; |
| 846 | unsigned BestReg = 0; |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 847 | ActiveThroughBlocks.clear(); |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 848 | |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 849 | Order.rewind(); |
Jakob Stoklund Olesen | 96dcd95 | 2011-03-05 01:10:31 +0000 | [diff] [blame] | 850 | for (unsigned Cand = 0; unsigned PhysReg = Order.next(); ++Cand) { |
| 851 | if (GlobalCand.size() <= Cand) |
| 852 | GlobalCand.resize(Cand+1); |
| 853 | GlobalCand[Cand].PhysReg = PhysReg; |
| 854 | |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 855 | SpillPlacer->prepare(LiveBundles); |
| 856 | float Cost; |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 857 | InterferenceCache::Cursor Intf(IntfCache, PhysReg); |
| 858 | if (!addSplitConstraints(Intf, Cost)) { |
| 859 | DEBUG(dbgs() << PrintReg(PhysReg, TRI) << "\tno positive bundles\n"); |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 860 | continue; |
| 861 | } |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 862 | DEBUG(dbgs() << PrintReg(PhysReg, TRI) << "\tstatic = " << Cost); |
Jakob Stoklund Olesen | 874be74 | 2011-03-05 03:28:51 +0000 | [diff] [blame] | 863 | if (BestReg && Cost >= BestCost) { |
Jakob Stoklund Olesen | 1b400e8 | 2011-04-06 21:32:38 +0000 | [diff] [blame] | 864 | DEBUG(dbgs() << " worse than " << PrintReg(BestReg, TRI) << '\n'); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 865 | continue; |
Jakob Stoklund Olesen | 874be74 | 2011-03-05 03:28:51 +0000 | [diff] [blame] | 866 | } |
Jakob Stoklund Olesen | f4afdfc | 2011-04-09 02:59:09 +0000 | [diff] [blame^] | 867 | growRegion(Intf); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 868 | |
Jakob Stoklund Olesen | 9efa2a2 | 2011-04-06 19:13:57 +0000 | [diff] [blame] | 869 | SpillPlacer->finish(); |
| 870 | |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 871 | // No live bundles, defer to splitSingleBlocks(). |
Jakob Stoklund Olesen | 874be74 | 2011-03-05 03:28:51 +0000 | [diff] [blame] | 872 | if (!LiveBundles.any()) { |
| 873 | DEBUG(dbgs() << " no bundles.\n"); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 874 | continue; |
Jakob Stoklund Olesen | 874be74 | 2011-03-05 03:28:51 +0000 | [diff] [blame] | 875 | } |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 876 | |
Jakob Stoklund Olesen | 9a54352 | 2011-04-06 21:32:41 +0000 | [diff] [blame] | 877 | Cost += calcGlobalSplitCost(PhysReg, LiveBundles); |
Jakob Stoklund Olesen | 874be74 | 2011-03-05 03:28:51 +0000 | [diff] [blame] | 878 | DEBUG({ |
| 879 | dbgs() << ", total = " << Cost << " with bundles"; |
| 880 | for (int i = LiveBundles.find_first(); i>=0; i = LiveBundles.find_next(i)) |
| 881 | dbgs() << " EB#" << i; |
| 882 | dbgs() << ".\n"; |
| 883 | }); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 884 | if (!BestReg || Cost < BestCost) { |
| 885 | BestReg = PhysReg; |
Jakob Stoklund Olesen | 874be74 | 2011-03-05 03:28:51 +0000 | [diff] [blame] | 886 | BestCost = 0.98f * Cost; // Prevent rounding effects. |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 887 | BestBundles.swap(LiveBundles); |
| 888 | } |
| 889 | } |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 890 | |
| 891 | if (!BestReg) |
| 892 | return 0; |
| 893 | |
| 894 | splitAroundRegion(VirtReg, BestReg, BestBundles, NewVRegs); |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 895 | setStage(NewVRegs.begin(), NewVRegs.end(), RS_Region); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 896 | return 0; |
| 897 | } |
| 898 | |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 899 | |
| 900 | //===----------------------------------------------------------------------===// |
Jakob Stoklund Olesen | 034a80d | 2011-02-17 19:13:53 +0000 | [diff] [blame] | 901 | // Local Splitting |
| 902 | //===----------------------------------------------------------------------===// |
| 903 | |
| 904 | |
| 905 | /// calcGapWeights - Compute the maximum spill weight that needs to be evicted |
| 906 | /// in order to use PhysReg between two entries in SA->UseSlots. |
| 907 | /// |
| 908 | /// GapWeight[i] represents the gap between UseSlots[i] and UseSlots[i+1]. |
| 909 | /// |
| 910 | void RAGreedy::calcGapWeights(unsigned PhysReg, |
| 911 | SmallVectorImpl<float> &GapWeight) { |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 912 | assert(SA->getUseBlocks().size() == 1 && "Not a local interval"); |
| 913 | const SplitAnalysis::BlockInfo &BI = SA->getUseBlocks().front(); |
Jakob Stoklund Olesen | 034a80d | 2011-02-17 19:13:53 +0000 | [diff] [blame] | 914 | const SmallVectorImpl<SlotIndex> &Uses = SA->UseSlots; |
| 915 | const unsigned NumGaps = Uses.size()-1; |
| 916 | |
| 917 | // Start and end points for the interference check. |
| 918 | SlotIndex StartIdx = BI.LiveIn ? BI.FirstUse.getBaseIndex() : BI.FirstUse; |
| 919 | SlotIndex StopIdx = BI.LiveOut ? BI.LastUse.getBoundaryIndex() : BI.LastUse; |
| 920 | |
| 921 | GapWeight.assign(NumGaps, 0.0f); |
| 922 | |
| 923 | // Add interference from each overlapping register. |
| 924 | for (const unsigned *AI = TRI->getOverlaps(PhysReg); *AI; ++AI) { |
| 925 | if (!query(const_cast<LiveInterval&>(SA->getParent()), *AI) |
| 926 | .checkInterference()) |
| 927 | continue; |
| 928 | |
| 929 | // We know that VirtReg is a continuous interval from FirstUse to LastUse, |
| 930 | // so we don't need InterferenceQuery. |
| 931 | // |
| 932 | // Interference that overlaps an instruction is counted in both gaps |
| 933 | // surrounding the instruction. The exception is interference before |
| 934 | // StartIdx and after StopIdx. |
| 935 | // |
| 936 | LiveIntervalUnion::SegmentIter IntI = PhysReg2LiveUnion[*AI].find(StartIdx); |
| 937 | for (unsigned Gap = 0; IntI.valid() && IntI.start() < StopIdx; ++IntI) { |
| 938 | // Skip the gaps before IntI. |
| 939 | while (Uses[Gap+1].getBoundaryIndex() < IntI.start()) |
| 940 | if (++Gap == NumGaps) |
| 941 | break; |
| 942 | if (Gap == NumGaps) |
| 943 | break; |
| 944 | |
| 945 | // Update the gaps covered by IntI. |
| 946 | const float weight = IntI.value()->weight; |
| 947 | for (; Gap != NumGaps; ++Gap) { |
| 948 | GapWeight[Gap] = std::max(GapWeight[Gap], weight); |
| 949 | if (Uses[Gap+1].getBaseIndex() >= IntI.stop()) |
| 950 | break; |
| 951 | } |
| 952 | if (Gap == NumGaps) |
| 953 | break; |
| 954 | } |
| 955 | } |
| 956 | } |
| 957 | |
| 958 | /// getPrevMappedIndex - Return the slot index of the last non-copy instruction |
| 959 | /// before MI that has a slot index. If MI is the first mapped instruction in |
| 960 | /// its block, return the block start index instead. |
| 961 | /// |
| 962 | SlotIndex RAGreedy::getPrevMappedIndex(const MachineInstr *MI) { |
| 963 | assert(MI && "Missing MachineInstr"); |
| 964 | const MachineBasicBlock *MBB = MI->getParent(); |
| 965 | MachineBasicBlock::const_iterator B = MBB->begin(), I = MI; |
| 966 | while (I != B) |
| 967 | if (!(--I)->isDebugValue() && !I->isCopy()) |
| 968 | return Indexes->getInstructionIndex(I); |
| 969 | return Indexes->getMBBStartIdx(MBB); |
| 970 | } |
| 971 | |
| 972 | /// calcPrevSlots - Fill in the PrevSlot array with the index of the previous |
| 973 | /// real non-copy instruction for each instruction in SA->UseSlots. |
| 974 | /// |
| 975 | void RAGreedy::calcPrevSlots() { |
| 976 | const SmallVectorImpl<SlotIndex> &Uses = SA->UseSlots; |
| 977 | PrevSlot.clear(); |
| 978 | PrevSlot.reserve(Uses.size()); |
| 979 | for (unsigned i = 0, e = Uses.size(); i != e; ++i) { |
| 980 | const MachineInstr *MI = Indexes->getInstructionFromIndex(Uses[i]); |
| 981 | PrevSlot.push_back(getPrevMappedIndex(MI).getDefIndex()); |
| 982 | } |
| 983 | } |
| 984 | |
| 985 | /// nextSplitPoint - Find the next index into SA->UseSlots > i such that it may |
| 986 | /// be beneficial to split before UseSlots[i]. |
| 987 | /// |
| 988 | /// 0 is always a valid split point |
| 989 | unsigned RAGreedy::nextSplitPoint(unsigned i) { |
| 990 | const SmallVectorImpl<SlotIndex> &Uses = SA->UseSlots; |
| 991 | const unsigned Size = Uses.size(); |
| 992 | assert(i != Size && "No split points after the end"); |
| 993 | // Allow split before i when Uses[i] is not adjacent to the previous use. |
| 994 | while (++i != Size && PrevSlot[i].getBaseIndex() <= Uses[i-1].getBaseIndex()) |
| 995 | ; |
| 996 | return i; |
| 997 | } |
| 998 | |
| 999 | /// tryLocalSplit - Try to split VirtReg into smaller intervals inside its only |
| 1000 | /// basic block. |
| 1001 | /// |
| 1002 | unsigned RAGreedy::tryLocalSplit(LiveInterval &VirtReg, AllocationOrder &Order, |
| 1003 | SmallVectorImpl<LiveInterval*> &NewVRegs) { |
Jakob Stoklund Olesen | db529a8 | 2011-04-06 03:57:00 +0000 | [diff] [blame] | 1004 | assert(SA->getUseBlocks().size() == 1 && "Not a local interval"); |
| 1005 | const SplitAnalysis::BlockInfo &BI = SA->getUseBlocks().front(); |
Jakob Stoklund Olesen | 034a80d | 2011-02-17 19:13:53 +0000 | [diff] [blame] | 1006 | |
| 1007 | // Note that it is possible to have an interval that is live-in or live-out |
| 1008 | // while only covering a single block - A phi-def can use undef values from |
| 1009 | // predecessors, and the block could be a single-block loop. |
| 1010 | // We don't bother doing anything clever about such a case, we simply assume |
| 1011 | // that the interval is continuous from FirstUse to LastUse. We should make |
| 1012 | // sure that we don't do anything illegal to such an interval, though. |
| 1013 | |
| 1014 | const SmallVectorImpl<SlotIndex> &Uses = SA->UseSlots; |
| 1015 | if (Uses.size() <= 2) |
| 1016 | return 0; |
| 1017 | const unsigned NumGaps = Uses.size()-1; |
| 1018 | |
| 1019 | DEBUG({ |
| 1020 | dbgs() << "tryLocalSplit: "; |
| 1021 | for (unsigned i = 0, e = Uses.size(); i != e; ++i) |
| 1022 | dbgs() << ' ' << SA->UseSlots[i]; |
| 1023 | dbgs() << '\n'; |
| 1024 | }); |
| 1025 | |
| 1026 | // For every use, find the previous mapped non-copy instruction. |
| 1027 | // We use this to detect valid split points, and to estimate new interval |
| 1028 | // sizes. |
| 1029 | calcPrevSlots(); |
| 1030 | |
| 1031 | unsigned BestBefore = NumGaps; |
| 1032 | unsigned BestAfter = 0; |
| 1033 | float BestDiff = 0; |
| 1034 | |
Jakob Stoklund Olesen | 40a42a2 | 2011-03-04 00:58:40 +0000 | [diff] [blame] | 1035 | const float blockFreq = SpillPlacer->getBlockFrequency(BI.MBB->getNumber()); |
Jakob Stoklund Olesen | 034a80d | 2011-02-17 19:13:53 +0000 | [diff] [blame] | 1036 | SmallVector<float, 8> GapWeight; |
| 1037 | |
| 1038 | Order.rewind(); |
| 1039 | while (unsigned PhysReg = Order.next()) { |
| 1040 | // Keep track of the largest spill weight that would need to be evicted in |
| 1041 | // order to make use of PhysReg between UseSlots[i] and UseSlots[i+1]. |
| 1042 | calcGapWeights(PhysReg, GapWeight); |
| 1043 | |
| 1044 | // Try to find the best sequence of gaps to close. |
| 1045 | // The new spill weight must be larger than any gap interference. |
| 1046 | |
| 1047 | // We will split before Uses[SplitBefore] and after Uses[SplitAfter]. |
| 1048 | unsigned SplitBefore = 0, SplitAfter = nextSplitPoint(1) - 1; |
| 1049 | |
| 1050 | // MaxGap should always be max(GapWeight[SplitBefore..SplitAfter-1]). |
| 1051 | // It is the spill weight that needs to be evicted. |
| 1052 | float MaxGap = GapWeight[0]; |
| 1053 | for (unsigned i = 1; i != SplitAfter; ++i) |
| 1054 | MaxGap = std::max(MaxGap, GapWeight[i]); |
| 1055 | |
| 1056 | for (;;) { |
| 1057 | // Live before/after split? |
| 1058 | const bool LiveBefore = SplitBefore != 0 || BI.LiveIn; |
| 1059 | const bool LiveAfter = SplitAfter != NumGaps || BI.LiveOut; |
| 1060 | |
| 1061 | DEBUG(dbgs() << PrintReg(PhysReg, TRI) << ' ' |
| 1062 | << Uses[SplitBefore] << '-' << Uses[SplitAfter] |
| 1063 | << " i=" << MaxGap); |
| 1064 | |
| 1065 | // Stop before the interval gets so big we wouldn't be making progress. |
| 1066 | if (!LiveBefore && !LiveAfter) { |
| 1067 | DEBUG(dbgs() << " all\n"); |
| 1068 | break; |
| 1069 | } |
| 1070 | // Should the interval be extended or shrunk? |
| 1071 | bool Shrink = true; |
| 1072 | if (MaxGap < HUGE_VALF) { |
| 1073 | // Estimate the new spill weight. |
| 1074 | // |
| 1075 | // Each instruction reads and writes the register, except the first |
| 1076 | // instr doesn't read when !FirstLive, and the last instr doesn't write |
| 1077 | // when !LastLive. |
| 1078 | // |
| 1079 | // We will be inserting copies before and after, so the total number of |
| 1080 | // reads and writes is 2 * EstUses. |
| 1081 | // |
| 1082 | const unsigned EstUses = 2*(SplitAfter - SplitBefore) + |
| 1083 | 2*(LiveBefore + LiveAfter); |
| 1084 | |
| 1085 | // Try to guess the size of the new interval. This should be trivial, |
| 1086 | // but the slot index of an inserted copy can be a lot smaller than the |
| 1087 | // instruction it is inserted before if there are many dead indexes |
| 1088 | // between them. |
| 1089 | // |
| 1090 | // We measure the distance from the instruction before SplitBefore to |
| 1091 | // get a conservative estimate. |
| 1092 | // |
| 1093 | // The final distance can still be different if inserting copies |
| 1094 | // triggers a slot index renumbering. |
| 1095 | // |
| 1096 | const float EstWeight = normalizeSpillWeight(blockFreq * EstUses, |
| 1097 | PrevSlot[SplitBefore].distance(Uses[SplitAfter])); |
| 1098 | // Would this split be possible to allocate? |
| 1099 | // Never allocate all gaps, we wouldn't be making progress. |
| 1100 | float Diff = EstWeight - MaxGap; |
| 1101 | DEBUG(dbgs() << " w=" << EstWeight << " d=" << Diff); |
| 1102 | if (Diff > 0) { |
| 1103 | Shrink = false; |
| 1104 | if (Diff > BestDiff) { |
| 1105 | DEBUG(dbgs() << " (best)"); |
| 1106 | BestDiff = Diff; |
| 1107 | BestBefore = SplitBefore; |
| 1108 | BestAfter = SplitAfter; |
| 1109 | } |
| 1110 | } |
| 1111 | } |
| 1112 | |
| 1113 | // Try to shrink. |
| 1114 | if (Shrink) { |
| 1115 | SplitBefore = nextSplitPoint(SplitBefore); |
| 1116 | if (SplitBefore < SplitAfter) { |
| 1117 | DEBUG(dbgs() << " shrink\n"); |
| 1118 | // Recompute the max when necessary. |
| 1119 | if (GapWeight[SplitBefore - 1] >= MaxGap) { |
| 1120 | MaxGap = GapWeight[SplitBefore]; |
| 1121 | for (unsigned i = SplitBefore + 1; i != SplitAfter; ++i) |
| 1122 | MaxGap = std::max(MaxGap, GapWeight[i]); |
| 1123 | } |
| 1124 | continue; |
| 1125 | } |
| 1126 | MaxGap = 0; |
| 1127 | } |
| 1128 | |
| 1129 | // Try to extend the interval. |
| 1130 | if (SplitAfter >= NumGaps) { |
| 1131 | DEBUG(dbgs() << " end\n"); |
| 1132 | break; |
| 1133 | } |
| 1134 | |
| 1135 | DEBUG(dbgs() << " extend\n"); |
| 1136 | for (unsigned e = nextSplitPoint(SplitAfter + 1) - 1; |
| 1137 | SplitAfter != e; ++SplitAfter) |
| 1138 | MaxGap = std::max(MaxGap, GapWeight[SplitAfter]); |
| 1139 | continue; |
| 1140 | } |
| 1141 | } |
| 1142 | |
| 1143 | // Didn't find any candidates? |
| 1144 | if (BestBefore == NumGaps) |
| 1145 | return 0; |
| 1146 | |
| 1147 | DEBUG(dbgs() << "Best local split range: " << Uses[BestBefore] |
| 1148 | << '-' << Uses[BestAfter] << ", " << BestDiff |
| 1149 | << ", " << (BestAfter - BestBefore + 1) << " instrs\n"); |
| 1150 | |
Jakob Stoklund Olesen | 92a55f4 | 2011-03-09 00:57:29 +0000 | [diff] [blame] | 1151 | LiveRangeEdit LREdit(VirtReg, NewVRegs, this); |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 1152 | SE->reset(LREdit); |
Jakob Stoklund Olesen | 034a80d | 2011-02-17 19:13:53 +0000 | [diff] [blame] | 1153 | |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 1154 | SE->openIntv(); |
| 1155 | SlotIndex SegStart = SE->enterIntvBefore(Uses[BestBefore]); |
| 1156 | SlotIndex SegStop = SE->leaveIntvAfter(Uses[BestAfter]); |
| 1157 | SE->useIntv(SegStart, SegStop); |
| 1158 | SE->closeIntv(); |
| 1159 | SE->finish(); |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 1160 | setStage(NewVRegs.begin(), NewVRegs.end(), RS_Local); |
Jakob Stoklund Olesen | 0db841f | 2011-02-17 22:53:48 +0000 | [diff] [blame] | 1161 | ++NumLocalSplits; |
Jakob Stoklund Olesen | 034a80d | 2011-02-17 19:13:53 +0000 | [diff] [blame] | 1162 | |
| 1163 | return 0; |
| 1164 | } |
| 1165 | |
| 1166 | //===----------------------------------------------------------------------===// |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 1167 | // Live Range Splitting |
| 1168 | //===----------------------------------------------------------------------===// |
| 1169 | |
| 1170 | /// trySplit - Try to split VirtReg or one of its interferences, making it |
| 1171 | /// assignable. |
| 1172 | /// @return Physreg when VirtReg may be assigned and/or new NewVRegs. |
| 1173 | unsigned RAGreedy::trySplit(LiveInterval &VirtReg, AllocationOrder &Order, |
| 1174 | SmallVectorImpl<LiveInterval*>&NewVRegs) { |
Jakob Stoklund Olesen | 034a80d | 2011-02-17 19:13:53 +0000 | [diff] [blame] | 1175 | // Local intervals are handled separately. |
Jakob Stoklund Olesen | a2ebf60 | 2011-02-19 00:38:40 +0000 | [diff] [blame] | 1176 | if (LIS->intervalIsInOneMBB(VirtReg)) { |
| 1177 | NamedRegionTimer T("Local Splitting", TimerGroupName, TimePassesIsEnabled); |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 1178 | SA->analyze(&VirtReg); |
Jakob Stoklund Olesen | 034a80d | 2011-02-17 19:13:53 +0000 | [diff] [blame] | 1179 | return tryLocalSplit(VirtReg, Order, NewVRegs); |
Jakob Stoklund Olesen | a2ebf60 | 2011-02-19 00:38:40 +0000 | [diff] [blame] | 1180 | } |
| 1181 | |
| 1182 | NamedRegionTimer T("Global Splitting", TimerGroupName, TimePassesIsEnabled); |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 1183 | |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 1184 | // Don't iterate global splitting. |
| 1185 | // Move straight to spilling if this range was produced by a global split. |
| 1186 | LiveRangeStage Stage = getStage(VirtReg); |
| 1187 | if (Stage >= RS_Block) |
| 1188 | return 0; |
| 1189 | |
| 1190 | SA->analyze(&VirtReg); |
| 1191 | |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 1192 | // First try to split around a region spanning multiple blocks. |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 1193 | if (Stage < RS_Region) { |
| 1194 | unsigned PhysReg = tryRegionSplit(VirtReg, Order, NewVRegs); |
| 1195 | if (PhysReg || !NewVRegs.empty()) |
| 1196 | return PhysReg; |
| 1197 | } |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 1198 | |
| 1199 | // Then isolate blocks with multiple uses. |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 1200 | if (Stage < RS_Block) { |
| 1201 | SplitAnalysis::BlockPtrSet Blocks; |
| 1202 | if (SA->getMultiUseBlocks(Blocks)) { |
Jakob Stoklund Olesen | 92a55f4 | 2011-03-09 00:57:29 +0000 | [diff] [blame] | 1203 | LiveRangeEdit LREdit(VirtReg, NewVRegs, this); |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 1204 | SE->reset(LREdit); |
| 1205 | SE->splitSingleBlocks(Blocks); |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 1206 | setStage(NewVRegs.begin(), NewVRegs.end(), RS_Block); |
| 1207 | if (VerifyEnabled) |
| 1208 | MF->verify(this, "After splitting live range around basic blocks"); |
| 1209 | } |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 1210 | } |
| 1211 | |
| 1212 | // Don't assign any physregs. |
| 1213 | return 0; |
| 1214 | } |
| 1215 | |
| 1216 | |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 1217 | //===----------------------------------------------------------------------===// |
Jakob Stoklund Olesen | 770d42d | 2010-12-22 22:01:30 +0000 | [diff] [blame] | 1218 | // Main Entry Point |
| 1219 | //===----------------------------------------------------------------------===// |
| 1220 | |
| 1221 | unsigned RAGreedy::selectOrSplit(LiveInterval &VirtReg, |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 1222 | SmallVectorImpl<LiveInterval*> &NewVRegs) { |
Jakob Stoklund Olesen | 770d42d | 2010-12-22 22:01:30 +0000 | [diff] [blame] | 1223 | // First try assigning a free register. |
Jakob Stoklund Olesen | dd479e9 | 2010-12-10 22:21:05 +0000 | [diff] [blame] | 1224 | AllocationOrder Order(VirtReg.reg, *VRM, ReservedRegs); |
| 1225 | while (unsigned PhysReg = Order.next()) { |
Jakob Stoklund Olesen | 770d42d | 2010-12-22 22:01:30 +0000 | [diff] [blame] | 1226 | if (!checkPhysRegInterference(VirtReg, PhysReg)) |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 1227 | return PhysReg; |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 1228 | } |
Andrew Trick | b853e6c | 2010-12-09 18:15:21 +0000 | [diff] [blame] | 1229 | |
Jakob Stoklund Olesen | 98c8141 | 2011-02-23 00:29:52 +0000 | [diff] [blame] | 1230 | if (unsigned PhysReg = tryEvict(VirtReg, Order, NewVRegs)) |
Jakob Stoklund Olesen | 46c83c8 | 2010-12-14 00:37:49 +0000 | [diff] [blame] | 1231 | return PhysReg; |
Andrew Trick | b853e6c | 2010-12-09 18:15:21 +0000 | [diff] [blame] | 1232 | |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 1233 | assert(NewVRegs.empty() && "Cannot append to existing NewVRegs"); |
| 1234 | |
Jakob Stoklund Olesen | 107d366 | 2011-02-24 23:21:36 +0000 | [diff] [blame] | 1235 | // The first time we see a live range, don't try to split or spill. |
| 1236 | // Wait until the second time, when all smaller ranges have been allocated. |
| 1237 | // This gives a better picture of the interference to split around. |
Jakob Stoklund Olesen | eb29157 | 2011-03-27 22:49:21 +0000 | [diff] [blame] | 1238 | LiveRangeStage Stage = getStage(VirtReg); |
Jakob Stoklund Olesen | f22ca3f | 2011-03-30 02:52:39 +0000 | [diff] [blame] | 1239 | if (Stage == RS_First) { |
Jakob Stoklund Olesen | eb29157 | 2011-03-27 22:49:21 +0000 | [diff] [blame] | 1240 | LRStage[VirtReg.reg] = RS_Second; |
Jakob Stoklund Olesen | c1655e1 | 2011-03-19 23:02:47 +0000 | [diff] [blame] | 1241 | DEBUG(dbgs() << "wait for second round\n"); |
Jakob Stoklund Olesen | 107d366 | 2011-02-24 23:21:36 +0000 | [diff] [blame] | 1242 | NewVRegs.push_back(&VirtReg); |
| 1243 | return 0; |
| 1244 | } |
| 1245 | |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 1246 | assert(Stage < RS_Spill && "Cannot allocate after spilling"); |
| 1247 | |
Jakob Stoklund Olesen | 46c83c8 | 2010-12-14 00:37:49 +0000 | [diff] [blame] | 1248 | // Try splitting VirtReg or interferences. |
Jakob Stoklund Olesen | ccdb3fc | 2011-01-19 22:11:48 +0000 | [diff] [blame] | 1249 | unsigned PhysReg = trySplit(VirtReg, Order, NewVRegs); |
| 1250 | if (PhysReg || !NewVRegs.empty()) |
Jakob Stoklund Olesen | b64d92e | 2010-12-14 00:37:44 +0000 | [diff] [blame] | 1251 | return PhysReg; |
| 1252 | |
Jakob Stoklund Olesen | 770d42d | 2010-12-22 22:01:30 +0000 | [diff] [blame] | 1253 | // Finally spill VirtReg itself. |
Jakob Stoklund Olesen | 533f58e | 2010-12-11 00:19:56 +0000 | [diff] [blame] | 1254 | NamedRegionTimer T("Spiller", TimerGroupName, TimePassesIsEnabled); |
Jakob Stoklund Olesen | 47dbf6c | 2011-03-10 01:51:42 +0000 | [diff] [blame] | 1255 | LiveRangeEdit LRE(VirtReg, NewVRegs, this); |
| 1256 | spiller().spill(LRE); |
Jakob Stoklund Olesen | 6094bd8 | 2011-03-29 21:20:19 +0000 | [diff] [blame] | 1257 | setStage(NewVRegs.begin(), NewVRegs.end(), RS_Spill); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 1258 | |
Jakob Stoklund Olesen | c46570d | 2011-03-16 22:56:08 +0000 | [diff] [blame] | 1259 | if (VerifyEnabled) |
| 1260 | MF->verify(this, "After spilling"); |
| 1261 | |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 1262 | // The live virtual register requesting allocation was spilled, so tell |
| 1263 | // the caller not to allocate anything during this round. |
| 1264 | return 0; |
| 1265 | } |
| 1266 | |
| 1267 | bool RAGreedy::runOnMachineFunction(MachineFunction &mf) { |
| 1268 | DEBUG(dbgs() << "********** GREEDY REGISTER ALLOCATION **********\n" |
| 1269 | << "********** Function: " |
| 1270 | << ((Value*)mf.getFunction())->getName() << '\n'); |
| 1271 | |
| 1272 | MF = &mf; |
Jakob Stoklund Olesen | af24964 | 2010-12-17 23:16:35 +0000 | [diff] [blame] | 1273 | if (VerifyEnabled) |
Jakob Stoklund Olesen | 89cab93 | 2010-12-18 00:06:56 +0000 | [diff] [blame] | 1274 | MF->verify(this, "Before greedy register allocator"); |
Jakob Stoklund Olesen | af24964 | 2010-12-17 23:16:35 +0000 | [diff] [blame] | 1275 | |
Jakob Stoklund Olesen | 4680dec | 2010-12-10 23:49:00 +0000 | [diff] [blame] | 1276 | RegAllocBase::init(getAnalysis<VirtRegMap>(), getAnalysis<LiveIntervals>()); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 1277 | Indexes = &getAnalysis<SlotIndexes>(); |
Jakob Stoklund Olesen | f428eb6 | 2010-12-17 23:16:32 +0000 | [diff] [blame] | 1278 | DomTree = &getAnalysis<MachineDominatorTree>(); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 1279 | ReservedRegs = TRI->getReservedRegs(*MF); |
Jakob Stoklund Olesen | f6dff84 | 2010-12-10 22:54:44 +0000 | [diff] [blame] | 1280 | SpillerInstance.reset(createInlineSpiller(*this, *MF, *VRM)); |
Jakob Stoklund Olesen | d0bb5e2 | 2010-12-15 23:46:13 +0000 | [diff] [blame] | 1281 | Loops = &getAnalysis<MachineLoopInfo>(); |
| 1282 | LoopRanges = &getAnalysis<MachineLoopRanges>(); |
Jakob Stoklund Olesen | b5fa933 | 2011-01-18 21:13:27 +0000 | [diff] [blame] | 1283 | Bundles = &getAnalysis<EdgeBundles>(); |
| 1284 | SpillPlacer = &getAnalysis<SpillPlacement>(); |
| 1285 | |
Jakob Stoklund Olesen | 1b847de | 2011-02-19 00:53:42 +0000 | [diff] [blame] | 1286 | SA.reset(new SplitAnalysis(*VRM, *LIS, *Loops)); |
Jakob Stoklund Olesen | bece06f | 2011-03-03 01:29:13 +0000 | [diff] [blame] | 1287 | SE.reset(new SplitEditor(*SA, *LIS, *VRM, *DomTree)); |
Jakob Stoklund Olesen | 22a1df6 | 2011-03-01 21:10:07 +0000 | [diff] [blame] | 1288 | LRStage.clear(); |
| 1289 | LRStage.resize(MRI->getNumVirtRegs()); |
Jakob Stoklund Olesen | eda0fe8 | 2011-04-02 06:03:38 +0000 | [diff] [blame] | 1290 | IntfCache.init(MF, &PhysReg2LiveUnion[0], Indexes, TRI); |
Jakob Stoklund Olesen | d0bb5e2 | 2010-12-15 23:46:13 +0000 | [diff] [blame] | 1291 | |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 1292 | allocatePhysRegs(); |
| 1293 | addMBBLiveIns(MF); |
Jakob Stoklund Olesen | 8a61da8 | 2011-02-08 21:13:03 +0000 | [diff] [blame] | 1294 | LIS->addKillFlags(); |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 1295 | |
| 1296 | // Run rewriter |
Jakob Stoklund Olesen | 533f58e | 2010-12-11 00:19:56 +0000 | [diff] [blame] | 1297 | { |
| 1298 | NamedRegionTimer T("Rewriter", TimerGroupName, TimePassesIsEnabled); |
Jakob Stoklund Olesen | ba05c01 | 2011-02-18 22:03:18 +0000 | [diff] [blame] | 1299 | VRM->rewrite(Indexes); |
Jakob Stoklund Olesen | 533f58e | 2010-12-11 00:19:56 +0000 | [diff] [blame] | 1300 | } |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 1301 | |
Jakob Stoklund Olesen | cfafc54 | 2011-04-05 21:40:37 +0000 | [diff] [blame] | 1302 | // Write out new DBG_VALUE instructions. |
| 1303 | getAnalysis<LiveDebugVariables>().emitDebugValues(VRM); |
| 1304 | |
Jakob Stoklund Olesen | cba2e06 | 2010-12-08 03:26:16 +0000 | [diff] [blame] | 1305 | // The pass output is in VirtRegMap. Release all the transient data. |
| 1306 | releaseMemory(); |
| 1307 | |
| 1308 | return true; |
| 1309 | } |