//===-- TailDuplication.cpp - Duplicate blocks into predecessors' tails ---===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This pass duplicates basic blocks ending in unconditional branches into
// the tails of their predecessors.
//
//===----------------------------------------------------------------------===//
| 14 | |
| 15 | #define DEBUG_TYPE "tailduplication" |
| 16 | #include "llvm/Function.h" |
| 17 | #include "llvm/CodeGen/Passes.h" |
| 18 | #include "llvm/CodeGen/MachineModuleInfo.h" |
| 19 | #include "llvm/CodeGen/MachineFunctionPass.h" |
Evan Cheng | 111e762 | 2009-12-03 08:43:53 +0000 | [diff] [blame] | 20 | #include "llvm/CodeGen/MachineRegisterInfo.h" |
| 21 | #include "llvm/CodeGen/MachineSSAUpdater.h" |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 22 | #include "llvm/Target/TargetInstrInfo.h" |
| 23 | #include "llvm/Support/CommandLine.h" |
| 24 | #include "llvm/Support/Debug.h" |
| 25 | #include "llvm/Support/raw_ostream.h" |
| 26 | #include "llvm/ADT/SmallSet.h" |
| 27 | #include "llvm/ADT/SetVector.h" |
| 28 | #include "llvm/ADT/Statistic.h" |
| 29 | using namespace llvm; |
| 30 | |
| 31 | STATISTIC(NumTailDups , "Number of tail duplicated blocks"); |
| 32 | STATISTIC(NumInstrDups , "Additional instructions due to tail duplication"); |
| 33 | STATISTIC(NumDeadBlocks, "Number of dead blocks removed"); |
| 34 | |
| 35 | // Heuristic for tail duplication. |
| 36 | static cl::opt<unsigned> |
| 37 | TailDuplicateSize("tail-dup-size", |
| 38 | cl::desc("Maximum instructions to consider tail duplicating"), |
| 39 | cl::init(2), cl::Hidden); |
| 40 | |
Evan Cheng | 111e762 | 2009-12-03 08:43:53 +0000 | [diff] [blame] | 41 | typedef std::vector<unsigned> AvailableValsTy; |
| 42 | |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 43 | namespace { |
Bob Wilson | 2d521e5 | 2009-11-26 21:38:41 +0000 | [diff] [blame] | 44 | /// TailDuplicatePass - Perform tail duplication. |
| 45 | class TailDuplicatePass : public MachineFunctionPass { |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 46 | bool PreRegAlloc; |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 47 | const TargetInstrInfo *TII; |
| 48 | MachineModuleInfo *MMI; |
Evan Cheng | 111e762 | 2009-12-03 08:43:53 +0000 | [diff] [blame] | 49 | MachineRegisterInfo *MRI; |
| 50 | |
| 51 | // SSAUpdateVRs - A list of virtual registers for which to update SSA form. |
| 52 | SmallVector<unsigned, 16> SSAUpdateVRs; |
| 53 | |
| 54 | // SSAUpdateVals - For each virtual register in SSAUpdateVals keep a list of |
| 55 | // source virtual registers. |
| 56 | DenseMap<unsigned, AvailableValsTy> SSAUpdateVals; |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 57 | |
| 58 | public: |
| 59 | static char ID; |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 60 | explicit TailDuplicatePass(bool PreRA) : |
| 61 | MachineFunctionPass(&ID), PreRegAlloc(PreRA) {} |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 62 | |
| 63 | virtual bool runOnMachineFunction(MachineFunction &MF); |
| 64 | virtual const char *getPassName() const { return "Tail Duplication"; } |
| 65 | |
| 66 | private: |
Evan Cheng | 111e762 | 2009-12-03 08:43:53 +0000 | [diff] [blame] | 67 | void AddSSAUpdateEntry(unsigned OrigReg, unsigned NewReg); |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 68 | void ProcessPHI(MachineInstr *MI, MachineBasicBlock *TailBB, |
| 69 | MachineBasicBlock *PredBB, |
| 70 | DenseMap<unsigned, unsigned> &LocalVRMap); |
| 71 | void DuplicateInstruction(MachineInstr *MI, |
| 72 | MachineBasicBlock *TailBB, |
| 73 | MachineBasicBlock *PredBB, |
| 74 | MachineFunction &MF, |
| 75 | DenseMap<unsigned, unsigned> &LocalVRMap); |
| 76 | void UpdateSuccessorsPHIs(MachineBasicBlock *FromBB,MachineBasicBlock *ToBB, |
| 77 | SmallSetVector<MachineBasicBlock*,8> &Succs); |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 78 | bool TailDuplicateBlocks(MachineFunction &MF); |
| 79 | bool TailDuplicate(MachineBasicBlock *TailBB, MachineFunction &MF); |
| 80 | void RemoveDeadBlock(MachineBasicBlock *MBB); |
| 81 | }; |
| 82 | |
Bob Wilson | 2d521e5 | 2009-11-26 21:38:41 +0000 | [diff] [blame] | 83 | char TailDuplicatePass::ID = 0; |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 84 | } |
| 85 | |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 86 | FunctionPass *llvm::createTailDuplicatePass(bool PreRegAlloc) { |
| 87 | return new TailDuplicatePass(PreRegAlloc); |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 88 | } |
| 89 | |
Bob Wilson | 2d521e5 | 2009-11-26 21:38:41 +0000 | [diff] [blame] | 90 | bool TailDuplicatePass::runOnMachineFunction(MachineFunction &MF) { |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 91 | TII = MF.getTarget().getInstrInfo(); |
Evan Cheng | 111e762 | 2009-12-03 08:43:53 +0000 | [diff] [blame] | 92 | MRI = &MF.getRegInfo(); |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 93 | MMI = getAnalysisIfAvailable<MachineModuleInfo>(); |
| 94 | |
| 95 | bool MadeChange = false; |
| 96 | bool MadeChangeThisIteration = true; |
| 97 | while (MadeChangeThisIteration) { |
| 98 | MadeChangeThisIteration = false; |
| 99 | MadeChangeThisIteration |= TailDuplicateBlocks(MF); |
| 100 | MadeChange |= MadeChangeThisIteration; |
| 101 | } |
| 102 | |
| 103 | return MadeChange; |
| 104 | } |
| 105 | |
| 106 | /// TailDuplicateBlocks - Look for small blocks that are unconditionally |
| 107 | /// branched to and do not fall through. Tail-duplicate their instructions |
| 108 | /// into their predecessors to eliminate (dynamic) branches. |
Bob Wilson | 2d521e5 | 2009-11-26 21:38:41 +0000 | [diff] [blame] | 109 | bool TailDuplicatePass::TailDuplicateBlocks(MachineFunction &MF) { |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 110 | bool MadeChange = false; |
| 111 | |
| 112 | for (MachineFunction::iterator I = ++MF.begin(), E = MF.end(); I != E; ) { |
| 113 | MachineBasicBlock *MBB = I++; |
| 114 | |
| 115 | // Only duplicate blocks that end with unconditional branches. |
| 116 | if (MBB->canFallThrough()) |
| 117 | continue; |
| 118 | |
| 119 | MadeChange |= TailDuplicate(MBB, MF); |
| 120 | |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 121 | // If it is dead, remove it. Don't do this if this pass is run before |
| 122 | // register allocation to avoid having to update PHI nodes. |
| 123 | if (!PreRegAlloc && MBB->pred_empty()) { |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 124 | NumInstrDups -= MBB->size(); |
| 125 | RemoveDeadBlock(MBB); |
| 126 | MadeChange = true; |
| 127 | ++NumDeadBlocks; |
| 128 | } |
| 129 | } |
Evan Cheng | 111e762 | 2009-12-03 08:43:53 +0000 | [diff] [blame] | 130 | |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 131 | return MadeChange; |
| 132 | } |
| 133 | |
Evan Cheng | 111e762 | 2009-12-03 08:43:53 +0000 | [diff] [blame] | 134 | static bool isDefLiveOut(unsigned Reg, MachineBasicBlock *BB, |
| 135 | const MachineRegisterInfo *MRI) { |
| 136 | for (MachineRegisterInfo::use_iterator UI = MRI->use_begin(Reg), |
| 137 | UE = MRI->use_end(); UI != UE; ++UI) { |
| 138 | MachineInstr *UseMI = &*UI; |
| 139 | if (UseMI->getParent() != BB) |
| 140 | return true; |
| 141 | } |
| 142 | return false; |
| 143 | } |
| 144 | |
| 145 | static unsigned getPHISrcRegOpIdx(MachineInstr *MI, MachineBasicBlock *SrcBB) { |
| 146 | for (unsigned i = 1, e = MI->getNumOperands(); i != e; i += 2) |
| 147 | if (MI->getOperand(i+1).getMBB() == SrcBB) |
| 148 | return i; |
| 149 | return 0; |
| 150 | } |
| 151 | |
| 152 | /// AddSSAUpdateEntry - Add a definition and source virtual registers pair for |
| 153 | /// SSA update. |
| 154 | void TailDuplicatePass::AddSSAUpdateEntry(unsigned OrigReg, unsigned NewReg) { |
| 155 | DenseMap<unsigned, AvailableValsTy>::iterator LI = |
| 156 | SSAUpdateVals.find(OrigReg); |
| 157 | if (LI != SSAUpdateVals.end()) |
| 158 | LI->second.push_back(NewReg); |
| 159 | else { |
| 160 | AvailableValsTy Vals; |
| 161 | Vals.push_back(NewReg); |
| 162 | SSAUpdateVals.insert(std::make_pair(OrigReg, Vals)); |
| 163 | SSAUpdateVRs.push_back(OrigReg); |
| 164 | } |
| 165 | } |
| 166 | |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 167 | /// ProcessPHI - Process but do not duplicate a PHI node in TailBB. Remember the |
| 168 | /// source register that's contributed by PredBB and update SSA update map. |
| 169 | void TailDuplicatePass::ProcessPHI(MachineInstr *MI, |
| 170 | MachineBasicBlock *TailBB, |
| 171 | MachineBasicBlock *PredBB, |
| 172 | DenseMap<unsigned, unsigned> &LocalVRMap) { |
| 173 | unsigned DefReg = MI->getOperand(0).getReg(); |
| 174 | unsigned SrcOpIdx = getPHISrcRegOpIdx(MI, PredBB); |
| 175 | assert(SrcOpIdx && "Unable to find matching PHI source?"); |
| 176 | unsigned SrcReg = MI->getOperand(SrcOpIdx).getReg(); |
| 177 | LocalVRMap.insert(std::make_pair(DefReg, SrcReg)); |
| 178 | if (isDefLiveOut(DefReg, TailBB, MRI)) |
| 179 | AddSSAUpdateEntry(DefReg, SrcReg); |
| 180 | |
| 181 | // Remove PredBB from the PHI node. |
| 182 | MI->RemoveOperand(SrcOpIdx+1); |
| 183 | MI->RemoveOperand(SrcOpIdx); |
| 184 | if (MI->getNumOperands() == 1) |
| 185 | MI->eraseFromParent(); |
| 186 | } |
| 187 | |
| 188 | /// DuplicateInstruction - Duplicate a TailBB instruction to PredBB and update |
| 189 | /// the source operands due to earlier PHI translation. |
| 190 | void TailDuplicatePass::DuplicateInstruction(MachineInstr *MI, |
| 191 | MachineBasicBlock *TailBB, |
| 192 | MachineBasicBlock *PredBB, |
| 193 | MachineFunction &MF, |
| 194 | DenseMap<unsigned, unsigned> &LocalVRMap) { |
| 195 | MachineInstr *NewMI = MF.CloneMachineInstr(MI); |
| 196 | for (unsigned i = 0, e = NewMI->getNumOperands(); i != e; ++i) { |
| 197 | MachineOperand &MO = NewMI->getOperand(i); |
| 198 | if (!MO.isReg()) |
| 199 | continue; |
| 200 | unsigned Reg = MO.getReg(); |
| 201 | if (!Reg || TargetRegisterInfo::isPhysicalRegister(Reg)) |
| 202 | continue; |
| 203 | if (MO.isDef()) { |
| 204 | const TargetRegisterClass *RC = MRI->getRegClass(Reg); |
| 205 | unsigned NewReg = MRI->createVirtualRegister(RC); |
| 206 | MO.setReg(NewReg); |
| 207 | LocalVRMap.insert(std::make_pair(Reg, NewReg)); |
| 208 | if (isDefLiveOut(Reg, TailBB, MRI)) |
| 209 | AddSSAUpdateEntry(Reg, NewReg); |
| 210 | } else { |
| 211 | DenseMap<unsigned, unsigned>::iterator VI = LocalVRMap.find(Reg); |
| 212 | if (VI != LocalVRMap.end()) |
| 213 | MO.setReg(VI->second); |
| 214 | } |
| 215 | } |
| 216 | PredBB->insert(PredBB->end(), NewMI); |
| 217 | } |
| 218 | |
| 219 | /// UpdateSuccessorsPHIs - After FromBB is tail duplicated into its predecessor |
| 220 | /// blocks, the successors have gained new predecessors. Update the PHI |
| 221 | /// instructions in them accordingly. |
| 222 | void TailDuplicatePass::UpdateSuccessorsPHIs(MachineBasicBlock *FromBB, |
| 223 | MachineBasicBlock *ToBB, |
| 224 | SmallSetVector<MachineBasicBlock*,8> &Succs) { |
| 225 | for (SmallSetVector<MachineBasicBlock*, 8>::iterator SI = Succs.begin(), |
| 226 | SE = Succs.end(); SI != SE; ++SI) { |
| 227 | MachineBasicBlock *SuccBB = *SI; |
| 228 | for (MachineBasicBlock::iterator II = SuccBB->begin(), EE = SuccBB->end(); |
| 229 | II != EE; ++II) { |
| 230 | if (II->getOpcode() != TargetInstrInfo::PHI) |
| 231 | break; |
| 232 | for (unsigned i = 1, e = II->getNumOperands(); i != e; i += 2) { |
| 233 | MachineOperand &MO1 = II->getOperand(i+1); |
| 234 | if (MO1.getMBB() != FromBB) |
| 235 | continue; |
| 236 | MachineOperand &MO0 = II->getOperand(i); |
| 237 | unsigned Reg = MO0.getReg(); |
| 238 | if (ToBB) { |
| 239 | // Folded into the previous BB. |
| 240 | II->RemoveOperand(i+1); |
| 241 | II->RemoveOperand(i); |
| 242 | } |
| 243 | DenseMap<unsigned, AvailableValsTy>::iterator LI = |
| 244 | SSAUpdateVals.find(Reg); |
| 245 | if (LI == SSAUpdateVals.end()) |
| 246 | break; |
| 247 | for (unsigned j = 0, ee = LI->second.size(); j != ee; ++j) { |
| 248 | unsigned NewReg = LI->second[j]; |
| 249 | MachineInstr *DefMI = MRI->getVRegDef(NewReg); |
| 250 | II->addOperand(MachineOperand::CreateReg(NewReg, false)); |
| 251 | II->addOperand(MachineOperand::CreateMBB(DefMI->getParent())); |
| 252 | } |
| 253 | break; |
| 254 | } |
| 255 | } |
| 256 | } |
| 257 | } |
| 258 | |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 259 | /// TailDuplicate - If it is profitable, duplicate TailBB's contents in each |
| 260 | /// of its predecessors. |
Bob Wilson | 2d521e5 | 2009-11-26 21:38:41 +0000 | [diff] [blame] | 261 | bool TailDuplicatePass::TailDuplicate(MachineBasicBlock *TailBB, |
Evan Cheng | 111e762 | 2009-12-03 08:43:53 +0000 | [diff] [blame] | 262 | MachineFunction &MF) { |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 263 | // Don't try to tail-duplicate single-block loops. |
| 264 | if (TailBB->isSuccessor(TailBB)) |
| 265 | return false; |
| 266 | |
| 267 | // Set the limit on the number of instructions to duplicate, with a default |
| 268 | // of one less than the tail-merge threshold. When optimizing for size, |
| 269 | // duplicate only one, because one branch instruction can be eliminated to |
| 270 | // compensate for the duplication. |
| 271 | unsigned MaxDuplicateCount; |
Bob Wilson | 3858225 | 2009-11-30 18:56:45 +0000 | [diff] [blame] | 272 | if (!TailBB->empty() && TailBB->back().getDesc().isIndirectBranch()) |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 273 | // If the target has hardware branch prediction that can handle indirect |
| 274 | // branches, duplicating them can often make them predictable when there |
| 275 | // are common paths through the code. The limit needs to be high enough |
| 276 | // to allow undoing the effects of tail merging. |
| 277 | MaxDuplicateCount = 20; |
Bob Wilson | 3858225 | 2009-11-30 18:56:45 +0000 | [diff] [blame] | 278 | else if (MF.getFunction()->hasFnAttr(Attribute::OptimizeForSize)) |
| 279 | MaxDuplicateCount = 1; |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 280 | else |
| 281 | MaxDuplicateCount = TailDuplicateSize; |
| 282 | |
| 283 | // Check the instructions in the block to determine whether tail-duplication |
| 284 | // is invalid or unlikely to be profitable. |
Bob Wilson | f1e01dc | 2009-12-02 17:15:24 +0000 | [diff] [blame] | 285 | unsigned InstrCount = 0; |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 286 | bool HasCall = false; |
| 287 | for (MachineBasicBlock::iterator I = TailBB->begin(); |
Bob Wilson | f1e01dc | 2009-12-02 17:15:24 +0000 | [diff] [blame] | 288 | I != TailBB->end(); ++I) { |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 289 | // Non-duplicable things shouldn't be tail-duplicated. |
| 290 | if (I->getDesc().isNotDuplicable()) return false; |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 291 | // Do not duplicate 'return' instructions if this is a pre-regalloc run. |
| 292 | // A return may expand into a lot more instructions (e.g. reload of callee |
| 293 | // saved registers) after PEI. |
| 294 | if (PreRegAlloc && I->getDesc().isReturn()) return false; |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 295 | // Don't duplicate more than the threshold. |
Bob Wilson | f1e01dc | 2009-12-02 17:15:24 +0000 | [diff] [blame] | 296 | if (InstrCount == MaxDuplicateCount) return false; |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 297 | // Remember if we saw a call. |
| 298 | if (I->getDesc().isCall()) HasCall = true; |
Bob Wilson | f1e01dc | 2009-12-02 17:15:24 +0000 | [diff] [blame] | 299 | if (I->getOpcode() != TargetInstrInfo::PHI) |
| 300 | InstrCount += 1; |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 301 | } |
| 302 | // Heuristically, don't tail-duplicate calls if it would expand code size, |
| 303 | // as it's less likely to be worth the extra cost. |
Bob Wilson | f1e01dc | 2009-12-02 17:15:24 +0000 | [diff] [blame] | 304 | if (InstrCount > 1 && HasCall) |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 305 | return false; |
| 306 | |
| 307 | // Iterate through all the unique predecessors and tail-duplicate this |
| 308 | // block into them, if possible. Copying the list ahead of time also |
| 309 | // avoids trouble with the predecessor list reallocating. |
| 310 | bool Changed = false; |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 311 | SmallSetVector<MachineBasicBlock*, 8> Preds(TailBB->pred_begin(), |
| 312 | TailBB->pred_end()); |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 313 | for (SmallSetVector<MachineBasicBlock *, 8>::iterator PI = Preds.begin(), |
| 314 | PE = Preds.end(); PI != PE; ++PI) { |
| 315 | MachineBasicBlock *PredBB = *PI; |
| 316 | |
| 317 | assert(TailBB != PredBB && |
| 318 | "Single-block loop should have been rejected earlier!"); |
| 319 | if (PredBB->succ_size() > 1) continue; |
| 320 | |
| 321 | MachineBasicBlock *PredTBB, *PredFBB; |
| 322 | SmallVector<MachineOperand, 4> PredCond; |
| 323 | if (TII->AnalyzeBranch(*PredBB, PredTBB, PredFBB, PredCond, true)) |
| 324 | continue; |
| 325 | if (!PredCond.empty()) |
| 326 | continue; |
| 327 | // EH edges are ignored by AnalyzeBranch. |
| 328 | if (PredBB->succ_size() != 1) |
| 329 | continue; |
| 330 | // Don't duplicate into a fall-through predecessor (at least for now). |
| 331 | if (PredBB->isLayoutSuccessor(TailBB) && PredBB->canFallThrough()) |
| 332 | continue; |
| 333 | |
| 334 | DEBUG(errs() << "\nTail-duplicating into PredBB: " << *PredBB |
| 335 | << "From Succ: " << *TailBB); |
| 336 | |
| 337 | // Remove PredBB's unconditional branch. |
| 338 | TII->RemoveBranch(*PredBB); |
Evan Cheng | 111e762 | 2009-12-03 08:43:53 +0000 | [diff] [blame] | 339 | |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 340 | // Clone the contents of TailBB into PredBB. |
Evan Cheng | 111e762 | 2009-12-03 08:43:53 +0000 | [diff] [blame] | 341 | DenseMap<unsigned, unsigned> LocalVRMap; |
| 342 | MachineBasicBlock::iterator I = TailBB->begin(); |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 343 | while (I != TailBB->end()) { |
| 344 | MachineInstr *MI = &*I; |
| 345 | ++I; |
| 346 | if (MI->getOpcode() == TargetInstrInfo::PHI) { |
Evan Cheng | 111e762 | 2009-12-03 08:43:53 +0000 | [diff] [blame] | 347 | // Replace the uses of the def of the PHI with the register coming |
| 348 | // from PredBB. |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 349 | ProcessPHI(MI, TailBB, PredBB, LocalVRMap); |
| 350 | } else { |
| 351 | // Replace def of virtual registers with new registers, and update |
| 352 | // uses with PHI source register or the new registers. |
| 353 | DuplicateInstruction(MI, TailBB, PredBB, MF, LocalVRMap); |
Evan Cheng | 111e762 | 2009-12-03 08:43:53 +0000 | [diff] [blame] | 354 | } |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 355 | } |
| 356 | NumInstrDups += TailBB->size() - 1; // subtract one for removed branch |
| 357 | |
| 358 | // Update the CFG. |
| 359 | PredBB->removeSuccessor(PredBB->succ_begin()); |
| 360 | assert(PredBB->succ_empty() && |
| 361 | "TailDuplicate called on block with multiple successors!"); |
| 362 | for (MachineBasicBlock::succ_iterator I = TailBB->succ_begin(), |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 363 | E = TailBB->succ_end(); I != E; ++I) |
| 364 | PredBB->addSuccessor(*I); |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 365 | |
| 366 | Changed = true; |
| 367 | ++NumTailDups; |
| 368 | } |
| 369 | |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 370 | // Save the successors list. |
| 371 | SmallSetVector<MachineBasicBlock*, 8> Succs(TailBB->succ_begin(), |
| 372 | TailBB->succ_end()); |
| 373 | |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 374 | // If TailBB was duplicated into all its predecessors except for the prior |
| 375 | // block, which falls through unconditionally, move the contents of this |
| 376 | // block into the prior block. |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 377 | MachineBasicBlock *PrevBB = prior(MachineFunction::iterator(TailBB)); |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 378 | MachineBasicBlock *PriorTBB = 0, *PriorFBB = 0; |
| 379 | SmallVector<MachineOperand, 4> PriorCond; |
| 380 | bool PriorUnAnalyzable = |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 381 | TII->AnalyzeBranch(*PrevBB, PriorTBB, PriorFBB, PriorCond, true); |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 382 | // This has to check PrevBB->succ_size() because EH edges are ignored by |
| 383 | // AnalyzeBranch. |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 384 | // If TailBB starts with PHIs, then don't bother. Let the post regalloc |
| 385 | // run clean it up. |
| 386 | MachineBasicBlock *NewTailBB = 0; |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 387 | if (!PriorUnAnalyzable && PriorCond.empty() && !PriorTBB && |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 388 | TailBB->pred_size() == 1 && PrevBB->succ_size() == 1 && |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 389 | !TailBB->hasAddressTaken()) { |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 390 | DEBUG(errs() << "\nMerging into block: " << *PrevBB |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 391 | << "From MBB: " << *TailBB); |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 392 | if (PreRegAlloc) { |
| 393 | DenseMap<unsigned, unsigned> LocalVRMap; |
| 394 | MachineBasicBlock::iterator I = TailBB->begin(); |
| 395 | // Process PHI instructions first. |
| 396 | while (I != TailBB->end() && I->getOpcode() == TargetInstrInfo::PHI) { |
| 397 | // Replace the uses of the def of the PHI with the register coming |
| 398 | // from PredBB. |
| 399 | MachineInstr *MI = &*I++; |
| 400 | ProcessPHI(MI, TailBB, PrevBB, LocalVRMap); |
| 401 | if (MI->getParent()) |
| 402 | MI->eraseFromParent(); |
| 403 | } |
| 404 | |
| 405 | // Now copy the non-PHI instructions. |
| 406 | while (I != TailBB->end()) { |
| 407 | // Replace def of virtual registers with new registers, and update |
| 408 | // uses with PHI source register or the new registers. |
| 409 | MachineInstr *MI = &*I++; |
| 410 | DuplicateInstruction(MI, TailBB, PrevBB, MF, LocalVRMap); |
| 411 | MI->eraseFromParent(); |
| 412 | } |
| 413 | } else { |
| 414 | // No PHIs to worry about, just splice the instructions over. |
| 415 | PrevBB->splice(PrevBB->end(), TailBB, TailBB->begin(), TailBB->end()); |
| 416 | } |
| 417 | PrevBB->removeSuccessor(PrevBB->succ_begin()); |
| 418 | assert(PrevBB->succ_empty()); |
| 419 | PrevBB->transferSuccessors(TailBB); |
| 420 | NewTailBB = PrevBB; |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 421 | Changed = true; |
| 422 | } |
| 423 | |
Evan Cheng | 79fc6f4 | 2009-12-04 09:42:45 +0000 | [diff] [blame^] | 424 | if (!PreRegAlloc) |
| 425 | return Changed; |
| 426 | |
| 427 | // TailBB's immediate successors are now successors of those predecessors |
| 428 | // which duplicated TailBB. Add the predecessors as sources to the PHI |
| 429 | // instructions. |
| 430 | UpdateSuccessorsPHIs(TailBB, NewTailBB, Succs); |
| 431 | |
| 432 | if (!SSAUpdateVRs.empty()) { |
| 433 | // Update SSA form. |
| 434 | MachineSSAUpdater SSAUpdate(MF); |
| 435 | for (unsigned i = 0, e = SSAUpdateVRs.size(); i != e; ++i) { |
| 436 | unsigned VReg = SSAUpdateVRs[i]; |
| 437 | SSAUpdate.Initialize(VReg); |
| 438 | |
| 439 | // If the original definition is still around, add it as an available |
| 440 | // value. |
| 441 | MachineInstr *DefMI = MRI->getVRegDef(VReg); |
| 442 | MachineBasicBlock *DefBB = 0; |
| 443 | if (DefMI) { |
| 444 | DefBB = DefMI->getParent(); |
| 445 | SSAUpdate.AddAvailableValue(DefBB, VReg); |
| 446 | } |
| 447 | |
| 448 | // Add the new vregs as available values. |
| 449 | DenseMap<unsigned, AvailableValsTy>::iterator LI = |
| 450 | SSAUpdateVals.find(VReg); |
| 451 | for (unsigned j = 0, ee = LI->second.size(); j != ee; ++j) { |
| 452 | unsigned NewReg = LI->second[j]; |
| 453 | MachineInstr *DefMI = MRI->getVRegDef(NewReg); |
| 454 | SSAUpdate.AddAvailableValue(DefMI->getParent(), NewReg); |
| 455 | } |
| 456 | |
| 457 | // Rewrite uses that are outside of the original def's block. |
| 458 | MachineRegisterInfo::use_iterator UI = MRI->use_begin(VReg); |
| 459 | while (UI != MRI->use_end()) { |
| 460 | MachineOperand &UseMO = UI.getOperand(); |
| 461 | MachineInstr *UseMI = &*UI; |
| 462 | ++UI; |
| 463 | if (UseMI->getParent() != DefBB) |
| 464 | SSAUpdate.RewriteUse(UseMO); |
| 465 | } |
| 466 | } |
| 467 | |
| 468 | SSAUpdateVRs.clear(); |
| 469 | SSAUpdateVals.clear(); |
| 470 | } |
| 471 | |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 472 | return Changed; |
| 473 | } |
| 474 | |
| 475 | /// RemoveDeadBlock - Remove the specified dead machine basic block from the |
| 476 | /// function, updating the CFG. |
Bob Wilson | 2d521e5 | 2009-11-26 21:38:41 +0000 | [diff] [blame] | 477 | void TailDuplicatePass::RemoveDeadBlock(MachineBasicBlock *MBB) { |
Bob Wilson | 15acadd | 2009-11-26 00:32:21 +0000 | [diff] [blame] | 478 | assert(MBB->pred_empty() && "MBB must be dead!"); |
| 479 | DEBUG(errs() << "\nRemoving MBB: " << *MBB); |
| 480 | |
| 481 | // Remove all successors. |
| 482 | while (!MBB->succ_empty()) |
| 483 | MBB->removeSuccessor(MBB->succ_end()-1); |
| 484 | |
| 485 | // If there are any labels in the basic block, unregister them from |
| 486 | // MachineModuleInfo. |
| 487 | if (MMI && !MBB->empty()) { |
| 488 | for (MachineBasicBlock::iterator I = MBB->begin(), E = MBB->end(); |
| 489 | I != E; ++I) { |
| 490 | if (I->isLabel()) |
| 491 | // The label ID # is always operand #0, an immediate. |
| 492 | MMI->InvalidateLabel(I->getOperand(0).getImm()); |
| 493 | } |
| 494 | } |
| 495 | |
| 496 | // Remove the block. |
| 497 | MBB->eraseFromParent(); |
| 498 | } |
| 499 | |