Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 1 | //===-- MachineLICM.cpp - Machine Loop Invariant Code Motion Pass ---------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
Chris Lattner | 4ee451d | 2007-12-29 20:36:04 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This pass performs loop invariant code motion on machine instructions. We |
| 11 | // attempt to remove as much code from the body of a loop as possible. |
| 12 | // |
Dan Gohman | c475c36 | 2009-01-15 22:01:38 +0000 | [diff] [blame] | 13 | // This pass does not attempt to throttle itself to limit register pressure. |
| 14 | // The register allocation phases are expected to perform rematerialization |
| 15 | // to recover when register pressure is high. |
| 16 | // |
| 17 | // This pass is not intended to be a replacement or a complete alternative |
| 18 | // for the LLVM-IR-level LICM pass. It is only designed to hoist simple |
| 19 | // constructs that are not exposed before lowering and instruction selection. |
| 20 | // |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 21 | //===----------------------------------------------------------------------===// |
| 22 | |
| 23 | #define DEBUG_TYPE "machine-licm" |
Chris Lattner | ac69582 | 2008-01-04 06:41:45 +0000 | [diff] [blame] | 24 | #include "llvm/CodeGen/Passes.h" |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 25 | #include "llvm/CodeGen/MachineDominators.h" |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 26 | #include "llvm/CodeGen/MachineLoopInfo.h" |
Bill Wendling | 9258cd3 | 2008-01-02 19:32:43 +0000 | [diff] [blame] | 27 | #include "llvm/CodeGen/MachineRegisterInfo.h" |
Dan Gohman | 6f0d024 | 2008-02-10 18:45:23 +0000 | [diff] [blame] | 28 | #include "llvm/Target/TargetRegisterInfo.h" |
Bill Wendling | efe2be7 | 2007-12-11 23:27:51 +0000 | [diff] [blame] | 29 | #include "llvm/Target/TargetInstrInfo.h" |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 30 | #include "llvm/Target/TargetMachine.h" |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 31 | #include "llvm/ADT/DenseMap.h" |
Chris Lattner | ac69582 | 2008-01-04 06:41:45 +0000 | [diff] [blame] | 32 | #include "llvm/ADT/Statistic.h" |
| 33 | #include "llvm/Support/CommandLine.h" |
| 34 | #include "llvm/Support/Compiler.h" |
| 35 | #include "llvm/Support/Debug.h" |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 36 | |
| 37 | using namespace llvm; |
| 38 | |
Bill Wendling | 041b3f8 | 2007-12-08 23:58:46 +0000 | [diff] [blame] | 39 | STATISTIC(NumHoisted, "Number of machine instructions hoisted out of loops"); |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 40 | STATISTIC(NumCSEed, "Number of hoisted machine instructions CSEed"); |
Bill Wendling | b48519c | 2007-12-08 01:47:01 +0000 | [diff] [blame] | 41 | |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 42 | namespace { |
| 43 | class VISIBILITY_HIDDEN MachineLICM : public MachineFunctionPass { |
Bill Wendling | 9258cd3 | 2008-01-02 19:32:43 +0000 | [diff] [blame] | 44 | const TargetMachine *TM; |
Bill Wendling | efe2be7 | 2007-12-11 23:27:51 +0000 | [diff] [blame] | 45 | const TargetInstrInfo *TII; |
Bill Wendling | 12ebf14 | 2007-12-11 19:40:06 +0000 | [diff] [blame] | 46 | |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 47 | // Various analyses that we use... |
Bill Wendling | e4fc1cc | 2008-05-12 19:38:32 +0000 | [diff] [blame] | 48 | MachineLoopInfo *LI; // Current MachineLoopInfo |
| 49 | MachineDominatorTree *DT; // Machine dominator tree for the cur loop |
Bill Wendling | 9258cd3 | 2008-01-02 19:32:43 +0000 | [diff] [blame] | 50 | MachineRegisterInfo *RegInfo; // Machine register information |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 51 | |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 52 | // State that is updated as we process loops |
Bill Wendling | e4fc1cc | 2008-05-12 19:38:32 +0000 | [diff] [blame] | 53 | bool Changed; // True if a loop is changed. |
| 54 | MachineLoop *CurLoop; // The current loop we are working on. |
Dan Gohman | c475c36 | 2009-01-15 22:01:38 +0000 | [diff] [blame] | 55 | MachineBasicBlock *CurPreheader; // The preheader for CurLoop. |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 56 | |
| 57 | // For each BB and opcode pair, keep a list of hoisted instructions. |
| 58 | DenseMap<std::pair<unsigned, unsigned>, |
| 59 | std::vector<const MachineInstr*> > CSEMap; |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 60 | public: |
| 61 | static char ID; // Pass identification, replacement for typeid |
Dan Gohman | ae73dc1 | 2008-09-04 17:05:41 +0000 | [diff] [blame] | 62 | MachineLICM() : MachineFunctionPass(&ID) {} |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 63 | |
| 64 | virtual bool runOnMachineFunction(MachineFunction &MF); |
| 65 | |
Dan Gohman | 7224170 | 2008-12-18 01:37:56 +0000 | [diff] [blame] | 66 | const char *getPassName() const { return "Machine Instruction LICM"; } |
| 67 | |
Bill Wendling | 074223a | 2008-03-10 08:13:01 +0000 | [diff] [blame] | 68 | // FIXME: Loop preheaders? |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 69 | virtual void getAnalysisUsage(AnalysisUsage &AU) const { |
| 70 | AU.setPreservesCFG(); |
| 71 | AU.addRequired<MachineLoopInfo>(); |
| 72 | AU.addRequired<MachineDominatorTree>(); |
Bill Wendling | d5da704 | 2008-01-04 08:48:49 +0000 | [diff] [blame] | 73 | AU.addPreserved<MachineLoopInfo>(); |
| 74 | AU.addPreserved<MachineDominatorTree>(); |
| 75 | MachineFunctionPass::getAnalysisUsage(AU); |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 76 | } |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 77 | |
| 78 | virtual void releaseMemory() { |
| 79 | CSEMap.clear(); |
| 80 | } |
| 81 | |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 82 | private: |
Bill Wendling | 041b3f8 | 2007-12-08 23:58:46 +0000 | [diff] [blame] | 83 | /// IsLoopInvariantInst - Returns true if the instruction is loop |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 84 | /// invariant. I.e., all virtual register operands are defined outside of |
| 85 | /// the loop, physical registers aren't accessed (explicitly or implicitly), |
| 86 | /// and the instruction is hoistable. |
| 87 | /// |
Bill Wendling | 041b3f8 | 2007-12-08 23:58:46 +0000 | [diff] [blame] | 88 | bool IsLoopInvariantInst(MachineInstr &I); |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 89 | |
Evan Cheng | 45e94d6 | 2009-02-04 09:19:56 +0000 | [diff] [blame] | 90 | /// IsProfitableToHoist - Return true if it is potentially profitable to |
| 91 | /// hoist the given loop invariant. |
| 92 | bool IsProfitableToHoist(MachineInstr &MI); |
| 93 | |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 94 | /// HoistRegion - Walk the specified region of the CFG (defined by all |
| 95 | /// blocks dominated by the specified block, and that are in the current |
| 96 | /// loop) in depth first order w.r.t the DominatorTree. This allows us to |
| 97 | /// visit definitions before uses, allowing us to hoist a loop body in one |
| 98 | /// pass without iteration. |
| 99 | /// |
| 100 | void HoistRegion(MachineDomTreeNode *N); |
| 101 | |
| 102 | /// Hoist - When an instruction is found to only use loop invariant operands |
| 103 | /// that is safe to hoist, this instruction is called to do the dirty work. |
| 104 | /// |
Bill Wendling | b48519c | 2007-12-08 01:47:01 +0000 | [diff] [blame] | 105 | void Hoist(MachineInstr &MI); |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 106 | }; |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 107 | } // end anonymous namespace |
| 108 | |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 109 | char MachineLICM::ID = 0; |
| 110 | static RegisterPass<MachineLICM> |
Bill Wendling | 8870ce9 | 2008-07-07 05:42:27 +0000 | [diff] [blame] | 111 | X("machinelicm", "Machine Loop Invariant Code Motion"); |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 112 | |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 113 | FunctionPass *llvm::createMachineLICMPass() { return new MachineLICM(); } |
| 114 | |
Dan Gohman | c475c36 | 2009-01-15 22:01:38 +0000 | [diff] [blame] | 115 | /// LoopIsOuterMostWithPreheader - Test if the given loop is the outer-most |
| 116 | /// loop that has a preheader. |
| 117 | static bool LoopIsOuterMostWithPreheader(MachineLoop *CurLoop) { |
| 118 | for (MachineLoop *L = CurLoop->getParentLoop(); L; L = L->getParentLoop()) |
| 119 | if (L->getLoopPreheader()) |
| 120 | return false; |
| 121 | return true; |
| 122 | } |
| 123 | |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 124 | /// Hoist expressions out of the specified loop. Note, alias info for inner loop |
| 125 | /// is not preserved so it is not a good idea to run LICM multiple times on one |
| 126 | /// loop. |
| 127 | /// |
| 128 | bool MachineLICM::runOnMachineFunction(MachineFunction &MF) { |
Bill Wendling | a17ad59 | 2007-12-11 22:22:22 +0000 | [diff] [blame] | 129 | DOUT << "******** Machine LICM ********\n"; |
| 130 | |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 131 | Changed = false; |
Bill Wendling | acb04ec | 2008-08-31 02:30:23 +0000 | [diff] [blame] | 132 | TM = &MF.getTarget(); |
Bill Wendling | 9258cd3 | 2008-01-02 19:32:43 +0000 | [diff] [blame] | 133 | TII = TM->getInstrInfo(); |
Bill Wendling | acb04ec | 2008-08-31 02:30:23 +0000 | [diff] [blame] | 134 | RegInfo = &MF.getRegInfo(); |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 135 | |
| 136 | // Get our Loop information... |
| 137 | LI = &getAnalysis<MachineLoopInfo>(); |
| 138 | DT = &getAnalysis<MachineDominatorTree>(); |
| 139 | |
| 140 | for (MachineLoopInfo::iterator |
| 141 | I = LI->begin(), E = LI->end(); I != E; ++I) { |
Bill Wendling | a17ad59 | 2007-12-11 22:22:22 +0000 | [diff] [blame] | 142 | CurLoop = *I; |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 143 | |
Dan Gohman | c475c36 | 2009-01-15 22:01:38 +0000 | [diff] [blame] | 144 | // Only visit outer-most preheader-sporting loops. |
| 145 | if (!LoopIsOuterMostWithPreheader(CurLoop)) |
| 146 | continue; |
| 147 | |
| 148 | // Determine the block to which to hoist instructions. If we can't find a |
| 149 | // suitable loop preheader, we can't do any hoisting. |
| 150 | // |
| 151 | // FIXME: We are only hoisting if the basic block coming into this loop |
| 152 | // has only one successor. This isn't the case in general because we haven't |
| 153 | // broken critical edges or added preheaders. |
| 154 | CurPreheader = CurLoop->getLoopPreheader(); |
| 155 | if (!CurPreheader) |
| 156 | continue; |
| 157 | |
| 158 | HoistRegion(DT->getNode(CurLoop->getHeader())); |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 159 | } |
| 160 | |
| 161 | return Changed; |
| 162 | } |
| 163 | |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 164 | /// HoistRegion - Walk the specified region of the CFG (defined by all blocks |
| 165 | /// dominated by the specified block, and that are in the current loop) in depth |
| 166 | /// first order w.r.t the DominatorTree. This allows us to visit definitions |
| 167 | /// before uses, allowing us to hoist a loop body in one pass without iteration. |
| 168 | /// |
| 169 | void MachineLICM::HoistRegion(MachineDomTreeNode *N) { |
| 170 | assert(N != 0 && "Null dominator tree node?"); |
| 171 | MachineBasicBlock *BB = N->getBlock(); |
| 172 | |
| 173 | // If this subregion is not in the top level loop at all, exit. |
| 174 | if (!CurLoop->contains(BB)) return; |
| 175 | |
Dan Gohman | c475c36 | 2009-01-15 22:01:38 +0000 | [diff] [blame] | 176 | for (MachineBasicBlock::iterator |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 177 | MII = BB->begin(), E = BB->end(); MII != E; ) { |
| 178 | MachineBasicBlock::iterator NextMII = MII; ++NextMII; |
| 179 | MachineInstr &MI = *MII; |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 180 | |
Dan Gohman | c475c36 | 2009-01-15 22:01:38 +0000 | [diff] [blame] | 181 | Hoist(MI); |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 182 | |
| 183 | MII = NextMII; |
Dan Gohman | c475c36 | 2009-01-15 22:01:38 +0000 | [diff] [blame] | 184 | } |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 185 | |
| 186 | const std::vector<MachineDomTreeNode*> &Children = N->getChildren(); |
| 187 | |
| 188 | for (unsigned I = 0, E = Children.size(); I != E; ++I) |
| 189 | HoistRegion(Children[I]); |
| 190 | } |
| 191 | |
Bill Wendling | 041b3f8 | 2007-12-08 23:58:46 +0000 | [diff] [blame] | 192 | /// IsLoopInvariantInst - Returns true if the instruction is loop |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 193 | /// invariant. I.e., all virtual register operands are defined outside of the |
Bill Wendling | 60ff1a3 | 2007-12-20 01:08:10 +0000 | [diff] [blame] | 194 | /// loop, physical registers aren't accessed explicitly, and there are no side |
| 195 | /// effects that aren't captured by the operands or other flags. |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 196 | /// |
Bill Wendling | 041b3f8 | 2007-12-08 23:58:46 +0000 | [diff] [blame] | 197 | bool MachineLICM::IsLoopInvariantInst(MachineInstr &I) { |
Chris Lattner | a22edc8 | 2008-01-10 23:08:24 +0000 | [diff] [blame] | 198 | const TargetInstrDesc &TID = I.getDesc(); |
| 199 | |
| 200 | // Ignore stuff that we obviously can't hoist. |
Dan Gohman | 237dee1 | 2008-12-23 17:28:50 +0000 | [diff] [blame] | 201 | if (TID.mayStore() || TID.isCall() || TID.isTerminator() || |
Chris Lattner | a22edc8 | 2008-01-10 23:08:24 +0000 | [diff] [blame] | 202 | TID.hasUnmodeledSideEffects()) |
| 203 | return false; |
Evan Cheng | 9b61f33 | 2009-02-04 07:17:49 +0000 | [diff] [blame] | 204 | |
Chris Lattner | a22edc8 | 2008-01-10 23:08:24 +0000 | [diff] [blame] | 205 | if (TID.mayLoad()) { |
Bill Wendling | e4fc1cc | 2008-05-12 19:38:32 +0000 | [diff] [blame] | 206 | // Okay, this instruction does a load. As a refinement, we allow the target |
| 207 | // to decide whether the loaded value is actually a constant. If so, we can |
| 208 | // actually use it as a load. |
Evan Cheng | 45e94d6 | 2009-02-04 09:19:56 +0000 | [diff] [blame] | 209 | if (!TII->isInvariantLoad(&I)) |
Chris Lattner | a22edc8 | 2008-01-10 23:08:24 +0000 | [diff] [blame] | 210 | // FIXME: we should be able to sink loads with no other side effects if |
| 211 | // there is nothing that can change memory from here until the end of |
Bill Wendling | e4fc1cc | 2008-05-12 19:38:32 +0000 | [diff] [blame] | 212 | // block. This is a trivial form of alias analysis. |
Chris Lattner | a22edc8 | 2008-01-10 23:08:24 +0000 | [diff] [blame] | 213 | return false; |
Chris Lattner | a22edc8 | 2008-01-10 23:08:24 +0000 | [diff] [blame] | 214 | } |
Bill Wendling | 074223a | 2008-03-10 08:13:01 +0000 | [diff] [blame] | 215 | |
Bill Wendling | 280f456 | 2007-12-18 21:38:04 +0000 | [diff] [blame] | 216 | DEBUG({ |
| 217 | DOUT << "--- Checking if we can hoist " << I; |
Chris Lattner | 749c6f6 | 2008-01-07 07:27:27 +0000 | [diff] [blame] | 218 | if (I.getDesc().getImplicitUses()) { |
Bill Wendling | 280f456 | 2007-12-18 21:38:04 +0000 | [diff] [blame] | 219 | DOUT << " * Instruction has implicit uses:\n"; |
| 220 | |
Dan Gohman | 6f0d024 | 2008-02-10 18:45:23 +0000 | [diff] [blame] | 221 | const TargetRegisterInfo *TRI = TM->getRegisterInfo(); |
Chris Lattner | 749c6f6 | 2008-01-07 07:27:27 +0000 | [diff] [blame] | 222 | for (const unsigned *ImpUses = I.getDesc().getImplicitUses(); |
Chris Lattner | 6924430 | 2008-01-07 01:56:04 +0000 | [diff] [blame] | 223 | *ImpUses; ++ImpUses) |
Bill Wendling | e6d088a | 2008-02-26 21:47:57 +0000 | [diff] [blame] | 224 | DOUT << " -> " << TRI->getName(*ImpUses) << "\n"; |
Bill Wendling | 280f456 | 2007-12-18 21:38:04 +0000 | [diff] [blame] | 225 | } |
| 226 | |
Chris Lattner | 749c6f6 | 2008-01-07 07:27:27 +0000 | [diff] [blame] | 227 | if (I.getDesc().getImplicitDefs()) { |
Bill Wendling | 280f456 | 2007-12-18 21:38:04 +0000 | [diff] [blame] | 228 | DOUT << " * Instruction has implicit defines:\n"; |
| 229 | |
Dan Gohman | 6f0d024 | 2008-02-10 18:45:23 +0000 | [diff] [blame] | 230 | const TargetRegisterInfo *TRI = TM->getRegisterInfo(); |
Chris Lattner | 749c6f6 | 2008-01-07 07:27:27 +0000 | [diff] [blame] | 231 | for (const unsigned *ImpDefs = I.getDesc().getImplicitDefs(); |
Chris Lattner | 6924430 | 2008-01-07 01:56:04 +0000 | [diff] [blame] | 232 | *ImpDefs; ++ImpDefs) |
Bill Wendling | e6d088a | 2008-02-26 21:47:57 +0000 | [diff] [blame] | 233 | DOUT << " -> " << TRI->getName(*ImpDefs) << "\n"; |
Bill Wendling | 280f456 | 2007-12-18 21:38:04 +0000 | [diff] [blame] | 234 | } |
Bill Wendling | 280f456 | 2007-12-18 21:38:04 +0000 | [diff] [blame] | 235 | }); |
| 236 | |
Bill Wendling | d3361e9 | 2008-08-18 00:33:49 +0000 | [diff] [blame] | 237 | if (I.getDesc().getImplicitDefs() || I.getDesc().getImplicitUses()) { |
| 238 | DOUT << "Cannot hoist with implicit defines or uses\n"; |
| 239 | return false; |
| 240 | } |
| 241 | |
Bill Wendling | e4fc1cc | 2008-05-12 19:38:32 +0000 | [diff] [blame] | 242 | // The instruction is loop invariant if all of its operands are. |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 243 | for (unsigned i = 0, e = I.getNumOperands(); i != e; ++i) { |
| 244 | const MachineOperand &MO = I.getOperand(i); |
| 245 | |
Dan Gohman | d735b80 | 2008-10-03 15:45:36 +0000 | [diff] [blame] | 246 | if (!MO.isReg()) |
Bill Wendling | fb018d0 | 2008-08-20 20:32:05 +0000 | [diff] [blame] | 247 | continue; |
| 248 | |
Dan Gohman | c475c36 | 2009-01-15 22:01:38 +0000 | [diff] [blame] | 249 | unsigned Reg = MO.getReg(); |
| 250 | if (Reg == 0) continue; |
| 251 | |
| 252 | // Don't hoist an instruction that uses or defines a physical register. |
| 253 | if (TargetRegisterInfo::isPhysicalRegister(Reg)) |
Bill Wendling | fb018d0 | 2008-08-20 20:32:05 +0000 | [diff] [blame] | 254 | return false; |
| 255 | |
| 256 | if (!MO.isUse()) |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 257 | continue; |
| 258 | |
Bill Wendling | e4fc1cc | 2008-05-12 19:38:32 +0000 | [diff] [blame] | 259 | assert(RegInfo->getVRegDef(Reg) && |
| 260 | "Machine instr not mapped for this vreg?!"); |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 261 | |
| 262 | // If the loop contains the definition of an operand, then the instruction |
| 263 | // isn't loop invariant. |
Bill Wendling | 9258cd3 | 2008-01-02 19:32:43 +0000 | [diff] [blame] | 264 | if (CurLoop->contains(RegInfo->getVRegDef(Reg)->getParent())) |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 265 | return false; |
| 266 | } |
| 267 | |
| 268 | // If we got this far, the instruction is loop invariant! |
| 269 | return true; |
| 270 | } |
| 271 | |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 272 | |
| 273 | /// HasPHIUses - Return true if the specified register has any PHI use. |
| 274 | static bool HasPHIUses(unsigned Reg, MachineRegisterInfo *RegInfo) { |
Evan Cheng | 45e94d6 | 2009-02-04 09:19:56 +0000 | [diff] [blame] | 275 | for (MachineRegisterInfo::use_iterator UI = RegInfo->use_begin(Reg), |
| 276 | UE = RegInfo->use_end(); UI != UE; ++UI) { |
| 277 | MachineInstr *UseMI = &*UI; |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 278 | if (UseMI->getOpcode() == TargetInstrInfo::PHI) |
| 279 | return true; |
Evan Cheng | 45e94d6 | 2009-02-04 09:19:56 +0000 | [diff] [blame] | 280 | } |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 281 | return false; |
Evan Cheng | 45e94d6 | 2009-02-04 09:19:56 +0000 | [diff] [blame] | 282 | } |
| 283 | |
| 284 | /// IsProfitableToHoist - Return true if it is potentially profitable to hoist |
| 285 | /// the given loop invariant. |
| 286 | bool MachineLICM::IsProfitableToHoist(MachineInstr &MI) { |
| 287 | const TargetInstrDesc &TID = MI.getDesc(); |
| 288 | |
Evan Cheng | 45e94d6 | 2009-02-04 09:19:56 +0000 | [diff] [blame] | 289 | // FIXME: For now, only hoist re-materilizable instructions. LICM will |
| 290 | // increase register pressure. We want to make sure it doesn't increase |
| 291 | // spilling. |
Evan Cheng | 5caa883 | 2009-02-04 09:21:58 +0000 | [diff] [blame] | 292 | if (!TID.mayLoad() && (!TID.isRematerializable() || |
| 293 | !TII->isTriviallyReMaterializable(&MI))) |
Evan Cheng | 45e94d6 | 2009-02-04 09:19:56 +0000 | [diff] [blame] | 294 | return false; |
| 295 | |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 296 | // If result(s) of this instruction is used by PHIs, then don't hoist it. |
| 297 | // The presence of joins makes it difficult for current register allocator |
| 298 | // implementation to perform remat. |
Evan Cheng | 45e94d6 | 2009-02-04 09:19:56 +0000 | [diff] [blame] | 299 | for (unsigned i = 0, e = MI.getNumOperands(); i != e; ++i) { |
| 300 | const MachineOperand &MO = MI.getOperand(i); |
| 301 | if (!MO.isReg() || !MO.isDef()) |
| 302 | continue; |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 303 | if (HasPHIUses(MO.getReg(), RegInfo)) |
| 304 | return false; |
Evan Cheng | 45e94d6 | 2009-02-04 09:19:56 +0000 | [diff] [blame] | 305 | } |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 306 | |
| 307 | return true; |
| 308 | } |
| 309 | |
| 310 | static const MachineInstr *LookForDuplicate(const MachineInstr *MI, |
| 311 | std::vector<const MachineInstr*> &PrevMIs) { |
| 312 | unsigned NumOps = MI->getNumOperands(); |
| 313 | for (unsigned i = 0, e = PrevMIs.size(); i != e; ++i) { |
| 314 | const MachineInstr *PrevMI = PrevMIs[i]; |
| 315 | unsigned NumOps2 = PrevMI->getNumOperands(); |
| 316 | if (NumOps != NumOps2) |
| 317 | continue; |
| 318 | bool IsSame = true; |
| 319 | for (unsigned j = 0; j != NumOps; ++j) { |
| 320 | const MachineOperand &MO = MI->getOperand(j); |
| 321 | if (MO.isReg() && MO.isDef()) |
| 322 | continue; |
| 323 | if (!MO.isIdenticalTo(PrevMI->getOperand(j))) { |
| 324 | IsSame = false; |
| 325 | break; |
| 326 | } |
| 327 | } |
| 328 | if (IsSame) |
| 329 | return PrevMI; |
| 330 | } |
| 331 | return 0; |
Evan Cheng | 45e94d6 | 2009-02-04 09:19:56 +0000 | [diff] [blame] | 332 | } |
| 333 | |
Bill Wendling | e4fc1cc | 2008-05-12 19:38:32 +0000 | [diff] [blame] | 334 | /// Hoist - When an instruction is found to use only loop invariant operands |
| 335 | /// that are safe to hoist, this instruction is called to do the dirty work. |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 336 | /// |
Bill Wendling | b48519c | 2007-12-08 01:47:01 +0000 | [diff] [blame] | 337 | void MachineLICM::Hoist(MachineInstr &MI) { |
Bill Wendling | 041b3f8 | 2007-12-08 23:58:46 +0000 | [diff] [blame] | 338 | if (!IsLoopInvariantInst(MI)) return; |
Evan Cheng | 45e94d6 | 2009-02-04 09:19:56 +0000 | [diff] [blame] | 339 | if (!IsProfitableToHoist(MI)) return; |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 340 | |
Dan Gohman | c475c36 | 2009-01-15 22:01:38 +0000 | [diff] [blame] | 341 | // Now move the instructions to the predecessor, inserting it before any |
| 342 | // terminator instructions. |
| 343 | DEBUG({ |
| 344 | DOUT << "Hoisting " << MI; |
| 345 | if (CurPreheader->getBasicBlock()) |
| 346 | DOUT << " to MachineBasicBlock " |
| 347 | << CurPreheader->getBasicBlock()->getName(); |
| 348 | if (MI.getParent()->getBasicBlock()) |
| 349 | DOUT << " from MachineBasicBlock " |
| 350 | << MI.getParent()->getBasicBlock()->getName(); |
| 351 | DOUT << "\n"; |
| 352 | }); |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 353 | |
Evan Cheng | af6949d | 2009-02-05 08:45:46 +0000 | [diff] [blame] | 354 | // Look for opportunity to CSE the hoisted instruction. |
| 355 | std::pair<unsigned, unsigned> BBOpcPair = |
| 356 | std::make_pair(CurPreheader->getNumber(), MI.getOpcode()); |
| 357 | DenseMap<std::pair<unsigned, unsigned>, |
| 358 | std::vector<const MachineInstr*> >::iterator CI = CSEMap.find(BBOpcPair); |
| 359 | bool DoneCSE = false; |
| 360 | if (CI != CSEMap.end()) { |
| 361 | const MachineInstr *Dup = LookForDuplicate(&MI, CI->second); |
| 362 | if (Dup) { |
| 363 | DOUT << "CSEing " << MI; |
| 364 | DOUT << " with " << *Dup; |
| 365 | for (unsigned i = 0, e = MI.getNumOperands(); i != e; ++i) { |
| 366 | const MachineOperand &MO = MI.getOperand(i); |
| 367 | if (MO.isReg() && MO.isDef()) |
| 368 | RegInfo->replaceRegWith(MO.getReg(), Dup->getOperand(i).getReg()); |
| 369 | } |
| 370 | MI.eraseFromParent(); |
| 371 | DoneCSE = true; |
| 372 | ++NumCSEed; |
| 373 | } |
| 374 | } |
| 375 | |
| 376 | // Otherwise, splice the instruction to the preheader. |
| 377 | if (!DoneCSE) { |
| 378 | CurPreheader->splice(CurPreheader->getFirstTerminator(), |
| 379 | MI.getParent(), &MI); |
| 380 | // Add to the CSE map. |
| 381 | if (CI != CSEMap.end()) |
| 382 | CI->second.push_back(&MI); |
| 383 | else { |
| 384 | std::vector<const MachineInstr*> CSEMIs; |
| 385 | CSEMIs.push_back(&MI); |
| 386 | CSEMap.insert(std::make_pair(BBOpcPair, CSEMIs)); |
| 387 | } |
| 388 | } |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 389 | |
Dan Gohman | c475c36 | 2009-01-15 22:01:38 +0000 | [diff] [blame] | 390 | ++NumHoisted; |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 391 | Changed = true; |
Bill Wendling | 0f940c9 | 2007-12-07 21:42:31 +0000 | [diff] [blame] | 392 | } |