blob: fc36bd5999bee1bad40ff666d936f1855a618f68 [file] [log] [blame]
Eugene Zelenko900b6332017-08-29 22:32:07 +00001//===- InlineSpiller.cpp - Insert spills and restores inline --------------===//
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// The inline spiller modifies the machine function directly instead of
11// inserting spills and restores in VirtRegMap.
12//
13//===----------------------------------------------------------------------===//
14
Eugene Zelenko900b6332017-08-29 22:32:07 +000015#include "LiveRangeCalc.h"
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +000016#include "Spiller.h"
Wei Mi8c4136b2016-05-11 22:37:43 +000017#include "SplitKit.h"
Eugene Zelenko900b6332017-08-29 22:32:07 +000018#include "llvm/ADT/ArrayRef.h"
19#include "llvm/ADT/DenseMap.h"
Wei Mi9a16d652016-04-13 03:08:27 +000020#include "llvm/ADT/MapVector.h"
Eugene Zelenko900b6332017-08-29 22:32:07 +000021#include "llvm/ADT/None.h"
22#include "llvm/ADT/STLExtras.h"
Benjamin Kramerbc6666b2013-05-23 15:42:57 +000023#include "llvm/ADT/SetVector.h"
Eugene Zelenko900b6332017-08-29 22:32:07 +000024#include "llvm/ADT/SmallPtrSet.h"
25#include "llvm/ADT/SmallVector.h"
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +000026#include "llvm/ADT/Statistic.h"
Jakob Stoklund Olesen868dd4e2010-11-10 23:55:56 +000027#include "llvm/Analysis/AliasAnalysis.h"
Eugene Zelenko900b6332017-08-29 22:32:07 +000028#include "llvm/CodeGen/LiveInterval.h"
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +000029#include "llvm/CodeGen/LiveIntervalAnalysis.h"
Pete Cooper3ca96f92012-04-02 22:44:18 +000030#include "llvm/CodeGen/LiveRangeEdit.h"
Jakob Stoklund Olesene2c340c2010-10-26 00:11:35 +000031#include "llvm/CodeGen/LiveStackAnalysis.h"
Eugene Zelenko900b6332017-08-29 22:32:07 +000032#include "llvm/CodeGen/MachineBasicBlock.h"
Benjamin Kramere2a1d892013-06-17 19:00:36 +000033#include "llvm/CodeGen/MachineBlockFrequencyInfo.h"
Chandler Carruth8a8cd2b2014-01-07 11:48:04 +000034#include "llvm/CodeGen/MachineDominators.h"
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +000035#include "llvm/CodeGen/MachineFunction.h"
Eugene Zelenko900b6332017-08-29 22:32:07 +000036#include "llvm/CodeGen/MachineFunctionPass.h"
37#include "llvm/CodeGen/MachineInstr.h"
David Blaikie0252265b2013-06-16 20:34:15 +000038#include "llvm/CodeGen/MachineInstrBuilder.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000039#include "llvm/CodeGen/MachineInstrBundle.h"
Jakob Stoklund Olesena0d5ec12011-03-15 21:13:25 +000040#include "llvm/CodeGen/MachineLoopInfo.h"
Eugene Zelenko900b6332017-08-29 22:32:07 +000041#include "llvm/CodeGen/MachineOperand.h"
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +000042#include "llvm/CodeGen/MachineRegisterInfo.h"
Eugene Zelenko900b6332017-08-29 22:32:07 +000043#include "llvm/CodeGen/SlotIndexes.h"
Jakob Stoklund Olesen26c9d702012-11-28 19:13:06 +000044#include "llvm/CodeGen/VirtRegMap.h"
Eugene Zelenko900b6332017-08-29 22:32:07 +000045#include "llvm/Support/BlockFrequency.h"
46#include "llvm/Support/BranchProbability.h"
Jakob Stoklund Olesenbceb9e52011-09-15 21:06:00 +000047#include "llvm/Support/CommandLine.h"
Eugene Zelenko900b6332017-08-29 22:32:07 +000048#include "llvm/Support/Compiler.h"
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +000049#include "llvm/Support/Debug.h"
Eugene Zelenko900b6332017-08-29 22:32:07 +000050#include "llvm/Support/ErrorHandling.h"
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +000051#include "llvm/Support/raw_ostream.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000052#include "llvm/Target/TargetInstrInfo.h"
Eugene Zelenko900b6332017-08-29 22:32:07 +000053#include "llvm/Target/TargetOpcodes.h"
54#include "llvm/Target/TargetRegisterInfo.h"
55#include "llvm/Target/TargetSubtargetInfo.h"
56#include <cassert>
57#include <iterator>
58#include <tuple>
59#include <utility>
60#include <vector>
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +000061
62using namespace llvm;
63
Chandler Carruth1b9dde02014-04-22 02:02:50 +000064#define DEBUG_TYPE "regalloc"
65
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +000066STATISTIC(NumSpilledRanges, "Number of spilled live ranges");
Jakob Stoklund Olesen37eb6962011-09-15 17:54:28 +000067STATISTIC(NumSnippets, "Number of spilled snippets");
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +000068STATISTIC(NumSpills, "Number of spills inserted");
Jakob Stoklund Olesen37eb6962011-09-15 17:54:28 +000069STATISTIC(NumSpillsRemoved, "Number of spills removed");
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +000070STATISTIC(NumReloads, "Number of reloads inserted");
Jakob Stoklund Olesen37eb6962011-09-15 17:54:28 +000071STATISTIC(NumReloadsRemoved, "Number of reloads removed");
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +000072STATISTIC(NumFolded, "Number of folded stack accesses");
73STATISTIC(NumFoldedLoads, "Number of folded loads");
74STATISTIC(NumRemats, "Number of rematerialized defs for spilling");
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +000075
Jakob Stoklund Olesenbceb9e52011-09-15 21:06:00 +000076static cl::opt<bool> DisableHoisting("disable-spill-hoist", cl::Hidden,
77 cl::desc("Disable inline spill hoisting"));
78
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +000079namespace {
Eugene Zelenko900b6332017-08-29 22:32:07 +000080
Wei Mi963f2df2016-04-15 23:16:44 +000081class HoistSpillHelper : private LiveRangeEdit::Delegate {
82 MachineFunction &MF;
Wei Mi9a16d652016-04-13 03:08:27 +000083 LiveIntervals &LIS;
84 LiveStacks &LSS;
85 AliasAnalysis *AA;
86 MachineDominatorTree &MDT;
87 MachineLoopInfo &Loops;
88 VirtRegMap &VRM;
Wei Mi9a16d652016-04-13 03:08:27 +000089 MachineRegisterInfo &MRI;
90 const TargetInstrInfo &TII;
91 const TargetRegisterInfo &TRI;
92 const MachineBlockFrequencyInfo &MBFI;
93
Wei Mi8c4136b2016-05-11 22:37:43 +000094 InsertPointAnalysis IPA;
95
Wei Mi9a16d652016-04-13 03:08:27 +000096 // Map from StackSlot to its original register.
97 DenseMap<int, unsigned> StackSlotToReg;
Eugene Zelenko900b6332017-08-29 22:32:07 +000098
Wei Mi9a16d652016-04-13 03:08:27 +000099 // Map from pair of (StackSlot and Original VNI) to a set of spills which
100 // have the same stackslot and have equal values defined by Original VNI.
101 // These spills are mergeable and are hoist candiates.
Eugene Zelenko900b6332017-08-29 22:32:07 +0000102 using MergeableSpillsMap =
103 MapVector<std::pair<int, VNInfo *>, SmallPtrSet<MachineInstr *, 16>>;
Wei Mi9a16d652016-04-13 03:08:27 +0000104 MergeableSpillsMap MergeableSpills;
105
106 /// This is the map from original register to a set containing all its
107 /// siblings. To hoist a spill to another BB, we need to find out a live
108 /// sibling there and use it as the source of the new spill.
109 DenseMap<unsigned, SmallSetVector<unsigned, 16>> Virt2SiblingsMap;
110
111 bool isSpillCandBB(unsigned OrigReg, VNInfo &OrigVNI, MachineBasicBlock &BB,
112 unsigned &LiveReg);
113
114 void rmRedundantSpills(
115 SmallPtrSet<MachineInstr *, 16> &Spills,
116 SmallVectorImpl<MachineInstr *> &SpillsToRm,
117 DenseMap<MachineDomTreeNode *, MachineInstr *> &SpillBBToSpill);
118
119 void getVisitOrders(
120 MachineBasicBlock *Root, SmallPtrSet<MachineInstr *, 16> &Spills,
121 SmallVectorImpl<MachineDomTreeNode *> &Orders,
122 SmallVectorImpl<MachineInstr *> &SpillsToRm,
123 DenseMap<MachineDomTreeNode *, unsigned> &SpillsToKeep,
124 DenseMap<MachineDomTreeNode *, MachineInstr *> &SpillBBToSpill);
125
126 void runHoistSpills(unsigned OrigReg, VNInfo &OrigVNI,
127 SmallPtrSet<MachineInstr *, 16> &Spills,
128 SmallVectorImpl<MachineInstr *> &SpillsToRm,
129 DenseMap<MachineBasicBlock *, unsigned> &SpillsToIns);
130
131public:
132 HoistSpillHelper(MachineFunctionPass &pass, MachineFunction &mf,
133 VirtRegMap &vrm)
Wei Mi963f2df2016-04-15 23:16:44 +0000134 : MF(mf), LIS(pass.getAnalysis<LiveIntervals>()),
Wei Mi9a16d652016-04-13 03:08:27 +0000135 LSS(pass.getAnalysis<LiveStacks>()),
136 AA(&pass.getAnalysis<AAResultsWrapperPass>().getAAResults()),
137 MDT(pass.getAnalysis<MachineDominatorTree>()),
138 Loops(pass.getAnalysis<MachineLoopInfo>()), VRM(vrm),
Eugene Zelenko900b6332017-08-29 22:32:07 +0000139 MRI(mf.getRegInfo()), TII(*mf.getSubtarget().getInstrInfo()),
Wei Mi9a16d652016-04-13 03:08:27 +0000140 TRI(*mf.getSubtarget().getRegisterInfo()),
Wei Mi8c4136b2016-05-11 22:37:43 +0000141 MBFI(pass.getAnalysis<MachineBlockFrequencyInfo>()),
142 IPA(LIS, mf.getNumBlockIDs()) {}
Wei Mi9a16d652016-04-13 03:08:27 +0000143
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +0000144 void addToMergeableSpills(MachineInstr &Spill, int StackSlot,
Wei Mi9a16d652016-04-13 03:08:27 +0000145 unsigned Original);
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +0000146 bool rmFromMergeableSpills(MachineInstr &Spill, int StackSlot);
Wei Mi963f2df2016-04-15 23:16:44 +0000147 void hoistAllSpills();
148 void LRE_DidCloneVirtReg(unsigned, unsigned) override;
Wei Mi9a16d652016-04-13 03:08:27 +0000149};
150
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000151class InlineSpiller : public Spiller {
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000152 MachineFunction &MF;
153 LiveIntervals &LIS;
154 LiveStacks &LSS;
155 AliasAnalysis *AA;
Jakob Stoklund Olesena0d5ec12011-03-15 21:13:25 +0000156 MachineDominatorTree &MDT;
157 MachineLoopInfo &Loops;
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000158 VirtRegMap &VRM;
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000159 MachineRegisterInfo &MRI;
160 const TargetInstrInfo &TII;
161 const TargetRegisterInfo &TRI;
Benjamin Kramere2a1d892013-06-17 19:00:36 +0000162 const MachineBlockFrequencyInfo &MBFI;
Jakob Stoklund Olesenbde96ad2010-06-30 23:03:52 +0000163
164 // Variables that are valid during spill(), but used by multiple methods.
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000165 LiveRangeEdit *Edit;
Jakob Stoklund Olesene4663452011-03-26 22:16:41 +0000166 LiveInterval *StackInt;
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000167 int StackSlot;
Jakob Stoklund Olesena0d5ec12011-03-15 21:13:25 +0000168 unsigned Original;
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000169
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000170 // All registers to spill to StackSlot, including the main register.
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000171 SmallVector<unsigned, 8> RegsToSpill;
172
173 // All COPY instructions to/from snippets.
174 // They are ignored since both operands refer to the same stack slot.
175 SmallPtrSet<MachineInstr*, 8> SnippetCopies;
176
Jakob Stoklund Olesen2edaa2f2010-10-20 22:00:51 +0000177 // Values that failed to remat at some point.
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000178 SmallPtrSet<VNInfo*, 8> UsedValues;
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000179
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000180 // Dead defs generated during spilling.
181 SmallVector<MachineInstr*, 8> DeadDefs;
Jakob Stoklund Olesena0d5ec12011-03-15 21:13:25 +0000182
Wei Mi9a16d652016-04-13 03:08:27 +0000183 // Object records spills information and does the hoisting.
184 HoistSpillHelper HSpiller;
185
Eugene Zelenko900b6332017-08-29 22:32:07 +0000186 ~InlineSpiller() override = default;
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000187
188public:
Eric Christopherd9134482014-08-04 21:25:23 +0000189 InlineSpiller(MachineFunctionPass &pass, MachineFunction &mf, VirtRegMap &vrm)
190 : MF(mf), LIS(pass.getAnalysis<LiveIntervals>()),
191 LSS(pass.getAnalysis<LiveStacks>()),
Chandler Carruth7b560d42015-09-09 17:55:00 +0000192 AA(&pass.getAnalysis<AAResultsWrapperPass>().getAAResults()),
Eric Christopherd9134482014-08-04 21:25:23 +0000193 MDT(pass.getAnalysis<MachineDominatorTree>()),
194 Loops(pass.getAnalysis<MachineLoopInfo>()), VRM(vrm),
Eugene Zelenko900b6332017-08-29 22:32:07 +0000195 MRI(mf.getRegInfo()), TII(*mf.getSubtarget().getInstrInfo()),
Eric Christopherfc6de422014-08-05 02:39:49 +0000196 TRI(*mf.getSubtarget().getRegisterInfo()),
Wei Mi9a16d652016-04-13 03:08:27 +0000197 MBFI(pass.getAnalysis<MachineBlockFrequencyInfo>()),
198 HSpiller(pass, mf, vrm) {}
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000199
Craig Topper4584cd52014-03-07 09:26:03 +0000200 void spill(LiveRangeEdit &) override;
Wei Mi9a16d652016-04-13 03:08:27 +0000201 void postOptimization() override;
Jakob Stoklund Olesen72911e42010-10-14 23:49:52 +0000202
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000203private:
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000204 bool isSnippet(const LiveInterval &SnipLI);
205 void collectRegsToSpill();
206
David Majnemer42531262016-08-12 03:55:06 +0000207 bool isRegToSpill(unsigned Reg) { return is_contained(RegsToSpill, Reg); }
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000208
209 bool isSibling(unsigned Reg);
Wei Mi9a16d652016-04-13 03:08:27 +0000210 bool hoistSpillInsideBB(LiveInterval &SpillLI, MachineInstr &CopyMI);
Jakob Stoklund Olesen39488642011-03-20 05:44:55 +0000211 void eliminateRedundantSpills(LiveInterval &LI, VNInfo *VNI);
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000212
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000213 void markValueUsed(LiveInterval*, VNInfo*);
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000214 bool reMaterializeFor(LiveInterval &, MachineInstr &MI);
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000215 void reMaterializeAll();
216
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000217 bool coalesceStackAccess(MachineInstr *MI, unsigned Reg);
Eugene Zelenko900b6332017-08-29 22:32:07 +0000218 bool foldMemoryOperand(ArrayRef<std::pair<MachineInstr *, unsigned>>,
Craig Topperc0196b12014-04-14 00:51:57 +0000219 MachineInstr *LoadMI = nullptr);
Mark Lacey9d8103d2013-08-14 23:50:16 +0000220 void insertReload(unsigned VReg, SlotIndex, MachineBasicBlock::iterator MI);
221 void insertSpill(unsigned VReg, bool isKill, MachineBasicBlock::iterator MI);
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000222
223 void spillAroundUses(unsigned Reg);
Jakob Stoklund Olesene991f722011-03-29 21:20:19 +0000224 void spillAll();
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000225};
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000226
Eugene Zelenko900b6332017-08-29 22:32:07 +0000227} // end anonymous namespace
Lang Hamescdd90772014-11-06 19:12:38 +0000228
Eugene Zelenko900b6332017-08-29 22:32:07 +0000229Spiller::~Spiller() = default;
Lang Hamescdd90772014-11-06 19:12:38 +0000230
Eugene Zelenko900b6332017-08-29 22:32:07 +0000231void Spiller::anchor() {}
232
233Spiller *llvm::createInlineSpiller(MachineFunctionPass &pass,
234 MachineFunction &mf,
235 VirtRegMap &vrm) {
Jakob Stoklund Olesen0fef9dd2010-07-20 23:50:15 +0000236 return new InlineSpiller(pass, mf, vrm);
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000237}
Lang Hamescdd90772014-11-06 19:12:38 +0000238
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000239//===----------------------------------------------------------------------===//
240// Snippets
241//===----------------------------------------------------------------------===//
242
243// When spilling a virtual register, we also spill any snippets it is connected
244// to. The snippets are small live ranges that only have a single real use,
245// leftovers from live range splitting. Spilling them enables memory operand
246// folding or tightens the live range around the single use.
247//
248// This minimizes register pressure and maximizes the store-to-load distance for
249// spill slots which can be important in tight loops.
250
251/// isFullCopyOf - If MI is a COPY to or from Reg, return the other register,
252/// otherwise return 0.
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000253static unsigned isFullCopyOf(const MachineInstr &MI, unsigned Reg) {
254 if (!MI.isFullCopy())
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000255 return 0;
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000256 if (MI.getOperand(0).getReg() == Reg)
257 return MI.getOperand(1).getReg();
258 if (MI.getOperand(1).getReg() == Reg)
259 return MI.getOperand(0).getReg();
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000260 return 0;
261}
262
263/// isSnippet - Identify if a live interval is a snippet that should be spilled.
264/// It is assumed that SnipLI is a virtual register with the same original as
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000265/// Edit->getReg().
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000266bool InlineSpiller::isSnippet(const LiveInterval &SnipLI) {
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000267 unsigned Reg = Edit->getReg();
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000268
269 // A snippet is a tiny live range with only a single instruction using it
270 // besides copies to/from Reg or spills/fills. We accept:
271 //
272 // %snip = COPY %Reg / FILL fi#
273 // %snip = USE %snip
274 // %Reg = COPY %snip / SPILL %snip, fi#
275 //
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000276 if (SnipLI.getNumValNums() > 2 || !LIS.intervalIsInOneMBB(SnipLI))
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000277 return false;
278
Craig Topperc0196b12014-04-14 00:51:57 +0000279 MachineInstr *UseMI = nullptr;
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000280
281 // Check that all uses satisfy our criteria.
Owen Andersonabb90c92014-03-13 06:02:25 +0000282 for (MachineRegisterInfo::reg_instr_nodbg_iterator
283 RI = MRI.reg_instr_nodbg_begin(SnipLI.reg),
284 E = MRI.reg_instr_nodbg_end(); RI != E; ) {
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000285 MachineInstr &MI = *RI++;
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000286
287 // Allow copies to/from Reg.
288 if (isFullCopyOf(MI, Reg))
289 continue;
290
291 // Allow stack slot loads.
292 int FI;
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000293 if (SnipLI.reg == TII.isLoadFromStackSlot(MI, FI) && FI == StackSlot)
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000294 continue;
295
296 // Allow stack slot stores.
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000297 if (SnipLI.reg == TII.isStoreToStackSlot(MI, FI) && FI == StackSlot)
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000298 continue;
299
300 // Allow a single additional instruction.
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000301 if (UseMI && &MI != UseMI)
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000302 return false;
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000303 UseMI = &MI;
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000304 }
305 return true;
306}
307
308/// collectRegsToSpill - Collect live range snippets that only have a single
309/// real use.
310void InlineSpiller::collectRegsToSpill() {
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000311 unsigned Reg = Edit->getReg();
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000312
313 // Main register always spills.
314 RegsToSpill.assign(1, Reg);
315 SnippetCopies.clear();
316
317 // Snippets all have the same original, so there can't be any for an original
318 // register.
Jakob Stoklund Olesena0d5ec12011-03-15 21:13:25 +0000319 if (Original == Reg)
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000320 return;
321
Owen Andersonabb90c92014-03-13 06:02:25 +0000322 for (MachineRegisterInfo::reg_instr_iterator
323 RI = MRI.reg_instr_begin(Reg), E = MRI.reg_instr_end(); RI != E; ) {
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000324 MachineInstr &MI = *RI++;
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000325 unsigned SnipReg = isFullCopyOf(MI, Reg);
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000326 if (!isSibling(SnipReg))
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000327 continue;
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000328 LiveInterval &SnipLI = LIS.getInterval(SnipReg);
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000329 if (!isSnippet(SnipLI))
330 continue;
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000331 SnippetCopies.insert(&MI);
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +0000332 if (isRegToSpill(SnipReg))
333 continue;
334 RegsToSpill.push_back(SnipReg);
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000335 DEBUG(dbgs() << "\talso spill snippet " << SnipLI << '\n');
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +0000336 ++NumSnippets;
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000337 }
338}
339
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000340bool InlineSpiller::isSibling(unsigned Reg) {
341 return TargetRegisterInfo::isVirtualRegister(Reg) &&
342 VRM.getOriginal(Reg) == Original;
343}
344
Wei Mi9a16d652016-04-13 03:08:27 +0000345/// It is beneficial to spill to earlier place in the same BB in case
346/// as follows:
347/// There is an alternative def earlier in the same MBB.
348/// Hoist the spill as far as possible in SpillMBB. This can ease
349/// register pressure:
Hans Wennborg5a7723c2016-04-08 15:17:43 +0000350///
Wei Mi9a16d652016-04-13 03:08:27 +0000351/// x = def
352/// y = use x
353/// s = copy x
Hans Wennborg5a7723c2016-04-08 15:17:43 +0000354///
Wei Mi9a16d652016-04-13 03:08:27 +0000355/// Hoisting the spill of s to immediately after the def removes the
356/// interference between x and y:
Hans Wennborg5a7723c2016-04-08 15:17:43 +0000357///
Wei Mi9a16d652016-04-13 03:08:27 +0000358/// x = def
359/// spill x
360/// y = use x<kill>
Hans Wennborg5a7723c2016-04-08 15:17:43 +0000361///
Wei Mi9a16d652016-04-13 03:08:27 +0000362/// This hoist only helps when the copy kills its source.
Hans Wennborg5a7723c2016-04-08 15:17:43 +0000363///
Wei Mi9a16d652016-04-13 03:08:27 +0000364bool InlineSpiller::hoistSpillInsideBB(LiveInterval &SpillLI,
365 MachineInstr &CopyMI) {
Hans Wennborg5a7723c2016-04-08 15:17:43 +0000366 SlotIndex Idx = LIS.getInstructionIndex(CopyMI);
Wei Mi9a16d652016-04-13 03:08:27 +0000367#ifndef NDEBUG
Hans Wennborg5a7723c2016-04-08 15:17:43 +0000368 VNInfo *VNI = SpillLI.getVNInfoAt(Idx.getRegSlot());
369 assert(VNI && VNI->def == Idx.getRegSlot() && "Not defined by copy");
Wei Mi9a16d652016-04-13 03:08:27 +0000370#endif
Wei Mifb5252c2016-04-04 17:45:03 +0000371
Wei Mi9a16d652016-04-13 03:08:27 +0000372 unsigned SrcReg = CopyMI.getOperand(1).getReg();
373 LiveInterval &SrcLI = LIS.getInterval(SrcReg);
374 VNInfo *SrcVNI = SrcLI.getVNInfoAt(Idx);
375 LiveQueryResult SrcQ = SrcLI.Query(Idx);
376 MachineBasicBlock *DefMBB = LIS.getMBBFromIndex(SrcVNI->def);
377 if (DefMBB != CopyMI.getParent() || !SrcQ.isKill())
Hans Wennborg5a7723c2016-04-08 15:17:43 +0000378 return false;
379
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000380 // Conservatively extend the stack slot range to the range of the original
381 // value. We may be able to do better with stack slot coloring by being more
382 // careful here.
Jakob Stoklund Olesene4663452011-03-26 22:16:41 +0000383 assert(StackInt && "No stack slot assigned yet.");
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000384 LiveInterval &OrigLI = LIS.getInterval(Original);
385 VNInfo *OrigVNI = OrigLI.getVNInfoAt(Idx);
Jakob Stoklund Olesene4663452011-03-26 22:16:41 +0000386 StackInt->MergeValueInAsValue(OrigLI, OrigVNI, StackInt->getValNumInfo(0));
Jakob Stoklund Olesen86985072011-03-19 23:02:47 +0000387 DEBUG(dbgs() << "\tmerged orig valno " << OrigVNI->id << ": "
Jakob Stoklund Olesene4663452011-03-26 22:16:41 +0000388 << *StackInt << '\n');
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000389
Wei Mi9a16d652016-04-13 03:08:27 +0000390 // We are going to spill SrcVNI immediately after its def, so clear out
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000391 // any later spills of the same value.
Wei Mi9a16d652016-04-13 03:08:27 +0000392 eliminateRedundantSpills(SrcLI, SrcVNI);
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000393
Wei Mi9a16d652016-04-13 03:08:27 +0000394 MachineBasicBlock *MBB = LIS.getMBBFromIndex(SrcVNI->def);
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000395 MachineBasicBlock::iterator MII;
Wei Mi9a16d652016-04-13 03:08:27 +0000396 if (SrcVNI->isPHIDef())
Keith Walker830a8c12016-09-16 14:07:29 +0000397 MII = MBB->SkipPHIsLabelsAndDebug(MBB->begin());
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000398 else {
Wei Mi9a16d652016-04-13 03:08:27 +0000399 MachineInstr *DefMI = LIS.getInstructionFromIndex(SrcVNI->def);
Jakob Stoklund Olesenec9b4a62011-04-30 06:42:21 +0000400 assert(DefMI && "Defining instruction disappeared");
401 MII = DefMI;
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000402 ++MII;
403 }
404 // Insert spill without kill flag immediately after def.
Wei Mi9a16d652016-04-13 03:08:27 +0000405 TII.storeRegToStackSlot(*MBB, MII, SrcReg, false, StackSlot,
406 MRI.getRegClass(SrcReg), &TRI);
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000407 --MII; // Point to store instruction.
Duncan P. N. Exon Smith3ac9cc62016-02-27 06:40:41 +0000408 LIS.InsertMachineInstrInMaps(*MII);
Wei Mi9a16d652016-04-13 03:08:27 +0000409 DEBUG(dbgs() << "\thoisted: " << SrcVNI->def << '\t' << *MII);
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +0000410
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +0000411 HSpiller.addToMergeableSpills(*MII, StackSlot, Original);
Jakob Stoklund Olesen37eb6962011-09-15 17:54:28 +0000412 ++NumSpills;
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000413 return true;
414}
415
Jakob Stoklund Olesen39488642011-03-20 05:44:55 +0000416/// eliminateRedundantSpills - SLI:VNI is known to be on the stack. Remove any
417/// redundant spills of this value in SLI.reg and sibling copies.
418void InlineSpiller::eliminateRedundantSpills(LiveInterval &SLI, VNInfo *VNI) {
Jakob Stoklund Olesene55003f2011-03-20 05:44:58 +0000419 assert(VNI && "Missing value");
Jakob Stoklund Olesen39488642011-03-20 05:44:55 +0000420 SmallVector<std::pair<LiveInterval*, VNInfo*>, 8> WorkList;
421 WorkList.push_back(std::make_pair(&SLI, VNI));
Jakob Stoklund Olesene4663452011-03-26 22:16:41 +0000422 assert(StackInt && "No stack slot assigned yet.");
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000423
424 do {
Jakob Stoklund Olesen39488642011-03-20 05:44:55 +0000425 LiveInterval *LI;
Benjamin Kramerd6f1f842014-03-02 13:30:33 +0000426 std::tie(LI, VNI) = WorkList.pop_back_val();
Jakob Stoklund Olesen39488642011-03-20 05:44:55 +0000427 unsigned Reg = LI->reg;
Jakob Stoklund Olesenec9b4a62011-04-30 06:42:21 +0000428 DEBUG(dbgs() << "Checking redundant spills for "
429 << VNI->id << '@' << VNI->def << " in " << *LI << '\n');
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000430
431 // Regs to spill are taken care of.
432 if (isRegToSpill(Reg))
433 continue;
434
435 // Add all of VNI's live range to StackInt.
Jakob Stoklund Olesene4663452011-03-26 22:16:41 +0000436 StackInt->MergeValueInAsValue(*LI, VNI, StackInt->getValNumInfo(0));
437 DEBUG(dbgs() << "Merged to stack int: " << *StackInt << '\n');
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000438
439 // Find all spills and copies of VNI.
Owen Andersonabb90c92014-03-13 06:02:25 +0000440 for (MachineRegisterInfo::use_instr_nodbg_iterator
441 UI = MRI.use_instr_nodbg_begin(Reg), E = MRI.use_instr_nodbg_end();
442 UI != E; ) {
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000443 MachineInstr &MI = *UI++;
444 if (!MI.isCopy() && !MI.mayStore())
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000445 continue;
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000446 SlotIndex Idx = LIS.getInstructionIndex(MI);
Jakob Stoklund Olesen39488642011-03-20 05:44:55 +0000447 if (LI->getVNInfoAt(Idx) != VNI)
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000448 continue;
449
450 // Follow sibling copies down the dominator tree.
451 if (unsigned DstReg = isFullCopyOf(MI, Reg)) {
452 if (isSibling(DstReg)) {
453 LiveInterval &DstLI = LIS.getInterval(DstReg);
Jakob Stoklund Olesen90b5e562011-11-13 20:45:27 +0000454 VNInfo *DstVNI = DstLI.getVNInfoAt(Idx.getRegSlot());
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000455 assert(DstVNI && "Missing defined value");
Jakob Stoklund Olesen90b5e562011-11-13 20:45:27 +0000456 assert(DstVNI->def == Idx.getRegSlot() && "Wrong copy def slot");
Jakob Stoklund Olesen39488642011-03-20 05:44:55 +0000457 WorkList.push_back(std::make_pair(&DstLI, DstVNI));
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000458 }
459 continue;
460 }
461
462 // Erase spills.
463 int FI;
464 if (Reg == TII.isStoreToStackSlot(MI, FI) && FI == StackSlot) {
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000465 DEBUG(dbgs() << "Redundant spill " << Idx << '\t' << MI);
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000466 // eliminateDeadDefs won't normally remove stores, so switch opcode.
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000467 MI.setDesc(TII.get(TargetOpcode::KILL));
468 DeadDefs.push_back(&MI);
Jakob Stoklund Olesen37eb6962011-09-15 17:54:28 +0000469 ++NumSpillsRemoved;
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +0000470 if (HSpiller.rmFromMergeableSpills(MI, StackSlot))
Wei Mi9a16d652016-04-13 03:08:27 +0000471 --NumSpills;
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000472 }
473 }
474 } while (!WorkList.empty());
475}
476
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000477//===----------------------------------------------------------------------===//
478// Rematerialization
479//===----------------------------------------------------------------------===//
480
481/// markValueUsed - Remember that VNI failed to rematerialize, so its defining
482/// instruction cannot be eliminated. See through snippet copies
483void InlineSpiller::markValueUsed(LiveInterval *LI, VNInfo *VNI) {
484 SmallVector<std::pair<LiveInterval*, VNInfo*>, 8> WorkList;
485 WorkList.push_back(std::make_pair(LI, VNI));
486 do {
Benjamin Kramerd6f1f842014-03-02 13:30:33 +0000487 std::tie(LI, VNI) = WorkList.pop_back_val();
David Blaikie70573dc2014-11-19 07:49:26 +0000488 if (!UsedValues.insert(VNI).second)
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000489 continue;
490
491 if (VNI->isPHIDef()) {
492 MachineBasicBlock *MBB = LIS.getMBBFromIndex(VNI->def);
Craig Topper73275a22015-12-24 05:20:40 +0000493 for (MachineBasicBlock *P : MBB->predecessors()) {
494 VNInfo *PVNI = LI->getVNInfoBefore(LIS.getMBBEndIdx(P));
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000495 if (PVNI)
496 WorkList.push_back(std::make_pair(LI, PVNI));
497 }
498 continue;
499 }
500
501 // Follow snippet copies.
502 MachineInstr *MI = LIS.getInstructionFromIndex(VNI->def);
503 if (!SnippetCopies.count(MI))
504 continue;
505 LiveInterval &SnipLI = LIS.getInterval(MI->getOperand(1).getReg());
506 assert(isRegToSpill(SnipLI.reg) && "Unexpected register in copy");
Jakob Stoklund Olesen90b5e562011-11-13 20:45:27 +0000507 VNInfo *SnipVNI = SnipLI.getVNInfoAt(VNI->def.getRegSlot(true));
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000508 assert(SnipVNI && "Snippet undefined before copy");
509 WorkList.push_back(std::make_pair(&SnipLI, SnipVNI));
510 } while (!WorkList.empty());
511}
512
513/// reMaterializeFor - Attempt to rematerialize before MI instead of reloading.
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000514bool InlineSpiller::reMaterializeFor(LiveInterval &VirtReg, MachineInstr &MI) {
Patrik Hagglund296acbf2014-09-01 11:04:07 +0000515 // Analyze instruction
516 SmallVector<std::pair<MachineInstr *, unsigned>, 8> Ops;
517 MIBundleOperands::VirtRegInfo RI =
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000518 MIBundleOperands(MI).analyzeVirtReg(VirtReg.reg, &Ops);
Patrik Hagglund296acbf2014-09-01 11:04:07 +0000519
520 if (!RI.Reads)
521 return false;
522
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000523 SlotIndex UseIdx = LIS.getInstructionIndex(MI).getRegSlot(true);
Jakob Stoklund Olesenc0dd3da2011-07-18 05:31:59 +0000524 VNInfo *ParentVNI = VirtReg.getVNInfoAt(UseIdx.getBaseIndex());
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000525
526 if (!ParentVNI) {
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000527 DEBUG(dbgs() << "\tadding <undef> flags: ");
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000528 for (unsigned i = 0, e = MI.getNumOperands(); i != e; ++i) {
529 MachineOperand &MO = MI.getOperand(i);
Jakob Stoklund Olesen0ed9ebc2011-03-29 17:47:02 +0000530 if (MO.isReg() && MO.isUse() && MO.getReg() == VirtReg.reg)
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000531 MO.setIsUndef();
532 }
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000533 DEBUG(dbgs() << UseIdx << '\t' << MI);
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000534 return true;
535 }
Jakob Stoklund Olesen2edaa2f2010-10-20 22:00:51 +0000536
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000537 if (SnippetCopies.count(&MI))
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000538 return false;
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000539
Wei Mi9a16d652016-04-13 03:08:27 +0000540 LiveInterval &OrigLI = LIS.getInterval(Original);
541 VNInfo *OrigVNI = OrigLI.getVNInfoAt(UseIdx);
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000542 LiveRangeEdit::Remat RM(ParentVNI);
Wei Mi9a16d652016-04-13 03:08:27 +0000543 RM.OrigMI = LIS.getInstructionFromIndex(OrigVNI->def);
544
545 if (!Edit->canRematerializeAt(RM, OrigVNI, UseIdx, false)) {
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000546 markValueUsed(&VirtReg, ParentVNI);
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000547 DEBUG(dbgs() << "\tcannot remat for " << UseIdx << '\t' << MI);
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000548 return false;
549 }
550
Jakob Stoklund Olesen0ed9ebc2011-03-29 17:47:02 +0000551 // If the instruction also writes VirtReg.reg, it had better not require the
552 // same register for uses and defs.
Jakob Stoklund Olesenabe8c092012-03-01 01:43:25 +0000553 if (RI.Tied) {
554 markValueUsed(&VirtReg, ParentVNI);
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000555 DEBUG(dbgs() << "\tcannot remat tied reg: " << UseIdx << '\t' << MI);
Jakob Stoklund Olesenabe8c092012-03-01 01:43:25 +0000556 return false;
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000557 }
558
Jakob Stoklund Olesen3b2966d2010-12-18 03:04:14 +0000559 // Before rematerializing into a register for a single instruction, try to
560 // fold a load into the instruction. That avoids allocating a new register.
Evan Cheng7f8e5632011-12-07 07:15:52 +0000561 if (RM.OrigMI->canFoldAsLoad() &&
Jakob Stoklund Olesenabe8c092012-03-01 01:43:25 +0000562 foldMemoryOperand(Ops, RM.OrigMI)) {
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000563 Edit->markRematerialized(RM.ParentVNI);
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +0000564 ++NumFoldedLoads;
Jakob Stoklund Olesen3b2966d2010-12-18 03:04:14 +0000565 return true;
566 }
567
Wolfgang Pieb8df58f42016-08-16 17:12:50 +0000568 // Allocate a new register for the remat.
Mark Lacey9d8103d2013-08-14 23:50:16 +0000569 unsigned NewVReg = Edit->createFrom(Original);
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000570
571 // Finally we can rematerialize OrigMI before MI.
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000572 SlotIndex DefIdx =
573 Edit->rematerializeAt(*MI.getParent(), MI, NewVReg, RM, TRI);
Wolfgang Pieb8df58f42016-08-16 17:12:50 +0000574
575 // We take the DebugLoc from MI, since OrigMI may be attributed to a
Junmo Park061bec82017-02-25 01:50:45 +0000576 // different source location.
Wolfgang Pieb8df58f42016-08-16 17:12:50 +0000577 auto *NewMI = LIS.getInstructionFromIndex(DefIdx);
578 NewMI->setDebugLoc(MI.getDebugLoc());
579
Mark Lacey9d8103d2013-08-14 23:50:16 +0000580 (void)DefIdx;
Jakob Stoklund Olesenc6a20412011-02-08 19:33:55 +0000581 DEBUG(dbgs() << "\tremat: " << DefIdx << '\t'
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000582 << *LIS.getInstructionFromIndex(DefIdx));
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000583
584 // Replace operands
Craig Topper73275a22015-12-24 05:20:40 +0000585 for (const auto &OpPair : Ops) {
586 MachineOperand &MO = OpPair.first->getOperand(OpPair.second);
Jakob Stoklund Olesen0ed9ebc2011-03-29 17:47:02 +0000587 if (MO.isReg() && MO.isUse() && MO.getReg() == VirtReg.reg) {
Mark Lacey9d8103d2013-08-14 23:50:16 +0000588 MO.setReg(NewVReg);
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000589 MO.setIsKill();
590 }
591 }
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000592 DEBUG(dbgs() << "\t " << UseIdx << '\t' << MI << '\n');
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000593
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +0000594 ++NumRemats;
Jakob Stoklund Olesenbde96ad2010-06-30 23:03:52 +0000595 return true;
596}
597
Jakob Stoklund Olesen72911e42010-10-14 23:49:52 +0000598/// reMaterializeAll - Try to rematerialize as many uses as possible,
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000599/// and trim the live ranges after.
600void InlineSpiller::reMaterializeAll() {
Pete Cooper2bde2f42012-04-02 22:22:53 +0000601 if (!Edit->anyRematerializable(AA))
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000602 return;
603
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000604 UsedValues.clear();
Jakob Stoklund Olesen2edaa2f2010-10-20 22:00:51 +0000605
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000606 // Try to remat before all uses of snippets.
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000607 bool anyRemat = false;
Craig Topper73275a22015-12-24 05:20:40 +0000608 for (unsigned Reg : RegsToSpill) {
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000609 LiveInterval &LI = LIS.getInterval(Reg);
Patrik Hagglund296acbf2014-09-01 11:04:07 +0000610 for (MachineRegisterInfo::reg_bundle_iterator
611 RegI = MRI.reg_bundle_begin(Reg), E = MRI.reg_bundle_end();
612 RegI != E; ) {
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000613 MachineInstr &MI = *RegI++;
Patrik Hagglund296acbf2014-09-01 11:04:07 +0000614
615 // Debug values are not allowed to affect codegen.
Duncan P. N. Exon Smithd6ebd072016-02-27 20:23:14 +0000616 if (MI.isDebugValue())
Patrik Hagglund296acbf2014-09-01 11:04:07 +0000617 continue;
618
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000619 anyRemat |= reMaterializeFor(LI, MI);
Owen Andersonabb90c92014-03-13 06:02:25 +0000620 }
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000621 }
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000622 if (!anyRemat)
623 return;
624
625 // Remove any values that were completely rematted.
Craig Topper73275a22015-12-24 05:20:40 +0000626 for (unsigned Reg : RegsToSpill) {
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000627 LiveInterval &LI = LIS.getInterval(Reg);
628 for (LiveInterval::vni_iterator I = LI.vni_begin(), E = LI.vni_end();
629 I != E; ++I) {
630 VNInfo *VNI = *I;
Jakob Stoklund Olesenadd79c62011-03-29 17:47:00 +0000631 if (VNI->isUnused() || VNI->isPHIDef() || UsedValues.count(VNI))
Jakob Stoklund Olesencf6c5c92010-07-02 19:54:40 +0000632 continue;
Jakob Stoklund Olesend8af5292011-03-29 03:12:02 +0000633 MachineInstr *MI = LIS.getInstructionFromIndex(VNI->def);
634 MI->addRegisterDead(Reg, &TRI);
635 if (!MI->allDefsAreDead())
636 continue;
637 DEBUG(dbgs() << "All defs dead: " << *MI);
638 DeadDefs.push_back(MI);
Jakob Stoklund Olesencf6c5c92010-07-02 19:54:40 +0000639 }
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000640 }
Jakob Stoklund Olesenadd79c62011-03-29 17:47:00 +0000641
642 // Eliminate dead code after remat. Note that some snippet copies may be
643 // deleted here.
644 if (DeadDefs.empty())
645 return;
646 DEBUG(dbgs() << "Remat created " << DeadDefs.size() << " dead defs.\n");
Wei Mic0223702016-07-08 21:08:09 +0000647 Edit->eliminateDeadDefs(DeadDefs, RegsToSpill, AA);
Jakob Stoklund Olesenadd79c62011-03-29 17:47:00 +0000648
Wei Mia62f0582016-02-05 18:14:24 +0000649 // LiveRangeEdit::eliminateDeadDef is used to remove dead define instructions
650 // after rematerialization. To remove a VNI for a vreg from its LiveInterval,
651 // LiveIntervals::removeVRegDefAt is used. However, after non-PHI VNIs are all
652 // removed, PHI VNI are still left in the LiveInterval.
653 // So to get rid of unused reg, we need to check whether it has non-dbg
654 // reference instead of whether it has non-empty interval.
Benjamin Kramer391f5a62013-05-05 11:29:14 +0000655 unsigned ResultPos = 0;
Craig Topper73275a22015-12-24 05:20:40 +0000656 for (unsigned Reg : RegsToSpill) {
Wei Mia62f0582016-02-05 18:14:24 +0000657 if (MRI.reg_nodbg_empty(Reg)) {
Benjamin Kramer391f5a62013-05-05 11:29:14 +0000658 Edit->eraseVirtReg(Reg);
Jakob Stoklund Olesenadd79c62011-03-29 17:47:00 +0000659 continue;
660 }
Matt Arsenaultc5d1e502017-07-22 00:24:01 +0000661
Matt Arsenault5fbc8702017-07-24 18:07:55 +0000662 assert(LIS.hasInterval(Reg) &&
663 (!LIS.getInterval(Reg).empty() || !MRI.reg_nodbg_empty(Reg)) &&
664 "Empty and not used live-range?!");
665
Benjamin Kramer391f5a62013-05-05 11:29:14 +0000666 RegsToSpill[ResultPos++] = Reg;
Jakob Stoklund Olesenadd79c62011-03-29 17:47:00 +0000667 }
Benjamin Kramer391f5a62013-05-05 11:29:14 +0000668 RegsToSpill.erase(RegsToSpill.begin() + ResultPos, RegsToSpill.end());
Jakob Stoklund Olesenadd79c62011-03-29 17:47:00 +0000669 DEBUG(dbgs() << RegsToSpill.size() << " registers to spill after remat.\n");
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000670}
671
Jakob Stoklund Olesene991f722011-03-29 21:20:19 +0000672//===----------------------------------------------------------------------===//
673// Spilling
674//===----------------------------------------------------------------------===//
675
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000676/// If MI is a load or store of StackSlot, it can be removed.
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000677bool InlineSpiller::coalesceStackAccess(MachineInstr *MI, unsigned Reg) {
Jakob Stoklund Olesen7fd49052010-08-04 22:35:11 +0000678 int FI = 0;
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000679 unsigned InstrReg = TII.isLoadFromStackSlot(*MI, FI);
Jakob Stoklund Olesen37eb6962011-09-15 17:54:28 +0000680 bool IsLoad = InstrReg;
681 if (!IsLoad)
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000682 InstrReg = TII.isStoreToStackSlot(*MI, FI);
Jakob Stoklund Olesen7fd49052010-08-04 22:35:11 +0000683
684 // We have a stack access. Is it the right register and slot?
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000685 if (InstrReg != Reg || FI != StackSlot)
Jakob Stoklund Olesen7fd49052010-08-04 22:35:11 +0000686 return false;
687
Wei Mi9a16d652016-04-13 03:08:27 +0000688 if (!IsLoad)
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +0000689 HSpiller.rmFromMergeableSpills(*MI, StackSlot);
Wei Mi9a16d652016-04-13 03:08:27 +0000690
Jakob Stoklund Olesen7fd49052010-08-04 22:35:11 +0000691 DEBUG(dbgs() << "Coalescing stack access: " << *MI);
Duncan P. N. Exon Smith3ac9cc62016-02-27 06:40:41 +0000692 LIS.RemoveMachineInstrFromMaps(*MI);
Jakob Stoklund Olesen7fd49052010-08-04 22:35:11 +0000693 MI->eraseFromParent();
Jakob Stoklund Olesen37eb6962011-09-15 17:54:28 +0000694
695 if (IsLoad) {
696 ++NumReloadsRemoved;
697 --NumReloads;
698 } else {
699 ++NumSpillsRemoved;
700 --NumSpills;
701 }
702
Jakob Stoklund Olesen7fd49052010-08-04 22:35:11 +0000703 return true;
704}
705
Junmo Parkc7479ba2017-03-28 04:14:25 +0000706#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
707LLVM_DUMP_METHOD
Mark Lacey9d8103d2013-08-14 23:50:16 +0000708// Dump the range of instructions from B to E with their slot indexes.
709static void dumpMachineInstrRangeWithSlotIndex(MachineBasicBlock::iterator B,
710 MachineBasicBlock::iterator E,
711 LiveIntervals const &LIS,
712 const char *const header,
713 unsigned VReg =0) {
714 char NextLine = '\n';
715 char SlotIndent = '\t';
716
Benjamin Kramerb6d0bd42014-03-02 12:27:27 +0000717 if (std::next(B) == E) {
Mark Lacey9d8103d2013-08-14 23:50:16 +0000718 NextLine = ' ';
719 SlotIndent = ' ';
720 }
721
722 dbgs() << '\t' << header << ": " << NextLine;
723
724 for (MachineBasicBlock::iterator I = B; I != E; ++I) {
Duncan P. N. Exon Smith3ac9cc62016-02-27 06:40:41 +0000725 SlotIndex Idx = LIS.getInstructionIndex(*I).getRegSlot();
Mark Lacey9d8103d2013-08-14 23:50:16 +0000726
727 // If a register was passed in and this instruction has it as a
728 // destination that is marked as an early clobber, print the
729 // early-clobber slot index.
730 if (VReg) {
731 MachineOperand *MO = I->findRegisterDefOperand(VReg);
732 if (MO && MO->isEarlyClobber())
733 Idx = Idx.getRegSlot(true);
734 }
735
736 dbgs() << SlotIndent << Idx << '\t' << *I;
737 }
738}
739#endif
740
Jakob Stoklund Olesenabe8c092012-03-01 01:43:25 +0000741/// foldMemoryOperand - Try folding stack slot references in Ops into their
742/// instructions.
743///
744/// @param Ops Operand indices from analyzeVirtReg().
Jakob Stoklund Olesen3b2966d2010-12-18 03:04:14 +0000745/// @param LoadMI Load instruction to use instead of stack slot when non-null.
Jakob Stoklund Olesenabe8c092012-03-01 01:43:25 +0000746/// @return True on success.
747bool InlineSpiller::
Eugene Zelenko900b6332017-08-29 22:32:07 +0000748foldMemoryOperand(ArrayRef<std::pair<MachineInstr *, unsigned>> Ops,
Jakob Stoklund Olesenabe8c092012-03-01 01:43:25 +0000749 MachineInstr *LoadMI) {
750 if (Ops.empty())
751 return false;
752 // Don't attempt folding in bundles.
753 MachineInstr *MI = Ops.front().first;
754 if (Ops.back().first != MI || MI->isBundled())
755 return false;
756
Jakob Stoklund Olesenc94c9672011-09-15 18:22:52 +0000757 bool WasCopy = MI->isCopy();
Jakob Stoklund Oleseneef48b62011-11-10 00:17:03 +0000758 unsigned ImpReg = 0;
759
Michael Kuperstein47eb85a2016-11-23 18:33:49 +0000760 // Spill subregs if the target allows it.
761 // We always want to spill subregs for stackmap/patchpoint pseudos.
762 bool SpillSubRegs = TII.isSubregFoldable() ||
763 MI->getOpcode() == TargetOpcode::STATEPOINT ||
764 MI->getOpcode() == TargetOpcode::PATCHPOINT ||
765 MI->getOpcode() == TargetOpcode::STACKMAP;
Andrew Trick10d5be42013-11-17 01:36:23 +0000766
Jakob Stoklund Olesen8656a452010-07-01 00:13:04 +0000767 // TargetInstrInfo::foldMemoryOperand only expects explicit, non-tied
768 // operands.
769 SmallVector<unsigned, 8> FoldOps;
Craig Topper73275a22015-12-24 05:20:40 +0000770 for (const auto &OpPair : Ops) {
771 unsigned Idx = OpPair.second;
772 assert(MI == OpPair.first && "Instruction conflict during operand folding");
Jakob Stoklund Olesen8656a452010-07-01 00:13:04 +0000773 MachineOperand &MO = MI->getOperand(Idx);
Jakob Stoklund Oleseneef48b62011-11-10 00:17:03 +0000774 if (MO.isImplicit()) {
775 ImpReg = MO.getReg();
Jakob Stoklund Olesen8656a452010-07-01 00:13:04 +0000776 continue;
Jakob Stoklund Oleseneef48b62011-11-10 00:17:03 +0000777 }
Michael Kuperstein47eb85a2016-11-23 18:33:49 +0000778
Andrew Trick10d5be42013-11-17 01:36:23 +0000779 if (!SpillSubRegs && MO.getSubReg())
Jakob Stoklund Olesen8656a452010-07-01 00:13:04 +0000780 return false;
Jakob Stoklund Olesenc6a20412011-02-08 19:33:55 +0000781 // We cannot fold a load instruction into a def.
782 if (LoadMI && MO.isDef())
783 return false;
Jakob Stoklund Olesen8656a452010-07-01 00:13:04 +0000784 // Tied use operands should not be passed to foldMemoryOperand.
785 if (!MI->isRegTiedToDefOperand(Idx))
786 FoldOps.push_back(Idx);
787 }
788
Quentin Colombetae3168d2016-12-08 00:06:51 +0000789 // If we only have implicit uses, we won't be able to fold that.
790 // Moreover, TargetInstrInfo::foldMemoryOperand will assert if we try!
791 if (FoldOps.empty())
792 return false;
793
Mark Lacey9d8103d2013-08-14 23:50:16 +0000794 MachineInstrSpan MIS(MI);
795
Jakob Stoklund Olesen3b2966d2010-12-18 03:04:14 +0000796 MachineInstr *FoldMI =
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000797 LoadMI ? TII.foldMemoryOperand(*MI, FoldOps, *LoadMI, &LIS)
798 : TII.foldMemoryOperand(*MI, FoldOps, StackSlot, &LIS);
Jakob Stoklund Olesen8656a452010-07-01 00:13:04 +0000799 if (!FoldMI)
800 return false;
Andrew Trick5749b8b2013-06-21 18:33:26 +0000801
802 // Remove LIS for any dead defs in the original MI not in FoldMI.
Duncan P. N. Exon Smithf9ab4162016-02-27 17:05:33 +0000803 for (MIBundleOperands MO(*MI); MO.isValid(); ++MO) {
Andrew Trick5749b8b2013-06-21 18:33:26 +0000804 if (!MO->isReg())
805 continue;
806 unsigned Reg = MO->getReg();
807 if (!Reg || TargetRegisterInfo::isVirtualRegister(Reg) ||
808 MRI.isReserved(Reg)) {
809 continue;
810 }
Andrew Trickdfacda32014-01-07 07:31:10 +0000811 // Skip non-Defs, including undef uses and internal reads.
812 if (MO->isUse())
813 continue;
Andrew Trick5749b8b2013-06-21 18:33:26 +0000814 MIBundleOperands::PhysRegInfo RI =
Duncan P. N. Exon Smithf9ab4162016-02-27 17:05:33 +0000815 MIBundleOperands(*FoldMI).analyzePhysReg(Reg, &TRI);
Matthias Braun60d69e22015-12-11 19:42:09 +0000816 if (RI.FullyDefined)
Andrew Trick5749b8b2013-06-21 18:33:26 +0000817 continue;
818 // FoldMI does not define this physreg. Remove the LI segment.
819 assert(MO->isDead() && "Cannot fold physreg def");
Duncan P. N. Exon Smith3ac9cc62016-02-27 06:40:41 +0000820 SlotIndex Idx = LIS.getInstructionIndex(*MI).getRegSlot();
Matthias Brauncfb8ad22015-01-21 18:50:21 +0000821 LIS.removePhysRegDefAt(Reg, Idx);
Andrew Trick5749b8b2013-06-21 18:33:26 +0000822 }
Mark Lacey9d8103d2013-08-14 23:50:16 +0000823
Wei Mi9a16d652016-04-13 03:08:27 +0000824 int FI;
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +0000825 if (TII.isStoreToStackSlot(*MI, FI) &&
826 HSpiller.rmFromMergeableSpills(*MI, FI))
Wei Mi9a16d652016-04-13 03:08:27 +0000827 --NumSpills;
Duncan P. N. Exon Smith3ac9cc62016-02-27 06:40:41 +0000828 LIS.ReplaceMachineInstrInMaps(*MI, *FoldMI);
Jakob Stoklund Olesenbd953d12010-07-09 17:29:08 +0000829 MI->eraseFromParent();
Jakob Stoklund Oleseneef48b62011-11-10 00:17:03 +0000830
Mark Lacey9d8103d2013-08-14 23:50:16 +0000831 // Insert any new instructions other than FoldMI into the LIS maps.
832 assert(!MIS.empty() && "Unexpected empty span of instructions!");
Craig Topper73275a22015-12-24 05:20:40 +0000833 for (MachineInstr &MI : MIS)
834 if (&MI != FoldMI)
Duncan P. N. Exon Smith3ac9cc62016-02-27 06:40:41 +0000835 LIS.InsertMachineInstrInMaps(MI);
Mark Lacey9d8103d2013-08-14 23:50:16 +0000836
Jakob Stoklund Oleseneef48b62011-11-10 00:17:03 +0000837 // TII.foldMemoryOperand may have left some implicit operands on the
838 // instruction. Strip them.
839 if (ImpReg)
840 for (unsigned i = FoldMI->getNumOperands(); i; --i) {
841 MachineOperand &MO = FoldMI->getOperand(i - 1);
842 if (!MO.isReg() || !MO.isImplicit())
843 break;
844 if (MO.getReg() == ImpReg)
845 FoldMI->RemoveOperand(i - 1);
846 }
847
Mark Lacey9d8103d2013-08-14 23:50:16 +0000848 DEBUG(dumpMachineInstrRangeWithSlotIndex(MIS.begin(), MIS.end(), LIS,
849 "folded"));
850
Jakob Stoklund Olesenc94c9672011-09-15 18:22:52 +0000851 if (!WasCopy)
852 ++NumFolded;
Wei Mi9a16d652016-04-13 03:08:27 +0000853 else if (Ops.front().second == 0) {
Jakob Stoklund Olesenc94c9672011-09-15 18:22:52 +0000854 ++NumSpills;
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +0000855 HSpiller.addToMergeableSpills(*FoldMI, StackSlot, Original);
Wei Mi9a16d652016-04-13 03:08:27 +0000856 } else
Jakob Stoklund Olesenc94c9672011-09-15 18:22:52 +0000857 ++NumReloads;
Jakob Stoklund Olesen8656a452010-07-01 00:13:04 +0000858 return true;
859}
860
Mark Lacey9d8103d2013-08-14 23:50:16 +0000861void InlineSpiller::insertReload(unsigned NewVReg,
Jakob Stoklund Olesen9f294a92011-04-18 20:23:27 +0000862 SlotIndex Idx,
Jakob Stoklund Olesenbde96ad2010-06-30 23:03:52 +0000863 MachineBasicBlock::iterator MI) {
864 MachineBasicBlock &MBB = *MI->getParent();
Mark Lacey9d8103d2013-08-14 23:50:16 +0000865
866 MachineInstrSpan MIS(MI);
867 TII.loadRegFromStackSlot(MBB, MI, NewVReg, StackSlot,
868 MRI.getRegClass(NewVReg), &TRI);
869
870 LIS.InsertMachineInstrRangeInMaps(MIS.begin(), MI);
871
872 DEBUG(dumpMachineInstrRangeWithSlotIndex(MIS.begin(), MI, LIS, "reload",
873 NewVReg));
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +0000874 ++NumReloads;
Jakob Stoklund Olesenbde96ad2010-06-30 23:03:52 +0000875}
876
Quentin Colombetc6689352017-06-05 23:51:27 +0000877/// Check if \p Def fully defines a VReg with an undefined value.
878/// If that's the case, that means the value of VReg is actually
879/// not relevant.
880static bool isFullUndefDef(const MachineInstr &Def) {
881 if (!Def.isImplicitDef())
882 return false;
883 assert(Def.getNumOperands() == 1 &&
884 "Implicit def with more than one definition");
885 // We can say that the VReg defined by Def is undef, only if it is
886 // fully defined by Def. Otherwise, some of the lanes may not be
887 // undef and the value of the VReg matters.
888 return !Def.getOperand(0).getSubReg();
889}
890
Mark Lacey9d8103d2013-08-14 23:50:16 +0000891/// insertSpill - Insert a spill of NewVReg after MI.
892void InlineSpiller::insertSpill(unsigned NewVReg, bool isKill,
893 MachineBasicBlock::iterator MI) {
Jakob Stoklund Olesenbde96ad2010-06-30 23:03:52 +0000894 MachineBasicBlock &MBB = *MI->getParent();
Mark Lacey9d8103d2013-08-14 23:50:16 +0000895
896 MachineInstrSpan MIS(MI);
Quentin Colombet9e9d6382017-06-07 00:22:07 +0000897 bool IsRealSpill = true;
898 if (isFullUndefDef(*MI)) {
Quentin Colombetc6689352017-06-05 23:51:27 +0000899 // Don't spill undef value.
900 // Anything works for undef, in particular keeping the memory
901 // uninitialized is a viable option and it saves code size and
902 // run time.
903 BuildMI(MBB, std::next(MI), MI->getDebugLoc(), TII.get(TargetOpcode::KILL))
904 .addReg(NewVReg, getKillRegState(isKill));
Quentin Colombet9e9d6382017-06-07 00:22:07 +0000905 IsRealSpill = false;
906 } else
Quentin Colombetc6689352017-06-05 23:51:27 +0000907 TII.storeRegToStackSlot(MBB, std::next(MI), NewVReg, isKill, StackSlot,
908 MRI.getRegClass(NewVReg), &TRI);
Mark Lacey9d8103d2013-08-14 23:50:16 +0000909
Benjamin Kramerb6d0bd42014-03-02 12:27:27 +0000910 LIS.InsertMachineInstrRangeInMaps(std::next(MI), MIS.end());
Mark Lacey9d8103d2013-08-14 23:50:16 +0000911
Benjamin Kramerb6d0bd42014-03-02 12:27:27 +0000912 DEBUG(dumpMachineInstrRangeWithSlotIndex(std::next(MI), MIS.end(), LIS,
Mark Lacey9d8103d2013-08-14 23:50:16 +0000913 "spill"));
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +0000914 ++NumSpills;
Quentin Colombet9e9d6382017-06-07 00:22:07 +0000915 if (IsRealSpill)
916 HSpiller.addToMergeableSpills(*std::next(MI), StackSlot, Original);
Jakob Stoklund Olesenbde96ad2010-06-30 23:03:52 +0000917}
918
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000919/// spillAroundUses - insert spill code around each use of Reg.
920void InlineSpiller::spillAroundUses(unsigned Reg) {
Jakob Stoklund Olesen31a0b5e2011-05-11 18:25:10 +0000921 DEBUG(dbgs() << "spillAroundUses " << PrintReg(Reg) << '\n');
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +0000922 LiveInterval &OldLI = LIS.getInterval(Reg);
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000923
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000924 // Iterate over instructions using Reg.
Owen Andersonabb90c92014-03-13 06:02:25 +0000925 for (MachineRegisterInfo::reg_bundle_iterator
926 RegI = MRI.reg_bundle_begin(Reg), E = MRI.reg_bundle_end();
927 RegI != E; ) {
Owen Andersonec5d4802014-03-14 05:02:18 +0000928 MachineInstr *MI = &*(RegI++);
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000929
Jakob Stoklund Olesencf6c5c92010-07-02 19:54:40 +0000930 // Debug values are not allowed to affect codegen.
931 if (MI->isDebugValue()) {
932 // Modify DBG_VALUE now that the value is in a spill slot.
David Blaikie0252265b2013-06-16 20:34:15 +0000933 MachineBasicBlock *MBB = MI->getParent();
Adrian Prantl6825fb62017-04-18 01:21:53 +0000934 DEBUG(dbgs() << "Modifying debug info due to spill:\t" << *MI);
935 buildDbgValueForSpill(*MBB, MI, *MI, StackSlot);
936 MBB->erase(MI);
Jakob Stoklund Olesencf6c5c92010-07-02 19:54:40 +0000937 continue;
938 }
939
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000940 // Ignore copies to/from snippets. We'll delete them.
941 if (SnippetCopies.count(MI))
942 continue;
943
Jakob Stoklund Olesen7fd49052010-08-04 22:35:11 +0000944 // Stack slot accesses may coalesce away.
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +0000945 if (coalesceStackAccess(MI, Reg))
Jakob Stoklund Olesen7fd49052010-08-04 22:35:11 +0000946 continue;
947
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000948 // Analyze instruction.
Jakob Stoklund Olesenabe8c092012-03-01 01:43:25 +0000949 SmallVector<std::pair<MachineInstr*, unsigned>, 8> Ops;
James Molloy381fab92012-09-12 10:03:31 +0000950 MIBundleOperands::VirtRegInfo RI =
Duncan P. N. Exon Smithf9ab4162016-02-27 17:05:33 +0000951 MIBundleOperands(*MI).analyzeVirtReg(Reg, &Ops);
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000952
Jakob Stoklund Olesen9f294a92011-04-18 20:23:27 +0000953 // Find the slot index where this instruction reads and writes OldLI.
954 // This is usually the def slot, except for tied early clobbers.
Duncan P. N. Exon Smith3ac9cc62016-02-27 06:40:41 +0000955 SlotIndex Idx = LIS.getInstructionIndex(*MI).getRegSlot();
Jakob Stoklund Olesen90b5e562011-11-13 20:45:27 +0000956 if (VNInfo *VNI = OldLI.getVNInfoAt(Idx.getRegSlot(true)))
Jakob Stoklund Olesen9f294a92011-04-18 20:23:27 +0000957 if (SlotIndex::isSameInstr(Idx, VNI->def))
958 Idx = VNI->def;
959
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000960 // Check for a sibling copy.
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000961 unsigned SibReg = isFullCopyOf(*MI, Reg);
Jakob Stoklund Olesene55003f2011-03-20 05:44:58 +0000962 if (SibReg && isSibling(SibReg)) {
Jakob Stoklund Olesen31a0b5e2011-05-11 18:25:10 +0000963 // This may actually be a copy between snippets.
964 if (isRegToSpill(SibReg)) {
965 DEBUG(dbgs() << "Found new snippet copy: " << *MI);
966 SnippetCopies.insert(MI);
967 continue;
968 }
Jakob Stoklund Olesenabe8c092012-03-01 01:43:25 +0000969 if (RI.Writes) {
Wei Mi9a16d652016-04-13 03:08:27 +0000970 if (hoistSpillInsideBB(OldLI, *MI)) {
Jakob Stoklund Olesene55003f2011-03-20 05:44:58 +0000971 // This COPY is now dead, the value is already in the stack slot.
972 MI->getOperand(0).setIsDead();
973 DeadDefs.push_back(MI);
974 continue;
975 }
976 } else {
977 // This is a reload for a sib-reg copy. Drop spills downstream.
Jakob Stoklund Olesene55003f2011-03-20 05:44:58 +0000978 LiveInterval &SibLI = LIS.getInterval(SibReg);
979 eliminateRedundantSpills(SibLI, SibLI.getVNInfoAt(Idx));
980 // The COPY will fold to a reload below.
981 }
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +0000982 }
983
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000984 // Attempt to fold memory ops.
Jakob Stoklund Olesenabe8c092012-03-01 01:43:25 +0000985 if (foldMemoryOperand(Ops))
Jakob Stoklund Olesen96037182010-07-02 17:44:57 +0000986 continue;
987
Mark Lacey9d8103d2013-08-14 23:50:16 +0000988 // Create a new virtual register for spill/fill.
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000989 // FIXME: Infer regclass from instruction alone.
Mark Lacey9d8103d2013-08-14 23:50:16 +0000990 unsigned NewVReg = Edit->createFrom(Reg);
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000991
Jakob Stoklund Olesenabe8c092012-03-01 01:43:25 +0000992 if (RI.Reads)
Mark Lacey9d8103d2013-08-14 23:50:16 +0000993 insertReload(NewVReg, Idx, MI);
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +0000994
995 // Rewrite instruction operands.
996 bool hasLiveDef = false;
Craig Topper73275a22015-12-24 05:20:40 +0000997 for (const auto &OpPair : Ops) {
998 MachineOperand &MO = OpPair.first->getOperand(OpPair.second);
Mark Lacey9d8103d2013-08-14 23:50:16 +0000999 MO.setReg(NewVReg);
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +00001000 if (MO.isUse()) {
Craig Topper73275a22015-12-24 05:20:40 +00001001 if (!OpPair.first->isRegTiedToDefOperand(OpPair.second))
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +00001002 MO.setIsKill();
1003 } else {
1004 if (!MO.isDead())
1005 hasLiveDef = true;
1006 }
1007 }
Mark Lacey9d8103d2013-08-14 23:50:16 +00001008 DEBUG(dbgs() << "\trewrite: " << Idx << '\t' << *MI << '\n');
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +00001009
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +00001010 // FIXME: Use a second vreg if instruction has no tied ops.
Mark Lacey9d8103d2013-08-14 23:50:16 +00001011 if (RI.Writes)
Jakob Stoklund Olesenabe8c092012-03-01 01:43:25 +00001012 if (hasLiveDef)
Mark Lacey9d8103d2013-08-14 23:50:16 +00001013 insertSpill(NewVReg, true, MI);
Jakob Stoklund Olesenf8889112010-06-29 23:58:39 +00001014 }
1015}
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +00001016
Jakob Stoklund Olesene991f722011-03-29 21:20:19 +00001017/// spillAll - Spill all registers remaining after rematerialization.
1018void InlineSpiller::spillAll() {
1019 // Update LiveStacks now that we are committed to spilling.
1020 if (StackSlot == VirtRegMap::NO_STACK_SLOT) {
1021 StackSlot = VRM.assignVirt2StackSlot(Original);
1022 StackInt = &LSS.getOrCreateInterval(StackSlot, MRI.getRegClass(Original));
Jakob Stoklund Olesenad6b22e2012-02-04 05:20:49 +00001023 StackInt->getNextValue(SlotIndex(), LSS.getVNInfoAllocator());
Jakob Stoklund Olesene991f722011-03-29 21:20:19 +00001024 } else
1025 StackInt = &LSS.getInterval(StackSlot);
1026
1027 if (Original != Edit->getReg())
1028 VRM.assignVirt2StackSlot(Edit->getReg(), StackSlot);
1029
1030 assert(StackInt->getNumValNums() == 1 && "Bad stack interval values");
Craig Topper73275a22015-12-24 05:20:40 +00001031 for (unsigned Reg : RegsToSpill)
1032 StackInt->MergeSegmentsInAsValue(LIS.getInterval(Reg),
Matthias Braun13ddb7c2013-10-10 21:28:43 +00001033 StackInt->getValNumInfo(0));
Jakob Stoklund Olesene991f722011-03-29 21:20:19 +00001034 DEBUG(dbgs() << "Merged spilled regs: " << *StackInt << '\n');
1035
1036 // Spill around uses of all RegsToSpill.
Craig Topper73275a22015-12-24 05:20:40 +00001037 for (unsigned Reg : RegsToSpill)
1038 spillAroundUses(Reg);
Jakob Stoklund Olesene991f722011-03-29 21:20:19 +00001039
1040 // Hoisted spills may cause dead code.
1041 if (!DeadDefs.empty()) {
1042 DEBUG(dbgs() << "Eliminating " << DeadDefs.size() << " dead defs\n");
Wei Mic0223702016-07-08 21:08:09 +00001043 Edit->eliminateDeadDefs(DeadDefs, RegsToSpill, AA);
Jakob Stoklund Olesene991f722011-03-29 21:20:19 +00001044 }
1045
1046 // Finally delete the SnippetCopies.
Craig Topper73275a22015-12-24 05:20:40 +00001047 for (unsigned Reg : RegsToSpill) {
Owen Andersonabb90c92014-03-13 06:02:25 +00001048 for (MachineRegisterInfo::reg_instr_iterator
Craig Topper73275a22015-12-24 05:20:40 +00001049 RI = MRI.reg_instr_begin(Reg), E = MRI.reg_instr_end();
Owen Andersonabb90c92014-03-13 06:02:25 +00001050 RI != E; ) {
Duncan P. N. Exon Smith3ac9cc62016-02-27 06:40:41 +00001051 MachineInstr &MI = *(RI++);
1052 assert(SnippetCopies.count(&MI) && "Remaining use wasn't a snippet copy");
Jakob Stoklund Olesen31a0b5e2011-05-11 18:25:10 +00001053 // FIXME: Do this with a LiveRangeEdit callback.
Jakob Stoklund Olesen31a0b5e2011-05-11 18:25:10 +00001054 LIS.RemoveMachineInstrFromMaps(MI);
Duncan P. N. Exon Smith3ac9cc62016-02-27 06:40:41 +00001055 MI.eraseFromParent();
Jakob Stoklund Olesen31a0b5e2011-05-11 18:25:10 +00001056 }
Jakob Stoklund Olesene991f722011-03-29 21:20:19 +00001057 }
1058
1059 // Delete all spilled registers.
Craig Topper73275a22015-12-24 05:20:40 +00001060 for (unsigned Reg : RegsToSpill)
1061 Edit->eraseVirtReg(Reg);
Jakob Stoklund Olesene991f722011-03-29 21:20:19 +00001062}
1063
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +00001064void InlineSpiller::spill(LiveRangeEdit &edit) {
Jakob Stoklund Olesenc5a8c082011-05-05 17:22:53 +00001065 ++NumSpilledRanges;
Jakob Stoklund Olesena00bab22011-03-14 19:56:43 +00001066 Edit = &edit;
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +00001067 assert(!TargetRegisterInfo::isStackSlot(edit.getReg())
1068 && "Trying to spill a stack slot.");
Jakob Stoklund Olesena0d5ec12011-03-15 21:13:25 +00001069 // Share a stack slot among all descendants of Original.
1070 Original = VRM.getOriginal(edit.getReg());
1071 StackSlot = VRM.getStackSlot(Original);
Craig Topperc0196b12014-04-14 00:51:57 +00001072 StackInt = nullptr;
Jakob Stoklund Olesena0d5ec12011-03-15 21:13:25 +00001073
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +00001074 DEBUG(dbgs() << "Inline spilling "
Craig Toppercf0444b2014-11-17 05:50:14 +00001075 << TRI.getRegClassName(MRI.getRegClass(edit.getReg()))
Matthias Braunf6fe6bf2013-10-10 21:29:05 +00001076 << ':' << edit.getParent()
Mark Lacey9d8103d2013-08-14 23:50:16 +00001077 << "\nFrom original " << PrintReg(Original) << '\n');
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +00001078 assert(edit.getParent().isSpillable() &&
1079 "Attempting to spill already spilled value.");
Jakob Stoklund Olesen27320cb2011-03-18 04:23:06 +00001080 assert(DeadDefs.empty() && "Previous spill didn't remove dead defs");
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +00001081
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +00001082 collectRegsToSpill();
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +00001083 reMaterializeAll();
1084
1085 // Remat may handle everything.
Jakob Stoklund Olesene991f722011-03-29 21:20:19 +00001086 if (!RegsToSpill.empty())
1087 spillAll();
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +00001088
Benjamin Kramere2a1d892013-06-17 19:00:36 +00001089 Edit->calculateRegClassAndHint(MF, Loops, MBFI);
Jakob Stoklund Olesena86595e2011-03-12 04:17:20 +00001090}
Wei Mi9a16d652016-04-13 03:08:27 +00001091
1092/// Optimizations after all the reg selections and spills are done.
Wei Mi963f2df2016-04-15 23:16:44 +00001093void InlineSpiller::postOptimization() { HSpiller.hoistAllSpills(); }
Wei Mi9a16d652016-04-13 03:08:27 +00001094
1095/// When a spill is inserted, add the spill to MergeableSpills map.
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +00001096void HoistSpillHelper::addToMergeableSpills(MachineInstr &Spill, int StackSlot,
Wei Mi9a16d652016-04-13 03:08:27 +00001097 unsigned Original) {
1098 StackSlotToReg[StackSlot] = Original;
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +00001099 SlotIndex Idx = LIS.getInstructionIndex(Spill);
Wei Mi9a16d652016-04-13 03:08:27 +00001100 VNInfo *OrigVNI = LIS.getInterval(Original).getVNInfoAt(Idx.getRegSlot());
1101 std::pair<int, VNInfo *> MIdx = std::make_pair(StackSlot, OrigVNI);
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +00001102 MergeableSpills[MIdx].insert(&Spill);
Wei Mi9a16d652016-04-13 03:08:27 +00001103}
1104
1105/// When a spill is removed, remove the spill from MergeableSpills map.
1106/// Return true if the spill is removed successfully.
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +00001107bool HoistSpillHelper::rmFromMergeableSpills(MachineInstr &Spill,
Wei Mi9a16d652016-04-13 03:08:27 +00001108 int StackSlot) {
1109 int Original = StackSlotToReg[StackSlot];
1110 if (!Original)
1111 return false;
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +00001112 SlotIndex Idx = LIS.getInstructionIndex(Spill);
Wei Mi9a16d652016-04-13 03:08:27 +00001113 VNInfo *OrigVNI = LIS.getInterval(Original).getVNInfoAt(Idx.getRegSlot());
1114 std::pair<int, VNInfo *> MIdx = std::make_pair(StackSlot, OrigVNI);
Duncan P. N. Exon Smith91298732016-06-30 23:28:15 +00001115 return MergeableSpills[MIdx].erase(&Spill);
Wei Mi9a16d652016-04-13 03:08:27 +00001116}
1117
1118/// Check BB to see if it is a possible target BB to place a hoisted spill,
1119/// i.e., there should be a living sibling of OrigReg at the insert point.
Wei Mi9a16d652016-04-13 03:08:27 +00001120bool HoistSpillHelper::isSpillCandBB(unsigned OrigReg, VNInfo &OrigVNI,
1121 MachineBasicBlock &BB, unsigned &LiveReg) {
1122 SlotIndex Idx;
Wei Mif3c8f532016-05-23 19:39:19 +00001123 LiveInterval &OrigLI = LIS.getInterval(OrigReg);
1124 MachineBasicBlock::iterator MI = IPA.getLastInsertPointIter(OrigLI, BB);
Wei Mi9a16d652016-04-13 03:08:27 +00001125 if (MI != BB.end())
1126 Idx = LIS.getInstructionIndex(*MI);
1127 else
1128 Idx = LIS.getMBBEndIdx(&BB).getPrevSlot();
1129 SmallSetVector<unsigned, 16> &Siblings = Virt2SiblingsMap[OrigReg];
1130 assert((LIS.getInterval(OrigReg)).getVNInfoAt(Idx) == &OrigVNI &&
1131 "Unexpected VNI");
1132
1133 for (auto const SibReg : Siblings) {
1134 LiveInterval &LI = LIS.getInterval(SibReg);
1135 VNInfo *VNI = LI.getVNInfoAt(Idx);
1136 if (VNI) {
1137 LiveReg = SibReg;
1138 return true;
1139 }
1140 }
1141 return false;
1142}
1143
Eric Christopher75d661a2016-05-04 21:45:36 +00001144/// Remove redundant spills in the same BB. Save those redundant spills in
Wei Mi9a16d652016-04-13 03:08:27 +00001145/// SpillsToRm, and save the spill to keep and its BB in SpillBBToSpill map.
Wei Mi9a16d652016-04-13 03:08:27 +00001146void HoistSpillHelper::rmRedundantSpills(
1147 SmallPtrSet<MachineInstr *, 16> &Spills,
1148 SmallVectorImpl<MachineInstr *> &SpillsToRm,
1149 DenseMap<MachineDomTreeNode *, MachineInstr *> &SpillBBToSpill) {
1150 // For each spill saw, check SpillBBToSpill[] and see if its BB already has
1151 // another spill inside. If a BB contains more than one spill, only keep the
1152 // earlier spill with smaller SlotIndex.
1153 for (const auto CurrentSpill : Spills) {
1154 MachineBasicBlock *Block = CurrentSpill->getParent();
Bjorn Pettersson3c6ce732017-01-04 09:41:56 +00001155 MachineDomTreeNode *Node = MDT.getBase().getNode(Block);
Wei Mi9a16d652016-04-13 03:08:27 +00001156 MachineInstr *PrevSpill = SpillBBToSpill[Node];
1157 if (PrevSpill) {
1158 SlotIndex PIdx = LIS.getInstructionIndex(*PrevSpill);
1159 SlotIndex CIdx = LIS.getInstructionIndex(*CurrentSpill);
1160 MachineInstr *SpillToRm = (CIdx > PIdx) ? CurrentSpill : PrevSpill;
1161 MachineInstr *SpillToKeep = (CIdx > PIdx) ? PrevSpill : CurrentSpill;
1162 SpillsToRm.push_back(SpillToRm);
Bjorn Pettersson3c6ce732017-01-04 09:41:56 +00001163 SpillBBToSpill[MDT.getBase().getNode(Block)] = SpillToKeep;
Wei Mi9a16d652016-04-13 03:08:27 +00001164 } else {
Bjorn Pettersson3c6ce732017-01-04 09:41:56 +00001165 SpillBBToSpill[MDT.getBase().getNode(Block)] = CurrentSpill;
Wei Mi9a16d652016-04-13 03:08:27 +00001166 }
1167 }
1168 for (const auto SpillToRm : SpillsToRm)
1169 Spills.erase(SpillToRm);
1170}
1171
1172/// Starting from \p Root find a top-down traversal order of the dominator
1173/// tree to visit all basic blocks containing the elements of \p Spills.
1174/// Redundant spills will be found and put into \p SpillsToRm at the same
1175/// time. \p SpillBBToSpill will be populated as part of the process and
1176/// maps a basic block to the first store occurring in the basic block.
1177/// \post SpillsToRm.union(Spills\@post) == Spills\@pre
Wei Mi9a16d652016-04-13 03:08:27 +00001178void HoistSpillHelper::getVisitOrders(
1179 MachineBasicBlock *Root, SmallPtrSet<MachineInstr *, 16> &Spills,
1180 SmallVectorImpl<MachineDomTreeNode *> &Orders,
1181 SmallVectorImpl<MachineInstr *> &SpillsToRm,
1182 DenseMap<MachineDomTreeNode *, unsigned> &SpillsToKeep,
1183 DenseMap<MachineDomTreeNode *, MachineInstr *> &SpillBBToSpill) {
1184 // The set contains all the possible BB nodes to which we may hoist
1185 // original spills.
1186 SmallPtrSet<MachineDomTreeNode *, 8> WorkSet;
1187 // Save the BB nodes on the path from the first BB node containing
Eric Christopher75d661a2016-05-04 21:45:36 +00001188 // non-redundant spill to the Root node.
Wei Mi9a16d652016-04-13 03:08:27 +00001189 SmallPtrSet<MachineDomTreeNode *, 8> NodesOnPath;
1190 // All the spills to be hoisted must originate from a single def instruction
1191 // to the OrigReg. It means the def instruction should dominate all the spills
1192 // to be hoisted. We choose the BB where the def instruction is located as
1193 // the Root.
1194 MachineDomTreeNode *RootIDomNode = MDT[Root]->getIDom();
1195 // For every node on the dominator tree with spill, walk up on the dominator
1196 // tree towards the Root node until it is reached. If there is other node
1197 // containing spill in the middle of the path, the previous spill saw will
Eric Christopher75d661a2016-05-04 21:45:36 +00001198 // be redundant and the node containing it will be removed. All the nodes on
1199 // the path starting from the first node with non-redundant spill to the Root
Wei Mi9a16d652016-04-13 03:08:27 +00001200 // node will be added to the WorkSet, which will contain all the possible
1201 // locations where spills may be hoisted to after the loop below is done.
1202 for (const auto Spill : Spills) {
1203 MachineBasicBlock *Block = Spill->getParent();
1204 MachineDomTreeNode *Node = MDT[Block];
1205 MachineInstr *SpillToRm = nullptr;
1206 while (Node != RootIDomNode) {
1207 // If Node dominates Block, and it already contains a spill, the spill in
Eric Christopher75d661a2016-05-04 21:45:36 +00001208 // Block will be redundant.
Wei Mi9a16d652016-04-13 03:08:27 +00001209 if (Node != MDT[Block] && SpillBBToSpill[Node]) {
1210 SpillToRm = SpillBBToSpill[MDT[Block]];
1211 break;
1212 /// If we see the Node already in WorkSet, the path from the Node to
1213 /// the Root node must already be traversed by another spill.
1214 /// Then no need to repeat.
1215 } else if (WorkSet.count(Node)) {
1216 break;
1217 } else {
1218 NodesOnPath.insert(Node);
1219 }
1220 Node = Node->getIDom();
1221 }
1222 if (SpillToRm) {
1223 SpillsToRm.push_back(SpillToRm);
1224 } else {
1225 // Add a BB containing the original spills to SpillsToKeep -- i.e.,
1226 // set the initial status before hoisting start. The value of BBs
1227 // containing original spills is set to 0, in order to descriminate
1228 // with BBs containing hoisted spills which will be inserted to
1229 // SpillsToKeep later during hoisting.
1230 SpillsToKeep[MDT[Block]] = 0;
1231 WorkSet.insert(NodesOnPath.begin(), NodesOnPath.end());
1232 }
1233 NodesOnPath.clear();
1234 }
1235
1236 // Sort the nodes in WorkSet in top-down order and save the nodes
1237 // in Orders. Orders will be used for hoisting in runHoistSpills.
1238 unsigned idx = 0;
Bjorn Pettersson3c6ce732017-01-04 09:41:56 +00001239 Orders.push_back(MDT.getBase().getNode(Root));
Wei Mi9a16d652016-04-13 03:08:27 +00001240 do {
1241 MachineDomTreeNode *Node = Orders[idx++];
1242 const std::vector<MachineDomTreeNode *> &Children = Node->getChildren();
1243 unsigned NumChildren = Children.size();
1244 for (unsigned i = 0; i != NumChildren; ++i) {
1245 MachineDomTreeNode *Child = Children[i];
1246 if (WorkSet.count(Child))
1247 Orders.push_back(Child);
1248 }
1249 } while (idx != Orders.size());
1250 assert(Orders.size() == WorkSet.size() &&
1251 "Orders have different size with WorkSet");
1252
1253#ifndef NDEBUG
1254 DEBUG(dbgs() << "Orders size is " << Orders.size() << "\n");
1255 SmallVector<MachineDomTreeNode *, 32>::reverse_iterator RIt = Orders.rbegin();
1256 for (; RIt != Orders.rend(); RIt++)
1257 DEBUG(dbgs() << "BB" << (*RIt)->getBlock()->getNumber() << ",");
1258 DEBUG(dbgs() << "\n");
1259#endif
1260}
1261
1262/// Try to hoist spills according to BB hotness. The spills to removed will
1263/// be saved in \p SpillsToRm. The spills to be inserted will be saved in
1264/// \p SpillsToIns.
Wei Mi9a16d652016-04-13 03:08:27 +00001265void HoistSpillHelper::runHoistSpills(
1266 unsigned OrigReg, VNInfo &OrigVNI, SmallPtrSet<MachineInstr *, 16> &Spills,
1267 SmallVectorImpl<MachineInstr *> &SpillsToRm,
1268 DenseMap<MachineBasicBlock *, unsigned> &SpillsToIns) {
1269 // Visit order of dominator tree nodes.
1270 SmallVector<MachineDomTreeNode *, 32> Orders;
1271 // SpillsToKeep contains all the nodes where spills are to be inserted
1272 // during hoisting. If the spill to be inserted is an original spill
1273 // (not a hoisted one), the value of the map entry is 0. If the spill
1274 // is a hoisted spill, the value of the map entry is the VReg to be used
1275 // as the source of the spill.
1276 DenseMap<MachineDomTreeNode *, unsigned> SpillsToKeep;
1277 // Map from BB to the first spill inside of it.
1278 DenseMap<MachineDomTreeNode *, MachineInstr *> SpillBBToSpill;
1279
1280 rmRedundantSpills(Spills, SpillsToRm, SpillBBToSpill);
1281
1282 MachineBasicBlock *Root = LIS.getMBBFromIndex(OrigVNI.def);
1283 getVisitOrders(Root, Spills, Orders, SpillsToRm, SpillsToKeep,
1284 SpillBBToSpill);
1285
1286 // SpillsInSubTreeMap keeps the map from a dom tree node to a pair of
1287 // nodes set and the cost of all the spills inside those nodes.
1288 // The nodes set are the locations where spills are to be inserted
1289 // in the subtree of current node.
Eugene Zelenko900b6332017-08-29 22:32:07 +00001290 using NodesCostPair =
1291 std::pair<SmallPtrSet<MachineDomTreeNode *, 16>, BlockFrequency>;
Wei Mi9a16d652016-04-13 03:08:27 +00001292 DenseMap<MachineDomTreeNode *, NodesCostPair> SpillsInSubTreeMap;
Eugene Zelenko900b6332017-08-29 22:32:07 +00001293
Wei Mi9a16d652016-04-13 03:08:27 +00001294 // Iterate Orders set in reverse order, which will be a bottom-up order
1295 // in the dominator tree. Once we visit a dom tree node, we know its
1296 // children have already been visited and the spill locations in the
1297 // subtrees of all the children have been determined.
1298 SmallVector<MachineDomTreeNode *, 32>::reverse_iterator RIt = Orders.rbegin();
1299 for (; RIt != Orders.rend(); RIt++) {
1300 MachineBasicBlock *Block = (*RIt)->getBlock();
1301
1302 // If Block contains an original spill, simply continue.
1303 if (SpillsToKeep.find(*RIt) != SpillsToKeep.end() && !SpillsToKeep[*RIt]) {
1304 SpillsInSubTreeMap[*RIt].first.insert(*RIt);
1305 // SpillsInSubTreeMap[*RIt].second contains the cost of spill.
1306 SpillsInSubTreeMap[*RIt].second = MBFI.getBlockFreq(Block);
1307 continue;
1308 }
1309
1310 // Collect spills in subtree of current node (*RIt) to
1311 // SpillsInSubTreeMap[*RIt].first.
1312 const std::vector<MachineDomTreeNode *> &Children = (*RIt)->getChildren();
1313 unsigned NumChildren = Children.size();
1314 for (unsigned i = 0; i != NumChildren; ++i) {
1315 MachineDomTreeNode *Child = Children[i];
1316 if (SpillsInSubTreeMap.find(Child) == SpillsInSubTreeMap.end())
1317 continue;
1318 // The stmt "SpillsInSubTree = SpillsInSubTreeMap[*RIt].first" below
1319 // should be placed before getting the begin and end iterators of
1320 // SpillsInSubTreeMap[Child].first, or else the iterators may be
1321 // invalidated when SpillsInSubTreeMap[*RIt] is seen the first time
1322 // and the map grows and then the original buckets in the map are moved.
1323 SmallPtrSet<MachineDomTreeNode *, 16> &SpillsInSubTree =
1324 SpillsInSubTreeMap[*RIt].first;
1325 BlockFrequency &SubTreeCost = SpillsInSubTreeMap[*RIt].second;
1326 SubTreeCost += SpillsInSubTreeMap[Child].second;
1327 auto BI = SpillsInSubTreeMap[Child].first.begin();
1328 auto EI = SpillsInSubTreeMap[Child].first.end();
1329 SpillsInSubTree.insert(BI, EI);
1330 SpillsInSubTreeMap.erase(Child);
1331 }
1332
1333 SmallPtrSet<MachineDomTreeNode *, 16> &SpillsInSubTree =
1334 SpillsInSubTreeMap[*RIt].first;
1335 BlockFrequency &SubTreeCost = SpillsInSubTreeMap[*RIt].second;
1336 // No spills in subtree, simply continue.
1337 if (SpillsInSubTree.empty())
1338 continue;
1339
1340 // Check whether Block is a possible candidate to insert spill.
1341 unsigned LiveReg = 0;
1342 if (!isSpillCandBB(OrigReg, OrigVNI, *Block, LiveReg))
1343 continue;
1344
1345 // If there are multiple spills that could be merged, bias a little
1346 // to hoist the spill.
1347 BranchProbability MarginProb = (SpillsInSubTree.size() > 1)
1348 ? BranchProbability(9, 10)
1349 : BranchProbability(1, 1);
1350 if (SubTreeCost > MBFI.getBlockFreq(Block) * MarginProb) {
1351 // Hoist: Move spills to current Block.
1352 for (const auto SpillBB : SpillsInSubTree) {
1353 // When SpillBB is a BB contains original spill, insert the spill
1354 // to SpillsToRm.
1355 if (SpillsToKeep.find(SpillBB) != SpillsToKeep.end() &&
1356 !SpillsToKeep[SpillBB]) {
1357 MachineInstr *SpillToRm = SpillBBToSpill[SpillBB];
1358 SpillsToRm.push_back(SpillToRm);
1359 }
1360 // SpillBB will not contain spill anymore, remove it from SpillsToKeep.
1361 SpillsToKeep.erase(SpillBB);
1362 }
1363 // Current Block is the BB containing the new hoisted spill. Add it to
1364 // SpillsToKeep. LiveReg is the source of the new spill.
1365 SpillsToKeep[*RIt] = LiveReg;
1366 DEBUG({
1367 dbgs() << "spills in BB: ";
1368 for (const auto Rspill : SpillsInSubTree)
1369 dbgs() << Rspill->getBlock()->getNumber() << " ";
1370 dbgs() << "were promoted to BB" << (*RIt)->getBlock()->getNumber()
1371 << "\n";
1372 });
1373 SpillsInSubTree.clear();
1374 SpillsInSubTree.insert(*RIt);
1375 SubTreeCost = MBFI.getBlockFreq(Block);
1376 }
1377 }
1378 // For spills in SpillsToKeep with LiveReg set (i.e., not original spill),
1379 // save them to SpillsToIns.
1380 for (const auto Ent : SpillsToKeep) {
1381 if (Ent.second)
1382 SpillsToIns[Ent.first->getBlock()] = Ent.second;
1383 }
1384}
1385
Eric Christopher75d661a2016-05-04 21:45:36 +00001386/// For spills with equal values, remove redundant spills and hoist those left
Wei Mi9a16d652016-04-13 03:08:27 +00001387/// to less hot spots.
1388///
1389/// Spills with equal values will be collected into the same set in
1390/// MergeableSpills when spill is inserted. These equal spills are originated
Eric Christopher75d661a2016-05-04 21:45:36 +00001391/// from the same defining instruction and are dominated by the instruction.
1392/// Before hoisting all the equal spills, redundant spills inside in the same
1393/// BB are first marked to be deleted. Then starting from the spills left, walk
1394/// up on the dominator tree towards the Root node where the define instruction
Wei Mi9a16d652016-04-13 03:08:27 +00001395/// is located, mark the dominated spills to be deleted along the way and
1396/// collect the BB nodes on the path from non-dominated spills to the define
1397/// instruction into a WorkSet. The nodes in WorkSet are the candidate places
Eric Christopher75d661a2016-05-04 21:45:36 +00001398/// where we are considering to hoist the spills. We iterate the WorkSet in
1399/// bottom-up order, and for each node, we will decide whether to hoist spills
1400/// inside its subtree to that node. In this way, we can get benefit locally
1401/// even if hoisting all the equal spills to one cold place is impossible.
Wei Mi963f2df2016-04-15 23:16:44 +00001402void HoistSpillHelper::hoistAllSpills() {
1403 SmallVector<unsigned, 4> NewVRegs;
1404 LiveRangeEdit Edit(nullptr, NewVRegs, MF, LIS, &VRM, this);
1405
Wei Mi9a16d652016-04-13 03:08:27 +00001406 // Save the mapping between stackslot and its original reg.
1407 DenseMap<int, unsigned> SlotToOrigReg;
1408 for (unsigned i = 0, e = MRI.getNumVirtRegs(); i != e; ++i) {
1409 unsigned Reg = TargetRegisterInfo::index2VirtReg(i);
1410 int Slot = VRM.getStackSlot(Reg);
1411 if (Slot != VirtRegMap::NO_STACK_SLOT)
1412 SlotToOrigReg[Slot] = VRM.getOriginal(Reg);
1413 unsigned Original = VRM.getPreSplitReg(Reg);
1414 if (!MRI.def_empty(Reg))
1415 Virt2SiblingsMap[Original].insert(Reg);
1416 }
1417
1418 // Each entry in MergeableSpills contains a spill set with equal values.
1419 for (auto &Ent : MergeableSpills) {
1420 int Slot = Ent.first.first;
1421 unsigned OrigReg = SlotToOrigReg[Slot];
Wei Mi8c4136b2016-05-11 22:37:43 +00001422 LiveInterval &OrigLI = LIS.getInterval(OrigReg);
Wei Mi9a16d652016-04-13 03:08:27 +00001423 VNInfo *OrigVNI = Ent.first.second;
1424 SmallPtrSet<MachineInstr *, 16> &EqValSpills = Ent.second;
1425 if (Ent.second.empty())
1426 continue;
1427
1428 DEBUG({
1429 dbgs() << "\nFor Slot" << Slot << " and VN" << OrigVNI->id << ":\n"
1430 << "Equal spills in BB: ";
1431 for (const auto spill : EqValSpills)
1432 dbgs() << spill->getParent()->getNumber() << " ";
1433 dbgs() << "\n";
1434 });
1435
1436 // SpillsToRm is the spill set to be removed from EqValSpills.
1437 SmallVector<MachineInstr *, 16> SpillsToRm;
1438 // SpillsToIns is the spill set to be newly inserted after hoisting.
1439 DenseMap<MachineBasicBlock *, unsigned> SpillsToIns;
1440
1441 runHoistSpills(OrigReg, *OrigVNI, EqValSpills, SpillsToRm, SpillsToIns);
1442
1443 DEBUG({
1444 dbgs() << "Finally inserted spills in BB: ";
1445 for (const auto Ispill : SpillsToIns)
1446 dbgs() << Ispill.first->getNumber() << " ";
1447 dbgs() << "\nFinally removed spills in BB: ";
1448 for (const auto Rspill : SpillsToRm)
1449 dbgs() << Rspill->getParent()->getNumber() << " ";
1450 dbgs() << "\n";
1451 });
1452
1453 // Stack live range update.
1454 LiveInterval &StackIntvl = LSS.getInterval(Slot);
Wei Mi8c4136b2016-05-11 22:37:43 +00001455 if (!SpillsToIns.empty() || !SpillsToRm.empty())
Wei Mi9a16d652016-04-13 03:08:27 +00001456 StackIntvl.MergeValueInAsValue(OrigLI, OrigVNI,
1457 StackIntvl.getValNumInfo(0));
Wei Mi9a16d652016-04-13 03:08:27 +00001458
1459 // Insert hoisted spills.
1460 for (auto const Insert : SpillsToIns) {
1461 MachineBasicBlock *BB = Insert.first;
1462 unsigned LiveReg = Insert.second;
Wei Mif3c8f532016-05-23 19:39:19 +00001463 MachineBasicBlock::iterator MI = IPA.getLastInsertPointIter(OrigLI, *BB);
Wei Mi9a16d652016-04-13 03:08:27 +00001464 TII.storeRegToStackSlot(*BB, MI, LiveReg, false, Slot,
1465 MRI.getRegClass(LiveReg), &TRI);
1466 LIS.InsertMachineInstrRangeInMaps(std::prev(MI), MI);
1467 ++NumSpills;
1468 }
1469
Eric Christopher75d661a2016-05-04 21:45:36 +00001470 // Remove redundant spills or change them to dead instructions.
Wei Mi9a16d652016-04-13 03:08:27 +00001471 NumSpills -= SpillsToRm.size();
1472 for (auto const RMEnt : SpillsToRm) {
1473 RMEnt->setDesc(TII.get(TargetOpcode::KILL));
1474 for (unsigned i = RMEnt->getNumOperands(); i; --i) {
1475 MachineOperand &MO = RMEnt->getOperand(i - 1);
1476 if (MO.isReg() && MO.isImplicit() && MO.isDef() && !MO.isDead())
1477 RMEnt->RemoveOperand(i - 1);
1478 }
1479 }
Wei Mic0223702016-07-08 21:08:09 +00001480 Edit.eliminateDeadDefs(SpillsToRm, None, AA);
Wei Mi9a16d652016-04-13 03:08:27 +00001481 }
1482}
Wei Mi963f2df2016-04-15 23:16:44 +00001483
1484/// For VirtReg clone, the \p New register should have the same physreg or
1485/// stackslot as the \p old register.
1486void HoistSpillHelper::LRE_DidCloneVirtReg(unsigned New, unsigned Old) {
1487 if (VRM.hasPhys(Old))
1488 VRM.assignVirt2Phys(New, VRM.getPhys(Old));
1489 else if (VRM.getStackSlot(Old) != VirtRegMap::NO_STACK_SLOT)
1490 VRM.assignVirt2StackSlot(New, VRM.getStackSlot(Old));
1491 else
1492 llvm_unreachable("VReg should be assigned either physreg or stackslot");
1493}