blob: b547c0f9954d28bf3a1711797d506a75d8767371 [file] [log] [blame]
Chris Lattneraa4c91f2003-12-28 07:59:53 +00001//===-- Passes.cpp - Target independent code generation passes ------------===//
Misha Brukmanedf128a2005-04-21 22:36:52 +00002//
John Criswellb576c942003-10-20 19:43:21 +00003// The LLVM Compiler Infrastructure
4//
Chris Lattner4ee451d2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Misha Brukmanedf128a2005-04-21 22:36:52 +00007//
John Criswellb576c942003-10-20 19:43:21 +00008//===----------------------------------------------------------------------===//
Alkis Evlogimenos7237ece2003-10-02 16:57:49 +00009//
10// This file defines interfaces to access the target independent code
11// generation passes provided by the LLVM backend.
12//
13//===---------------------------------------------------------------------===//
14
Andrew Trickd5422652012-02-04 02:56:48 +000015#include "llvm/Analysis/Passes.h"
16#include "llvm/Analysis/Verifier.h"
17#include "llvm/Transforms/Scalar.h"
18#include "llvm/PassManager.h"
19#include "llvm/CodeGen/GCStrategy.h"
Andrew Trickd5422652012-02-04 02:56:48 +000020#include "llvm/CodeGen/MachineFunctionPass.h"
Alkis Evlogimenos7237ece2003-10-02 16:57:49 +000021#include "llvm/CodeGen/Passes.h"
Andrew Trickd5422652012-02-04 02:56:48 +000022#include "llvm/CodeGen/RegAllocRegistry.h"
23#include "llvm/Target/TargetLowering.h"
Andrew Trickd5422652012-02-04 02:56:48 +000024#include "llvm/Target/TargetOptions.h"
Andrew Trickd5422652012-02-04 02:56:48 +000025#include "llvm/Assembly/PrintModulePass.h"
26#include "llvm/Support/CommandLine.h"
27#include "llvm/Support/Debug.h"
Andrew Trick74613342012-02-04 02:56:45 +000028#include "llvm/Support/ErrorHandling.h"
Jim Laskey13ec7022006-08-01 14:21:23 +000029
Chris Lattneraa4c91f2003-12-28 07:59:53 +000030using namespace llvm;
Brian Gaeked0fde302003-11-11 22:41:34 +000031
Andrew Trickd5422652012-02-04 02:56:48 +000032static cl::opt<bool> DisablePostRA("disable-post-ra", cl::Hidden,
33 cl::desc("Disable Post Regalloc"));
34static cl::opt<bool> DisableBranchFold("disable-branch-fold", cl::Hidden,
35 cl::desc("Disable branch folding"));
36static cl::opt<bool> DisableTailDuplicate("disable-tail-duplicate", cl::Hidden,
37 cl::desc("Disable tail duplication"));
38static cl::opt<bool> DisableEarlyTailDup("disable-early-taildup", cl::Hidden,
39 cl::desc("Disable pre-register allocation tail duplication"));
40static cl::opt<bool> EnableBlockPlacement("enable-block-placement",
41 cl::Hidden, cl::desc("Enable probability-driven block placement"));
42static cl::opt<bool> EnableBlockPlacementStats("enable-block-placement-stats",
43 cl::Hidden, cl::desc("Collect probability-driven block placement stats"));
44static cl::opt<bool> DisableCodePlace("disable-code-place", cl::Hidden,
45 cl::desc("Disable code placement"));
46static cl::opt<bool> DisableSSC("disable-ssc", cl::Hidden,
47 cl::desc("Disable Stack Slot Coloring"));
48static cl::opt<bool> DisableMachineDCE("disable-machine-dce", cl::Hidden,
49 cl::desc("Disable Machine Dead Code Elimination"));
50static cl::opt<bool> DisableMachineLICM("disable-machine-licm", cl::Hidden,
51 cl::desc("Disable Machine LICM"));
52static cl::opt<bool> DisableMachineCSE("disable-machine-cse", cl::Hidden,
53 cl::desc("Disable Machine Common Subexpression Elimination"));
54static cl::opt<bool> DisablePostRAMachineLICM("disable-postra-machine-licm",
55 cl::Hidden,
56 cl::desc("Disable Machine LICM"));
57static cl::opt<bool> DisableMachineSink("disable-machine-sink", cl::Hidden,
58 cl::desc("Disable Machine Sinking"));
59static cl::opt<bool> DisableLSR("disable-lsr", cl::Hidden,
60 cl::desc("Disable Loop Strength Reduction Pass"));
61static cl::opt<bool> DisableCGP("disable-cgp", cl::Hidden,
62 cl::desc("Disable Codegen Prepare"));
63static cl::opt<bool> DisableCopyProp("disable-copyprop", cl::Hidden,
64 cl::desc("Disable Copy Propagation pass"));
65static cl::opt<bool> PrintLSR("print-lsr-output", cl::Hidden,
66 cl::desc("Print LLVM IR produced by the loop-reduce pass"));
67static cl::opt<bool> PrintISelInput("print-isel-input", cl::Hidden,
68 cl::desc("Print LLVM IR input to isel pass"));
69static cl::opt<bool> PrintGCInfo("print-gc", cl::Hidden,
70 cl::desc("Dump garbage collector data"));
71static cl::opt<bool> VerifyMachineCode("verify-machineinstrs", cl::Hidden,
72 cl::desc("Verify generated machine code"),
73 cl::init(getenv("LLVM_VERIFY_MACHINEINSTRS")!=NULL));
74
Jim Laskeyeb577ba2006-08-02 12:30:23 +000075//===---------------------------------------------------------------------===//
Andrew Trick74613342012-02-04 02:56:45 +000076/// TargetPassConfig
77//===---------------------------------------------------------------------===//
78
79INITIALIZE_PASS(TargetPassConfig, "targetpassconfig",
80 "Target Pass Configuration", false, false)
81char TargetPassConfig::ID = 0;
82
83// Out of line virtual method.
84TargetPassConfig::~TargetPassConfig() {}
85
Andrew Trick61f1e3d2012-02-08 21:22:48 +000086// Out of line constructor provides default values for pass options and
87// registers all common codegen passes.
Andrew Trick061efcf2012-02-04 02:56:59 +000088TargetPassConfig::TargetPassConfig(TargetMachine *tm, PassManagerBase &pm)
Andrew Trickffea03f2012-02-08 21:22:39 +000089 : ImmutablePass(ID), TM(tm), PM(pm), Initialized(false),
90 DisableVerify(false),
91 EnableTailMerge(true) {
92
Andrew Trick74613342012-02-04 02:56:45 +000093 // Register all target independent codegen passes to activate their PassIDs,
94 // including this pass itself.
95 initializeCodeGen(*PassRegistry::getPassRegistry());
96}
97
98/// createPassConfig - Create a pass configuration object to be used by
99/// addPassToEmitX methods for generating a pipeline of CodeGen passes.
100///
101/// Targets may override this to extend TargetPassConfig.
Andrew Trick061efcf2012-02-04 02:56:59 +0000102TargetPassConfig *LLVMTargetMachine::createPassConfig(PassManagerBase &PM) {
103 return new TargetPassConfig(this, PM);
Andrew Trick74613342012-02-04 02:56:45 +0000104}
105
106TargetPassConfig::TargetPassConfig()
107 : ImmutablePass(ID), PM(*(PassManagerBase*)0) {
108 llvm_unreachable("TargetPassConfig should not be constructed on-the-fly");
109}
110
Andrew Trickffea03f2012-02-08 21:22:39 +0000111// Helper to verify the analysis is really immutable.
112void TargetPassConfig::setOpt(bool &Opt, bool Val) {
113 assert(!Initialized && "PassConfig is immutable");
114 Opt = Val;
115}
116
Andrew Trickebe18ef2012-02-08 21:22:34 +0000117void TargetPassConfig::addPass(char &ID) {
118 // FIXME: check user overrides
119 Pass *P = Pass::createPass(ID);
120 if (!P)
121 llvm_unreachable("Pass ID not registered");
122 PM.add(P);
Andrew Trick061efcf2012-02-04 02:56:59 +0000123}
Andrew Trickd5422652012-02-04 02:56:48 +0000124
125void TargetPassConfig::printNoVerify(const char *Banner) const {
126 if (TM->shouldPrintMachineCode())
127 PM.add(createMachineFunctionPrinterPass(dbgs(), Banner));
128}
129
130void TargetPassConfig::printAndVerify(const char *Banner) const {
131 if (TM->shouldPrintMachineCode())
132 PM.add(createMachineFunctionPrinterPass(dbgs(), Banner));
133
134 if (VerifyMachineCode)
135 PM.add(createMachineVerifierPass(Banner));
136}
137
Andrew Trick061efcf2012-02-04 02:56:59 +0000138/// Add common target configurable passes that perform LLVM IR to IR transforms
139/// following machine independent optimization.
140void TargetPassConfig::addIRPasses() {
Andrew Trickd5422652012-02-04 02:56:48 +0000141 // Basic AliasAnalysis support.
142 // Add TypeBasedAliasAnalysis before BasicAliasAnalysis so that
143 // BasicAliasAnalysis wins if they disagree. This is intended to help
144 // support "obvious" type-punning idioms.
145 PM.add(createTypeBasedAliasAnalysisPass());
146 PM.add(createBasicAliasAnalysisPass());
147
148 // Before running any passes, run the verifier to determine if the input
149 // coming from the front-end and/or optimizer is valid.
150 if (!DisableVerify)
151 PM.add(createVerifierPass());
152
153 // Run loop strength reduction before anything else.
154 if (getOptLevel() != CodeGenOpt::None && !DisableLSR) {
155 PM.add(createLoopStrengthReducePass(getTargetLowering()));
156 if (PrintLSR)
157 PM.add(createPrintFunctionPass("\n\n*** Code after LSR ***\n", &dbgs()));
158 }
159
160 PM.add(createGCLoweringPass());
161
162 // Make sure that no unreachable blocks are instruction selected.
163 PM.add(createUnreachableBlockEliminationPass());
Andrew Trick061efcf2012-02-04 02:56:59 +0000164}
Andrew Trickd5422652012-02-04 02:56:48 +0000165
Andrew Trick061efcf2012-02-04 02:56:59 +0000166/// Add common passes that perform LLVM IR to IR transforms in preparation for
167/// instruction selection.
168void TargetPassConfig::addISelPrepare() {
Andrew Trickd5422652012-02-04 02:56:48 +0000169 if (getOptLevel() != CodeGenOpt::None && !DisableCGP)
170 PM.add(createCodeGenPreparePass(getTargetLowering()));
171
172 PM.add(createStackProtectorPass(getTargetLowering()));
173
174 addPreISel();
175
176 if (PrintISelInput)
177 PM.add(createPrintFunctionPass("\n\n"
178 "*** Final LLVM Code input to ISel ***\n",
179 &dbgs()));
180
181 // All passes which modify the LLVM IR are now complete; run the verifier
182 // to ensure that the IR is valid.
183 if (!DisableVerify)
184 PM.add(createVerifierPass());
Andrew Trick061efcf2012-02-04 02:56:59 +0000185}
Andrew Trickd5422652012-02-04 02:56:48 +0000186
Andrew Trickf7b96312012-02-09 00:40:55 +0000187/// Add the complete set of target-independent postISel code generator passes.
188///
189/// This can be read as the standard order of major LLVM CodeGen stages. Stages
190/// with nontrivial configuration or multiple passes are broken out below in
191/// add%Stage routines.
192///
193/// Any TargetPassConfig::addXX routine may be overriden by the Target. The
194/// addPre/Post methods with empty header implementations allow injecting
195/// target-specific fixups just before or after major stages. Additionally,
196/// targets have the flexibility to change pass order within a stage by
197/// overriding default implementation of add%Stage routines below. Each
198/// technique has maintainability tradeoffs because alternate pass orders are
199/// not well supported. addPre/Post works better if the target pass is easily
200/// tied to a common pass. But if it has subtle dependencies on multiple passes,
201/// overriding the stage instead.
202///
203/// TODO: We could use a single addPre/Post(ID) hook to allow pass injection
204/// before/after any target-independent pass. But it's currently overkill.
Andrew Trick061efcf2012-02-04 02:56:59 +0000205void TargetPassConfig::addMachinePasses() {
Andrew Trickd5422652012-02-04 02:56:48 +0000206 // Print the instruction selected machine code...
207 printAndVerify("After Instruction Selection");
208
209 // Expand pseudo-instructions emitted by ISel.
Andrew Trick1dd8c852012-02-08 21:23:13 +0000210 addPass(ExpandISelPseudosID);
Andrew Trickd5422652012-02-04 02:56:48 +0000211
Andrew Trickf7b96312012-02-09 00:40:55 +0000212 // Add passes that optimize machine instructions in SSA form.
Andrew Trickd5422652012-02-04 02:56:48 +0000213 if (getOptLevel() != CodeGenOpt::None) {
Andrew Trickf7b96312012-02-09 00:40:55 +0000214 addMachineSSAOptimization();
215 }
216 else {
217 // If the target requests it, assign local variables to stack slots relative
218 // to one another and simplify frame index references where possible.
219 addPass(LocalStackSlotAllocationID);
Andrew Trickd5422652012-02-04 02:56:48 +0000220 }
221
222 // Run pre-ra passes.
223 if (addPreRegAlloc())
224 printAndVerify("After PreRegAlloc passes");
225
Andrew Trickf7b96312012-02-09 00:40:55 +0000226 // Run register allocation and passes that are tightly coupled with it,
227 // including phi elimination and scheduling.
228 addRegAlloc();
Andrew Trickd5422652012-02-04 02:56:48 +0000229
230 // Run post-ra passes.
231 if (addPostRegAlloc())
232 printAndVerify("After PostRegAlloc passes");
233
234 // Insert prolog/epilog code. Eliminate abstract frame index references...
Andrew Trick1dd8c852012-02-08 21:23:13 +0000235 addPass(PrologEpilogCodeInserterID);
Andrew Trickd5422652012-02-04 02:56:48 +0000236 printAndVerify("After PrologEpilogCodeInserter");
237
Andrew Trickf7b96312012-02-09 00:40:55 +0000238 /// Add passes that optimize machine instructions after register allocation.
239 if (getOptLevel() != CodeGenOpt::None)
240 addMachineLateOptimization();
Andrew Trickd5422652012-02-04 02:56:48 +0000241
242 // Expand pseudo instructions before second scheduling pass.
Andrew Trick1dd8c852012-02-08 21:23:13 +0000243 addPass(ExpandPostRAPseudosID);
Andrew Trickd5422652012-02-04 02:56:48 +0000244 printNoVerify("After ExpandPostRAPseudos");
245
246 // Run pre-sched2 passes.
247 if (addPreSched2())
248 printNoVerify("After PreSched2 passes");
249
250 // Second pass scheduler.
251 if (getOptLevel() != CodeGenOpt::None && !DisablePostRA) {
Andrew Trick1dd8c852012-02-08 21:23:13 +0000252 addPass(PostRASchedulerID);
Andrew Trickd5422652012-02-04 02:56:48 +0000253 printNoVerify("After PostRAScheduler");
254 }
255
Andrew Trickf7b96312012-02-09 00:40:55 +0000256 // GC
Andrew Trick1dd8c852012-02-08 21:23:13 +0000257 addPass(GCMachineCodeAnalysisID);
Andrew Trickd5422652012-02-04 02:56:48 +0000258 if (PrintGCInfo)
259 PM.add(createGCInfoPrinter(dbgs()));
260
Andrew Trickf7b96312012-02-09 00:40:55 +0000261 // Basic block placement.
262 if (getOptLevel() != CodeGenOpt::None && !DisableCodePlace)
263 addBlockPlacement();
Andrew Trickd5422652012-02-04 02:56:48 +0000264
265 if (addPreEmitPass())
266 printNoVerify("After PreEmit passes");
Andrew Trickd5422652012-02-04 02:56:48 +0000267}
268
Andrew Trickf7b96312012-02-09 00:40:55 +0000269/// Add passes that optimize machine instructions in SSA form.
270void TargetPassConfig::addMachineSSAOptimization() {
271 // Pre-ra tail duplication.
272 if (!DisableEarlyTailDup) {
273 addPass(TailDuplicateID);
274 printAndVerify("After Pre-RegAlloc TailDuplicate");
275 }
276
277 // Optimize PHIs before DCE: removing dead PHI cycles may make more
278 // instructions dead.
279 addPass(OptimizePHIsID);
280
281 // If the target requests it, assign local variables to stack slots relative
282 // to one another and simplify frame index references where possible.
283 addPass(LocalStackSlotAllocationID);
284
285 // With optimization, dead code should already be eliminated. However
286 // there is one known exception: lowered code for arguments that are only
287 // used by tail calls, where the tail calls reuse the incoming stack
288 // arguments directly (see t11 in test/CodeGen/X86/sibcall.ll).
289 if (!DisableMachineDCE)
290 addPass(DeadMachineInstructionElimID);
291 printAndVerify("After codegen DCE pass");
292
293 if (!DisableMachineLICM)
294 addPass(MachineLICMID);
295 if (!DisableMachineCSE)
296 addPass(MachineCSEID);
297 if (!DisableMachineSink)
298 addPass(MachineSinkingID);
299 printAndVerify("After Machine LICM, CSE and Sinking passes");
300
301 addPass(PeepholeOptimizerID);
302 printAndVerify("After codegen peephole optimization pass");
303}
304
Andrew Trick74613342012-02-04 02:56:45 +0000305//===---------------------------------------------------------------------===//
Andrew Trickf7b96312012-02-09 00:40:55 +0000306/// Register Allocation Pass Configuration
Jim Laskeyeb577ba2006-08-02 12:30:23 +0000307//===---------------------------------------------------------------------===//
Andrew Trickf7b96312012-02-09 00:40:55 +0000308
309/// RegisterRegAlloc's global Registry tracks allocator registration.
Jim Laskeyeb577ba2006-08-02 12:30:23 +0000310MachinePassRegistry RegisterRegAlloc::Registry;
311
Andrew Trickf7b96312012-02-09 00:40:55 +0000312/// A dummy default pass factory indicates whether the register allocator is
313/// overridden on the command line.
Jakob Stoklund Olesen700bfad2010-05-27 23:57:25 +0000314static FunctionPass *createDefaultRegisterAllocator() { return 0; }
315static RegisterRegAlloc
316defaultRegAlloc("default",
317 "pick register allocator based on -O option",
318 createDefaultRegisterAllocator);
Jim Laskeyeb577ba2006-08-02 12:30:23 +0000319
Andrew Trickf7b96312012-02-09 00:40:55 +0000320/// -regalloc=... command line option.
Dan Gohman844731a2008-05-13 00:00:25 +0000321static cl::opt<RegisterRegAlloc::FunctionPassCtor, false,
322 RegisterPassParser<RegisterRegAlloc> >
323RegAlloc("regalloc",
Jakob Stoklund Olesen700bfad2010-05-27 23:57:25 +0000324 cl::init(&createDefaultRegisterAllocator),
325 cl::desc("Register allocator to use"));
Alkis Evlogimenos7237ece2003-10-02 16:57:49 +0000326
Jim Laskeyeb577ba2006-08-02 12:30:23 +0000327
Jim Laskeyeb577ba2006-08-02 12:30:23 +0000328/// createRegisterAllocator - choose the appropriate register allocator.
Jakob Stoklund Olesen700bfad2010-05-27 23:57:25 +0000329FunctionPass *llvm::createRegisterAllocator(CodeGenOpt::Level OptLevel) {
Jim Laskey9ff542f2006-08-01 18:29:48 +0000330 RegisterRegAlloc::FunctionPassCtor Ctor = RegisterRegAlloc::getDefault();
Jakob Stoklund Olesen700bfad2010-05-27 23:57:25 +0000331
Jim Laskey13ec7022006-08-01 14:21:23 +0000332 if (!Ctor) {
Jim Laskeyeb577ba2006-08-02 12:30:23 +0000333 Ctor = RegAlloc;
334 RegisterRegAlloc::setDefault(RegAlloc);
Jim Laskey13ec7022006-08-01 14:21:23 +0000335 }
Jakob Stoklund Olesen700bfad2010-05-27 23:57:25 +0000336
337 if (Ctor != createDefaultRegisterAllocator)
338 return Ctor();
339
340 // When the 'default' allocator is requested, pick one based on OptLevel.
341 switch (OptLevel) {
342 case CodeGenOpt::None:
Jakob Stoklund Olesen8b89c642010-06-03 00:39:06 +0000343 return createFastRegisterAllocator();
Jakob Stoklund Olesen700bfad2010-05-27 23:57:25 +0000344 default:
Jakob Stoklund Olesen5aa32112011-04-30 01:37:54 +0000345 return createGreedyRegisterAllocator();
Jakob Stoklund Olesen700bfad2010-05-27 23:57:25 +0000346 }
Jim Laskey33a0a6d2006-07-27 20:05:00 +0000347}
Andrew Trickf7b96312012-02-09 00:40:55 +0000348
349/// Add standard target-independent passes that are tightly coupled with
350/// register allocation, including coalescing, machine instruction scheduling,
351/// and register allocation itself.
352///
353/// FIXME: This will become the register allocation "super pass" pipeline.
354void TargetPassConfig::addRegAlloc() {
355 // Perform register allocation.
356 PM.add(createRegisterAllocator(getOptLevel()));
357 printAndVerify("After Register Allocation");
358
359 // Perform stack slot coloring and post-ra machine LICM.
360 if (getOptLevel() != CodeGenOpt::None) {
361 // FIXME: Re-enable coloring with register when it's capable of adding
362 // kill markers.
363 if (!DisableSSC)
364 addPass(StackSlotColoringID);
365
366 // Run post-ra machine LICM to hoist reloads / remats.
367 //
368 // FIXME: can this move into MachineLateOptimization?
369 if (!DisablePostRAMachineLICM)
370 addPass(MachineLICMID);
371
372 printAndVerify("After StackSlotColoring and postra Machine LICM");
373 }
374}
375
376//===---------------------------------------------------------------------===//
377/// Post RegAlloc Pass Configuration
378//===---------------------------------------------------------------------===//
379
380/// Add passes that optimize machine instructions after register allocation.
381void TargetPassConfig::addMachineLateOptimization() {
382 // Branch folding must be run after regalloc and prolog/epilog insertion.
383 if (!DisableBranchFold) {
384 addPass(BranchFolderPassID);
385 printNoVerify("After BranchFolding");
386 }
387
388 // Tail duplication.
389 if (!DisableTailDuplicate) {
390 addPass(TailDuplicateID);
391 printNoVerify("After TailDuplicate");
392 }
393
394 // Copy propagation.
395 if (!DisableCopyProp) {
396 addPass(MachineCopyPropagationID);
397 printNoVerify("After copy propagation pass");
398 }
399}
400
401/// Add standard basic block placement passes.
402void TargetPassConfig::addBlockPlacement() {
403 if (EnableBlockPlacement) {
404 // MachineBlockPlacement is an experimental pass which is disabled by
405 // default currently. Eventually it should subsume CodePlacementOpt, so
406 // when enabled, the other is disabled.
407 addPass(MachineBlockPlacementID);
408 printNoVerify("After MachineBlockPlacement");
409 } else {
410 addPass(CodePlacementOptID);
411 printNoVerify("After CodePlacementOpt");
412 }
413
414 // Run a separate pass to collect block placement statistics.
415 if (EnableBlockPlacementStats) {
416 addPass(MachineBlockPlacementStatsID);
417 printNoVerify("After MachineBlockPlacementStats");
418 }
419}