Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 1 | //===- PassManagerBuilder.cpp - Build Standard Pass -----------------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file defines the PassManagerBuilder class, which is used to set up a |
| 11 | // "standard" optimization sequence suitable for languages like C and C++. |
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 15 | #include "llvm/Transforms/IPO/PassManagerBuilder.h" |
Rafael Espindola | 07f60915 | 2011-08-09 22:17:34 +0000 | [diff] [blame] | 16 | #include "llvm-c/Transforms/PassManagerBuilder.h" |
Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 17 | #include "llvm/ADT/SmallVector.h" |
Chandler Carruth | 17e0bc3 | 2015-08-06 07:33:15 +0000 | [diff] [blame] | 18 | #include "llvm/Analysis/BasicAliasAnalysis.h" |
George Burgess IV | bfa401e | 2016-07-06 00:26:41 +0000 | [diff] [blame] | 19 | #include "llvm/Analysis/CFLAndersAliasAnalysis.h" |
| 20 | #include "llvm/Analysis/CFLSteensAliasAnalysis.h" |
Chandler Carruth | 21dcff7 | 2015-08-14 03:48:20 +0000 | [diff] [blame] | 21 | #include "llvm/Analysis/GlobalsModRef.h" |
Easwaran Raman | 61edc10 | 2016-08-11 18:24:08 +0000 | [diff] [blame] | 22 | #include "llvm/Analysis/InlineCost.h" |
Chandler Carruth | 3a040e6 | 2015-12-27 08:41:34 +0000 | [diff] [blame] | 23 | #include "llvm/Analysis/Passes.h" |
Chandler Carruth | 42ff448 | 2015-08-14 02:55:50 +0000 | [diff] [blame] | 24 | #include "llvm/Analysis/ScopedNoAliasAA.h" |
Chandler Carruth | 62d4215 | 2015-01-15 02:16:27 +0000 | [diff] [blame] | 25 | #include "llvm/Analysis/TargetLibraryInfo.h" |
Chandler Carruth | 1db2282 | 2015-08-14 03:33:48 +0000 | [diff] [blame] | 26 | #include "llvm/Analysis/TypeBasedAliasAnalysis.h" |
Chandler Carruth | 3a040e6 | 2015-12-27 08:41:34 +0000 | [diff] [blame] | 27 | #include "llvm/IR/DataLayout.h" |
Chandler Carruth | 3a040e6 | 2015-12-27 08:41:34 +0000 | [diff] [blame] | 28 | #include "llvm/IR/LegacyPassManager.h" |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 29 | #include "llvm/IR/ModuleSummaryIndex.h" |
Chandler Carruth | 3a040e6 | 2015-12-27 08:41:34 +0000 | [diff] [blame] | 30 | #include "llvm/IR/Verifier.h" |
| 31 | #include "llvm/Support/CommandLine.h" |
| 32 | #include "llvm/Support/ManagedStatic.h" |
Rafael Espindola | 7cebf36 | 2014-08-21 20:03:44 +0000 | [diff] [blame] | 33 | #include "llvm/Target/TargetMachine.h" |
Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 34 | #include "llvm/Transforms/IPO.h" |
Chandler Carruth | f49f1a87 | 2015-12-27 08:13:45 +0000 | [diff] [blame] | 35 | #include "llvm/Transforms/IPO/ForceFunctionAttrs.h" |
Chandler Carruth | 9c4ed17 | 2016-02-18 11:03:11 +0000 | [diff] [blame] | 36 | #include "llvm/Transforms/IPO/FunctionAttrs.h" |
Chandler Carruth | 3a040e6 | 2015-12-27 08:41:34 +0000 | [diff] [blame] | 37 | #include "llvm/Transforms/IPO/InferFunctionAttrs.h" |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 38 | #include "llvm/Transforms/Instrumentation.h" |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 39 | #include "llvm/Transforms/Scalar.h" |
Chandler Carruth | 89c45a1 | 2016-03-11 08:50:55 +0000 | [diff] [blame] | 40 | #include "llvm/Transforms/Scalar/GVN.h" |
Chandler Carruth | 1353f9a | 2017-04-27 18:45:20 +0000 | [diff] [blame] | 41 | #include "llvm/Transforms/Scalar/SimpleLoopUnswitch.h" |
Hal Finkel | c34e511 | 2012-02-01 03:51:43 +0000 | [diff] [blame] | 42 | #include "llvm/Transforms/Vectorize.h" |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 43 | |
| 44 | using namespace llvm; |
| 45 | |
Hal Finkel | c34e511 | 2012-02-01 03:51:43 +0000 | [diff] [blame] | 46 | static cl::opt<bool> |
Xinliang David Li | 126157c | 2017-05-22 16:41:57 +0000 | [diff] [blame] | 47 | RunPartialInlining("enable-partial-inlining", cl::init(false), cl::Hidden, |
| 48 | cl::ZeroOrMore, cl::desc("Run Partial inlinining pass")); |
| 49 | |
// -vectorize-loops: hidden flag with no explicit initial value. The
// PassManagerBuilder constructor copies it into LoopVectorize.
static cl::opt<bool>
RunLoopVectorization("vectorize-loops", cl::Hidden,
                     cl::desc("Run the Loop vectorization passes"));

// -vectorize-slp: hidden flag with no explicit initial value. The
// PassManagerBuilder constructor copies it into SLPVectorize.
static cl::opt<bool>
RunSLPVectorization("vectorize-slp", cl::Hidden,
                    cl::desc("Run the SLP vectorization passes"));

// -use-gvn-after-vectorization: hidden flag, off by default.
static cl::opt<bool>
UseGVNAfterVectorization("use-gvn-after-vectorization",
  cl::init(false), cl::Hidden,
  cl::desc("Run GVN instead of Early CSE after vectorization passes"));

// -extra-vectorizer-passes: hidden flag, off by default.
static cl::opt<bool> ExtraVectorizerPasses(
    "extra-vectorizer-passes", cl::init(false), cl::Hidden,
    cl::desc("Run cleanup optimization passes after vectorization."));

// -reroll-loops: hidden flag with no explicit initial value. The
// PassManagerBuilder constructor copies it into RerollLoops.
static cl::opt<bool>
RunLoopRerolling("reroll-loops", cl::Hidden,
                 cl::desc("Run the loop rerolling pass"));

// -enable-newgvn: hidden flag, off by default. The PassManagerBuilder
// constructor copies it into NewGVN.
static cl::opt<bool> RunNewGVN("enable-newgvn", cl::init(false), cl::Hidden,
                               cl::desc("Run the NewGVN pass"));

// -run-slp-after-loop-vectorization: hidden flag, on by default. When it is
// off and SLPVectorize is set, addFunctionSimplificationPasses() adds the SLP
// vectorizer itself.
// NOTE(review): the description still mentions a BB vectorizer, but no such
// pass is added in the visible part of this file -- confirm whether the text
// is stale.
static cl::opt<bool>
RunSLPAfterLoopVectorization("run-slp-after-loop-vectorization",
  cl::init(true), cl::Hidden,
  cl::desc("Run the SLP vectorizer (and BB vectorizer) after the Loop "
           "vectorizer instead of before"));
| 79 | |
// Experimental option to use CFL-AA
// CFLAAType enumerates the selectable variants; UseCFLAA is the hidden
// -use-cfl-aa flag (default: none) that addInitialAliasAnalysisPasses()
// switches on. The accepted spellings are "none", "steens", "anders" and
// "both".
enum class CFLAAType { None, Steensgaard, Andersen, Both };
static cl::opt<CFLAAType>
    UseCFLAA("use-cfl-aa", cl::init(CFLAAType::None), cl::Hidden,
             cl::desc("Enable the new, experimental CFL alias analysis"),
             cl::values(clEnumValN(CFLAAType::None, "none", "Disable CFL-AA"),
                        clEnumValN(CFLAAType::Steensgaard, "steens",
                                   "Enable unification-based CFL-AA"),
                        clEnumValN(CFLAAType::Andersen, "anders",
                                   "Enable inclusion-based CFL-AA"),
                        clEnumValN(CFLAAType::Both, "both",
                                   "Enable both variants of CFL-AA")));
James Molloy | 568da09 | 2014-08-06 12:56:19 +0000 | [diff] [blame] | 92 | |
// -enable-loopinterchange: hidden flag, off by default. When set,
// addFunctionSimplificationPasses() adds the loop interchange pass followed by
// a CFG simplification pass.
static cl::opt<bool> EnableLoopInterchange(
    "enable-loopinterchange", cl::init(false), cl::Hidden,
    cl::desc("Enable the new, experimental LoopInterchange Pass"));

// -prepare-for-thinlto: hidden flag, off by default. The PassManagerBuilder
// constructor copies it into PrepareForThinLTO.
static cl::opt<bool>
    EnablePrepareForThinLTO("prepare-for-thinlto", cl::init(false), cl::Hidden,
                            cl::desc("Enable preparation for ThinLTO."));

// -profile-generate: hidden flag, off by default. The PassManagerBuilder
// constructor copies it into EnablePGOInstrGen.
static cl::opt<bool> RunPGOInstrGen(
    "profile-generate", cl::init(false), cl::Hidden,
    cl::desc("Enable PGO instrumentation."));

// -profile-generate-file: hidden string option, empty by default. The
// PassManagerBuilder constructor copies it into PGOInstrGen.
static cl::opt<std::string>
    PGOOutputFile("profile-generate-file", cl::init(""), cl::Hidden,
                  cl::desc("Specify the path of profile data file."));

// -profile-use=<filename>: hidden string option, empty by default. The
// PassManagerBuilder constructor copies it into PGOInstrUse; a non-empty value
// makes addPGOInstrPasses() add the PGO instrumentation-use pass.
static cl::opt<std::string> RunPGOInstrUse(
    "profile-use", cl::init(""), cl::Hidden, cl::value_desc("filename"),
    cl::desc("Enable use phase of PGO instrumentation and specify the path "
             "of profile data file"));

// -enable-loop-versioning-licm: hidden flag, off by default.
static cl::opt<bool> UseLoopVersioningLICM(
    "enable-loop-versioning-licm", cl::init(false), cl::Hidden,
    cl::desc("Enable the experimental Loop Versioning LICM pass"));

// -disable-preinline: hidden flag, off by default. When set,
// addPGOInstrPasses() skips the pre-instrumentation inliner and its cleanup
// passes.
static cl::opt<bool>
    DisablePreInliner("disable-preinline", cl::init(false), cl::Hidden,
                      cl::desc("Disable pre-instrumentation inliner"));

// -preinline-threshold: hidden integer option (default 75, may be repeated).
// addPGOInstrPasses() uses it as the DefaultThreshold of the pre-inliner's
// InlineParams.
static cl::opt<int> PreInlineThreshold(
    "preinline-threshold", cl::Hidden, cl::init(75), cl::ZeroOrMore,
    cl::desc("Control the amount of inlining in pre-instrumentation inliner "
             "(default = 75)"));
| 126 | |
// -enable-earlycse-memssa: hidden flag, on by default. Its value is passed to
// createEarlyCSEPass() in addFunctionSimplificationPasses().
static cl::opt<bool> EnableEarlyCSEMemSSA(
    "enable-earlycse-memssa", cl::init(true), cl::Hidden,
    cl::desc("Enable the EarlyCSE w/ MemorySSA pass (default = on)"));

// -enable-gvn-hoist: hidden flag, off by default. When set,
// addFunctionSimplificationPasses() adds the GVN hoisting pass.
static cl::opt<bool> EnableGVNHoist(
    "enable-gvn-hoist", cl::init(false), cl::Hidden,
    cl::desc("Enable the GVN hoisting pass (default = off)"));

// -disable-libcalls-shrinkwrap: hidden flag, off by default. When set,
// addFunctionSimplificationPasses() does not add the library-call shrink-wrap
// pass.
static cl::opt<bool>
    DisableLibCallsShrinkWrap("disable-libcalls-shrinkwrap", cl::init(false),
                              cl::Hidden,
                              cl::desc("Disable shrink-wrap library calls"));

// -enable-simple-loop-unswitch: hidden flag, off by default. Selects the
// simple loop unswitch pass instead of createLoopUnswitchPass() in
// addFunctionSimplificationPasses().
static cl::opt<bool>
    EnableSimpleLoopUnswitch("enable-simple-loop-unswitch", cl::init(false),
                             cl::Hidden,
                             cl::desc("Enable the simple loop unswitch pass."));

// -enable-gvn-sink: hidden flag, off by default. When set,
// addFunctionSimplificationPasses() adds the GVN sinking pass followed by a
// CFG simplification pass.
static cl::opt<bool> EnableGVNSink(
    "enable-gvn-sink", cl::init(false), cl::Hidden,
    cl::desc("Enable the GVN sinking pass (default = off)"));
James Molloy | a929063 | 2017-05-25 12:51:11 +0000 | [diff] [blame] | 148 | |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 149 | PassManagerBuilder::PassManagerBuilder() { |
| 150 | OptLevel = 2; |
| 151 | SizeLevel = 0; |
Craig Topper | f40110f | 2014-04-25 05:29:35 +0000 | [diff] [blame] | 152 | LibraryInfo = nullptr; |
| 153 | Inliner = nullptr; |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 154 | DisableUnrollLoops = false; |
Nadav Rotem | a1e5e44 | 2013-04-15 04:54:42 +0000 | [diff] [blame] | 155 | SLPVectorize = RunSLPVectorization; |
Nadav Rotem | c59ae20 | 2012-10-29 16:36:25 +0000 | [diff] [blame] | 156 | LoopVectorize = RunLoopVectorization; |
Hal Finkel | 29aeb20 | 2013-11-17 16:02:50 +0000 | [diff] [blame] | 157 | RerollLoops = RunLoopRerolling; |
Davide Italiano | fe7a3ee | 2016-12-26 18:26:19 +0000 | [diff] [blame] | 158 | NewGVN = RunNewGVN; |
Rafael Espindola | 208bc53 | 2014-08-21 13:13:17 +0000 | [diff] [blame] | 159 | DisableGVNLoadPRE = false; |
Rafael Espindola | 7cebf36 | 2014-08-21 20:03:44 +0000 | [diff] [blame] | 160 | VerifyInput = false; |
| 161 | VerifyOutput = false; |
Nick Lewycky | 9e6d184 | 2014-09-13 21:46:00 +0000 | [diff] [blame] | 162 | MergeFunctions = false; |
Teresa Johnson | d3a33a1 | 2015-07-06 16:22:42 +0000 | [diff] [blame] | 163 | PrepareForLTO = false; |
Xinliang David Li | 9239245 | 2016-07-23 04:28:52 +0000 | [diff] [blame] | 164 | EnablePGOInstrGen = RunPGOInstrGen; |
| 165 | PGOInstrGen = PGOOutputFile; |
Rong Xu | 34abbfb | 2016-01-21 18:28:59 +0000 | [diff] [blame] | 166 | PGOInstrUse = RunPGOInstrUse; |
Teresa Johnson | fbb431b | 2016-09-17 20:40:16 +0000 | [diff] [blame] | 167 | PrepareForThinLTO = EnablePrepareForThinLTO; |
Mehdi Amini | 1db10ac | 2016-02-16 23:02:29 +0000 | [diff] [blame] | 168 | PerformThinLTO = false; |
Stanislav Mekhanoshin | ee2dd78 | 2017-03-17 17:13:41 +0000 | [diff] [blame] | 169 | DivergentTarget = false; |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 170 | } |
| 171 | |
/// Destroy the builder, deleting the LibraryInfo and Inliner objects it still
/// points to. Both start out as nullptr, and populateModulePassManager()
/// resets Inliner to nullptr after adding it to a pass manager, so an inliner
/// handed over that way is not deleted here.
PassManagerBuilder::~PassManagerBuilder() {
  delete LibraryInfo;
  delete Inliner;
}
| 176 | |
/// Set of global extensions, automatically added as part of the standard set.
/// Each entry pairs an extension point with the callback to run at that
/// point. The container lives in a ManagedStatic, so it is only constructed
/// when first dereferenced (see GlobalExtensionsNotEmpty()).
static ManagedStatic<SmallVector<std::pair<PassManagerBuilder::ExtensionPointTy,
   PassManagerBuilder::ExtensionFn>, 8> > GlobalExtensions;
| 180 | |
Frederich Munch | 52dfcd1 | 2017-07-06 00:09:09 +0000 | [diff] [blame] | 181 | /// Check if GlobalExtensions is constructed and not empty. |
| 182 | /// Since GlobalExtensions is a managed static, calling 'empty()' will trigger |
| 183 | /// the construction of the object. |
| 184 | static bool GlobalExtensionsNotEmpty() { |
| 185 | return GlobalExtensions.isConstructed() && !GlobalExtensions->empty(); |
| 186 | } |
| 187 | |
Frederich Munch | 6391c7e | 2017-06-13 19:05:24 +0000 | [diff] [blame] | 188 | void PassManagerBuilder::addGlobalExtension( |
| 189 | PassManagerBuilder::ExtensionPointTy Ty, |
| 190 | PassManagerBuilder::ExtensionFn Fn) { |
| 191 | GlobalExtensions->push_back(std::make_pair(Ty, std::move(Fn))); |
David Chisnall | 719a72f | 2011-08-16 13:58:41 +0000 | [diff] [blame] | 192 | } |
| 193 | |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 194 | void PassManagerBuilder::addExtension(ExtensionPointTy Ty, ExtensionFn Fn) { |
Justin Lebar | 2fe1323 | 2016-03-30 20:39:29 +0000 | [diff] [blame] | 195 | Extensions.push_back(std::make_pair(Ty, std::move(Fn))); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 196 | } |
| 197 | |
| 198 | void PassManagerBuilder::addExtensionsToPM(ExtensionPointTy ETy, |
Chandler Carruth | 30d69c2 | 2015-02-13 10:01:29 +0000 | [diff] [blame] | 199 | legacy::PassManagerBase &PM) const { |
Frederich Munch | 52dfcd1 | 2017-07-06 00:09:09 +0000 | [diff] [blame] | 200 | if (GlobalExtensionsNotEmpty()) { |
| 201 | for (auto &Ext : *GlobalExtensions) { |
| 202 | if (Ext.first == ETy) |
| 203 | Ext.second(*this, PM); |
| 204 | } |
| 205 | } |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 206 | for (unsigned i = 0, e = Extensions.size(); i != e; ++i) |
| 207 | if (Extensions[i].first == ETy) |
| 208 | Extensions[i].second(*this, PM); |
| 209 | } |
| 210 | |
Chandler Carruth | 30d69c2 | 2015-02-13 10:01:29 +0000 | [diff] [blame] | 211 | void PassManagerBuilder::addInitialAliasAnalysisPasses( |
| 212 | legacy::PassManagerBase &PM) const { |
George Burgess IV | bfa401e | 2016-07-06 00:26:41 +0000 | [diff] [blame] | 213 | switch (UseCFLAA) { |
| 214 | case CFLAAType::Steensgaard: |
| 215 | PM.add(createCFLSteensAAWrapperPass()); |
| 216 | break; |
| 217 | case CFLAAType::Andersen: |
| 218 | PM.add(createCFLAndersAAWrapperPass()); |
| 219 | break; |
| 220 | case CFLAAType::Both: |
| 221 | PM.add(createCFLSteensAAWrapperPass()); |
| 222 | PM.add(createCFLAndersAAWrapperPass()); |
| 223 | break; |
| 224 | default: |
| 225 | break; |
| 226 | } |
| 227 | |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 228 | // Add TypeBasedAliasAnalysis before BasicAliasAnalysis so that |
| 229 | // BasicAliasAnalysis wins if they disagree. This is intended to help |
| 230 | // support "obvious" type-punning idioms. |
Chandler Carruth | 7b560d4 | 2015-09-09 17:55:00 +0000 | [diff] [blame] | 231 | PM.add(createTypeBasedAAWrapperPass()); |
| 232 | PM.add(createScopedNoAliasAAWrapperPass()); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 233 | } |
| 234 | |
Matthias Braun | c31032d | 2016-03-09 18:47:11 +0000 | [diff] [blame] | 235 | void PassManagerBuilder::addInstructionCombiningPass( |
| 236 | legacy::PassManagerBase &PM) const { |
| 237 | bool ExpensiveCombines = OptLevel > 2; |
| 238 | PM.add(createInstructionCombiningPass(ExpensiveCombines)); |
| 239 | } |
| 240 | |
Chandler Carruth | 30d69c2 | 2015-02-13 10:01:29 +0000 | [diff] [blame] | 241 | void PassManagerBuilder::populateFunctionPassManager( |
| 242 | legacy::FunctionPassManager &FPM) { |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 243 | addExtensionsToPM(EP_EarlyAsPossible, FPM); |
| 244 | |
| 245 | // Add LibraryInfo if we have some. |
Chandler Carruth | b98f63d | 2015-01-15 10:41:28 +0000 | [diff] [blame] | 246 | if (LibraryInfo) |
| 247 | FPM.add(new TargetLibraryInfoWrapperPass(*LibraryInfo)); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 248 | |
| 249 | if (OptLevel == 0) return; |
| 250 | |
| 251 | addInitialAliasAnalysisPasses(FPM); |
| 252 | |
| 253 | FPM.add(createCFGSimplificationPass()); |
David Majnemer | cbf614a | 2016-06-15 00:19:09 +0000 | [diff] [blame] | 254 | FPM.add(createSROAPass()); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 255 | FPM.add(createEarlyCSEPass()); |
| 256 | FPM.add(createLowerExpectIntrinsicPass()); |
| 257 | } |
| 258 | |
Rong Xu | 34abbfb | 2016-01-21 18:28:59 +0000 | [diff] [blame] | 259 | // Do PGO instrumentation generation or use pass as the option specified. |
| 260 | void PassManagerBuilder::addPGOInstrPasses(legacy::PassManagerBase &MPM) { |
Dehao Chen | 6613166 | 2017-06-27 17:23:33 +0000 | [diff] [blame] | 261 | if (!EnablePGOInstrGen && PGOInstrUse.empty() && PGOSampleUse.empty()) |
Rong Xu | 96a19d3 | 2016-07-15 18:10:49 +0000 | [diff] [blame] | 262 | return; |
| 263 | // Perform the preinline and cleanup passes for O1 and above. |
| 264 | // And avoid doing them if optimizing for size. |
Dehao Chen | 6613166 | 2017-06-27 17:23:33 +0000 | [diff] [blame] | 265 | if (OptLevel > 0 && SizeLevel == 0 && !DisablePreInliner && |
| 266 | PGOSampleUse.empty()) { |
Easwaran Raman | 61edc10 | 2016-08-11 18:24:08 +0000 | [diff] [blame] | 267 | // Create preinline pass. We construct an InlineParams object and specify |
| 268 | // the threshold here to avoid the command line options of the regular |
| 269 | // inliner to influence pre-inlining. The only fields of InlineParams we |
| 270 | // care about are DefaultThreshold and HintThreshold. |
| 271 | InlineParams IP; |
| 272 | IP.DefaultThreshold = PreInlineThreshold; |
| 273 | // FIXME: The hint threshold has the same value used by the regular inliner. |
| 274 | // This should probably be lowered after performance testing. |
| 275 | IP.HintThreshold = 325; |
| 276 | |
| 277 | MPM.add(createFunctionInliningPass(IP)); |
Rong Xu | 96a19d3 | 2016-07-15 18:10:49 +0000 | [diff] [blame] | 278 | MPM.add(createSROAPass()); |
| 279 | MPM.add(createEarlyCSEPass()); // Catch trivial redundancies |
| 280 | MPM.add(createCFGSimplificationPass()); // Merge & remove BBs |
| 281 | MPM.add(createInstructionCombiningPass()); // Combine silly seq's |
| 282 | addExtensionsToPM(EP_Peephole, MPM); |
| 283 | } |
Xinliang David Li | 9239245 | 2016-07-23 04:28:52 +0000 | [diff] [blame] | 284 | if (EnablePGOInstrGen) { |
Xinliang David Li | 8aebf44 | 2016-05-06 05:49:19 +0000 | [diff] [blame] | 285 | MPM.add(createPGOInstrumentationGenLegacyPass()); |
Rong Xu | 34abbfb | 2016-01-21 18:28:59 +0000 | [diff] [blame] | 286 | // Add the profile lowering pass. |
| 287 | InstrProfOptions Options; |
Xinliang David Li | 9239245 | 2016-07-23 04:28:52 +0000 | [diff] [blame] | 288 | if (!PGOInstrGen.empty()) |
| 289 | Options.InstrProfileOutput = PGOInstrGen; |
Xinliang David Li | b67530e | 2017-06-25 00:26:43 +0000 | [diff] [blame] | 290 | Options.DoCounterPromotion = true; |
| 291 | MPM.add(createLoopRotatePass()); |
Xinliang David Li | e6b8929 | 2016-04-18 17:47:38 +0000 | [diff] [blame] | 292 | MPM.add(createInstrProfilingLegacyPass(Options)); |
Rong Xu | 34abbfb | 2016-01-21 18:28:59 +0000 | [diff] [blame] | 293 | } |
| 294 | if (!PGOInstrUse.empty()) |
Xinliang David Li | d55827f | 2016-05-07 05:39:12 +0000 | [diff] [blame] | 295 | MPM.add(createPGOInstrumentationUseLegacyPass(PGOInstrUse)); |
Davide Italiano | 058abf1f | 2017-04-25 16:54:45 +0000 | [diff] [blame] | 296 | // Indirect call promotion that promotes intra-module targets only. |
| 297 | // For ThinLTO this is done earlier due to interactions with globalopt |
| 298 | // for imported functions. We don't run this at -O0. |
| 299 | if (OptLevel > 0) |
| 300 | MPM.add( |
| 301 | createPGOIndirectCallPromotionLegacyPass(false, !PGOSampleUse.empty())); |
Rong Xu | 34abbfb | 2016-01-21 18:28:59 +0000 | [diff] [blame] | 302 | } |
/// Append the function simplification pipeline to \p MPM.
///
/// The passes are added in exactly the order written here; that order is the
/// behavior of this function. Extension callbacks are invoked at fixed
/// positions in the sequence: EP_Peephole (three times, each right after an
/// instruction combining pass), EP_LateLoopOptimizations,
/// EP_LoopOptimizerEnd and EP_ScalarOptimizerLate.
///
/// Which optional passes appear depends on OptLevel, SizeLevel, the builder's
/// DisableUnrollLoops / NewGVN / DisableGVNLoadPRE / RerollLoops /
/// SLPVectorize / DivergentTarget fields, and several hidden command-line
/// flags declared at the top of this file.
void PassManagerBuilder::addFunctionSimplificationPasses(
    legacy::PassManagerBase &MPM) {
  // Start of function pass.
  // Break up aggregate allocas, using SSAUpdater.
  MPM.add(createSROAPass());
  MPM.add(createEarlyCSEPass(EnableEarlyCSEMemSSA)); // Catch trivial redundancies
  // GVN hoisting and sinking are both opt-in via command-line flags; sinking
  // is followed by a CFG simplification pass.
  if (EnableGVNHoist)
    MPM.add(createGVNHoistPass());
  if (EnableGVNSink) {
    MPM.add(createGVNSinkPass());
    MPM.add(createCFGSimplificationPass());
  }

  // Speculative execution if the target has divergent branches; otherwise nop.
  MPM.add(createSpeculativeExecutionIfHasBranchDivergencePass());
  MPM.add(createJumpThreadingPass());         // Thread jumps.
  MPM.add(createCorrelatedValuePropagationPass()); // Propagate conditionals
  MPM.add(createCFGSimplificationPass());     // Merge & remove BBs
  // Combine silly seq's
  addInstructionCombiningPass(MPM);
  // Library-call shrink wrapping is skipped when optimizing for size or when
  // disabled on the command line.
  if (SizeLevel == 0 && !DisableLibCallsShrinkWrap)
    MPM.add(createLibCallsShrinkWrapPass());
  addExtensionsToPM(EP_Peephole, MPM);

  // Optimize memory intrinsic calls based on the profiled size information.
  // Skipped when optimizing for size.
  if (SizeLevel == 0)
    MPM.add(createPGOMemOPSizeOptLegacyPass());

  MPM.add(createTailCallEliminationPass()); // Eliminate tail calls
  MPM.add(createCFGSimplificationPass());     // Merge & remove BBs
  MPM.add(createReassociatePass());           // Reassociate expressions
  // Rotate Loop - disable header duplication at -Oz
  // (SizeLevel == 2 passes 0 to the pass; every other size level passes -1).
  MPM.add(createLoopRotatePass(SizeLevel == 2 ? 0 : -1));
  MPM.add(createLICMPass());                  // Hoist loop invariants
  // Exactly one loop unswitching pass is added; the command-line flag picks
  // the "simple" implementation over the default one.
  // NOTE(review): the first argument of createLoopUnswitchPass is presumably
  // an "optimize for size" switch (true for any non-zero SizeLevel or below
  // O3) -- confirm against its declaration.
  if (EnableSimpleLoopUnswitch)
    MPM.add(createSimpleLoopUnswitchLegacyPass());
  else
    MPM.add(createLoopUnswitchPass(SizeLevel || OptLevel < 3, DivergentTarget));
  MPM.add(createCFGSimplificationPass());
  addInstructionCombiningPass(MPM);
  MPM.add(createIndVarSimplifyPass());        // Canonicalize indvars
  MPM.add(createLoopIdiomPass());             // Recognize idioms like memset.
  addExtensionsToPM(EP_LateLoopOptimizations, MPM);
  MPM.add(createLoopDeletionPass());          // Delete dead loops

  // Loop interchange is opt-in and is followed by a CFG simplification pass.
  if (EnableLoopInterchange) {
    MPM.add(createLoopInterchangePass()); // Interchange loops
    MPM.add(createCFGSimplificationPass());
  }
  if (!DisableUnrollLoops)
    MPM.add(createSimpleLoopUnrollPass(OptLevel));    // Unroll small loops
  addExtensionsToPM(EP_LoopOptimizerEnd, MPM);

  // Load/store motion and GVN only run above O1; the NewGVN field selects
  // which GVN implementation is used.
  if (OptLevel > 1) {
    MPM.add(createMergedLoadStoreMotionPass()); // Merge ld/st in diamonds
    MPM.add(NewGVN ? createNewGVNPass()
                   : createGVNPass(DisableGVNLoadPRE)); // Remove redundancies
  }
  MPM.add(createMemCpyOptPass());             // Remove memcpy / form memset
  MPM.add(createSCCPPass());                  // Constant prop with SCCP

  // Delete dead bit computations (instcombine runs after to fold away the dead
  // computations, and then ADCE will run later to exploit any new DCE
  // opportunities that creates).
  MPM.add(createBitTrackingDCEPass());        // Delete dead bit computations

  // Run instcombine after redundancy elimination to exploit opportunities
  // opened up by them.
  addInstructionCombiningPass(MPM);
  addExtensionsToPM(EP_Peephole, MPM);
  MPM.add(createJumpThreadingPass());         // Thread jumps
  MPM.add(createCorrelatedValuePropagationPass());
  MPM.add(createDeadStoreEliminationPass());  // Delete dead stores
  MPM.add(createLICMPass());

  addExtensionsToPM(EP_ScalarOptimizerLate, MPM);

  if (RerollLoops)
    MPM.add(createLoopRerollPass());
  // The SLP vectorizer is added here only when it is enabled and the
  // run-slp-after-loop-vectorization flag has been turned off.
  if (!RunSLPAfterLoopVectorization && SLPVectorize)
    MPM.add(createSLPVectorizerPass()); // Vectorize parallel scalar chains.

  MPM.add(createAggressiveDCEPass());         // Delete dead instructions
  MPM.add(createCFGSimplificationPass()); // Merge & remove BBs
  // Clean up after everything.
  addInstructionCombiningPass(MPM);
  addExtensionsToPM(EP_Peephole, MPM);
}
| 391 | |
| 392 | void PassManagerBuilder::populateModulePassManager( |
| 393 | legacy::PassManagerBase &MPM) { |
Dehao Chen | a99e082 | 2016-12-14 21:40:47 +0000 | [diff] [blame] | 394 | if (!PGOSampleUse.empty()) { |
| 395 | MPM.add(createPruneEHPass()); |
| 396 | MPM.add(createSampleProfileLoaderPass(PGOSampleUse)); |
| 397 | } |
| 398 | |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 399 | // Allow forcing function attributes as a debugging and tuning aid. |
| 400 | MPM.add(createForceFunctionAttrsLegacyPass()); |
| 401 | |
| 402 | // If all optimizations are disabled, just run the always-inline pass and, |
| 403 | // if enabled, the function merging pass. |
| 404 | if (OptLevel == 0) { |
| 405 | addPGOInstrPasses(MPM); |
| 406 | if (Inliner) { |
| 407 | MPM.add(Inliner); |
| 408 | Inliner = nullptr; |
| 409 | } |
| 410 | |
    // FIXME: The BarrierNoopPass is a HACK! The inliner pass above implicitly
    // creates a CGSCC pass manager, but we don't want to add extensions into
    // that pass manager. To prevent this we insert a no-op module pass to reset
    // the pass manager to get the same behavior as EP_OptimizerLast in non-O0
    // builds. When the function merging pass is enabled it is added instead,
    // and no separate barrier pass is inserted.
| 416 | if (MergeFunctions) |
| 417 | MPM.add(createMergeFunctionsPass()); |
Frederich Munch | 52dfcd1 | 2017-07-06 00:09:09 +0000 | [diff] [blame] | 418 | else if (GlobalExtensionsNotEmpty() || !Extensions.empty()) |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 419 | MPM.add(createBarrierNoopPass()); |
| 420 | |
Peter Collingbourne | 9fb6e1a | 2017-11-01 17:58:39 +0000 | [diff] [blame] | 421 | if (PerformThinLTO) { |
| 422 | // Drop available_externally and unreferenced globals. This is necessary |
| 423 | // with ThinLTO in order to avoid leaving undefined references to dead |
| 424 | // globals in the object file. |
| 425 | MPM.add(createEliminateAvailableExternallyPass()); |
| 426 | MPM.add(createGlobalDCEPass()); |
| 427 | } |
| 428 | |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 429 | addExtensionsToPM(EP_EnabledOnOptLevel0, MPM); |
Davide Italiano | 5da7090 | 2017-04-23 04:49:34 +0000 | [diff] [blame] | 430 | |
| 431 | // Rename anon globals to be able to export them in the summary. |
| 432 | // This has to be done after we add the extensions to the pass manager |
    // as there could be passes (e.g. Address sanitizer) which introduce
| 434 | // new unnamed globals. |
| 435 | if (PrepareForThinLTO) |
| 436 | MPM.add(createNameAnonGlobalPass()); |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 437 | return; |
| 438 | } |
| 439 | |
| 440 | // Add LibraryInfo if we have some. |
| 441 | if (LibraryInfo) |
| 442 | MPM.add(new TargetLibraryInfoWrapperPass(*LibraryInfo)); |
| 443 | |
| 444 | addInitialAliasAnalysisPasses(MPM); |
| 445 | |
Teresa Johnson | 8c1bc98 | 2016-08-29 22:46:56 +0000 | [diff] [blame] | 446 | // For ThinLTO there are two passes of indirect call promotion. The |
| 447 | // first is during the compile phase when PerformThinLTO=false and |
| 448 | // intra-module indirect call targets are promoted. The second is during |
| 449 | // the ThinLTO backend when PerformThinLTO=true, when we promote imported |
| 450 | // inter-module indirect calls. For that we perform indirect call promotion |
| 451 | // earlier in the pass pipeline, here before globalopt. Otherwise imported |
| 452 | // available_externally functions look unreferenced and are removed. |
| 453 | if (PerformThinLTO) |
Dehao Chen | cc75d24 | 2017-02-23 22:15:18 +0000 | [diff] [blame] | 454 | MPM.add(createPGOIndirectCallPromotionLegacyPass(/*InLTO = */ true, |
| 455 | !PGOSampleUse.empty())); |
Teresa Johnson | 8c1bc98 | 2016-08-29 22:46:56 +0000 | [diff] [blame] | 456 | |
Dehao Chen | 8c88671 | 2017-03-23 21:20:05 +0000 | [diff] [blame] | 457 | // For SamplePGO in ThinLTO compile phase, we do not want to unroll loops |
| 458 | // as it will change the CFG too much to make the 2nd profile annotation |
| 459 | // in backend more difficult. |
| 460 | bool PrepareForThinLTOUsingPGOSampleProfile = |
| 461 | PrepareForThinLTO && !PGOSampleUse.empty(); |
| 462 | if (PrepareForThinLTOUsingPGOSampleProfile) |
| 463 | DisableUnrollLoops = true; |
| 464 | |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 465 | // Infer attributes about declarations if possible. |
| 466 | MPM.add(createInferFunctionAttrsLegacyPass()); |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 467 | |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 468 | addExtensionsToPM(EP_ModuleOptimizerEarly, MPM); |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 469 | |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 470 | MPM.add(createIPSCCPPass()); // IP SCCP |
Matthew Simpson | cb58558 | 2017-10-25 13:40:08 +0000 | [diff] [blame] | 471 | MPM.add(createCalledValuePropagationPass()); |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 472 | MPM.add(createGlobalOptimizerPass()); // Optimize out global vars |
| 473 | // Promote any localized global vars. |
| 474 | MPM.add(createPromoteMemoryToRegisterPass()); |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 475 | |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 476 | MPM.add(createDeadArgEliminationPass()); // Dead argument elimination |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 477 | |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 478 | addInstructionCombiningPass(MPM); // Clean up after IPCP & DAE |
| 479 | addExtensionsToPM(EP_Peephole, MPM); |
| 480 | MPM.add(createCFGSimplificationPass()); // Clean up after IPCP & DAE |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 481 | |
Dehao Chen | 8c88671 | 2017-03-23 21:20:05 +0000 | [diff] [blame] | 482 | // For SamplePGO in ThinLTO compile phase, we do not want to do indirect |
| 483 | // call promotion as it will change the CFG too much to make the 2nd |
| 484 | // profile annotation in backend more difficult. |
Davide Italiano | 058abf1f | 2017-04-25 16:54:45 +0000 | [diff] [blame] | 485 | // PGO instrumentation is added during the compile phase for ThinLTO, do |
| 486 | // not run it a second time |
| 487 | if (!PerformThinLTO && !PrepareForThinLTOUsingPGOSampleProfile) |
Mehdi Amini | 1db10ac | 2016-02-16 23:02:29 +0000 | [diff] [blame] | 488 | addPGOInstrPasses(MPM); |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 489 | |
Davide Italiano | c48d1c8 | 2017-10-02 23:39:20 +0000 | [diff] [blame] | 490 | // We add a module alias analysis pass here. In part due to bugs in the |
| 491 | // analysis infrastructure this "works" in that the analysis stays alive |
| 492 | // for the entire SCC pass run below. |
| 493 | MPM.add(createGlobalsAAWrapperPass()); |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 494 | |
| 495 | // Start of CallGraph SCC passes. |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 496 | MPM.add(createPruneEHPass()); // Remove dead EH info |
Davide Italiano | ff829ce | 2017-10-05 18:06:37 +0000 | [diff] [blame] | 497 | bool RunInliner = false; |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 498 | if (Inliner) { |
| 499 | MPM.add(Inliner); |
| 500 | Inliner = nullptr; |
Davide Italiano | ff829ce | 2017-10-05 18:06:37 +0000 | [diff] [blame] | 501 | RunInliner = true; |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 502 | } |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 503 | |
| 504 | MPM.add(createPostOrderFunctionAttrsLegacyPass()); |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 505 | if (OptLevel > 2) |
| 506 | MPM.add(createArgumentPromotionPass()); // Scalarize uninlined fn args |
| 507 | |
David Majnemer | 6e9b47b | 2016-07-28 03:28:43 +0000 | [diff] [blame] | 508 | addExtensionsToPM(EP_CGSCCOptimizerLate, MPM); |
Mehdi Amini | ec8bee1 | 2016-02-16 22:54:27 +0000 | [diff] [blame] | 509 | addFunctionSimplificationPasses(MPM); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 510 | |
Mehdi Amini | 45c7b3e | 2016-05-02 16:53:16 +0000 | [diff] [blame] | 511 | // FIXME: This is a HACK! The inliner pass above implicitly creates a CGSCC |
| 512 | // pass manager that we are specifically trying to avoid. To prevent this |
| 513 | // we must insert a no-op module pass to reset the pass manager. |
| 514 | MPM.add(createBarrierNoopPass()); |
Davide Italiano | ff829ce | 2017-10-05 18:06:37 +0000 | [diff] [blame] | 515 | |
Xinliang David Li | 126157c | 2017-05-22 16:41:57 +0000 | [diff] [blame] | 516 | if (RunPartialInlining) |
| 517 | MPM.add(createPartialInliningPass()); |
Mehdi Amini | 45c7b3e | 2016-05-02 16:53:16 +0000 | [diff] [blame] | 518 | |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 519 | if (OptLevel > 1 && !PrepareForLTO && !PrepareForThinLTO) |
Mehdi Amini | 7f7d8be | 2016-05-03 15:46:00 +0000 | [diff] [blame] | 520 | // Remove avail extern fns and globals definitions if we aren't |
| 521 | // compiling an object file for later LTO. For LTO we want to preserve |
| 522 | // these so they are eligible for inlining at link-time. Note if they |
| 523 | // are unreferenced they will be removed by GlobalDCE later, so |
| 524 | // this only impacts referenced available externally globals. |
| 525 | // Eventually they will be suppressed during codegen, but eliminating |
| 526 | // here enables more opportunity for GlobalDCE as it may make |
| 527 | // globals referenced by available external functions dead |
| 528 | // and saves running remaining passes on the eliminated functions. |
| 529 | MPM.add(createEliminateAvailableExternallyPass()); |
| 530 | |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 531 | MPM.add(createReversePostOrderFunctionAttrsPass()); |
Mehdi Amini | 45c7b3e | 2016-05-02 16:53:16 +0000 | [diff] [blame] | 532 | |
Davide Italiano | c8708e5 | 2017-10-05 18:23:25 +0000 | [diff] [blame] | 533 | // The inliner performs some kind of dead code elimination as it goes, |
| 534 | // but there are cases that are not really caught by it. We might |
| 535 | // at some point consider teaching the inliner about them, but it |
| 536 | // is OK for now to run GlobalOpt + GlobalDCE in tandem as their |
| 537 | // benefits generally outweigh the cost, making the whole pipeline
| 538 | // faster. |
| 539 | if (RunInliner) { |
| 540 | MPM.add(createGlobalOptimizerPass()); |
| 541 | MPM.add(createGlobalDCEPass()); |
| 542 | } |
| 543 | |
Mehdi Amini | 1db10ac | 2016-02-16 23:02:29 +0000 | [diff] [blame] | 544 | // If we are planning to perform ThinLTO later, let's not bloat the code with |
| 545 | // unrolling/vectorization/... now. We'll first run the inliner + CGSCC passes |
| 546 | // during ThinLTO and perform the rest of the optimizations afterward. |
Mehdi Amini | f72ca86b | 2016-04-25 08:47:37 +0000 | [diff] [blame] | 547 | if (PrepareForThinLTO) { |
Mehdi Amini | 27d2379 | 2016-09-16 16:56:30 +0000 | [diff] [blame] | 548 | // Rename anon globals to be able to export them in the summary. |
| 549 | MPM.add(createNameAnonGlobalPass()); |
Mehdi Amini | 1db10ac | 2016-02-16 23:02:29 +0000 | [diff] [blame] | 550 | return; |
Mehdi Amini | f72ca86b | 2016-04-25 08:47:37 +0000 | [diff] [blame] | 551 | } |
Mehdi Amini | 1db10ac | 2016-02-16 23:02:29 +0000 | [diff] [blame] | 552 | |
Mehdi Amini | 31407ba | 2016-05-06 18:17:03 +0000 | [diff] [blame] | 553 | if (PerformThinLTO) |
| 554 | // Optimize globals now when performing ThinLTO, this enables more |
| 555 | // optimizations later. |
| 556 | MPM.add(createGlobalOptimizerPass()); |
| 557 | |
Ashutosh Nema | 2260a3a | 2016-02-11 09:23:53 +0000 | [diff] [blame] | 558 | // Scheduling LoopVersioningLICM when inlining is over, because after that |
Ashutosh Nema | df6763a | 2016-02-06 07:47:48 +0000 | [diff] [blame] | 559 | // we may see more accurate aliasing. Reason to run this late is that too |
| 560 | // early versioning may prevent further inlining due to increase of code |
Mehdi Amini | 31407ba | 2016-05-06 18:17:03 +0000 | [diff] [blame] | 561 | // size. By placing it just after inlining other optimizations which runs |
| 562 | // later might get benefit of no-alias assumption in clone loop. |
Ashutosh Nema | df6763a | 2016-02-06 07:47:48 +0000 | [diff] [blame] | 563 | if (UseLoopVersioningLICM) { |
| 564 | MPM.add(createLoopVersioningLICMPass()); // Do LoopVersioningLICM |
| 565 | MPM.add(createLICMPass()); // Hoist loop invariants |
| 566 | } |
| 567 | |
Davide Italiano | c48d1c8 | 2017-10-02 23:39:20 +0000 | [diff] [blame] | 568 | // We add a fresh GlobalsModRef run at this point. This is particularly |
| 569 | // useful as the above will have inlined, DCE'ed, and function-attr |
| 570 | // propagated everything. We should at this point have a reasonably minimal |
| 571 | // and richly annotated call graph. By computing aliasing and mod/ref |
| 572 | // information for all local globals here, the late loop passes and notably |
| 573 | // the vectorizer will be able to use them to help recognize vectorizable |
| 574 | // memory operations. |
| 575 | // |
| 576 | // Note that this relies on a bug in the pass manager which preserves |
| 577 | // a module analysis into a function pass pipeline (and throughout it) so |
| 578 | // long as the first function pass doesn't invalidate the module analysis. |
| 579 | // Thus both Float2Int and LoopRotate have to preserve AliasAnalysis for |
| 580 | // this to work. Fortunately, it is trivial to preserve AliasAnalysis |
| 581 | // (doing nothing preserves it as it is required to be conservatively |
| 582 | // correct in the face of IR changes). |
| 583 | MPM.add(createGlobalsAAWrapperPass()); |
Chandler Carruth | 08eebe2 | 2015-07-23 09:34:01 +0000 | [diff] [blame] | 584 | |
Davide Italiano | b672537 | 2017-01-02 17:49:18 +0000 | [diff] [blame] | 585 | MPM.add(createFloat2IntPass()); |
James Molloy | 0cbb2a86 | 2015-03-27 10:36:57 +0000 | [diff] [blame] | 586 | |
Tobias Grosser | 39a7bd1 | 2015-07-16 08:20:37 +0000 | [diff] [blame] | 587 | addExtensionsToPM(EP_VectorizerStart, MPM); |
| 588 | |
Chandler Carruth | 7b8297a | 2014-10-14 00:31:29 +0000 | [diff] [blame] | 589 | // Re-rotate loops in all our loop nests. These may have fallen out of
| 590 | // rotated form due to GVN or other transformations, and the vectorizer relies |
Alexey Bataev | da33d80 | 2015-07-10 10:37:09 +0000 | [diff] [blame] | 591 | // on the rotated form. Disable header duplication at -Oz. |
| 592 | MPM.add(createLoopRotatePass(SizeLevel == 2 ? 0 : -1)); |
Chandler Carruth | 7b8297a | 2014-10-14 00:31:29 +0000 | [diff] [blame] | 593 | |
Adam Nemet | 938d3d6 | 2015-05-14 12:05:18 +0000 | [diff] [blame] | 594 | // Distribute loops to allow partial vectorization. I.e. isolate dependences |
Adam Nemet | d2fa414 | 2016-04-27 05:28:18 +0000 | [diff] [blame] | 595 | // into separate loop that would otherwise inhibit vectorization. This is |
| 596 | // currently only performed for loops marked with the metadata |
| 597 | // llvm.loop.distribute=true or when -enable-loop-distribute is specified. |
Adam Nemet | 32e6a34 | 2016-12-21 04:07:40 +0000 | [diff] [blame] | 598 | MPM.add(createLoopDistributePass()); |
Adam Nemet | 938d3d6 | 2015-05-14 12:05:18 +0000 | [diff] [blame] | 599 | |
Renato Golin | 729a3ae | 2013-12-05 21:20:02 +0000 | [diff] [blame] | 600 | MPM.add(createLoopVectorizePass(DisableUnrollLoops, LoopVectorize)); |
Adam Nemet | e54a4fa | 2015-11-03 23:50:08 +0000 | [diff] [blame] | 601 | |
| 602 | // Eliminate loads by forwarding stores from the previous iteration to loads |
| 603 | // of the current iteration. |
Davide Italiano | c48d1c8 | 2017-10-02 23:39:20 +0000 | [diff] [blame] | 604 | MPM.add(createLoopLoadEliminationPass()); |
Adam Nemet | e54a4fa | 2015-11-03 23:50:08 +0000 | [diff] [blame] | 605 | |
Renato Golin | 729a3ae | 2013-12-05 21:20:02 +0000 | [diff] [blame] | 606 | // FIXME: Because of #pragma vectorize enable, the passes below are always |
| 607 | // inserted in the pipeline, even when the vectorizer doesn't run (ex. when |
| 608 | // on -O1 and no #pragma is found). Would be good to have these two passes |
| 609 | // as function calls, so that we can only pass them when the vectorizer |
| 610 | // changed the code. |
Matthias Braun | c31032d | 2016-03-09 18:47:11 +0000 | [diff] [blame] | 611 | addInstructionCombiningPass(MPM); |
Chandler Carruth | 7b8297a | 2014-10-14 00:31:29 +0000 | [diff] [blame] | 612 | if (OptLevel > 1 && ExtraVectorizerPasses) { |
| 613 | // At higher optimization levels, try to clean up any runtime overlap and |
| 614 | // alignment checks inserted by the vectorizer. We want to track correlated
| 615 | // runtime checks for two inner loops in the same outer loop, fold any |
| 616 | // common computations, hoist loop-invariant aspects out of any outer loop, |
| 617 | // and unswitch the runtime checks if possible. Once hoisted, we may have |
| 618 | // dead (or speculatable) control flows or more combining opportunities. |
| 619 | MPM.add(createEarlyCSEPass()); |
| 620 | MPM.add(createCorrelatedValuePropagationPass()); |
Matthias Braun | c31032d | 2016-03-09 18:47:11 +0000 | [diff] [blame] | 621 | addInstructionCombiningPass(MPM); |
Chandler Carruth | 7b8297a | 2014-10-14 00:31:29 +0000 | [diff] [blame] | 622 | MPM.add(createLICMPass()); |
Stanislav Mekhanoshin | ee2dd78 | 2017-03-17 17:13:41 +0000 | [diff] [blame] | 623 | MPM.add(createLoopUnswitchPass(SizeLevel || OptLevel < 3, DivergentTarget)); |
Chandler Carruth | 7b8297a | 2014-10-14 00:31:29 +0000 | [diff] [blame] | 624 | MPM.add(createCFGSimplificationPass()); |
Matthias Braun | c31032d | 2016-03-09 18:47:11 +0000 | [diff] [blame] | 625 | addInstructionCombiningPass(MPM); |
Chandler Carruth | 7b8297a | 2014-10-14 00:31:29 +0000 | [diff] [blame] | 626 | } |
James Molloy | 568da09 | 2014-08-06 12:56:19 +0000 | [diff] [blame] | 627 | |
Chandler Carruth | 3545a9e | 2017-06-30 07:09:08 +0000 | [diff] [blame] | 628 | if (RunSLPAfterLoopVectorization && SLPVectorize) { |
| 629 | MPM.add(createSLPVectorizerPass()); // Vectorize parallel scalar chains. |
| 630 | if (OptLevel > 1 && ExtraVectorizerPasses) { |
| 631 | MPM.add(createEarlyCSEPass()); |
James Molloy | 568da09 | 2014-08-06 12:56:19 +0000 | [diff] [blame] | 632 | } |
| 633 | } |
| 634 | |
Peter Collingbourne | 0a43761 | 2014-05-25 10:27:02 +0000 | [diff] [blame] | 635 | addExtensionsToPM(EP_Peephole, MPM); |
Sanjay Patel | b049173 | 2017-10-28 18:43:07 +0000 | [diff] [blame] | 636 | // Switches to lookup tables and other transforms that may not be considered |
| 637 | // canonical by other IR passes. |
| 638 | MPM.add(createCFGSimplificationPass(1, true, true, false)); |
Matthias Braun | c31032d | 2016-03-09 18:47:11 +0000 | [diff] [blame] | 639 | addInstructionCombiningPass(MPM); |
Chandler Carruth | 08e1b87 | 2013-06-24 07:21:47 +0000 | [diff] [blame] | 640 | |
Kevin Qin | 49bc764 | 2015-03-12 05:36:01 +0000 | [diff] [blame] | 641 | if (!DisableUnrollLoops) { |
Dehao Chen | 7d23032 | 2017-02-18 03:46:51 +0000 | [diff] [blame] | 642 | MPM.add(createLoopUnrollPass(OptLevel)); // Unroll small loops |
Hal Finkel | 86b3064 | 2014-03-31 23:23:51 +0000 | [diff] [blame] | 643 | |
Wei Mi | bf727ba | 2015-05-14 22:02:54 +0000 | [diff] [blame] | 644 | // LoopUnroll may generate some redundancy to clean up.
Matthias Braun | c31032d | 2016-03-09 18:47:11 +0000 | [diff] [blame] | 645 | addInstructionCombiningPass(MPM); |
Wei Mi | bf727ba | 2015-05-14 22:02:54 +0000 | [diff] [blame] | 646 | |
Kevin Qin | 49bc764 | 2015-03-12 05:36:01 +0000 | [diff] [blame] | 647 | // Runtime unrolling will introduce runtime check in loop prologue. If the |
| 648 | // unrolled loop is an inner loop, then the prologue will be inside the
| 649 | // outer loop. LICM pass can help to promote the runtime check out if the |
| 650 | // checked value is loop invariant. |
| 651 | MPM.add(createLICMPass()); |
Dehao Chen | 947dbe12 | 2016-11-09 00:58:19 +0000 | [diff] [blame] | 652 | } |
Kevin Qin | 49bc764 | 2015-03-12 05:36:01 +0000 | [diff] [blame] | 653 | |
Hal Finkel | d67e463 | 2014-09-07 20:05:11 +0000 | [diff] [blame] | 654 | // After vectorization and unrolling, assume intrinsics may tell us more |
| 655 | // about pointer alignments. |
| 656 | MPM.add(createAlignmentFromAssumptionsPass()); |
| 657 | |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 658 | // FIXME: We shouldn't bother with this anymore. |
| 659 | MPM.add(createStripDeadPrototypesPass()); // Get rid of dead prototypes |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 660 | |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 661 | // GlobalOpt already deletes dead functions and globals, at -O2 try a |
| 662 | // late pass of GlobalDCE. It is capable of deleting dead cycles. |
| 663 | if (OptLevel > 1) { |
| 664 | MPM.add(createGlobalDCEPass()); // Remove dead fns and globals. |
| 665 | MPM.add(createConstantMergePass()); // Merge dup global constants |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 666 | } |
Nick Lewycky | 9e6d184 | 2014-09-13 21:46:00 +0000 | [diff] [blame] | 667 | |
| 668 | if (MergeFunctions) |
| 669 | MPM.add(createMergeFunctionsPass()); |
| 670 | |
Dehao Chen | 5492f86 | 2016-11-10 17:42:18 +0000 | [diff] [blame] | 671 | // LoopSink pass sinks instructions hoisted by LICM, which serves as a |
| 672 | // canonicalization pass that enables other optimizations. As a result, |
| 673 | // LoopSink pass needs to be a very late IR pass to avoid undoing LICM |
| 674 | // result too early. |
Dehao Chen | 947dbe12 | 2016-11-09 00:58:19 +0000 | [diff] [blame] | 675 | MPM.add(createLoopSinkPass()); |
| 676 | // Get rid of LCSSA nodes. |
| 677 | MPM.add(createInstructionSimplifierPass()); |
Filipe Cabecinhas | 92dc348 | 2017-04-26 12:02:41 +0000 | [diff] [blame] | 678 | |
Sanjay Patel | 6fd4391 | 2017-09-09 13:38:18 +0000 | [diff] [blame] | 679 | // This hoists/decomposes div/rem ops. It should run after other sink/hoist |
| 680 | // passes to avoid re-sinking, but before SimplifyCFG because it can allow |
| 681 | // flattening of blocks. |
| 682 | MPM.add(createDivRemPairsPass()); |
| 683 | |
Filipe Cabecinhas | 92dc348 | 2017-04-26 12:02:41 +0000 | [diff] [blame] | 684 | // LoopSink (and other loop passes since the last simplifyCFG) might have |
| 685 | // resulted in single-entry-single-exit or empty blocks. Clean up the CFG. |
| 686 | MPM.add(createCFGSimplificationPass()); |
| 687 | |
Kostya Serebryany | e505a5a | 2012-03-23 23:22:59 +0000 | [diff] [blame] | 688 | addExtensionsToPM(EP_OptimizerLast, MPM); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 689 | } |
| 690 | |
Chandler Carruth | 30d69c2 | 2015-02-13 10:01:29 +0000 | [diff] [blame] | 691 | void PassManagerBuilder::addLTOOptimizationPasses(legacy::PassManagerBase &PM) { |
Peter Collingbourne | fad596a | 2016-05-25 21:26:14 +0000 | [diff] [blame] | 692 | // Remove unused virtual tables to improve the quality of code generated by |
| 693 | // whole-program devirtualization and bitset lowering. |
| 694 | PM.add(createGlobalDCEPass()); |
| 695 | |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 696 | // Provide AliasAnalysis services for optimizations. |
| 697 | addInitialAliasAnalysisPasses(PM); |
| 698 | |
Chandler Carruth | f49f1a87 | 2015-12-27 08:13:45 +0000 | [diff] [blame] | 699 | // Allow forcing function attributes as a debugging and tuning aid. |
| 700 | PM.add(createForceFunctionAttrsLegacyPass()); |
| 701 | |
Chandler Carruth | 3a040e6 | 2015-12-27 08:41:34 +0000 | [diff] [blame] | 702 | // Infer attributes about declarations if possible. |
| 703 | PM.add(createInferFunctionAttrsLegacyPass()); |
| 704 | |
Peter Collingbourne | fad596a | 2016-05-25 21:26:14 +0000 | [diff] [blame] | 705 | if (OptLevel > 1) { |
| 706 | // Indirect call promotion. This should promote all the targets that are |
| 707 | // left by the earlier promotion pass that promotes intra-module targets. |
| 708 | // This two-step promotion is to save the compile time. For LTO, it should |
| 709 | // produce the same result as if we only do promotion here. |
Dehao Chen | cc75d24 | 2017-02-23 22:15:18 +0000 | [diff] [blame] | 710 | PM.add( |
| 711 | createPGOIndirectCallPromotionLegacyPass(true, !PGOSampleUse.empty())); |
Rong Xu | 6e34c49 | 2016-04-27 23:20:27 +0000 | [diff] [blame] | 712 | |
Peter Collingbourne | fad596a | 2016-05-25 21:26:14 +0000 | [diff] [blame] | 713 | // Propagate constants at call sites into the functions they call. This |
| 714 | // opens opportunities for globalopt (and inlining) by substituting function |
| 715 | // pointers passed as arguments to direct uses of functions. |
| 716 | PM.add(createIPSCCPPass()); |
Matthew Simpson | cb58558 | 2017-10-25 13:40:08 +0000 | [diff] [blame] | 717 | |
| 718 | // Attach metadata to indirect call sites indicating the set of functions |
| 719 | // they may target at run-time. This should follow IPSCCP. |
| 720 | PM.add(createCalledValuePropagationPass()); |
Peter Collingbourne | fad596a | 2016-05-25 21:26:14 +0000 | [diff] [blame] | 721 | } |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 722 | |
Peter Collingbourne | fad596a | 2016-05-25 21:26:14 +0000 | [diff] [blame] | 723 | // Infer attributes about definitions. The readnone attribute in particular is |
| 724 | // required for virtual constant propagation. |
Chandler Carruth | 9c4ed17 | 2016-02-18 11:03:11 +0000 | [diff] [blame] | 725 | PM.add(createPostOrderFunctionAttrsLegacyPass()); |
Chandler Carruth | 1926b70 | 2016-01-08 10:55:52 +0000 | [diff] [blame] | 726 | PM.add(createReversePostOrderFunctionAttrsPass()); |
Peter Collingbourne | fad596a | 2016-05-25 21:26:14 +0000 | [diff] [blame] | 727 | |
Peter Collingbourne | f72a8d4 | 2016-11-16 23:40:26 +0000 | [diff] [blame] | 728 | // Split globals using inrange annotations on GEP indices. This can help |
| 729 | // improve the quality of generated code when virtual constant propagation or |
| 730 | // control flow integrity are enabled. |
| 731 | PM.add(createGlobalSplitPass()); |
| 732 | |
Peter Collingbourne | fad596a | 2016-05-25 21:26:14 +0000 | [diff] [blame] | 733 | // Apply whole-program devirtualization and virtual constant propagation. |
Peter Collingbourne | f7691d8 | 2017-03-22 18:22:59 +0000 | [diff] [blame] | 734 | PM.add(createWholeProgramDevirtPass(ExportSummary, nullptr)); |
Peter Collingbourne | fad596a | 2016-05-25 21:26:14 +0000 | [diff] [blame] | 735 | |
| 736 | // That's all we need at opt level 1. |
| 737 | if (OptLevel == 1) |
| 738 | return; |
| 739 | |
| 740 | // Now that we internalized some globals, see if we can hack on them! |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 741 | PM.add(createGlobalOptimizerPass()); |
James Molloy | 6045cc8 | 2015-12-15 09:24:01 +0000 | [diff] [blame] | 742 | // Promote any localized global vars. |
| 743 | PM.add(createPromoteMemoryToRegisterPass()); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 744 | |
| 745 | // Linking modules together can lead to duplicated global constants, only |
| 746 | // keep one copy of each constant. |
| 747 | PM.add(createConstantMergePass()); |
| 748 | |
| 749 | // Remove unused arguments from functions. |
| 750 | PM.add(createDeadArgEliminationPass()); |
| 751 | |
| 752 | // Reduce the code after globalopt and ipsccp. Both can open up significant |
| 753 | // simplification opportunities, and both can propagate functions through |
| 754 | // function pointers. When this happens, we often have to resolve varargs |
| 755 | // calls, etc, so let instcombine do this. |
Matthias Braun | c31032d | 2016-03-09 18:47:11 +0000 | [diff] [blame] | 756 | addInstructionCombiningPass(PM); |
Peter Collingbourne | 0a43761 | 2014-05-25 10:27:02 +0000 | [diff] [blame] | 757 | addExtensionsToPM(EP_Peephole, PM); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 758 | |
| 759 | // Inline small functions |
Rafael Espindola | e07caad | 2014-08-21 13:35:30 +0000 | [diff] [blame] | 760 | bool RunInliner = Inliner; |
| 761 | if (RunInliner) { |
| 762 | PM.add(Inliner); |
| 763 | Inliner = nullptr; |
| 764 | } |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 765 | |
| 766 | PM.add(createPruneEHPass()); // Remove dead EH info. |
| 767 | |
| 768 | // Optimize globals again if we ran the inliner. |
| 769 | if (RunInliner) |
| 770 | PM.add(createGlobalOptimizerPass()); |
| 771 | PM.add(createGlobalDCEPass()); // Remove dead functions. |
| 772 | |
| 773 | // If we didn't decide to inline a function, check to see if we can |
| 774 | // transform it to pass arguments by value instead of by reference. |
| 775 | PM.add(createArgumentPromotionPass()); |
| 776 | |
| 777 | // The IPO passes may leave cruft around. Clean up after them. |
Matthias Braun | c31032d | 2016-03-09 18:47:11 +0000 | [diff] [blame] | 778 | addInstructionCombiningPass(PM); |
Peter Collingbourne | 0a43761 | 2014-05-25 10:27:02 +0000 | [diff] [blame] | 779 | addExtensionsToPM(EP_Peephole, PM); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 780 | PM.add(createJumpThreadingPass()); |
Bill Wendling | 4c0d9ad | 2013-08-30 00:48:37 +0000 | [diff] [blame] | 781 | |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 782 | // Break up allocas |
David Majnemer | cbf614a | 2016-06-15 00:19:09 +0000 | [diff] [blame] | 783 | PM.add(createSROAPass()); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 784 | |
| 785 | // Run a few AA driven optimizations here and now, to cleanup the code. |
Chandler Carruth | 9c4ed17 | 2016-02-18 11:03:11 +0000 | [diff] [blame] | 786 | PM.add(createPostOrderFunctionAttrsLegacyPass()); // Add nocapture. |
Chandler Carruth | 7b560d4 | 2015-09-09 17:55:00 +0000 | [diff] [blame] | 787 | PM.add(createGlobalsAAWrapperPass()); // IP alias analysis. |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 788 | |
Bill Wendling | 932b992 | 2012-04-02 22:16:50 +0000 | [diff] [blame] | 789 | PM.add(createLICMPass()); // Hoist loop invariants. |
Davide Italiano | 9b8738d | 2017-01-28 23:45:37 +0000 | [diff] [blame] | 790 | PM.add(createMergedLoadStoreMotionPass()); // Merge ld/st in diamonds. |
Davide Italiano | fe7a3ee | 2016-12-26 18:26:19 +0000 | [diff] [blame] | 791 | PM.add(NewGVN ? createNewGVNPass() |
| 792 | : createGVNPass(DisableGVNLoadPRE)); // Remove redundancies. |
Bill Wendling | 932b992 | 2012-04-02 22:16:50 +0000 | [diff] [blame] | 793 | PM.add(createMemCpyOptPass()); // Remove dead memcpys. |
Bill Wendling | 4c0d9ad | 2013-08-30 00:48:37 +0000 | [diff] [blame] | 794 | |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 795 | // Nuke dead stores. |
| 796 | PM.add(createDeadStoreEliminationPass()); |
| 797 | |
Duncan P. N. Exon Smith | 2b69189 | 2014-04-15 17:48:15 +0000 | [diff] [blame] | 798 | // More loops are countable; try to optimize them. |
| 799 | PM.add(createIndVarSimplifyPass()); |
| 800 | PM.add(createLoopDeletionPass()); |
Karthik Bhat | 88db86d | 2015-03-06 10:11:25 +0000 | [diff] [blame] | 801 | if (EnableLoopInterchange) |
| 802 | PM.add(createLoopInterchangePass()); |
| 803 | |
James Molloy | 31f3ddd | 2016-01-14 15:00:09 +0000 | [diff] [blame] | 804 | if (!DisableUnrollLoops) |
Dehao Chen | 7d23032 | 2017-02-18 03:46:51 +0000 | [diff] [blame] | 805 | PM.add(createSimpleLoopUnrollPass(OptLevel)); // Unroll small loops |
Arnold Schwaighofer | eb1a38f | 2014-10-26 21:50:58 +0000 | [diff] [blame] | 806 | PM.add(createLoopVectorizePass(true, LoopVectorize)); |
James Molloy | 31f3ddd | 2016-01-14 15:00:09 +0000 | [diff] [blame] | 807 | // The vectorizer may have significantly shortened a loop body; unroll again. |
| 808 | if (!DisableUnrollLoops) |
Dehao Chen | 7d23032 | 2017-02-18 03:46:51 +0000 | [diff] [blame] | 809 | PM.add(createLoopUnrollPass(OptLevel)); |
Arnold Schwaighofer | 6ccda92 | 2014-02-24 18:19:31 +0000 | [diff] [blame] | 810 | |
James Molloy | 6045cc8 | 2015-12-15 09:24:01 +0000 | [diff] [blame] | 811 | // Now that we've optimized loops (in particular loop induction variables), |
| 812 | // we may have exposed more scalar opportunities. Run parts of the scalar |
| 813 | // optimizer again at this point. |
Matthias Braun | c31032d | 2016-03-09 18:47:11 +0000 | [diff] [blame] | 814 | addInstructionCombiningPass(PM); // Initial cleanup |
James Molloy | 6045cc8 | 2015-12-15 09:24:01 +0000 | [diff] [blame] | 815 | PM.add(createCFGSimplificationPass()); // if-convert |
| 816 | PM.add(createSCCPPass()); // Propagate exposed constants |
Matthias Braun | c31032d | 2016-03-09 18:47:11 +0000 | [diff] [blame] | 817 | addInstructionCombiningPass(PM); // Clean up again |
James Molloy | 6045cc8 | 2015-12-15 09:24:01 +0000 | [diff] [blame] | 818 | PM.add(createBitTrackingDCEPass()); |
| 819 | |
Yi Jiang | 79eb0aa | 2014-05-05 23:14:46 +0000 | [diff] [blame] | 820 | // More scalar chains could be vectorized due to more alias information |
JF Bastien | f42a6ea | 2014-10-21 23:18:21 +0000 | [diff] [blame] | 821 | if (RunSLPAfterLoopVectorization) |
| 822 | if (SLPVectorize) |
| 823 | PM.add(createSLPVectorizerPass()); // Vectorize parallel scalar chains. |
Yi Jiang | 79eb0aa | 2014-05-05 23:14:46 +0000 | [diff] [blame] | 824 | |
Hal Finkel | d67e463 | 2014-09-07 20:05:11 +0000 | [diff] [blame] | 825 | // After vectorization, assume intrinsics may tell us more about pointer |
| 826 | // alignments. |
| 827 | PM.add(createAlignmentFromAssumptionsPass()); |
| 828 | |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 829 | // Cleanup and simplify the code after the scalar optimizations. |
Matthias Braun | c31032d | 2016-03-09 18:47:11 +0000 | [diff] [blame] | 830 | addInstructionCombiningPass(PM); |
Peter Collingbourne | 0a43761 | 2014-05-25 10:27:02 +0000 | [diff] [blame] | 831 | addExtensionsToPM(EP_Peephole, PM); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 832 | |
| 833 | PM.add(createJumpThreadingPass()); |
Peter Collingbourne | 070843d | 2015-03-19 22:01:00 +0000 | [diff] [blame] | 834 | } |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 835 | |
Peter Collingbourne | 070843d | 2015-03-19 22:01:00 +0000 | [diff] [blame] | 836 | void PassManagerBuilder::addLateLTOOptimizationPasses( |
| 837 | legacy::PassManagerBase &PM) { |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 838 | // Delete basic blocks, which optimization passes may have killed. |
Tom Stellard | aa664d9 | 2013-08-06 02:43:45 +0000 | [diff] [blame] | 839 | PM.add(createCFGSimplificationPass()); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 840 | |
Teresa Johnson | c4279a7 | 2015-08-11 16:26:41 +0000 | [diff] [blame] | 841 | // Drop bodies of available externally objects to improve GlobalDCE. |
| 842 | PM.add(createEliminateAvailableExternallyPass()); |
| 843 | |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 844 | // Now that we have optimized the program, discard unreachable functions. |
| 845 | PM.add(createGlobalDCEPass()); |
Nick Lewycky | 9e6d184 | 2014-09-13 21:46:00 +0000 | [diff] [blame] | 846 | |
| 847 | // FIXME: this is profitable (for compiler time) to do at -O0 too, but |
| 848 | // currently it damages debug info. |
| 849 | if (MergeFunctions) |
| 850 | PM.add(createMergeFunctionsPass()); |
Rafael Espindola | 3ea478b | 2011-08-02 21:50:27 +0000 | [diff] [blame] | 851 | } |
Rafael Espindola | 07f60915 | 2011-08-09 22:17:34 +0000 | [diff] [blame] | 852 | |
Mehdi Amini | 1db10ac | 2016-02-16 23:02:29 +0000 | [diff] [blame] | 853 | void PassManagerBuilder::populateThinLTOPassManager( |
| 854 | legacy::PassManagerBase &PM) { |
| 855 | PerformThinLTO = true; |
| 856 | |
| 857 | if (VerifyInput) |
| 858 | PM.add(createVerifierPass()); |
| 859 | |
Peter Collingbourne | f7691d8 | 2017-03-22 18:22:59 +0000 | [diff] [blame] | 860 | if (ImportSummary) { |
Peter Collingbourne | 08eb081 | 2017-02-15 23:48:38 +0000 | [diff] [blame] | 861 | // These passes import type identifier resolutions for whole-program |
| 862 | // devirtualization and CFI. They must run early because other passes may |
| 863 | // disturb the specific instruction patterns that these passes look for, |
| 864 | // creating dependencies on resolutions that may not appear in the summary. |
| 865 | // |
| 866 | // For example, GVN may transform the pattern assume(type.test) appearing in |
| 867 | // two basic blocks into assume(phi(type.test, type.test)), which would |
| 868 | // transform a dependency on a WPD resolution into a dependency on a type |
| 869 | // identifier resolution for CFI. |
| 870 | // |
| 871 | // Also, WPD has access to more precise information than ICP and can |
| 872 | // devirtualize more effectively, so it should operate on the IR first. |
Peter Collingbourne | f7691d8 | 2017-03-22 18:22:59 +0000 | [diff] [blame] | 873 | PM.add(createWholeProgramDevirtPass(nullptr, ImportSummary)); |
| 874 | PM.add(createLowerTypeTestsPass(nullptr, ImportSummary)); |
Peter Collingbourne | 08eb081 | 2017-02-15 23:48:38 +0000 | [diff] [blame] | 875 | } |
Peter Collingbourne | e02b74e | 2017-01-20 22:18:52 +0000 | [diff] [blame] | 876 | |
Mehdi Amini | 1db10ac | 2016-02-16 23:02:29 +0000 | [diff] [blame] | 877 | populateModulePassManager(PM); |
| 878 | |
| 879 | if (VerifyOutput) |
| 880 | PM.add(createVerifierPass()); |
| 881 | PerformThinLTO = false; |
| 882 | } |
| 883 | |
Chandler Carruth | 30d69c2 | 2015-02-13 10:01:29 +0000 | [diff] [blame] | 884 | void PassManagerBuilder::populateLTOPassManager(legacy::PassManagerBase &PM) { |
Rafael Espindola | 7cebf36 | 2014-08-21 20:03:44 +0000 | [diff] [blame] | 885 | if (LibraryInfo) |
Chandler Carruth | b98f63d | 2015-01-15 10:41:28 +0000 | [diff] [blame] | 886 | PM.add(new TargetLibraryInfoWrapperPass(*LibraryInfo)); |
Rafael Espindola | 7cebf36 | 2014-08-21 20:03:44 +0000 | [diff] [blame] | 887 | |
Duncan P. N. Exon Smith | ab58a56 | 2015-03-19 22:24:17 +0000 | [diff] [blame] | 888 | if (VerifyInput) |
Rafael Espindola | 7cebf36 | 2014-08-21 20:03:44 +0000 | [diff] [blame] | 889 | PM.add(createVerifierPass()); |
Rafael Espindola | 7cebf36 | 2014-08-21 20:03:44 +0000 | [diff] [blame] | 890 | |
Peter Collingbourne | df49d1b | 2016-02-09 22:50:34 +0000 | [diff] [blame] | 891 | if (OptLevel != 0) |
Rafael Espindola | 7cebf36 | 2014-08-21 20:03:44 +0000 | [diff] [blame] | 892 | addLTOOptimizationPasses(PM); |
Peter Collingbourne | 7730b24 | 2017-05-26 18:27:13 +0000 | [diff] [blame] | 893 | else { |
| 894 | // The whole-program-devirt pass needs to run at -O0 because only it knows |
| 895 | // about the llvm.type.checked.load intrinsic: it needs to both lower the |
| 896 | // intrinsic itself and handle it in the summary. |
| 897 | PM.add(createWholeProgramDevirtPass(ExportSummary, nullptr)); |
| 898 | } |
Rafael Espindola | 7cebf36 | 2014-08-21 20:03:44 +0000 | [diff] [blame] | 899 | |
Evgeniy Stepanov | 67849d5 | 2015-12-15 23:00:08 +0000 | [diff] [blame] | 900 | // Create a function that performs CFI checks for cross-DSO calls with targets |
| 901 | // in the current module. |
| 902 | PM.add(createCrossDSOCFIPass()); |
| 903 | |
Peter Collingbourne | 7efd750 | 2016-06-24 21:21:32 +0000 | [diff] [blame] | 904 | // Lower type metadata and the type.test intrinsic. This pass supports Clang's |
| 905 | // control flow integrity mechanisms (-fsanitize=cfi*) and needs to run at |
| 906 | // link time if CFI is enabled. The pass does nothing if CFI is disabled. |
Peter Collingbourne | f7691d8 | 2017-03-22 18:22:59 +0000 | [diff] [blame] | 907 | PM.add(createLowerTypeTestsPass(ExportSummary, nullptr)); |
Peter Collingbourne | 070843d | 2015-03-19 22:01:00 +0000 | [diff] [blame] | 908 | |
| 909 | if (OptLevel != 0) |
| 910 | addLateLTOOptimizationPasses(PM); |
| 911 | |
Duncan P. N. Exon Smith | ab58a56 | 2015-03-19 22:24:17 +0000 | [diff] [blame] | 912 | if (VerifyOutput) |
Rafael Espindola | 7cebf36 | 2014-08-21 20:03:44 +0000 | [diff] [blame] | 913 | PM.add(createVerifierPass()); |
Rafael Espindola | 7cebf36 | 2014-08-21 20:03:44 +0000 | [diff] [blame] | 914 | } |
| 915 | |
Eric Christopher | 04d4e93 | 2013-04-22 22:47:22 +0000 | [diff] [blame] | 916 | inline PassManagerBuilder *unwrap(LLVMPassManagerBuilderRef P) { |
| 917 | return reinterpret_cast<PassManagerBuilder*>(P); |
| 918 | } |
| 919 | |
| 920 | inline LLVMPassManagerBuilderRef wrap(PassManagerBuilder *P) { |
| 921 | return reinterpret_cast<LLVMPassManagerBuilderRef>(P); |
| 922 | } |
| 923 | |
Dmitri Gribenko | 0011bbf | 2012-11-15 16:51:49 +0000 | [diff] [blame] | 924 | LLVMPassManagerBuilderRef LLVMPassManagerBuilderCreate() { |
Rafael Espindola | 07f60915 | 2011-08-09 22:17:34 +0000 | [diff] [blame] | 925 | PassManagerBuilder *PMB = new PassManagerBuilder(); |
| 926 | return wrap(PMB); |
| 927 | } |
| 928 | |
| 929 | void LLVMPassManagerBuilderDispose(LLVMPassManagerBuilderRef PMB) { |
| 930 | PassManagerBuilder *Builder = unwrap(PMB); |
| 931 | delete Builder; |
| 932 | } |
| 933 | |
| 934 | void |
| 935 | LLVMPassManagerBuilderSetOptLevel(LLVMPassManagerBuilderRef PMB, |
| 936 | unsigned OptLevel) { |
| 937 | PassManagerBuilder *Builder = unwrap(PMB); |
| 938 | Builder->OptLevel = OptLevel; |
| 939 | } |
| 940 | |
| 941 | void |
| 942 | LLVMPassManagerBuilderSetSizeLevel(LLVMPassManagerBuilderRef PMB, |
| 943 | unsigned SizeLevel) { |
| 944 | PassManagerBuilder *Builder = unwrap(PMB); |
| 945 | Builder->SizeLevel = SizeLevel; |
| 946 | } |
| 947 | |
| 948 | void |
| 949 | LLVMPassManagerBuilderSetDisableUnitAtATime(LLVMPassManagerBuilderRef PMB, |
| 950 | LLVMBool Value) { |
Davide Italiano | c74ea93 | 2017-10-06 04:39:40 +0000 | [diff] [blame] | 951 | // NOTE: The DisableUnitAtATime switch has been removed. |
Rafael Espindola | 07f60915 | 2011-08-09 22:17:34 +0000 | [diff] [blame] | 952 | } |
| 953 | |
| 954 | void |
| 955 | LLVMPassManagerBuilderSetDisableUnrollLoops(LLVMPassManagerBuilderRef PMB, |
| 956 | LLVMBool Value) { |
| 957 | PassManagerBuilder *Builder = unwrap(PMB); |
| 958 | Builder->DisableUnrollLoops = Value; |
| 959 | } |
| 960 | |
| 961 | void |
| 962 | LLVMPassManagerBuilderSetDisableSimplifyLibCalls(LLVMPassManagerBuilderRef PMB, |
| 963 | LLVMBool Value) { |
Meador Inge | dfb08a2 | 2013-06-20 19:48:07 +0000 | [diff] [blame] | 964 | // NOTE: The simplify-libcalls pass has been removed. |
Rafael Espindola | 07f60915 | 2011-08-09 22:17:34 +0000 | [diff] [blame] | 965 | } |
| 966 | |
| 967 | void |
| 968 | LLVMPassManagerBuilderUseInlinerWithThreshold(LLVMPassManagerBuilderRef PMB, |
| 969 | unsigned Threshold) { |
| 970 | PassManagerBuilder *Builder = unwrap(PMB); |
| 971 | Builder->Inliner = createFunctionInliningPass(Threshold); |
| 972 | } |
| 973 | |
| 974 | void |
| 975 | LLVMPassManagerBuilderPopulateFunctionPassManager(LLVMPassManagerBuilderRef PMB, |
| 976 | LLVMPassManagerRef PM) { |
| 977 | PassManagerBuilder *Builder = unwrap(PMB); |
Chandler Carruth | 30d69c2 | 2015-02-13 10:01:29 +0000 | [diff] [blame] | 978 | legacy::FunctionPassManager *FPM = unwrap<legacy::FunctionPassManager>(PM); |
Rafael Espindola | 07f60915 | 2011-08-09 22:17:34 +0000 | [diff] [blame] | 979 | Builder->populateFunctionPassManager(*FPM); |
| 980 | } |
| 981 | |
| 982 | void |
| 983 | LLVMPassManagerBuilderPopulateModulePassManager(LLVMPassManagerBuilderRef PMB, |
| 984 | LLVMPassManagerRef PM) { |
| 985 | PassManagerBuilder *Builder = unwrap(PMB); |
Chandler Carruth | 30d69c2 | 2015-02-13 10:01:29 +0000 | [diff] [blame] | 986 | legacy::PassManagerBase *MPM = unwrap(PM); |
Rafael Espindola | 07f60915 | 2011-08-09 22:17:34 +0000 | [diff] [blame] | 987 | Builder->populateModulePassManager(*MPM); |
| 988 | } |
| 989 | |
| 990 | void LLVMPassManagerBuilderPopulateLTOPassManager(LLVMPassManagerBuilderRef PMB, |
| 991 | LLVMPassManagerRef PM, |
Nick Lewycky | 5f50854 | 2013-03-10 21:58:22 +0000 | [diff] [blame] | 992 | LLVMBool Internalize, |
| 993 | LLVMBool RunInliner) { |
Rafael Espindola | 07f60915 | 2011-08-09 22:17:34 +0000 | [diff] [blame] | 994 | PassManagerBuilder *Builder = unwrap(PMB); |
Chandler Carruth | 30d69c2 | 2015-02-13 10:01:29 +0000 | [diff] [blame] | 995 | legacy::PassManagerBase *LPM = unwrap(PM); |
Rafael Espindola | e07caad | 2014-08-21 13:35:30 +0000 | [diff] [blame] | 996 | |
| 997 | // A small backwards compatibility hack. populateLTOPassManager used to take |
| 998 | // an RunInliner option. |
| 999 | if (RunInliner && !Builder->Inliner) |
| 1000 | Builder->Inliner = createFunctionInliningPass(); |
| 1001 | |
| 1002 | Builder->populateLTOPassManager(*LPM); |
Rafael Espindola | 07f60915 | 2011-08-09 22:17:34 +0000 | [diff] [blame] | 1003 | } |