Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 1 | //===- FunctionImport.cpp - ThinLTO Summary-based Function Import ---------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file implements Function import based on summaries. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| 14 | #include "llvm/Transforms/IPO/FunctionImport.h" |
| 15 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 16 | #include "llvm/ADT/SmallVector.h" |
Teresa Johnson | d29478f | 2016-03-27 15:27:30 +0000 | [diff] [blame] | 17 | #include "llvm/ADT/Statistic.h" |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 18 | #include "llvm/ADT/StringSet.h" |
| 19 | #include "llvm/IR/AutoUpgrade.h" |
| 20 | #include "llvm/IR/DiagnosticPrinter.h" |
| 21 | #include "llvm/IR/IntrinsicInst.h" |
| 22 | #include "llvm/IR/Module.h" |
| 23 | #include "llvm/IRReader/IRReader.h" |
| 24 | #include "llvm/Linker/Linker.h" |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 25 | #include "llvm/Object/ModuleSummaryIndexObjectFile.h" |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 26 | #include "llvm/Support/CommandLine.h" |
| 27 | #include "llvm/Support/Debug.h" |
| 28 | #include "llvm/Support/SourceMgr.h" |
Teresa Johnson | 488a800 | 2016-02-10 18:11:31 +0000 | [diff] [blame] | 29 | #include "llvm/Transforms/Utils/FunctionImportUtils.h" |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 30 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 31 | #define DEBUG_TYPE "function-import" |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 32 | |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 33 | using namespace llvm; |
| 34 | |
Teresa Johnson | d29478f | 2016-03-27 15:27:30 +0000 | [diff] [blame] | 35 | STATISTIC(NumImported, "Number of functions imported"); |
| 36 | |
Teresa Johnson | 3930361 | 2015-11-24 22:55:46 +0000 | [diff] [blame] | 37 | /// Limit on instruction count of imported functions. |
| 38 | static cl::opt<unsigned> ImportInstrLimit( |
| 39 | "import-instr-limit", cl::init(100), cl::Hidden, cl::value_desc("N"), |
| 40 | cl::desc("Only import functions with less than N instructions")); |
| 41 | |
Mehdi Amini | 4064174 | 2016-02-10 23:31:45 +0000 | [diff] [blame] | 42 | static cl::opt<float> |
| 43 | ImportInstrFactor("import-instr-evolution-factor", cl::init(0.7), |
| 44 | cl::Hidden, cl::value_desc("x"), |
| 45 | cl::desc("As we import functions, multiply the " |
| 46 | "`import-instr-limit` threshold by this factor " |
| 47 | "before processing newly imported functions")); |
| 48 | |
Teresa Johnson | d29478f | 2016-03-27 15:27:30 +0000 | [diff] [blame] | 49 | static cl::opt<bool> PrintImports("print-imports", cl::init(false), cl::Hidden, |
| 50 | cl::desc("Print imported functions")); |
| 51 | |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 52 | // Load lazily a module from \p FileName in \p Context. |
| 53 | static std::unique_ptr<Module> loadFile(const std::string &FileName, |
| 54 | LLVMContext &Context) { |
| 55 | SMDiagnostic Err; |
| 56 | DEBUG(dbgs() << "Loading '" << FileName << "'\n"); |
Teresa Johnson | 6cba37c | 2016-01-22 00:15:53 +0000 | [diff] [blame] | 57 | // Metadata isn't loaded until functions are imported, to minimize |
| 58 | // the memory overhead. |
Teresa Johnson | a1080ee | 2016-01-08 14:17:41 +0000 | [diff] [blame] | 59 | std::unique_ptr<Module> Result = |
| 60 | getLazyIRFileModule(FileName, Err, Context, |
| 61 | /* ShouldLazyLoadMetadata = */ true); |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 62 | if (!Result) { |
| 63 | Err.print("function-import", errs()); |
Mehdi Amini | d7ad221 | 2016-04-01 05:33:11 +0000 | [diff] [blame] | 64 | report_fatal_error("Abort"); |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 65 | } |
| 66 | |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 67 | return Result; |
| 68 | } |
| 69 | |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 70 | namespace { |
Mehdi Amini | 4064174 | 2016-02-10 23:31:45 +0000 | [diff] [blame] | 71 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 72 | /// Given a list of possible callee implementation for a call site, select one |
| 73 | /// that fits the \p Threshold. |
| 74 | /// |
| 75 | /// FIXME: select "best" instead of first that fits. But what is "best"? |
| 76 | /// - The smallest: more likely to be inlined. |
| 77 | /// - The one with the least outgoing edges (already well optimized). |
| 78 | /// - One from a module already being imported from in order to reduce the |
| 79 | /// number of source modules parsed/linked. |
| 80 | /// - One that has PGO data attached. |
| 81 | /// - [insert you fancy metric here] |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 82 | static const GlobalValueSummary * |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 83 | selectCallee(const GlobalValueInfoList &CalleeInfoList, unsigned Threshold) { |
| 84 | auto It = llvm::find_if( |
| 85 | CalleeInfoList, [&](const std::unique_ptr<GlobalValueInfo> &GlobInfo) { |
| 86 | assert(GlobInfo->summary() && |
| 87 | "We should not have a Global Info without summary"); |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 88 | auto *GVSummary = GlobInfo->summary(); |
Mehdi Amini | 2c719cc | 2016-04-20 04:17:36 +0000 | [diff] [blame] | 89 | if (GlobalValue::isWeakAnyLinkage(GVSummary->linkage())) |
| 90 | // There is no point in importing weak symbols, we can't inline them |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 91 | return false; |
Mehdi Amini | 2c719cc | 2016-04-20 04:17:36 +0000 | [diff] [blame] | 92 | if (auto *AS = dyn_cast<AliasSummary>(GVSummary)) { |
| 93 | GVSummary = &AS->getAliasee(); |
| 94 | // Alias can't point to "available_externally". However when we import |
| 95 | // linkOnceODR the linkage does not change. So we import the alias |
| 96 | // and aliasee only in this case. |
| 97 | // FIXME: we should import alias as available_externally *function*, |
| 98 | // the destination module does need to know it is an alias. |
| 99 | if (!GlobalValue::isLinkOnceODRLinkage(GVSummary->linkage())) |
| 100 | return false; |
| 101 | } |
| 102 | |
| 103 | auto *Summary = cast<FunctionSummary>(GVSummary); |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 104 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 105 | if (Summary->instCount() > Threshold) |
| 106 | return false; |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 107 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 108 | return true; |
| 109 | }); |
| 110 | if (It == CalleeInfoList.end()) |
| 111 | return nullptr; |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 112 | |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 113 | return cast<GlobalValueSummary>((*It)->summary()); |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 114 | } |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 115 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 116 | /// Return the summary for the function \p GUID that fits the \p Threshold, or |
| 117 | /// null if there's no match. |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 118 | static const GlobalValueSummary *selectCallee(GlobalValue::GUID GUID, |
| 119 | unsigned Threshold, |
| 120 | const ModuleSummaryIndex &Index) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 121 | auto CalleeInfoList = Index.findGlobalValueInfoList(GUID); |
| 122 | if (CalleeInfoList == Index.end()) { |
| 123 | return nullptr; // This function does not have a summary |
| 124 | } |
| 125 | return selectCallee(CalleeInfoList->second, Threshold); |
| 126 | } |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 127 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 128 | /// Return true if the global \p GUID is exported by module \p ExportModulePath. |
| 129 | static bool isGlobalExported(const ModuleSummaryIndex &Index, |
Mehdi Amini | ad5741b | 2016-04-02 05:07:53 +0000 | [diff] [blame] | 130 | StringRef ExportModulePath, |
| 131 | GlobalValue::GUID GUID) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 132 | auto CalleeInfoList = Index.findGlobalValueInfoList(GUID); |
| 133 | if (CalleeInfoList == Index.end()) |
| 134 | // This global does not have a summary, it is not part of the ThinLTO |
| 135 | // process |
| 136 | return false; |
| 137 | auto DefinedInCalleeModule = llvm::find_if( |
| 138 | CalleeInfoList->second, |
| 139 | [&](const std::unique_ptr<GlobalValueInfo> &GlobInfo) { |
| 140 | auto *Summary = GlobInfo->summary(); |
| 141 | assert(Summary && "Unexpected GlobalValueInfo without summary"); |
| 142 | return Summary->modulePath() == ExportModulePath; |
| 143 | }); |
| 144 | return (DefinedInCalleeModule != CalleeInfoList->second.end()); |
| 145 | } |
Mehdi Amini | 4064174 | 2016-02-10 23:31:45 +0000 | [diff] [blame] | 146 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 147 | using EdgeInfo = std::pair<const FunctionSummary *, unsigned /* Threshold */>; |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 148 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 149 | /// Compute the list of functions to import for a given caller. Mark these |
| 150 | /// imported functions and the symbols they reference in their source module as |
| 151 | /// exported from their source module. |
| 152 | static void computeImportForFunction( |
Teresa Johnson | 3255eec | 2016-04-10 15:17:26 +0000 | [diff] [blame] | 153 | const FunctionSummary &Summary, const ModuleSummaryIndex &Index, |
| 154 | unsigned Threshold, |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 155 | const std::map<GlobalValue::GUID, GlobalValueSummary *> &DefinedGVSummaries, |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 156 | SmallVectorImpl<EdgeInfo> &Worklist, |
| 157 | FunctionImporter::ImportMapTy &ImportsForModule, |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 158 | StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 159 | for (auto &Edge : Summary.calls()) { |
Teresa Johnson | 2d5487c | 2016-04-11 13:58:45 +0000 | [diff] [blame] | 160 | auto GUID = Edge.first.getGUID(); |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 161 | DEBUG(dbgs() << " edge -> " << GUID << " Threshold:" << Threshold << "\n"); |
| 162 | |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 163 | if (DefinedGVSummaries.count(GUID)) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 164 | DEBUG(dbgs() << "ignored! Target already in destination module.\n"); |
| 165 | continue; |
Teresa Johnson | d450da3 | 2015-11-24 21:15:19 +0000 | [diff] [blame] | 166 | } |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 167 | |
| 168 | auto *CalleeSummary = selectCallee(GUID, Threshold, Index); |
| 169 | if (!CalleeSummary) { |
| 170 | DEBUG(dbgs() << "ignored! No qualifying callee with summary found.\n"); |
| 171 | continue; |
| 172 | } |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 173 | // "Resolve" the summary, traversing alias, |
| 174 | const FunctionSummary *ResolvedCalleeSummary; |
Mehdi Amini | 6968ef7 | 2016-04-20 01:04:20 +0000 | [diff] [blame] | 175 | if (isa<AliasSummary>(CalleeSummary)) { |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 176 | ResolvedCalleeSummary = cast<FunctionSummary>( |
| 177 | &cast<AliasSummary>(CalleeSummary)->getAliasee()); |
Mehdi Amini | 2c719cc | 2016-04-20 04:17:36 +0000 | [diff] [blame] | 178 | assert( |
| 179 | GlobalValue::isLinkOnceODRLinkage(ResolvedCalleeSummary->linkage()) && |
| 180 | "Unexpected alias to a non-linkonceODR in import list"); |
Mehdi Amini | 6968ef7 | 2016-04-20 01:04:20 +0000 | [diff] [blame] | 181 | } else |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 182 | ResolvedCalleeSummary = cast<FunctionSummary>(CalleeSummary); |
| 183 | |
| 184 | assert(ResolvedCalleeSummary->instCount() <= Threshold && |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 185 | "selectCallee() didn't honor the threshold"); |
| 186 | |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 187 | auto ExportModulePath = ResolvedCalleeSummary->modulePath(); |
| 188 | auto &ProcessedThreshold = ImportsForModule[ExportModulePath][GUID]; |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 189 | /// Since the traversal of the call graph is DFS, we can revisit a function |
| 190 | /// a second time with a higher threshold. In this case, it is added back to |
| 191 | /// the worklist with the new threshold. |
| 192 | if (ProcessedThreshold && ProcessedThreshold > Threshold) { |
| 193 | DEBUG(dbgs() << "ignored! Target was already seen with Threshold " |
| 194 | << ProcessedThreshold << "\n"); |
| 195 | continue; |
| 196 | } |
| 197 | // Mark this function as imported in this module, with the current Threshold |
| 198 | ProcessedThreshold = Threshold; |
| 199 | |
| 200 | // Make exports in the source module. |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 201 | if (ExportLists) { |
Mehdi Amini | ef7555f | 2016-04-13 01:52:32 +0000 | [diff] [blame] | 202 | auto &ExportList = (*ExportLists)[ExportModulePath]; |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 203 | ExportList.insert(GUID); |
| 204 | // Mark all functions and globals referenced by this function as exported |
| 205 | // to the outside if they are defined in the same source module. |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 206 | for (auto &Edge : ResolvedCalleeSummary->calls()) { |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 207 | auto CalleeGUID = Edge.first.getGUID(); |
| 208 | if (isGlobalExported(Index, ExportModulePath, CalleeGUID)) |
| 209 | ExportList.insert(CalleeGUID); |
| 210 | } |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 211 | for (auto &Ref : ResolvedCalleeSummary->refs()) { |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 212 | auto GUID = Ref.getGUID(); |
| 213 | if (isGlobalExported(Index, ExportModulePath, GUID)) |
| 214 | ExportList.insert(GUID); |
| 215 | } |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 216 | } |
| 217 | |
| 218 | // Insert the newly imported function to the worklist. |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 219 | Worklist.push_back(std::make_pair(ResolvedCalleeSummary, Threshold)); |
Teresa Johnson | d450da3 | 2015-11-24 21:15:19 +0000 | [diff] [blame] | 220 | } |
| 221 | } |
| 222 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 223 | /// Given the list of globals defined in a module, compute the list of imports |
| 224 | /// as well as the list of "exports", i.e. the list of symbols referenced from |
| 225 | /// another module (that may require promotion). |
| 226 | static void ComputeImportForModule( |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 227 | const std::map<GlobalValue::GUID, GlobalValueSummary *> &DefinedGVSummaries, |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 228 | const ModuleSummaryIndex &Index, |
| 229 | FunctionImporter::ImportMapTy &ImportsForModule, |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 230 | StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 231 | // Worklist contains the list of function imported in this module, for which |
| 232 | // we will analyse the callees and may import further down the callgraph. |
| 233 | SmallVector<EdgeInfo, 128> Worklist; |
| 234 | |
| 235 | // Populate the worklist with the import for the functions in the current |
| 236 | // module |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 237 | for (auto &GVInfo : DefinedGVSummaries) { |
| 238 | auto *Summary = GVInfo.second; |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 239 | if (auto *AS = dyn_cast<AliasSummary>(Summary)) |
| 240 | Summary = &AS->getAliasee(); |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 241 | auto *FuncSummary = dyn_cast<FunctionSummary>(Summary); |
| 242 | if (!FuncSummary) |
| 243 | // Skip import for global variables |
| 244 | continue; |
| 245 | DEBUG(dbgs() << "Initalize import for " << GVInfo.first << "\n"); |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 246 | computeImportForFunction(*FuncSummary, Index, ImportInstrLimit, |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 247 | DefinedGVSummaries, Worklist, ImportsForModule, |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 248 | ExportLists); |
| 249 | } |
| 250 | |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 251 | while (!Worklist.empty()) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 252 | auto FuncInfo = Worklist.pop_back_val(); |
| 253 | auto *Summary = FuncInfo.first; |
| 254 | auto Threshold = FuncInfo.second; |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 255 | |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 256 | // Process the newly imported functions and add callees to the worklist. |
Mehdi Amini | 4064174 | 2016-02-10 23:31:45 +0000 | [diff] [blame] | 257 | // Adjust the threshold |
| 258 | Threshold = Threshold * ImportInstrFactor; |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 259 | |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 260 | computeImportForFunction(*Summary, Index, Threshold, DefinedGVSummaries, |
Teresa Johnson | 3255eec | 2016-04-10 15:17:26 +0000 | [diff] [blame] | 261 | Worklist, ImportsForModule, ExportLists); |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 262 | } |
Mehdi Amini | c8c5517 | 2015-12-03 02:37:33 +0000 | [diff] [blame] | 263 | } |
Mehdi Amini | ffe2e4a | 2015-12-02 04:34:28 +0000 | [diff] [blame] | 264 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 265 | } // anonymous namespace |
| 266 | |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 267 | /// Compute all the import and export for every module using the Index. |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 268 | void llvm::ComputeCrossModuleImport( |
| 269 | const ModuleSummaryIndex &Index, |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 270 | const StringMap<std::map<GlobalValue::GUID, GlobalValueSummary *>> & |
| 271 | ModuleToDefinedGVSummaries, |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 272 | StringMap<FunctionImporter::ImportMapTy> &ImportLists, |
| 273 | StringMap<FunctionImporter::ExportSetTy> &ExportLists) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 274 | // For each module that has function defined, compute the import/export lists. |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 275 | for (auto &DefinedGVSummaries : ModuleToDefinedGVSummaries) { |
| 276 | auto &ImportsForModule = ImportLists[DefinedGVSummaries.first()]; |
| 277 | DEBUG(dbgs() << "Computing import for Module '" |
| 278 | << DefinedGVSummaries.first() << "'\n"); |
| 279 | ComputeImportForModule(DefinedGVSummaries.second, Index, ImportsForModule, |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 280 | &ExportLists); |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 281 | } |
| 282 | |
| 283 | #ifndef NDEBUG |
| 284 | DEBUG(dbgs() << "Import/Export lists for " << ImportLists.size() |
| 285 | << " modules:\n"); |
| 286 | for (auto &ModuleImports : ImportLists) { |
| 287 | auto ModName = ModuleImports.first(); |
| 288 | auto &Exports = ExportLists[ModName]; |
| 289 | DEBUG(dbgs() << "* Module " << ModName << " exports " << Exports.size() |
| 290 | << " functions. Imports from " << ModuleImports.second.size() |
| 291 | << " modules.\n"); |
| 292 | for (auto &Src : ModuleImports.second) { |
| 293 | auto SrcModName = Src.first(); |
| 294 | DEBUG(dbgs() << " - " << Src.second.size() << " functions imported from " |
| 295 | << SrcModName << "\n"); |
| 296 | } |
| 297 | } |
| 298 | #endif |
| 299 | } |
| 300 | |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 301 | /// Compute all the imports for the given module in the Index. |
| 302 | void llvm::ComputeCrossModuleImportForModule( |
| 303 | StringRef ModulePath, const ModuleSummaryIndex &Index, |
| 304 | FunctionImporter::ImportMapTy &ImportList) { |
| 305 | |
| 306 | // Collect the list of functions this module defines. |
| 307 | // GUID -> Summary |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 308 | std::map<GlobalValue::GUID, GlobalValueSummary *> FunctionInfoMap; |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 309 | Index.collectDefinedFunctionsForModule(ModulePath, FunctionInfoMap); |
| 310 | |
| 311 | // Compute the import list for this module. |
| 312 | DEBUG(dbgs() << "Computing import for Module '" << ModulePath << "'\n"); |
| 313 | ComputeImportForModule(FunctionInfoMap, Index, ImportList); |
| 314 | |
| 315 | #ifndef NDEBUG |
| 316 | DEBUG(dbgs() << "* Module " << ModulePath << " imports from " |
| 317 | << ImportList.size() << " modules.\n"); |
| 318 | for (auto &Src : ImportList) { |
| 319 | auto SrcModName = Src.first(); |
| 320 | DEBUG(dbgs() << " - " << Src.second.size() << " functions imported from " |
| 321 | << SrcModName << "\n"); |
| 322 | } |
| 323 | #endif |
| 324 | } |
| 325 | |
Mehdi Amini | c8c5517 | 2015-12-03 02:37:33 +0000 | [diff] [blame] | 326 | // Automatically import functions in Module \p DestModule based on the summaries |
| 327 | // index. |
| 328 | // |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 329 | bool FunctionImporter::importFunctions( |
| 330 | Module &DestModule, const FunctionImporter::ImportMapTy &ImportList) { |
Mehdi Amini | 5411d05 | 2015-12-08 23:04:19 +0000 | [diff] [blame] | 331 | DEBUG(dbgs() << "Starting import for Module " |
Mehdi Amini | 311fef6 | 2015-12-03 02:58:14 +0000 | [diff] [blame] | 332 | << DestModule.getModuleIdentifier() << "\n"); |
Mehdi Amini | c8c5517 | 2015-12-03 02:37:33 +0000 | [diff] [blame] | 333 | unsigned ImportedCount = 0; |
| 334 | |
Mehdi Amini | c8c5517 | 2015-12-03 02:37:33 +0000 | [diff] [blame] | 335 | // Linker that will be used for importing function |
Rafael Espindola | 9d2bfc4 | 2015-12-14 23:17:03 +0000 | [diff] [blame] | 336 | Linker TheLinker(DestModule); |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 337 | // Do the actual import of functions now, one Module at a time |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 338 | std::set<StringRef> ModuleNameOrderedList; |
| 339 | for (auto &FunctionsToImportPerModule : ImportList) { |
| 340 | ModuleNameOrderedList.insert(FunctionsToImportPerModule.first()); |
| 341 | } |
| 342 | for (auto &Name : ModuleNameOrderedList) { |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 343 | // Get the module for the import |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 344 | const auto &FunctionsToImportPerModule = ImportList.find(Name); |
| 345 | assert(FunctionsToImportPerModule != ImportList.end()); |
| 346 | std::unique_ptr<Module> SrcModule = ModuleLoader(Name); |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 347 | assert(&DestModule.getContext() == &SrcModule->getContext() && |
| 348 | "Context mismatch"); |
| 349 | |
Teresa Johnson | 6cba37c | 2016-01-22 00:15:53 +0000 | [diff] [blame] | 350 | // If modules were created with lazy metadata loading, materialize it |
| 351 | // now, before linking it (otherwise this will be a noop). |
| 352 | SrcModule->materializeMetadata(); |
| 353 | UpgradeDebugInfo(*SrcModule); |
Teresa Johnson | e5a6191 | 2015-12-17 17:14:09 +0000 | [diff] [blame] | 354 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 355 | auto &ImportGUIDs = FunctionsToImportPerModule->second; |
| 356 | // Find the globals to import |
| 357 | DenseSet<const GlobalValue *> GlobalsToImport; |
| 358 | for (auto &GV : *SrcModule) { |
Teresa Johnson | 0beb858 | 2016-04-04 18:52:23 +0000 | [diff] [blame] | 359 | if (!GV.hasName()) |
| 360 | continue; |
| 361 | auto GUID = GV.getGUID(); |
| 362 | auto Import = ImportGUIDs.count(GUID); |
Mehdi Amini | aeb1e59 | 2016-04-19 09:21:30 +0000 | [diff] [blame] | 363 | DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing function " << GUID |
| 364 | << " " << GV.getName() << " from " |
| 365 | << SrcModule->getSourceFileName() << "\n"); |
Teresa Johnson | 0beb858 | 2016-04-04 18:52:23 +0000 | [diff] [blame] | 366 | if (Import) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 367 | GV.materialize(); |
| 368 | GlobalsToImport.insert(&GV); |
| 369 | } |
| 370 | } |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 371 | for (auto &GV : SrcModule->globals()) { |
| 372 | if (!GV.hasName()) |
| 373 | continue; |
| 374 | auto GUID = GV.getGUID(); |
| 375 | auto Import = ImportGUIDs.count(GUID); |
Mehdi Amini | aeb1e59 | 2016-04-19 09:21:30 +0000 | [diff] [blame] | 376 | DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing global " << GUID |
| 377 | << " " << GV.getName() << " from " |
| 378 | << SrcModule->getSourceFileName() << "\n"); |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 379 | if (Import) { |
| 380 | GV.materialize(); |
| 381 | GlobalsToImport.insert(&GV); |
| 382 | } |
| 383 | } |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 384 | for (auto &GV : SrcModule->aliases()) { |
| 385 | if (!GV.hasName()) |
| 386 | continue; |
| 387 | auto GUID = GV.getGUID(); |
Teresa Johnson | 0beb858 | 2016-04-04 18:52:23 +0000 | [diff] [blame] | 388 | auto Import = ImportGUIDs.count(GUID); |
Mehdi Amini | aeb1e59 | 2016-04-19 09:21:30 +0000 | [diff] [blame] | 389 | DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing alias " << GUID |
| 390 | << " " << GV.getName() << " from " |
| 391 | << SrcModule->getSourceFileName() << "\n"); |
Teresa Johnson | 0beb858 | 2016-04-04 18:52:23 +0000 | [diff] [blame] | 392 | if (Import) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 393 | // Alias can't point to "available_externally". However when we import |
Teresa Johnson | 9aae395 | 2016-03-27 15:01:11 +0000 | [diff] [blame] | 394 | // linkOnceODR the linkage does not change. So we import the alias |
Mehdi Amini | 6968ef7 | 2016-04-20 01:04:20 +0000 | [diff] [blame] | 395 | // and aliasee only in this case. This has been handled by |
| 396 | // computeImportForFunction() |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 397 | GlobalObject *GO = GV.getBaseObject(); |
Mehdi Amini | 6968ef7 | 2016-04-20 01:04:20 +0000 | [diff] [blame] | 398 | assert(GO->hasLinkOnceODRLinkage() && |
| 399 | "Unexpected alias to a non-linkonceODR in import list"); |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 400 | #ifndef NDEBUG |
| 401 | if (!GlobalsToImport.count(GO)) |
| 402 | DEBUG(dbgs() << " alias triggers importing aliasee " << GO->getGUID() |
| 403 | << " " << GO->getName() << " from " |
| 404 | << SrcModule->getSourceFileName() << "\n"); |
| 405 | #endif |
| 406 | GO->materialize(); |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 407 | GlobalsToImport.insert(GO); |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 408 | GV.materialize(); |
| 409 | GlobalsToImport.insert(&GV); |
| 410 | } |
| 411 | } |
| 412 | |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 413 | // Link in the specified functions. |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 414 | if (renameModuleForThinLTO(*SrcModule, Index, &GlobalsToImport)) |
Mehdi Amini | 8d05185 | 2016-03-19 00:40:31 +0000 | [diff] [blame] | 415 | return true; |
| 416 | |
Teresa Johnson | d29478f | 2016-03-27 15:27:30 +0000 | [diff] [blame] | 417 | if (PrintImports) { |
| 418 | for (const auto *GV : GlobalsToImport) |
| 419 | dbgs() << DestModule.getSourceFileName() << ": Import " << GV->getName() |
| 420 | << " from " << SrcModule->getSourceFileName() << "\n"; |
| 421 | } |
| 422 | |
Rafael Espindola | 434e956 | 2015-12-16 23:16:33 +0000 | [diff] [blame] | 423 | if (TheLinker.linkInModule(std::move(SrcModule), Linker::Flags::None, |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 424 | &GlobalsToImport)) |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 425 | report_fatal_error("Function Import: link error"); |
| 426 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 427 | ImportedCount += GlobalsToImport.size(); |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 428 | } |
Teresa Johnson | e5a6191 | 2015-12-17 17:14:09 +0000 | [diff] [blame] | 429 | |
Teresa Johnson | d29478f | 2016-03-27 15:27:30 +0000 | [diff] [blame] | 430 | NumImported += ImportedCount; |
| 431 | |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 432 | DEBUG(dbgs() << "Imported " << ImportedCount << " functions for Module " |
Mehdi Amini | c8c5517 | 2015-12-03 02:37:33 +0000 | [diff] [blame] | 433 | << DestModule.getModuleIdentifier() << "\n"); |
| 434 | return ImportedCount; |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 435 | } |
| 436 | |
| 437 | /// Summary file to use for function importing when using -function-import from |
| 438 | /// the command line. |
| 439 | static cl::opt<std::string> |
| 440 | SummaryFile("summary-file", |
| 441 | cl::desc("The summary file to use for function importing.")); |
| 442 | |
| 443 | static void diagnosticHandler(const DiagnosticInfo &DI) { |
| 444 | raw_ostream &OS = errs(); |
| 445 | DiagnosticPrinterRawOStream DP(OS); |
| 446 | DI.print(DP); |
| 447 | OS << '\n'; |
| 448 | } |
| 449 | |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 450 | /// Parse the summary index out of an IR file and return the summary |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 451 | /// index object if found, or nullptr if not. |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 452 | static std::unique_ptr<ModuleSummaryIndex> |
| 453 | getModuleSummaryIndexForFile(StringRef Path, std::string &Error, |
| 454 | DiagnosticHandlerFunction DiagnosticHandler) { |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 455 | std::unique_ptr<MemoryBuffer> Buffer; |
| 456 | ErrorOr<std::unique_ptr<MemoryBuffer>> BufferOrErr = |
| 457 | MemoryBuffer::getFile(Path); |
| 458 | if (std::error_code EC = BufferOrErr.getError()) { |
| 459 | Error = EC.message(); |
| 460 | return nullptr; |
| 461 | } |
| 462 | Buffer = std::move(BufferOrErr.get()); |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 463 | ErrorOr<std::unique_ptr<object::ModuleSummaryIndexObjectFile>> ObjOrErr = |
| 464 | object::ModuleSummaryIndexObjectFile::create(Buffer->getMemBufferRef(), |
| 465 | DiagnosticHandler); |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 466 | if (std::error_code EC = ObjOrErr.getError()) { |
| 467 | Error = EC.message(); |
| 468 | return nullptr; |
| 469 | } |
| 470 | return (*ObjOrErr)->takeIndex(); |
| 471 | } |
| 472 | |
Benjamin Kramer | fe2b541 | 2015-12-24 10:03:35 +0000 | [diff] [blame] | 473 | namespace { |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 474 | /// Pass that performs cross-module function import provided a summary file. |
| 475 | class FunctionImportPass : public ModulePass { |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 476 | /// Optional module summary index to use for importing, otherwise |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 477 | /// the summary-file option must be specified. |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 478 | const ModuleSummaryIndex *Index; |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 479 | |
| 480 | public: |
| 481 | /// Pass identification, replacement for typeid |
| 482 | static char ID; |
| 483 | |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 484 | /// Specify pass name for debug output |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 485 | const char *getPassName() const override { return "Function Importing"; } |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 486 | |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 487 | explicit FunctionImportPass(const ModuleSummaryIndex *Index = nullptr) |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 488 | : ModulePass(ID), Index(Index) {} |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 489 | |
| 490 | bool runOnModule(Module &M) override { |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 491 | if (SummaryFile.empty() && !Index) |
| 492 | report_fatal_error("error: -function-import requires -summary-file or " |
| 493 | "file from frontend\n"); |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 494 | std::unique_ptr<ModuleSummaryIndex> IndexPtr; |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 495 | if (!SummaryFile.empty()) { |
| 496 | if (Index) |
| 497 | report_fatal_error("error: -summary-file and index from frontend\n"); |
| 498 | std::string Error; |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 499 | IndexPtr = |
| 500 | getModuleSummaryIndexForFile(SummaryFile, Error, diagnosticHandler); |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 501 | if (!IndexPtr) { |
| 502 | errs() << "Error loading file '" << SummaryFile << "': " << Error |
| 503 | << "\n"; |
| 504 | return false; |
| 505 | } |
| 506 | Index = IndexPtr.get(); |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 507 | } |
| 508 | |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 509 | // First step is collecting the import list. |
| 510 | FunctionImporter::ImportMapTy ImportList; |
| 511 | ComputeCrossModuleImportForModule(M.getModuleIdentifier(), *Index, |
| 512 | ImportList); |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 513 | |
| 514 | // Next we need to promote to global scope and rename any local values that |
Teresa Johnson | 1b00f2d | 2016-01-08 17:06:29 +0000 | [diff] [blame] | 515 | // are potentially exported to other modules. |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 516 | if (renameModuleForThinLTO(M, *Index, nullptr)) { |
Teresa Johnson | 1b00f2d | 2016-01-08 17:06:29 +0000 | [diff] [blame] | 517 | errs() << "Error renaming module\n"; |
| 518 | return false; |
| 519 | } |
| 520 | |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 521 | // Perform the import now. |
Mehdi Amini | d16c806 | 2015-12-08 22:39:40 +0000 | [diff] [blame] | 522 | auto ModuleLoader = [&M](StringRef Identifier) { |
| 523 | return loadFile(Identifier, M.getContext()); |
| 524 | }; |
Rafael Espindola | 9d2bfc4 | 2015-12-14 23:17:03 +0000 | [diff] [blame] | 525 | FunctionImporter Importer(*Index, ModuleLoader); |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 526 | return Importer.importFunctions(M, ImportList); |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 527 | } |
| 528 | }; |
Benjamin Kramer | fe2b541 | 2015-12-24 10:03:35 +0000 | [diff] [blame] | 529 | } // anonymous namespace |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 530 | |
| 531 | char FunctionImportPass::ID = 0; |
| 532 | INITIALIZE_PASS_BEGIN(FunctionImportPass, "function-import", |
| 533 | "Summary Based Function Import", false, false) |
| 534 | INITIALIZE_PASS_END(FunctionImportPass, "function-import", |
| 535 | "Summary Based Function Import", false, false) |
| 536 | |
| 537 | namespace llvm { |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 538 | Pass *createFunctionImportPass(const ModuleSummaryIndex *Index = nullptr) { |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 539 | return new FunctionImportPass(Index); |
| 540 | } |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 541 | } |