Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 1 | //===- FunctionImport.cpp - ThinLTO Summary-based Function Import ---------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file implements Function import based on summaries. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| 14 | #include "llvm/Transforms/IPO/FunctionImport.h" |
| 15 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 16 | #include "llvm/ADT/SmallVector.h" |
Teresa Johnson | d29478f | 2016-03-27 15:27:30 +0000 | [diff] [blame] | 17 | #include "llvm/ADT/Statistic.h" |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 18 | #include "llvm/ADT/StringSet.h" |
| 19 | #include "llvm/IR/AutoUpgrade.h" |
| 20 | #include "llvm/IR/DiagnosticPrinter.h" |
| 21 | #include "llvm/IR/IntrinsicInst.h" |
| 22 | #include "llvm/IR/Module.h" |
| 23 | #include "llvm/IRReader/IRReader.h" |
| 24 | #include "llvm/Linker/Linker.h" |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 25 | #include "llvm/Object/ModuleSummaryIndexObjectFile.h" |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 26 | #include "llvm/Support/CommandLine.h" |
| 27 | #include "llvm/Support/Debug.h" |
| 28 | #include "llvm/Support/SourceMgr.h" |
Teresa Johnson | 488a800 | 2016-02-10 18:11:31 +0000 | [diff] [blame] | 29 | #include "llvm/Transforms/Utils/FunctionImportUtils.h" |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 30 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 31 | #define DEBUG_TYPE "function-import" |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 32 | |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 33 | using namespace llvm; |
| 34 | |
Teresa Johnson | d29478f | 2016-03-27 15:27:30 +0000 | [diff] [blame] | 35 | STATISTIC(NumImported, "Number of functions imported"); |
| 36 | |
/// Limit on instruction count of imported functions.
///
/// This is the initial threshold that ComputeImportForModule() hands to
/// computeImportForFunction() for the functions defined in the module being
/// processed. Note that selectCallee() only rejects a candidate whose
/// instruction count is strictly greater than the threshold, so a function
/// with exactly N instructions still qualifies.
static cl::opt<unsigned> ImportInstrLimit(
    "import-instr-limit", cl::init(100), cl::Hidden, cl::value_desc("N"),
    cl::desc("Only import functions with less than N instructions"));

/// Scaling factor for the import threshold. ComputeImportForModule()
/// multiplies the threshold by this value each time it takes an imported
/// function off its worklist, before examining that function's own callees.
static cl::opt<float>
    ImportInstrFactor("import-instr-evolution-factor", cl::init(0.7),
                      cl::Hidden, cl::value_desc("x"),
                      cl::desc("As we import functions, multiply the "
                               "`import-instr-limit` threshold by this factor "
                               "before processing newly imported functions"));

/// When enabled, FunctionImporter::importFunctions() writes one line to
/// dbgs() for every global it is about to link into the destination module.
static cl::opt<bool> PrintImports("print-imports", cl::init(false), cl::Hidden,
                                  cl::desc("Print imported functions"));
| 51 | |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 52 | // Load lazily a module from \p FileName in \p Context. |
| 53 | static std::unique_ptr<Module> loadFile(const std::string &FileName, |
| 54 | LLVMContext &Context) { |
| 55 | SMDiagnostic Err; |
| 56 | DEBUG(dbgs() << "Loading '" << FileName << "'\n"); |
Teresa Johnson | 6cba37c | 2016-01-22 00:15:53 +0000 | [diff] [blame] | 57 | // Metadata isn't loaded until functions are imported, to minimize |
| 58 | // the memory overhead. |
Teresa Johnson | a1080ee | 2016-01-08 14:17:41 +0000 | [diff] [blame] | 59 | std::unique_ptr<Module> Result = |
| 60 | getLazyIRFileModule(FileName, Err, Context, |
| 61 | /* ShouldLazyLoadMetadata = */ true); |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 62 | if (!Result) { |
| 63 | Err.print("function-import", errs()); |
Mehdi Amini | d7ad221 | 2016-04-01 05:33:11 +0000 | [diff] [blame] | 64 | report_fatal_error("Abort"); |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 65 | } |
| 66 | |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 67 | return Result; |
| 68 | } |
| 69 | |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 70 | namespace { |
Mehdi Amini | 4064174 | 2016-02-10 23:31:45 +0000 | [diff] [blame] | 71 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 72 | /// Given a list of possible callee implementation for a call site, select one |
| 73 | /// that fits the \p Threshold. |
| 74 | /// |
| 75 | /// FIXME: select "best" instead of first that fits. But what is "best"? |
| 76 | /// - The smallest: more likely to be inlined. |
| 77 | /// - The one with the least outgoing edges (already well optimized). |
| 78 | /// - One from a module already being imported from in order to reduce the |
| 79 | /// number of source modules parsed/linked. |
| 80 | /// - One that has PGO data attached. |
| 81 | /// - [insert you fancy metric here] |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 82 | static const GlobalValueSummary * |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 83 | selectCallee(const GlobalValueInfoList &CalleeInfoList, unsigned Threshold) { |
| 84 | auto It = llvm::find_if( |
| 85 | CalleeInfoList, [&](const std::unique_ptr<GlobalValueInfo> &GlobInfo) { |
| 86 | assert(GlobInfo->summary() && |
| 87 | "We should not have a Global Info without summary"); |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 88 | auto *GVSummary = GlobInfo->summary(); |
| 89 | if (auto *AS = dyn_cast<AliasSummary>(GVSummary)) |
| 90 | GVSummary = &AS->getAliasee(); |
| 91 | auto *Summary = cast<FunctionSummary>(GVSummary); |
Mehdi Amini | 4064174 | 2016-02-10 23:31:45 +0000 | [diff] [blame] | 92 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 93 | if (GlobalValue::isWeakAnyLinkage(Summary->linkage())) |
| 94 | return false; |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 95 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 96 | if (Summary->instCount() > Threshold) |
| 97 | return false; |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 98 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 99 | return true; |
| 100 | }); |
| 101 | if (It == CalleeInfoList.end()) |
| 102 | return nullptr; |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 103 | |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 104 | return cast<GlobalValueSummary>((*It)->summary()); |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 105 | } |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 106 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 107 | /// Return the summary for the function \p GUID that fits the \p Threshold, or |
| 108 | /// null if there's no match. |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 109 | static const GlobalValueSummary *selectCallee(GlobalValue::GUID GUID, |
| 110 | unsigned Threshold, |
| 111 | const ModuleSummaryIndex &Index) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 112 | auto CalleeInfoList = Index.findGlobalValueInfoList(GUID); |
| 113 | if (CalleeInfoList == Index.end()) { |
| 114 | return nullptr; // This function does not have a summary |
| 115 | } |
| 116 | return selectCallee(CalleeInfoList->second, Threshold); |
| 117 | } |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 118 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 119 | /// Return true if the global \p GUID is exported by module \p ExportModulePath. |
| 120 | static bool isGlobalExported(const ModuleSummaryIndex &Index, |
Mehdi Amini | ad5741b | 2016-04-02 05:07:53 +0000 | [diff] [blame] | 121 | StringRef ExportModulePath, |
| 122 | GlobalValue::GUID GUID) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 123 | auto CalleeInfoList = Index.findGlobalValueInfoList(GUID); |
| 124 | if (CalleeInfoList == Index.end()) |
| 125 | // This global does not have a summary, it is not part of the ThinLTO |
| 126 | // process |
| 127 | return false; |
| 128 | auto DefinedInCalleeModule = llvm::find_if( |
| 129 | CalleeInfoList->second, |
| 130 | [&](const std::unique_ptr<GlobalValueInfo> &GlobInfo) { |
| 131 | auto *Summary = GlobInfo->summary(); |
| 132 | assert(Summary && "Unexpected GlobalValueInfo without summary"); |
| 133 | return Summary->modulePath() == ExportModulePath; |
| 134 | }); |
| 135 | return (DefinedInCalleeModule != CalleeInfoList->second.end()); |
| 136 | } |
Mehdi Amini | 4064174 | 2016-02-10 23:31:45 +0000 | [diff] [blame] | 137 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 138 | using EdgeInfo = std::pair<const FunctionSummary *, unsigned /* Threshold */>; |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 139 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 140 | /// Compute the list of functions to import for a given caller. Mark these |
| 141 | /// imported functions and the symbols they reference in their source module as |
| 142 | /// exported from their source module. |
| 143 | static void computeImportForFunction( |
Teresa Johnson | 3255eec | 2016-04-10 15:17:26 +0000 | [diff] [blame] | 144 | const FunctionSummary &Summary, const ModuleSummaryIndex &Index, |
| 145 | unsigned Threshold, |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 146 | const std::map<GlobalValue::GUID, GlobalValueSummary *> &DefinedGVSummaries, |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 147 | SmallVectorImpl<EdgeInfo> &Worklist, |
| 148 | FunctionImporter::ImportMapTy &ImportsForModule, |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 149 | StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 150 | for (auto &Edge : Summary.calls()) { |
Teresa Johnson | 2d5487c | 2016-04-11 13:58:45 +0000 | [diff] [blame] | 151 | auto GUID = Edge.first.getGUID(); |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 152 | DEBUG(dbgs() << " edge -> " << GUID << " Threshold:" << Threshold << "\n"); |
| 153 | |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 154 | if (DefinedGVSummaries.count(GUID)) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 155 | DEBUG(dbgs() << "ignored! Target already in destination module.\n"); |
| 156 | continue; |
Teresa Johnson | d450da3 | 2015-11-24 21:15:19 +0000 | [diff] [blame] | 157 | } |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 158 | |
| 159 | auto *CalleeSummary = selectCallee(GUID, Threshold, Index); |
| 160 | if (!CalleeSummary) { |
| 161 | DEBUG(dbgs() << "ignored! No qualifying callee with summary found.\n"); |
| 162 | continue; |
| 163 | } |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 164 | // "Resolve" the summary, traversing alias, |
| 165 | const FunctionSummary *ResolvedCalleeSummary; |
Mehdi Amini | 6968ef7 | 2016-04-20 01:04:20 +0000 | [diff] [blame^] | 166 | if (isa<AliasSummary>(CalleeSummary)) { |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 167 | ResolvedCalleeSummary = cast<FunctionSummary>( |
| 168 | &cast<AliasSummary>(CalleeSummary)->getAliasee()); |
Mehdi Amini | 6968ef7 | 2016-04-20 01:04:20 +0000 | [diff] [blame^] | 169 | if (!GlobalValue::isLinkOnceODRLinkage( |
| 170 | ResolvedCalleeSummary->linkage())) { |
| 171 | // Alias can't point to "available_externally". However when we import |
| 172 | // linkOnceODR the linkage does not change. So we import the alias |
| 173 | // and aliasee only in this case. |
| 174 | // FIXME: we should import alias as available_externally *function*, the |
| 175 | // destination module does need to know it is an alias. |
| 176 | DEBUG(dbgs() << "ignored! Aliasee is not linkonce_odr.\n"); |
| 177 | continue; |
| 178 | } |
| 179 | } else |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 180 | ResolvedCalleeSummary = cast<FunctionSummary>(CalleeSummary); |
| 181 | |
| 182 | assert(ResolvedCalleeSummary->instCount() <= Threshold && |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 183 | "selectCallee() didn't honor the threshold"); |
| 184 | |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 185 | auto ExportModulePath = ResolvedCalleeSummary->modulePath(); |
| 186 | auto &ProcessedThreshold = ImportsForModule[ExportModulePath][GUID]; |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 187 | /// Since the traversal of the call graph is DFS, we can revisit a function |
| 188 | /// a second time with a higher threshold. In this case, it is added back to |
| 189 | /// the worklist with the new threshold. |
| 190 | if (ProcessedThreshold && ProcessedThreshold > Threshold) { |
| 191 | DEBUG(dbgs() << "ignored! Target was already seen with Threshold " |
| 192 | << ProcessedThreshold << "\n"); |
| 193 | continue; |
| 194 | } |
| 195 | // Mark this function as imported in this module, with the current Threshold |
| 196 | ProcessedThreshold = Threshold; |
| 197 | |
| 198 | // Make exports in the source module. |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 199 | if (ExportLists) { |
Mehdi Amini | ef7555f | 2016-04-13 01:52:32 +0000 | [diff] [blame] | 200 | auto &ExportList = (*ExportLists)[ExportModulePath]; |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 201 | ExportList.insert(GUID); |
| 202 | // Mark all functions and globals referenced by this function as exported |
| 203 | // to the outside if they are defined in the same source module. |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 204 | for (auto &Edge : ResolvedCalleeSummary->calls()) { |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 205 | auto CalleeGUID = Edge.first.getGUID(); |
| 206 | if (isGlobalExported(Index, ExportModulePath, CalleeGUID)) |
| 207 | ExportList.insert(CalleeGUID); |
| 208 | } |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 209 | for (auto &Ref : ResolvedCalleeSummary->refs()) { |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 210 | auto GUID = Ref.getGUID(); |
| 211 | if (isGlobalExported(Index, ExportModulePath, GUID)) |
| 212 | ExportList.insert(GUID); |
| 213 | } |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 214 | } |
| 215 | |
| 216 | // Insert the newly imported function to the worklist. |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 217 | Worklist.push_back(std::make_pair(ResolvedCalleeSummary, Threshold)); |
Teresa Johnson | d450da3 | 2015-11-24 21:15:19 +0000 | [diff] [blame] | 218 | } |
| 219 | } |
| 220 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 221 | /// Given the list of globals defined in a module, compute the list of imports |
| 222 | /// as well as the list of "exports", i.e. the list of symbols referenced from |
| 223 | /// another module (that may require promotion). |
| 224 | static void ComputeImportForModule( |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 225 | const std::map<GlobalValue::GUID, GlobalValueSummary *> &DefinedGVSummaries, |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 226 | const ModuleSummaryIndex &Index, |
| 227 | FunctionImporter::ImportMapTy &ImportsForModule, |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 228 | StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 229 | // Worklist contains the list of function imported in this module, for which |
| 230 | // we will analyse the callees and may import further down the callgraph. |
| 231 | SmallVector<EdgeInfo, 128> Worklist; |
| 232 | |
| 233 | // Populate the worklist with the import for the functions in the current |
| 234 | // module |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 235 | for (auto &GVInfo : DefinedGVSummaries) { |
| 236 | auto *Summary = GVInfo.second; |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 237 | if (auto *AS = dyn_cast<AliasSummary>(Summary)) |
| 238 | Summary = &AS->getAliasee(); |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 239 | auto *FuncSummary = dyn_cast<FunctionSummary>(Summary); |
| 240 | if (!FuncSummary) |
| 241 | // Skip import for global variables |
| 242 | continue; |
| 243 | DEBUG(dbgs() << "Initalize import for " << GVInfo.first << "\n"); |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 244 | computeImportForFunction(*FuncSummary, Index, ImportInstrLimit, |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 245 | DefinedGVSummaries, Worklist, ImportsForModule, |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 246 | ExportLists); |
| 247 | } |
| 248 | |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 249 | while (!Worklist.empty()) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 250 | auto FuncInfo = Worklist.pop_back_val(); |
| 251 | auto *Summary = FuncInfo.first; |
| 252 | auto Threshold = FuncInfo.second; |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 253 | |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 254 | // Process the newly imported functions and add callees to the worklist. |
Mehdi Amini | 4064174 | 2016-02-10 23:31:45 +0000 | [diff] [blame] | 255 | // Adjust the threshold |
| 256 | Threshold = Threshold * ImportInstrFactor; |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 257 | |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 258 | computeImportForFunction(*Summary, Index, Threshold, DefinedGVSummaries, |
Teresa Johnson | 3255eec | 2016-04-10 15:17:26 +0000 | [diff] [blame] | 259 | Worklist, ImportsForModule, ExportLists); |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 260 | } |
Mehdi Amini | c8c5517 | 2015-12-03 02:37:33 +0000 | [diff] [blame] | 261 | } |
Mehdi Amini | ffe2e4a | 2015-12-02 04:34:28 +0000 | [diff] [blame] | 262 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 263 | } // anonymous namespace |
| 264 | |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 265 | /// Compute all the import and export for every module using the Index. |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 266 | void llvm::ComputeCrossModuleImport( |
| 267 | const ModuleSummaryIndex &Index, |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 268 | const StringMap<std::map<GlobalValue::GUID, GlobalValueSummary *>> & |
| 269 | ModuleToDefinedGVSummaries, |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 270 | StringMap<FunctionImporter::ImportMapTy> &ImportLists, |
| 271 | StringMap<FunctionImporter::ExportSetTy> &ExportLists) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 272 | // For each module that has function defined, compute the import/export lists. |
Mehdi Amini | 1aafabf | 2016-04-16 07:02:16 +0000 | [diff] [blame] | 273 | for (auto &DefinedGVSummaries : ModuleToDefinedGVSummaries) { |
| 274 | auto &ImportsForModule = ImportLists[DefinedGVSummaries.first()]; |
| 275 | DEBUG(dbgs() << "Computing import for Module '" |
| 276 | << DefinedGVSummaries.first() << "'\n"); |
| 277 | ComputeImportForModule(DefinedGVSummaries.second, Index, ImportsForModule, |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 278 | &ExportLists); |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 279 | } |
| 280 | |
| 281 | #ifndef NDEBUG |
| 282 | DEBUG(dbgs() << "Import/Export lists for " << ImportLists.size() |
| 283 | << " modules:\n"); |
| 284 | for (auto &ModuleImports : ImportLists) { |
| 285 | auto ModName = ModuleImports.first(); |
| 286 | auto &Exports = ExportLists[ModName]; |
| 287 | DEBUG(dbgs() << "* Module " << ModName << " exports " << Exports.size() |
| 288 | << " functions. Imports from " << ModuleImports.second.size() |
| 289 | << " modules.\n"); |
| 290 | for (auto &Src : ModuleImports.second) { |
| 291 | auto SrcModName = Src.first(); |
| 292 | DEBUG(dbgs() << " - " << Src.second.size() << " functions imported from " |
| 293 | << SrcModName << "\n"); |
| 294 | } |
| 295 | } |
| 296 | #endif |
| 297 | } |
| 298 | |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 299 | /// Compute all the imports for the given module in the Index. |
| 300 | void llvm::ComputeCrossModuleImportForModule( |
| 301 | StringRef ModulePath, const ModuleSummaryIndex &Index, |
| 302 | FunctionImporter::ImportMapTy &ImportList) { |
| 303 | |
| 304 | // Collect the list of functions this module defines. |
| 305 | // GUID -> Summary |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 306 | std::map<GlobalValue::GUID, GlobalValueSummary *> FunctionInfoMap; |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 307 | Index.collectDefinedFunctionsForModule(ModulePath, FunctionInfoMap); |
| 308 | |
| 309 | // Compute the import list for this module. |
| 310 | DEBUG(dbgs() << "Computing import for Module '" << ModulePath << "'\n"); |
| 311 | ComputeImportForModule(FunctionInfoMap, Index, ImportList); |
| 312 | |
| 313 | #ifndef NDEBUG |
| 314 | DEBUG(dbgs() << "* Module " << ModulePath << " imports from " |
| 315 | << ImportList.size() << " modules.\n"); |
| 316 | for (auto &Src : ImportList) { |
| 317 | auto SrcModName = Src.first(); |
| 318 | DEBUG(dbgs() << " - " << Src.second.size() << " functions imported from " |
| 319 | << SrcModName << "\n"); |
| 320 | } |
| 321 | #endif |
| 322 | } |
| 323 | |
Mehdi Amini | c8c5517 | 2015-12-03 02:37:33 +0000 | [diff] [blame] | 324 | // Automatically import functions in Module \p DestModule based on the summaries |
| 325 | // index. |
| 326 | // |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 327 | bool FunctionImporter::importFunctions( |
| 328 | Module &DestModule, const FunctionImporter::ImportMapTy &ImportList) { |
Mehdi Amini | 5411d05 | 2015-12-08 23:04:19 +0000 | [diff] [blame] | 329 | DEBUG(dbgs() << "Starting import for Module " |
Mehdi Amini | 311fef6 | 2015-12-03 02:58:14 +0000 | [diff] [blame] | 330 | << DestModule.getModuleIdentifier() << "\n"); |
Mehdi Amini | c8c5517 | 2015-12-03 02:37:33 +0000 | [diff] [blame] | 331 | unsigned ImportedCount = 0; |
| 332 | |
Mehdi Amini | c8c5517 | 2015-12-03 02:37:33 +0000 | [diff] [blame] | 333 | // Linker that will be used for importing function |
Rafael Espindola | 9d2bfc4 | 2015-12-14 23:17:03 +0000 | [diff] [blame] | 334 | Linker TheLinker(DestModule); |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 335 | // Do the actual import of functions now, one Module at a time |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 336 | std::set<StringRef> ModuleNameOrderedList; |
| 337 | for (auto &FunctionsToImportPerModule : ImportList) { |
| 338 | ModuleNameOrderedList.insert(FunctionsToImportPerModule.first()); |
| 339 | } |
| 340 | for (auto &Name : ModuleNameOrderedList) { |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 341 | // Get the module for the import |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 342 | const auto &FunctionsToImportPerModule = ImportList.find(Name); |
| 343 | assert(FunctionsToImportPerModule != ImportList.end()); |
| 344 | std::unique_ptr<Module> SrcModule = ModuleLoader(Name); |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 345 | assert(&DestModule.getContext() == &SrcModule->getContext() && |
| 346 | "Context mismatch"); |
| 347 | |
Teresa Johnson | 6cba37c | 2016-01-22 00:15:53 +0000 | [diff] [blame] | 348 | // If modules were created with lazy metadata loading, materialize it |
| 349 | // now, before linking it (otherwise this will be a noop). |
| 350 | SrcModule->materializeMetadata(); |
| 351 | UpgradeDebugInfo(*SrcModule); |
Teresa Johnson | e5a6191 | 2015-12-17 17:14:09 +0000 | [diff] [blame] | 352 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 353 | auto &ImportGUIDs = FunctionsToImportPerModule->second; |
| 354 | // Find the globals to import |
| 355 | DenseSet<const GlobalValue *> GlobalsToImport; |
| 356 | for (auto &GV : *SrcModule) { |
Teresa Johnson | 0beb858 | 2016-04-04 18:52:23 +0000 | [diff] [blame] | 357 | if (!GV.hasName()) |
| 358 | continue; |
| 359 | auto GUID = GV.getGUID(); |
| 360 | auto Import = ImportGUIDs.count(GUID); |
Mehdi Amini | aeb1e59 | 2016-04-19 09:21:30 +0000 | [diff] [blame] | 361 | DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing function " << GUID |
| 362 | << " " << GV.getName() << " from " |
| 363 | << SrcModule->getSourceFileName() << "\n"); |
Teresa Johnson | 0beb858 | 2016-04-04 18:52:23 +0000 | [diff] [blame] | 364 | if (Import) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 365 | GV.materialize(); |
| 366 | GlobalsToImport.insert(&GV); |
| 367 | } |
| 368 | } |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 369 | for (auto &GV : SrcModule->globals()) { |
| 370 | if (!GV.hasName()) |
| 371 | continue; |
| 372 | auto GUID = GV.getGUID(); |
| 373 | auto Import = ImportGUIDs.count(GUID); |
Mehdi Amini | aeb1e59 | 2016-04-19 09:21:30 +0000 | [diff] [blame] | 374 | DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing global " << GUID |
| 375 | << " " << GV.getName() << " from " |
| 376 | << SrcModule->getSourceFileName() << "\n"); |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 377 | if (Import) { |
| 378 | GV.materialize(); |
| 379 | GlobalsToImport.insert(&GV); |
| 380 | } |
| 381 | } |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 382 | for (auto &GV : SrcModule->aliases()) { |
| 383 | if (!GV.hasName()) |
| 384 | continue; |
| 385 | auto GUID = GV.getGUID(); |
Teresa Johnson | 0beb858 | 2016-04-04 18:52:23 +0000 | [diff] [blame] | 386 | auto Import = ImportGUIDs.count(GUID); |
Mehdi Amini | aeb1e59 | 2016-04-19 09:21:30 +0000 | [diff] [blame] | 387 | DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing alias " << GUID |
| 388 | << " " << GV.getName() << " from " |
| 389 | << SrcModule->getSourceFileName() << "\n"); |
Teresa Johnson | 0beb858 | 2016-04-04 18:52:23 +0000 | [diff] [blame] | 390 | if (Import) { |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 391 | // Alias can't point to "available_externally". However when we import |
Teresa Johnson | 9aae395 | 2016-03-27 15:01:11 +0000 | [diff] [blame] | 392 | // linkOnceODR the linkage does not change. So we import the alias |
Mehdi Amini | 6968ef7 | 2016-04-20 01:04:20 +0000 | [diff] [blame^] | 393 | // and aliasee only in this case. This has been handled by |
| 394 | // computeImportForFunction() |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 395 | GlobalObject *GO = GV.getBaseObject(); |
Mehdi Amini | 6968ef7 | 2016-04-20 01:04:20 +0000 | [diff] [blame^] | 396 | assert(GO->hasLinkOnceODRLinkage() && |
| 397 | "Unexpected alias to a non-linkonceODR in import list"); |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 398 | #ifndef NDEBUG |
| 399 | if (!GlobalsToImport.count(GO)) |
| 400 | DEBUG(dbgs() << " alias triggers importing aliasee " << GO->getGUID() |
| 401 | << " " << GO->getName() << " from " |
| 402 | << SrcModule->getSourceFileName() << "\n"); |
| 403 | #endif |
| 404 | GO->materialize(); |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 405 | GlobalsToImport.insert(GO); |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 406 | GV.materialize(); |
| 407 | GlobalsToImport.insert(&GV); |
| 408 | } |
| 409 | } |
| 410 | |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 411 | // Link in the specified functions. |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 412 | if (renameModuleForThinLTO(*SrcModule, Index, &GlobalsToImport)) |
Mehdi Amini | 8d05185 | 2016-03-19 00:40:31 +0000 | [diff] [blame] | 413 | return true; |
| 414 | |
Teresa Johnson | d29478f | 2016-03-27 15:27:30 +0000 | [diff] [blame] | 415 | if (PrintImports) { |
| 416 | for (const auto *GV : GlobalsToImport) |
| 417 | dbgs() << DestModule.getSourceFileName() << ": Import " << GV->getName() |
| 418 | << " from " << SrcModule->getSourceFileName() << "\n"; |
| 419 | } |
| 420 | |
Rafael Espindola | 434e956 | 2015-12-16 23:16:33 +0000 | [diff] [blame] | 421 | if (TheLinker.linkInModule(std::move(SrcModule), Linker::Flags::None, |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 422 | &GlobalsToImport)) |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 423 | report_fatal_error("Function Import: link error"); |
| 424 | |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 425 | ImportedCount += GlobalsToImport.size(); |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 426 | } |
Teresa Johnson | e5a6191 | 2015-12-17 17:14:09 +0000 | [diff] [blame] | 427 | |
Teresa Johnson | d29478f | 2016-03-27 15:27:30 +0000 | [diff] [blame] | 428 | NumImported += ImportedCount; |
| 429 | |
Mehdi Amini | 7e88d0d | 2015-12-09 08:17:35 +0000 | [diff] [blame] | 430 | DEBUG(dbgs() << "Imported " << ImportedCount << " functions for Module " |
Mehdi Amini | c8c5517 | 2015-12-03 02:37:33 +0000 | [diff] [blame] | 431 | << DestModule.getModuleIdentifier() << "\n"); |
| 432 | return ImportedCount; |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 433 | } |
| 434 | |
/// Summary file to use for function importing when using -function-import from
/// the command line.
///
/// FunctionImportPass checks this option when it was not constructed with an
/// in-memory index; one of the two has to be provided.
static cl::opt<std::string>
    SummaryFile("summary-file",
                cl::desc("The summary file to use for function importing."));
| 440 | |
| 441 | static void diagnosticHandler(const DiagnosticInfo &DI) { |
| 442 | raw_ostream &OS = errs(); |
| 443 | DiagnosticPrinterRawOStream DP(OS); |
| 444 | DI.print(DP); |
| 445 | OS << '\n'; |
| 446 | } |
| 447 | |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 448 | /// Parse the summary index out of an IR file and return the summary |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 449 | /// index object if found, or nullptr if not. |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 450 | static std::unique_ptr<ModuleSummaryIndex> |
| 451 | getModuleSummaryIndexForFile(StringRef Path, std::string &Error, |
| 452 | DiagnosticHandlerFunction DiagnosticHandler) { |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 453 | std::unique_ptr<MemoryBuffer> Buffer; |
| 454 | ErrorOr<std::unique_ptr<MemoryBuffer>> BufferOrErr = |
| 455 | MemoryBuffer::getFile(Path); |
| 456 | if (std::error_code EC = BufferOrErr.getError()) { |
| 457 | Error = EC.message(); |
| 458 | return nullptr; |
| 459 | } |
| 460 | Buffer = std::move(BufferOrErr.get()); |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 461 | ErrorOr<std::unique_ptr<object::ModuleSummaryIndexObjectFile>> ObjOrErr = |
| 462 | object::ModuleSummaryIndexObjectFile::create(Buffer->getMemBufferRef(), |
| 463 | DiagnosticHandler); |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 464 | if (std::error_code EC = ObjOrErr.getError()) { |
| 465 | Error = EC.message(); |
| 466 | return nullptr; |
| 467 | } |
| 468 | return (*ObjOrErr)->takeIndex(); |
| 469 | } |
| 470 | |
Benjamin Kramer | fe2b541 | 2015-12-24 10:03:35 +0000 | [diff] [blame] | 471 | namespace { |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 472 | /// Pass that performs cross-module function import provided a summary file. |
| 473 | class FunctionImportPass : public ModulePass { |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 474 | /// Optional module summary index to use for importing, otherwise |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 475 | /// the summary-file option must be specified. |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 476 | const ModuleSummaryIndex *Index; |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 477 | |
| 478 | public: |
| 479 | /// Pass identification, replacement for typeid |
| 480 | static char ID; |
| 481 | |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 482 | /// Specify pass name for debug output |
Mehdi Amini | 2d28f7a | 2016-04-16 06:56:44 +0000 | [diff] [blame] | 483 | const char *getPassName() const override { return "Function Importing"; } |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 484 | |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 485 | explicit FunctionImportPass(const ModuleSummaryIndex *Index = nullptr) |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 486 | : ModulePass(ID), Index(Index) {} |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 487 | |
| 488 | bool runOnModule(Module &M) override { |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 489 | if (SummaryFile.empty() && !Index) |
| 490 | report_fatal_error("error: -function-import requires -summary-file or " |
| 491 | "file from frontend\n"); |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 492 | std::unique_ptr<ModuleSummaryIndex> IndexPtr; |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 493 | if (!SummaryFile.empty()) { |
| 494 | if (Index) |
| 495 | report_fatal_error("error: -summary-file and index from frontend\n"); |
| 496 | std::string Error; |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 497 | IndexPtr = |
| 498 | getModuleSummaryIndexForFile(SummaryFile, Error, diagnosticHandler); |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 499 | if (!IndexPtr) { |
| 500 | errs() << "Error loading file '" << SummaryFile << "': " << Error |
| 501 | << "\n"; |
| 502 | return false; |
| 503 | } |
| 504 | Index = IndexPtr.get(); |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 505 | } |
| 506 | |
Teresa Johnson | c86af33 | 2016-04-12 21:13:11 +0000 | [diff] [blame] | 507 | // First step is collecting the import list. |
| 508 | FunctionImporter::ImportMapTy ImportList; |
| 509 | ComputeCrossModuleImportForModule(M.getModuleIdentifier(), *Index, |
| 510 | ImportList); |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 511 | |
| 512 | // Next we need to promote to global scope and rename any local values that |
Teresa Johnson | 1b00f2d | 2016-01-08 17:06:29 +0000 | [diff] [blame] | 513 | // are potentially exported to other modules. |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 514 | if (renameModuleForThinLTO(M, *Index, nullptr)) { |
Teresa Johnson | 1b00f2d | 2016-01-08 17:06:29 +0000 | [diff] [blame] | 515 | errs() << "Error renaming module\n"; |
| 516 | return false; |
| 517 | } |
| 518 | |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 519 | // Perform the import now. |
Mehdi Amini | d16c806 | 2015-12-08 22:39:40 +0000 | [diff] [blame] | 520 | auto ModuleLoader = [&M](StringRef Identifier) { |
| 521 | return loadFile(Identifier, M.getContext()); |
| 522 | }; |
Rafael Espindola | 9d2bfc4 | 2015-12-14 23:17:03 +0000 | [diff] [blame] | 523 | FunctionImporter Importer(*Index, ModuleLoader); |
Mehdi Amini | 01e3213 | 2016-03-26 05:40:34 +0000 | [diff] [blame] | 524 | return Importer.importFunctions(M, ImportList); |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 525 | } |
| 526 | }; |
Benjamin Kramer | fe2b541 | 2015-12-24 10:03:35 +0000 | [diff] [blame] | 527 | } // anonymous namespace |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 528 | |
| 529 | char FunctionImportPass::ID = 0; |
| 530 | INITIALIZE_PASS_BEGIN(FunctionImportPass, "function-import", |
| 531 | "Summary Based Function Import", false, false) |
| 532 | INITIALIZE_PASS_END(FunctionImportPass, "function-import", |
| 533 | "Summary Based Function Import", false, false) |
| 534 | |
| 535 | namespace llvm { |
Teresa Johnson | 26ab577 | 2016-03-15 00:04:37 +0000 | [diff] [blame] | 536 | Pass *createFunctionImportPass(const ModuleSummaryIndex *Index = nullptr) { |
Teresa Johnson | 5fcbdb7 | 2015-12-07 19:21:11 +0000 | [diff] [blame] | 537 | return new FunctionImportPass(Index); |
| 538 | } |
Mehdi Amini | 42418ab | 2015-11-24 06:07:49 +0000 | [diff] [blame] | 539 | } |