Misha Brukman | de03bc0 | 2005-04-24 17:36:05 +0000 | [diff] [blame] | 1 | //===- llvm-extract.cpp - LLVM function extraction utility ----------------===// |
Misha Brukman | 3da94ae | 2005-04-22 00:00:37 +0000 | [diff] [blame] | 2 | // |
John Criswell | 7c0e022 | 2003-10-20 17:47:21 +0000 | [diff] [blame] | 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
Chris Lattner | 21c62da | 2007-12-29 20:44:31 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
Misha Brukman | 3da94ae | 2005-04-22 00:00:37 +0000 | [diff] [blame] | 7 | // |
John Criswell | 7c0e022 | 2003-10-20 17:47:21 +0000 | [diff] [blame] | 8 | //===----------------------------------------------------------------------===// |
Chris Lattner | 579d914 | 2002-05-22 20:27:00 +0000 | [diff] [blame] | 9 | // |
// This utility changes the input module to only contain the selected
// functions, global variables and aliases (or, with -delete, to contain
// everything except them). It is primarily used for debugging transformations.
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
Chandler Carruth | 0b8c9a8 | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 15 | #include "llvm/IR/LLVMContext.h" |
Chandler Carruth | f010c46 | 2012-12-04 10:44:52 +0000 | [diff] [blame] | 16 | #include "llvm/ADT/SetVector.h" |
| 17 | #include "llvm/ADT/SmallPtrSet.h" |
Dan Gohman | ec08046 | 2009-09-11 20:46:33 +0000 | [diff] [blame] | 18 | #include "llvm/Assembly/PrintModulePass.h" |
Chris Lattner | c48e1db | 2007-05-06 05:13:17 +0000 | [diff] [blame] | 19 | #include "llvm/Bitcode/ReaderWriter.h" |
Chandler Carruth | 0b8c9a8 | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 20 | #include "llvm/IR/DataLayout.h" |
| 21 | #include "llvm/IR/Module.h" |
Chandler Carruth | 7fc162f | 2013-03-26 02:25:37 +0000 | [diff] [blame] | 22 | #include "llvm/IRReader/IRReader.h" |
Chandler Carruth | f010c46 | 2012-12-04 10:44:52 +0000 | [diff] [blame] | 23 | #include "llvm/PassManager.h" |
Reid Spencer | 551ccae | 2004-09-01 22:55:40 +0000 | [diff] [blame] | 24 | #include "llvm/Support/CommandLine.h" |
Chris Lattner | c30598b | 2006-12-06 01:18:01 +0000 | [diff] [blame] | 25 | #include "llvm/Support/ManagedStatic.h" |
Chris Lattner | cc14d25 | 2009-03-06 05:34:10 +0000 | [diff] [blame] | 26 | #include "llvm/Support/PrettyStackTrace.h" |
Chad Rosier | 4e0a55d | 2011-09-16 21:09:17 +0000 | [diff] [blame] | 27 | #include "llvm/Support/Regex.h" |
Chandler Carruth | f010c46 | 2012-12-04 10:44:52 +0000 | [diff] [blame] | 28 | #include "llvm/Support/Signals.h" |
Chandler Carruth | 7fc162f | 2013-03-26 02:25:37 +0000 | [diff] [blame] | 29 | #include "llvm/Support/SourceMgr.h" |
Chandler Carruth | f010c46 | 2012-12-04 10:44:52 +0000 | [diff] [blame] | 30 | #include "llvm/Support/SystemUtils.h" |
| 31 | #include "llvm/Support/ToolOutputFile.h" |
| 32 | #include "llvm/Transforms/IPO.h" |
Chris Lattner | 579d914 | 2002-05-22 20:27:00 +0000 | [diff] [blame] | 33 | #include <memory> |
Brian Gaeke | d0fde30 | 2003-11-11 22:41:34 +0000 | [diff] [blame] | 34 | using namespace llvm; |
| 35 | |
Chris Lattner | 5ff62e9 | 2002-07-22 02:10:13 +0000 | [diff] [blame] | 36 | // InputFilename - The filename to read from. |
Chris Lattner | c7a0985 | 2002-07-25 16:31:09 +0000 | [diff] [blame] | 37 | static cl::opt<std::string> |
Gabor Greif | a99be51 | 2007-07-05 17:07:56 +0000 | [diff] [blame] | 38 | InputFilename(cl::Positional, cl::desc("<input bitcode file>"), |
Chris Lattner | 5ff62e9 | 2002-07-22 02:10:13 +0000 | [diff] [blame] | 39 | cl::init("-"), cl::value_desc("filename")); |
Misha Brukman | 3da94ae | 2005-04-22 00:00:37 +0000 | [diff] [blame] | 40 | |
Chris Lattner | ba9cc1f | 2004-02-18 16:53:59 +0000 | [diff] [blame] | 41 | static cl::opt<std::string> |
Misha Brukman | 3da94ae | 2005-04-22 00:00:37 +0000 | [diff] [blame] | 42 | OutputFilename("o", cl::desc("Specify output filename"), |
Chris Lattner | ba9cc1f | 2004-02-18 16:53:59 +0000 | [diff] [blame] | 43 | cl::value_desc("filename"), cl::init("-")); |
| 44 | |
| 45 | static cl::opt<bool> |
Dan Gohman | baa2639 | 2009-08-25 15:34:52 +0000 | [diff] [blame] | 46 | Force("f", cl::desc("Enable binary output on terminals")); |
Chris Lattner | 5ff62e9 | 2002-07-22 02:10:13 +0000 | [diff] [blame] | 47 | |
Misha Brukman | ca718e4 | 2004-04-22 23:07:39 +0000 | [diff] [blame] | 48 | static cl::opt<bool> |
Andrew Lenharth | d245a8a | 2008-03-07 19:51:57 +0000 | [diff] [blame] | 49 | DeleteFn("delete", cl::desc("Delete specified Globals from Module")); |
Misha Brukman | ca718e4 | 2004-04-22 23:07:39 +0000 | [diff] [blame] | 50 | |
Chad Rosier | 4e0a55d | 2011-09-16 21:09:17 +0000 | [diff] [blame] | 51 | // ExtractFuncs - The functions to extract from the module. |
Dan Gohman | a499d20 | 2010-02-10 23:58:53 +0000 | [diff] [blame] | 52 | static cl::list<std::string> |
| 53 | ExtractFuncs("func", cl::desc("Specify function to extract"), |
| 54 | cl::ZeroOrMore, cl::value_desc("function")); |
Chris Lattner | 5ff62e9 | 2002-07-22 02:10:13 +0000 | [diff] [blame] | 55 | |
Chad Rosier | 4e0a55d | 2011-09-16 21:09:17 +0000 | [diff] [blame] | 56 | // ExtractRegExpFuncs - The functions, matched via regular expression, to |
| 57 | // extract from the module. |
| 58 | static cl::list<std::string> |
| 59 | ExtractRegExpFuncs("rfunc", cl::desc("Specify function(s) to extract using a " |
| 60 | "regular expression"), |
| 61 | cl::ZeroOrMore, cl::value_desc("rfunction")); |
| 62 | |
Rafael Espindola | ca88cee | 2012-10-29 02:23:07 +0000 | [diff] [blame] | 63 | // ExtractAlias - The alias to extract from the module. |
| 64 | static cl::list<std::string> |
| 65 | ExtractAliases("alias", cl::desc("Specify alias to extract"), |
| 66 | cl::ZeroOrMore, cl::value_desc("alias")); |
| 67 | |
| 68 | |
| 69 | // ExtractRegExpAliases - The aliases, matched via regular expression, to |
| 70 | // extract from the module. |
| 71 | static cl::list<std::string> |
| 72 | ExtractRegExpAliases("ralias", cl::desc("Specify alias(es) to extract using a " |
| 73 | "regular expression"), |
| 74 | cl::ZeroOrMore, cl::value_desc("ralias")); |
| 75 | |
Chad Rosier | 4e0a55d | 2011-09-16 21:09:17 +0000 | [diff] [blame] | 76 | // ExtractGlobals - The globals to extract from the module. |
Dan Gohman | a499d20 | 2010-02-10 23:58:53 +0000 | [diff] [blame] | 77 | static cl::list<std::string> |
| 78 | ExtractGlobals("glob", cl::desc("Specify global to extract"), |
| 79 | cl::ZeroOrMore, cl::value_desc("global")); |
Andrew Lenharth | d245a8a | 2008-03-07 19:51:57 +0000 | [diff] [blame] | 80 | |
Chad Rosier | 4e0a55d | 2011-09-16 21:09:17 +0000 | [diff] [blame] | 81 | // ExtractRegExpGlobals - The globals, matched via regular expression, to |
| 82 | // extract from the module... |
| 83 | static cl::list<std::string> |
| 84 | ExtractRegExpGlobals("rglob", cl::desc("Specify global(s) to extract using a " |
| 85 | "regular expression"), |
| 86 | cl::ZeroOrMore, cl::value_desc("rglobal")); |
| 87 | |
Dan Gohman | ec08046 | 2009-09-11 20:46:33 +0000 | [diff] [blame] | 88 | static cl::opt<bool> |
| 89 | OutputAssembly("S", |
| 90 | cl::desc("Write output as LLVM assembly"), cl::Hidden); |
| 91 | |
Chris Lattner | 579d914 | 2002-05-22 20:27:00 +0000 | [diff] [blame] | 92 | int main(int argc, char **argv) { |
Chris Lattner | cc14d25 | 2009-03-06 05:34:10 +0000 | [diff] [blame] | 93 | // Print a stack trace if we signal out. |
Chris Lattner | c48e1db | 2007-05-06 05:13:17 +0000 | [diff] [blame] | 94 | sys::PrintStackTraceOnErrorSignal(); |
Chris Lattner | cc14d25 | 2009-03-06 05:34:10 +0000 | [diff] [blame] | 95 | PrettyStackTraceProgram X(argc, argv); |
Owen Anderson | 8b477ed | 2009-07-01 16:58:40 +0000 | [diff] [blame] | 96 | |
Owen Anderson | 0d7c695 | 2009-07-15 22:16:10 +0000 | [diff] [blame] | 97 | LLVMContext &Context = getGlobalContext(); |
Chris Lattner | cc14d25 | 2009-03-06 05:34:10 +0000 | [diff] [blame] | 98 | llvm_shutdown_obj Y; // Call llvm_shutdown() on exit. |
| 99 | cl::ParseCommandLineOptions(argc, argv, "llvm extractor\n"); |
Chris Lattner | 579d914 | 2002-05-22 20:27:00 +0000 | [diff] [blame] | 100 | |
Dan Gohman | 44f9533 | 2010-08-25 23:33:07 +0000 | [diff] [blame] | 101 | // Use lazy loading, since we only care about selected global values. |
Dan Gohman | ec08046 | 2009-09-11 20:46:33 +0000 | [diff] [blame] | 102 | SMDiagnostic Err; |
Andy Gibbs | 200241e | 2013-04-12 10:56:28 +0000 | [diff] [blame] | 103 | OwningPtr<Module> M; |
Dan Gohman | 44f9533 | 2010-08-25 23:33:07 +0000 | [diff] [blame] | 104 | M.reset(getLazyIRFileModule(InputFilename, Err, Context)); |
Dan Gohman | ec08046 | 2009-09-11 20:46:33 +0000 | [diff] [blame] | 105 | |
Chris Lattner | c48e1db | 2007-05-06 05:13:17 +0000 | [diff] [blame] | 106 | if (M.get() == 0) { |
Chris Lattner | d8b7aa2 | 2011-10-16 04:47:35 +0000 | [diff] [blame] | 107 | Err.print(argv[0], errs()); |
Chris Lattner | c48e1db | 2007-05-06 05:13:17 +0000 | [diff] [blame] | 108 | return 1; |
| 109 | } |
| 110 | |
Chad Rosier | 4e0a55d | 2011-09-16 21:09:17 +0000 | [diff] [blame] | 111 | // Use SetVector to avoid duplicates. |
| 112 | SetVector<GlobalValue *> GVs; |
Andrew Lenharth | d245a8a | 2008-03-07 19:51:57 +0000 | [diff] [blame] | 113 | |
Rafael Espindola | ca88cee | 2012-10-29 02:23:07 +0000 | [diff] [blame] | 114 | // Figure out which aliases we should extract. |
| 115 | for (size_t i = 0, e = ExtractAliases.size(); i != e; ++i) { |
| 116 | GlobalAlias *GA = M->getNamedAlias(ExtractAliases[i]); |
| 117 | if (!GA) { |
| 118 | errs() << argv[0] << ": program doesn't contain alias named '" |
| 119 | << ExtractAliases[i] << "'!\n"; |
| 120 | return 1; |
| 121 | } |
| 122 | GVs.insert(GA); |
| 123 | } |
| 124 | |
| 125 | // Extract aliases via regular expression matching. |
| 126 | for (size_t i = 0, e = ExtractRegExpAliases.size(); i != e; ++i) { |
| 127 | std::string Error; |
| 128 | Regex RegEx(ExtractRegExpAliases[i]); |
| 129 | if (!RegEx.isValid(Error)) { |
| 130 | errs() << argv[0] << ": '" << ExtractRegExpAliases[i] << "' " |
| 131 | "invalid regex: " << Error; |
| 132 | } |
| 133 | bool match = false; |
| 134 | for (Module::alias_iterator GA = M->alias_begin(), E = M->alias_end(); |
| 135 | GA != E; GA++) { |
| 136 | if (RegEx.match(GA->getName())) { |
| 137 | GVs.insert(&*GA); |
| 138 | match = true; |
| 139 | } |
| 140 | } |
| 141 | if (!match) { |
| 142 | errs() << argv[0] << ": program doesn't contain global named '" |
| 143 | << ExtractRegExpAliases[i] << "'!\n"; |
| 144 | return 1; |
| 145 | } |
| 146 | } |
| 147 | |
Dan Gohman | a499d20 | 2010-02-10 23:58:53 +0000 | [diff] [blame] | 148 | // Figure out which globals we should extract. |
| 149 | for (size_t i = 0, e = ExtractGlobals.size(); i != e; ++i) { |
Nick Lewycky | db186c4 | 2011-12-30 19:17:23 +0000 | [diff] [blame] | 150 | GlobalValue *GV = M->getNamedGlobal(ExtractGlobals[i]); |
Dan Gohman | a499d20 | 2010-02-10 23:58:53 +0000 | [diff] [blame] | 151 | if (!GV) { |
| 152 | errs() << argv[0] << ": program doesn't contain global named '" |
| 153 | << ExtractGlobals[i] << "'!\n"; |
| 154 | return 1; |
| 155 | } |
Chad Rosier | 4e0a55d | 2011-09-16 21:09:17 +0000 | [diff] [blame] | 156 | GVs.insert(GV); |
| 157 | } |
| 158 | |
| 159 | // Extract globals via regular expression matching. |
| 160 | for (size_t i = 0, e = ExtractRegExpGlobals.size(); i != e; ++i) { |
| 161 | std::string Error; |
| 162 | Regex RegEx(ExtractRegExpGlobals[i]); |
| 163 | if (!RegEx.isValid(Error)) { |
| 164 | errs() << argv[0] << ": '" << ExtractRegExpGlobals[i] << "' " |
| 165 | "invalid regex: " << Error; |
| 166 | } |
| 167 | bool match = false; |
Nick Lewycky | db186c4 | 2011-12-30 19:17:23 +0000 | [diff] [blame] | 168 | for (Module::global_iterator GV = M->global_begin(), |
| 169 | E = M->global_end(); GV != E; GV++) { |
Chad Rosier | 4e0a55d | 2011-09-16 21:09:17 +0000 | [diff] [blame] | 170 | if (RegEx.match(GV->getName())) { |
| 171 | GVs.insert(&*GV); |
| 172 | match = true; |
| 173 | } |
| 174 | } |
| 175 | if (!match) { |
| 176 | errs() << argv[0] << ": program doesn't contain global named '" |
| 177 | << ExtractRegExpGlobals[i] << "'!\n"; |
| 178 | return 1; |
| 179 | } |
Dan Gohman | a499d20 | 2010-02-10 23:58:53 +0000 | [diff] [blame] | 180 | } |
Andrew Lenharth | d245a8a | 2008-03-07 19:51:57 +0000 | [diff] [blame] | 181 | |
Dan Gohman | a499d20 | 2010-02-10 23:58:53 +0000 | [diff] [blame] | 182 | // Figure out which functions we should extract. |
| 183 | for (size_t i = 0, e = ExtractFuncs.size(); i != e; ++i) { |
Nick Lewycky | db186c4 | 2011-12-30 19:17:23 +0000 | [diff] [blame] | 184 | GlobalValue *GV = M->getFunction(ExtractFuncs[i]); |
Dan Gohman | a499d20 | 2010-02-10 23:58:53 +0000 | [diff] [blame] | 185 | if (!GV) { |
| 186 | errs() << argv[0] << ": program doesn't contain function named '" |
| 187 | << ExtractFuncs[i] << "'!\n"; |
| 188 | return 1; |
| 189 | } |
Chad Rosier | 4e0a55d | 2011-09-16 21:09:17 +0000 | [diff] [blame] | 190 | GVs.insert(GV); |
| 191 | } |
| 192 | // Extract functions via regular expression matching. |
| 193 | for (size_t i = 0, e = ExtractRegExpFuncs.size(); i != e; ++i) { |
| 194 | std::string Error; |
| 195 | StringRef RegExStr = ExtractRegExpFuncs[i]; |
| 196 | Regex RegEx(RegExStr); |
| 197 | if (!RegEx.isValid(Error)) { |
| 198 | errs() << argv[0] << ": '" << ExtractRegExpFuncs[i] << "' " |
| 199 | "invalid regex: " << Error; |
| 200 | } |
| 201 | bool match = false; |
Nick Lewycky | db186c4 | 2011-12-30 19:17:23 +0000 | [diff] [blame] | 202 | for (Module::iterator F = M->begin(), E = M->end(); F != E; |
Chad Rosier | 4e0a55d | 2011-09-16 21:09:17 +0000 | [diff] [blame] | 203 | F++) { |
| 204 | if (RegEx.match(F->getName())) { |
| 205 | GVs.insert(&*F); |
| 206 | match = true; |
| 207 | } |
| 208 | } |
| 209 | if (!match) { |
| 210 | errs() << argv[0] << ": program doesn't contain global named '" |
| 211 | << ExtractRegExpFuncs[i] << "'!\n"; |
| 212 | return 1; |
| 213 | } |
Chris Lattner | c48e1db | 2007-05-06 05:13:17 +0000 | [diff] [blame] | 214 | } |
| 215 | |
Dan Gohman | 44f9533 | 2010-08-25 23:33:07 +0000 | [diff] [blame] | 216 | // Materialize requisite global values. |
Dan Gohman | be2d4e7 | 2010-09-23 00:33:13 +0000 | [diff] [blame] | 217 | if (!DeleteFn) |
| 218 | for (size_t i = 0, e = GVs.size(); i != e; ++i) { |
| 219 | GlobalValue *GV = GVs[i]; |
| 220 | if (GV->isMaterializable()) { |
| 221 | std::string ErrInfo; |
| 222 | if (GV->Materialize(&ErrInfo)) { |
| 223 | errs() << argv[0] << ": error reading input: " << ErrInfo << "\n"; |
| 224 | return 1; |
| 225 | } |
| 226 | } |
| 227 | } |
| 228 | else { |
| 229 | // Deleting. Materialize every GV that's *not* in GVs. |
| 230 | SmallPtrSet<GlobalValue *, 8> GVSet(GVs.begin(), GVs.end()); |
| 231 | for (Module::global_iterator I = M->global_begin(), E = M->global_end(); |
| 232 | I != E; ++I) { |
| 233 | GlobalVariable *G = I; |
| 234 | if (!GVSet.count(G) && G->isMaterializable()) { |
| 235 | std::string ErrInfo; |
| 236 | if (G->Materialize(&ErrInfo)) { |
| 237 | errs() << argv[0] << ": error reading input: " << ErrInfo << "\n"; |
| 238 | return 1; |
| 239 | } |
| 240 | } |
| 241 | } |
| 242 | for (Module::iterator I = M->begin(), E = M->end(); I != E; ++I) { |
| 243 | Function *F = I; |
| 244 | if (!GVSet.count(F) && F->isMaterializable()) { |
| 245 | std::string ErrInfo; |
| 246 | if (F->Materialize(&ErrInfo)) { |
| 247 | errs() << argv[0] << ": error reading input: " << ErrInfo << "\n"; |
| 248 | return 1; |
| 249 | } |
Dan Gohman | 44f9533 | 2010-08-25 23:33:07 +0000 | [diff] [blame] | 250 | } |
| 251 | } |
| 252 | } |
| 253 | |
Chris Lattner | c48e1db | 2007-05-06 05:13:17 +0000 | [diff] [blame] | 254 | // In addition to deleting all other functions, we also want to spiff it |
| 255 | // up a little bit. Do this now. |
| 256 | PassManager Passes; |
Micah Villmow | 791cfc2 | 2012-10-08 16:39:34 +0000 | [diff] [blame] | 257 | Passes.add(new DataLayout(M.get())); // Use correct DataLayout |
Andrew Lenharth | d245a8a | 2008-03-07 19:51:57 +0000 | [diff] [blame] | 258 | |
Chad Rosier | 4e0a55d | 2011-09-16 21:09:17 +0000 | [diff] [blame] | 259 | std::vector<GlobalValue*> Gvs(GVs.begin(), GVs.end()); |
| 260 | |
| 261 | Passes.add(createGVExtractionPass(Gvs, DeleteFn)); |
Chris Lattner | c48e1db | 2007-05-06 05:13:17 +0000 | [diff] [blame] | 262 | if (!DeleteFn) |
| 263 | Passes.add(createGlobalDCEPass()); // Delete unreachable globals |
Devang Patel | c1874b7 | 2010-07-01 19:58:05 +0000 | [diff] [blame] | 264 | Passes.add(createStripDeadDebugInfoPass()); // Remove dead debug info |
Chris Lattner | c48e1db | 2007-05-06 05:13:17 +0000 | [diff] [blame] | 265 | Passes.add(createStripDeadPrototypesPass()); // Remove dead func decls |
| 266 | |
Chris Lattner | 51a1132 | 2009-08-23 02:56:05 +0000 | [diff] [blame] | 267 | std::string ErrorInfo; |
Dan Gohman | 2df9504 | 2010-08-20 01:12:13 +0000 | [diff] [blame] | 268 | tool_output_file Out(OutputFilename.c_str(), ErrorInfo, |
| 269 | raw_fd_ostream::F_Binary); |
Chris Lattner | 51a1132 | 2009-08-23 02:56:05 +0000 | [diff] [blame] | 270 | if (!ErrorInfo.empty()) { |
| 271 | errs() << ErrorInfo << '\n'; |
Chris Lattner | 51a1132 | 2009-08-23 02:56:05 +0000 | [diff] [blame] | 272 | return 1; |
Chris Lattner | c48e1db | 2007-05-06 05:13:17 +0000 | [diff] [blame] | 273 | } |
| 274 | |
Dan Gohman | ec08046 | 2009-09-11 20:46:33 +0000 | [diff] [blame] | 275 | if (OutputAssembly) |
Dan Gohman | d4c4543 | 2010-09-01 14:20:41 +0000 | [diff] [blame] | 276 | Passes.add(createPrintModulePass(&Out.os())); |
| 277 | else if (Force || !CheckBitcodeOutputToConsole(Out.os(), true)) |
| 278 | Passes.add(createBitcodeWriterPass(Out.os())); |
Dan Gohman | baa2639 | 2009-08-25 15:34:52 +0000 | [diff] [blame] | 279 | |
Chris Lattner | c48e1db | 2007-05-06 05:13:17 +0000 | [diff] [blame] | 280 | Passes.run(*M.get()); |
| 281 | |
Dan Gohman | 2df9504 | 2010-08-20 01:12:13 +0000 | [diff] [blame] | 282 | // Declare success. |
| 283 | Out.keep(); |
| 284 | |
Chris Lattner | c48e1db | 2007-05-06 05:13:17 +0000 | [diff] [blame] | 285 | return 0; |
Chris Lattner | 579d914 | 2002-05-22 20:27:00 +0000 | [diff] [blame] | 286 | } |