Chris Lattner | dbb1735 | 2002-04-28 05:43:27 +0000 | [diff] [blame] | 1 | //===-- Internalize.cpp - Mark functions internal -------------------------===// |
Misha Brukman | fd93908 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 2 | // |
John Criswell | b576c94 | 2003-10-20 19:43:21 +0000 | [diff] [blame] | 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
Chris Lattner | 4ee451d | 2007-12-29 20:36:04 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
Misha Brukman | fd93908 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 7 | // |
John Criswell | b576c94 | 2003-10-20 19:43:21 +0000 | [diff] [blame] | 8 | //===----------------------------------------------------------------------===// |
Chris Lattner | dbb1735 | 2002-04-28 05:43:27 +0000 | [diff] [blame] | 9 | // |
Rafael Espindola | e5551ed | 2012-10-26 18:47:48 +0000 | [diff] [blame] | 10 | // This pass loops over all of the functions and variables in the input module. |
| 11 | // If the function or variable is not in the list of external names given to |
| 12 | // the pass it is marked as internal. |
Chris Lattner | dbb1735 | 2002-04-28 05:43:27 +0000 | [diff] [blame] | 13 | // |
Rafael Espindola | 713cab0 | 2013-10-21 17:14:55 +0000 | [diff] [blame^] | 14 | // This transformation would not be legal or profitable in a regular |
| 15 | // compilation, but it gets extra information from the linker about what is safe |
| 16 | // or profitable. |
| 17 | // |
| 18 | // As an example of a normally illegal transformation: Internalizing a function |
| 19 | // with external linkage. Only if we are told it is only used from within this |
| 20 | // module, it is safe to do it. |
| 21 | // |
| 22 | // On the profitability side: It is always legal to internalize a linkonce_odr |
| 23 | // whose address is not used. Doing so normally would introduce code bloat, but |
| 24 | // if we are told by the linker that the only use of this would be for a |
| 25 | // DSO symbol table, it is profitable to hide it. |
| 26 | // |
Chris Lattner | dbb1735 | 2002-04-28 05:43:27 +0000 | [diff] [blame] | 27 | //===----------------------------------------------------------------------===// |
| 28 | |
Chris Lattner | 86453c5 | 2006-12-19 22:09:18 +0000 | [diff] [blame] | 29 | #define DEBUG_TYPE "internalize" |
Chris Lattner | 568ddab | 2002-07-24 17:12:05 +0000 | [diff] [blame] | 30 | #include "llvm/Transforms/IPO.h" |
Rafael Espindola | 4ef7eaf | 2013-07-25 03:23:25 +0000 | [diff] [blame] | 31 | #include "llvm/ADT/SmallPtrSet.h" |
Chandler Carruth | d04a8d4 | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 32 | #include "llvm/ADT/Statistic.h" |
| 33 | #include "llvm/Analysis/CallGraph.h" |
Chandler Carruth | 0b8c9a8 | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 34 | #include "llvm/IR/Module.h" |
Chandler Carruth | d04a8d4 | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 35 | #include "llvm/Pass.h" |
Reid Spencer | 551ccae | 2004-09-01 22:55:40 +0000 | [diff] [blame] | 36 | #include "llvm/Support/CommandLine.h" |
| 37 | #include "llvm/Support/Debug.h" |
Daniel Dunbar | ce63ffb | 2009-07-25 00:23:56 +0000 | [diff] [blame] | 38 | #include "llvm/Support/raw_ostream.h" |
Rafael Espindola | 713cab0 | 2013-10-21 17:14:55 +0000 | [diff] [blame^] | 39 | #include "llvm/Transforms/Utils/GlobalStatus.h" |
Rafael Espindola | 4ef7eaf | 2013-07-25 03:23:25 +0000 | [diff] [blame] | 40 | #include "llvm/Transforms/Utils/ModuleUtils.h" |
Chris Lattner | c7a2c7f | 2003-05-22 19:34:49 +0000 | [diff] [blame] | 41 | #include <fstream> |
| 42 | #include <set> |
Chris Lattner | 1e2385b | 2003-11-21 21:54:22 +0000 | [diff] [blame] | 43 | using namespace llvm; |
Brian Gaeke | d0fde30 | 2003-11-11 22:41:34 +0000 | [diff] [blame] | 44 | |
Duncan Sands | 27a5300 | 2009-01-05 21:24:45 +0000 | [diff] [blame] | 45 | STATISTIC(NumAliases , "Number of aliases internalized"); |
Chris Lattner | 86453c5 | 2006-12-19 22:09:18 +0000 | [diff] [blame] | 46 | STATISTIC(NumFunctions, "Number of functions internalized"); |
| 47 | STATISTIC(NumGlobals , "Number of global vars internalized"); |
| 48 | |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 49 | // APIFile - A file which contains a list of symbols that should not be marked |
| 50 | // external. |
| 51 | static cl::opt<std::string> |
| 52 | APIFile("internalize-public-api-file", cl::value_desc("filename"), |
| 53 | cl::desc("A file containing list of symbol names to preserve")); |
| 54 | |
| 55 | // APIList - A list of symbols that should not be marked internal. |
| 56 | static cl::list<std::string> |
| 57 | APIList("internalize-public-api-list", cl::value_desc("list"), |
| 58 | cl::desc("A list of symbol names to preserve"), |
| 59 | cl::CommaSeparated); |
| 60 | |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame] | 61 | static cl::list<std::string> |
| 62 | DSOList("internalize-dso-list", cl::value_desc("list"), |
| 63 | cl::desc("A list of symbol names need for a dso symbol table"), |
| 64 | cl::CommaSeparated); |
| 65 | |
Chris Lattner | f629309 | 2002-07-23 18:06:35 +0000 | [diff] [blame] | 66 | namespace { |
Nick Lewycky | 6726b6d | 2009-10-25 06:33:48 +0000 | [diff] [blame] | 67 | class InternalizePass : public ModulePass { |
Chris Lattner | c7a2c7f | 2003-05-22 19:34:49 +0000 | [diff] [blame] | 68 | std::set<std::string> ExternalNames; |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame] | 69 | std::set<std::string> DSONames; |
Chris Lattner | c7a2c7f | 2003-05-22 19:34:49 +0000 | [diff] [blame] | 70 | public: |
Nick Lewycky | ecd94c8 | 2007-05-06 13:37:16 +0000 | [diff] [blame] | 71 | static char ID; // Pass identification, replacement for typeid |
Rafael Espindola | e5551ed | 2012-10-26 18:47:48 +0000 | [diff] [blame] | 72 | explicit InternalizePass(); |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame] | 73 | explicit InternalizePass(ArrayRef<const char *> ExportList, |
| 74 | ArrayRef<const char *> DSOList); |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 75 | void LoadFile(const char *Filename); |
| 76 | virtual bool runOnModule(Module &M); |
Nuno Lopes | 0483d01 | 2008-09-30 22:04:30 +0000 | [diff] [blame] | 77 | |
| 78 | virtual void getAnalysisUsage(AnalysisUsage &AU) const { |
| 79 | AU.setPreservesCFG(); |
Duncan Sands | a2582da | 2008-10-03 07:36:09 +0000 | [diff] [blame] | 80 | AU.addPreserved<CallGraph>(); |
Nuno Lopes | 0483d01 | 2008-09-30 22:04:30 +0000 | [diff] [blame] | 81 | } |
Chris Lattner | 55e41ba | 2002-07-30 19:48:44 +0000 | [diff] [blame] | 82 | }; |
Chris Lattner | f629309 | 2002-07-23 18:06:35 +0000 | [diff] [blame] | 83 | } // end anonymous namespace |
| 84 | |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 85 | char InternalizePass::ID = 0; |
Owen Anderson | d13db2c | 2010-07-21 22:09:45 +0000 | [diff] [blame] | 86 | INITIALIZE_PASS(InternalizePass, "internalize", |
Owen Anderson | ce665bd | 2010-10-07 22:25:06 +0000 | [diff] [blame] | 87 | "Internalize Global Symbols", false, false) |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 88 | |
Rafael Espindola | e5551ed | 2012-10-26 18:47:48 +0000 | [diff] [blame] | 89 | InternalizePass::InternalizePass() |
| 90 | : ModulePass(ID) { |
Owen Anderson | 081c34b | 2010-10-19 17:21:58 +0000 | [diff] [blame] | 91 | initializeInternalizePassPass(*PassRegistry::getPassRegistry()); |
Devang Patel | ef3682a | 2008-05-14 20:01:01 +0000 | [diff] [blame] | 92 | if (!APIFile.empty()) // If a filename is specified, use it. |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 93 | LoadFile(APIFile.c_str()); |
Rafael Espindola | 1d7df34 | 2013-09-04 18:53:21 +0000 | [diff] [blame] | 94 | ExternalNames.insert(APIList.begin(), APIList.end()); |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame] | 95 | DSONames.insert(DSOList.begin(), DSOList.end()); |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 96 | } |
| 97 | |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame] | 98 | InternalizePass::InternalizePass(ArrayRef<const char *> ExportList, |
| 99 | ArrayRef<const char *> DSOList) |
Rafael Espindola | e5551ed | 2012-10-26 18:47:48 +0000 | [diff] [blame] | 100 | : ModulePass(ID){ |
Owen Anderson | 081c34b | 2010-10-19 17:21:58 +0000 | [diff] [blame] | 101 | initializeInternalizePassPass(*PassRegistry::getPassRegistry()); |
Rafael Espindola | 775079c | 2013-09-04 20:08:46 +0000 | [diff] [blame] | 102 | for(ArrayRef<const char *>::const_iterator itr = ExportList.begin(); |
| 103 | itr != ExportList.end(); itr++) { |
Devang Patel | 753d94a | 2006-07-20 17:48:05 +0000 | [diff] [blame] | 104 | ExternalNames.insert(*itr); |
| 105 | } |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame] | 106 | for(ArrayRef<const char *>::const_iterator itr = DSOList.begin(); |
| 107 | itr != DSOList.end(); itr++) { |
| 108 | DSONames.insert(*itr); |
| 109 | } |
Devang Patel | 753d94a | 2006-07-20 17:48:05 +0000 | [diff] [blame] | 110 | } |
| 111 | |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 112 | void InternalizePass::LoadFile(const char *Filename) { |
| 113 | // Load the APIFile... |
| 114 | std::ifstream In(Filename); |
| 115 | if (!In.good()) { |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 116 | errs() << "WARNING: Internalize couldn't load file '" << Filename |
Devang Patel | ef3682a | 2008-05-14 20:01:01 +0000 | [diff] [blame] | 117 | << "'! Continuing as if it's empty.\n"; |
| 118 | return; // Just continue as if the file were empty |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 119 | } |
| 120 | while (In) { |
| 121 | std::string Symbol; |
| 122 | In >> Symbol; |
| 123 | if (!Symbol.empty()) |
| 124 | ExternalNames.insert(Symbol); |
| 125 | } |
| 126 | } |
| 127 | |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 128 | static bool shouldInternalize(const GlobalValue &GV, |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame] | 129 | const std::set<std::string> &ExternalNames, |
| 130 | const std::set<std::string> &DSONames) { |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 131 | // Function must be defined here |
| 132 | if (GV.isDeclaration()) |
| 133 | return false; |
| 134 | |
| 135 | // Available externally is really just a "declaration with a body". |
| 136 | if (GV.hasAvailableExternallyLinkage()) |
| 137 | return false; |
| 138 | |
| 139 | // Already has internal linkage |
| 140 | if (GV.hasLocalLinkage()) |
| 141 | return false; |
| 142 | |
| 143 | // Marked to keep external? |
| 144 | if (ExternalNames.count(GV.getName())) |
| 145 | return false; |
| 146 | |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame] | 147 | // Not needed for the symbol table? |
| 148 | if (!DSONames.count(GV.getName())) |
| 149 | return true; |
| 150 | |
| 151 | // Not a linkonce. Someone can depend on it being on the symbol table. |
| 152 | if (!GV.hasLinkOnceLinkage()) |
| 153 | return false; |
| 154 | |
| 155 | // The address is not important, we can hide it. |
| 156 | if (GV.hasUnnamedAddr()) |
| 157 | return true; |
| 158 | |
Rafael Espindola | 713cab0 | 2013-10-21 17:14:55 +0000 | [diff] [blame^] | 159 | GlobalStatus GS; |
| 160 | if (GlobalStatus::analyzeGlobal(&GV, GS)) |
| 161 | return false; |
| 162 | |
| 163 | return !GS.IsCompared; |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 164 | } |
| 165 | |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 166 | bool InternalizePass::runOnModule(Module &M) { |
Duncan Sands | 1465d61 | 2009-01-28 13:14:17 +0000 | [diff] [blame] | 167 | CallGraph *CG = getAnalysisIfAvailable<CallGraph>(); |
Duncan Sands | a2582da | 2008-10-03 07:36:09 +0000 | [diff] [blame] | 168 | CallGraphNode *ExternalNode = CG ? CG->getExternalCallingNode() : 0; |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 169 | bool Changed = false; |
Duncan Sands | 2631ac3 | 2009-01-05 20:38:27 +0000 | [diff] [blame] | 170 | |
Rafael Espindola | 4ef7eaf | 2013-07-25 03:23:25 +0000 | [diff] [blame] | 171 | SmallPtrSet<GlobalValue *, 8> Used; |
| 172 | collectUsedGlobalVariables(M, Used, false); |
| 173 | |
| 174 | // We must assume that globals in llvm.used have a reference that not even |
| 175 | // the linker can see, so we don't internalize them. |
| 176 | // For llvm.compiler.used the situation is a bit fuzzy. The assembler and |
| 177 | // linker can drop those symbols. If this pass is running as part of LTO, |
| 178 | // one might think that it could just drop llvm.compiler.used. The problem |
| 179 | // is that even in LTO llvm doesn't see every reference. For example, |
| 180 | // we don't see references from function local inline assembly. To be |
| 181 | // conservative, we internalize symbols in llvm.compiler.used, but we |
| 182 | // keep llvm.compiler.used so that the symbol is not deleted by llvm. |
| 183 | for (SmallPtrSet<GlobalValue *, 8>::iterator I = Used.begin(), E = Used.end(); |
| 184 | I != E; ++I) { |
| 185 | GlobalValue *V = *I; |
| 186 | ExternalNames.insert(V->getName()); |
| 187 | } |
| 188 | |
Devang Patel | ef3682a | 2008-05-14 20:01:01 +0000 | [diff] [blame] | 189 | // Mark all functions not in the api as internal. |
Rafael Espindola | bb46f52 | 2009-01-15 20:18:42 +0000 | [diff] [blame] | 190 | // FIXME: maybe use private linkage? |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 191 | for (Module::iterator I = M.begin(), E = M.end(); I != E; ++I) { |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame] | 192 | if (!shouldInternalize(*I, ExternalNames, DSONames)) |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 193 | continue; |
Bill Wendling | 86d4956 | 2013-08-30 21:07:33 +0000 | [diff] [blame] | 194 | |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 195 | I->setLinkage(GlobalValue::InternalLinkage); |
Bill Wendling | 86d4956 | 2013-08-30 21:07:33 +0000 | [diff] [blame] | 196 | |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 197 | if (ExternalNode) |
| 198 | // Remove a callgraph edge from the external node to this function. |
| 199 | ExternalNode->removeOneAbstractEdgeTo((*CG)[I]); |
| 200 | |
| 201 | Changed = true; |
| 202 | ++NumFunctions; |
| 203 | DEBUG(dbgs() << "Internalizing func " << I->getName() << "\n"); |
| 204 | } |
Duncan Sands | 2631ac3 | 2009-01-05 20:38:27 +0000 | [diff] [blame] | 205 | |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 206 | // Never internalize the llvm.used symbol. It is used to implement |
| 207 | // attribute((used)). |
Chris Lattner | 401e10c | 2009-07-20 06:14:25 +0000 | [diff] [blame] | 208 | // FIXME: Shouldn't this just filter on llvm.metadata section?? |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 209 | ExternalNames.insert("llvm.used"); |
Chris Lattner | 401e10c | 2009-07-20 06:14:25 +0000 | [diff] [blame] | 210 | ExternalNames.insert("llvm.compiler.used"); |
Duncan Sands | 2631ac3 | 2009-01-05 20:38:27 +0000 | [diff] [blame] | 211 | |
Jim Laskey | 44c3b9f | 2007-01-26 21:22:28 +0000 | [diff] [blame] | 212 | // Never internalize anchors used by the machine module info, else the info |
| 213 | // won't find them. (see MachineModuleInfo.) |
Chris Lattner | 4e2288b | 2007-06-06 20:51:41 +0000 | [diff] [blame] | 214 | ExternalNames.insert("llvm.global_ctors"); |
| 215 | ExternalNames.insert("llvm.global_dtors"); |
Tanya Lattner | 088b591 | 2007-10-03 17:05:40 +0000 | [diff] [blame] | 216 | ExternalNames.insert("llvm.global.annotations"); |
Duncan Sands | 2631ac3 | 2009-01-05 20:38:27 +0000 | [diff] [blame] | 217 | |
Bill Wendling | aab3c0c | 2012-04-13 01:06:27 +0000 | [diff] [blame] | 218 | // Never internalize symbols code-gen inserts. |
Bill Wendling | d275ff5 | 2013-08-12 20:09:37 +0000 | [diff] [blame] | 219 | // FIXME: We should probably add this (and the __stack_chk_guard) via some |
| 220 | // type of call-back in CodeGen. |
| 221 | ExternalNames.insert("__stack_chk_fail"); |
Bill Wendling | aab3c0c | 2012-04-13 01:06:27 +0000 | [diff] [blame] | 222 | ExternalNames.insert("__stack_chk_guard"); |
| 223 | |
Devang Patel | ef3682a | 2008-05-14 20:01:01 +0000 | [diff] [blame] | 224 | // Mark all global variables with initializers that are not in the api as |
| 225 | // internal as well. |
Rafael Espindola | bb46f52 | 2009-01-15 20:18:42 +0000 | [diff] [blame] | 226 | // FIXME: maybe use private linkage? |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 227 | for (Module::global_iterator I = M.global_begin(), E = M.global_end(); |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 228 | I != E; ++I) { |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame] | 229 | if (!shouldInternalize(*I, ExternalNames, DSONames)) |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 230 | continue; |
| 231 | |
| 232 | I->setLinkage(GlobalValue::InternalLinkage); |
| 233 | Changed = true; |
| 234 | ++NumGlobals; |
| 235 | DEBUG(dbgs() << "Internalized gvar " << I->getName() << "\n"); |
| 236 | } |
Duncan Sands | 2631ac3 | 2009-01-05 20:38:27 +0000 | [diff] [blame] | 237 | |
Duncan Sands | 27a5300 | 2009-01-05 21:24:45 +0000 | [diff] [blame] | 238 | // Mark all aliases that are not in the api as internal as well. |
| 239 | for (Module::alias_iterator I = M.alias_begin(), E = M.alias_end(); |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 240 | I != E; ++I) { |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame] | 241 | if (!shouldInternalize(*I, ExternalNames, DSONames)) |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 242 | continue; |
| 243 | |
| 244 | I->setLinkage(GlobalValue::InternalLinkage); |
| 245 | Changed = true; |
| 246 | ++NumAliases; |
| 247 | DEBUG(dbgs() << "Internalized alias " << I->getName() << "\n"); |
| 248 | } |
Duncan Sands | 27a5300 | 2009-01-05 21:24:45 +0000 | [diff] [blame] | 249 | |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 250 | return Changed; |
| 251 | } |
| 252 | |
Rafael Espindola | e5551ed | 2012-10-26 18:47:48 +0000 | [diff] [blame] | 253 | ModulePass *llvm::createInternalizePass() { |
| 254 | return new InternalizePass(); |
Chris Lattner | dbb1735 | 2002-04-28 05:43:27 +0000 | [diff] [blame] | 255 | } |
Devang Patel | 753d94a | 2006-07-20 17:48:05 +0000 | [diff] [blame] | 256 | |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame] | 257 | ModulePass *llvm::createInternalizePass(ArrayRef<const char *> ExportList, |
| 258 | ArrayRef<const char *> DSOList) { |
| 259 | return new InternalizePass(ExportList, DSOList); |
Devang Patel | 753d94a | 2006-07-20 17:48:05 +0000 | [diff] [blame] | 260 | } |