Chris Lattner | dbb1735 | 2002-04-28 05:43:27 +0000 | [diff] [blame] | 1 | //===-- Internalize.cpp - Mark functions internal -------------------------===// |
Misha Brukman | fd93908 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 2 | // |
John Criswell | b576c94 | 2003-10-20 19:43:21 +0000 | [diff] [blame] | 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
Chris Lattner | 4ee451d | 2007-12-29 20:36:04 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
Misha Brukman | fd93908 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 7 | // |
John Criswell | b576c94 | 2003-10-20 19:43:21 +0000 | [diff] [blame] | 8 | //===----------------------------------------------------------------------===// |
Chris Lattner | dbb1735 | 2002-04-28 05:43:27 +0000 | [diff] [blame] | 9 | // |
Rafael Espindola | e5551ed | 2012-10-26 18:47:48 +0000 | [diff] [blame] | 10 | // This pass loops over all of the functions and variables in the input module. |
| 11 | // If the function or variable is not in the list of external names given to |
| 12 | // the pass it is marked as internal. |
Chris Lattner | dbb1735 | 2002-04-28 05:43:27 +0000 | [diff] [blame] | 13 | // |
| 14 | //===----------------------------------------------------------------------===// |
| 15 | |
Chris Lattner | 86453c5 | 2006-12-19 22:09:18 +0000 | [diff] [blame] | 16 | #define DEBUG_TYPE "internalize" |
Chris Lattner | 568ddab | 2002-07-24 17:12:05 +0000 | [diff] [blame] | 17 | #include "llvm/Transforms/IPO.h" |
Rafael Espindola | 4ef7eaf | 2013-07-25 03:23:25 +0000 | [diff] [blame] | 18 | #include "llvm/ADT/SmallPtrSet.h" |
Chandler Carruth | d04a8d4 | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 19 | #include "llvm/ADT/Statistic.h" |
| 20 | #include "llvm/Analysis/CallGraph.h" |
Chandler Carruth | 0b8c9a8 | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 21 | #include "llvm/IR/Module.h" |
Chandler Carruth | d04a8d4 | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 22 | #include "llvm/Pass.h" |
Reid Spencer | 551ccae | 2004-09-01 22:55:40 +0000 | [diff] [blame] | 23 | #include "llvm/Support/CommandLine.h" |
| 24 | #include "llvm/Support/Debug.h" |
Daniel Dunbar | ce63ffb | 2009-07-25 00:23:56 +0000 | [diff] [blame] | 25 | #include "llvm/Support/raw_ostream.h" |
Rafael Espindola | 4ef7eaf | 2013-07-25 03:23:25 +0000 | [diff] [blame] | 26 | #include "llvm/Transforms/Utils/ModuleUtils.h" |
Chris Lattner | c7a2c7f | 2003-05-22 19:34:49 +0000 | [diff] [blame] | 27 | #include <fstream> |
| 28 | #include <set> |
Chris Lattner | 1e2385b | 2003-11-21 21:54:22 +0000 | [diff] [blame] | 29 | using namespace llvm; |
Brian Gaeke | d0fde30 | 2003-11-11 22:41:34 +0000 | [diff] [blame] | 30 | |
Duncan Sands | 27a5300 | 2009-01-05 21:24:45 +0000 | [diff] [blame] | 31 | STATISTIC(NumAliases , "Number of aliases internalized"); |
Chris Lattner | 86453c5 | 2006-12-19 22:09:18 +0000 | [diff] [blame] | 32 | STATISTIC(NumFunctions, "Number of functions internalized"); |
| 33 | STATISTIC(NumGlobals , "Number of global vars internalized"); |
| 34 | |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 35 | // APIFile - A file which contains a list of symbols that should not be marked |
| 36 | // external. |
| 37 | static cl::opt<std::string> |
| 38 | APIFile("internalize-public-api-file", cl::value_desc("filename"), |
| 39 | cl::desc("A file containing list of symbol names to preserve")); |
| 40 | |
| 41 | // APIList - A list of symbols that should not be marked internal. |
| 42 | static cl::list<std::string> |
| 43 | APIList("internalize-public-api-list", cl::value_desc("list"), |
| 44 | cl::desc("A list of symbol names to preserve"), |
| 45 | cl::CommaSeparated); |
| 46 | |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame^] | 47 | static cl::list<std::string> |
| 48 | DSOList("internalize-dso-list", cl::value_desc("list"), |
| 49 | cl::desc("A list of symbol names need for a dso symbol table"), |
| 50 | cl::CommaSeparated); |
| 51 | |
Chris Lattner | f629309 | 2002-07-23 18:06:35 +0000 | [diff] [blame] | 52 | namespace { |
Nick Lewycky | 6726b6d | 2009-10-25 06:33:48 +0000 | [diff] [blame] | 53 | class InternalizePass : public ModulePass { |
Chris Lattner | c7a2c7f | 2003-05-22 19:34:49 +0000 | [diff] [blame] | 54 | std::set<std::string> ExternalNames; |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame^] | 55 | std::set<std::string> DSONames; |
Chris Lattner | c7a2c7f | 2003-05-22 19:34:49 +0000 | [diff] [blame] | 56 | public: |
Nick Lewycky | ecd94c8 | 2007-05-06 13:37:16 +0000 | [diff] [blame] | 57 | static char ID; // Pass identification, replacement for typeid |
Rafael Espindola | e5551ed | 2012-10-26 18:47:48 +0000 | [diff] [blame] | 58 | explicit InternalizePass(); |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame^] | 59 | explicit InternalizePass(ArrayRef<const char *> ExportList, |
| 60 | ArrayRef<const char *> DSOList); |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 61 | void LoadFile(const char *Filename); |
| 62 | virtual bool runOnModule(Module &M); |
Nuno Lopes | 0483d01 | 2008-09-30 22:04:30 +0000 | [diff] [blame] | 63 | |
| 64 | virtual void getAnalysisUsage(AnalysisUsage &AU) const { |
| 65 | AU.setPreservesCFG(); |
Duncan Sands | a2582da | 2008-10-03 07:36:09 +0000 | [diff] [blame] | 66 | AU.addPreserved<CallGraph>(); |
Nuno Lopes | 0483d01 | 2008-09-30 22:04:30 +0000 | [diff] [blame] | 67 | } |
Chris Lattner | 55e41ba | 2002-07-30 19:48:44 +0000 | [diff] [blame] | 68 | }; |
Chris Lattner | f629309 | 2002-07-23 18:06:35 +0000 | [diff] [blame] | 69 | } // end anonymous namespace |
| 70 | |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 71 | char InternalizePass::ID = 0; |
Owen Anderson | d13db2c | 2010-07-21 22:09:45 +0000 | [diff] [blame] | 72 | INITIALIZE_PASS(InternalizePass, "internalize", |
Owen Anderson | ce665bd | 2010-10-07 22:25:06 +0000 | [diff] [blame] | 73 | "Internalize Global Symbols", false, false) |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 74 | |
Rafael Espindola | e5551ed | 2012-10-26 18:47:48 +0000 | [diff] [blame] | 75 | InternalizePass::InternalizePass() |
| 76 | : ModulePass(ID) { |
Owen Anderson | 081c34b | 2010-10-19 17:21:58 +0000 | [diff] [blame] | 77 | initializeInternalizePassPass(*PassRegistry::getPassRegistry()); |
Devang Patel | ef3682a | 2008-05-14 20:01:01 +0000 | [diff] [blame] | 78 | if (!APIFile.empty()) // If a filename is specified, use it. |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 79 | LoadFile(APIFile.c_str()); |
Rafael Espindola | 1d7df34 | 2013-09-04 18:53:21 +0000 | [diff] [blame] | 80 | ExternalNames.insert(APIList.begin(), APIList.end()); |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame^] | 81 | DSONames.insert(DSOList.begin(), DSOList.end()); |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 82 | } |
| 83 | |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame^] | 84 | InternalizePass::InternalizePass(ArrayRef<const char *> ExportList, |
| 85 | ArrayRef<const char *> DSOList) |
Rafael Espindola | e5551ed | 2012-10-26 18:47:48 +0000 | [diff] [blame] | 86 | : ModulePass(ID){ |
Owen Anderson | 081c34b | 2010-10-19 17:21:58 +0000 | [diff] [blame] | 87 | initializeInternalizePassPass(*PassRegistry::getPassRegistry()); |
Rafael Espindola | 775079c | 2013-09-04 20:08:46 +0000 | [diff] [blame] | 88 | for(ArrayRef<const char *>::const_iterator itr = ExportList.begin(); |
| 89 | itr != ExportList.end(); itr++) { |
Devang Patel | 753d94a | 2006-07-20 17:48:05 +0000 | [diff] [blame] | 90 | ExternalNames.insert(*itr); |
| 91 | } |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame^] | 92 | for(ArrayRef<const char *>::const_iterator itr = DSOList.begin(); |
| 93 | itr != DSOList.end(); itr++) { |
| 94 | DSONames.insert(*itr); |
| 95 | } |
Devang Patel | 753d94a | 2006-07-20 17:48:05 +0000 | [diff] [blame] | 96 | } |
| 97 | |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 98 | void InternalizePass::LoadFile(const char *Filename) { |
| 99 | // Load the APIFile... |
| 100 | std::ifstream In(Filename); |
| 101 | if (!In.good()) { |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 102 | errs() << "WARNING: Internalize couldn't load file '" << Filename |
Devang Patel | ef3682a | 2008-05-14 20:01:01 +0000 | [diff] [blame] | 103 | << "'! Continuing as if it's empty.\n"; |
| 104 | return; // Just continue as if the file were empty |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 105 | } |
| 106 | while (In) { |
| 107 | std::string Symbol; |
| 108 | In >> Symbol; |
| 109 | if (!Symbol.empty()) |
| 110 | ExternalNames.insert(Symbol); |
| 111 | } |
| 112 | } |
| 113 | |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 114 | static bool shouldInternalize(const GlobalValue &GV, |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame^] | 115 | const std::set<std::string> &ExternalNames, |
| 116 | const std::set<std::string> &DSONames) { |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 117 | // Function must be defined here |
| 118 | if (GV.isDeclaration()) |
| 119 | return false; |
| 120 | |
| 121 | // Available externally is really just a "declaration with a body". |
| 122 | if (GV.hasAvailableExternallyLinkage()) |
| 123 | return false; |
| 124 | |
| 125 | // Already has internal linkage |
| 126 | if (GV.hasLocalLinkage()) |
| 127 | return false; |
| 128 | |
| 129 | // Marked to keep external? |
| 130 | if (ExternalNames.count(GV.getName())) |
| 131 | return false; |
| 132 | |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame^] | 133 | // Not needed for the symbol table? |
| 134 | if (!DSONames.count(GV.getName())) |
| 135 | return true; |
| 136 | |
| 137 | // Not a linkonce. Someone can depend on it being on the symbol table. |
| 138 | if (!GV.hasLinkOnceLinkage()) |
| 139 | return false; |
| 140 | |
| 141 | // The address is not important, we can hide it. |
| 142 | if (GV.hasUnnamedAddr()) |
| 143 | return true; |
| 144 | |
| 145 | // FIXME: Check if the address is used. |
| 146 | return false; |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 147 | } |
| 148 | |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 149 | bool InternalizePass::runOnModule(Module &M) { |
Duncan Sands | 1465d61 | 2009-01-28 13:14:17 +0000 | [diff] [blame] | 150 | CallGraph *CG = getAnalysisIfAvailable<CallGraph>(); |
Duncan Sands | a2582da | 2008-10-03 07:36:09 +0000 | [diff] [blame] | 151 | CallGraphNode *ExternalNode = CG ? CG->getExternalCallingNode() : 0; |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 152 | bool Changed = false; |
Duncan Sands | 2631ac3 | 2009-01-05 20:38:27 +0000 | [diff] [blame] | 153 | |
Rafael Espindola | 4ef7eaf | 2013-07-25 03:23:25 +0000 | [diff] [blame] | 154 | SmallPtrSet<GlobalValue *, 8> Used; |
| 155 | collectUsedGlobalVariables(M, Used, false); |
| 156 | |
| 157 | // We must assume that globals in llvm.used have a reference that not even |
| 158 | // the linker can see, so we don't internalize them. |
| 159 | // For llvm.compiler.used the situation is a bit fuzzy. The assembler and |
| 160 | // linker can drop those symbols. If this pass is running as part of LTO, |
| 161 | // one might think that it could just drop llvm.compiler.used. The problem |
| 162 | // is that even in LTO llvm doesn't see every reference. For example, |
| 163 | // we don't see references from function local inline assembly. To be |
| 164 | // conservative, we internalize symbols in llvm.compiler.used, but we |
| 165 | // keep llvm.compiler.used so that the symbol is not deleted by llvm. |
| 166 | for (SmallPtrSet<GlobalValue *, 8>::iterator I = Used.begin(), E = Used.end(); |
| 167 | I != E; ++I) { |
| 168 | GlobalValue *V = *I; |
| 169 | ExternalNames.insert(V->getName()); |
| 170 | } |
| 171 | |
Devang Patel | ef3682a | 2008-05-14 20:01:01 +0000 | [diff] [blame] | 172 | // Mark all functions not in the api as internal. |
Rafael Espindola | bb46f52 | 2009-01-15 20:18:42 +0000 | [diff] [blame] | 173 | // FIXME: maybe use private linkage? |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 174 | for (Module::iterator I = M.begin(), E = M.end(); I != E; ++I) { |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame^] | 175 | if (!shouldInternalize(*I, ExternalNames, DSONames)) |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 176 | continue; |
Bill Wendling | 86d4956 | 2013-08-30 21:07:33 +0000 | [diff] [blame] | 177 | |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 178 | I->setLinkage(GlobalValue::InternalLinkage); |
Bill Wendling | 86d4956 | 2013-08-30 21:07:33 +0000 | [diff] [blame] | 179 | |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 180 | if (ExternalNode) |
| 181 | // Remove a callgraph edge from the external node to this function. |
| 182 | ExternalNode->removeOneAbstractEdgeTo((*CG)[I]); |
| 183 | |
| 184 | Changed = true; |
| 185 | ++NumFunctions; |
| 186 | DEBUG(dbgs() << "Internalizing func " << I->getName() << "\n"); |
| 187 | } |
Duncan Sands | 2631ac3 | 2009-01-05 20:38:27 +0000 | [diff] [blame] | 188 | |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 189 | // Never internalize the llvm.used symbol. It is used to implement |
| 190 | // attribute((used)). |
Chris Lattner | 401e10c | 2009-07-20 06:14:25 +0000 | [diff] [blame] | 191 | // FIXME: Shouldn't this just filter on llvm.metadata section?? |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 192 | ExternalNames.insert("llvm.used"); |
Chris Lattner | 401e10c | 2009-07-20 06:14:25 +0000 | [diff] [blame] | 193 | ExternalNames.insert("llvm.compiler.used"); |
Duncan Sands | 2631ac3 | 2009-01-05 20:38:27 +0000 | [diff] [blame] | 194 | |
Jim Laskey | 44c3b9f | 2007-01-26 21:22:28 +0000 | [diff] [blame] | 195 | // Never internalize anchors used by the machine module info, else the info |
| 196 | // won't find them. (see MachineModuleInfo.) |
Chris Lattner | 4e2288b | 2007-06-06 20:51:41 +0000 | [diff] [blame] | 197 | ExternalNames.insert("llvm.global_ctors"); |
| 198 | ExternalNames.insert("llvm.global_dtors"); |
Tanya Lattner | 088b591 | 2007-10-03 17:05:40 +0000 | [diff] [blame] | 199 | ExternalNames.insert("llvm.global.annotations"); |
Duncan Sands | 2631ac3 | 2009-01-05 20:38:27 +0000 | [diff] [blame] | 200 | |
Bill Wendling | aab3c0c | 2012-04-13 01:06:27 +0000 | [diff] [blame] | 201 | // Never internalize symbols code-gen inserts. |
Bill Wendling | d275ff5 | 2013-08-12 20:09:37 +0000 | [diff] [blame] | 202 | // FIXME: We should probably add this (and the __stack_chk_guard) via some |
| 203 | // type of call-back in CodeGen. |
| 204 | ExternalNames.insert("__stack_chk_fail"); |
Bill Wendling | aab3c0c | 2012-04-13 01:06:27 +0000 | [diff] [blame] | 205 | ExternalNames.insert("__stack_chk_guard"); |
| 206 | |
Devang Patel | ef3682a | 2008-05-14 20:01:01 +0000 | [diff] [blame] | 207 | // Mark all global variables with initializers that are not in the api as |
| 208 | // internal as well. |
Rafael Espindola | bb46f52 | 2009-01-15 20:18:42 +0000 | [diff] [blame] | 209 | // FIXME: maybe use private linkage? |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 210 | for (Module::global_iterator I = M.global_begin(), E = M.global_end(); |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 211 | I != E; ++I) { |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame^] | 212 | if (!shouldInternalize(*I, ExternalNames, DSONames)) |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 213 | continue; |
| 214 | |
| 215 | I->setLinkage(GlobalValue::InternalLinkage); |
| 216 | Changed = true; |
| 217 | ++NumGlobals; |
| 218 | DEBUG(dbgs() << "Internalized gvar " << I->getName() << "\n"); |
| 219 | } |
Duncan Sands | 2631ac3 | 2009-01-05 20:38:27 +0000 | [diff] [blame] | 220 | |
Duncan Sands | 27a5300 | 2009-01-05 21:24:45 +0000 | [diff] [blame] | 221 | // Mark all aliases that are not in the api as internal as well. |
| 222 | for (Module::alias_iterator I = M.alias_begin(), E = M.alias_end(); |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 223 | I != E; ++I) { |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame^] | 224 | if (!shouldInternalize(*I, ExternalNames, DSONames)) |
Rafael Espindola | 0fb7716 | 2013-09-04 18:37:36 +0000 | [diff] [blame] | 225 | continue; |
| 226 | |
| 227 | I->setLinkage(GlobalValue::InternalLinkage); |
| 228 | Changed = true; |
| 229 | ++NumAliases; |
| 230 | DEBUG(dbgs() << "Internalized alias " << I->getName() << "\n"); |
| 231 | } |
Duncan Sands | 27a5300 | 2009-01-05 21:24:45 +0000 | [diff] [blame] | 232 | |
Chris Lattner | 4eb40df | 2006-01-03 19:13:17 +0000 | [diff] [blame] | 233 | return Changed; |
| 234 | } |
| 235 | |
Rafael Espindola | e5551ed | 2012-10-26 18:47:48 +0000 | [diff] [blame] | 236 | ModulePass *llvm::createInternalizePass() { |
| 237 | return new InternalizePass(); |
Chris Lattner | dbb1735 | 2002-04-28 05:43:27 +0000 | [diff] [blame] | 238 | } |
Devang Patel | 753d94a | 2006-07-20 17:48:05 +0000 | [diff] [blame] | 239 | |
Rafael Espindola | 4389009 | 2013-10-03 18:29:09 +0000 | [diff] [blame^] | 240 | ModulePass *llvm::createInternalizePass(ArrayRef<const char *> ExportList, |
| 241 | ArrayRef<const char *> DSOList) { |
| 242 | return new InternalizePass(ExportList, DSOList); |
Devang Patel | 753d94a | 2006-07-20 17:48:05 +0000 | [diff] [blame] | 243 | } |