Devang Patel | 827454e | 2011-10-17 17:17:43 +0000 | [diff] [blame] | 1 | //===-- GlobalMerge.cpp - Internal globals merging -----------------------===// |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // This pass merges globals with internal linkage into one. This way all the |
| 10 | // globals which were merged into the bigger one can be addressed using offsets |
| 11 | // from the same base pointer (no need for a separate base pointer for each |
| 12 | // global). Such a transformation can significantly reduce the register pressure |
| 13 | // when many globals are involved. |
| 14 | // |
Nadav Rotem | a94d6e8 | 2012-07-24 10:51:42 +0000 | [diff] [blame] | 15 | // For example, consider the code which touches several global variables at |
Eric Christopher | a99c3e9 | 2010-09-28 04:18:29 +0000 | [diff] [blame] | 16 | // once: |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 17 | // |
| 18 | // static int foo[N], bar[N], baz[N]; |
| 19 | // |
| 20 | // for (i = 0; i < N; ++i) { |
| 21 | // foo[i] = bar[i] * baz[i]; |
| 22 | // } |
| 23 | // |
| 24 | // On ARM the addresses of 3 arrays should be kept in the registers, thus |
| 25 | // this code has quite large register pressure (loop body): |
| 26 | // |
| 27 | // ldr r1, [r5], #4 |
| 28 | // ldr r2, [r6], #4 |
| 29 | // mul r1, r2, r1 |
| 30 | // str r1, [r0], #4 |
| 31 | // |
| 32 | // Pass converts the code to something like: |
| 33 | // |
| 34 | // static struct { |
| 35 | // int foo[N]; |
| 36 | // int bar[N]; |
| 37 | // int baz[N]; |
| 38 | // } merged; |
| 39 | // |
| 40 | // for (i = 0; i < N; ++i) { |
| 41 | // merged.foo[i] = merged.bar[i] * merged.baz[i]; |
| 42 | // } |
| 43 | // |
| 44 | // and in ARM code this becomes: |
| 45 | // |
| 46 | // ldr r0, [r5, #40] |
| 47 | // ldr r1, [r5, #80] |
| 48 | // mul r0, r1, r0 |
| 49 | // str r0, [r5], #4 |
| 50 | // |
| 51 | // note that we saved 2 registers here almost "for free". |
Eric Christopher | a99c3e9 | 2010-09-28 04:18:29 +0000 | [diff] [blame] | 52 | // ===---------------------------------------------------------------------===// |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 53 | |
Devang Patel | 827454e | 2011-10-17 17:17:43 +0000 | [diff] [blame] | 54 | #define DEBUG_TYPE "global-merge" |
| 55 | #include "llvm/Transforms/Scalar.h" |
Chandler Carruth | d04a8d4 | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 56 | #include "llvm/ADT/Statistic.h" |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 57 | #include "llvm/Attributes.h" |
| 58 | #include "llvm/Constants.h" |
Chandler Carruth | d04a8d4 | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 59 | #include "llvm/DataLayout.h" |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 60 | #include "llvm/DerivedTypes.h" |
| 61 | #include "llvm/Function.h" |
| 62 | #include "llvm/GlobalVariable.h" |
| 63 | #include "llvm/Instructions.h" |
| 64 | #include "llvm/Intrinsics.h" |
| 65 | #include "llvm/Module.h" |
| 66 | #include "llvm/Pass.h" |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 67 | #include "llvm/Target/TargetLowering.h" |
Bob Wilson | 0564609 | 2010-11-17 21:25:39 +0000 | [diff] [blame] | 68 | #include "llvm/Target/TargetLoweringObjectFile.h" |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 69 | using namespace llvm; |
| 70 | |
Devang Patel | 827454e | 2011-10-17 17:17:43 +0000 | [diff] [blame] | 71 | STATISTIC(NumMerged , "Number of globals merged"); |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 72 | namespace { |
Devang Patel | 827454e | 2011-10-17 17:17:43 +0000 | [diff] [blame] | 73 | class GlobalMerge : public FunctionPass { |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 74 | /// TLI - Keep a pointer of a TargetLowering to consult for determining |
| 75 | /// target type sizes. |
| 76 | const TargetLowering *TLI; |
| 77 | |
| 78 | bool doMerge(SmallVectorImpl<GlobalVariable*> &Globals, |
Bob Wilson | 0564609 | 2010-11-17 21:25:39 +0000 | [diff] [blame] | 79 | Module &M, bool isConst) const; |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 80 | |
| 81 | public: |
| 82 | static char ID; // Pass identification, replacement for typeid. |
Devang Patel | 827454e | 2011-10-17 17:17:43 +0000 | [diff] [blame] | 83 | explicit GlobalMerge(const TargetLowering *tli = 0) |
| 84 | : FunctionPass(ID), TLI(tli) { |
| 85 | initializeGlobalMergePass(*PassRegistry::getPassRegistry()); |
| 86 | } |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 87 | |
| 88 | virtual bool doInitialization(Module &M); |
Chris Lattner | 252b491 | 2010-09-05 21:18:45 +0000 | [diff] [blame] | 89 | virtual bool runOnFunction(Function &F); |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 90 | |
| 91 | const char *getPassName() const { |
| 92 | return "Merge internal globals"; |
| 93 | } |
| 94 | |
| 95 | virtual void getAnalysisUsage(AnalysisUsage &AU) const { |
| 96 | AU.setPreservesCFG(); |
| 97 | FunctionPass::getAnalysisUsage(AU); |
| 98 | } |
| 99 | |
| 100 | struct GlobalCmp { |
Micah Villmow | 3574eca | 2012-10-08 16:38:25 +0000 | [diff] [blame] | 101 | const DataLayout *TD; |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 102 | |
Micah Villmow | 3574eca | 2012-10-08 16:38:25 +0000 | [diff] [blame] | 103 | GlobalCmp(const DataLayout *td) : TD(td) { } |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 104 | |
Chris Lattner | 252b491 | 2010-09-05 21:18:45 +0000 | [diff] [blame] | 105 | bool operator()(const GlobalVariable *GV1, const GlobalVariable *GV2) { |
Chris Lattner | db125cf | 2011-07-18 04:54:35 +0000 | [diff] [blame] | 106 | Type *Ty1 = cast<PointerType>(GV1->getType())->getElementType(); |
| 107 | Type *Ty2 = cast<PointerType>(GV2->getType())->getElementType(); |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 108 | |
| 109 | return (TD->getTypeAllocSize(Ty1) < TD->getTypeAllocSize(Ty2)); |
| 110 | } |
| 111 | }; |
| 112 | }; |
| 113 | } // end anonymous namespace |
| 114 | |
Devang Patel | 827454e | 2011-10-17 17:17:43 +0000 | [diff] [blame] | 115 | char GlobalMerge::ID = 0; |
| 116 | INITIALIZE_PASS(GlobalMerge, "global-merge", |
| 117 | "Global Merge", false, false) |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 118 | |
Devang Patel | 827454e | 2011-10-17 17:17:43 +0000 | [diff] [blame] | 119 | |
| 120 | bool GlobalMerge::doMerge(SmallVectorImpl<GlobalVariable*> &Globals, |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 121 | Module &M, bool isConst) const { |
Micah Villmow | 3574eca | 2012-10-08 16:38:25 +0000 | [diff] [blame] | 122 | const DataLayout *TD = TLI->getDataLayout(); |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 123 | |
| 124 | // FIXME: Infer the maximum possible offset depending on the actual users |
| 125 | // (these max offsets are different for the users inside Thumb or ARM |
| 126 | // functions) |
| 127 | unsigned MaxOffset = TLI->getMaximalGlobalOffset(); |
| 128 | |
| 129 | // FIXME: Find better heuristics |
| 130 | std::stable_sort(Globals.begin(), Globals.end(), GlobalCmp(TD)); |
| 131 | |
Chris Lattner | db125cf | 2011-07-18 04:54:35 +0000 | [diff] [blame] | 132 | Type *Int32Ty = Type::getInt32Ty(M.getContext()); |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 133 | |
| 134 | for (size_t i = 0, e = Globals.size(); i != e; ) { |
| 135 | size_t j = 0; |
| 136 | uint64_t MergedSize = 0; |
Jay Foad | 5fdd6c8 | 2011-07-12 14:06:48 +0000 | [diff] [blame] | 137 | std::vector<Type*> Tys; |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 138 | std::vector<Constant*> Inits; |
Bob Wilson | 619a372 | 2010-11-17 21:25:36 +0000 | [diff] [blame] | 139 | for (j = i; j != e; ++j) { |
Jay Foad | 5fdd6c8 | 2011-07-12 14:06:48 +0000 | [diff] [blame] | 140 | Type *Ty = Globals[j]->getType()->getElementType(); |
Bob Wilson | 619a372 | 2010-11-17 21:25:36 +0000 | [diff] [blame] | 141 | MergedSize += TD->getTypeAllocSize(Ty); |
| 142 | if (MergedSize > MaxOffset) { |
| 143 | break; |
| 144 | } |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 145 | Tys.push_back(Ty); |
| 146 | Inits.push_back(Globals[j]->getInitializer()); |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 147 | } |
| 148 | |
Chris Lattner | 252b491 | 2010-09-05 21:18:45 +0000 | [diff] [blame] | 149 | StructType *MergedTy = StructType::get(M.getContext(), Tys); |
| 150 | Constant *MergedInit = ConstantStruct::get(MergedTy, Inits); |
| 151 | GlobalVariable *MergedGV = new GlobalVariable(M, MergedTy, isConst, |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 152 | GlobalValue::InternalLinkage, |
Bob Wilson | 72831dc | 2010-11-17 21:25:33 +0000 | [diff] [blame] | 153 | MergedInit, "_MergedGlobals"); |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 154 | for (size_t k = i; k < j; ++k) { |
Chris Lattner | 252b491 | 2010-09-05 21:18:45 +0000 | [diff] [blame] | 155 | Constant *Idx[2] = { |
| 156 | ConstantInt::get(Int32Ty, 0), |
| 157 | ConstantInt::get(Int32Ty, k-i) |
| 158 | }; |
Jay Foad | dab3d29 | 2011-07-21 14:31:17 +0000 | [diff] [blame] | 159 | Constant *GEP = ConstantExpr::getInBoundsGetElementPtr(MergedGV, Idx); |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 160 | Globals[k]->replaceAllUsesWith(GEP); |
| 161 | Globals[k]->eraseFromParent(); |
Devang Patel | 827454e | 2011-10-17 17:17:43 +0000 | [diff] [blame] | 162 | NumMerged++; |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 163 | } |
| 164 | i = j; |
| 165 | } |
| 166 | |
| 167 | return true; |
| 168 | } |
| 169 | |
| 170 | |
Devang Patel | 827454e | 2011-10-17 17:17:43 +0000 | [diff] [blame] | 171 | bool GlobalMerge::doInitialization(Module &M) { |
Bob Wilson | 0564609 | 2010-11-17 21:25:39 +0000 | [diff] [blame] | 172 | SmallVector<GlobalVariable*, 16> Globals, ConstGlobals, BSSGlobals; |
Micah Villmow | 3574eca | 2012-10-08 16:38:25 +0000 | [diff] [blame] | 173 | const DataLayout *TD = TLI->getDataLayout(); |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 174 | unsigned MaxOffset = TLI->getMaximalGlobalOffset(); |
| 175 | bool Changed = false; |
| 176 | |
| 177 | // Grab all non-const globals. |
| 178 | for (Module::global_iterator I = M.global_begin(), |
| 179 | E = M.global_end(); I != E; ++I) { |
| 180 | // Merge is safe for "normal" internal globals only |
| 181 | if (!I->hasLocalLinkage() || I->isThreadLocal() || I->hasSection()) |
| 182 | continue; |
| 183 | |
| 184 | // Ignore fancy-aligned globals for now. |
Eli Friedman | 3dad610 | 2011-11-30 21:54:15 +0000 | [diff] [blame] | 185 | unsigned Alignment = TD->getPreferredAlignment(I); |
Chris Lattner | db125cf | 2011-07-18 04:54:35 +0000 | [diff] [blame] | 186 | Type *Ty = I->getType()->getElementType(); |
Cameron Zwarich | f75ae4c | 2011-07-11 01:29:42 +0000 | [diff] [blame] | 187 | if (Alignment > TD->getABITypeAlignment(Ty)) |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 188 | continue; |
| 189 | |
Anton Korobeynikov | b5a0ef9 | 2010-07-26 18:45:39 +0000 | [diff] [blame] | 190 | // Ignore all 'special' globals. |
| 191 | if (I->getName().startswith("llvm.") || |
| 192 | I->getName().startswith(".llvm.")) |
| 193 | continue; |
| 194 | |
Cameron Zwarich | f75ae4c | 2011-07-11 01:29:42 +0000 | [diff] [blame] | 195 | if (TD->getTypeAllocSize(Ty) < MaxOffset) { |
Ahmed Charles | b83a67e | 2012-02-13 06:30:56 +0000 | [diff] [blame] | 196 | if (TargetLoweringObjectFile::getKindForGlobal(I, TLI->getTargetMachine()) |
| 197 | .isBSSLocal()) |
Bob Wilson | 0564609 | 2010-11-17 21:25:39 +0000 | [diff] [blame] | 198 | BSSGlobals.push_back(I); |
| 199 | else if (I->isConstant()) |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 200 | ConstGlobals.push_back(I); |
| 201 | else |
| 202 | Globals.push_back(I); |
| 203 | } |
| 204 | } |
| 205 | |
| 206 | if (Globals.size() > 1) |
| 207 | Changed |= doMerge(Globals, M, false); |
Bob Wilson | 0564609 | 2010-11-17 21:25:39 +0000 | [diff] [blame] | 208 | if (BSSGlobals.size() > 1) |
| 209 | Changed |= doMerge(BSSGlobals, M, false); |
| 210 | |
Nadav Rotem | a94d6e8 | 2012-07-24 10:51:42 +0000 | [diff] [blame] | 211 | // FIXME: This currently breaks the EH processing due to way how the |
| 212 | // typeinfo detection works. We might want to detect the TIs and ignore |
Anton Korobeynikov | b5a0ef9 | 2010-07-26 18:45:39 +0000 | [diff] [blame] | 213 | // them in the future. |
Anton Korobeynikov | b5a0ef9 | 2010-07-26 18:45:39 +0000 | [diff] [blame] | 214 | // if (ConstGlobals.size() > 1) |
| 215 | // Changed |= doMerge(ConstGlobals, M, true); |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 216 | |
| 217 | return Changed; |
| 218 | } |
| 219 | |
Devang Patel | 827454e | 2011-10-17 17:17:43 +0000 | [diff] [blame] | 220 | bool GlobalMerge::runOnFunction(Function &F) { |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 221 | return false; |
| 222 | } |
| 223 | |
Devang Patel | 827454e | 2011-10-17 17:17:43 +0000 | [diff] [blame] | 224 | Pass *llvm::createGlobalMergePass(const TargetLowering *tli) { |
| 225 | return new GlobalMerge(tli); |
Anton Korobeynikov | cec36f4 | 2010-07-24 21:52:08 +0000 | [diff] [blame] | 226 | } |