Tom Stellard | 5cbb53c | 2014-11-03 19:49:05 +0000 | [diff] [blame] | 1 | //===-- AMDGPUAlwaysInlinePass.cpp - Always Inline Pass -------------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | /// \file |
| 11 | /// This pass marks all internal functions as always_inline and creates |
| 12 | /// duplicates of all other functions and marks the duplicates as always_inline. |
| 13 | // |
| 14 | //===----------------------------------------------------------------------===// |
| 15 | |
| 16 | #include "AMDGPU.h" |
| 17 | #include "llvm/IR/Module.h" |
| 18 | #include "llvm/Transforms/Utils/Cloning.h" |
| 19 | |
| 20 | using namespace llvm; |
| 21 | |
| 22 | namespace { |
| 23 | |
| 24 | class AMDGPUAlwaysInline : public ModulePass { |
Tom Stellard | 5cbb53c | 2014-11-03 19:49:05 +0000 | [diff] [blame] | 25 | static char ID; |
| 26 | |
| 27 | public: |
| 28 | AMDGPUAlwaysInline() : ModulePass(ID) { } |
| 29 | bool runOnModule(Module &M) override; |
| 30 | const char *getPassName() const override { return "AMDGPU Always Inline Pass"; } |
| 31 | }; |
| 32 | |
| 33 | } // End anonymous namespace |
| 34 | |
| 35 | char AMDGPUAlwaysInline::ID = 0; |
| 36 | |
| 37 | bool AMDGPUAlwaysInline::runOnModule(Module &M) { |
Matt Arsenault | ca95d44 | 2015-07-13 19:08:36 +0000 | [diff] [blame^] | 38 | std::vector<Function *> FuncsToClone; |
Tom Stellard | 5cbb53c | 2014-11-03 19:49:05 +0000 | [diff] [blame] | 39 | |
Matt Arsenault | ca95d44 | 2015-07-13 19:08:36 +0000 | [diff] [blame^] | 40 | for (Function &F : M) { |
Matt Arsenault | deaef8e | 2015-04-22 17:10:44 +0000 | [diff] [blame] | 41 | if (!F.hasLocalLinkage() && !F.isDeclaration() && !F.use_empty() && |
| 42 | !F.hasFnAttribute(Attribute::NoInline)) |
Tom Stellard | 5cbb53c | 2014-11-03 19:49:05 +0000 | [diff] [blame] | 43 | FuncsToClone.push_back(&F); |
| 44 | } |
| 45 | |
| 46 | for (Function *F : FuncsToClone) { |
| 47 | ValueToValueMapTy VMap; |
| 48 | Function *NewFunc = CloneFunction(F, VMap, false); |
| 49 | NewFunc->setLinkage(GlobalValue::InternalLinkage); |
Matt Arsenault | ca95d44 | 2015-07-13 19:08:36 +0000 | [diff] [blame^] | 50 | M.getFunctionList().push_back(NewFunc); |
Tom Stellard | 5cbb53c | 2014-11-03 19:49:05 +0000 | [diff] [blame] | 51 | F->replaceAllUsesWith(NewFunc); |
| 52 | } |
| 53 | |
Matt Arsenault | ca95d44 | 2015-07-13 19:08:36 +0000 | [diff] [blame^] | 54 | for (Function &F : M) { |
Matt Arsenault | deaef8e | 2015-04-22 17:10:44 +0000 | [diff] [blame] | 55 | if (F.hasLocalLinkage() && !F.hasFnAttribute(Attribute::NoInline)) { |
Tom Stellard | 5cbb53c | 2014-11-03 19:49:05 +0000 | [diff] [blame] | 56 | F.addFnAttr(Attribute::AlwaysInline); |
| 57 | } |
| 58 | } |
| 59 | return false; |
| 60 | } |
| 61 | |
| 62 | ModulePass *llvm::createAMDGPUAlwaysInlinePass() { |
| 63 | return new AMDGPUAlwaysInline(); |
| 64 | } |