AMDGPUAlwaysInlinePass.cpp revision 284677
1284677Sdim//===-- AMDGPUAlwaysInlinePass.cpp - Promote Allocas ----------------------===// 2284677Sdim// 3284677Sdim// The LLVM Compiler Infrastructure 4284677Sdim// 5284677Sdim// This file is distributed under the University of Illinois Open Source 6284677Sdim// License. See LICENSE.TXT for details. 7284677Sdim// 8284677Sdim//===----------------------------------------------------------------------===// 9284677Sdim// 10284677Sdim/// \file 11284677Sdim/// This pass marks all internal functions as always_inline and creates 12284677Sdim/// duplicates of all other functions a marks the duplicates as always_inline. 13284677Sdim// 14284677Sdim//===----------------------------------------------------------------------===// 15284677Sdim 16284677Sdim#include "AMDGPU.h" 17284677Sdim#include "llvm/IR/Module.h" 18284677Sdim#include "llvm/Transforms/Utils/Cloning.h" 19284677Sdim 20284677Sdimusing namespace llvm; 21284677Sdim 22284677Sdimnamespace { 23284677Sdim 24284677Sdimclass AMDGPUAlwaysInline : public ModulePass { 25284677Sdim 26284677Sdim static char ID; 27284677Sdim 28284677Sdimpublic: 29284677Sdim AMDGPUAlwaysInline() : ModulePass(ID) { } 30284677Sdim bool runOnModule(Module &M) override; 31284677Sdim const char *getPassName() const override { return "AMDGPU Always Inline Pass"; } 32284677Sdim}; 33284677Sdim 34284677Sdim} // End anonymous namespace 35284677Sdim 36284677Sdimchar AMDGPUAlwaysInline::ID = 0; 37284677Sdim 38284677Sdimbool AMDGPUAlwaysInline::runOnModule(Module &M) { 39284677Sdim 40284677Sdim std::vector<Function*> FuncsToClone; 41284677Sdim for (Module::iterator I = M.begin(), E = M.end(); I != E; ++I) { 42284677Sdim Function &F = *I; 43284677Sdim if (!F.hasLocalLinkage() && !F.isDeclaration() && !F.use_empty() && 44284677Sdim !F.hasFnAttribute(Attribute::NoInline)) 45284677Sdim FuncsToClone.push_back(&F); 46284677Sdim } 47284677Sdim 48284677Sdim for (Function *F : FuncsToClone) { 49284677Sdim ValueToValueMapTy VMap; 50284677Sdim Function *NewFunc = CloneFunction(F, VMap, false); 51284677Sdim NewFunc->setLinkage(GlobalValue::InternalLinkage); 52284677Sdim F->getParent()->getFunctionList().push_back(NewFunc); 53284677Sdim F->replaceAllUsesWith(NewFunc); 54284677Sdim } 55284677Sdim 56284677Sdim for (Module::iterator I = M.begin(), E = M.end(); I != E; ++I) { 57284677Sdim Function &F = *I; 58284677Sdim if (F.hasLocalLinkage() && !F.hasFnAttribute(Attribute::NoInline)) { 59284677Sdim F.addFnAttr(Attribute::AlwaysInline); 60284677Sdim } 61284677Sdim } 62284677Sdim return false; 63284677Sdim} 64284677Sdim 65284677SdimModulePass *llvm::createAMDGPUAlwaysInlinePass() { 66284677Sdim return new AMDGPUAlwaysInline(); 67284677Sdim} 68