AMDGPUAlwaysInlinePass.cpp revision 284677
//===-- AMDGPUAlwaysInlinePass.cpp - Always Inline Pass -------------------===//
2284677Sdim//
3284677Sdim//                     The LLVM Compiler Infrastructure
4284677Sdim//
5284677Sdim// This file is distributed under the University of Illinois Open Source
6284677Sdim// License. See LICENSE.TXT for details.
7284677Sdim//
8284677Sdim//===----------------------------------------------------------------------===//
9284677Sdim//
10284677Sdim/// \file
/// This pass marks all internal functions as always_inline and creates
/// duplicates of all other functions and marks the duplicates as always_inline.
13284677Sdim//
14284677Sdim//===----------------------------------------------------------------------===//
15284677Sdim
16284677Sdim#include "AMDGPU.h"
17284677Sdim#include "llvm/IR/Module.h"
18284677Sdim#include "llvm/Transforms/Utils/Cloning.h"
19284677Sdim
20284677Sdimusing namespace llvm;
21284677Sdim
22284677Sdimnamespace {
23284677Sdim
24284677Sdimclass AMDGPUAlwaysInline : public ModulePass {
25284677Sdim
26284677Sdim  static char ID;
27284677Sdim
28284677Sdimpublic:
29284677Sdim  AMDGPUAlwaysInline() : ModulePass(ID) { }
30284677Sdim  bool runOnModule(Module &M) override;
31284677Sdim  const char *getPassName() const override { return "AMDGPU Always Inline Pass"; }
32284677Sdim};
33284677Sdim
34284677Sdim} // End anonymous namespace
35284677Sdim
36284677Sdimchar AMDGPUAlwaysInline::ID = 0;
37284677Sdim
38284677Sdimbool AMDGPUAlwaysInline::runOnModule(Module &M) {
39284677Sdim
40284677Sdim  std::vector<Function*> FuncsToClone;
41284677Sdim  for (Module::iterator I = M.begin(), E = M.end(); I != E; ++I) {
42284677Sdim    Function &F = *I;
43284677Sdim    if (!F.hasLocalLinkage() && !F.isDeclaration() && !F.use_empty() &&
44284677Sdim        !F.hasFnAttribute(Attribute::NoInline))
45284677Sdim      FuncsToClone.push_back(&F);
46284677Sdim  }
47284677Sdim
48284677Sdim  for (Function *F : FuncsToClone) {
49284677Sdim    ValueToValueMapTy VMap;
50284677Sdim    Function *NewFunc = CloneFunction(F, VMap, false);
51284677Sdim    NewFunc->setLinkage(GlobalValue::InternalLinkage);
52284677Sdim    F->getParent()->getFunctionList().push_back(NewFunc);
53284677Sdim    F->replaceAllUsesWith(NewFunc);
54284677Sdim  }
55284677Sdim
56284677Sdim  for (Module::iterator I = M.begin(), E = M.end(); I != E; ++I) {
57284677Sdim    Function &F = *I;
58284677Sdim    if (F.hasLocalLinkage() && !F.hasFnAttribute(Attribute::NoInline)) {
59284677Sdim      F.addFnAttr(Attribute::AlwaysInline);
60284677Sdim    }
61284677Sdim  }
62284677Sdim  return false;
63284677Sdim}
64284677Sdim
65284677SdimModulePass *llvm::createAMDGPUAlwaysInlinePass() {
66284677Sdim  return new AMDGPUAlwaysInline();
67284677Sdim}
68