1 //===-- AMDGPUAlwaysInlinePass.cpp - Inline All Functions -----------------===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
11 /// This pass marks all internal functions as always_inline and creates
12 /// duplicates of all other functions and marks the duplicates as always_inline.
14 //===----------------------------------------------------------------------===//
17 #include "llvm/IR/Module.h"
18 #include "llvm/Transforms/Utils/Cloning.h"
/// Module-level pass whose work is done in runOnModule(), defined out of line
/// later in this file. Per the file header, it marks internal functions as
/// always_inline and substitutes internal, always_inline duplicates for the
/// remaining functions.
24 class AMDGPUAlwaysInline : public ModulePass {
/// Constructs the pass, handing the pass ID to the ModulePass base.
/// \param GlobalOpt Stored in the GlobalOpt member. NOTE(review): the member's
/// consumer is not visible next to this declaration -- presumably it controls
/// whether replaced aliases are erased; confirm in runOnModule().
30 AMDGPUAlwaysInline(bool GlobalOpt = false) :
31 ModulePass(ID), GlobalOpt(GlobalOpt) { }
/// Entry point invoked with the module to transform.
32 bool runOnModule(Module &M) override;
/// Returns the fixed display name of this pass.
33 StringRef getPassName() const override { return "AMDGPU Always Inline Pass"; }
36 } // End anonymous namespace
// Registers the pass under the argument string "amdgpu-always-inline" with the
// description "AMDGPU Inline All Functions".
// NOTE(review): the two trailing `false` arguments are presumably the macro's
// CFG-only and is-analysis flags -- confirm against LLVM's PassSupport.h.
38 INITIALIZE_PASS(AMDGPUAlwaysInline, "amdgpu-always-inline",
39 "AMDGPU Inline All Functions", false, false)
// Out-of-class definition of the pass's static ID member, which the
// constructor passes to the ModulePass base.
41 char AMDGPUAlwaysInline::ID = 0;
/// Rewrites \p M so that eligible functions end up internal and always_inline.
///
/// The work happens in three stages:
///  1. Uses of every alias whose aliasee is itself a Function are redirected
///     to that function, and the alias is queued in AliasesToRemove.
///  2. Every non-local, defined, used function that is not marked noinline is
///     cloned; the clone gets internal linkage and takes over all uses of the
///     original.
///  3. Every function with local linkage that is not marked noinline receives
///     the always_inline attribute.
///
/// Functions carrying the noinline attribute are neither cloned nor marked.
43 bool AMDGPUAlwaysInline::runOnModule(Module &M) {
// Worklists filled while scanning the module and consumed by later loops.
44 std::vector<GlobalAlias*> AliasesToRemove;
45 std::vector<Function *> FuncsToClone;
// Stage 1: redirect users of function aliases to the aliased function.
47 for (GlobalAlias &A : M.aliases()) {
// dyn_cast yields null unless the aliasee is a Function object itself, so
// aliases of anything else are skipped.
48 if (Function* F = dyn_cast<Function>(A.getAliasee())) {
49 A.replaceAllUsesWith(F);
50 AliasesToRemove.push_back(&A);
// Walk the aliases queued above.
// NOTE(review): presumably each one is erased from the module here, possibly
// only when GlobalOpt is set -- confirm against the loop body.
55 for (GlobalAlias* A : AliasesToRemove) {
// Stage 2a: pick the functions to duplicate. A candidate must be visible
// outside the module (non-local linkage), have a body, have at least one
// use, and not be marked noinline.
60 for (Function &F : M) {
61 if (!F.hasLocalLinkage() && !F.isDeclaration() && !F.use_empty() &&
62 !F.hasFnAttribute(Attribute::NoInline))
63 FuncsToClone.push_back(&F);
// Stage 2b: clone each candidate from the saved list rather than inside the
// scan above -- presumably so the module's function list is not changed while
// it is being iterated.
66 for (Function *F : FuncsToClone) {
67 ValueToValueMapTy VMap;
68 Function *NewFunc = CloneFunction(F, VMap);
// The clone becomes module-private and replaces the original at every use;
// the original's own linkage is not modified here.
69 NewFunc->setLinkage(GlobalValue::InternalLinkage);
70 F->replaceAllUsesWith(NewFunc);
// Stage 3: tag every local-linkage function that is not noinline. Per the
// file header this is meant to include the internal duplicates made above.
73 for (Function &F : M) {
74 if (F.hasLocalLinkage() && !F.hasFnAttribute(Attribute::NoInline)) {
75 F.addFnAttr(Attribute::AlwaysInline);
/// Factory for the pass: allocates a new AMDGPUAlwaysInline with `new`,
/// forwarding \p GlobalOpt to its constructor, and returns it as a ModulePass
/// pointer.
/// NOTE(review): the returned raw pointer is presumably handed to a pass
/// manager that takes ownership -- confirm at the call sites.
81 ModulePass *llvm::createAMDGPUAlwaysInlinePass(bool GlobalOpt) {
82 return new AMDGPUAlwaysInline(GlobalOpt);