64ac736ec5
Former-commit-id: f3cc9b82f3e5bd8f0fd3ebc098f789556b44e9cd
94 lines
2.5 KiB
C++
94 lines
2.5 KiB
C++
//===-- AMDGPUAlwaysInlinePass.cpp - Inline Functions ---------------------===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
/// \file
|
|
/// This pass marks all internal functions as always_inline and creates
|
|
/// duplicates of all other functions and marks the duplicates as always_inline.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "AMDGPU.h"
|
|
#include "llvm/IR/Module.h"
|
|
#include "llvm/Transforms/Utils/Cloning.h"
|
|
|
|
using namespace llvm;
|
|
|
|
namespace {
|
|
|
|
/// Hidden command-line switch, off by default. When enabled, runOnModule
/// applies Attribute::NoInline instead of Attribute::AlwaysInline.
static cl::opt<bool> StressCalls("amdgpu-stress-function-calls",
                                 cl::desc("Force all functions to be noinline"),
                                 cl::init(false), cl::Hidden);
|
|
|
|
class AMDGPUAlwaysInline : public ModulePass {
|
|
bool GlobalOpt;
|
|
|
|
public:
|
|
static char ID;
|
|
|
|
AMDGPUAlwaysInline(bool GlobalOpt = false) :
|
|
ModulePass(ID), GlobalOpt(GlobalOpt) { }
|
|
bool runOnModule(Module &M) override;
|
|
StringRef getPassName() const override { return "AMDGPU Always Inline Pass"; }
|
|
};
|
|
|
|
} // End anonymous namespace
|
|
|
|
INITIALIZE_PASS(AMDGPUAlwaysInline, "amdgpu-always-inline",
|
|
"AMDGPU Inline All Functions", false, false)
|
|
|
|
char AMDGPUAlwaysInline::ID = 0;
|
|
|
|
/// Rewrite \p M so that every function with local linkage carries the
/// selected inlining attribute.
///
/// The work is done in four steps:
///  1. Uses of every alias whose aliasee is a function are redirected to the
///     function itself; with GlobalOpt set, those aliases are then erased.
///  2. Non-local definitions that still have uses and do not carry the
///     incompatible attribute are collected.
///  3. Each collected function is cloned, the clone is given internal linkage
///     and all uses of the original are redirected to the clone.
///  4. Every local-linkage function without the incompatible attribute gets
///     the new attribute (AlwaysInline, or NoInline when StressCalls is set).
///
/// \returns true if the module was modified, false otherwise.
bool AMDGPUAlwaysInline::runOnModule(Module &M) {
  std::vector<GlobalAlias *> AliasesToRemove;
  std::vector<Function *> FuncsToClone;
  bool Changed = false;

  // Erasure is deferred: removing an alias while walking M.aliases() would
  // invalidate the iteration.
  for (GlobalAlias &A : M.aliases()) {
    if (Function *F = dyn_cast<Function>(A.getAliasee())) {
      // Redirecting uses only changes the module if there are uses.
      Changed |= !A.use_empty();
      A.replaceAllUsesWith(F);
      AliasesToRemove.push_back(&A);
    }
  }

  if (GlobalOpt) {
    for (GlobalAlias *A : AliasesToRemove) {
      A->eraseFromParent();
      Changed = true;
    }
  }

  // StressCalls flips the pass from "inline everything" to "inline nothing".
  auto NewAttr = StressCalls ? Attribute::NoInline : Attribute::AlwaysInline;
  auto IncompatAttr
    = StressCalls ? Attribute::AlwaysInline : Attribute::NoInline;

  // Collect first, clone afterwards: cloning adds functions to the module
  // being iterated.
  for (Function &F : M) {
    if (!F.hasLocalLinkage() && !F.isDeclaration() && !F.use_empty() &&
        !F.hasFnAttribute(IncompatAttr))
      FuncsToClone.push_back(&F);
  }

  for (Function *F : FuncsToClone) {
    ValueToValueMapTy VMap;
    Function *NewFunc = CloneFunction(F, VMap);
    NewFunc->setLinkage(GlobalValue::InternalLinkage);
    F->replaceAllUsesWith(NewFunc);
    Changed = true;
  }

  for (Function &F : M) {
    if (F.hasLocalLinkage() && !F.hasFnAttribute(IncompatAttr) &&
        !F.hasFnAttribute(NewAttr)) {
      F.addFnAttr(NewAttr);
      Changed = true;
    }
  }

  // Report modifications so the pass manager does not keep stale analyses.
  return Changed;
}
|
|
|
|
/// Factory for the always-inline pass.
///
/// \param GlobalOpt forwarded unchanged to the AMDGPUAlwaysInline constructor.
/// \returns a newly allocated AMDGPUAlwaysInline instance.
ModulePass *llvm::createAMDGPUAlwaysInlinePass(bool GlobalOpt) {
  ModulePass *Pass = new AMDGPUAlwaysInline(GlobalOpt);
  return Pass;
}
|