65 lines
		
	
	
		
			1.8 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			65 lines
		
	
	
		
			1.8 KiB
		
	
	
	
		
			C++
		
	
	
	
//===-- AMDGPUAlwaysInlinePass.cpp - Promote Allocas ----------------------===//
 | 
						|
//
 | 
						|
//                     The LLVM Compiler Infrastructure
 | 
						|
//
 | 
						|
// This file is distributed under the University of Illinois Open Source
 | 
						|
// License. See LICENSE.TXT for details.
 | 
						|
//
 | 
						|
//===----------------------------------------------------------------------===//
 | 
						|
//
 | 
						|
/// \file
 | 
						|
/// This pass marks all internal functions as always_inline and creates
 | 
						|
/// duplicates of all other functions a marks the duplicates as always_inline.
 | 
						|
//
 | 
						|
//===----------------------------------------------------------------------===//
 | 
						|
 | 
						|
#include "AMDGPU.h"
 | 
						|
#include "llvm/IR/Module.h"
 | 
						|
#include "llvm/Transforms/Utils/Cloning.h"
 | 
						|
 | 
						|
using namespace llvm;
 | 
						|
 | 
						|
namespace {
 | 
						|
 | 
						|
class AMDGPUAlwaysInline : public ModulePass {
 | 
						|
  static char ID;
 | 
						|
 | 
						|
public:
 | 
						|
  AMDGPUAlwaysInline() : ModulePass(ID) { }
 | 
						|
  bool runOnModule(Module &M) override;
 | 
						|
  const char *getPassName() const override { return "AMDGPU Always Inline Pass"; }
 | 
						|
};
 | 
						|
 | 
						|
} // End anonymous namespace
 | 
						|
 | 
						|
char AMDGPUAlwaysInline::ID = 0;
 | 
						|
 | 
						|
bool AMDGPUAlwaysInline::runOnModule(Module &M) {
 | 
						|
  std::vector<Function *> FuncsToClone;
 | 
						|
 | 
						|
  for (Function &F : M) {
 | 
						|
    if (!F.hasLocalLinkage() && !F.isDeclaration() && !F.use_empty() &&
 | 
						|
        !F.hasFnAttribute(Attribute::NoInline))
 | 
						|
      FuncsToClone.push_back(&F);
 | 
						|
  }
 | 
						|
 | 
						|
  for (Function *F : FuncsToClone) {
 | 
						|
    ValueToValueMapTy VMap;
 | 
						|
    Function *NewFunc = CloneFunction(F, VMap, false);
 | 
						|
    NewFunc->setLinkage(GlobalValue::InternalLinkage);
 | 
						|
    M.getFunctionList().push_back(NewFunc);
 | 
						|
    F->replaceAllUsesWith(NewFunc);
 | 
						|
  }
 | 
						|
 | 
						|
  for (Function &F : M) {
 | 
						|
    if (F.hasLocalLinkage() && !F.hasFnAttribute(Attribute::NoInline)) {
 | 
						|
      F.addFnAttr(Attribute::AlwaysInline);
 | 
						|
    }
 | 
						|
  }
 | 
						|
  return false;
 | 
						|
}
 | 
						|
 | 
						|
ModulePass *llvm::createAMDGPUAlwaysInlinePass() {
 | 
						|
  return new AMDGPUAlwaysInline();
 | 
						|
}
 |