272 lines
		
	
	
		
			9.3 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			272 lines
		
	
	
		
			9.3 KiB
		
	
	
	
		
			C++
		
	
	
	
| //===-- ModuleUtils.cpp - Functions to manipulate Modules -----------------===//
 | |
| //
 | |
| //                     The LLVM Compiler Infrastructure
 | |
| //
 | |
| // This file is distributed under the University of Illinois Open Source
 | |
| // License. See LICENSE.TXT for details.
 | |
| //
 | |
| //===----------------------------------------------------------------------===//
 | |
| //
 | |
| // This family of functions perform manipulations on Modules.
 | |
| //
 | |
| //===----------------------------------------------------------------------===//
 | |
| 
 | |
| #include "llvm/Transforms/Utils/ModuleUtils.h"
 | |
| #include "llvm/IR/DerivedTypes.h"
 | |
| #include "llvm/IR/Function.h"
 | |
| #include "llvm/IR/IRBuilder.h"
 | |
| #include "llvm/IR/Module.h"
 | |
| #include "llvm/Support/raw_ostream.h"
 | |
| 
 | |
| using namespace llvm;
 | |
| 
 | |
| static void appendToGlobalArray(const char *Array, Module &M, Function *F,
 | |
|                                 int Priority, Constant *Data) {
 | |
|   IRBuilder<> IRB(M.getContext());
 | |
|   FunctionType *FnTy = FunctionType::get(IRB.getVoidTy(), false);
 | |
| 
 | |
|   // Get the current set of static global constructors and add the new ctor
 | |
|   // to the list.
 | |
|   SmallVector<Constant *, 16> CurrentCtors;
 | |
|   StructType *EltTy;
 | |
|   if (GlobalVariable *GVCtor = M.getNamedGlobal(Array)) {
 | |
|     ArrayType *ATy = cast<ArrayType>(GVCtor->getValueType());
 | |
|     StructType *OldEltTy = cast<StructType>(ATy->getElementType());
 | |
|     // Upgrade a 2-field global array type to the new 3-field format if needed.
 | |
|     if (Data && OldEltTy->getNumElements() < 3)
 | |
|       EltTy = StructType::get(IRB.getInt32Ty(), PointerType::getUnqual(FnTy),
 | |
|                               IRB.getInt8PtrTy());
 | |
|     else
 | |
|       EltTy = OldEltTy;
 | |
|     if (Constant *Init = GVCtor->getInitializer()) {
 | |
|       unsigned n = Init->getNumOperands();
 | |
|       CurrentCtors.reserve(n + 1);
 | |
|       for (unsigned i = 0; i != n; ++i) {
 | |
|         auto Ctor = cast<Constant>(Init->getOperand(i));
 | |
|         if (EltTy != OldEltTy)
 | |
|           Ctor =
 | |
|               ConstantStruct::get(EltTy, Ctor->getAggregateElement((unsigned)0),
 | |
|                                   Ctor->getAggregateElement(1),
 | |
|                                   Constant::getNullValue(IRB.getInt8PtrTy()));
 | |
|         CurrentCtors.push_back(Ctor);
 | |
|       }
 | |
|     }
 | |
|     GVCtor->eraseFromParent();
 | |
|   } else {
 | |
|     // Use the new three-field struct if there isn't one already.
 | |
|     EltTy = StructType::get(IRB.getInt32Ty(), PointerType::getUnqual(FnTy),
 | |
|                             IRB.getInt8PtrTy());
 | |
|   }
 | |
| 
 | |
|   // Build a 2 or 3 field global_ctor entry.  We don't take a comdat key.
 | |
|   Constant *CSVals[3];
 | |
|   CSVals[0] = IRB.getInt32(Priority);
 | |
|   CSVals[1] = F;
 | |
|   // FIXME: Drop support for the two element form in LLVM 4.0.
 | |
|   if (EltTy->getNumElements() >= 3)
 | |
|     CSVals[2] = Data ? ConstantExpr::getPointerCast(Data, IRB.getInt8PtrTy())
 | |
|                      : Constant::getNullValue(IRB.getInt8PtrTy());
 | |
|   Constant *RuntimeCtorInit =
 | |
|       ConstantStruct::get(EltTy, makeArrayRef(CSVals, EltTy->getNumElements()));
 | |
| 
 | |
|   CurrentCtors.push_back(RuntimeCtorInit);
 | |
| 
 | |
|   // Create a new initializer.
 | |
|   ArrayType *AT = ArrayType::get(EltTy, CurrentCtors.size());
 | |
|   Constant *NewInit = ConstantArray::get(AT, CurrentCtors);
 | |
| 
 | |
|   // Create the new global variable and replace all uses of
 | |
|   // the old global variable with the new one.
 | |
|   (void)new GlobalVariable(M, NewInit->getType(), false,
 | |
|                            GlobalValue::AppendingLinkage, NewInit, Array);
 | |
| }
 | |
| 
 | |
| void llvm::appendToGlobalCtors(Module &M, Function *F, int Priority, Constant *Data) {
 | |
|   appendToGlobalArray("llvm.global_ctors", M, F, Priority, Data);
 | |
| }
 | |
| 
 | |
| void llvm::appendToGlobalDtors(Module &M, Function *F, int Priority, Constant *Data) {
 | |
|   appendToGlobalArray("llvm.global_dtors", M, F, Priority, Data);
 | |
| }
 | |
| 
 | |
| static void appendToUsedList(Module &M, StringRef Name, ArrayRef<GlobalValue *> Values) {
 | |
|   GlobalVariable *GV = M.getGlobalVariable(Name);
 | |
|   SmallPtrSet<Constant *, 16> InitAsSet;
 | |
|   SmallVector<Constant *, 16> Init;
 | |
|   if (GV) {
 | |
|     ConstantArray *CA = dyn_cast<ConstantArray>(GV->getInitializer());
 | |
|     for (auto &Op : CA->operands()) {
 | |
|       Constant *C = cast_or_null<Constant>(Op);
 | |
|       if (InitAsSet.insert(C).second)
 | |
|         Init.push_back(C);
 | |
|     }
 | |
|     GV->eraseFromParent();
 | |
|   }
 | |
| 
 | |
|   Type *Int8PtrTy = llvm::Type::getInt8PtrTy(M.getContext());
 | |
|   for (auto *V : Values) {
 | |
|     Constant *C = ConstantExpr::getBitCast(V, Int8PtrTy);
 | |
|     if (InitAsSet.insert(C).second)
 | |
|       Init.push_back(C);
 | |
|   }
 | |
| 
 | |
|   if (Init.empty())
 | |
|     return;
 | |
| 
 | |
|   ArrayType *ATy = ArrayType::get(Int8PtrTy, Init.size());
 | |
|   GV = new llvm::GlobalVariable(M, ATy, false, GlobalValue::AppendingLinkage,
 | |
|                                 ConstantArray::get(ATy, Init), Name);
 | |
|   GV->setSection("llvm.metadata");
 | |
| }
 | |
| 
 | |
| void llvm::appendToUsed(Module &M, ArrayRef<GlobalValue *> Values) {
 | |
|   appendToUsedList(M, "llvm.used", Values);
 | |
| }
 | |
| 
 | |
| void llvm::appendToCompilerUsed(Module &M, ArrayRef<GlobalValue *> Values) {
 | |
|   appendToUsedList(M, "llvm.compiler.used", Values);
 | |
| }
 | |
| 
 | |
| Function *llvm::checkSanitizerInterfaceFunction(Constant *FuncOrBitcast) {
 | |
|   if (isa<Function>(FuncOrBitcast))
 | |
|     return cast<Function>(FuncOrBitcast);
 | |
|   FuncOrBitcast->print(errs());
 | |
|   errs() << '\n';
 | |
|   std::string Err;
 | |
|   raw_string_ostream Stream(Err);
 | |
|   Stream << "Sanitizer interface function redefined: " << *FuncOrBitcast;
 | |
|   report_fatal_error(Err);
 | |
| }
 | |
| 
 | |
| Function *llvm::declareSanitizerInitFunction(Module &M, StringRef InitName,
 | |
|                                              ArrayRef<Type *> InitArgTypes) {
 | |
|   assert(!InitName.empty() && "Expected init function name");
 | |
|   Function *F = checkSanitizerInterfaceFunction(M.getOrInsertFunction(
 | |
|       InitName,
 | |
|       FunctionType::get(Type::getVoidTy(M.getContext()), InitArgTypes, false),
 | |
|       AttributeList()));
 | |
|   F->setLinkage(Function::ExternalLinkage);
 | |
|   return F;
 | |
| }
 | |
| 
 | |
| std::pair<Function *, Function *> llvm::createSanitizerCtorAndInitFunctions(
 | |
|     Module &M, StringRef CtorName, StringRef InitName,
 | |
|     ArrayRef<Type *> InitArgTypes, ArrayRef<Value *> InitArgs,
 | |
|     StringRef VersionCheckName) {
 | |
|   assert(!InitName.empty() && "Expected init function name");
 | |
|   assert(InitArgs.size() == InitArgTypes.size() &&
 | |
|          "Sanitizer's init function expects different number of arguments");
 | |
|   Function *InitFunction =
 | |
|       declareSanitizerInitFunction(M, InitName, InitArgTypes);
 | |
|   Function *Ctor = Function::Create(
 | |
|       FunctionType::get(Type::getVoidTy(M.getContext()), false),
 | |
|       GlobalValue::InternalLinkage, CtorName, &M);
 | |
|   BasicBlock *CtorBB = BasicBlock::Create(M.getContext(), "", Ctor);
 | |
|   IRBuilder<> IRB(ReturnInst::Create(M.getContext(), CtorBB));
 | |
|   IRB.CreateCall(InitFunction, InitArgs);
 | |
|   if (!VersionCheckName.empty()) {
 | |
|     Function *VersionCheckFunction =
 | |
|         checkSanitizerInterfaceFunction(M.getOrInsertFunction(
 | |
|             VersionCheckName, FunctionType::get(IRB.getVoidTy(), {}, false),
 | |
|             AttributeList()));
 | |
|     IRB.CreateCall(VersionCheckFunction, {});
 | |
|   }
 | |
|   return std::make_pair(Ctor, InitFunction);
 | |
| }
 | |
| 
 | |
| void llvm::filterDeadComdatFunctions(
 | |
|     Module &M, SmallVectorImpl<Function *> &DeadComdatFunctions) {
 | |
|   // Build a map from the comdat to the number of entries in that comdat we
 | |
|   // think are dead. If this fully covers the comdat group, then the entire
 | |
|   // group is dead. If we find another entry in the comdat group though, we'll
 | |
|   // have to preserve the whole group.
 | |
|   SmallDenseMap<Comdat *, int, 16> ComdatEntriesCovered;
 | |
|   for (Function *F : DeadComdatFunctions) {
 | |
|     Comdat *C = F->getComdat();
 | |
|     assert(C && "Expected all input GVs to be in a comdat!");
 | |
|     ComdatEntriesCovered[C] += 1;
 | |
|   }
 | |
| 
 | |
|   auto CheckComdat = [&](Comdat &C) {
 | |
|     auto CI = ComdatEntriesCovered.find(&C);
 | |
|     if (CI == ComdatEntriesCovered.end())
 | |
|       return;
 | |
| 
 | |
|     // If this could have been covered by a dead entry, just subtract one to
 | |
|     // account for it.
 | |
|     if (CI->second > 0) {
 | |
|       CI->second -= 1;
 | |
|       return;
 | |
|     }
 | |
| 
 | |
|     // If we've already accounted for all the entries that were dead, the
 | |
|     // entire comdat is alive so remove it from the map.
 | |
|     ComdatEntriesCovered.erase(CI);
 | |
|   };
 | |
| 
 | |
|   auto CheckAllComdats = [&] {
 | |
|     for (Function &F : M.functions())
 | |
|       if (Comdat *C = F.getComdat()) {
 | |
|         CheckComdat(*C);
 | |
|         if (ComdatEntriesCovered.empty())
 | |
|           return;
 | |
|       }
 | |
|     for (GlobalVariable &GV : M.globals())
 | |
|       if (Comdat *C = GV.getComdat()) {
 | |
|         CheckComdat(*C);
 | |
|         if (ComdatEntriesCovered.empty())
 | |
|           return;
 | |
|       }
 | |
|     for (GlobalAlias &GA : M.aliases())
 | |
|       if (Comdat *C = GA.getComdat()) {
 | |
|         CheckComdat(*C);
 | |
|         if (ComdatEntriesCovered.empty())
 | |
|           return;
 | |
|       }
 | |
|   };
 | |
|   CheckAllComdats();
 | |
| 
 | |
|   if (ComdatEntriesCovered.empty()) {
 | |
|     DeadComdatFunctions.clear();
 | |
|     return;
 | |
|   }
 | |
| 
 | |
|   // Remove the entries that were not covering.
 | |
|   erase_if(DeadComdatFunctions, [&](GlobalValue *GV) {
 | |
|     return ComdatEntriesCovered.find(GV->getComdat()) ==
 | |
|            ComdatEntriesCovered.end();
 | |
|   });
 | |
| }
 | |
| 
 | |
| std::string llvm::getUniqueModuleId(Module *M) {
 | |
|   MD5 Md5;
 | |
|   bool ExportsSymbols = false;
 | |
|   auto AddGlobal = [&](GlobalValue &GV) {
 | |
|     if (GV.isDeclaration() || GV.getName().startswith("llvm.") ||
 | |
|         !GV.hasExternalLinkage() || GV.hasComdat())
 | |
|       return;
 | |
|     ExportsSymbols = true;
 | |
|     Md5.update(GV.getName());
 | |
|     Md5.update(ArrayRef<uint8_t>{0});
 | |
|   };
 | |
| 
 | |
|   for (auto &F : *M)
 | |
|     AddGlobal(F);
 | |
|   for (auto &GV : M->globals())
 | |
|     AddGlobal(GV);
 | |
|   for (auto &GA : M->aliases())
 | |
|     AddGlobal(GA);
 | |
|   for (auto &IF : M->ifuncs())
 | |
|     AddGlobal(IF);
 | |
| 
 | |
|   if (!ExportsSymbols)
 | |
|     return "";
 | |
| 
 | |
|   MD5::MD5Result R;
 | |
|   Md5.final(R);
 | |
| 
 | |
|   SmallString<32> Str;
 | |
|   MD5::stringifyResult(R, Str);
 | |
|   return ("$" + Str).str();
 | |
| }
 |