//===-- ModuleUtils.cpp - Functions to manipulate Modules -----------------===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This family of functions perform manipulations on Modules. // //===----------------------------------------------------------------------===// #include "llvm/Transforms/Utils/ModuleUtils.h" #include "llvm/IR/DerivedTypes.h" #include "llvm/IR/Function.h" #include "llvm/IR/IRBuilder.h" #include "llvm/IR/Module.h" #include "llvm/Support/raw_ostream.h" using namespace llvm; static void appendToGlobalArray(const char *Array, Module &M, Function *F, int Priority, Constant *Data) { IRBuilder<> IRB(M.getContext()); FunctionType *FnTy = FunctionType::get(IRB.getVoidTy(), false); // Get the current set of static global constructors and add the new ctor // to the list. SmallVector CurrentCtors; StructType *EltTy; if (GlobalVariable *GVCtor = M.getNamedGlobal(Array)) { ArrayType *ATy = cast(GVCtor->getValueType()); StructType *OldEltTy = cast(ATy->getElementType()); // Upgrade a 2-field global array type to the new 3-field format if needed. if (Data && OldEltTy->getNumElements() < 3) EltTy = StructType::get(IRB.getInt32Ty(), PointerType::getUnqual(FnTy), IRB.getInt8PtrTy()); else EltTy = OldEltTy; if (Constant *Init = GVCtor->getInitializer()) { unsigned n = Init->getNumOperands(); CurrentCtors.reserve(n + 1); for (unsigned i = 0; i != n; ++i) { auto Ctor = cast(Init->getOperand(i)); if (EltTy != OldEltTy) Ctor = ConstantStruct::get(EltTy, Ctor->getAggregateElement((unsigned)0), Ctor->getAggregateElement(1), Constant::getNullValue(IRB.getInt8PtrTy())); CurrentCtors.push_back(Ctor); } } GVCtor->eraseFromParent(); } else { // Use the new three-field struct if there isn't one already. EltTy = StructType::get(IRB.getInt32Ty(), PointerType::getUnqual(FnTy), IRB.getInt8PtrTy()); } // Build a 2 or 3 field global_ctor entry. We don't take a comdat key. Constant *CSVals[3]; CSVals[0] = IRB.getInt32(Priority); CSVals[1] = F; // FIXME: Drop support for the two element form in LLVM 4.0. if (EltTy->getNumElements() >= 3) CSVals[2] = Data ? ConstantExpr::getPointerCast(Data, IRB.getInt8PtrTy()) : Constant::getNullValue(IRB.getInt8PtrTy()); Constant *RuntimeCtorInit = ConstantStruct::get(EltTy, makeArrayRef(CSVals, EltTy->getNumElements())); CurrentCtors.push_back(RuntimeCtorInit); // Create a new initializer. ArrayType *AT = ArrayType::get(EltTy, CurrentCtors.size()); Constant *NewInit = ConstantArray::get(AT, CurrentCtors); // Create the new global variable and replace all uses of // the old global variable with the new one. (void)new GlobalVariable(M, NewInit->getType(), false, GlobalValue::AppendingLinkage, NewInit, Array); } void llvm::appendToGlobalCtors(Module &M, Function *F, int Priority, Constant *Data) { appendToGlobalArray("llvm.global_ctors", M, F, Priority, Data); } void llvm::appendToGlobalDtors(Module &M, Function *F, int Priority, Constant *Data) { appendToGlobalArray("llvm.global_dtors", M, F, Priority, Data); } static void appendToUsedList(Module &M, StringRef Name, ArrayRef Values) { GlobalVariable *GV = M.getGlobalVariable(Name); SmallPtrSet InitAsSet; SmallVector Init; if (GV) { ConstantArray *CA = dyn_cast(GV->getInitializer()); for (auto &Op : CA->operands()) { Constant *C = cast_or_null(Op); if (InitAsSet.insert(C).second) Init.push_back(C); } GV->eraseFromParent(); } Type *Int8PtrTy = llvm::Type::getInt8PtrTy(M.getContext()); for (auto *V : Values) { Constant *C = ConstantExpr::getBitCast(V, Int8PtrTy); if (InitAsSet.insert(C).second) Init.push_back(C); } if (Init.empty()) return; ArrayType *ATy = ArrayType::get(Int8PtrTy, Init.size()); GV = new llvm::GlobalVariable(M, ATy, false, GlobalValue::AppendingLinkage, ConstantArray::get(ATy, Init), Name); GV->setSection("llvm.metadata"); } void llvm::appendToUsed(Module &M, ArrayRef Values) { appendToUsedList(M, "llvm.used", Values); } void llvm::appendToCompilerUsed(Module &M, ArrayRef Values) { appendToUsedList(M, "llvm.compiler.used", Values); } Function *llvm::checkSanitizerInterfaceFunction(Constant *FuncOrBitcast) { if (isa(FuncOrBitcast)) return cast(FuncOrBitcast); FuncOrBitcast->print(errs()); errs() << '\n'; std::string Err; raw_string_ostream Stream(Err); Stream << "Sanitizer interface function redefined: " << *FuncOrBitcast; report_fatal_error(Err); } Function *llvm::declareSanitizerInitFunction(Module &M, StringRef InitName, ArrayRef InitArgTypes) { assert(!InitName.empty() && "Expected init function name"); Function *F = checkSanitizerInterfaceFunction(M.getOrInsertFunction( InitName, FunctionType::get(Type::getVoidTy(M.getContext()), InitArgTypes, false), AttributeList())); F->setLinkage(Function::ExternalLinkage); return F; } std::pair llvm::createSanitizerCtorAndInitFunctions( Module &M, StringRef CtorName, StringRef InitName, ArrayRef InitArgTypes, ArrayRef InitArgs, StringRef VersionCheckName) { assert(!InitName.empty() && "Expected init function name"); assert(InitArgs.size() == InitArgTypes.size() && "Sanitizer's init function expects different number of arguments"); Function *InitFunction = declareSanitizerInitFunction(M, InitName, InitArgTypes); Function *Ctor = Function::Create( FunctionType::get(Type::getVoidTy(M.getContext()), false), GlobalValue::InternalLinkage, CtorName, &M); BasicBlock *CtorBB = BasicBlock::Create(M.getContext(), "", Ctor); IRBuilder<> IRB(ReturnInst::Create(M.getContext(), CtorBB)); IRB.CreateCall(InitFunction, InitArgs); if (!VersionCheckName.empty()) { Function *VersionCheckFunction = checkSanitizerInterfaceFunction(M.getOrInsertFunction( VersionCheckName, FunctionType::get(IRB.getVoidTy(), {}, false), AttributeList())); IRB.CreateCall(VersionCheckFunction, {}); } return std::make_pair(Ctor, InitFunction); } void llvm::filterDeadComdatFunctions( Module &M, SmallVectorImpl &DeadComdatFunctions) { // Build a map from the comdat to the number of entries in that comdat we // think are dead. If this fully covers the comdat group, then the entire // group is dead. If we find another entry in the comdat group though, we'll // have to preserve the whole group. SmallDenseMap ComdatEntriesCovered; for (Function *F : DeadComdatFunctions) { Comdat *C = F->getComdat(); assert(C && "Expected all input GVs to be in a comdat!"); ComdatEntriesCovered[C] += 1; } auto CheckComdat = [&](Comdat &C) { auto CI = ComdatEntriesCovered.find(&C); if (CI == ComdatEntriesCovered.end()) return; // If this could have been covered by a dead entry, just subtract one to // account for it. if (CI->second > 0) { CI->second -= 1; return; } // If we've already accounted for all the entries that were dead, the // entire comdat is alive so remove it from the map. ComdatEntriesCovered.erase(CI); }; auto CheckAllComdats = [&] { for (Function &F : M.functions()) if (Comdat *C = F.getComdat()) { CheckComdat(*C); if (ComdatEntriesCovered.empty()) return; } for (GlobalVariable &GV : M.globals()) if (Comdat *C = GV.getComdat()) { CheckComdat(*C); if (ComdatEntriesCovered.empty()) return; } for (GlobalAlias &GA : M.aliases()) if (Comdat *C = GA.getComdat()) { CheckComdat(*C); if (ComdatEntriesCovered.empty()) return; } }; CheckAllComdats(); if (ComdatEntriesCovered.empty()) { DeadComdatFunctions.clear(); return; } // Remove the entries that were not covering. erase_if(DeadComdatFunctions, [&](GlobalValue *GV) { return ComdatEntriesCovered.find(GV->getComdat()) == ComdatEntriesCovered.end(); }); } std::string llvm::getUniqueModuleId(Module *M) { MD5 Md5; bool ExportsSymbols = false; auto AddGlobal = [&](GlobalValue &GV) { if (GV.isDeclaration() || GV.getName().startswith("llvm.") || !GV.hasExternalLinkage() || GV.hasComdat()) return; ExportsSymbols = true; Md5.update(GV.getName()); Md5.update(ArrayRef{0}); }; for (auto &F : *M) AddGlobal(F); for (auto &GV : M->globals()) AddGlobal(GV); for (auto &GA : M->aliases()) AddGlobal(GA); for (auto &IF : M->ifuncs()) AddGlobal(IF); if (!ExportsSymbols) return ""; MD5::MD5Result R; Md5.final(R); SmallString<32> Str; MD5::stringifyResult(R, Str); return ("$" + Str).str(); }