//===- SymbolTable.cpp ----------------------------------------------------===// // // The LLVM Linker // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// #include "Config.h" #include "Driver.h" #include "Error.h" #include "SymbolTable.h" #include "Symbols.h" #include "lld/Core/Parallel.h" #include "llvm/IR/LLVMContext.h" #include "llvm/LTO/legacy/LTOCodeGenerator.h" #include "llvm/Support/Debug.h" #include "llvm/Support/raw_ostream.h" #include using namespace llvm; namespace lld { namespace coff { void SymbolTable::addFile(std::unique_ptr FileP) { #if LLVM_ENABLE_THREADS std::launch Policy = std::launch::async; #else std::launch Policy = std::launch::deferred; #endif InputFile *File = FileP.get(); Files.push_back(std::move(FileP)); if (auto *F = dyn_cast(File)) { ArchiveQueue.push_back( std::async(Policy, [=]() { F->parse(); return F; })); return; } ObjectQueue.push_back( std::async(Policy, [=]() { File->parse(); return File; })); if (auto *F = dyn_cast(File)) { ObjectFiles.push_back(F); } else if (auto *F = dyn_cast(File)) { BitcodeFiles.push_back(F); } else { ImportFiles.push_back(cast(File)); } } void SymbolTable::step() { if (queueEmpty()) return; readObjects(); readArchives(); } void SymbolTable::run() { while (!queueEmpty()) step(); } void SymbolTable::readArchives() { if (ArchiveQueue.empty()) return; // Add lazy symbols to the symbol table. Lazy symbols that conflict // with existing undefined symbols are accumulated in LazySyms. std::vector LazySyms; for (std::future &Future : ArchiveQueue) { ArchiveFile *File = Future.get(); if (Config->Verbose) llvm::outs() << "Reading " << File->getShortName() << "\n"; for (Lazy &Sym : File->getLazySymbols()) addLazy(&Sym, &LazySyms); } ArchiveQueue.clear(); // Add archive member files to ObjectQueue that should resolve // existing undefined symbols. for (Symbol *Sym : LazySyms) addMemberFile(cast(Sym->Body)); } void SymbolTable::readObjects() { if (ObjectQueue.empty()) return; // Add defined and undefined symbols to the symbol table. std::vector Directives; for (size_t I = 0; I < ObjectQueue.size(); ++I) { InputFile *File = ObjectQueue[I].get(); if (Config->Verbose) llvm::outs() << "Reading " << File->getShortName() << "\n"; // Adding symbols may add more files to ObjectQueue // (but not to ArchiveQueue). for (SymbolBody *Sym : File->getSymbols()) if (Sym->isExternal()) addSymbol(Sym); StringRef S = File->getDirectives(); if (!S.empty()) { Directives.push_back(S); if (Config->Verbose) llvm::outs() << "Directives: " << File->getShortName() << ": " << S << "\n"; } } ObjectQueue.clear(); // Parse directive sections. This may add files to // ArchiveQueue and ObjectQueue. for (StringRef S : Directives) Driver->parseDirectives(S); } bool SymbolTable::queueEmpty() { return ArchiveQueue.empty() && ObjectQueue.empty(); } void SymbolTable::reportRemainingUndefines(bool Resolve) { llvm::SmallPtrSet Undefs; for (auto &I : Symtab) { Symbol *Sym = I.second; auto *Undef = dyn_cast(Sym->Body); if (!Undef) continue; StringRef Name = Undef->getName(); // A weak alias may have been resolved, so check for that. if (Defined *D = Undef->getWeakAlias()) { if (Resolve) Sym->Body = D; continue; } // If we can resolve a symbol by removing __imp_ prefix, do that. // This odd rule is for compatibility with MSVC linker. if (Name.startswith("__imp_")) { Symbol *Imp = find(Name.substr(strlen("__imp_"))); if (Imp && isa(Imp->Body)) { if (!Resolve) continue; auto *D = cast(Imp->Body); auto *S = new (Alloc) DefinedLocalImport(Name, D); LocalImportChunks.push_back(S->getChunk()); Sym->Body = S; continue; } } // Remaining undefined symbols are not fatal if /force is specified. // They are replaced with dummy defined symbols. if (Config->Force && Resolve) Sym->Body = new (Alloc) DefinedAbsolute(Name, 0); Undefs.insert(Sym->Body); } if (Undefs.empty()) return; for (Undefined *U : Config->GCRoot) if (Undefs.count(U->repl())) llvm::errs() << ": undefined symbol: " << U->getName() << "\n"; for (std::unique_ptr &File : Files) if (!isa(File.get())) for (SymbolBody *Sym : File->getSymbols()) if (Undefs.count(Sym->repl())) llvm::errs() << File->getShortName() << ": undefined symbol: " << Sym->getName() << "\n"; if (!Config->Force) fatal("link failed"); } void SymbolTable::addLazy(Lazy *New, std::vector *Accum) { Symbol *Sym = insert(New); if (Sym->Body == New) return; SymbolBody *Existing = Sym->Body; if (isa(Existing)) return; if (Lazy *L = dyn_cast(Existing)) if (L->getFileIndex() < New->getFileIndex()) return; Sym->Body = New; New->setBackref(Sym); if (isa(Existing)) Accum->push_back(Sym); } void SymbolTable::addSymbol(SymbolBody *New) { // Find an existing symbol or create and insert a new one. assert(isa(New) || isa(New)); Symbol *Sym = insert(New); if (Sym->Body == New) return; SymbolBody *Existing = Sym->Body; // If we have an undefined symbol and a lazy symbol, // let the lazy symbol to read a member file. if (auto *L = dyn_cast(Existing)) { // Undefined symbols with weak aliases need not to be resolved, // since they would be replaced with weak aliases if they remain // undefined. if (auto *U = dyn_cast(New)) { if (!U->WeakAlias) { addMemberFile(L); return; } } Sym->Body = New; return; } // compare() returns -1, 0, or 1 if the lhs symbol is less preferable, // equivalent (conflicting), or more preferable, respectively. int Comp = Existing->compare(New); if (Comp == 0) fatal("duplicate symbol: " + Existing->getDebugName() + " and " + New->getDebugName()); if (Comp < 0) Sym->Body = New; } Symbol *SymbolTable::insert(SymbolBody *New) { Symbol *&Sym = Symtab[New->getName()]; if (Sym) { New->setBackref(Sym); return Sym; } Sym = new (Alloc) Symbol(New); New->setBackref(Sym); return Sym; } // Reads an archive member file pointed by a given symbol. void SymbolTable::addMemberFile(Lazy *Body) { std::unique_ptr File = Body->getMember(); // getMember returns an empty buffer if the member was already // read from the library. if (!File) return; if (Config->Verbose) llvm::outs() << "Loaded " << File->getShortName() << " for " << Body->getName() << "\n"; addFile(std::move(File)); } std::vector SymbolTable::getChunks() { std::vector Res; for (ObjectFile *File : ObjectFiles) { std::vector &V = File->getChunks(); Res.insert(Res.end(), V.begin(), V.end()); } return Res; } Symbol *SymbolTable::find(StringRef Name) { auto It = Symtab.find(Name); if (It == Symtab.end()) return nullptr; return It->second; } Symbol *SymbolTable::findUnderscore(StringRef Name) { if (Config->Machine == I386) return find(("_" + Name).str()); return find(Name); } StringRef SymbolTable::findByPrefix(StringRef Prefix) { for (auto Pair : Symtab) { StringRef Name = Pair.first; if (Name.startswith(Prefix)) return Name; } return ""; } StringRef SymbolTable::findMangle(StringRef Name) { if (Symbol *Sym = find(Name)) if (!isa(Sym->Body)) return Name; if (Config->Machine != I386) return findByPrefix(("?" + Name + "@@Y").str()); if (!Name.startswith("_")) return ""; // Search for x86 C function. StringRef S = findByPrefix((Name + "@").str()); if (!S.empty()) return S; // Search for x86 C++ non-member function. return findByPrefix(("?" + Name.substr(1) + "@@Y").str()); } void SymbolTable::mangleMaybe(Undefined *U) { if (U->WeakAlias) return; if (!isa(U->repl())) return; StringRef Alias = findMangle(U->getName()); if (!Alias.empty()) U->WeakAlias = addUndefined(Alias); } Undefined *SymbolTable::addUndefined(StringRef Name) { auto *New = new (Alloc) Undefined(Name); addSymbol(New); if (auto *U = dyn_cast(New->repl())) return U; return New; } DefinedRelative *SymbolTable::addRelative(StringRef Name, uint64_t VA) { auto *New = new (Alloc) DefinedRelative(Name, VA); addSymbol(New); return New; } DefinedAbsolute *SymbolTable::addAbsolute(StringRef Name, uint64_t VA) { auto *New = new (Alloc) DefinedAbsolute(Name, VA); addSymbol(New); return New; } void SymbolTable::printMap(llvm::raw_ostream &OS) { for (ObjectFile *File : ObjectFiles) { OS << File->getShortName() << ":\n"; for (SymbolBody *Body : File->getSymbols()) if (auto *R = dyn_cast(Body)) if (R->getChunk()->isLive()) OS << Twine::utohexstr(Config->ImageBase + R->getRVA()) << " " << R->getName() << "\n"; } } void SymbolTable::addCombinedLTOObject(ObjectFile *Obj) { for (SymbolBody *Body : Obj->getSymbols()) { if (!Body->isExternal()) continue; // We should not see any new undefined symbols at this point, but we'll // diagnose them later in reportRemainingUndefines(). StringRef Name = Body->getName(); Symbol *Sym = insert(Body); SymbolBody *Existing = Sym->Body; if (Existing == Body) continue; if (isa(Existing)) { Sym->Body = Body; continue; } if (auto *L = dyn_cast(Existing)) { // We may see new references to runtime library symbols such as __chkstk // here. These symbols must be wholly defined in non-bitcode files. addMemberFile(L); continue; } int Comp = Existing->compare(Body); if (Comp == 0) fatal("LTO: unexpected duplicate symbol: " + Name); if (Comp < 0) Sym->Body = Body; } } void SymbolTable::addCombinedLTOObjects() { if (BitcodeFiles.empty()) return; // Diagnose any undefined symbols early, but do not resolve weak externals, // as resolution breaks the invariant that each Symbol points to a unique // SymbolBody, which we rely on to replace DefinedBitcode symbols correctly. reportRemainingUndefines(/*Resolve=*/false); // Create an object file and add it to the symbol table by replacing any // DefinedBitcode symbols with the definitions in the object file. LTOCodeGenerator CG(BitcodeFile::Context); CG.setOptLevel(Config->LTOOptLevel); std::vector Objs = createLTOObjects(&CG); for (ObjectFile *Obj : Objs) addCombinedLTOObject(Obj); size_t NumBitcodeFiles = BitcodeFiles.size(); run(); if (BitcodeFiles.size() != NumBitcodeFiles) fatal("LTO: late loaded symbol created new bitcode reference"); } // Combine and compile bitcode files and then return the result // as a vector of regular COFF object files. std::vector SymbolTable::createLTOObjects(LTOCodeGenerator *CG) { // All symbols referenced by non-bitcode objects must be preserved. for (ObjectFile *File : ObjectFiles) for (SymbolBody *Body : File->getSymbols()) if (auto *S = dyn_cast(Body->repl())) CG->addMustPreserveSymbol(S->getName()); // Likewise for bitcode symbols which we initially resolved to non-bitcode. for (BitcodeFile *File : BitcodeFiles) for (SymbolBody *Body : File->getSymbols()) if (isa(Body) && !isa(Body->repl())) CG->addMustPreserveSymbol(Body->getName()); // Likewise for other symbols that must be preserved. for (Undefined *U : Config->GCRoot) { if (auto *S = dyn_cast(U->repl())) CG->addMustPreserveSymbol(S->getName()); else if (auto *S = dyn_cast_or_null(U->getWeakAlias())) CG->addMustPreserveSymbol(S->getName()); } CG->setModule(BitcodeFiles[0]->takeModule()); for (unsigned I = 1, E = BitcodeFiles.size(); I != E; ++I) CG->addModule(BitcodeFiles[I]->takeModule().get()); bool DisableVerify = true; #ifdef NDEBUG DisableVerify = false; #endif if (!CG->optimize(DisableVerify, false, false, false)) fatal(""); // optimize() should have emitted any error message. Objs.resize(Config->LTOJobs); // Use std::list to avoid invalidation of pointers in OSPtrs. std::list OSs; std::vector OSPtrs; for (SmallString<0> &Obj : Objs) { OSs.emplace_back(Obj); OSPtrs.push_back(&OSs.back()); } if (!CG->compileOptimized(OSPtrs)) fatal(""); // compileOptimized() should have emitted any error message. std::vector ObjFiles; for (SmallString<0> &Obj : Objs) { auto *ObjFile = new ObjectFile(MemoryBufferRef(Obj, "")); Files.emplace_back(ObjFile); ObjectFiles.push_back(ObjFile); ObjFile->parse(); ObjFiles.push_back(ObjFile); } return ObjFiles; } } // namespace coff } // namespace lld