//===- InputFiles.cpp -----------------------------------------------------===// // // The LLVM Linker // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// #include "InputFiles.h" #include "Config.h" #include "InputSegment.h" #include "SymbolTable.h" #include "lld/Common/ErrorHandler.h" #include "lld/Common/Memory.h" #include "llvm/Object/Binary.h" #include "llvm/Object/Wasm.h" #include "llvm/Support/raw_ostream.h" #define DEBUG_TYPE "lld" using namespace lld; using namespace lld::wasm; using namespace llvm; using namespace llvm::object; using namespace llvm::wasm; Optional lld::wasm::readFile(StringRef Path) { log("Loading: " + Path); auto MBOrErr = MemoryBuffer::getFile(Path); if (auto EC = MBOrErr.getError()) { error("cannot open " + Path + ": " + EC.message()); return None; } std::unique_ptr &MB = *MBOrErr; MemoryBufferRef MBRef = MB->getMemBufferRef(); make>(std::move(MB)); // take MB ownership return MBRef; } void ObjFile::dumpInfo() const { log("reloc info for: " + getName() + "\n" + " FunctionIndexOffset : " + Twine(FunctionIndexOffset) + "\n" + " NumFunctionImports : " + Twine(NumFunctionImports()) + "\n" + " NumGlobalImports : " + Twine(NumGlobalImports()) + "\n"); } bool ObjFile::isImportedFunction(uint32_t Index) const { return Index < NumFunctionImports(); } Symbol *ObjFile::getFunctionSymbol(uint32_t Index) const { return FunctionSymbols[Index]; } Symbol *ObjFile::getTableSymbol(uint32_t Index) const { return TableSymbols[Index]; } Symbol *ObjFile::getGlobalSymbol(uint32_t Index) const { return GlobalSymbols[Index]; } uint32_t ObjFile::getRelocatedAddress(uint32_t Index) const { return getGlobalSymbol(Index)->getVirtualAddress(); } uint32_t ObjFile::relocateFunctionIndex(uint32_t Original) const { Symbol *Sym = getFunctionSymbol(Original); uint32_t Index = Sym->getOutputIndex(); DEBUG(dbgs() << "relocateFunctionIndex: " << toString(*Sym) << ": " << Original << " -> " << Index << "\n"); return Index; } uint32_t ObjFile::relocateTypeIndex(uint32_t Original) const { return TypeMap[Original]; } uint32_t ObjFile::relocateTableIndex(uint32_t Original) const { Symbol *Sym = getTableSymbol(Original); uint32_t Index = Sym->getTableIndex(); DEBUG(dbgs() << "relocateTableIndex: " << toString(*Sym) << ": " << Original << " -> " << Index << "\n"); return Index; } uint32_t ObjFile::relocateGlobalIndex(uint32_t Original) const { Symbol *Sym = getGlobalSymbol(Original); uint32_t Index = Sym->getOutputIndex(); DEBUG(dbgs() << "relocateGlobalIndex: " << toString(*Sym) << ": " << Original << " -> " << Index << "\n"); return Index; } void ObjFile::parse() { // Parse a memory buffer as a wasm file. DEBUG(dbgs() << "Parsing object: " << toString(this) << "\n"); std::unique_ptr Bin = CHECK(createBinary(MB), toString(this)); auto *Obj = dyn_cast(Bin.get()); if (!Obj) fatal(toString(this) + ": not a wasm file"); if (!Obj->isRelocatableObject()) fatal(toString(this) + ": not a relocatable wasm file"); Bin.release(); WasmObj.reset(Obj); // Find the code and data sections. Wasm objects can have at most one code // and one data section. for (const SectionRef &Sec : WasmObj->sections()) { const WasmSection &Section = WasmObj->getWasmSection(Sec); if (Section.Type == WASM_SEC_CODE) CodeSection = &Section; else if (Section.Type == WASM_SEC_DATA) DataSection = &Section; } initializeSymbols(); } // Return the InputSegment in which a given symbol is defined. InputSegment *ObjFile::getSegment(const WasmSymbol &WasmSym) { uint32_t Address = WasmObj->getWasmSymbolValue(WasmSym); for (InputSegment *Segment : Segments) { if (Address >= Segment->startVA() && Address < Segment->endVA()) { DEBUG(dbgs() << "Found symbol in segment: " << WasmSym.Name << " -> " << Segment->getName() << "\n"); return Segment; } } error("symbol not found in any segment: " + WasmSym.Name); return nullptr; } static void copyRelocationsRange(std::vector &To, ArrayRef From, size_t Start, size_t End) { for (const WasmRelocation &R : From) if (R.Offset >= Start && R.Offset < End) To.push_back(R); } void ObjFile::initializeSymbols() { Symbols.reserve(WasmObj->getNumberOfSymbols()); for (const WasmImport &Import : WasmObj->imports()) { switch (Import.Kind) { case WASM_EXTERNAL_FUNCTION: ++FunctionImports; break; case WASM_EXTERNAL_GLOBAL: ++GlobalImports; break; } } FunctionSymbols.resize(FunctionImports + WasmObj->functions().size()); GlobalSymbols.resize(GlobalImports + WasmObj->globals().size()); for (const WasmSegment &S : WasmObj->dataSegments()) { InputSegment *Seg = make(&S, this); copyRelocationsRange(Seg->Relocations, DataSection->Relocations, Seg->getInputSectionOffset(), Seg->getInputSectionOffset() + Seg->getSize()); Segments.emplace_back(Seg); } // Populate `FunctionSymbols` and `GlobalSymbols` based on the WasmSymbols // in the object for (const SymbolRef &Sym : WasmObj->symbols()) { const WasmSymbol &WasmSym = WasmObj->getWasmSymbol(Sym.getRawDataRefImpl()); Symbol *S; switch (WasmSym.Type) { case WasmSymbol::SymbolType::FUNCTION_IMPORT: case WasmSymbol::SymbolType::GLOBAL_IMPORT: S = createUndefined(WasmSym); break; case WasmSymbol::SymbolType::GLOBAL_EXPORT: S = createDefined(WasmSym, getSegment(WasmSym)); break; case WasmSymbol::SymbolType::FUNCTION_EXPORT: S = createDefined(WasmSym); break; case WasmSymbol::SymbolType::DEBUG_FUNCTION_NAME: // These are for debugging only, no need to create linker symbols for them continue; } Symbols.push_back(S); if (WasmSym.isFunction()) { DEBUG(dbgs() << "Function: " << WasmSym.ElementIndex << " -> " << toString(*S) << "\n"); FunctionSymbols[WasmSym.ElementIndex] = S; if (WasmSym.HasAltIndex) FunctionSymbols[WasmSym.AltIndex] = S; } else { DEBUG(dbgs() << "Global: " << WasmSym.ElementIndex << " -> " << toString(*S) << "\n"); GlobalSymbols[WasmSym.ElementIndex] = S; if (WasmSym.HasAltIndex) GlobalSymbols[WasmSym.AltIndex] = S; } } DEBUG(for (size_t I = 0; I < FunctionSymbols.size(); ++I) assert(FunctionSymbols[I] != nullptr); for (size_t I = 0; I < GlobalSymbols.size(); ++I) assert(GlobalSymbols[I] != nullptr);); // Populate `TableSymbols` with all symbols that are called indirectly uint32_t SegmentCount = WasmObj->elements().size(); if (SegmentCount) { if (SegmentCount > 1) fatal(getName() + ": contains more than one element segment"); const WasmElemSegment &Segment = WasmObj->elements()[0]; if (Segment.Offset.Opcode != WASM_OPCODE_I32_CONST) fatal(getName() + ": unsupported element segment"); if (Segment.TableIndex != 0) fatal(getName() + ": unsupported table index in elem segment"); if (Segment.Offset.Value.Int32 != 0) fatal(getName() + ": unsupported element segment offset"); TableSymbols.reserve(Segment.Functions.size()); for (uint64_t FunctionIndex : Segment.Functions) TableSymbols.push_back(getFunctionSymbol(FunctionIndex)); } DEBUG(dbgs() << "TableSymbols: " << TableSymbols.size() << "\n"); DEBUG(dbgs() << "Functions : " << FunctionSymbols.size() << "\n"); DEBUG(dbgs() << "Globals : " << GlobalSymbols.size() << "\n"); } Symbol *ObjFile::createUndefined(const WasmSymbol &Sym) { return Symtab->addUndefined(this, &Sym); } Symbol *ObjFile::createDefined(const WasmSymbol &Sym, const InputSegment *Segment) { Symbol *S; if (Sym.isLocal()) { S = make(Sym.Name, true); Symbol::Kind Kind; if (Sym.Type == WasmSymbol::SymbolType::FUNCTION_EXPORT) Kind = Symbol::Kind::DefinedFunctionKind; else if (Sym.Type == WasmSymbol::SymbolType::GLOBAL_EXPORT) Kind = Symbol::Kind::DefinedGlobalKind; else llvm_unreachable("invalid local symbol type"); S->update(Kind, this, &Sym, Segment); return S; } return Symtab->addDefined(this, &Sym, Segment); } void ArchiveFile::parse() { // Parse a MemoryBufferRef as an archive file. DEBUG(dbgs() << "Parsing library: " << toString(this) << "\n"); File = CHECK(Archive::create(MB), toString(this)); // Read the symbol table to construct Lazy symbols. int Count = 0; for (const Archive::Symbol &Sym : File->symbols()) { Symtab->addLazy(this, &Sym); ++Count; } DEBUG(dbgs() << "Read " << Count << " symbols\n"); } void ArchiveFile::addMember(const Archive::Symbol *Sym) { const Archive::Child &C = CHECK(Sym->getMember(), "could not get the member for symbol " + Sym->getName()); // Don't try to load the same member twice (this can happen when members // mutually reference each other). if (!Seen.insert(C.getChildOffset()).second) return; DEBUG(dbgs() << "loading lazy: " << Sym->getName() << "\n"); DEBUG(dbgs() << "from archive: " << toString(this) << "\n"); MemoryBufferRef MB = CHECK(C.getMemoryBufferRef(), "could not get the buffer for the member defining symbol " + Sym->getName()); if (identify_magic(MB.getBuffer()) != file_magic::wasm_object) { error("unknown file type: " + MB.getBufferIdentifier()); return; } InputFile *Obj = make(MB); Obj->ParentName = ParentName; Symtab->addFile(Obj); } // Returns a string in the format of "foo.o" or "foo.a(bar.o)". std::string lld::toString(const wasm::InputFile *File) { if (!File) return ""; if (File->ParentName.empty()) return File->getName(); return (File->ParentName + "(" + File->getName() + ")").str(); }