//===- Writer.cpp ---------------------------------------------------------===// // // The LLVM Linker // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// #include "Writer.h" #include "Config.h" #include "OutputSections.h" #include "OutputSegment.h" #include "SymbolTable.h" #include "WriterUtils.h" #include "lld/Common/ErrorHandler.h" #include "lld/Common/Memory.h" #include "lld/Common/Threads.h" #include "llvm/Support/FileOutputBuffer.h" #include "llvm/Support/Format.h" #include "llvm/Support/FormatVariadic.h" #include "llvm/Support/LEB128.h" #include #define DEBUG_TYPE "lld" using namespace llvm; using namespace llvm::wasm; using namespace lld; using namespace lld::wasm; static constexpr int kStackAlignment = 16; namespace { // Traits for using WasmSignature in a DenseMap. struct WasmSignatureDenseMapInfo { static WasmSignature getEmptyKey() { WasmSignature Sig; Sig.ReturnType = 1; return Sig; } static WasmSignature getTombstoneKey() { WasmSignature Sig; Sig.ReturnType = 2; return Sig; } static unsigned getHashValue(const WasmSignature &Sig) { uintptr_t Value = 0; Value += DenseMapInfo::getHashValue(Sig.ReturnType); for (int32_t Param : Sig.ParamTypes) Value += DenseMapInfo::getHashValue(Param); return Value; } static bool isEqual(const WasmSignature &LHS, const WasmSignature &RHS) { return LHS == RHS; } }; // The writer writes a SymbolTable result to a file. class Writer { public: void run(); private: void openFile(); uint32_t getTypeIndex(const WasmSignature &Sig); void assignSymbolIndexes(); void calculateImports(); void calculateOffsets(); void calculateTypes(); void createOutputSegments(); void layoutMemory(); void createHeader(); void createSections(); SyntheticSection *createSyntheticSection(uint32_t Type, std::string Name = ""); // Builtin sections void createTypeSection(); void createFunctionSection(); void createTableSection(); void createGlobalSection(); void createExportSection(); void createImportSection(); void createMemorySection(); void createElemSection(); void createStartSection(); void createCodeSection(); void createDataSection(); // Custom sections void createRelocSections(); void createLinkingSection(); void createNameSection(); void writeHeader(); void writeSections(); uint64_t FileSize = 0; uint32_t DataSize = 0; uint32_t NumFunctions = 0; uint32_t NumMemoryPages = 0; uint32_t InitialTableOffset = 0; std::vector Types; DenseMap TypeIndices; std::vector FunctionImports; std::vector GlobalImports; std::vector DefinedGlobals; std::vector IndirectFunctions; // Elements that are used to construct the final output std::string Header; std::vector OutputSections; std::unique_ptr Buffer; std::vector Segments; llvm::SmallDenseMap SegmentMap; }; } // anonymous namespace static void debugPrint(const char *fmt, ...) { if (!errorHandler().Verbose) return; fprintf(stderr, "lld: "); va_list ap; va_start(ap, fmt); vfprintf(stderr, fmt, ap); va_end(ap); } void Writer::createImportSection() { uint32_t NumImports = FunctionImports.size() + GlobalImports.size(); if (Config->ImportMemory) ++NumImports; if (NumImports == 0) return; SyntheticSection *Section = createSyntheticSection(WASM_SEC_IMPORT); raw_ostream &OS = Section->getStream(); writeUleb128(OS, NumImports, "import count"); for (const Symbol *Sym : FunctionImports) { WasmImport Import; Import.Module = "env"; Import.Field = Sym->getName(); Import.Kind = WASM_EXTERNAL_FUNCTION; assert(TypeIndices.count(Sym->getFunctionType()) > 0); Import.SigIndex = TypeIndices.lookup(Sym->getFunctionType()); writeImport(OS, Import); } if (Config->ImportMemory) { WasmImport Import; Import.Module = "env"; Import.Field = "memory"; Import.Kind = WASM_EXTERNAL_MEMORY; Import.Memory.Flags = 0; Import.Memory.Initial = NumMemoryPages; writeImport(OS, Import); } for (const Symbol *Sym : GlobalImports) { WasmImport Import; Import.Module = "env"; Import.Field = Sym->getName(); Import.Kind = WASM_EXTERNAL_GLOBAL; Import.Global.Mutable = false; Import.Global.Type = WASM_TYPE_I32; writeImport(OS, Import); } } void Writer::createTypeSection() { SyntheticSection *Section = createSyntheticSection(WASM_SEC_TYPE); raw_ostream &OS = Section->getStream(); writeUleb128(OS, Types.size(), "type count"); for (const WasmSignature *Sig : Types) writeSig(OS, *Sig); } void Writer::createFunctionSection() { if (!NumFunctions) return; SyntheticSection *Section = createSyntheticSection(WASM_SEC_FUNCTION); raw_ostream &OS = Section->getStream(); writeUleb128(OS, NumFunctions, "function count"); for (ObjFile *File : Symtab->ObjectFiles) for (uint32_t Sig : File->getWasmObj()->functionTypes()) writeUleb128(OS, File->relocateTypeIndex(Sig), "sig index"); } void Writer::createMemorySection() { if (Config->ImportMemory) return; SyntheticSection *Section = createSyntheticSection(WASM_SEC_MEMORY); raw_ostream &OS = Section->getStream(); writeUleb128(OS, 1, "memory count"); writeUleb128(OS, 0, "memory limits flags"); writeUleb128(OS, NumMemoryPages, "initial pages"); } void Writer::createGlobalSection() { if (DefinedGlobals.empty()) return; SyntheticSection *Section = createSyntheticSection(WASM_SEC_GLOBAL); raw_ostream &OS = Section->getStream(); writeUleb128(OS, DefinedGlobals.size(), "global count"); for (const Symbol *Sym : DefinedGlobals) { WasmGlobal Global; Global.Type = WASM_TYPE_I32; Global.Mutable = Sym == Config->StackPointerSymbol; Global.InitExpr.Opcode = WASM_OPCODE_I32_CONST; Global.InitExpr.Value.Int32 = Sym->getVirtualAddress(); writeGlobal(OS, Global); } } void Writer::createTableSection() { // Always output a table section, even if there are no indirect calls. // There are two reasons for this: // 1. For executables it is useful to have an empty table slot at 0 // which can be filled with a null function call handler. // 2. If we don't do this, any program that contains a call_indirect but // no address-taken function will fail at validation time since it is // a validation error to include a call_indirect instruction if there // is not table. uint32_t TableSize = InitialTableOffset + IndirectFunctions.size(); SyntheticSection *Section = createSyntheticSection(WASM_SEC_TABLE); raw_ostream &OS = Section->getStream(); writeUleb128(OS, 1, "table count"); writeSleb128(OS, WASM_TYPE_ANYFUNC, "table type"); writeUleb128(OS, WASM_LIMITS_FLAG_HAS_MAX, "table flags"); writeUleb128(OS, TableSize, "table initial size"); writeUleb128(OS, TableSize, "table max size"); } void Writer::createExportSection() { bool ExportMemory = !Config->Relocatable && !Config->ImportMemory; Symbol *EntrySym = Symtab->find(Config->Entry); bool ExportEntry = !Config->Relocatable && EntrySym && EntrySym->isDefined(); bool ExportHidden = Config->EmitRelocs; uint32_t NumExports = ExportMemory ? 1 : 0; std::vector SymbolExports; if (ExportEntry) SymbolExports.emplace_back(EntrySym); for (const Symbol *Sym : Symtab->getSymbols()) { if (Sym->isUndefined() || Sym->isGlobal()) continue; if (Sym->isHidden() && !ExportHidden) continue; if (ExportEntry && Sym == EntrySym) continue; SymbolExports.emplace_back(Sym); } for (const Symbol *Sym : DefinedGlobals) { // Can't export the SP right now because it mutable and mutable globals // connot be exported. if (Sym == Config->StackPointerSymbol) continue; SymbolExports.emplace_back(Sym); } NumExports += SymbolExports.size(); if (!NumExports) return; SyntheticSection *Section = createSyntheticSection(WASM_SEC_EXPORT); raw_ostream &OS = Section->getStream(); writeUleb128(OS, NumExports, "export count"); if (ExportMemory) { WasmExport MemoryExport; MemoryExport.Name = "memory"; MemoryExport.Kind = WASM_EXTERNAL_MEMORY; MemoryExport.Index = 0; writeExport(OS, MemoryExport); } for (const Symbol *Sym : SymbolExports) { log("Export: " + Sym->getName()); WasmExport Export; Export.Name = Sym->getName(); Export.Index = Sym->getOutputIndex(); if (Sym->isFunction()) Export.Kind = WASM_EXTERNAL_FUNCTION; else Export.Kind = WASM_EXTERNAL_GLOBAL; writeExport(OS, Export); } } void Writer::createStartSection() {} void Writer::createElemSection() { if (IndirectFunctions.empty()) return; SyntheticSection *Section = createSyntheticSection(WASM_SEC_ELEM); raw_ostream &OS = Section->getStream(); writeUleb128(OS, 1, "segment count"); writeUleb128(OS, 0, "table index"); WasmInitExpr InitExpr; InitExpr.Opcode = WASM_OPCODE_I32_CONST; InitExpr.Value.Int32 = InitialTableOffset; writeInitExpr(OS, InitExpr); writeUleb128(OS, IndirectFunctions.size(), "elem count"); uint32_t TableIndex = InitialTableOffset; for (const Symbol *Sym : IndirectFunctions) { assert(Sym->getTableIndex() == TableIndex); writeUleb128(OS, Sym->getOutputIndex(), "function index"); ++TableIndex; } } void Writer::createCodeSection() { if (!NumFunctions) return; log("createCodeSection"); auto Section = make(NumFunctions, Symtab->ObjectFiles); OutputSections.push_back(Section); } void Writer::createDataSection() { if (!Segments.size()) return; log("createDataSection"); auto Section = make(Segments); OutputSections.push_back(Section); } // Create relocations sections in the final output. // These are only created when relocatable output is requested. void Writer::createRelocSections() { log("createRelocSections"); // Don't use iterator here since we are adding to OutputSection size_t OrigSize = OutputSections.size(); for (size_t i = 0; i < OrigSize; i++) { OutputSection *S = OutputSections[i]; const char *name; uint32_t Count = S->numRelocations(); if (!Count) continue; if (S->Type == WASM_SEC_DATA) name = "reloc.DATA"; else if (S->Type == WASM_SEC_CODE) name = "reloc.CODE"; else llvm_unreachable("relocations only supported for code and data"); SyntheticSection *Section = createSyntheticSection(WASM_SEC_CUSTOM, name); raw_ostream &OS = Section->getStream(); writeUleb128(OS, S->Type, "reloc section"); writeUleb128(OS, Count, "reloc count"); S->writeRelocations(OS); } } // Create the custom "linking" section containing linker metadata. // This is only created when relocatable output is requested. void Writer::createLinkingSection() { SyntheticSection *Section = createSyntheticSection(WASM_SEC_CUSTOM, "linking"); raw_ostream &OS = Section->getStream(); SubSection DataSizeSubSection(WASM_DATA_SIZE); writeUleb128(DataSizeSubSection.getStream(), DataSize, "data size"); DataSizeSubSection.finalizeContents(); DataSizeSubSection.writeToStream(OS); if (!Config->Relocatable) return; if (Segments.size()) { SubSection SubSection(WASM_SEGMENT_INFO); writeUleb128(SubSection.getStream(), Segments.size(), "num data segments"); for (const OutputSegment *S : Segments) { writeStr(SubSection.getStream(), S->Name, "segment name"); writeUleb128(SubSection.getStream(), S->Alignment, "alignment"); writeUleb128(SubSection.getStream(), 0, "flags"); } SubSection.finalizeContents(); SubSection.writeToStream(OS); } std::vector InitFunctions; for (ObjFile *File : Symtab->ObjectFiles) { const WasmLinkingData &L = File->getWasmObj()->linkingData(); InitFunctions.reserve(InitFunctions.size() + L.InitFunctions.size()); for (const WasmInitFunc &F : L.InitFunctions) InitFunctions.emplace_back(WasmInitFunc{ F.Priority, File->relocateFunctionIndex(F.FunctionIndex)}); } if (!InitFunctions.empty()) { SubSection SubSection(WASM_INIT_FUNCS); writeUleb128(SubSection.getStream(), InitFunctions.size(), "num init functionsw"); for (const WasmInitFunc &F : InitFunctions) { writeUleb128(SubSection.getStream(), F.Priority, "priority"); writeUleb128(SubSection.getStream(), F.FunctionIndex, "function index"); } SubSection.finalizeContents(); SubSection.writeToStream(OS); } } // Create the custom "name" section containing debug symbol names. void Writer::createNameSection() { // Create an array of all function sorted by function index space std::vector Names; for (ObjFile *File : Symtab->ObjectFiles) { Names.reserve(Names.size() + File->getSymbols().size()); for (Symbol *S : File->getSymbols()) { if (!S->isFunction() || S->isWeak() || S->WrittenToNameSec) continue; S->WrittenToNameSec = true; Names.emplace_back(S); } } SyntheticSection *Section = createSyntheticSection(WASM_SEC_CUSTOM, "name"); std::sort(Names.begin(), Names.end(), [](const Symbol *A, const Symbol *B) { return A->getOutputIndex() < B->getOutputIndex(); }); SubSection FunctionSubsection(WASM_NAMES_FUNCTION); raw_ostream &OS = FunctionSubsection.getStream(); writeUleb128(OS, Names.size(), "name count"); // We have to iterate through the inputs twice so that all the imports // appear first before any of the local function names. for (const Symbol *S : Names) { writeUleb128(OS, S->getOutputIndex(), "func index"); writeStr(OS, S->getName(), "symbol name"); } FunctionSubsection.finalizeContents(); FunctionSubsection.writeToStream(Section->getStream()); } void Writer::writeHeader() { memcpy(Buffer->getBufferStart(), Header.data(), Header.size()); } void Writer::writeSections() { uint8_t *Buf = Buffer->getBufferStart(); parallelForEach(OutputSections, [Buf](OutputSection *S) { S->writeTo(Buf); }); } // Fix the memory layout of the output binary. This assigns memory offsets // to each of the input data sections as well as the explicit stack region. void Writer::layoutMemory() { uint32_t MemoryPtr = 0; if (!Config->Relocatable) { MemoryPtr = Config->GlobalBase; debugPrint("mem: global base = %d\n", Config->GlobalBase); } createOutputSegments(); // Static data comes first for (OutputSegment *Seg : Segments) { MemoryPtr = alignTo(MemoryPtr, Seg->Alignment); Seg->StartVA = MemoryPtr; debugPrint("mem: %-10s offset=%-8d size=%-4d align=%d\n", Seg->Name.str().c_str(), MemoryPtr, Seg->Size, Seg->Alignment); MemoryPtr += Seg->Size; } DataSize = MemoryPtr; if (!Config->Relocatable) DataSize -= Config->GlobalBase; debugPrint("mem: static data = %d\n", DataSize); // Stack comes after static data if (!Config->Relocatable) { MemoryPtr = alignTo(MemoryPtr, kStackAlignment); if (Config->ZStackSize != alignTo(Config->ZStackSize, kStackAlignment)) error("stack size must be " + Twine(kStackAlignment) + "-byte aligned"); debugPrint("mem: stack size = %d\n", Config->ZStackSize); debugPrint("mem: stack base = %d\n", MemoryPtr); MemoryPtr += Config->ZStackSize; Config->StackPointerSymbol->setVirtualAddress(MemoryPtr); debugPrint("mem: stack top = %d\n", MemoryPtr); } uint32_t MemSize = alignTo(MemoryPtr, WasmPageSize); NumMemoryPages = MemSize / WasmPageSize; debugPrint("mem: total pages = %d\n", NumMemoryPages); } SyntheticSection *Writer::createSyntheticSection(uint32_t Type, std::string Name) { auto Sec = make(Type, Name); log("createSection: " + toString(*Sec)); OutputSections.push_back(Sec); return Sec; } void Writer::createSections() { // Known sections createTypeSection(); createImportSection(); createFunctionSection(); createTableSection(); createMemorySection(); createGlobalSection(); createExportSection(); createStartSection(); createElemSection(); createCodeSection(); createDataSection(); // Custom sections if (Config->EmitRelocs) createRelocSections(); createLinkingSection(); if (!Config->StripDebug && !Config->StripAll) createNameSection(); for (OutputSection *S : OutputSections) { S->setOffset(FileSize); S->finalizeContents(); FileSize += S->getSize(); } } void Writer::calculateOffsets() { for (ObjFile *File : Symtab->ObjectFiles) { const WasmObjectFile *WasmFile = File->getWasmObj(); // Function Index File->FunctionIndexOffset = FunctionImports.size() - File->NumFunctionImports() + NumFunctions; NumFunctions += WasmFile->functions().size(); // Memory if (WasmFile->memories().size() > 1) fatal(File->getName() + ": contains more than one memory"); } } void Writer::calculateImports() { for (Symbol *Sym : Symtab->getSymbols()) { if (!Sym->isUndefined() || Sym->isWeak()) continue; if (Sym->isFunction()) { Sym->setOutputIndex(FunctionImports.size()); FunctionImports.push_back(Sym); } else { Sym->setOutputIndex(GlobalImports.size()); GlobalImports.push_back(Sym); } } } uint32_t Writer::getTypeIndex(const WasmSignature &Sig) { auto Pair = TypeIndices.insert(std::make_pair(Sig, Types.size())); if (Pair.second) Types.push_back(&Sig); return Pair.first->second; } void Writer::calculateTypes() { for (ObjFile *File : Symtab->ObjectFiles) { File->TypeMap.reserve(File->getWasmObj()->types().size()); for (const WasmSignature &Sig : File->getWasmObj()->types()) File->TypeMap.push_back(getTypeIndex(Sig)); } } void Writer::assignSymbolIndexes() { uint32_t GlobalIndex = GlobalImports.size(); if (Config->StackPointerSymbol) { DefinedGlobals.emplace_back(Config->StackPointerSymbol); Config->StackPointerSymbol->setOutputIndex(GlobalIndex++); } if (Config->EmitRelocs) DefinedGlobals.reserve(Symtab->getSymbols().size()); uint32_t TableIndex = InitialTableOffset; for (ObjFile *File : Symtab->ObjectFiles) { DEBUG(dbgs() << "assignSymbolIndexes: " << File->getName() << "\n"); for (Symbol *Sym : File->getSymbols()) { // Assign indexes for symbols defined with this file. if (!Sym->isDefined() || File != Sym->getFile()) continue; if (Sym->isFunction()) { auto *Obj = cast(Sym->getFile()); Sym->setOutputIndex(Obj->FunctionIndexOffset + Sym->getFunctionIndex()); } else if (Config->EmitRelocs) { DefinedGlobals.emplace_back(Sym); Sym->setOutputIndex(GlobalIndex++); } } for (Symbol *Sym : File->getTableSymbols()) { if (!Sym->hasTableIndex()) { Sym->setTableIndex(TableIndex++); IndirectFunctions.emplace_back(Sym); } } } } static StringRef getOutputDataSegmentName(StringRef Name) { if (Config->Relocatable) return Name; for (StringRef V : {".text.", ".rodata.", ".data.rel.ro.", ".data.", ".bss.rel.ro.", ".bss.", ".init_array.", ".fini_array.", ".ctors.", ".dtors.", ".tbss.", ".gcc_except_table.", ".tdata.", ".ARM.exidx.", ".ARM.extab."}) { StringRef Prefix = V.drop_back(); if (Name.startswith(V) || Name == Prefix) return Prefix; } return Name; } void Writer::createOutputSegments() { for (ObjFile *File : Symtab->ObjectFiles) { for (InputSegment *Segment : File->Segments) { StringRef Name = getOutputDataSegmentName(Segment->getName()); OutputSegment *&S = SegmentMap[Name]; if (S == nullptr) { DEBUG(dbgs() << "new segment: " << Name << "\n"); S = make(Name); Segments.push_back(S); } S->addInputSegment(Segment); DEBUG(dbgs() << "added data: " << Name << ": " << S->Size << "\n"); } } } void Writer::run() { if (!Config->Relocatable) InitialTableOffset = 1; log("-- calculateTypes"); calculateTypes(); log("-- calculateImports"); calculateImports(); log("-- calculateOffsets"); calculateOffsets(); if (errorHandler().Verbose) { log("Defined Functions: " + Twine(NumFunctions)); log("Defined Globals : " + Twine(DefinedGlobals.size())); log("Function Imports : " + Twine(FunctionImports.size())); log("Global Imports : " + Twine(GlobalImports.size())); log("Total Imports : " + Twine(FunctionImports.size() + GlobalImports.size())); for (ObjFile *File : Symtab->ObjectFiles) File->dumpInfo(); } log("-- assignSymbolIndexes"); assignSymbolIndexes(); log("-- layoutMemory"); layoutMemory(); createHeader(); log("-- createSections"); createSections(); log("-- openFile"); openFile(); if (errorCount()) return; writeHeader(); log("-- writeSections"); writeSections(); if (errorCount()) return; if (Error E = Buffer->commit()) fatal("failed to write the output file: " + toString(std::move(E))); } // Open a result file. void Writer::openFile() { log("writing: " + Config->OutputFile); ::remove(Config->OutputFile.str().c_str()); Expected> BufferOrErr = FileOutputBuffer::create(Config->OutputFile, FileSize, FileOutputBuffer::F_executable); if (!BufferOrErr) error("failed to open " + Config->OutputFile + ": " + toString(BufferOrErr.takeError())); else Buffer = std::move(*BufferOrErr); } void Writer::createHeader() { raw_string_ostream OS(Header); writeBytes(OS, WasmMagic, sizeof(WasmMagic), "wasm magic"); writeU32(OS, WasmVersion, "wasm version"); OS.flush(); FileSize += Header.size(); } void lld::wasm::writeResult() { Writer().run(); }