diff options
author | Dimitry Andric <dim@FreeBSD.org> | 2019-01-19 10:05:49 +0000 |
---|---|---|
committer | Dimitry Andric <dim@FreeBSD.org> | 2019-01-19 10:05:49 +0000 |
commit | e2fd426bdafe9f5c10066d3926ece6e342184a67 (patch) | |
tree | bfbbb5fd38554e6b8988b7a217e9fd0623728d7d /wasm | |
parent | 84c4061b34e048f47e5eb4fbabc1558495e8157c (diff) |
Vendor import of lld trunk r351319 (just before the release_80 branchvendor/lld/lld-trunk-r351319
Notes
Notes:
svn path=/vendor/lld/dist/; revision=343179
svn path=/vendor/lld/lld-trunk-r351319/; revision=343180; tag=vendor/lld/lld-trunk-r351319
Diffstat (limited to 'wasm')
-rw-r--r-- | wasm/Config.h | 9 | ||||
-rw-r--r-- | wasm/Driver.cpp | 288 | ||||
-rw-r--r-- | wasm/InputChunks.cpp | 27 | ||||
-rw-r--r-- | wasm/InputChunks.h | 40 | ||||
-rw-r--r-- | wasm/InputEvent.h | 63 | ||||
-rw-r--r-- | wasm/InputFiles.cpp | 93 | ||||
-rw-r--r-- | wasm/InputFiles.h | 22 | ||||
-rw-r--r-- | wasm/InputGlobal.h | 3 | ||||
-rw-r--r-- | wasm/LTO.cpp | 17 | ||||
-rw-r--r-- | wasm/MarkLive.cpp | 6 | ||||
-rw-r--r-- | wasm/Options.td | 49 | ||||
-rw-r--r-- | wasm/OutputSections.cpp | 16 | ||||
-rw-r--r-- | wasm/OutputSections.h | 8 | ||||
-rw-r--r-- | wasm/OutputSegment.h | 2 | ||||
-rw-r--r-- | wasm/SymbolTable.cpp | 147 | ||||
-rw-r--r-- | wasm/SymbolTable.h | 11 | ||||
-rw-r--r-- | wasm/Symbols.cpp | 52 | ||||
-rw-r--r-- | wasm/Symbols.h | 93 | ||||
-rw-r--r-- | wasm/Writer.cpp | 190 | ||||
-rw-r--r-- | wasm/WriterUtils.cpp | 82 | ||||
-rw-r--r-- | wasm/WriterUtils.h | 13 |
21 files changed, 842 insertions, 389 deletions
diff --git a/wasm/Config.h b/wasm/Config.h index 76a780567072..0857a645f1e8 100644 --- a/wasm/Config.h +++ b/wasm/Config.h @@ -20,18 +20,22 @@ namespace wasm { struct Configuration { bool AllowUndefined; - bool CompressRelocTargets; + bool CompressRelocations; bool Demangle; bool DisableVerify; bool ExportAll; + bool ExportDynamic; bool ExportTable; bool GcSections; bool ImportMemory; + bool SharedMemory; bool ImportTable; bool MergeDataSegments; + bool Pie; bool PrintGcSections; bool Relocatable; bool SaveTemps; + bool Shared; bool StripAll; bool StripDebug; bool StackFirst; @@ -50,6 +54,9 @@ struct Configuration { llvm::StringSet<> AllowUndefinedSymbols; std::vector<llvm::StringRef> SearchPaths; llvm::CachePruningPolicy ThinLTOCachePolicy; + + // True if we are creating position-independent code. + bool Pic; }; // The only instance of Configuration struct. diff --git a/wasm/Driver.cpp b/wasm/Driver.cpp index 329b5ae80a9c..fab4c0c4ed8b 100644 --- a/wasm/Driver.cpp +++ b/wasm/Driver.cpp @@ -31,6 +31,7 @@ #define DEBUG_TYPE "lld" using namespace llvm; +using namespace llvm::object; using namespace llvm::sys; using namespace llvm::wasm; @@ -78,7 +79,7 @@ private: bool lld::wasm::link(ArrayRef<const char *> Args, bool CanExitEarly, raw_ostream &Error) { - errorHandler().LogName = sys::path::filename(Args[0]); + errorHandler().LogName = args::getFilenameWithoutExe(Args[0]); errorHandler().ErrorOS = &Error; errorHandler().ColorDiagnostics = Error.has_colors(); errorHandler().ErrorLimitExceededMsg = @@ -186,8 +187,7 @@ static void readImportFile(StringRef Filename) { // Returns slices of MB by parsing MB as an archive file. // Each slice consists of a member file in the archive. -std::vector<MemoryBufferRef> static getArchiveMembers( - MemoryBufferRef MB) { +std::vector<MemoryBufferRef> static getArchiveMembers(MemoryBufferRef MB) { std::unique_ptr<Archive> File = CHECK(Archive::create(MB), MB.getBufferIdentifier() + ": failed to parse archive"); @@ -205,8 +205,8 @@ std::vector<MemoryBufferRef> static getArchiveMembers( V.push_back(MBRef); } if (Err) - fatal(MB.getBufferIdentifier() + ": Archive::children failed: " + - toString(std::move(Err))); + fatal(MB.getBufferIdentifier() + + ": Archive::children failed: " + toString(std::move(Err))); // Take ownership of memory buffers created for members of thin archives. for (std::unique_ptr<MemoryBuffer> &MB : File->takeThinBuffers()) @@ -306,17 +306,14 @@ static void handleWeakUndefines() { // It is possible for undefined functions not to have a signature (eg. if // added via "--undefined"), but weak undefined ones do have a signature. - assert(FuncSym->FunctionType); - const WasmSignature &Sig = *FuncSym->FunctionType; + assert(FuncSym->Signature); + const WasmSignature &Sig = *FuncSym->Signature; // Add a synthetic dummy for weak undefined functions. These dummies will // be GC'd if not used as the target of any "call" instructions. - Optional<std::string> SymName = demangleItanium(Sym->getName()); - StringRef DebugName = - Saver.save("undefined function " + - (SymName ? StringRef(*SymName) : Sym->getName())); - SyntheticFunction *Func = - make<SyntheticFunction>(Sig, Sym->getName(), DebugName); + std::string SymName = toString(*Sym); + StringRef DebugName = Saver.save("undefined function " + SymName); + auto *Func = make<SyntheticFunction>(Sig, Sym->getName(), DebugName); Func->setBody(UnreachableFn); // Ensure it compares equal to the null pointer, and so that table relocs // don't pull in the stub body (only call-operand relocs should do that). @@ -328,51 +325,24 @@ static void handleWeakUndefines() { } } -// Force Sym to be entered in the output. Used for -u or equivalent. -static Symbol *addUndefined(StringRef Name) { - Symbol *S = Symtab->addUndefinedFunction(Name, 0, nullptr, nullptr); - - // Since symbol S may not be used inside the program, LTO may - // eliminate it. Mark the symbol as "used" to prevent it. - S->IsUsedInRegularObj = true; - - return S; -} - -void LinkerDriver::link(ArrayRef<const char *> ArgsArr) { - WasmOptTable Parser; - opt::InputArgList Args = Parser.parse(ArgsArr.slice(1)); - - // Handle --help - if (Args.hasArg(OPT_help)) { - Parser.PrintHelp(outs(), ArgsArr[0], "LLVM Linker", false); - return; - } - - // Handle --version - if (Args.hasArg(OPT_version) || Args.hasArg(OPT_v)) { - outs() << getLLDVersion() << "\n"; - return; - } - - // Parse and evaluate -mllvm options. - std::vector<const char *> V; - V.push_back("wasm-ld (LLVM option parsing)"); - for (auto *Arg : Args.filtered(OPT_mllvm)) - V.push_back(Arg->getValue()); - cl::ParseCommandLineOptions(V.size(), V.data()); - - errorHandler().ErrorLimit = args::getInteger(Args, OPT_error_limit, 20); - +// Some Config members do not directly correspond to any particular +// command line options, but computed based on other Config values. +// This function initialize such members. See Config.h for the details +// of these values. +static void setConfigs(opt::InputArgList &Args) { Config->AllowUndefined = Args.hasArg(OPT_allow_undefined); + Config->CompressRelocations = Args.hasArg(OPT_compress_relocations); Config->Demangle = Args.hasFlag(OPT_demangle, OPT_no_demangle, true); Config->DisableVerify = Args.hasArg(OPT_disable_verify); Config->Entry = getEntry(Args, Args.hasArg(OPT_relocatable) ? "" : "_start"); Config->ExportAll = Args.hasArg(OPT_export_all); + Config->ExportDynamic = Args.hasFlag(OPT_export_dynamic, + OPT_no_export_dynamic, false); Config->ExportTable = Args.hasArg(OPT_export_table); errorHandler().FatalWarnings = Args.hasFlag(OPT_fatal_warnings, OPT_no_fatal_warnings, false); Config->ImportMemory = Args.hasArg(OPT_import_memory); + Config->SharedMemory = Args.hasArg(OPT_shared_memory); Config->ImportTable = Args.hasArg(OPT_import_table); Config->LTOO = args::getInteger(Args, OPT_lto_O, 2); Config->LTOPartitions = args::getInteger(Args, OPT_lto_partitions, 1); @@ -384,10 +354,12 @@ void LinkerDriver::link(ArrayRef<const char *> ArgsArr) { Config->MergeDataSegments = Args.hasFlag(OPT_merge_data_segments, OPT_no_merge_data_segments, !Config->Relocatable); + Config->Pie = Args.hasFlag(OPT_pie, OPT_no_pie, false); Config->PrintGcSections = Args.hasFlag(OPT_print_gc_sections, OPT_no_print_gc_sections, false); Config->SaveTemps = Args.hasArg(OPT_save_temps); Config->SearchPaths = args::getStrings(Args, OPT_L); + Config->Shared = Args.hasArg(OPT_shared); Config->StripAll = Args.hasArg(OPT_strip_all); Config->StripDebug = Args.hasArg(OPT_strip_debug); Config->StackFirst = Args.hasArg(OPT_stack_first); @@ -404,8 +376,14 @@ void LinkerDriver::link(ArrayRef<const char *> ArgsArr) { Config->MaxMemory = args::getInteger(Args, OPT_max_memory, 0); Config->ZStackSize = args::getZOptionValue(Args, OPT_z, "stack-size", WasmPageSize); +} - Config->CompressRelocTargets = Config->Optimize > 0 && !Config->Relocatable; +// Some command line options or some combinations of them are not allowed. +// This function checks for such errors. +static void checkOptions(opt::InputArgList &Args) { + if (!Config->StripDebug && !Config->StripAll && Config->CompressRelocations) + error("--compress-relocations is incompatible with output debug" + " information. Please pass --strip-debug or --strip-all"); if (Config->LTOO > 3) error("invalid optimization level for LTO: " + Twine(Config->LTOO)); @@ -414,13 +392,8 @@ void LinkerDriver::link(ArrayRef<const char *> ArgsArr) { if (Config->ThinLTOJobs == 0) error("--thinlto-jobs: number of threads must be > 0"); - if (auto *Arg = Args.getLastArg(OPT_allow_undefined_file)) - readImportFile(Arg->getValue()); - - if (!Args.hasArg(OPT_INPUT)) { - error("no input files"); - return; - } + if (Config->Pie && Config->Shared) + error("-shared and -pie may not be used together"); if (Config->OutputFile.empty()) error("no output file specified"); @@ -433,46 +406,151 @@ void LinkerDriver::link(ArrayRef<const char *> ArgsArr) { error("entry point specified for relocatable output file"); if (Config->GcSections) error("-r and --gc-sections may not be used together"); + if (Config->CompressRelocations) + error("-r -and --compress-relocations may not be used together"); if (Args.hasArg(OPT_undefined)) error("-r -and --undefined may not be used together"); + if (Config->Pie) + error("-r and -pie may not be used together"); } +} - Symbol *EntrySym = nullptr; - if (!Config->Relocatable) { +// Force Sym to be entered in the output. Used for -u or equivalent. +static Symbol *handleUndefined(StringRef Name) { + Symbol *Sym = Symtab->find(Name); + if (!Sym) + return nullptr; + + // Since symbol S may not be used inside the program, LTO may + // eliminate it. Mark the symbol as "used" to prevent it. + Sym->IsUsedInRegularObj = true; + + if (auto *LazySym = dyn_cast<LazySymbol>(Sym)) + LazySym->fetch(); + + return Sym; +} + +static UndefinedGlobal * +createUndefinedGlobal(StringRef Name, llvm::wasm::WasmGlobalType *Type) { + auto *Sym = + cast<UndefinedGlobal>(Symtab->addUndefinedGlobal(Name, 0, nullptr, Type)); + Config->AllowUndefinedSymbols.insert(Sym->getName()); + Sym->IsUsedInRegularObj = true; + return Sym; +} + +// Create ABI-defined synthetic symbols +static void createSyntheticSymbols() { + static WasmSignature NullSignature = {{}, {}}; + static llvm::wasm::WasmGlobalType GlobalTypeI32 = {WASM_TYPE_I32, false}; + static llvm::wasm::WasmGlobalType MutableGlobalTypeI32 = {WASM_TYPE_I32, + true}; + + if (!Config->Relocatable) + WasmSym::CallCtors = Symtab->addSyntheticFunction( + "__wasm_call_ctors", WASM_SYMBOL_VISIBILITY_HIDDEN, + make<SyntheticFunction>(NullSignature, "__wasm_call_ctors")); + + // The __stack_pointer is imported in the shared library case, and exported + // in the non-shared (executable) case. + if (Config->Shared) { + WasmSym::StackPointer = + createUndefinedGlobal("__stack_pointer", &MutableGlobalTypeI32); + } else { llvm::wasm::WasmGlobal Global; Global.Type = {WASM_TYPE_I32, true}; Global.InitExpr.Value.Int32 = 0; Global.InitExpr.Opcode = WASM_OPCODE_I32_CONST; Global.SymbolName = "__stack_pointer"; - InputGlobal *StackPointer = make<InputGlobal>(Global, nullptr); + auto *StackPointer = make<InputGlobal>(Global, nullptr); StackPointer->Live = true; - - static WasmSignature NullSignature = {{}, WASM_TYPE_NORESULT}; - - // Add synthetic symbols before any others - WasmSym::CallCtors = Symtab->addSyntheticFunction( - "__wasm_call_ctors", WASM_SYMBOL_VISIBILITY_HIDDEN, - make<SyntheticFunction>(NullSignature, "__wasm_call_ctors")); + // For non-PIC code // TODO(sbc): Remove WASM_SYMBOL_VISIBILITY_HIDDEN when the mutable global // spec proposal is implemented in all major browsers. // See: https://github.com/WebAssembly/mutable-global WasmSym::StackPointer = Symtab->addSyntheticGlobal( "__stack_pointer", WASM_SYMBOL_VISIBILITY_HIDDEN, StackPointer); WasmSym::HeapBase = Symtab->addSyntheticDataSymbol("__heap_base", 0); - WasmSym::DsoHandle = Symtab->addSyntheticDataSymbol( - "__dso_handle", WASM_SYMBOL_VISIBILITY_HIDDEN); WasmSym::DataEnd = Symtab->addSyntheticDataSymbol("__data_end", 0); - // For now, since we don't actually use the start function as the - // wasm start symbol, we don't need to care about it signature. - if (!Config->Entry.empty()) - EntrySym = addUndefined(Config->Entry); + // These two synthetic symbols exist purely for the embedder so we always + // want to export them. + WasmSym::HeapBase->ForceExport = true; + WasmSym::DataEnd->ForceExport = true; + } + + if (Config->Pic) { + // For PIC code, we import two global variables (__memory_base and + // __table_base) from the environment and use these as the offset at + // which to load our static data and function table. + // See: + // https://github.com/WebAssembly/tool-conventions/blob/master/DynamicLinking.md + WasmSym::MemoryBase = + createUndefinedGlobal("__memory_base", &GlobalTypeI32); + WasmSym::TableBase = createUndefinedGlobal("__table_base", &GlobalTypeI32); + WasmSym::MemoryBase->markLive(); + WasmSym::TableBase->markLive(); + } + + WasmSym::DsoHandle = Symtab->addSyntheticDataSymbol( + "__dso_handle", WASM_SYMBOL_VISIBILITY_HIDDEN); +} + +void LinkerDriver::link(ArrayRef<const char *> ArgsArr) { + WasmOptTable Parser; + opt::InputArgList Args = Parser.parse(ArgsArr.slice(1)); + + // Handle --help + if (Args.hasArg(OPT_help)) { + Parser.PrintHelp(outs(), + (std::string(ArgsArr[0]) + " [options] file...").c_str(), + "LLVM Linker", false); + return; + } - // Handle the `--undefined <sym>` options. - for (auto *Arg : Args.filtered(OPT_undefined)) - addUndefined(Arg->getValue()); + // Handle --version + if (Args.hasArg(OPT_version) || Args.hasArg(OPT_v)) { + outs() << getLLDVersion() << "\n"; + return; } + // Parse and evaluate -mllvm options. + std::vector<const char *> V; + V.push_back("wasm-ld (LLVM option parsing)"); + for (auto *Arg : Args.filtered(OPT_mllvm)) + V.push_back(Arg->getValue()); + cl::ParseCommandLineOptions(V.size(), V.data()); + + errorHandler().ErrorLimit = args::getInteger(Args, OPT_error_limit, 20); + + setConfigs(Args); + checkOptions(Args); + + if (auto *Arg = Args.getLastArg(OPT_allow_undefined_file)) + readImportFile(Arg->getValue()); + + if (!Args.hasArg(OPT_INPUT)) { + error("no input files"); + return; + } + + Config->Pic = Config->Pie || Config->Shared; + + if (Config->Pic) { + if (Config->ExportTable) + error("-shared/-pie is incompatible with --export-table"); + Config->ImportTable = true; + } + + if (Config->Shared) { + Config->ExportDynamic = true; + Config->AllowUndefined = true; + } + + if (!Config->Relocatable) + createSyntheticSymbols(); + createFiles(Args); if (errorCount()) return; @@ -484,44 +562,46 @@ void LinkerDriver::link(ArrayRef<const char *> ArgsArr) { if (errorCount()) return; - // Add synthetic dummies for weak undefined functions. - if (!Config->Relocatable) - handleWeakUndefines(); + // Handle the `--undefined <sym>` options. + for (auto *Arg : Args.filtered(OPT_undefined)) + handleUndefined(Arg->getValue()); - // Handle --export. + // Handle the `--export <sym>` options + // This works like --undefined but also exports the symbol if its found for (auto *Arg : Args.filtered(OPT_export)) { - StringRef Name = Arg->getValue(); - Symbol *Sym = Symtab->find(Name); + Symbol *Sym = handleUndefined(Arg->getValue()); if (Sym && Sym->isDefined()) Sym->ForceExport = true; else if (!Config->AllowUndefined) - error("symbol exported via --export not found: " + Name); + error(Twine("symbol exported via --export not found: ") + + Arg->getValue()); } - // Do link-time optimization if given files are LLVM bitcode files. - // This compiles bitcode files into real object files. - Symtab->addCombinedLTOObject(); - if (errorCount()) - return; + Symbol *EntrySym = nullptr; + if (!Config->Relocatable) { + // Add synthetic dummies for weak undefined functions. + handleWeakUndefines(); - // Make sure we have resolved all symbols. - if (!Config->Relocatable && !Config->AllowUndefined) { - Symtab->reportRemainingUndefines(); - } else { - // Even when using --allow-undefined we still want to report the absence of - // our initial set of undefined symbols (i.e. the entry point and symbols - // specified via --undefined). - // Part of the reason for this is that these function don't have signatures - // so which means they cannot be written as wasm function imports. - for (auto *Arg : Args.filtered(OPT_undefined)) { - Symbol *Sym = Symtab->find(Arg->getValue()); - if (!Sym->isDefined()) - error("symbol forced with --undefined not found: " + Sym->getName()); + if (!Config->Shared && !Config->Entry.empty()) { + EntrySym = handleUndefined(Config->Entry); + if (EntrySym && EntrySym->isDefined()) + EntrySym->ForceExport = true; + else + error("entry symbol not defined (pass --no-entry to supress): " + + Config->Entry); } - if (EntrySym && !EntrySym->isDefined()) - error("entry symbol not defined (pass --no-entry to supress): " + - EntrySym->getName()); + + // Make sure we have resolved all symbols. + if (!Config->AllowUndefined) + Symtab->reportRemainingUndefines(); } + + if (errorCount()) + return; + + // Do link-time optimization if given files are LLVM bitcode files. + // This compiles bitcode files into real object files. + Symtab->addCombinedLTOObject(); if (errorCount()) return; diff --git a/wasm/InputChunks.cpp b/wasm/InputChunks.cpp index fcefac7d99b8..1145c670253c 100644 --- a/wasm/InputChunks.cpp +++ b/wasm/InputChunks.cpp @@ -25,7 +25,9 @@ using namespace lld::wasm; static StringRef ReloctTypeToString(uint8_t RelocType) { switch (RelocType) { -#define WASM_RELOC(NAME, REL) case REL: return #NAME; +#define WASM_RELOC(NAME, REL) \ + case REL: \ + return #NAME; #include "llvm/BinaryFormat/WasmRelocs.def" #undef WASM_RELOC } @@ -43,16 +45,6 @@ StringRef InputChunk::getComdatName() const { return File->getWasmObj()->linkingData().Comdats[Index]; } -void InputChunk::copyRelocations(const WasmSection &Section) { - if (Section.Relocations.empty()) - return; - size_t Start = getInputSectionOffset(); - size_t Size = getInputSize(); - for (const WasmRelocation &R : Section.Relocations) - if (R.Offset >= Start && R.Offset < Start + Size) - Relocations.push_back(R); -} - void InputChunk::verifyRelocTargets() const { for (const WasmRelocation &Rel : Relocations) { uint32_t ExistingValue; @@ -63,6 +55,7 @@ void InputChunk::verifyRelocTargets() const { case R_WEBASSEMBLY_TYPE_INDEX_LEB: case R_WEBASSEMBLY_FUNCTION_INDEX_LEB: case R_WEBASSEMBLY_GLOBAL_INDEX_LEB: + case R_WEBASSEMBLY_EVENT_INDEX_LEB: case R_WEBASSEMBLY_MEMORY_ADDR_LEB: ExistingValue = decodeULEB128(Loc, &BytesRead); break; @@ -119,6 +112,7 @@ void InputChunk::writeTo(uint8_t *Buf) const { case R_WEBASSEMBLY_TYPE_INDEX_LEB: case R_WEBASSEMBLY_FUNCTION_INDEX_LEB: case R_WEBASSEMBLY_GLOBAL_INDEX_LEB: + case R_WEBASSEMBLY_EVENT_INDEX_LEB: case R_WEBASSEMBLY_MEMORY_ADDR_LEB: encodeULEB128(Value, Loc, 5); break; @@ -188,6 +182,7 @@ static unsigned writeCompressedReloc(uint8_t *Buf, const WasmRelocation &Rel, case R_WEBASSEMBLY_TYPE_INDEX_LEB: case R_WEBASSEMBLY_FUNCTION_INDEX_LEB: case R_WEBASSEMBLY_GLOBAL_INDEX_LEB: + case R_WEBASSEMBLY_EVENT_INDEX_LEB: case R_WEBASSEMBLY_MEMORY_ADDR_LEB: return encodeULEB128(Value, Buf); case R_WEBASSEMBLY_TABLE_INDEX_SLEB: @@ -203,6 +198,7 @@ static unsigned getRelocWidthPadded(const WasmRelocation &Rel) { case R_WEBASSEMBLY_TYPE_INDEX_LEB: case R_WEBASSEMBLY_FUNCTION_INDEX_LEB: case R_WEBASSEMBLY_GLOBAL_INDEX_LEB: + case R_WEBASSEMBLY_EVENT_INDEX_LEB: case R_WEBASSEMBLY_MEMORY_ADDR_LEB: case R_WEBASSEMBLY_TABLE_INDEX_SLEB: case R_WEBASSEMBLY_MEMORY_ADDR_SLEB: @@ -228,7 +224,7 @@ static unsigned getRelocWidth(const WasmRelocation &Rel, uint32_t Value) { // This function only computes the final output size. It must be called // before getSize() is used to calculate of layout of the code section. void InputFunction::calculateSize() { - if (!File || !Config->CompressRelocTargets) + if (!File || !Config->CompressRelocations) return; LLVM_DEBUG(dbgs() << "calculateSize: " << getName() << "\n"); @@ -242,7 +238,7 @@ void InputFunction::calculateSize() { uint32_t End = Start + Function->Size; uint32_t LastRelocEnd = Start + FunctionSizeLength; - for (WasmRelocation &Rel : Relocations) { + for (const WasmRelocation &Rel : Relocations) { LLVM_DEBUG(dbgs() << " region: " << (Rel.Offset - LastRelocEnd) << "\n"); CompressedFuncSize += Rel.Offset - LastRelocEnd; CompressedFuncSize += getRelocWidth(Rel, File->calcNewValue(Rel)); @@ -263,11 +259,12 @@ void InputFunction::calculateSize() { // Override the default writeTo method so that we can (optionally) write the // compressed version of the function. void InputFunction::writeTo(uint8_t *Buf) const { - if (!File || !Config->CompressRelocTargets) + if (!File || !Config->CompressRelocations) return InputChunk::writeTo(Buf); Buf += OutputOffset; - uint8_t *Orig = Buf; (void)Orig; + uint8_t *Orig = Buf; + (void)Orig; const uint8_t *SecStart = File->CodeSection->Content.data(); const uint8_t *FuncStart = SecStart + getInputSectionOffset(); diff --git a/wasm/InputChunks.h b/wasm/InputChunks.h index 526e29870b21..a3bcbb266ec5 100644 --- a/wasm/InputChunks.h +++ b/wasm/InputChunks.h @@ -24,18 +24,9 @@ #include "Config.h" #include "InputFiles.h" #include "lld/Common/ErrorHandler.h" +#include "lld/Common/LLVM.h" #include "llvm/Object/Wasm.h" -using llvm::object::WasmSection; -using llvm::object::WasmSegment; -using llvm::wasm::WasmFunction; -using llvm::wasm::WasmRelocation; -using llvm::wasm::WasmSignature; - -namespace llvm { -class raw_ostream; -} - namespace lld { namespace wasm { @@ -49,17 +40,18 @@ public: Kind kind() const { return SectionKind; } virtual uint32_t getSize() const { return data().size(); } - - void copyRelocations(const WasmSection &Section); + virtual uint32_t getInputSize() const { return getSize(); }; virtual void writeTo(uint8_t *SectionStart) const; ArrayRef<WasmRelocation> getRelocations() const { return Relocations; } + void setRelocations(ArrayRef<WasmRelocation> Rs) { Relocations = Rs; } virtual StringRef getName() const = 0; virtual StringRef getDebugName() const = 0; virtual uint32_t getComdat() const = 0; StringRef getComdatName() const; + virtual uint32_t getInputSectionOffset() const = 0; size_t NumRelocations() const { return Relocations.size(); } void writeRelocations(llvm::raw_ostream &OS) const; @@ -77,14 +69,12 @@ protected: : File(F), Live(!Config->GcSections), SectionKind(K) {} virtual ~InputChunk() = default; virtual ArrayRef<uint8_t> data() const = 0; - virtual uint32_t getInputSectionOffset() const = 0; - virtual uint32_t getInputSize() const { return getSize(); }; // Verifies the existing data at relocation targets matches our expectations. // This is performed only debug builds as an extra sanity check. void verifyRelocTargets() const; - std::vector<WasmRelocation> Relocations; + ArrayRef<WasmRelocation> Relocations; Kind SectionKind; }; @@ -107,15 +97,15 @@ public: StringRef getName() const override { return Segment.Data.Name; } StringRef getDebugName() const override { return StringRef(); } uint32_t getComdat() const override { return Segment.Data.Comdat; } + uint32_t getInputSectionOffset() const override { + return Segment.SectionOffset; + } const OutputSegment *OutputSeg = nullptr; int32_t OutputSegmentOffset = 0; protected: ArrayRef<uint8_t> data() const override { return Segment.Data.Content; } - uint32_t getInputSectionOffset() const override { - return Segment.SectionOffset; - } const WasmSegment &Segment; }; @@ -139,15 +129,19 @@ public: uint32_t getFunctionInputOffset() const { return getInputSectionOffset(); } uint32_t getFunctionCodeOffset() const { return Function->CodeOffset; } uint32_t getSize() const override { - if (Config->CompressRelocTargets && File) { + if (Config->CompressRelocations && File) { assert(CompressedSize); return CompressedSize; } return data().size(); } + uint32_t getInputSize() const override { return Function->Size; } uint32_t getFunctionIndex() const { return FunctionIndex.getValue(); } bool hasFunctionIndex() const { return FunctionIndex.hasValue(); } void setFunctionIndex(uint32_t Index); + uint32_t getInputSectionOffset() const override { + return Function->CodeSectionOffset; + } uint32_t getTableIndex() const { return TableIndex.getValue(); } bool hasTableIndex() const { return TableIndex.hasValue(); } void setTableIndex(uint32_t Index); @@ -162,17 +156,11 @@ public: protected: ArrayRef<uint8_t> data() const override { - assert(!Config->CompressRelocTargets); + assert(!Config->CompressRelocations); return File->CodeSection->Content.slice(getInputSectionOffset(), Function->Size); } - uint32_t getInputSize() const override { return Function->Size; } - - uint32_t getInputSectionOffset() const override { - return Function->CodeSectionOffset; - } - const WasmFunction *Function; llvm::Optional<uint32_t> FunctionIndex; llvm::Optional<uint32_t> TableIndex; diff --git a/wasm/InputEvent.h b/wasm/InputEvent.h new file mode 100644 index 000000000000..d7c12627bd3d --- /dev/null +++ b/wasm/InputEvent.h @@ -0,0 +1,63 @@ +//===- InputEvent.h ---------------------------------------------*- C++ -*-===// +// +// The LLVM Linker +// +// This file is distributed under the University of Illinois Open Source +// License. See LICENSE.TXT for details. +// +//===----------------------------------------------------------------------===// +// +// Wasm events are features that suspend the current execution and transfer the +// control flow to a corresponding handler. Currently the only supported event +// kind is exceptions. +// +//===----------------------------------------------------------------------===// + +#ifndef LLD_WASM_INPUT_EVENT_H +#define LLD_WASM_INPUT_EVENT_H + +#include "Config.h" +#include "InputFiles.h" +#include "WriterUtils.h" +#include "lld/Common/ErrorHandler.h" +#include "llvm/Object/Wasm.h" + +namespace lld { +namespace wasm { + +// Represents a single Wasm Event within an input file. These are combined to +// form the final EVENTS section. +class InputEvent { +public: + InputEvent(const WasmSignature &S, const WasmEvent &E, ObjFile *F) + : File(F), Event(E), Signature(S), Live(!Config->GcSections) {} + + StringRef getName() const { return Event.SymbolName; } + const WasmEventType &getType() const { return Event.Type; } + + uint32_t getEventIndex() const { return EventIndex.getValue(); } + bool hasEventIndex() const { return EventIndex.hasValue(); } + void setEventIndex(uint32_t Index) { + assert(!hasEventIndex()); + EventIndex = Index; + } + + ObjFile *File; + WasmEvent Event; + const WasmSignature &Signature; + + bool Live = false; + +protected: + llvm::Optional<uint32_t> EventIndex; +}; + +} // namespace wasm + +inline std::string toString(const wasm::InputEvent *E) { + return (toString(E->File) + ":(" + E->getName() + ")").str(); +} + +} // namespace lld + +#endif // LLD_WASM_INPUT_EVENT_H diff --git a/wasm/InputFiles.cpp b/wasm/InputFiles.cpp index 53a24c3cffd4..e5da23db3773 100644 --- a/wasm/InputFiles.cpp +++ b/wasm/InputFiles.cpp @@ -10,6 +10,7 @@ #include "InputFiles.h" #include "Config.h" #include "InputChunks.h" +#include "InputEvent.h" #include "InputGlobal.h" #include "SymbolTable.h" #include "lld/Common/ErrorHandler.h" @@ -57,12 +58,13 @@ void ObjFile::dumpInfo() const { log("info for: " + getName() + "\n Symbols : " + Twine(Symbols.size()) + "\n Function Imports : " + Twine(WasmObj->getNumImportedFunctions()) + - "\n Global Imports : " + Twine(WasmObj->getNumImportedGlobals())); + "\n Global Imports : " + Twine(WasmObj->getNumImportedGlobals()) + + "\n Event Imports : " + Twine(WasmObj->getNumImportedEvents())); } // Relocations contain either symbol or type indices. This function takes a // relocation and returns relocated index (i.e. translates from the input -// sybmol/type space to the output symbol/type space). +// symbol/type space to the output symbol/type space). uint32_t ObjFile::calcNewIndex(const WasmRelocation &Reloc) const { if (Reloc.Type == R_WEBASSEMBLY_TYPE_INDEX_LEB) { assert(TypeIsUsed[Reloc.Index]); @@ -94,16 +96,17 @@ uint32_t ObjFile::calcExpectedValue(const WasmRelocation &Reloc) const { switch (Reloc.Type) { case R_WEBASSEMBLY_TABLE_INDEX_I32: case R_WEBASSEMBLY_TABLE_INDEX_SLEB: { - const WasmSymbol& Sym = WasmObj->syms()[Reloc.Index]; + const WasmSymbol &Sym = WasmObj->syms()[Reloc.Index]; return TableEntries[Sym.Info.ElementIndex]; } case R_WEBASSEMBLY_MEMORY_ADDR_SLEB: case R_WEBASSEMBLY_MEMORY_ADDR_I32: case R_WEBASSEMBLY_MEMORY_ADDR_LEB: { - const WasmSymbol& Sym = WasmObj->syms()[Reloc.Index]; + const WasmSymbol &Sym = WasmObj->syms()[Reloc.Index]; if (Sym.isUndefined()) return 0; - const WasmSegment& Segment = WasmObj->dataSegments()[Sym.Info.DataRef.Segment]; + const WasmSegment &Segment = + WasmObj->dataSegments()[Sym.Info.DataRef.Segment]; return Segment.Data.Offset.Value.Int32 + Sym.Info.DataRef.Offset + Reloc.Addend; } @@ -118,8 +121,9 @@ uint32_t ObjFile::calcExpectedValue(const WasmRelocation &Reloc) const { case R_WEBASSEMBLY_TYPE_INDEX_LEB: return Reloc.Index; case R_WEBASSEMBLY_FUNCTION_INDEX_LEB: - case R_WEBASSEMBLY_GLOBAL_INDEX_LEB: { - const WasmSymbol& Sym = WasmObj->syms()[Reloc.Index]; + case R_WEBASSEMBLY_GLOBAL_INDEX_LEB: + case R_WEBASSEMBLY_EVENT_INDEX_LEB: { + const WasmSymbol &Sym = WasmObj->syms()[Reloc.Index]; return Sym.Info.ElementIndex; } default: @@ -146,10 +150,13 @@ uint32_t ObjFile::calcNewValue(const WasmRelocation &Reloc) const { return getFunctionSymbol(Reloc.Index)->getFunctionIndex(); case R_WEBASSEMBLY_GLOBAL_INDEX_LEB: return getGlobalSymbol(Reloc.Index)->getGlobalIndex(); + case R_WEBASSEMBLY_EVENT_INDEX_LEB: + return getEventSymbol(Reloc.Index)->getEventIndex(); case R_WEBASSEMBLY_FUNCTION_OFFSET_I32: if (auto *Sym = dyn_cast<DefinedFunction>(getFunctionSymbol(Reloc.Index))) { - return Sym->Function->OutputOffset + - Sym->Function->getFunctionCodeOffset() + Reloc.Addend; + if (Sym->isLive()) + return Sym->Function->OutputOffset + + Sym->Function->getFunctionCodeOffset() + Reloc.Addend; } return 0; case R_WEBASSEMBLY_SECTION_OFFSET_I32: @@ -159,6 +166,37 @@ uint32_t ObjFile::calcNewValue(const WasmRelocation &Reloc) const { } } +template <class T> +static void setRelocs(const std::vector<T *> &Chunks, + const WasmSection *Section) { + if (!Section) + return; + + ArrayRef<WasmRelocation> Relocs = Section->Relocations; + assert(std::is_sorted(Relocs.begin(), Relocs.end(), + [](const WasmRelocation &R1, const WasmRelocation &R2) { + return R1.Offset < R2.Offset; + })); + assert(std::is_sorted( + Chunks.begin(), Chunks.end(), [](InputChunk *C1, InputChunk *C2) { + return C1->getInputSectionOffset() < C2->getInputSectionOffset(); + })); + + auto RelocsNext = Relocs.begin(); + auto RelocsEnd = Relocs.end(); + auto RelocLess = [](const WasmRelocation &R, uint32_t Val) { + return R.Offset < Val; + }; + for (InputChunk *C : Chunks) { + auto RelocsStart = std::lower_bound(RelocsNext, RelocsEnd, + C->getInputSectionOffset(), RelocLess); + RelocsNext = std::lower_bound( + RelocsStart, RelocsEnd, C->getInputSectionOffset() + C->getInputSize(), + RelocLess); + C->setRelocations(ArrayRef<WasmRelocation>(RelocsStart, RelocsNext)); + } +} + void ObjFile::parse() { // Parse a memory buffer as a wasm file. LLVM_DEBUG(dbgs() << "Parsing object: " << toString(this) << "\n"); @@ -200,7 +238,7 @@ void ObjFile::parse() { DataSection = &Section; } else if (Section.Type == WASM_SEC_CUSTOM) { CustomSections.emplace_back(make<InputSection>(Section, this)); - CustomSections.back()->copyRelocations(Section); + CustomSections.back()->setRelocations(Section.Relocations); CustomSectionsByIndex[SectionIndex] = CustomSections.back(); } SectionIndex++; @@ -215,11 +253,9 @@ void ObjFile::parse() { UsedComdats[I] = Symtab->addComdat(Comdats[I]); // Populate `Segments`. - for (const WasmSegment &S : WasmObj->dataSegments()) { - InputSegment *Seg = make<InputSegment>(S, this); - Seg->copyRelocations(*DataSection); - Segments.emplace_back(Seg); - } + for (const WasmSegment &S : WasmObj->dataSegments()) + Segments.emplace_back(make<InputSegment>(S, this)); + setRelocs(Segments, DataSection); // Populate `Functions`. ArrayRef<WasmFunction> Funcs = WasmObj->functions(); @@ -227,17 +263,19 @@ void ObjFile::parse() { ArrayRef<WasmSignature> Types = WasmObj->types(); Functions.reserve(Funcs.size()); - for (size_t I = 0, E = Funcs.size(); I != E; ++I) { - InputFunction *F = - make<InputFunction>(Types[FuncTypes[I]], &Funcs[I], this); - F->copyRelocations(*CodeSection); - Functions.emplace_back(F); - } + for (size_t I = 0, E = Funcs.size(); I != E; ++I) + Functions.emplace_back( + make<InputFunction>(Types[FuncTypes[I]], &Funcs[I], this)); + setRelocs(Functions, CodeSection); // Populate `Globals`. for (const WasmGlobal &G : WasmObj->globals()) Globals.emplace_back(make<InputGlobal>(G, this)); + // Populate `Events`. + for (const WasmEvent &E : WasmObj->events()) + Events.emplace_back(make<InputEvent>(Types[E.Type.SigIndex], E, this)); + // Populate `Symbols` based on the WasmSymbols in the object. Symbols.reserve(WasmObj->getNumberOfSymbols()); for (const SymbolRef &Sym : WasmObj->symbols()) { @@ -264,6 +302,10 @@ GlobalSymbol *ObjFile::getGlobalSymbol(uint32_t Index) const { return cast<GlobalSymbol>(Symbols[Index]); } +EventSymbol *ObjFile::getEventSymbol(uint32_t Index) const { + return cast<EventSymbol>(Symbols[Index]); +} + SectionSymbol *ObjFile::getSectionSymbol(uint32_t Index) const { return cast<SectionSymbol>(Symbols[Index]); } @@ -318,6 +360,13 @@ Symbol *ObjFile::createDefined(const WasmSymbol &Sym) { assert(Sym.isBindingLocal()); return make<SectionSymbol>(Name, Flags, Section, this); } + case WASM_SYMBOL_TYPE_EVENT: { + InputEvent *Event = + Events[Sym.Info.ElementIndex - WasmObj->getNumImportedEvents()]; + if (Sym.isBindingLocal()) + return make<DefinedEvent>(Name, Flags, this, Event); + return Symtab->addDefinedEvent(Name, Flags, this, Event); + } } llvm_unreachable("unknown symbol kind"); } @@ -328,7 +377,7 @@ Symbol *ObjFile::createUndefined(const WasmSymbol &Sym) { switch (Sym.Info.Kind) { case WASM_SYMBOL_TYPE_FUNCTION: - return Symtab->addUndefinedFunction(Name, Flags, this, Sym.FunctionType); + return Symtab->addUndefinedFunction(Name, Flags, this, Sym.Signature); case WASM_SYMBOL_TYPE_DATA: return Symtab->addUndefinedData(Name, Flags, this); case WASM_SYMBOL_TYPE_GLOBAL: diff --git a/wasm/InputFiles.h b/wasm/InputFiles.h index ec77446e6308..bcda9cc8ee92 100644 --- a/wasm/InputFiles.h +++ b/wasm/InputFiles.h @@ -20,21 +20,6 @@ #include "llvm/Support/MemoryBuffer.h" #include <vector> -using llvm::object::Archive; -using llvm::object::WasmObjectFile; -using llvm::object::WasmSection; -using llvm::object::WasmSymbol; -using llvm::wasm::WasmGlobal; -using llvm::wasm::WasmImport; -using llvm::wasm::WasmRelocation; -using llvm::wasm::WasmSignature; - -namespace llvm { -namespace lto { -class InputFile; -} -} // namespace llvm - namespace lld { namespace wasm { @@ -42,6 +27,7 @@ class InputChunk; class InputFunction; class InputSegment; class InputGlobal; +class InputEvent; class InputSection; class InputFile { @@ -84,12 +70,12 @@ public: explicit ArchiveFile(MemoryBufferRef M) : InputFile(ArchiveKind, M) {} static bool classof(const InputFile *F) { return F->kind() == ArchiveKind; } - void addMember(const Archive::Symbol *Sym); + void addMember(const llvm::object::Archive::Symbol *Sym); void parse() override; private: - std::unique_ptr<Archive> File; + std::unique_ptr<llvm::object::Archive> File; llvm::DenseSet<uint64_t> Seen; }; @@ -123,6 +109,7 @@ public: std::vector<InputSegment *> Segments; std::vector<InputFunction *> Functions; std::vector<InputGlobal *> Globals; + std::vector<InputEvent *> Events; std::vector<InputSection *> CustomSections; llvm::DenseMap<uint32_t, InputSection *> CustomSectionsByIndex; @@ -131,6 +118,7 @@ public: DataSymbol *getDataSymbol(uint32_t Index) const; GlobalSymbol *getGlobalSymbol(uint32_t Index) const; SectionSymbol *getSectionSymbol(uint32_t Index) const; + EventSymbol *getEventSymbol(uint32_t Index) const; private: Symbol *createDefined(const WasmSymbol &Sym); diff --git a/wasm/InputGlobal.h b/wasm/InputGlobal.h index 37d0ab903706..3b20600b22e8 100644 --- a/wasm/InputGlobal.h +++ b/wasm/InputGlobal.h @@ -16,9 +16,6 @@ #include "lld/Common/ErrorHandler.h" #include "llvm/Object/Wasm.h" -using llvm::wasm::WasmGlobal; -using llvm::wasm::WasmInitExpr; - namespace lld { namespace wasm { diff --git a/wasm/LTO.cpp b/wasm/LTO.cpp index f15551da8b80..96a947e29d41 100644 --- a/wasm/LTO.cpp +++ b/wasm/LTO.cpp @@ -36,8 +36,6 @@ #include <vector> using namespace llvm; -using namespace llvm::object; - using namespace lld; using namespace lld::wasm; @@ -55,6 +53,14 @@ static std::unique_ptr<lto::LTO> createLTO() { C.DisableVerify = Config->DisableVerify; C.DiagHandler = diagnosticHandler; C.OptLevel = Config->LTOO; + C.MAttrs = GetMAttrs(); + + if (Config->Relocatable) + C.RelocModel = None; + else if (Config->Pic) + C.RelocModel = Reloc::PIC_; + else + C.RelocModel = Reloc::Static; if (Config->SaveTemps) checkError(C.addSaveTemps(Config->OutputFile.str() + ".", @@ -72,10 +78,11 @@ BitcodeCompiler::BitcodeCompiler() : LTOObj(createLTO()) {} BitcodeCompiler::~BitcodeCompiler() = default; static void undefine(Symbol *S) { - if (isa<DefinedFunction>(S)) - replaceSymbol<UndefinedFunction>(S, S->getName(), 0); + if (auto F = dyn_cast<DefinedFunction>(S)) + replaceSymbol<UndefinedFunction>(F, F->getName(), 0, F->getFile(), + F->Signature); else if (isa<DefinedData>(S)) - replaceSymbol<UndefinedData>(S, S->getName(), 0); + replaceSymbol<UndefinedData>(S, S->getName(), 0, S->getFile()); else llvm_unreachable("unexpected symbol kind"); } diff --git a/wasm/MarkLive.cpp b/wasm/MarkLive.cpp index dfaa712c3296..3bbd1148f6ad 100644 --- a/wasm/MarkLive.cpp +++ b/wasm/MarkLive.cpp @@ -22,6 +22,7 @@ #include "MarkLive.h" #include "Config.h" #include "InputChunks.h" +#include "InputEvent.h" #include "InputGlobal.h" #include "SymbolTable.h" #include "Symbols.h" @@ -30,8 +31,6 @@ using namespace llvm; using namespace llvm::wasm; -using namespace lld; -using namespace lld::wasm; void lld::wasm::markLive() { if (!Config->GcSections) @@ -107,6 +106,9 @@ void lld::wasm::markLive() { for (InputGlobal *G : Obj->Globals) if (!G->Live) message("removing unused section " + toString(G)); + for (InputEvent *E : Obj->Events) + if (!E->Live) + message("removing unused section " + toString(E)); } for (InputChunk *C : Symtab->SyntheticFunctions) if (!C->Live) diff --git a/wasm/Options.td b/wasm/Options.td index 43588a830e31..3ed55b4bcda0 100644 --- a/wasm/Options.td +++ b/wasm/Options.td @@ -6,9 +6,10 @@ class F<string name>: Flag<["--", "-"], name>; class J<string name>: Joined<["--", "-"], name>; class S<string name>: Separate<["--", "-"], name>; -multiclass Eq<string name> { - def "": Separate<["--", "-"], name>; - def _eq: Joined<["--", "-"], name # "=">, Alias<!cast<Separate>(NAME)>; +multiclass Eq<string name, string help> { + def NAME: Separate<["--", "-"], name>; + def NAME # _eq: Joined<["--", "-"], name # "=">, Alias<!cast<Separate>(NAME)>, + HelpText<help>; } multiclass B<string name, string help1, string help2> { @@ -16,17 +17,24 @@ multiclass B<string name, string help1, string help2> { def no_ # NAME: Flag<["--", "-"], "no-" # name>, HelpText<help2>; } -// The follow flags are shared with the ELF linker +// The following flags are shared with the ELF linker def color_diagnostics: F<"color-diagnostics">, HelpText<"Use colors in diagnostics">; def color_diagnostics_eq: J<"color-diagnostics=">, HelpText<"Use colors in diagnostics; one of 'always', 'never', 'auto'">; +def compress_relocations: F<"compress-relocations">, + HelpText<"Compress the relocation targets in the code section.">; + defm demangle: B<"demangle", "Demangle symbol names", "Do not demangle symbol names">; +defm export_dynamic: B<"export-dynamic", + "Put symbols in the dynamic symbol table", + "Do not put symbols in the dynamic symbol table (default)">; + def entry: S<"entry">, MetaVarName<"<entry>">, HelpText<"Name of entry point symbol">; @@ -67,20 +75,25 @@ def o: JoinedOrSeparate<["-"], "o">, MetaVarName<"<path>">, def O: JoinedOrSeparate<["-"], "O">, HelpText<"Optimize output file size">; +defm pie: B<"pie", + "Create a position independent executable", + "Do not create a position independent executable (default)">; + defm print_gc_sections: B<"print-gc-sections", "List removed unused sections", "Do not list removed unused sections">; def relocatable: F<"relocatable">, HelpText<"Create relocatable object file">; +def shared: F<"shared">, HelpText<"Build a shared object">; + def strip_all: F<"strip-all">, HelpText<"Strip all symbols">; def strip_debug: F<"strip-debug">, HelpText<"Strip debugging information">; def threads: F<"threads">, HelpText<"Run the linker multi-threaded">; -defm undefined: Eq<"undefined">, - HelpText<"Force undefined symbol during linking">; +defm undefined: Eq<"undefined", "Force undefined symbol during linking">; def v: Flag<["-"], "v">, HelpText<"Display the version number">; @@ -102,8 +115,7 @@ def allow_undefined_file: J<"allow-undefined-file=">, def allow_undefined_file_s: Separate<["-"], "allow-undefined-file">, Alias<allow_undefined_file>; -defm export: Eq<"export">, - HelpText<"Force a symbol to be exported">; +defm export: Eq<"export", "Force a symbol to be exported">; def export_all: F<"export-all">, HelpText<"Export all symbols (normally combined with --no-gc-sections)">; @@ -117,6 +129,9 @@ def global_base: J<"global-base=">, def import_memory: F<"import-memory">, HelpText<"Import memory from the environment">; +def shared_memory: F<"shared-memory">, + HelpText<"Use shared linear memory">; + def import_table: F<"import-table">, HelpText<"Import function table from the environment">; @@ -137,12 +152,15 @@ defm whole_archive: B<"whole-archive", "Do not force load of all members in a static library (default)">; // Aliases -def alias_entry_e: JoinedOrSeparate<["-"], "e">, Alias<entry>; -def alias_entry_entry: J<"entry=">, Alias<entry>; -def alias_initial_memory_i: Flag<["-"], "i">, Alias<initial_memory>; -def alias_max_memory_m: Flag<["-"], "m">, Alias<max_memory>; -def alias_relocatable_r: Flag<["-"], "r">, Alias<relocatable>; -def alias_undefined_u: JoinedOrSeparate<["-"], "u">, Alias<undefined>; +def: JoinedOrSeparate<["-"], "e">, Alias<entry>; +def: J<"entry=">, Alias<entry>; +def: Flag<["-"], "E">, Alias<export_dynamic>, HelpText<"Alias for --export-dynamic">; +def: Flag<["-"], "i">, Alias<initial_memory>; +def: Flag<["-"], "m">, Alias<max_memory>; +def: Flag<["-"], "r">, Alias<relocatable>; +def: Flag<["-"], "s">, Alias<strip_all>, HelpText<"Alias for --strip-all">; +def: Flag<["-"], "S">, Alias<strip_debug>, HelpText<"Alias for --strip-debug">; +def: JoinedOrSeparate<["-"], "u">, Alias<undefined>; // LTO-related options. def lto_O: J<"lto-O">, MetaVarName<"<opt-level>">, @@ -153,6 +171,5 @@ def disable_verify: F<"disable-verify">; def save_temps: F<"save-temps">; def thinlto_cache_dir: J<"thinlto-cache-dir=">, HelpText<"Path to ThinLTO cached object file directory">; -defm thinlto_cache_policy: Eq<"thinlto-cache-policy">, - HelpText<"Pruning policy for the ThinLTO cache">; +defm thinlto_cache_policy: Eq<"thinlto-cache-policy", "Pruning policy for the ThinLTO cache">; def thinlto_jobs: J<"thinlto-jobs=">, HelpText<"Number of ThinLTO jobs">; diff --git a/wasm/OutputSections.cpp b/wasm/OutputSections.cpp index 256a9884f947..4123d63b7466 100644 --- a/wasm/OutputSections.cpp +++ b/wasm/OutputSections.cpp @@ -40,6 +40,8 @@ static StringRef sectionTypeToString(uint32_t SectionType) { return "MEMORY"; case WASM_SEC_GLOBAL: return "GLOBAL"; + case WASM_SEC_EVENT: + return "EVENT"; case WASM_SEC_EXPORT: return "EXPORT"; case WASM_SEC_START: @@ -136,9 +138,17 @@ DataSection::DataSection(ArrayRef<OutputSegment *> Segments) for (OutputSegment *Segment : Segments) { raw_string_ostream OS(Segment->Header); writeUleb128(OS, 0, "memory index"); - writeUleb128(OS, WASM_OPCODE_I32_CONST, "opcode:i32const"); - writeSleb128(OS, Segment->StartVA, "memory offset"); - writeUleb128(OS, WASM_OPCODE_END, "opcode:end"); + WasmInitExpr InitExpr; + if (Config->Pic) { + assert(Segments.size() <= 1 && + "Currenly only a single data segment is supported in PIC mode"); + InitExpr.Opcode = WASM_OPCODE_GLOBAL_GET; + InitExpr.Value.Global = WasmSym::MemoryBase->getGlobalIndex(); + } else { + InitExpr.Opcode = WASM_OPCODE_I32_CONST; + InitExpr.Value.Int32 = Segment->StartVA; + } + writeInitExpr(OS, InitExpr); writeUleb128(OS, Segment->Size, "segment size"); OS.flush(); diff --git a/wasm/OutputSections.h b/wasm/OutputSections.h index 189d6507c4b3..6c5baa309a98 100644 --- a/wasm/OutputSections.h +++ b/wasm/OutputSections.h @@ -13,11 +13,9 @@ #include "InputChunks.h" #include "WriterUtils.h" #include "lld/Common/ErrorHandler.h" +#include "lld/Common/LLVM.h" #include "llvm/ADT/DenseMap.h" -using llvm::raw_ostream; -using llvm::raw_string_ostream; - namespace lld { namespace wasm { @@ -82,7 +80,7 @@ public: std::string Body; protected: - raw_string_ostream BodyOutputStream; + llvm::raw_string_ostream BodyOutputStream; }; class CodeSection : public OutputSection { @@ -113,7 +111,7 @@ protected: size_t BodySize = 0; }; -// Represents a custom section in the output file. Wasm custom sections are +// Represents a custom section in the output file. Wasm custom sections are // used for storing user-defined metadata. Unlike the core sections types // they are identified by their string name. // The linker combines custom sections that have the same name by simply diff --git a/wasm/OutputSegment.h b/wasm/OutputSegment.h index d5c89cd19f4c..a982282dac10 100644 --- a/wasm/OutputSegment.h +++ b/wasm/OutputSegment.h @@ -26,7 +26,7 @@ public: void addInputSegment(InputSegment *InSeg) { Alignment = std::max(Alignment, InSeg->getAlignment()); InputSegments.push_back(InSeg); - Size = llvm::alignTo(Size, InSeg->getAlignment()); + Size = llvm::alignTo(Size, 1 << InSeg->getAlignment()); InSeg->OutputSeg = this; InSeg->OutputSegmentOffset = Size; Size += InSeg->getSize(); diff --git a/wasm/SymbolTable.cpp b/wasm/SymbolTable.cpp index e1ba23769738..c7983196db36 100644 --- a/wasm/SymbolTable.cpp +++ b/wasm/SymbolTable.cpp @@ -10,6 +10,7 @@ #include "SymbolTable.h" #include "Config.h" #include "InputChunks.h" +#include "InputEvent.h" #include "InputGlobal.h" #include "WriterUtils.h" #include "lld/Common/ErrorHandler.h" @@ -20,6 +21,7 @@ using namespace llvm; using namespace llvm::wasm; +using namespace llvm::object; using namespace lld; using namespace lld::wasm; @@ -60,7 +62,6 @@ void SymbolTable::addCombinedLTOObject() { } void SymbolTable::reportRemainingUndefines() { - SetVector<Symbol *> Undefs; for (Symbol *Sym : SymVector) { if (!Sym->isUndefined() || Sym->isWeak()) continue; @@ -68,34 +69,26 @@ void SymbolTable::reportRemainingUndefines() { continue; if (!Sym->IsUsedInRegularObj) continue; - Undefs.insert(Sym); + error(toString(Sym->getFile()) + ": undefined symbol: " + toString(*Sym)); } - - if (Undefs.empty()) - return; - - for (ObjFile *File : ObjectFiles) - for (Symbol *Sym : File->getSymbols()) - if (Undefs.count(Sym)) - error(toString(File) + ": undefined symbol: " + toString(*Sym)); - - for (Symbol *Sym : Undefs) - if (!Sym->getFile()) - error("undefined symbol: " + toString(*Sym)); } Symbol *SymbolTable::find(StringRef Name) { return SymMap.lookup(CachedHashStringRef(Name)); } -std::pair<Symbol *, bool> SymbolTable::insert(StringRef Name) { +std::pair<Symbol *, bool> SymbolTable::insert(StringRef Name, InputFile *File) { + bool Inserted = false; Symbol *&Sym = SymMap[CachedHashStringRef(Name)]; - if (Sym) - return {Sym, false}; - Sym = reinterpret_cast<Symbol *>(make<SymbolUnion>()); - Sym->IsUsedInRegularObj = false; - SymVector.emplace_back(Sym); - return {Sym, true}; + if (!Sym) { + Sym = reinterpret_cast<Symbol *>(make<SymbolUnion>()); + Sym->IsUsedInRegularObj = false; + SymVector.emplace_back(Sym); + Inserted = true; + } + if (!File || File->kind() == InputFile::ObjectKind) + Sym->IsUsedInRegularObj = true; + return {Sym, Inserted}; } static void reportTypeError(const Symbol *Existing, const InputFile *File, @@ -106,6 +99,8 @@ static void reportTypeError(const Symbol *Existing, const InputFile *File, " in " + toString(File)); } +// Check the type of new symbol matches that of the symbol is replacing. +// For functions this can also involve verifying that the signatures match. static void checkFunctionType(Symbol *Existing, const InputFile *File, const WasmSignature *NewSig) { auto ExistingFunction = dyn_cast<FunctionSymbol>(Existing); @@ -117,9 +112,9 @@ static void checkFunctionType(Symbol *Existing, const InputFile *File, if (!NewSig) return; - const WasmSignature *OldSig = ExistingFunction->FunctionType; + const WasmSignature *OldSig = ExistingFunction->Signature; if (!OldSig) { - ExistingFunction->FunctionType = NewSig; + ExistingFunction->Signature = NewSig; return; } @@ -130,8 +125,6 @@ static void checkFunctionType(Symbol *Existing, const InputFile *File, toString(*NewSig) + " in " + toString(File)); } -// Check the type of new symbol matches that of the symbol is replacing. -// For functions this can also involve verifying that the signatures match. static void checkGlobalType(const Symbol *Existing, const InputFile *File, const WasmGlobalType *NewType) { if (!isa<GlobalSymbol>(Existing)) { @@ -147,6 +140,28 @@ static void checkGlobalType(const Symbol *Existing, const InputFile *File, } } +static void checkEventType(const Symbol *Existing, const InputFile *File, + const WasmEventType *NewType, + const WasmSignature *NewSig) { + auto ExistingEvent = dyn_cast<EventSymbol>(Existing); + if (!isa<EventSymbol>(Existing)) { + reportTypeError(Existing, File, WASM_SYMBOL_TYPE_EVENT); + return; + } + + const WasmEventType *OldType = cast<EventSymbol>(Existing)->getEventType(); + const WasmSignature *OldSig = ExistingEvent->Signature; + if (NewType->Attribute != OldType->Attribute) + error("Event type mismatch: " + Existing->getName() + "\n>>> defined as " + + toString(*OldType) + " in " + toString(Existing->getFile()) + + "\n>>> defined as " + toString(*NewType) + " in " + toString(File)); + if (*NewSig != *OldSig) + warn("Event signature mismatch: " + Existing->getName() + + "\n>>> defined as " + toString(*OldSig) + " in " + + toString(Existing->getFile()) + "\n>>> defined as " + + toString(*NewSig) + " in " + toString(File)); +} + static void checkDataType(const Symbol *Existing, const InputFile *File) { if (!isa<DataSymbol>(Existing)) reportTypeError(Existing, File, WASM_SYMBOL_TYPE_DATA); @@ -158,15 +173,15 @@ DefinedFunction *SymbolTable::addSyntheticFunction(StringRef Name, LLVM_DEBUG(dbgs() << "addSyntheticFunction: " << Name << "\n"); assert(!find(Name)); SyntheticFunctions.emplace_back(Function); - return replaceSymbol<DefinedFunction>(insert(Name).first, Name, Flags, - nullptr, Function); + return replaceSymbol<DefinedFunction>(insert(Name, nullptr).first, Name, + Flags, nullptr, Function); } DefinedData *SymbolTable::addSyntheticDataSymbol(StringRef Name, uint32_t Flags) { LLVM_DEBUG(dbgs() << "addSyntheticDataSymbol: " << Name << "\n"); assert(!find(Name)); - return replaceSymbol<DefinedData>(insert(Name).first, Name, Flags); + return replaceSymbol<DefinedData>(insert(Name, nullptr).first, Name, Flags); } DefinedGlobal *SymbolTable::addSyntheticGlobal(StringRef Name, uint32_t Flags, @@ -175,8 +190,8 @@ DefinedGlobal *SymbolTable::addSyntheticGlobal(StringRef Name, uint32_t Flags, << "\n"); assert(!find(Name)); SyntheticGlobals.emplace_back(Global); - return replaceSymbol<DefinedGlobal>(insert(Name).first, Name, Flags, nullptr, - Global); + return replaceSymbol<DefinedGlobal>(insert(Name, nullptr).first, Name, Flags, + nullptr, Global); } static bool shouldReplace(const Symbol *Existing, InputFile *NewFile, @@ -210,13 +225,12 @@ static bool shouldReplace(const Symbol *Existing, InputFile *NewFile, Symbol *SymbolTable::addDefinedFunction(StringRef Name, uint32_t Flags, InputFile *File, InputFunction *Function) { - LLVM_DEBUG(dbgs() << "addDefinedFunction: " << Name << "\n"); + LLVM_DEBUG(dbgs() << "addDefinedFunction: " << Name << " [" + << (Function ? toString(Function->Signature) : "none") + << "]\n"); Symbol *S; bool WasInserted; - std::tie(S, WasInserted) = insert(Name); - - if (!File || File->kind() == InputFile::ObjectKind) - S->IsUsedInRegularObj = true; + std::tie(S, WasInserted) = insert(Name, File); if (WasInserted || S->isLazy()) { replaceSymbol<DefinedFunction>(S, Name, Flags, File, Function); @@ -226,8 +240,16 @@ Symbol *SymbolTable::addDefinedFunction(StringRef Name, uint32_t Flags, if (Function) checkFunctionType(S, File, &Function->Signature); - if (shouldReplace(S, File, Flags)) - replaceSymbol<DefinedFunction>(S, Name, Flags, File, Function); + if (shouldReplace(S, File, Flags)) { + // If the new defined function doesn't have signture (i.e. bitcode + // functions) but the old symbols does then preserve the old signature + const WasmSignature *OldSig = nullptr; + if (auto* F = dyn_cast<FunctionSymbol>(S)) + OldSig = F->Signature; + auto NewSym = replaceSymbol<DefinedFunction>(S, Name, Flags, File, Function); + if (!NewSym->Signature) + NewSym->Signature = OldSig; + } return S; } @@ -238,10 +260,7 @@ Symbol *SymbolTable::addDefinedData(StringRef Name, uint32_t Flags, << "\n"); Symbol *S; bool WasInserted; - std::tie(S, WasInserted) = insert(Name); - - if (!File || File->kind() == InputFile::ObjectKind) - S->IsUsedInRegularObj = true; + std::tie(S, WasInserted) = insert(Name, File); if (WasInserted || S->isLazy()) { replaceSymbol<DefinedData>(S, Name, Flags, File, Segment, Address, Size); @@ -258,12 +277,10 @@ Symbol *SymbolTable::addDefinedData(StringRef Name, uint32_t Flags, Symbol *SymbolTable::addDefinedGlobal(StringRef Name, uint32_t Flags, InputFile *File, InputGlobal *Global) { LLVM_DEBUG(dbgs() << "addDefinedGlobal:" << Name << "\n"); + Symbol *S; bool WasInserted; - std::tie(S, WasInserted) = insert(Name); - - if (!File || File->kind() == InputFile::ObjectKind) - S->IsUsedInRegularObj = true; + std::tie(S, WasInserted) = insert(Name, File); if (WasInserted || S->isLazy()) { replaceSymbol<DefinedGlobal>(S, Name, Flags, File, Global); @@ -277,17 +294,35 @@ Symbol *SymbolTable::addDefinedGlobal(StringRef Name, uint32_t Flags, return S; } +Symbol *SymbolTable::addDefinedEvent(StringRef Name, uint32_t Flags, + InputFile *File, InputEvent *Event) { + LLVM_DEBUG(dbgs() << "addDefinedEvent:" << Name << "\n"); + + Symbol *S; + bool WasInserted; + std::tie(S, WasInserted) = insert(Name, File); + + if (WasInserted || S->isLazy()) { + replaceSymbol<DefinedEvent>(S, Name, Flags, File, Event); + return S; + } + + checkEventType(S, File, &Event->getType(), &Event->Signature); + + if (shouldReplace(S, File, Flags)) + replaceSymbol<DefinedEvent>(S, Name, Flags, File, Event); + return S; +} + Symbol *SymbolTable::addUndefinedFunction(StringRef Name, uint32_t Flags, InputFile *File, const WasmSignature *Sig) { - LLVM_DEBUG(dbgs() << "addUndefinedFunction: " << Name << "\n"); + LLVM_DEBUG(dbgs() << "addUndefinedFunction: " << Name << + " [" << (Sig ? toString(*Sig) : "none") << "]\n"); Symbol *S; bool WasInserted; - std::tie(S, WasInserted) = insert(Name); - - if (!File || File->kind() == InputFile::ObjectKind) - S->IsUsedInRegularObj = true; + std::tie(S, WasInserted) = insert(Name, File); if (WasInserted) replaceSymbol<UndefinedFunction>(S, Name, Flags, File, Sig); @@ -305,10 +340,7 @@ Symbol *SymbolTable::addUndefinedData(StringRef Name, uint32_t Flags, Symbol *S; bool WasInserted; - std::tie(S, WasInserted) = insert(Name); - - if (!File || File->kind() == InputFile::ObjectKind) - S->IsUsedInRegularObj = true; + std::tie(S, WasInserted) = insert(Name, File); if (WasInserted) replaceSymbol<UndefinedData>(S, Name, Flags, File); @@ -326,10 +358,7 @@ Symbol *SymbolTable::addUndefinedGlobal(StringRef Name, uint32_t Flags, Symbol *S; bool WasInserted; - std::tie(S, WasInserted) = insert(Name); - - if (!File || File->kind() == InputFile::ObjectKind) - S->IsUsedInRegularObj = true; + std::tie(S, WasInserted) = insert(Name, File); if (WasInserted) replaceSymbol<UndefinedGlobal>(S, Name, Flags, File, Type); @@ -346,7 +375,7 @@ void SymbolTable::addLazy(ArchiveFile *File, const Archive::Symbol *Sym) { Symbol *S; bool WasInserted; - std::tie(S, WasInserted) = insert(Name); + std::tie(S, WasInserted) = insert(Name, nullptr); if (WasInserted) { replaceSymbol<LazySymbol>(S, Name, File, *Sym); diff --git a/wasm/SymbolTable.h b/wasm/SymbolTable.h index 26242e6cddd6..5e38e30692ab 100644 --- a/wasm/SymbolTable.h +++ b/wasm/SymbolTable.h @@ -13,12 +13,9 @@ #include "InputFiles.h" #include "LTO.h" #include "Symbols.h" +#include "lld/Common/LLVM.h" #include "llvm/ADT/CachedHashString.h" #include "llvm/ADT/DenseSet.h" -#include "llvm/Support/raw_ostream.h" - -using llvm::wasm::WasmGlobalType; -using llvm::wasm::WasmSignature; namespace lld { namespace wasm { @@ -59,6 +56,8 @@ public: uint32_t Size); Symbol *addDefinedGlobal(StringRef Name, uint32_t Flags, InputFile *File, InputGlobal *G); + Symbol *addDefinedEvent(StringRef Name, uint32_t Flags, InputFile *File, + InputEvent *E); Symbol *addUndefinedFunction(StringRef Name, uint32_t Flags, InputFile *File, const WasmSignature *Signature); @@ -66,7 +65,7 @@ public: Symbol *addUndefinedGlobal(StringRef Name, uint32_t Flags, InputFile *File, const WasmGlobalType *Type); - void addLazy(ArchiveFile *F, const Archive::Symbol *Sym); + void addLazy(ArchiveFile *F, const llvm::object::Archive::Symbol *Sym); bool addComdat(StringRef Name); @@ -77,7 +76,7 @@ public: InputFunction *Function); private: - std::pair<Symbol *, bool> insert(StringRef Name); + std::pair<Symbol *, bool> insert(StringRef Name, InputFile *File); llvm::DenseMap<llvm::CachedHashStringRef, Symbol *> SymMap; std::vector<Symbol *> SymVector; diff --git a/wasm/Symbols.cpp b/wasm/Symbols.cpp index a11081cbcf77..4bef9761ec25 100644 --- a/wasm/Symbols.cpp +++ b/wasm/Symbols.cpp @@ -10,6 +10,7 @@ #include "Symbols.h" #include "Config.h" #include "InputChunks.h" +#include "InputEvent.h" #include "InputFiles.h" #include "InputGlobal.h" #include "OutputSegment.h" @@ -27,7 +28,9 @@ DefinedFunction *WasmSym::CallCtors; DefinedData *WasmSym::DsoHandle; DefinedData *WasmSym::DataEnd; DefinedData *WasmSym::HeapBase; -DefinedGlobal *WasmSym::StackPointer; +GlobalSymbol *WasmSym::StackPointer; +UndefinedGlobal *WasmSym::TableBase; +UndefinedGlobal *WasmSym::MemoryBase; WasmSymbolType Symbol::getWasmType() const { if (isa<FunctionSymbol>(this)) @@ -36,6 +39,8 @@ WasmSymbolType Symbol::getWasmType() const { return WASM_SYMBOL_TYPE_DATA; if (isa<GlobalSymbol>(this)) return WASM_SYMBOL_TYPE_GLOBAL; + if (isa<EventSymbol>(this)) + return WASM_SYMBOL_TYPE_EVENT; if (isa<SectionSymbol>(this)) return WASM_SYMBOL_TYPE_SECTION; llvm_unreachable("invalid symbol kind"); @@ -52,6 +57,8 @@ InputChunk *Symbol::getChunk() const { bool Symbol::isLive() const { if (auto *G = dyn_cast<DefinedGlobal>(this)) return G->Global->Live; + if (auto *E = dyn_cast<DefinedEvent>(this)) + return E->Event->Live; if (InputChunk *C = getChunk()) return C->Live; return Referenced; @@ -60,6 +67,8 @@ bool Symbol::isLive() const { void Symbol::markLive() { if (auto *G = dyn_cast<DefinedGlobal>(this)) G->Global->Live = true; + if (auto *E = dyn_cast<DefinedEvent>(this)) + E->Event->Live = true; if (InputChunk *C = getChunk()) C->Live = true; Referenced = true; @@ -105,7 +114,10 @@ bool Symbol::isExported() const { if (ForceExport || Config->ExportAll) return true; - return !isHidden(); + if (Config->ExportDynamic && !isHidden()) + return true; + + return false; } uint32_t FunctionSymbol::getFunctionIndex() const { @@ -207,6 +219,32 @@ DefinedGlobal::DefinedGlobal(StringRef Name, uint32_t Flags, InputFile *File, Global ? &Global->getType() : nullptr), Global(Global) {} +uint32_t EventSymbol::getEventIndex() const { + if (auto *F = dyn_cast<DefinedEvent>(this)) + return F->Event->getEventIndex(); + assert(EventIndex != INVALID_INDEX); + return EventIndex; +} + +void EventSymbol::setEventIndex(uint32_t Index) { + LLVM_DEBUG(dbgs() << "setEventIndex " << Name << " -> " << Index << "\n"); + assert(EventIndex == INVALID_INDEX); + EventIndex = Index; +} + +bool EventSymbol::hasEventIndex() const { + if (auto *F = dyn_cast<DefinedEvent>(this)) + return F->Event->hasEventIndex(); + return EventIndex != INVALID_INDEX; +} + +DefinedEvent::DefinedEvent(StringRef Name, uint32_t Flags, InputFile *File, + InputEvent *Event) + : EventSymbol(Name, DefinedEventKind, Flags, File, + Event ? &Event->getType() : nullptr, + Event ? &Event->Signature : nullptr), + Event(Event) {} + uint32_t SectionSymbol::getOutputSectionIndex() const { LLVM_DEBUG(dbgs() << "getOutputSectionIndex: " << getName() << "\n"); assert(OutputSectionIndex != INVALID_INDEX); @@ -223,10 +261,14 @@ void SectionSymbol::setOutputSectionIndex(uint32_t Index) { void LazySymbol::fetch() { cast<ArchiveFile>(File)->addMember(&ArchiveSymbol); } std::string lld::toString(const wasm::Symbol &Sym) { + return lld::maybeDemangleSymbol(Sym.getName()); +} + +std::string lld::maybeDemangleSymbol(StringRef Name) { if (Config->Demangle) - if (Optional<std::string> S = demangleItanium(Sym.getName())) + if (Optional<std::string> S = demangleItanium(Name)) return *S; - return Sym.getName(); + return Name; } std::string lld::toString(wasm::Symbol::Kind Kind) { @@ -237,6 +279,8 @@ std::string lld::toString(wasm::Symbol::Kind Kind) { return "DefinedData"; case wasm::Symbol::DefinedGlobalKind: return "DefinedGlobal"; + case wasm::Symbol::DefinedEventKind: + return "DefinedEvent"; case wasm::Symbol::UndefinedFunctionKind: return "UndefinedFunction"; case wasm::Symbol::UndefinedDataKind: diff --git a/wasm/Symbols.h b/wasm/Symbols.h index 815cc97d22d1..11ee66550cdc 100644 --- a/wasm/Symbols.h +++ b/wasm/Symbols.h @@ -15,21 +15,17 @@ #include "llvm/Object/Archive.h" #include "llvm/Object/Wasm.h" -using llvm::object::Archive; -using llvm::object::WasmSymbol; -using llvm::wasm::WasmGlobal; -using llvm::wasm::WasmGlobalType; -using llvm::wasm::WasmSignature; -using llvm::wasm::WasmSymbolType; - namespace lld { namespace wasm { +using llvm::wasm::WasmSymbolType; + class InputFile; class InputChunk; class InputSegment; class InputFunction; class InputGlobal; +class InputEvent; class InputSection; #define INVALID_INDEX UINT32_MAX @@ -41,6 +37,7 @@ public: DefinedFunctionKind, DefinedDataKind, DefinedGlobalKind, + DefinedEventKind, SectionKind, UndefinedFunctionKind, UndefinedDataKind, @@ -52,7 +49,8 @@ public: bool isDefined() const { return SymbolKind == DefinedFunctionKind || SymbolKind == DefinedDataKind || - SymbolKind == DefinedGlobalKind || SymbolKind == SectionKind; + SymbolKind == DefinedGlobalKind || SymbolKind == DefinedEventKind || + SymbolKind == SectionKind; } bool isUndefined() const { @@ -126,12 +124,12 @@ public: void setFunctionIndex(uint32_t Index); bool hasFunctionIndex() const; - const WasmSignature *FunctionType; + const WasmSignature *Signature; protected: FunctionSymbol(StringRef Name, Kind K, uint32_t Flags, InputFile *F, - const WasmSignature *Type) - : Symbol(Name, K, Flags, F), FunctionType(Type) {} + const WasmSignature *Sig) + : Symbol(Name, K, Flags, F), Signature(Sig) {} uint32_t TableIndex = INVALID_INDEX; uint32_t FunctionIndex = INVALID_INDEX; @@ -245,8 +243,6 @@ protected: const WasmGlobalType *GlobalType) : Symbol(Name, K, Flags, F), GlobalType(GlobalType) {} - // Explicit function type, needed for undefined or synthetic functions only. - // For regular defined globals this information comes from the InputChunk. const WasmGlobalType *GlobalType; uint32_t GlobalIndex = INVALID_INDEX; }; @@ -274,16 +270,61 @@ public: } }; +// Wasm events are features that suspend the current execution and transfer the +// control flow to a corresponding handler. Currently the only supported event +// kind is exceptions. +// +// Event tags are values to distinguish different events. For exceptions, they +// can be used to distinguish different language's exceptions, i.e., all C++ +// exceptions have the same tag. Wasm can generate code capable of doing +// different handling actions based on the tag of caught exceptions. +// +// A single EventSymbol object represents a single tag. C++ exception event +// symbol is a weak symbol generated in every object file in which exceptions +// are used, and has name '__cpp_exception' for linking. +class EventSymbol : public Symbol { +public: + static bool classof(const Symbol *S) { return S->kind() == DefinedEventKind; } + + const WasmEventType *getEventType() const { return EventType; } + + // Get/set the event index + uint32_t getEventIndex() const; + void setEventIndex(uint32_t Index); + bool hasEventIndex() const; + + const WasmSignature *Signature; + +protected: + EventSymbol(StringRef Name, Kind K, uint32_t Flags, InputFile *F, + const WasmEventType *EventType, const WasmSignature *Sig) + : Symbol(Name, K, Flags, F), Signature(Sig), EventType(EventType) {} + + const WasmEventType *EventType; + uint32_t EventIndex = INVALID_INDEX; +}; + +class DefinedEvent : public EventSymbol { +public: + DefinedEvent(StringRef Name, uint32_t Flags, InputFile *File, + InputEvent *Event); + + static bool classof(const Symbol *S) { return S->kind() == DefinedEventKind; } + + InputEvent *Event; +}; + class LazySymbol : public Symbol { public: - LazySymbol(StringRef Name, InputFile *File, const Archive::Symbol &Sym) + LazySymbol(StringRef Name, InputFile *File, + const llvm::object::Archive::Symbol &Sym) : Symbol(Name, LazyKind, 0, File), ArchiveSymbol(Sym) {} static bool classof(const Symbol *S) { return S->kind() == LazyKind; } void fetch(); private: - Archive::Symbol ArchiveSymbol; + llvm::object::Archive::Symbol ArchiveSymbol; }; // linker-generated symbols @@ -291,7 +332,7 @@ struct WasmSym { // __stack_pointer // Global that holds the address of the top of the explicit value stack in // linear memory. - static DefinedGlobal *StackPointer; + static GlobalSymbol *StackPointer; // __data_end // Symbol marking the end of the data and bss. @@ -310,6 +351,14 @@ struct WasmSym { // __dso_handle // Symbol used in calls to __cxa_atexit to determine current DLL static DefinedData *DsoHandle; + + // __table_base + // Used in PIC code for offset of indirect function table + static UndefinedGlobal *TableBase; + + // __memory_base + // Used in PIC code for offset of global data + static UndefinedGlobal *MemoryBase; }; // A buffer class that is large enough to hold any Symbol-derived @@ -319,10 +368,11 @@ union SymbolUnion { alignas(DefinedFunction) char A[sizeof(DefinedFunction)]; alignas(DefinedData) char B[sizeof(DefinedData)]; alignas(DefinedGlobal) char C[sizeof(DefinedGlobal)]; - alignas(LazySymbol) char D[sizeof(LazySymbol)]; - alignas(UndefinedFunction) char E[sizeof(UndefinedFunction)]; - alignas(UndefinedData) char F[sizeof(UndefinedData)]; - alignas(UndefinedGlobal) char G[sizeof(UndefinedGlobal)]; + alignas(DefinedEvent) char D[sizeof(DefinedEvent)]; + alignas(LazySymbol) char E[sizeof(LazySymbol)]; + alignas(UndefinedFunction) char F[sizeof(UndefinedFunction)]; + alignas(UndefinedData) char G[sizeof(UndefinedData)]; + alignas(UndefinedGlobal) char H[sizeof(UndefinedGlobal)]; alignas(SectionSymbol) char I[sizeof(SectionSymbol)]; }; @@ -330,7 +380,7 @@ template <typename T, typename... ArgT> T *replaceSymbol(Symbol *S, ArgT &&... Arg) { static_assert(std::is_trivially_destructible<T>(), "Symbol types must be trivially destructible"); - static_assert(sizeof(T) <= sizeof(SymbolUnion), "Symbol too small"); + static_assert(sizeof(T) <= sizeof(SymbolUnion), "SymbolUnion too small"); static_assert(alignof(T) <= alignof(SymbolUnion), "SymbolUnion not aligned enough"); assert(static_cast<Symbol *>(static_cast<T *>(nullptr)) == nullptr && @@ -349,6 +399,7 @@ T *replaceSymbol(Symbol *S, ArgT &&... Arg) { // Returns a symbol name for an error message. std::string toString(const wasm::Symbol &Sym); std::string toString(wasm::Symbol::Kind Kind); +std::string maybeDemangleSymbol(StringRef Name); } // namespace lld diff --git a/wasm/Writer.cpp b/wasm/Writer.cpp index 37ad32452a91..819d4298fef2 100644 --- a/wasm/Writer.cpp +++ b/wasm/Writer.cpp @@ -10,6 +10,7 @@ #include "Writer.h" #include "Config.h" #include "InputChunks.h" +#include "InputEvent.h" #include "InputGlobal.h" #include "OutputSections.h" #include "OutputSegment.h" @@ -39,7 +40,6 @@ using namespace lld; using namespace lld::wasm; static constexpr int kStackAlignment = 16; -static constexpr int kInitialTableOffset = 1; static constexpr const char *kFunctionTableName = "__indirect_function_table"; namespace { @@ -81,6 +81,7 @@ private: void createFunctionSection(); void createTableSection(); void createGlobalSection(); + void createEventSection(); void createExportSection(); void createImportSection(); void createMemorySection(); @@ -90,6 +91,7 @@ private: void createCustomSections(); // Custom sections + void createDylinkSection(); void createRelocSections(); void createLinkingSection(); void createNameSection(); @@ -98,18 +100,25 @@ private: void writeSections(); uint64_t FileSize = 0; + uint32_t TableBase = 0; uint32_t NumMemoryPages = 0; uint32_t MaxMemoryPages = 0; + // Memory size and aligment. Written to the "dylink" section + // when build with -shared or -pie. + uint32_t MemAlign = 0; + uint32_t MemSize = 0; std::vector<const WasmSignature *> Types; DenseMap<WasmSignature, int32_t> TypeIndices; std::vector<const Symbol *> ImportedSymbols; unsigned NumImportedFunctions = 0; unsigned NumImportedGlobals = 0; + unsigned NumImportedEvents = 0; std::vector<WasmExport> Exports; std::vector<const DefinedData *> DefinedFakeGlobals; std::vector<InputGlobal *> InputGlobals; std::vector<InputFunction *> InputFunctions; + std::vector<InputEvent *> InputEvents; std::vector<const FunctionSymbol *> IndirectFunctions; std::vector<const Symbol *> SymtabEntries; std::vector<WasmInitEntry> InitFunctions; @@ -155,17 +164,19 @@ void Writer::createImportSection() { Import.Memory.Flags |= WASM_LIMITS_FLAG_HAS_MAX; Import.Memory.Maximum = MaxMemoryPages; } + if (Config->SharedMemory) + Import.Memory.Flags |= WASM_LIMITS_FLAG_IS_SHARED; writeImport(OS, Import); } if (Config->ImportTable) { - uint32_t TableSize = kInitialTableOffset + IndirectFunctions.size(); + uint32_t TableSize = TableBase + IndirectFunctions.size(); WasmImport Import; Import.Module = "env"; Import.Field = kFunctionTableName; Import.Kind = WASM_EXTERNAL_TABLE; - Import.Table.ElemType = WASM_TYPE_ANYFUNC; - Import.Table.Limits = {WASM_LIMITS_FLAG_HAS_MAX, TableSize, TableSize}; + Import.Table.ElemType = WASM_TYPE_FUNCREF; + Import.Table.Limits = {0, TableSize, 0}; writeImport(OS, Import); } @@ -175,11 +186,15 @@ void Writer::createImportSection() { Import.Field = Sym->getName(); if (auto *FunctionSym = dyn_cast<FunctionSymbol>(Sym)) { Import.Kind = WASM_EXTERNAL_FUNCTION; - Import.SigIndex = lookupType(*FunctionSym->FunctionType); - } else { - auto *GlobalSym = cast<GlobalSymbol>(Sym); + Import.SigIndex = lookupType(*FunctionSym->Signature); + } else if (auto *GlobalSym = dyn_cast<GlobalSymbol>(Sym)) { Import.Kind = WASM_EXTERNAL_GLOBAL; Import.Global = *GlobalSym->getGlobalType(); + } else { + auto *EventSym = cast<EventSymbol>(Sym); + Import.Kind = WASM_EXTERNAL_EVENT; + Import.Event.Attribute = EventSym->getEventType()->Attribute; + Import.Event.SigIndex = lookupType(*EventSym->Signature); } writeImport(OS, Import); } @@ -214,8 +229,12 @@ void Writer::createMemorySection() { bool HasMax = MaxMemoryPages != 0; writeUleb128(OS, 1, "memory count"); - writeUleb128(OS, HasMax ? static_cast<unsigned>(WASM_LIMITS_FLAG_HAS_MAX) : 0, - "memory limits flags"); + unsigned Flags = 0; + if (HasMax) + Flags |= WASM_LIMITS_FLAG_HAS_MAX; + if (Config->SharedMemory) + Flags |= WASM_LIMITS_FLAG_IS_SHARED; + writeUleb128(OS, Flags, "memory limits flags"); writeUleb128(OS, NumMemoryPages, "initial pages"); if (HasMax) writeUleb128(OS, MaxMemoryPages, "max pages"); @@ -241,6 +260,31 @@ void Writer::createGlobalSection() { } } +// The event section contains a list of declared wasm events associated with the +// module. Currently the only supported event kind is exceptions. A single event +// entry represents a single event with an event tag. All C++ exceptions are +// represented by a single event. An event entry in this section contains +// information on what kind of event it is (e.g. exception) and the type of +// values contained in a single event object. (In wasm, an event can contain +// multiple values of primitive types. But for C++ exceptions, we just throw a +// pointer which is an i32 value (for wasm32 architecture), so the signature of +// C++ exception is (i32)->(void), because all event types are assumed to have +// void return type to share WasmSignature with functions.) +void Writer::createEventSection() { + unsigned NumEvents = InputEvents.size(); + if (NumEvents == 0) + return; + + SyntheticSection *Section = createSyntheticSection(WASM_SEC_EVENT); + raw_ostream &OS = Section->getStream(); + + writeUleb128(OS, NumEvents, "event count"); + for (InputEvent *E : InputEvents) { + E->Event.Type.SigIndex = lookupType(E->Signature); + writeEvent(OS, E->Event); + } +} + void Writer::createTableSection() { if (Config->ImportTable) return; @@ -253,14 +297,14 @@ void Writer::createTableSection() { // no address-taken function will fail at validation time since it is // a validation error to include a call_indirect instruction if there // is not table. - uint32_t TableSize = kInitialTableOffset + IndirectFunctions.size(); + uint32_t TableSize = TableBase + IndirectFunctions.size(); SyntheticSection *Section = createSyntheticSection(WASM_SEC_TABLE); raw_ostream &OS = Section->getStream(); writeUleb128(OS, 1, "table count"); WasmLimits Limits = {WASM_LIMITS_FLAG_HAS_MAX, TableSize, TableSize}; - writeTableType(OS, WasmTable{WASM_TYPE_ANYFUNC, Limits}); + writeTableType(OS, WasmTable{WASM_TYPE_FUNCREF, Limits}); } void Writer::createExportSection() { @@ -319,12 +363,17 @@ void Writer::createElemSection() { writeUleb128(OS, 1, "segment count"); writeUleb128(OS, 0, "table index"); WasmInitExpr InitExpr; - InitExpr.Opcode = WASM_OPCODE_I32_CONST; - InitExpr.Value.Int32 = kInitialTableOffset; + if (Config->Pic) { + InitExpr.Opcode = WASM_OPCODE_GLOBAL_GET; + InitExpr.Value.Global = WasmSym::TableBase->getGlobalIndex(); + } else { + InitExpr.Opcode = WASM_OPCODE_I32_CONST; + InitExpr.Value.Int32 = TableBase; + } writeInitExpr(OS, InitExpr); writeUleb128(OS, IndirectFunctions.size(), "elem count"); - uint32_t TableIndex = kInitialTableOffset; + uint32_t TableIndex = TableBase; for (const FunctionSymbol *Sym : IndirectFunctions) { assert(Sym->getTableIndex() == TableIndex); writeUleb128(OS, Sym->getFunctionIndex(), "function index"); @@ -419,6 +468,21 @@ public: raw_string_ostream OS{Body}; }; +// Create the custom "dylink" section containing information for the dynamic +// linker. +// See +// https://github.com/WebAssembly/tool-conventions/blob/master/DynamicLinking.md +void Writer::createDylinkSection() { + SyntheticSection *Section = createSyntheticSection(WASM_SEC_CUSTOM, "dylink"); + raw_ostream &OS = Section->getStream(); + + writeUleb128(OS, MemSize, "MemSize"); + writeUleb128(OS, MemAlign, "MemAlign"); + writeUleb128(OS, IndirectFunctions.size(), "TableSize"); + writeUleb128(OS, 0, "TableAlign"); + writeUleb128(OS, 0, "Needed"); // TODO: Support "needed" shared libraries +} + // Create the custom "linking" section containing linker metadata. // This is only created when relocatable output is requested. void Writer::createLinkingSection() { @@ -448,6 +512,10 @@ void Writer::createLinkingSection() { writeUleb128(Sub.OS, G->getGlobalIndex(), "index"); if (Sym->isDefined()) writeStr(Sub.OS, Sym->getName(), "sym name"); + } else if (auto *E = dyn_cast<EventSymbol>(Sym)) { + writeUleb128(Sub.OS, E->getEventIndex(), "index"); + if (Sym->isDefined()) + writeStr(Sub.OS, Sym->getName(), "sym name"); } else if (isa<DataSymbol>(Sym)) { writeStr(Sub.OS, Sym->getName(), "sym name"); if (auto *DataSym = dyn_cast<DefinedData>(Sym)) { @@ -548,8 +616,7 @@ void Writer::createNameSection() { for (const Symbol *S : ImportedSymbols) { if (auto *F = dyn_cast<FunctionSymbol>(S)) { writeUleb128(Sub.OS, F->getFunctionIndex(), "func index"); - Optional<std::string> Name = demangleItanium(F->getName()); - writeStr(Sub.OS, Name ? StringRef(*Name) : F->getName(), "symbol name"); + writeStr(Sub.OS, toString(*S), "symbol name"); } } for (const InputFunction *F : InputFunctions) { @@ -558,8 +625,7 @@ void Writer::createNameSection() { if (!F->getDebugName().empty()) { writeStr(Sub.OS, F->getDebugName(), "symbol name"); } else { - Optional<std::string> Name = demangleItanium(F->getName()); - writeStr(Sub.OS, Name ? StringRef(*Name) : F->getName(), "symbol name"); + writeStr(Sub.OS, maybeDemangleSymbol(F->getName()), "symbol name"); } } } @@ -586,16 +652,16 @@ void Writer::writeSections() { // - heap start / unallocated // // The --stack-first option means that stack is placed before any static data. -// This can be useful since it means that stack overflow traps immediately rather -// than overwriting global data, but also increases code size since all static -// data loads and stores requires larger offsets. +// This can be useful since it means that stack overflow traps immediately +// rather than overwriting global data, but also increases code size since all +// static data loads and stores requires larger offsets. void Writer::layoutMemory() { createOutputSegments(); uint32_t MemoryPtr = 0; auto PlaceStack = [&]() { - if (Config->Relocatable) + if (Config->Relocatable || Config->Shared) return; MemoryPtr = alignTo(MemoryPtr, kStackAlignment); if (Config->ZStackSize != alignTo(Config->ZStackSize, kStackAlignment)) @@ -603,7 +669,8 @@ void Writer::layoutMemory() { log("mem: stack size = " + Twine(Config->ZStackSize)); log("mem: stack base = " + Twine(MemoryPtr)); MemoryPtr += Config->ZStackSize; - WasmSym::StackPointer->Global->Global.InitExpr.Value.Int32 = MemoryPtr; + auto *SP = cast<DefinedGlobal>(WasmSym::StackPointer); + SP->Global->Global.InitExpr.Value.Int32 = MemoryPtr; log("mem: stack top = " + Twine(MemoryPtr)); }; @@ -621,8 +688,10 @@ void Writer::layoutMemory() { if (WasmSym::DsoHandle) WasmSym::DsoHandle->setVirtualAddress(DataStart); + MemAlign = 0; for (OutputSegment *Seg : Segments) { - MemoryPtr = alignTo(MemoryPtr, Seg->Alignment); + MemAlign = std::max(MemAlign, Seg->Alignment); + MemoryPtr = alignTo(MemoryPtr, 1 << Seg->Alignment); Seg->StartVA = MemoryPtr; log(formatv("mem: {0,-15} offset={1,-8} size={2,-8} align={3}", Seg->Name, MemoryPtr, Seg->Size, Seg->Alignment)); @@ -635,6 +704,11 @@ void Writer::layoutMemory() { log("mem: static data = " + Twine(MemoryPtr - DataStart)); + if (Config->Shared) { + MemSize = MemoryPtr; + return; + } + if (!Config->StackFirst) PlaceStack(); @@ -654,8 +728,8 @@ void Writer::layoutMemory() { else MemoryPtr = Config->InitialMemory; } - uint32_t MemSize = alignTo(MemoryPtr, WasmPageSize); - NumMemoryPages = MemSize / WasmPageSize; + MemSize = MemoryPtr; + NumMemoryPages = alignTo(MemoryPtr, WasmPageSize) / WasmPageSize; log("mem: total pages = " + Twine(NumMemoryPages)); if (Config->MaxMemory != 0) { @@ -678,12 +752,15 @@ SyntheticSection *Writer::createSyntheticSection(uint32_t Type, void Writer::createSections() { // Known sections + if (Config->Pic) + createDylinkSection(); createTypeSection(); createImportSection(); createFunctionSection(); createTableSection(); createMemorySection(); createGlobalSection(); + createEventSection(); createExportSection(); createElemSection(); createCodeSection(); @@ -722,8 +799,10 @@ void Writer::calculateImports() { ImportedSymbols.emplace_back(Sym); if (auto *F = dyn_cast<FunctionSymbol>(Sym)) F->setFunctionIndex(NumImportedFunctions++); + else if (auto *G = dyn_cast<GlobalSymbol>(Sym)) + G->setGlobalIndex(NumImportedGlobals++); else - cast<GlobalSymbol>(Sym)->setGlobalIndex(NumImportedGlobals++); + cast<EventSymbol>(Sym)->setEventIndex(NumImportedEvents++); } } @@ -759,6 +838,8 @@ void Writer::calculateExports() { continue; } Export = {Name, WASM_EXTERNAL_GLOBAL, G->getGlobalIndex()}; + } else if (auto *E = dyn_cast<DefinedEvent>(Sym)) { + Export = {Name, WASM_EXTERNAL_EVENT, E->getEventIndex()}; } else { auto *D = cast<DefinedData>(Sym); DefinedFakeGlobals.emplace_back(D); @@ -836,6 +917,8 @@ void Writer::calculateTypes() { // 1. Any signature used in the TYPE relocation // 2. The signatures of all imported functions // 3. The signatures of all defined functions + // 4. The signatures of all imported events + // 5. The signatures of all defined events for (ObjFile *File : Symtab->ObjectFiles) { ArrayRef<WasmSignature> Types = File->getWasmObj()->types(); @@ -844,16 +927,23 @@ void Writer::calculateTypes() { File->TypeMap[I] = registerType(Types[I]); } - for (const Symbol *Sym : ImportedSymbols) + for (const Symbol *Sym : ImportedSymbols) { if (auto *F = dyn_cast<FunctionSymbol>(Sym)) - registerType(*F->FunctionType); + registerType(*F->Signature); + else if (auto *E = dyn_cast<EventSymbol>(Sym)) + registerType(*E->Signature); + } for (const InputFunction *F : InputFunctions) registerType(F->Signature); + + for (const InputEvent *E : InputEvents) + registerType(E->Signature); } void Writer::assignIndexes() { - uint32_t FunctionIndex = NumImportedFunctions + InputFunctions.size(); + assert(InputFunctions.empty()); + uint32_t FunctionIndex = NumImportedFunctions; auto AddDefinedFunction = [&](InputFunction *Func) { if (!Func->Live) return; @@ -870,7 +960,7 @@ void Writer::assignIndexes() { AddDefinedFunction(Func); } - uint32_t TableIndex = kInitialTableOffset; + uint32_t TableIndex = TableBase; auto HandleRelocs = [&](InputChunk *Chunk) { if (!Chunk->Live) return; @@ -902,7 +992,8 @@ void Writer::assignIndexes() { HandleRelocs(P); } - uint32_t GlobalIndex = NumImportedGlobals + InputGlobals.size(); + assert(InputGlobals.empty()); + uint32_t GlobalIndex = NumImportedGlobals; auto AddDefinedGlobal = [&](InputGlobal *Global) { if (Global->Live) { LLVM_DEBUG(dbgs() << "AddDefinedGlobal: " << GlobalIndex << "\n"); @@ -919,9 +1010,29 @@ void Writer::assignIndexes() { for (InputGlobal *Global : File->Globals) AddDefinedGlobal(Global); } + + assert(InputEvents.empty()); + uint32_t EventIndex = NumImportedEvents; + auto AddDefinedEvent = [&](InputEvent *Event) { + if (Event->Live) { + LLVM_DEBUG(dbgs() << "AddDefinedEvent: " << EventIndex << "\n"); + Event->setEventIndex(EventIndex++); + InputEvents.push_back(Event); + } + }; + + for (ObjFile *File : Symtab->ObjectFiles) { + LLVM_DEBUG(dbgs() << "Events: " << File->getName() << "\n"); + for (InputEvent *Event : File->Events) + AddDefinedEvent(Event); + } } static StringRef getOutputDataSegmentName(StringRef Name) { + // With PIC code we currently only support a single data segment since + // we only have a single __memory_base to use as our base address. + if (Config->Pic) + return "data"; if (!Config->MergeDataSegments) return Name; if (Name.startswith(".text.")) @@ -930,6 +1041,8 @@ static StringRef getOutputDataSegmentName(StringRef Name) { return ".data"; if (Name.startswith(".bss.")) return ".bss"; + if (Name.startswith(".rodata.")) + return ".rodata"; return Name; } @@ -977,7 +1090,7 @@ void Writer::createCtorFunction() { OS << BodyContent; } - ArrayRef<uint8_t> Body = toArrayRef(Saver.save(FunctionBody)); + ArrayRef<uint8_t> Body = arrayRefFromStringRef(Saver.save(FunctionBody)); cast<SyntheticFunction>(WasmSym::CallCtors->Function)->setBody(Body); } @@ -989,7 +1102,7 @@ void Writer::calculateInitFunctions() { const WasmLinkingData &L = File->getWasmObj()->linkingData(); for (const WasmInitFunc &F : L.InitFunctions) { FunctionSymbol *Sym = File->getFunctionSymbol(F.Symbol); - if (*Sym->FunctionType != WasmSignature{{}, WASM_TYPE_NORESULT}) + if (*Sym->Signature != WasmSignature{{}, {}}) error("invalid signature for init func: " + toString(*Sym)); InitFunctions.emplace_back(WasmInitEntry{Sym, F.Priority}); } @@ -1004,9 +1117,14 @@ void Writer::calculateInitFunctions() { } void Writer::run() { - if (Config->Relocatable) + if (Config->Relocatable || Config->Pic) Config->GlobalBase = 0; + // For PIC code the table base is assigned dynamically by the loader. + // For non-PIC, we start at 1 so that accessing table index 0 always traps. + if (!Config->Pic) + TableBase = 1; + log("-- calculateImports"); calculateImports(); log("-- assignIndexes"); @@ -1029,8 +1147,10 @@ void Writer::run() { if (errorHandler().Verbose) { log("Defined Functions: " + Twine(InputFunctions.size())); log("Defined Globals : " + Twine(InputGlobals.size())); + log("Defined Events : " + Twine(InputEvents.size())); log("Function Imports : " + Twine(NumImportedFunctions)); log("Global Imports : " + Twine(NumImportedGlobals)); + log("Event Imports : " + Twine(NumImportedEvents)); for (ObjFile *File : Symtab->ObjectFiles) File->dumpInfo(); } diff --git a/wasm/WriterUtils.cpp b/wasm/WriterUtils.cpp index 201529edeaa6..80bfc0916121 100644 --- a/wasm/WriterUtils.cpp +++ b/wasm/WriterUtils.cpp @@ -17,22 +17,6 @@ using namespace llvm; using namespace llvm::wasm; -using namespace lld::wasm; - -static const char *valueTypeToString(uint8_t Type) { - switch (Type) { - case WASM_TYPE_I32: - return "i32"; - case WASM_TYPE_I64: - return "i64"; - case WASM_TYPE_F32: - return "f32"; - case WASM_TYPE_F64: - return "f64"; - default: - llvm_unreachable("invalid value type"); - } -} namespace lld { @@ -73,21 +57,20 @@ void wasm::writeU32(raw_ostream &OS, uint32_t Number, const Twine &Msg) { support::endian::write(OS, Number, support::little); } -void wasm::writeValueType(raw_ostream &OS, uint8_t Type, const Twine &Msg) { - writeU8(OS, Type, Msg + "[type: " + valueTypeToString(Type) + "]"); +void wasm::writeValueType(raw_ostream &OS, ValType Type, const Twine &Msg) { + writeU8(OS, static_cast<uint8_t>(Type), + Msg + "[type: " + toString(Type) + "]"); } void wasm::writeSig(raw_ostream &OS, const WasmSignature &Sig) { writeU8(OS, WASM_TYPE_FUNC, "signature type"); - writeUleb128(OS, Sig.ParamTypes.size(), "param Count"); - for (uint8_t ParamType : Sig.ParamTypes) { + writeUleb128(OS, Sig.Params.size(), "param Count"); + for (ValType ParamType : Sig.Params) { writeValueType(OS, ParamType, "param type"); } - if (Sig.ReturnType == WASM_TYPE_NORESULT) { - writeUleb128(OS, 0, "result Count"); - } else { - writeUleb128(OS, 1, "result Count"); - writeValueType(OS, Sig.ReturnType, "result type"); + writeUleb128(OS, Sig.Returns.size(), "result Count"); + if (Sig.Returns.size()) { + writeValueType(OS, Sig.Returns[0], "result type"); } } @@ -100,7 +83,7 @@ void wasm::writeInitExpr(raw_ostream &OS, const WasmInitExpr &InitExpr) { case WASM_OPCODE_I64_CONST: writeSleb128(OS, InitExpr.Value.Int64, "literal (i64)"); break; - case WASM_OPCODE_GET_GLOBAL: + case WASM_OPCODE_GLOBAL_GET: writeUleb128(OS, InitExpr.Value.Global, "literal (global index)"); break; default: @@ -117,7 +100,8 @@ void wasm::writeLimits(raw_ostream &OS, const WasmLimits &Limits) { } void wasm::writeGlobalType(raw_ostream &OS, const WasmGlobalType &Type) { - writeValueType(OS, Type.Type, "global type"); + // TODO: Update WasmGlobalType to use ValType and remove this cast. + writeValueType(OS, ValType(Type.Type), "global type"); writeU8(OS, Type.Mutable, "global mutable"); } @@ -126,8 +110,17 @@ void wasm::writeGlobal(raw_ostream &OS, const WasmGlobal &Global) { writeInitExpr(OS, Global.InitExpr); } +void wasm::writeEventType(raw_ostream &OS, const WasmEventType &Type) { + writeUleb128(OS, Type.Attribute, "event attribute"); + writeUleb128(OS, Type.SigIndex, "sig index"); +} + +void wasm::writeEvent(raw_ostream &OS, const WasmEvent &Event) { + writeEventType(OS, Event.Type); +} + void wasm::writeTableType(raw_ostream &OS, const llvm::wasm::WasmTable &Type) { - writeU8(OS, WASM_TYPE_ANYFUNC, "table type"); + writeU8(OS, WASM_TYPE_FUNCREF, "table type"); writeLimits(OS, Type.Limits); } @@ -142,6 +135,9 @@ void wasm::writeImport(raw_ostream &OS, const WasmImport &Import) { case WASM_EXTERNAL_GLOBAL: writeGlobalType(OS, Import.Global); break; + case WASM_EXTERNAL_EVENT: + writeEventType(OS, Import.Event); + break; case WASM_EXTERNAL_MEMORY: writeLimits(OS, Import.Memory); break; @@ -178,13 +174,15 @@ void wasm::writeExport(raw_ostream &OS, const WasmExport &Export) { std::string lld::toString(ValType Type) { switch (Type) { case ValType::I32: - return "I32"; + return "i32"; case ValType::I64: - return "I64"; + return "i64"; case ValType::F32: - return "F32"; + return "f32"; case ValType::F64: - return "F64"; + return "f64"; + case ValType::V128: + return "v128"; case ValType::EXCEPT_REF: return "except_ref"; } @@ -193,20 +191,26 @@ std::string lld::toString(ValType Type) { std::string lld::toString(const WasmSignature &Sig) { SmallString<128> S("("); - for (uint32_t Type : Sig.ParamTypes) { + for (ValType Type : Sig.Params) { if (S.size() != 1) S += ", "; - S += toString(static_cast<ValType>(Type)); + S += toString(Type); } S += ") -> "; - if (Sig.ReturnType == WASM_TYPE_NORESULT) + if (Sig.Returns.size() == 0) S += "void"; else - S += toString(static_cast<ValType>(Sig.ReturnType)); + S += toString(Sig.Returns[0]); return S.str(); } -std::string lld::toString(const WasmGlobalType &Sig) { - return (Sig.Mutable ? "var " : "const ") + - toString(static_cast<ValType>(Sig.Type)); +std::string lld::toString(const WasmGlobalType &Type) { + return (Type.Mutable ? "var " : "const ") + + toString(static_cast<ValType>(Type.Type)); +} + +std::string lld::toString(const WasmEventType &Type) { + if (Type.Attribute == WASM_EVENT_ATTRIBUTE_EXCEPTION) + return "exception"; + return "unknown"; } diff --git a/wasm/WriterUtils.h b/wasm/WriterUtils.h index 74d727b24b40..7fc4b5aa83dc 100644 --- a/wasm/WriterUtils.h +++ b/wasm/WriterUtils.h @@ -13,9 +13,6 @@ #include "lld/Common/LLVM.h" #include "llvm/ADT/Twine.h" #include "llvm/Object/Wasm.h" -#include "llvm/Support/raw_ostream.h" - -using llvm::raw_ostream; namespace lld { namespace wasm { @@ -35,7 +32,8 @@ void writeU8(raw_ostream &OS, uint8_t byte, const Twine &Msg); void writeU32(raw_ostream &OS, uint32_t Number, const Twine &Msg); -void writeValueType(raw_ostream &OS, uint8_t Type, const Twine &Msg); +void writeValueType(raw_ostream &OS, llvm::wasm::ValType Type, + const Twine &Msg); void writeSig(raw_ostream &OS, const llvm::wasm::WasmSignature &Sig); @@ -47,6 +45,10 @@ void writeGlobalType(raw_ostream &OS, const llvm::wasm::WasmGlobalType &Type); void writeGlobal(raw_ostream &OS, const llvm::wasm::WasmGlobal &Global); +void writeEventType(raw_ostream &OS, const llvm::wasm::WasmEventType &Type); + +void writeEvent(raw_ostream &OS, const llvm::wasm::WasmEvent &Event); + void writeTableType(raw_ostream &OS, const llvm::wasm::WasmTable &Type); void writeImport(raw_ostream &OS, const llvm::wasm::WasmImport &Import); @@ -57,7 +59,8 @@ void writeExport(raw_ostream &OS, const llvm::wasm::WasmExport &Export); std::string toString(llvm::wasm::ValType Type); std::string toString(const llvm::wasm::WasmSignature &Sig); -std::string toString(const llvm::wasm::WasmGlobalType &Sig); +std::string toString(const llvm::wasm::WasmGlobalType &Type); +std::string toString(const llvm::wasm::WasmEventType &Type); } // namespace lld |