aboutsummaryrefslogtreecommitdiff
path: root/wasm/InputFiles.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'wasm/InputFiles.cpp')
-rw-r--r--wasm/InputFiles.cpp303
1 files changed, 303 insertions, 0 deletions
diff --git a/wasm/InputFiles.cpp b/wasm/InputFiles.cpp
new file mode 100644
index 000000000000..e7463da39db9
--- /dev/null
+++ b/wasm/InputFiles.cpp
@@ -0,0 +1,303 @@
+//===- InputFiles.cpp -----------------------------------------------------===//
+//
+// The LLVM Linker
+//
+// This file is distributed under the University of Illinois Open Source
+// License. See LICENSE.TXT for details.
+//
+//===----------------------------------------------------------------------===//
+
+#include "InputFiles.h"
+
+#include "Config.h"
+#include "InputSegment.h"
+#include "SymbolTable.h"
+#include "lld/Common/ErrorHandler.h"
+#include "lld/Common/Memory.h"
+#include "llvm/Object/Binary.h"
+#include "llvm/Object/Wasm.h"
+#include "llvm/Support/raw_ostream.h"
+
+#define DEBUG_TYPE "lld"
+
+using namespace lld;
+using namespace lld::wasm;
+
+using namespace llvm;
+using namespace llvm::object;
+using namespace llvm::wasm;
+
+Optional<MemoryBufferRef> lld::wasm::readFile(StringRef Path) {
+ log("Loading: " + Path);
+
+ auto MBOrErr = MemoryBuffer::getFile(Path);
+ if (auto EC = MBOrErr.getError()) {
+ error("cannot open " + Path + ": " + EC.message());
+ return None;
+ }
+ std::unique_ptr<MemoryBuffer> &MB = *MBOrErr;
+ MemoryBufferRef MBRef = MB->getMemBufferRef();
+ make<std::unique_ptr<MemoryBuffer>>(std::move(MB)); // take MB ownership
+
+ return MBRef;
+}
+
+void ObjFile::dumpInfo() const {
+ log("reloc info for: " + getName() + "\n" +
+ " FunctionIndexOffset : " + Twine(FunctionIndexOffset) + "\n" +
+ " NumFunctionImports : " + Twine(NumFunctionImports()) + "\n" +
+ " NumGlobalImports : " + Twine(NumGlobalImports()) + "\n");
+}
+
+bool ObjFile::isImportedFunction(uint32_t Index) const {
+ return Index < NumFunctionImports();
+}
+
+Symbol *ObjFile::getFunctionSymbol(uint32_t Index) const {
+ return FunctionSymbols[Index];
+}
+
+Symbol *ObjFile::getTableSymbol(uint32_t Index) const {
+ return TableSymbols[Index];
+}
+
+Symbol *ObjFile::getGlobalSymbol(uint32_t Index) const {
+ return GlobalSymbols[Index];
+}
+
+uint32_t ObjFile::getRelocatedAddress(uint32_t Index) const {
+ return getGlobalSymbol(Index)->getVirtualAddress();
+}
+
+uint32_t ObjFile::relocateFunctionIndex(uint32_t Original) const {
+ Symbol *Sym = getFunctionSymbol(Original);
+ uint32_t Index = Sym->getOutputIndex();
+ DEBUG(dbgs() << "relocateFunctionIndex: " << toString(*Sym) << ": "
+ << Original << " -> " << Index << "\n");
+ return Index;
+}
+
+uint32_t ObjFile::relocateTypeIndex(uint32_t Original) const {
+ return TypeMap[Original];
+}
+
+uint32_t ObjFile::relocateTableIndex(uint32_t Original) const {
+ Symbol *Sym = getTableSymbol(Original);
+ uint32_t Index = Sym->getTableIndex();
+ DEBUG(dbgs() << "relocateTableIndex: " << toString(*Sym) << ": " << Original
+ << " -> " << Index << "\n");
+ return Index;
+}
+
+uint32_t ObjFile::relocateGlobalIndex(uint32_t Original) const {
+ Symbol *Sym = getGlobalSymbol(Original);
+ uint32_t Index = Sym->getOutputIndex();
+ DEBUG(dbgs() << "relocateGlobalIndex: " << toString(*Sym) << ": " << Original
+ << " -> " << Index << "\n");
+ return Index;
+}
+
+void ObjFile::parse() {
+ // Parse a memory buffer as a wasm file.
+ DEBUG(dbgs() << "Parsing object: " << toString(this) << "\n");
+ std::unique_ptr<Binary> Bin = CHECK(createBinary(MB), toString(this));
+
+ auto *Obj = dyn_cast<WasmObjectFile>(Bin.get());
+ if (!Obj)
+ fatal(toString(this) + ": not a wasm file");
+ if (!Obj->isRelocatableObject())
+ fatal(toString(this) + ": not a relocatable wasm file");
+
+ Bin.release();
+ WasmObj.reset(Obj);
+
+ // Find the code and data sections. Wasm objects can have at most one code
+ // and one data section.
+ for (const SectionRef &Sec : WasmObj->sections()) {
+ const WasmSection &Section = WasmObj->getWasmSection(Sec);
+ if (Section.Type == WASM_SEC_CODE)
+ CodeSection = &Section;
+ else if (Section.Type == WASM_SEC_DATA)
+ DataSection = &Section;
+ }
+
+ initializeSymbols();
+}
+
+// Return the InputSegment in which a given symbol is defined.
+InputSegment *ObjFile::getSegment(const WasmSymbol &WasmSym) {
+ uint32_t Address = WasmObj->getWasmSymbolValue(WasmSym);
+ for (InputSegment *Segment : Segments) {
+ if (Address >= Segment->startVA() && Address < Segment->endVA()) {
+ DEBUG(dbgs() << "Found symbol in segment: " << WasmSym.Name << " -> "
+ << Segment->getName() << "\n");
+
+ return Segment;
+ }
+ }
+ error("symbol not found in any segment: " + WasmSym.Name);
+ return nullptr;
+}
+
+static void copyRelocationsRange(std::vector<WasmRelocation> &To,
+ ArrayRef<WasmRelocation> From, size_t Start,
+ size_t End) {
+ for (const WasmRelocation &R : From)
+ if (R.Offset >= Start && R.Offset < End)
+ To.push_back(R);
+}
+
+void ObjFile::initializeSymbols() {
+ Symbols.reserve(WasmObj->getNumberOfSymbols());
+
+ for (const WasmImport &Import : WasmObj->imports()) {
+ switch (Import.Kind) {
+ case WASM_EXTERNAL_FUNCTION:
+ ++FunctionImports;
+ break;
+ case WASM_EXTERNAL_GLOBAL:
+ ++GlobalImports;
+ break;
+ }
+ }
+
+ FunctionSymbols.resize(FunctionImports + WasmObj->functions().size());
+ GlobalSymbols.resize(GlobalImports + WasmObj->globals().size());
+
+ for (const WasmSegment &S : WasmObj->dataSegments()) {
+ InputSegment *Seg = make<InputSegment>(&S, this);
+ copyRelocationsRange(Seg->Relocations, DataSection->Relocations,
+ Seg->getInputSectionOffset(),
+ Seg->getInputSectionOffset() + Seg->getSize());
+ Segments.emplace_back(Seg);
+ }
+
+ // Populate `FunctionSymbols` and `GlobalSymbols` based on the WasmSymbols
+ // in the object
+ for (const SymbolRef &Sym : WasmObj->symbols()) {
+ const WasmSymbol &WasmSym = WasmObj->getWasmSymbol(Sym.getRawDataRefImpl());
+ Symbol *S;
+ switch (WasmSym.Type) {
+ case WasmSymbol::SymbolType::FUNCTION_IMPORT:
+ case WasmSymbol::SymbolType::GLOBAL_IMPORT:
+ S = createUndefined(WasmSym);
+ break;
+ case WasmSymbol::SymbolType::GLOBAL_EXPORT:
+ S = createDefined(WasmSym, getSegment(WasmSym));
+ break;
+ case WasmSymbol::SymbolType::FUNCTION_EXPORT:
+ S = createDefined(WasmSym);
+ break;
+ case WasmSymbol::SymbolType::DEBUG_FUNCTION_NAME:
+ // These are for debugging only, no need to create linker symbols for them
+ continue;
+ }
+
+ Symbols.push_back(S);
+ if (WasmSym.isFunction()) {
+ DEBUG(dbgs() << "Function: " << WasmSym.ElementIndex << " -> "
+ << toString(*S) << "\n");
+ FunctionSymbols[WasmSym.ElementIndex] = S;
+ } else {
+ DEBUG(dbgs() << "Global: " << WasmSym.ElementIndex << " -> "
+ << toString(*S) << "\n");
+ GlobalSymbols[WasmSym.ElementIndex] = S;
+ }
+ }
+
+ // Populate `TableSymbols` with all symbols that are called indirectly
+ uint32_t SegmentCount = WasmObj->elements().size();
+ if (SegmentCount) {
+ if (SegmentCount > 1)
+ fatal(getName() + ": contains more than one element segment");
+ const WasmElemSegment &Segment = WasmObj->elements()[0];
+ if (Segment.Offset.Opcode != WASM_OPCODE_I32_CONST)
+ fatal(getName() + ": unsupported element segment");
+ if (Segment.TableIndex != 0)
+ fatal(getName() + ": unsupported table index in elem segment");
+ if (Segment.Offset.Value.Int32 != 0)
+ fatal(getName() + ": unsupported element segment offset");
+ TableSymbols.reserve(Segment.Functions.size());
+ for (uint64_t FunctionIndex : Segment.Functions)
+ TableSymbols.push_back(getFunctionSymbol(FunctionIndex));
+ }
+
+ DEBUG(dbgs() << "TableSymbols: " << TableSymbols.size() << "\n");
+ DEBUG(dbgs() << "Functions : " << FunctionSymbols.size() << "\n");
+ DEBUG(dbgs() << "Globals : " << GlobalSymbols.size() << "\n");
+}
+
+Symbol *ObjFile::createUndefined(const WasmSymbol &Sym) {
+ return Symtab->addUndefined(this, &Sym);
+}
+
+Symbol *ObjFile::createDefined(const WasmSymbol &Sym,
+ const InputSegment *Segment) {
+ Symbol *S;
+ if (Sym.isLocal()) {
+ S = make<Symbol>(Sym.Name, true);
+ Symbol::Kind Kind;
+ if (Sym.Type == WasmSymbol::SymbolType::FUNCTION_EXPORT)
+ Kind = Symbol::Kind::DefinedFunctionKind;
+ else if (Sym.Type == WasmSymbol::SymbolType::GLOBAL_EXPORT)
+ Kind = Symbol::Kind::DefinedGlobalKind;
+ else
+ llvm_unreachable("invalid local symbol type");
+ S->update(Kind, this, &Sym, Segment);
+ return S;
+ }
+ return Symtab->addDefined(this, &Sym, Segment);
+}
+
+void ArchiveFile::parse() {
+ // Parse a MemoryBufferRef as an archive file.
+ DEBUG(dbgs() << "Parsing library: " << toString(this) << "\n");
+ File = CHECK(Archive::create(MB), toString(this));
+
+ // Read the symbol table to construct Lazy symbols.
+ int Count = 0;
+ for (const Archive::Symbol &Sym : File->symbols()) {
+ Symtab->addLazy(this, &Sym);
+ ++Count;
+ }
+ DEBUG(dbgs() << "Read " << Count << " symbols\n");
+}
+
+void ArchiveFile::addMember(const Archive::Symbol *Sym) {
+ const Archive::Child &C =
+ CHECK(Sym->getMember(),
+ "could not get the member for symbol " + Sym->getName());
+
+ // Don't try to load the same member twice (this can happen when members
+ // mutually reference each other).
+ if (!Seen.insert(C.getChildOffset()).second)
+ return;
+
+ DEBUG(dbgs() << "loading lazy: " << Sym->getName() << "\n");
+ DEBUG(dbgs() << "from archive: " << toString(this) << "\n");
+
+ MemoryBufferRef MB =
+ CHECK(C.getMemoryBufferRef(),
+ "could not get the buffer for the member defining symbol " +
+ Sym->getName());
+
+ if (identify_magic(MB.getBuffer()) != file_magic::wasm_object) {
+ error("unknown file type: " + MB.getBufferIdentifier());
+ return;
+ }
+
+ InputFile *Obj = make<ObjFile>(MB);
+ Obj->ParentName = ParentName;
+ Symtab->addFile(Obj);
+}
+
+// Returns a string in the format of "foo.o" or "foo.a(bar.o)".
+std::string lld::toString(const wasm::InputFile *File) {
+ if (!File)
+ return "<internal>";
+
+ if (File->ParentName.empty())
+ return File->getName();
+
+ return (File->ParentName + "(" + File->getName() + ")").str();
+}