//===- Wasm.h - Wasm object file format -------------------------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file defines manifest constants for the wasm object file format.
// See: https://github.com/WebAssembly/design/blob/master/BinaryEncoding.md
//
//===----------------------------------------------------------------------===//
13
14#ifndef LLVM_BINARYFORMAT_WASM_H
15#define LLVM_BINARYFORMAT_WASM_H
16
#include "llvm/ADT/ArrayRef.h"
#include "llvm/ADT/Optional.h"
#include "llvm/ADT/SmallVector.h"
#include "llvm/ADT/StringRef.h"
#include <utility>
Andrew Scull5e1ddfa2018-08-14 10:06:54 +010021
22namespace llvm {
23namespace wasm {
24
// Object file magic: the four bytes '\0', 'a', 's', 'm'. The array holds
// exactly those bytes and has no trailing NUL terminator.
const char WasmMagic[] = {'\0', 'a', 's', 'm'};

// Version of the wasm binary format.
const uint32_t WasmVersion = 1;

// Version of the wasm linking metadata.
const uint32_t WasmMetadataVersion = 2;

// Wasm pages are 64k in size.
const uint32_t WasmPageSize = 64 * 1024;
33
34struct WasmObjectHeader {
35 StringRef Magic;
36 uint32_t Version;
37};
38
Andrew Walbran16937d02019-10-22 13:54:20 +010039struct WasmDylinkInfo {
40 uint32_t MemorySize; // Memory size in bytes
41 uint32_t MemoryAlignment; // P2 alignment of memory
42 uint32_t TableSize; // Table size in elements
43 uint32_t TableAlignment; // P2 alignment of table
Olivier Deprezf4ef2d02021-04-20 13:36:24 +020044 std::vector<StringRef> Needed; // Shared library dependencies
Andrew Walbran16937d02019-10-22 13:54:20 +010045};
46
// Three lists of string pairs, one list per producer category.
// NOTE(review): each pair is presumably (name, version) -- confirm against
// the code that fills these in.
struct WasmProducerInfo {
  std::vector<std::pair<std::string, std::string>> Languages;
  std::vector<std::pair<std::string, std::string>> Tools;
  std::vector<std::pair<std::string, std::string>> SDKs;
};
52
// A feature name together with a one-byte prefix.
// NOTE(review): Prefix presumably holds one of the WASM_FEATURE_PREFIX_*
// values -- confirm.
struct WasmFeatureEntry {
  uint8_t Prefix;
  std::string Name;
};
57
Andrew Scull5e1ddfa2018-08-14 10:06:54 +010058struct WasmExport {
59 StringRef Name;
60 uint8_t Kind;
61 uint32_t Index;
62};
63
// A flags byte plus initial and maximum limit values.
// NOTE(review): Flags is presumably a combination of WASM_LIMITS_FLAG_*
// bits -- confirm.
struct WasmLimits {
  uint8_t Flags;
  uint64_t Initial;
  uint64_t Maximum;
};
69
70struct WasmTableType {
71 uint8_t ElemType;
72 WasmLimits Limits;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +010073};
74
75struct WasmTable {
Olivier Deprezf4ef2d02021-04-20 13:36:24 +020076 uint32_t Index;
77 WasmTableType Type;
78 StringRef SymbolName; // from the "linking" section
Andrew Scull5e1ddfa2018-08-14 10:06:54 +010079};
80
// An initializer expression: an opcode byte and a single operand value.
// The union does not record which member is active.
// NOTE(review): Opcode presumably selects the active member -- confirm.
struct WasmInitExpr {
  uint8_t Opcode;
  union {
    int32_t Int32;
    int64_t Int64;
    // Float operands are held in unsigned integers of matching width.
    uint32_t Float32;
    uint64_t Float64;
    uint32_t Global;
  } Value;
};
91
// Type of a global: a type byte and a mutability flag.
struct WasmGlobalType {
  uint8_t Type;
  bool Mutable;
};
96
97struct WasmGlobal {
98 uint32_t Index;
99 WasmGlobalType Type;
100 WasmInitExpr InitExpr;
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100101 StringRef SymbolName; // from the "linking" section
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100102};
103
// Type of an event: an attribute and a signature index.
struct WasmEventType {
  // The kind of event. WASM_EVENT_ATTRIBUTE_EXCEPTION is currently the only
  // possible value.
  uint32_t Attribute;
  uint32_t SigIndex;
};
109
110struct WasmEvent {
111 uint32_t Index;
112 WasmEventType Type;
113 StringRef SymbolName; // from the "linking" section
114};
115
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100116struct WasmImport {
117 StringRef Module;
118 StringRef Field;
119 uint8_t Kind;
120 union {
121 uint32_t SigIndex;
122 WasmGlobalType Global;
Olivier Deprezf4ef2d02021-04-20 13:36:24 +0200123 WasmTableType Table;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100124 WasmLimits Memory;
Andrew Walbran16937d02019-10-22 13:54:20 +0100125 WasmEventType Event;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100126 };
127};
128
// A local declaration: a type byte and a count.
struct WasmLocalDecl {
  uint8_t Type;
  uint32_t Count;
};
133
134struct WasmFunction {
135 uint32_t Index;
136 std::vector<WasmLocalDecl> Locals;
137 ArrayRef<uint8_t> Body;
138 uint32_t CodeSectionOffset;
139 uint32_t Size;
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100140 uint32_t CodeOffset; // start of Locals and Body
Olivier Deprezf4ef2d02021-04-20 13:36:24 +0200141 Optional<StringRef> ExportName; // from the "export" section
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100142 StringRef SymbolName; // from the "linking" section
Andrew Scull0372a572018-11-16 15:47:06 +0000143 StringRef DebugName; // from the "name" section
144 uint32_t Comdat; // from the "comdat info" section
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100145};
146
147struct WasmDataSegment {
Andrew Walbran3d2c1972020-04-07 12:24:26 +0100148 uint32_t InitFlags;
149 uint32_t MemoryIndex; // present if InitFlags & WASM_SEGMENT_HAS_MEMINDEX
150 WasmInitExpr Offset; // present if InitFlags & WASM_SEGMENT_IS_PASSIVE == 0
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100151 ArrayRef<uint8_t> Content;
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100152 StringRef Name; // from the "segment info" section
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100153 uint32_t Alignment;
Andrew Walbran3d2c1972020-04-07 12:24:26 +0100154 uint32_t LinkerFlags;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100155 uint32_t Comdat; // from the "comdat info" section
156};
157
158struct WasmElemSegment {
159 uint32_t TableIndex;
160 WasmInitExpr Offset;
161 std::vector<uint32_t> Functions;
162};
163
// Locates a Wasm data symbol inside a WasmDataSegment: which segment it lives
// in (by index), and its offset and size within that segment.
struct WasmDataReference {
  uint32_t Segment;
  uint64_t Offset;
  uint64_t Size;
};
171
// A single relocation record.
struct WasmRelocation {
  // The relocation's type.
  uint8_t Type;
  // An index into the symbol index space or the type index space.
  uint32_t Index;
  // Offset measured from the start of the section.
  uint64_t Offset;
  // Value that is added to the symbol.
  int64_t Addend;
};
178
// An init function entry: a priority and a symbol.
// NOTE(review): Symbol is presumably an index into the symbol table --
// confirm.
struct WasmInitFunc {
  uint32_t Priority;
  uint32_t Symbol;
};
183
184struct WasmSymbolInfo {
185 StringRef Name;
186 uint8_t Kind;
187 uint32_t Flags;
Olivier Deprezf4ef2d02021-04-20 13:36:24 +0200188 // For undefined symbols the module of the import
189 Optional<StringRef> ImportModule;
190 // For undefined symbols the name of the import
191 Optional<StringRef> ImportName;
192 // For symbols to be exported from the final module
193 Optional<StringRef> ExportName;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100194 union {
Olivier Deprezf4ef2d02021-04-20 13:36:24 +0200195 // For function, table, or global symbols, the index in function, table, or
196 // global index space.
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100197 uint32_t ElementIndex;
198 // For a data symbols, the address of the data relative to segment.
199 WasmDataReference DataRef;
200 };
201};
202
// Category of entity that a WasmDebugName refers to. Enumerators take the
// default values 0, 1, 2.
enum class NameType {
  FUNCTION,
  GLOBAL,
  DATA_SEGMENT,
};
208
209struct WasmDebugName {
210 NameType Type;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100211 uint32_t Index;
212 StringRef Name;
213};
214
215struct WasmLinkingData {
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100216 uint32_t Version;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100217 std::vector<WasmInitFunc> InitFunctions;
218 std::vector<StringRef> Comdats;
219 std::vector<WasmSymbolInfo> SymbolTable;
220};
221
// Section identifiers.
enum : unsigned {
  // Custom / User-defined section
  WASM_SEC_CUSTOM = 0,
  // Function signature declarations
  WASM_SEC_TYPE = 1,
  // Import declarations
  WASM_SEC_IMPORT = 2,
  // Function declarations
  WASM_SEC_FUNCTION = 3,
  // Indirect function table and other tables
  WASM_SEC_TABLE = 4,
  // Memory attributes
  WASM_SEC_MEMORY = 5,
  // Global declarations
  WASM_SEC_GLOBAL = 6,
  // Exports
  WASM_SEC_EXPORT = 7,
  // Start function declaration
  WASM_SEC_START = 8,
  // Elements section
  WASM_SEC_ELEM = 9,
  // Function bodies (code)
  WASM_SEC_CODE = 10,
  // Data segments
  WASM_SEC_DATA = 11,
  // Data segment count
  WASM_SEC_DATACOUNT = 12,
  // Event declarations
  WASM_SEC_EVENT = 13
};
238
// Encodings of type immediates; these appear in several contexts.
enum : unsigned {
  WASM_TYPE_I32 = 0x7f,
  WASM_TYPE_I64 = 0x7e,
  WASM_TYPE_F32 = 0x7d,
  WASM_TYPE_F64 = 0x7c,
  WASM_TYPE_V128 = 0x7b,
  WASM_TYPE_FUNCREF = 0x70,
  WASM_TYPE_EXTERNREF = 0x6f,
  WASM_TYPE_FUNC = 0x60,
  // Used for blocks that have no result values.
  WASM_TYPE_NORESULT = 0x40,
};
251
// External kinds, as used by imports and exports.
enum : unsigned {
  WASM_EXTERNAL_FUNCTION = 0,
  WASM_EXTERNAL_TABLE = 1,
  WASM_EXTERNAL_MEMORY = 2,
  WASM_EXTERNAL_GLOBAL = 3,
  WASM_EXTERNAL_EVENT = 4,
};
260
// Opcode values used in initializer expressions.
enum : unsigned {
  WASM_OPCODE_END = 0x0B,
  WASM_OPCODE_CALL = 0x10,
  WASM_OPCODE_LOCAL_GET = 0x20,
  WASM_OPCODE_LOCAL_SET = 0x21,
  WASM_OPCODE_GLOBAL_GET = 0x23,
  WASM_OPCODE_GLOBAL_SET = 0x24,
  WASM_OPCODE_I32_STORE = 0x36,
  WASM_OPCODE_I64_STORE = 0x37,
  WASM_OPCODE_I32_CONST = 0x41,
  WASM_OPCODE_I64_CONST = 0x42,
  WASM_OPCODE_F32_CONST = 0x43,
  WASM_OPCODE_F64_CONST = 0x44,
  WASM_OPCODE_I32_ADD = 0x6A,
  WASM_OPCODE_I64_ADD = 0x7C,
  WASM_OPCODE_REF_NULL = 0xD0,
};
279
// Opcode values used in synthetic functions.
// NOTE(review): the entries listed directly after a *_PREFIX value look like
// sub-opcodes that follow that prefix -- confirm.
enum : unsigned {
  WASM_OPCODE_IF = 0x04,
  WASM_OPCODE_ELSE = 0x05,
  WASM_OPCODE_DROP = 0x1A,

  WASM_OPCODE_MISC_PREFIX = 0xFC,
  WASM_OPCODE_MEMORY_INIT = 0x08,
  WASM_OPCODE_DATA_DROP = 0x09,

  WASM_OPCODE_ATOMICS_PREFIX = 0xFE,
  WASM_OPCODE_ATOMIC_NOTIFY = 0x00,
  WASM_OPCODE_I32_ATOMIC_WAIT = 0x01,
  WASM_OPCODE_I32_ATOMIC_STORE = 0x17,
  WASM_OPCODE_I32_RMW_CMPXCHG = 0x48,
};
294
// Flag bits for limits; each non-zero flag occupies its own bit.
enum : unsigned {
  WASM_LIMITS_FLAG_NONE = 0,
  WASM_LIMITS_FLAG_HAS_MAX = 1u << 0,
  WASM_LIMITS_FLAG_IS_SHARED = 1u << 1,
  WASM_LIMITS_FLAG_IS_64 = 1u << 2,
};
301
// Flag bits for segments; each flag occupies its own bit.
enum : unsigned {
  WASM_SEGMENT_IS_PASSIVE = 1u << 0,
  WASM_SEGMENT_HAS_MEMINDEX = 1u << 1,
};
306
// Prefix characters for feature policies, as used in the custom
// "target_features" section.
enum : uint8_t {
  WASM_FEATURE_PREFIX_USED = '+',
  WASM_FEATURE_PREFIX_REQUIRED = '=',
  WASM_FEATURE_PREFIX_DISALLOWED = '-',
};
313
// Kind codes for the custom "name" section.
enum : unsigned {
  WASM_NAMES_FUNCTION = 0x1,
  WASM_NAMES_LOCAL = 0x2,
  WASM_NAMES_GLOBAL = 0x7,
  WASM_NAMES_DATA_SEGMENT = 0x9,
};
321
// Kind codes for the custom "linking" section.
enum : unsigned {
  WASM_SEGMENT_INFO = 5,
  WASM_INIT_FUNCS = 6,
  WASM_COMDAT_INFO = 7,
  WASM_SYMBOL_TABLE = 8,
};
329
// Kind codes for WASM_COMDAT_INFO entries of the custom "linking" section.
enum : unsigned {
  WASM_COMDAT_DATA = 0,
  WASM_COMDAT_FUNCTION = 1,
  // GLOBAL, EVENT, and TABLE belong here too, but LLVM does not use them yet.
  WASM_COMDAT_SECTION = 5,
};
337
// Kind codes for WASM_SYMBOL_TABLE entries of the custom "linking" section.
enum WasmSymbolType : unsigned {
  WASM_SYMBOL_TYPE_FUNCTION = 0,
  WASM_SYMBOL_TYPE_DATA = 1,
  WASM_SYMBOL_TYPE_GLOBAL = 2,
  WASM_SYMBOL_TYPE_SECTION = 3,
  WASM_SYMBOL_TYPE_EVENT = 4,
  WASM_SYMBOL_TYPE_TABLE = 5,
};
347
// The kinds of attribute an event can have.
enum WasmEventAttribute : unsigned {
  WASM_EVENT_ATTRIBUTE_EXCEPTION = 0,
};
352
// Masks selecting the binding and visibility fields of a symbol's flags.
const unsigned WASM_SYMBOL_BINDING_MASK = 0x3;
const unsigned WASM_SYMBOL_VISIBILITY_MASK = 0xc;

// Binding values.
const unsigned WASM_SYMBOL_BINDING_GLOBAL = 0x0;
const unsigned WASM_SYMBOL_BINDING_WEAK = 0x1;
const unsigned WASM_SYMBOL_BINDING_LOCAL = 0x2;
// Visibility values.
const unsigned WASM_SYMBOL_VISIBILITY_DEFAULT = 0x0;
const unsigned WASM_SYMBOL_VISIBILITY_HIDDEN = 0x4;
// Remaining single-bit flags.
const unsigned WASM_SYMBOL_UNDEFINED = 1u << 4;
const unsigned WASM_SYMBOL_EXPORTED = 1u << 5;
const unsigned WASM_SYMBOL_EXPLICIT_NAME = 1u << 6;
const unsigned WASM_SYMBOL_NO_STRIP = 1u << 7;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100365
366#define WASM_RELOC(name, value) name = value,
367
368enum : unsigned {
369#include "WasmRelocs.def"
370};
371
372#undef WASM_RELOC
373
Andrew Scull0372a572018-11-16 15:47:06 +0000374// Subset of types that a value can have
375enum class ValType {
376 I32 = WASM_TYPE_I32,
377 I64 = WASM_TYPE_I64,
378 F32 = WASM_TYPE_F32,
379 F64 = WASM_TYPE_F64,
380 V128 = WASM_TYPE_V128,
Olivier Deprezf4ef2d02021-04-20 13:36:24 +0200381 FUNCREF = WASM_TYPE_FUNCREF,
382 EXTERNREF = WASM_TYPE_EXTERNREF,
Andrew Scull0372a572018-11-16 15:47:06 +0000383};
384
385struct WasmSignature {
Andrew Walbran16937d02019-10-22 13:54:20 +0100386 SmallVector<ValType, 1> Returns;
387 SmallVector<ValType, 4> Params;
Andrew Scull0372a572018-11-16 15:47:06 +0000388 // Support empty and tombstone instances, needed by DenseMap.
389 enum { Plain, Empty, Tombstone } State = Plain;
390
Andrew Walbran16937d02019-10-22 13:54:20 +0100391 WasmSignature(SmallVector<ValType, 1> &&InReturns,
392 SmallVector<ValType, 4> &&InParams)
Andrew Scull0372a572018-11-16 15:47:06 +0000393 : Returns(InReturns), Params(InParams) {}
394 WasmSignature() = default;
395};
396
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100397// Useful comparison operators
398inline bool operator==(const WasmSignature &LHS, const WasmSignature &RHS) {
Andrew Scull0372a572018-11-16 15:47:06 +0000399 return LHS.State == RHS.State && LHS.Returns == RHS.Returns &&
400 LHS.Params == RHS.Params;
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100401}
402
403inline bool operator!=(const WasmSignature &LHS, const WasmSignature &RHS) {
404 return !(LHS == RHS);
405}
406
407inline bool operator==(const WasmGlobalType &LHS, const WasmGlobalType &RHS) {
408 return LHS.Type == RHS.Type && LHS.Mutable == RHS.Mutable;
409}
410
411inline bool operator!=(const WasmGlobalType &LHS, const WasmGlobalType &RHS) {
412 return !(LHS == RHS);
413}
414
Andrew Walbran16937d02019-10-22 13:54:20 +0100415std::string toString(WasmSymbolType type);
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100416std::string relocTypetoString(uint32_t type);
Andrew Walbran3d2c1972020-04-07 12:24:26 +0100417bool relocTypeHasAddend(uint32_t type);
Andrew Scullcdfcccc2018-10-05 20:58:37 +0100418
Andrew Scull5e1ddfa2018-08-14 10:06:54 +0100419} // end namespace wasm
420} // end namespace llvm
421
422#endif