wasmtime_environ/module.rs
1//! Data structures for representing decoded wasm modules.
2
3use crate::prelude::*;
4use crate::*;
5use alloc::collections::BTreeMap;
6use core::ops::Range;
7use cranelift_entity::{packed_option::ReservedValue, EntityRef};
8use serde_derive::{Deserialize, Serialize};
9
10/// A WebAssembly linear memory initializer.
11#[derive(Clone, Debug, Serialize, Deserialize)]
12pub struct MemoryInitializer {
13 /// The index of a linear memory to initialize.
14 pub memory_index: MemoryIndex,
15 /// The base offset to start this segment at.
16 pub offset: ConstExpr,
17 /// The range of the data to write within the linear memory.
18 ///
19 /// This range indexes into a separately stored data section which will be
20 /// provided with the compiled module's code as well.
21 pub data: Range<u32>,
22}
23
24/// Similar to the above `MemoryInitializer` but only used when memory
25/// initializers are statically known to be valid.
26#[derive(Clone, Debug, Serialize, Deserialize)]
27pub struct StaticMemoryInitializer {
28 /// The 64-bit offset, in bytes, of where this initializer starts.
29 pub offset: u64,
30
31 /// The range of data to write at `offset`, where these indices are indexes
32 /// into the compiled wasm module's data section.
33 pub data: Range<u32>,
34}
35
36/// The type of WebAssembly linear memory initialization to use for a module.
37#[derive(Debug, Serialize, Deserialize)]
38pub enum MemoryInitialization {
39 /// Memory initialization is segmented.
40 ///
41 /// Segmented initialization can be used for any module, but it is required
42 /// if:
43 ///
44 /// * A data segment referenced an imported memory.
45 /// * A data segment uses a global base.
46 ///
47 /// Segmented initialization is performed by processing the complete set of
48 /// data segments when the module is instantiated.
49 ///
50 /// This is the default memory initialization type.
51 Segmented(Vec<MemoryInitializer>),
52
53 /// Memory initialization is statically known and involves a single `memcpy`
54 /// or otherwise simply making the defined data visible.
55 ///
56 /// To be statically initialized everything must reference a defined memory
57 /// and all data segments have a statically known in-bounds base (no
58 /// globals).
59 ///
60 /// This form of memory initialization is a more optimized version of
61 /// `Segmented` where memory can be initialized with one of a few methods:
62 ///
63 /// * First it could be initialized with a single `memcpy` of data from the
64 /// module to the linear memory.
65 /// * Otherwise techniques like `mmap` are also possible to make this data,
66 /// which might reside in a compiled module on disk, available immediately
67 /// in a linear memory's address space.
68 ///
69 /// To facilitate the latter of these techniques the `try_static_init`
70 /// function below, which creates this variant, takes a host page size
71 /// argument which can page-align everything to make mmap-ing possible.
72 Static {
73 /// The initialization contents for each linear memory.
74 ///
75 /// This array has, for each module's own linear memory, the contents
76 /// necessary to initialize it. If the memory has a `None` value then no
77 /// initialization is necessary (it's zero-filled). Otherwise with
78 /// `Some` the first element of the tuple is the offset in memory to
79 /// start the initialization and the `Range` is the range within the
80 /// final data section of the compiled module of bytes to copy into the
81 /// memory.
82 ///
83 /// The offset, range base, and range end are all guaranteed to be page
84 /// aligned to the page size passed in to `try_static_init`.
85 map: PrimaryMap<MemoryIndex, Option<StaticMemoryInitializer>>,
86 },
87}
88
89impl Default for MemoryInitialization {
90 fn default() -> Self {
91 Self::Segmented(Vec::new())
92 }
93}
94
95impl MemoryInitialization {
96 /// Returns whether this initialization is of the form
97 /// `MemoryInitialization::Segmented`.
98 pub fn is_segmented(&self) -> bool {
99 match self {
100 MemoryInitialization::Segmented(_) => true,
101 _ => false,
102 }
103 }
104
105 /// Performs the memory initialization steps for this set of initializers.
106 ///
107 /// This will perform wasm initialization in compliance with the wasm spec
108 /// and how data segments are processed. This doesn't need to necessarily
109 /// only be called as part of initialization, however, as it's structured to
110 /// allow learning about memory ahead-of-time at compile time possibly.
111 ///
112 /// This function will return true if all memory initializers are processed
113 /// successfully. If any initializer hits an error or, for example, a
114 /// global value is needed but `None` is returned, then false will be
115 /// returned. At compile-time this typically means that the "error" in
116 /// question needs to be deferred to runtime, and at runtime this means
117 /// that an invalid initializer has been found and a trap should be
118 /// generated.
119 pub fn init_memory(&self, state: &mut dyn InitMemory) -> bool {
120 let initializers = match self {
121 // Fall through below to the segmented memory one-by-one
122 // initialization.
123 MemoryInitialization::Segmented(list) => list,
124
125 // If previously switched to static initialization then pass through
126 // all those parameters here to the `write` callback.
127 //
128 // Note that existence of `Static` already guarantees that all
129 // indices are in-bounds.
130 MemoryInitialization::Static { map } => {
131 for (index, init) in map {
132 if let Some(init) = init {
133 let result = state.write(index, init);
134 if !result {
135 return result;
136 }
137 }
138 }
139 return true;
140 }
141 };
142
143 for initializer in initializers {
144 let &MemoryInitializer {
145 memory_index,
146 ref offset,
147 ref data,
148 } = initializer;
149
150 // First up determine the start/end range and verify that they're
151 // in-bounds for the initial size of the memory at `memory_index`.
152 // Note that this can bail if we don't have access to globals yet
153 // (e.g. this is a task happening before instantiation at
154 // compile-time).
155 let start = match state.eval_offset(memory_index, offset) {
156 Some(start) => start,
157 None => return false,
158 };
159 let len = u64::try_from(data.len()).unwrap();
160 let end = match start.checked_add(len) {
161 Some(end) => end,
162 None => return false,
163 };
164
165 match state.memory_size_in_bytes(memory_index) {
166 Ok(max) => {
167 if end > max {
168 return false;
169 }
170 }
171
172 // Note that computing the minimum can overflow if the page size
173 // is the default 64KiB and the memory's minimum size in pages
174 // is `1 << 48`, the maximum number of minimum pages for 64-bit
175 // memories. We don't return `false` to signal an error here and
176 // instead defer the error to runtime, when it will be
177 // impossible to allocate that much memory anyways.
178 Err(_) => {}
179 }
180
181 // The limits of the data segment have been validated at this point
182 // so the `write` callback is called with the range of data being
183 // written. Any erroneous result is propagated upwards.
184 let init = StaticMemoryInitializer {
185 offset: start,
186 data: data.clone(),
187 };
188 let result = state.write(memory_index, &init);
189 if !result {
190 return result;
191 }
192 }
193
194 return true;
195 }
196}
197
198/// The various callbacks provided here are used to drive the smaller bits of
199/// memory initialization.
200pub trait InitMemory {
201 /// Returns the size, in bytes, of the memory specified. For compile-time
202 /// purposes this would be the memory type's minimum size.
203 fn memory_size_in_bytes(&mut self, memory_index: MemoryIndex) -> Result<u64, SizeOverflow>;
204
205 /// Returns the value of the constant expression, as a `u64`. Note that
206 /// this may involve zero-extending a 32-bit global to a 64-bit number. May
207 /// return `None` to indicate that the expression involves a value which is
208 /// not available yet.
209 fn eval_offset(&mut self, memory_index: MemoryIndex, expr: &ConstExpr) -> Option<u64>;
210
211 /// A callback used to actually write data. This indicates that the
212 /// specified memory must receive the specified range of data at the
213 /// specified offset. This can return false on failure.
214 fn write(&mut self, memory_index: MemoryIndex, init: &StaticMemoryInitializer) -> bool;
215}
216
217/// Table initialization data for all tables in the module.
218#[derive(Debug, Default, Serialize, Deserialize)]
219pub struct TableInitialization {
220 /// Initial values for tables defined within the module itself.
221 ///
222 /// This contains the initial values and initializers for tables defined
223 /// within a wasm, so excluding imported tables. This initializer can
224 /// represent null-initialized tables, element-initialized tables (e.g. with
225 /// the function-references proposal), or precomputed images of table
226 /// initialization. For example table initializers to a table that are all
227 /// in-bounds will get removed from `segment` and moved into
228 /// `initial_values` here.
229 pub initial_values: PrimaryMap<DefinedTableIndex, TableInitialValue>,
230
231 /// Element segments present in the initial wasm module which are executed
232 /// at instantiation time.
233 ///
234 /// These element segments are iterated over during instantiation to apply
235 /// any segments that weren't already moved into `initial_values` above.
236 pub segments: Vec<TableSegment>,
237}
238
239/// Initial value for all elements in a table.
240#[derive(Clone, Debug, Serialize, Deserialize)]
241pub enum TableInitialValue {
242 /// Initialize each table element to null, optionally setting some elements
243 /// to non-null given the precomputed image.
244 Null {
245 /// A precomputed image of table initializers for this table.
246 ///
247 /// This image is constructed during `try_func_table_init` and
248 /// null-initialized elements are represented with
249 /// `FuncIndex::reserved_value()`. Note that this image is empty by
250 /// default and may not encompass the entire span of the table in which
251 /// case the elements are initialized to null.
252 precomputed: Vec<FuncIndex>,
253 },
254 /// An arbitrary const expression.
255 Expr(ConstExpr),
256}
257
258/// A WebAssembly table initializer segment.
259#[derive(Clone, Debug, Serialize, Deserialize)]
260pub struct TableSegment {
261 /// The index of a table to initialize.
262 pub table_index: TableIndex,
263 /// The base offset to start this segment at.
264 pub offset: ConstExpr,
265 /// The values to write into the table elements.
266 pub elements: TableSegmentElements,
267}
268
269/// Elements of a table segment, either a list of functions or list of arbitrary
270/// expressions.
271#[derive(Clone, Debug, Serialize, Deserialize)]
272pub enum TableSegmentElements {
273 /// A sequential list of functions where `FuncIndex::reserved_value()`
274 /// indicates a null function.
275 Functions(Box<[FuncIndex]>),
276 /// Arbitrary expressions, aka either functions, null or a load of a global.
277 Expressions(Box<[ConstExpr]>),
278}
279
280impl TableSegmentElements {
281 /// Returns the number of elements in this segment.
282 pub fn len(&self) -> u64 {
283 match self {
284 Self::Functions(s) => u64::try_from(s.len()).unwrap(),
285 Self::Expressions(s) => u64::try_from(s.len()).unwrap(),
286 }
287 }
288}
289
290/// A translated WebAssembly module, excluding the function bodies and
291/// memory initializers.
292#[derive(Default, Debug, Serialize, Deserialize)]
293pub struct Module {
294 /// The name of this wasm module, often found in the wasm file.
295 pub name: Option<String>,
296
297 /// All import records, in the order they are declared in the module.
298 pub initializers: Vec<Initializer>,
299
300 /// Exported entities.
301 pub exports: IndexMap<String, EntityIndex>,
302
303 /// The module "start" function, if present.
304 pub start_func: Option<FuncIndex>,
305
306 /// WebAssembly table initialization data, per table.
307 pub table_initialization: TableInitialization,
308
309 /// WebAssembly linear memory initializer.
310 pub memory_initialization: MemoryInitialization,
311
312 /// WebAssembly passive elements.
313 pub passive_elements: Vec<TableSegmentElements>,
314
315 /// The map from passive element index (element segment index space) to index in `passive_elements`.
316 pub passive_elements_map: BTreeMap<ElemIndex, usize>,
317
318 /// The map from passive data index (data segment index space) to index in `passive_data`.
319 pub passive_data_map: BTreeMap<DataIndex, Range<u32>>,
320
321 /// Types declared in the wasm module.
322 pub types: PrimaryMap<TypeIndex, ModuleInternedTypeIndex>,
323
324 /// Number of imported or aliased functions in the module.
325 pub num_imported_funcs: usize,
326
327 /// Number of imported or aliased tables in the module.
328 pub num_imported_tables: usize,
329
330 /// Number of imported or aliased memories in the module.
331 pub num_imported_memories: usize,
332
333 /// Number of imported or aliased globals in the module.
334 pub num_imported_globals: usize,
335
336 /// Number of functions that "escape" from this module may need to have a
337 /// `VMFuncRef` constructed for them.
338 ///
339 /// This is also the number of functions in the `functions` array below with
340 /// an `func_ref` index (and is the maximum func_ref index).
341 pub num_escaped_funcs: usize,
342
343 /// Number of call-indirect caches.
344 pub num_call_indirect_caches: usize,
345
346 /// Types of functions, imported and local.
347 pub functions: PrimaryMap<FuncIndex, FunctionType>,
348
349 /// WebAssembly tables.
350 pub tables: PrimaryMap<TableIndex, Table>,
351
352 /// WebAssembly linear memory plans.
353 pub memories: PrimaryMap<MemoryIndex, Memory>,
354
355 /// WebAssembly global variables.
356 pub globals: PrimaryMap<GlobalIndex, Global>,
357
358 /// WebAssembly global initializers for locally-defined globals.
359 pub global_initializers: PrimaryMap<DefinedGlobalIndex, ConstExpr>,
360}
361
362/// Initialization routines for creating an instance, encompassing imports,
363/// modules, instances, aliases, etc.
364#[derive(Debug, Serialize, Deserialize)]
365pub enum Initializer {
366 /// An imported item is required to be provided.
367 Import {
368 /// Name of this import
369 name: String,
370 /// The field name projection of this import
371 field: String,
372 /// Where this import will be placed, which also has type information
373 /// about the import.
374 index: EntityIndex,
375 },
376}
377
378impl Module {
379 /// Allocates the module data structures.
380 pub fn new() -> Self {
381 Module::default()
382 }
383
384 /// Convert a `DefinedFuncIndex` into a `FuncIndex`.
385 #[inline]
386 pub fn func_index(&self, defined_func: DefinedFuncIndex) -> FuncIndex {
387 FuncIndex::new(self.num_imported_funcs + defined_func.index())
388 }
389
390 /// Convert a `FuncIndex` into a `DefinedFuncIndex`. Returns None if the
391 /// index is an imported function.
392 #[inline]
393 pub fn defined_func_index(&self, func: FuncIndex) -> Option<DefinedFuncIndex> {
394 if func.index() < self.num_imported_funcs {
395 None
396 } else {
397 Some(DefinedFuncIndex::new(
398 func.index() - self.num_imported_funcs,
399 ))
400 }
401 }
402
403 /// Test whether the given function index is for an imported function.
404 #[inline]
405 pub fn is_imported_function(&self, index: FuncIndex) -> bool {
406 index.index() < self.num_imported_funcs
407 }
408
409 /// Convert a `DefinedTableIndex` into a `TableIndex`.
410 #[inline]
411 pub fn table_index(&self, defined_table: DefinedTableIndex) -> TableIndex {
412 TableIndex::new(self.num_imported_tables + defined_table.index())
413 }
414
415 /// Convert a `TableIndex` into a `DefinedTableIndex`. Returns None if the
416 /// index is an imported table.
417 #[inline]
418 pub fn defined_table_index(&self, table: TableIndex) -> Option<DefinedTableIndex> {
419 if table.index() < self.num_imported_tables {
420 None
421 } else {
422 Some(DefinedTableIndex::new(
423 table.index() - self.num_imported_tables,
424 ))
425 }
426 }
427
428 /// Test whether the given table index is for an imported table.
429 #[inline]
430 pub fn is_imported_table(&self, index: TableIndex) -> bool {
431 index.index() < self.num_imported_tables
432 }
433
434 /// Convert a `DefinedMemoryIndex` into a `MemoryIndex`.
435 #[inline]
436 pub fn memory_index(&self, defined_memory: DefinedMemoryIndex) -> MemoryIndex {
437 MemoryIndex::new(self.num_imported_memories + defined_memory.index())
438 }
439
440 /// Convert a `MemoryIndex` into a `DefinedMemoryIndex`. Returns None if the
441 /// index is an imported memory.
442 #[inline]
443 pub fn defined_memory_index(&self, memory: MemoryIndex) -> Option<DefinedMemoryIndex> {
444 if memory.index() < self.num_imported_memories {
445 None
446 } else {
447 Some(DefinedMemoryIndex::new(
448 memory.index() - self.num_imported_memories,
449 ))
450 }
451 }
452
453 /// Convert a `DefinedMemoryIndex` into an `OwnedMemoryIndex`. Returns None
454 /// if the index is an imported memory.
455 #[inline]
456 pub fn owned_memory_index(&self, memory: DefinedMemoryIndex) -> OwnedMemoryIndex {
457 assert!(
458 memory.index() < self.memories.len(),
459 "non-shared memory must have an owned index"
460 );
461
462 // Once we know that the memory index is not greater than the number of
463 // plans, we can iterate through the plans up to the memory index and
464 // count how many are not shared (i.e., owned).
465 let owned_memory_index = self
466 .memories
467 .iter()
468 .skip(self.num_imported_memories)
469 .take(memory.index())
470 .filter(|(_, mp)| !mp.shared)
471 .count();
472 OwnedMemoryIndex::new(owned_memory_index)
473 }
474
475 /// Test whether the given memory index is for an imported memory.
476 #[inline]
477 pub fn is_imported_memory(&self, index: MemoryIndex) -> bool {
478 index.index() < self.num_imported_memories
479 }
480
481 /// Convert a `DefinedGlobalIndex` into a `GlobalIndex`.
482 #[inline]
483 pub fn global_index(&self, defined_global: DefinedGlobalIndex) -> GlobalIndex {
484 GlobalIndex::new(self.num_imported_globals + defined_global.index())
485 }
486
487 /// Convert a `GlobalIndex` into a `DefinedGlobalIndex`. Returns None if the
488 /// index is an imported global.
489 #[inline]
490 pub fn defined_global_index(&self, global: GlobalIndex) -> Option<DefinedGlobalIndex> {
491 if global.index() < self.num_imported_globals {
492 None
493 } else {
494 Some(DefinedGlobalIndex::new(
495 global.index() - self.num_imported_globals,
496 ))
497 }
498 }
499
500 /// Test whether the given global index is for an imported global.
501 #[inline]
502 pub fn is_imported_global(&self, index: GlobalIndex) -> bool {
503 index.index() < self.num_imported_globals
504 }
505
506 /// Returns an iterator of all the imports in this module, along with their
507 /// module name, field name, and type that's being imported.
508 pub fn imports(&self) -> impl ExactSizeIterator<Item = (&str, &str, EntityType)> {
509 self.initializers.iter().map(move |i| match i {
510 Initializer::Import { name, field, index } => {
511 (name.as_str(), field.as_str(), self.type_of(*index))
512 }
513 })
514 }
515
516 /// Returns the type of an item based on its index
517 pub fn type_of(&self, index: EntityIndex) -> EntityType {
518 match index {
519 EntityIndex::Global(i) => EntityType::Global(self.globals[i]),
520 EntityIndex::Table(i) => EntityType::Table(self.tables[i]),
521 EntityIndex::Memory(i) => EntityType::Memory(self.memories[i]),
522 EntityIndex::Function(i) => {
523 EntityType::Function(EngineOrModuleTypeIndex::Module(self.functions[i].signature))
524 }
525 }
526 }
527
528 /// Appends a new function to this module with the given type information,
529 /// used for functions that either don't escape or aren't certain whether
530 /// they escape yet.
531 pub fn push_function(&mut self, signature: ModuleInternedTypeIndex) -> FuncIndex {
532 self.functions.push(FunctionType {
533 signature,
534 func_ref: FuncRefIndex::reserved_value(),
535 })
536 }
537
538 /// Returns an iterator over all of the defined function indices in this
539 /// module.
540 pub fn defined_func_indices(&self) -> impl Iterator<Item = DefinedFuncIndex> + use<> {
541 (0..self.functions.len() - self.num_imported_funcs).map(|i| DefinedFuncIndex::new(i))
542 }
543
544 /// Returns the number of tables defined by this module itself: all tables
545 /// minus imported tables.
546 pub fn num_defined_tables(&self) -> usize {
547 self.tables.len() - self.num_imported_tables
548 }
549
550 /// Returns the number of memories defined by this module itself: all
551 /// memories minus imported memories.
552 pub fn num_defined_memories(&self) -> usize {
553 self.memories.len() - self.num_imported_memories
554 }
555}
556
557/// Type information about functions in a wasm module.
558#[derive(Debug, Serialize, Deserialize)]
559pub struct FunctionType {
560 /// The type of this function, indexed into the module-wide type tables for
561 /// a module compilation.
562 pub signature: ModuleInternedTypeIndex,
563 /// The index into the funcref table, if present. Note that this is
564 /// `reserved_value()` if the function does not escape from a module.
565 pub func_ref: FuncRefIndex,
566}
567
568impl FunctionType {
569 /// Returns whether this function's type is one that "escapes" the current
570 /// module, meaning that the function is exported, used in `ref.func`, used
571 /// in a table, etc.
572 pub fn is_escaping(&self) -> bool {
573 !self.func_ref.is_reserved_value()
574 }
575}
576
577/// Index into the funcref table within a VMContext for a function.
578#[derive(Copy, Clone, PartialEq, Eq, Hash, PartialOrd, Ord, Debug, Serialize, Deserialize)]
579pub struct FuncRefIndex(u32);
580cranelift_entity::entity_impl!(FuncRefIndex);