wasmtime_environ/
module.rs

1//! Data structures for representing decoded wasm modules.
2
3use crate::prelude::*;
4use crate::*;
5use alloc::collections::BTreeMap;
6use core::ops::Range;
7use cranelift_entity::{packed_option::ReservedValue, EntityRef};
8use serde_derive::{Deserialize, Serialize};
9
10/// A WebAssembly linear memory initializer.
11#[derive(Clone, Debug, Serialize, Deserialize)]
12pub struct MemoryInitializer {
13    /// The index of a linear memory to initialize.
14    pub memory_index: MemoryIndex,
15    /// The base offset to start this segment at.
16    pub offset: ConstExpr,
17    /// The range of the data to write within the linear memory.
18    ///
19    /// This range indexes into a separately stored data section which will be
20    /// provided with the compiled module's code as well.
21    pub data: Range<u32>,
22}
23
24/// Similar to the above `MemoryInitializer` but only used when memory
25/// initializers are statically known to be valid.
26#[derive(Clone, Debug, Serialize, Deserialize)]
27pub struct StaticMemoryInitializer {
28    /// The 64-bit offset, in bytes, of where this initializer starts.
29    pub offset: u64,
30
31    /// The range of data to write at `offset`, where these indices are indexes
32    /// into the compiled wasm module's data section.
33    pub data: Range<u32>,
34}
35
36/// The type of WebAssembly linear memory initialization to use for a module.
37#[derive(Debug, Serialize, Deserialize)]
38pub enum MemoryInitialization {
39    /// Memory initialization is segmented.
40    ///
41    /// Segmented initialization can be used for any module, but it is required
42    /// if:
43    ///
44    /// * A data segment referenced an imported memory.
45    /// * A data segment uses a global base.
46    ///
47    /// Segmented initialization is performed by processing the complete set of
48    /// data segments when the module is instantiated.
49    ///
50    /// This is the default memory initialization type.
51    Segmented(Vec<MemoryInitializer>),
52
53    /// Memory initialization is statically known and involves a single `memcpy`
54    /// or otherwise simply making the defined data visible.
55    ///
56    /// To be statically initialized everything must reference a defined memory
57    /// and all data segments have a statically known in-bounds base (no
58    /// globals).
59    ///
60    /// This form of memory initialization is a more optimized version of
61    /// `Segmented` where memory can be initialized with one of a few methods:
62    ///
63    /// * First it could be initialized with a single `memcpy` of data from the
64    ///   module to the linear memory.
65    /// * Otherwise techniques like `mmap` are also possible to make this data,
66    ///   which might reside in a compiled module on disk, available immediately
67    ///   in a linear memory's address space.
68    ///
69    /// To facilitate the latter of these techniques the `try_static_init`
70    /// function below, which creates this variant, takes a host page size
71    /// argument which can page-align everything to make mmap-ing possible.
72    Static {
73        /// The initialization contents for each linear memory.
74        ///
75        /// This array has, for each module's own linear memory, the contents
76        /// necessary to initialize it. If the memory has a `None` value then no
77        /// initialization is necessary (it's zero-filled). Otherwise with
78        /// `Some` the first element of the tuple is the offset in memory to
79        /// start the initialization and the `Range` is the range within the
80        /// final data section of the compiled module of bytes to copy into the
81        /// memory.
82        ///
83        /// The offset, range base, and range end are all guaranteed to be page
84        /// aligned to the page size passed in to `try_static_init`.
85        map: PrimaryMap<MemoryIndex, Option<StaticMemoryInitializer>>,
86    },
87}
88
89impl Default for MemoryInitialization {
90    fn default() -> Self {
91        Self::Segmented(Vec::new())
92    }
93}
94
95impl MemoryInitialization {
96    /// Returns whether this initialization is of the form
97    /// `MemoryInitialization::Segmented`.
98    pub fn is_segmented(&self) -> bool {
99        match self {
100            MemoryInitialization::Segmented(_) => true,
101            _ => false,
102        }
103    }
104
105    /// Performs the memory initialization steps for this set of initializers.
106    ///
107    /// This will perform wasm initialization in compliance with the wasm spec
108    /// and how data segments are processed. This doesn't need to necessarily
109    /// only be called as part of initialization, however, as it's structured to
110    /// allow learning about memory ahead-of-time at compile time possibly.
111    ///
112    /// This function will return true if all memory initializers are processed
113    /// successfully. If any initializer hits an error or, for example, a
114    /// global value is needed but `None` is returned, then false will be
115    /// returned. At compile-time this typically means that the "error" in
116    /// question needs to be deferred to runtime, and at runtime this means
117    /// that an invalid initializer has been found and a trap should be
118    /// generated.
119    pub fn init_memory(&self, state: &mut dyn InitMemory) -> bool {
120        let initializers = match self {
121            // Fall through below to the segmented memory one-by-one
122            // initialization.
123            MemoryInitialization::Segmented(list) => list,
124
125            // If previously switched to static initialization then pass through
126            // all those parameters here to the `write` callback.
127            //
128            // Note that existence of `Static` already guarantees that all
129            // indices are in-bounds.
130            MemoryInitialization::Static { map } => {
131                for (index, init) in map {
132                    if let Some(init) = init {
133                        let result = state.write(index, init);
134                        if !result {
135                            return result;
136                        }
137                    }
138                }
139                return true;
140            }
141        };
142
143        for initializer in initializers {
144            let &MemoryInitializer {
145                memory_index,
146                ref offset,
147                ref data,
148            } = initializer;
149
150            // First up determine the start/end range and verify that they're
151            // in-bounds for the initial size of the memory at `memory_index`.
152            // Note that this can bail if we don't have access to globals yet
153            // (e.g. this is a task happening before instantiation at
154            // compile-time).
155            let start = match state.eval_offset(memory_index, offset) {
156                Some(start) => start,
157                None => return false,
158            };
159            let len = u64::try_from(data.len()).unwrap();
160            let end = match start.checked_add(len) {
161                Some(end) => end,
162                None => return false,
163            };
164
165            match state.memory_size_in_bytes(memory_index) {
166                Ok(max) => {
167                    if end > max {
168                        return false;
169                    }
170                }
171
172                // Note that computing the minimum can overflow if the page size
173                // is the default 64KiB and the memory's minimum size in pages
174                // is `1 << 48`, the maximum number of minimum pages for 64-bit
175                // memories. We don't return `false` to signal an error here and
176                // instead defer the error to runtime, when it will be
177                // impossible to allocate that much memory anyways.
178                Err(_) => {}
179            }
180
181            // The limits of the data segment have been validated at this point
182            // so the `write` callback is called with the range of data being
183            // written. Any erroneous result is propagated upwards.
184            let init = StaticMemoryInitializer {
185                offset: start,
186                data: data.clone(),
187            };
188            let result = state.write(memory_index, &init);
189            if !result {
190                return result;
191            }
192        }
193
194        return true;
195    }
196}
197
198/// The various callbacks provided here are used to drive the smaller bits of
199/// memory initialization.
200pub trait InitMemory {
201    /// Returns the size, in bytes, of the memory specified. For compile-time
202    /// purposes this would be the memory type's minimum size.
203    fn memory_size_in_bytes(&mut self, memory_index: MemoryIndex) -> Result<u64, SizeOverflow>;
204
205    /// Returns the value of the constant expression, as a `u64`. Note that
206    /// this may involve zero-extending a 32-bit global to a 64-bit number. May
207    /// return `None` to indicate that the expression involves a value which is
208    /// not available yet.
209    fn eval_offset(&mut self, memory_index: MemoryIndex, expr: &ConstExpr) -> Option<u64>;
210
211    /// A callback used to actually write data. This indicates that the
212    /// specified memory must receive the specified range of data at the
213    /// specified offset. This can return false on failure.
214    fn write(&mut self, memory_index: MemoryIndex, init: &StaticMemoryInitializer) -> bool;
215}
216
217/// Table initialization data for all tables in the module.
218#[derive(Debug, Default, Serialize, Deserialize)]
219pub struct TableInitialization {
220    /// Initial values for tables defined within the module itself.
221    ///
222    /// This contains the initial values and initializers for tables defined
223    /// within a wasm, so excluding imported tables. This initializer can
224    /// represent null-initialized tables, element-initialized tables (e.g. with
225    /// the function-references proposal), or precomputed images of table
226    /// initialization. For example table initializers to a table that are all
227    /// in-bounds will get removed from `segment` and moved into
228    /// `initial_values` here.
229    pub initial_values: PrimaryMap<DefinedTableIndex, TableInitialValue>,
230
231    /// Element segments present in the initial wasm module which are executed
232    /// at instantiation time.
233    ///
234    /// These element segments are iterated over during instantiation to apply
235    /// any segments that weren't already moved into `initial_values` above.
236    pub segments: Vec<TableSegment>,
237}
238
239/// Initial value for all elements in a table.
240#[derive(Clone, Debug, Serialize, Deserialize)]
241pub enum TableInitialValue {
242    /// Initialize each table element to null, optionally setting some elements
243    /// to non-null given the precomputed image.
244    Null {
245        /// A precomputed image of table initializers for this table.
246        ///
247        /// This image is constructed during `try_func_table_init` and
248        /// null-initialized elements are represented with
249        /// `FuncIndex::reserved_value()`. Note that this image is empty by
250        /// default and may not encompass the entire span of the table in which
251        /// case the elements are initialized to null.
252        precomputed: Vec<FuncIndex>,
253    },
254    /// An arbitrary const expression.
255    Expr(ConstExpr),
256}
257
258/// A WebAssembly table initializer segment.
259#[derive(Clone, Debug, Serialize, Deserialize)]
260pub struct TableSegment {
261    /// The index of a table to initialize.
262    pub table_index: TableIndex,
263    /// The base offset to start this segment at.
264    pub offset: ConstExpr,
265    /// The values to write into the table elements.
266    pub elements: TableSegmentElements,
267}
268
269/// Elements of a table segment, either a list of functions or list of arbitrary
270/// expressions.
271#[derive(Clone, Debug, Serialize, Deserialize)]
272pub enum TableSegmentElements {
273    /// A sequential list of functions where `FuncIndex::reserved_value()`
274    /// indicates a null function.
275    Functions(Box<[FuncIndex]>),
276    /// Arbitrary expressions, aka either functions, null or a load of a global.
277    Expressions(Box<[ConstExpr]>),
278}
279
280impl TableSegmentElements {
281    /// Returns the number of elements in this segment.
282    pub fn len(&self) -> u64 {
283        match self {
284            Self::Functions(s) => u64::try_from(s.len()).unwrap(),
285            Self::Expressions(s) => u64::try_from(s.len()).unwrap(),
286        }
287    }
288}
289
290/// A translated WebAssembly module, excluding the function bodies and
291/// memory initializers.
292#[derive(Default, Debug, Serialize, Deserialize)]
293pub struct Module {
294    /// The name of this wasm module, often found in the wasm file.
295    pub name: Option<String>,
296
297    /// All import records, in the order they are declared in the module.
298    pub initializers: Vec<Initializer>,
299
300    /// Exported entities.
301    pub exports: IndexMap<String, EntityIndex>,
302
303    /// The module "start" function, if present.
304    pub start_func: Option<FuncIndex>,
305
306    /// WebAssembly table initialization data, per table.
307    pub table_initialization: TableInitialization,
308
309    /// WebAssembly linear memory initializer.
310    pub memory_initialization: MemoryInitialization,
311
312    /// WebAssembly passive elements.
313    pub passive_elements: Vec<TableSegmentElements>,
314
315    /// The map from passive element index (element segment index space) to index in `passive_elements`.
316    pub passive_elements_map: BTreeMap<ElemIndex, usize>,
317
318    /// The map from passive data index (data segment index space) to index in `passive_data`.
319    pub passive_data_map: BTreeMap<DataIndex, Range<u32>>,
320
321    /// Types declared in the wasm module.
322    pub types: PrimaryMap<TypeIndex, ModuleInternedTypeIndex>,
323
324    /// Number of imported or aliased functions in the module.
325    pub num_imported_funcs: usize,
326
327    /// Number of imported or aliased tables in the module.
328    pub num_imported_tables: usize,
329
330    /// Number of imported or aliased memories in the module.
331    pub num_imported_memories: usize,
332
333    /// Number of imported or aliased globals in the module.
334    pub num_imported_globals: usize,
335
336    /// Number of functions that "escape" from this module may need to have a
337    /// `VMFuncRef` constructed for them.
338    ///
339    /// This is also the number of functions in the `functions` array below with
340    /// an `func_ref` index (and is the maximum func_ref index).
341    pub num_escaped_funcs: usize,
342
343    /// Number of call-indirect caches.
344    pub num_call_indirect_caches: usize,
345
346    /// Types of functions, imported and local.
347    pub functions: PrimaryMap<FuncIndex, FunctionType>,
348
349    /// WebAssembly tables.
350    pub tables: PrimaryMap<TableIndex, Table>,
351
352    /// WebAssembly linear memory plans.
353    pub memories: PrimaryMap<MemoryIndex, Memory>,
354
355    /// WebAssembly global variables.
356    pub globals: PrimaryMap<GlobalIndex, Global>,
357
358    /// WebAssembly global initializers for locally-defined globals.
359    pub global_initializers: PrimaryMap<DefinedGlobalIndex, ConstExpr>,
360}
361
362/// Initialization routines for creating an instance, encompassing imports,
363/// modules, instances, aliases, etc.
364#[derive(Debug, Serialize, Deserialize)]
365pub enum Initializer {
366    /// An imported item is required to be provided.
367    Import {
368        /// Name of this import
369        name: String,
370        /// The field name projection of this import
371        field: String,
372        /// Where this import will be placed, which also has type information
373        /// about the import.
374        index: EntityIndex,
375    },
376}
377
378impl Module {
379    /// Allocates the module data structures.
380    pub fn new() -> Self {
381        Module::default()
382    }
383
384    /// Convert a `DefinedFuncIndex` into a `FuncIndex`.
385    #[inline]
386    pub fn func_index(&self, defined_func: DefinedFuncIndex) -> FuncIndex {
387        FuncIndex::new(self.num_imported_funcs + defined_func.index())
388    }
389
390    /// Convert a `FuncIndex` into a `DefinedFuncIndex`. Returns None if the
391    /// index is an imported function.
392    #[inline]
393    pub fn defined_func_index(&self, func: FuncIndex) -> Option<DefinedFuncIndex> {
394        if func.index() < self.num_imported_funcs {
395            None
396        } else {
397            Some(DefinedFuncIndex::new(
398                func.index() - self.num_imported_funcs,
399            ))
400        }
401    }
402
403    /// Test whether the given function index is for an imported function.
404    #[inline]
405    pub fn is_imported_function(&self, index: FuncIndex) -> bool {
406        index.index() < self.num_imported_funcs
407    }
408
409    /// Convert a `DefinedTableIndex` into a `TableIndex`.
410    #[inline]
411    pub fn table_index(&self, defined_table: DefinedTableIndex) -> TableIndex {
412        TableIndex::new(self.num_imported_tables + defined_table.index())
413    }
414
415    /// Convert a `TableIndex` into a `DefinedTableIndex`. Returns None if the
416    /// index is an imported table.
417    #[inline]
418    pub fn defined_table_index(&self, table: TableIndex) -> Option<DefinedTableIndex> {
419        if table.index() < self.num_imported_tables {
420            None
421        } else {
422            Some(DefinedTableIndex::new(
423                table.index() - self.num_imported_tables,
424            ))
425        }
426    }
427
428    /// Test whether the given table index is for an imported table.
429    #[inline]
430    pub fn is_imported_table(&self, index: TableIndex) -> bool {
431        index.index() < self.num_imported_tables
432    }
433
434    /// Convert a `DefinedMemoryIndex` into a `MemoryIndex`.
435    #[inline]
436    pub fn memory_index(&self, defined_memory: DefinedMemoryIndex) -> MemoryIndex {
437        MemoryIndex::new(self.num_imported_memories + defined_memory.index())
438    }
439
440    /// Convert a `MemoryIndex` into a `DefinedMemoryIndex`. Returns None if the
441    /// index is an imported memory.
442    #[inline]
443    pub fn defined_memory_index(&self, memory: MemoryIndex) -> Option<DefinedMemoryIndex> {
444        if memory.index() < self.num_imported_memories {
445            None
446        } else {
447            Some(DefinedMemoryIndex::new(
448                memory.index() - self.num_imported_memories,
449            ))
450        }
451    }
452
453    /// Convert a `DefinedMemoryIndex` into an `OwnedMemoryIndex`. Returns None
454    /// if the index is an imported memory.
455    #[inline]
456    pub fn owned_memory_index(&self, memory: DefinedMemoryIndex) -> OwnedMemoryIndex {
457        assert!(
458            memory.index() < self.memories.len(),
459            "non-shared memory must have an owned index"
460        );
461
462        // Once we know that the memory index is not greater than the number of
463        // plans, we can iterate through the plans up to the memory index and
464        // count how many are not shared (i.e., owned).
465        let owned_memory_index = self
466            .memories
467            .iter()
468            .skip(self.num_imported_memories)
469            .take(memory.index())
470            .filter(|(_, mp)| !mp.shared)
471            .count();
472        OwnedMemoryIndex::new(owned_memory_index)
473    }
474
475    /// Test whether the given memory index is for an imported memory.
476    #[inline]
477    pub fn is_imported_memory(&self, index: MemoryIndex) -> bool {
478        index.index() < self.num_imported_memories
479    }
480
481    /// Convert a `DefinedGlobalIndex` into a `GlobalIndex`.
482    #[inline]
483    pub fn global_index(&self, defined_global: DefinedGlobalIndex) -> GlobalIndex {
484        GlobalIndex::new(self.num_imported_globals + defined_global.index())
485    }
486
487    /// Convert a `GlobalIndex` into a `DefinedGlobalIndex`. Returns None if the
488    /// index is an imported global.
489    #[inline]
490    pub fn defined_global_index(&self, global: GlobalIndex) -> Option<DefinedGlobalIndex> {
491        if global.index() < self.num_imported_globals {
492            None
493        } else {
494            Some(DefinedGlobalIndex::new(
495                global.index() - self.num_imported_globals,
496            ))
497        }
498    }
499
500    /// Test whether the given global index is for an imported global.
501    #[inline]
502    pub fn is_imported_global(&self, index: GlobalIndex) -> bool {
503        index.index() < self.num_imported_globals
504    }
505
506    /// Returns an iterator of all the imports in this module, along with their
507    /// module name, field name, and type that's being imported.
508    pub fn imports(&self) -> impl ExactSizeIterator<Item = (&str, &str, EntityType)> {
509        self.initializers.iter().map(move |i| match i {
510            Initializer::Import { name, field, index } => {
511                (name.as_str(), field.as_str(), self.type_of(*index))
512            }
513        })
514    }
515
516    /// Returns the type of an item based on its index
517    pub fn type_of(&self, index: EntityIndex) -> EntityType {
518        match index {
519            EntityIndex::Global(i) => EntityType::Global(self.globals[i]),
520            EntityIndex::Table(i) => EntityType::Table(self.tables[i]),
521            EntityIndex::Memory(i) => EntityType::Memory(self.memories[i]),
522            EntityIndex::Function(i) => {
523                EntityType::Function(EngineOrModuleTypeIndex::Module(self.functions[i].signature))
524            }
525        }
526    }
527
528    /// Appends a new function to this module with the given type information,
529    /// used for functions that either don't escape or aren't certain whether
530    /// they escape yet.
531    pub fn push_function(&mut self, signature: ModuleInternedTypeIndex) -> FuncIndex {
532        self.functions.push(FunctionType {
533            signature,
534            func_ref: FuncRefIndex::reserved_value(),
535        })
536    }
537
538    /// Returns an iterator over all of the defined function indices in this
539    /// module.
540    pub fn defined_func_indices(&self) -> impl Iterator<Item = DefinedFuncIndex> + use<> {
541        (0..self.functions.len() - self.num_imported_funcs).map(|i| DefinedFuncIndex::new(i))
542    }
543
544    /// Returns the number of tables defined by this module itself: all tables
545    /// minus imported tables.
546    pub fn num_defined_tables(&self) -> usize {
547        self.tables.len() - self.num_imported_tables
548    }
549
550    /// Returns the number of memories defined by this module itself: all
551    /// memories minus imported memories.
552    pub fn num_defined_memories(&self) -> usize {
553        self.memories.len() - self.num_imported_memories
554    }
555}
556
557/// Type information about functions in a wasm module.
558#[derive(Debug, Serialize, Deserialize)]
559pub struct FunctionType {
560    /// The type of this function, indexed into the module-wide type tables for
561    /// a module compilation.
562    pub signature: ModuleInternedTypeIndex,
563    /// The index into the funcref table, if present. Note that this is
564    /// `reserved_value()` if the function does not escape from a module.
565    pub func_ref: FuncRefIndex,
566}
567
568impl FunctionType {
569    /// Returns whether this function's type is one that "escapes" the current
570    /// module, meaning that the function is exported, used in `ref.func`, used
571    /// in a table, etc.
572    pub fn is_escaping(&self) -> bool {
573        !self.func_ref.is_reserved_value()
574    }
575}
576
577/// Index into the funcref table within a VMContext for a function.
578#[derive(Copy, Clone, PartialEq, Eq, Hash, PartialOrd, Ord, Debug, Serialize, Deserialize)]
579pub struct FuncRefIndex(u32);
580cranelift_entity::entity_impl!(FuncRefIndex);