1 use crate::prelude::*; 2 #[cfg(feature = "std")] 3 use crate::runtime::vm::open_file_for_mmap; 4 use crate::runtime::vm::{CompiledModuleId, MmapVec, ModuleMemoryImages, VMWasmCallFunction}; 5 use crate::sync::OnceLock; 6 use crate::{ 7 code::CodeObject, 8 code_memory::CodeMemory, 9 instantiate::CompiledModule, 10 resources::ResourcesRequired, 11 type_registry::TypeCollection, 12 types::{ExportType, ExternType, ImportType}, 13 Engine, 14 }; 15 use alloc::sync::Arc; 16 use core::fmt; 17 use core::ops::Range; 18 use core::ptr::NonNull; 19 #[cfg(feature = "std")] 20 use std::{fs::File, path::Path}; 21 use wasmparser::{Parser, ValidPayload, Validator}; 22 use wasmtime_environ::{ 23 CompiledModuleInfo, EntityIndex, HostPtr, ModuleTypes, ObjectKind, TypeTrace, VMOffsets, 24 VMSharedTypeIndex, 25 }; 26 mod registry; 27 28 pub use registry::*; 29 30 /// A compiled WebAssembly module, ready to be instantiated. 31 /// 32 /// A `Module` is a compiled in-memory representation of an input WebAssembly 33 /// binary. A `Module` is then used to create an [`Instance`](crate::Instance) 34 /// through an instantiation process. You cannot call functions or fetch 35 /// globals, for example, on a `Module` because it's purely a code 36 /// representation. Instead you'll need to create an 37 /// [`Instance`](crate::Instance) to interact with the wasm module. 38 /// 39 /// A `Module` can be created by compiling WebAssembly code through APIs such as 40 /// [`Module::new`]. This would be a JIT-style use case where code is compiled 41 /// just before it's used. Alternatively a `Module` can be compiled in one 42 /// process and [`Module::serialize`] can be used to save it to storage. A later 43 /// call to [`Module::deserialize`] will quickly load the module to execute and 44 /// does not need to compile any code, representing a more AOT-style use case. 45 /// 46 /// Currently a `Module` does not implement any form of tiering or dynamic 47 /// optimization of compiled code. Creation of a `Module` via [`Module::new`] or 48 /// related APIs will perform the entire compilation step synchronously. When 49 /// finished no further compilation will happen at runtime or later during 50 /// execution of WebAssembly instances for example. 51 /// 52 /// Compilation of WebAssembly by default goes through Cranelift and is 53 /// recommended to be done once-per-module. The same WebAssembly binary need not 54 /// be compiled multiple times and can instead used an embedder-cached result of 55 /// the first call. 56 /// 57 /// `Module` is thread-safe and safe to share across threads. 58 /// 59 /// ## Modules and `Clone` 60 /// 61 /// Using `clone` on a `Module` is a cheap operation. It will not create an 62 /// entirely new module, but rather just a new reference to the existing module. 63 /// In other words it's a shallow copy, not a deep copy. 64 /// 65 /// ## Examples 66 /// 67 /// There are a number of ways you can create a `Module`, for example pulling 68 /// the bytes from a number of locations. One example is loading a module from 69 /// the filesystem: 70 /// 71 /// ```no_run 72 /// # use wasmtime::*; 73 /// # fn main() -> anyhow::Result<()> { 74 /// let engine = Engine::default(); 75 /// let module = Module::from_file(&engine, "path/to/foo.wasm")?; 76 /// # Ok(()) 77 /// # } 78 /// ``` 79 /// 80 /// You can also load the wasm text format if more convenient too: 81 /// 82 /// ```no_run 83 /// # use wasmtime::*; 84 /// # fn main() -> anyhow::Result<()> { 85 /// let engine = Engine::default(); 86 /// // Now we're using the WebAssembly text extension: `.wat`! 87 /// let module = Module::from_file(&engine, "path/to/foo.wat")?; 88 /// # Ok(()) 89 /// # } 90 /// ``` 91 /// 92 /// And if you've already got the bytes in-memory you can use the 93 /// [`Module::new`] constructor: 94 /// 95 /// ```no_run 96 /// # use wasmtime::*; 97 /// # fn main() -> anyhow::Result<()> { 98 /// let engine = Engine::default(); 99 /// # let wasm_bytes: Vec<u8> = Vec::new(); 100 /// let module = Module::new(&engine, &wasm_bytes)?; 101 /// 102 /// // It also works with the text format! 103 /// let module = Module::new(&engine, "(module (func))")?; 104 /// # Ok(()) 105 /// # } 106 /// ``` 107 /// 108 /// Serializing and deserializing a module looks like: 109 /// 110 /// ```no_run 111 /// # use wasmtime::*; 112 /// # fn main() -> anyhow::Result<()> { 113 /// let engine = Engine::default(); 114 /// # let wasm_bytes: Vec<u8> = Vec::new(); 115 /// let module = Module::new(&engine, &wasm_bytes)?; 116 /// let module_bytes = module.serialize()?; 117 /// 118 /// // ... can save `module_bytes` to disk or other storage ... 119 /// 120 /// // recreate the module from the serialized bytes. For the `unsafe` bits 121 /// // see the documentation of `deserialize`. 122 /// let module = unsafe { Module::deserialize(&engine, &module_bytes)? }; 123 /// # Ok(()) 124 /// # } 125 /// ``` 126 /// 127 /// [`Config`]: crate::Config 128 #[derive(Clone)] 129 pub struct Module { 130 inner: Arc<ModuleInner>, 131 } 132 133 struct ModuleInner { 134 engine: Engine, 135 /// The compiled artifacts for this module that will be instantiated and 136 /// executed. 137 module: CompiledModule, 138 139 /// Runtime information such as the underlying mmap, type information, etc. 140 /// 141 /// Note that this `Arc` is used to share information between compiled 142 /// modules within a component. For bare core wasm modules created with 143 /// `Module::new`, for example, this is a uniquely owned `Arc`. 144 code: Arc<CodeObject>, 145 146 /// A set of initialization images for memories, if any. 147 /// 148 /// Note that this is behind a `OnceCell` to lazily create this image. On 149 /// Linux where `memfd_create` may be used to create the backing memory 150 /// image this is a pretty expensive operation, so by deferring it this 151 /// improves memory usage for modules that are created but may not ever be 152 /// instantiated. 153 memory_images: OnceLock<Option<ModuleMemoryImages>>, 154 155 /// Flag indicating whether this module can be serialized or not. 156 serializable: bool, 157 158 /// Runtime offset information for `VMContext`. 159 offsets: VMOffsets<HostPtr>, 160 } 161 162 impl fmt::Debug for Module { 163 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { 164 f.debug_struct("Module") 165 .field("name", &self.name()) 166 .finish_non_exhaustive() 167 } 168 } 169 170 impl fmt::Debug for ModuleInner { 171 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { 172 f.debug_struct("ModuleInner") 173 .field("name", &self.module.module().name.as_ref()) 174 .finish_non_exhaustive() 175 } 176 } 177 178 impl Module { 179 /// Creates a new WebAssembly `Module` from the given in-memory `bytes`. 180 /// 181 /// The `bytes` provided must be in one of the following formats: 182 /// 183 /// * A [binary-encoded][binary] WebAssembly module. This is always supported. 184 /// * A [text-encoded][text] instance of the WebAssembly text format. 185 /// This is only supported when the `wat` feature of this crate is enabled. 186 /// If this is supplied then the text format will be parsed before validation. 187 /// Note that the `wat` feature is enabled by default. 188 /// 189 /// The data for the wasm module must be loaded in-memory if it's present 190 /// elsewhere, for example on disk. This requires that the entire binary is 191 /// loaded into memory all at once, this API does not support streaming 192 /// compilation of a module. 193 /// 194 /// The WebAssembly binary will be decoded and validated. It will also be 195 /// compiled according to the configuration of the provided `engine`. 196 /// 197 /// # Errors 198 /// 199 /// This function may fail and return an error. Errors may include 200 /// situations such as: 201 /// 202 /// * The binary provided could not be decoded because it's not a valid 203 /// WebAssembly binary 204 /// * The WebAssembly binary may not validate (e.g. contains type errors) 205 /// * Implementation-specific limits were exceeded with a valid binary (for 206 /// example too many locals) 207 /// * The wasm binary may use features that are not enabled in the 208 /// configuration of `engine` 209 /// * If the `wat` feature is enabled and the input is text, then it may be 210 /// rejected if it fails to parse. 211 /// 212 /// The error returned should contain full information about why module 213 /// creation failed if one is returned. 214 /// 215 /// [binary]: https://webassembly.github.io/spec/core/binary/index.html 216 /// [text]: https://webassembly.github.io/spec/core/text/index.html 217 /// 218 /// # Examples 219 /// 220 /// The `new` function can be invoked with a in-memory array of bytes: 221 /// 222 /// ```no_run 223 /// # use wasmtime::*; 224 /// # fn main() -> anyhow::Result<()> { 225 /// # let engine = Engine::default(); 226 /// # let wasm_bytes: Vec<u8> = Vec::new(); 227 /// let module = Module::new(&engine, &wasm_bytes)?; 228 /// # Ok(()) 229 /// # } 230 /// ``` 231 /// 232 /// Or you can also pass in a string to be parsed as the wasm text 233 /// format: 234 /// 235 /// ``` 236 /// # use wasmtime::*; 237 /// # fn main() -> anyhow::Result<()> { 238 /// # let engine = Engine::default(); 239 /// let module = Module::new(&engine, "(module (func))")?; 240 /// # Ok(()) 241 /// # } 242 /// ``` 243 #[cfg(any(feature = "cranelift", feature = "winch"))] 244 pub fn new(engine: &Engine, bytes: impl AsRef<[u8]>) -> Result<Module> { 245 crate::CodeBuilder::new(engine) 246 .wasm_binary_or_text(bytes.as_ref(), None)? 247 .compile_module() 248 } 249 250 /// Creates a new WebAssembly `Module` from the contents of the given 251 /// `file` on disk. 252 /// 253 /// This is a convenience function that will read the `file` provided and 254 /// pass the bytes to the [`Module::new`] function. For more information 255 /// see [`Module::new`] 256 /// 257 /// # Examples 258 /// 259 /// ```no_run 260 /// # use wasmtime::*; 261 /// # fn main() -> anyhow::Result<()> { 262 /// let engine = Engine::default(); 263 /// let module = Module::from_file(&engine, "./path/to/foo.wasm")?; 264 /// # Ok(()) 265 /// # } 266 /// ``` 267 /// 268 /// The `.wat` text format is also supported: 269 /// 270 /// ```no_run 271 /// # use wasmtime::*; 272 /// # fn main() -> anyhow::Result<()> { 273 /// # let engine = Engine::default(); 274 /// let module = Module::from_file(&engine, "./path/to/foo.wat")?; 275 /// # Ok(()) 276 /// # } 277 /// ``` 278 #[cfg(all(feature = "std", any(feature = "cranelift", feature = "winch")))] 279 pub fn from_file(engine: &Engine, file: impl AsRef<Path>) -> Result<Module> { 280 crate::CodeBuilder::new(engine) 281 .wasm_binary_or_text_file(file.as_ref())? 282 .compile_module() 283 } 284 285 /// Creates a new WebAssembly `Module` from the given in-memory `binary` 286 /// data. 287 /// 288 /// This is similar to [`Module::new`] except that it requires that the 289 /// `binary` input is a WebAssembly binary, the text format is not supported 290 /// by this function. It's generally recommended to use [`Module::new`], but 291 /// if it's required to not support the text format this function can be 292 /// used instead. 293 /// 294 /// # Examples 295 /// 296 /// ``` 297 /// # use wasmtime::*; 298 /// # fn main() -> anyhow::Result<()> { 299 /// # let engine = Engine::default(); 300 /// let wasm = b"\0asm\x01\0\0\0"; 301 /// let module = Module::from_binary(&engine, wasm)?; 302 /// # Ok(()) 303 /// # } 304 /// ``` 305 /// 306 /// Note that the text format is **not** accepted by this function: 307 /// 308 /// ``` 309 /// # use wasmtime::*; 310 /// # fn main() -> anyhow::Result<()> { 311 /// # let engine = Engine::default(); 312 /// assert!(Module::from_binary(&engine, b"(module)").is_err()); 313 /// # Ok(()) 314 /// # } 315 /// ``` 316 #[cfg(any(feature = "cranelift", feature = "winch"))] 317 pub fn from_binary(engine: &Engine, binary: &[u8]) -> Result<Module> { 318 crate::CodeBuilder::new(engine) 319 .wasm_binary(binary, None)? 320 .compile_module() 321 } 322 323 /// Creates a new WebAssembly `Module` from the contents of the given `file` 324 /// on disk, but with assumptions that the file is from a trusted source. 325 /// The file should be a binary- or text-format WebAssembly module, or a 326 /// precompiled artifact generated by the same version of Wasmtime. 327 /// 328 /// # Unsafety 329 /// 330 /// All of the reasons that [`deserialize`] is `unsafe` apply to this 331 /// function as well. Arbitrary data loaded from a file may trick Wasmtime 332 /// into arbitrary code execution since the contents of the file are not 333 /// validated to be a valid precompiled module. 334 /// 335 /// [`deserialize`]: Module::deserialize 336 /// 337 /// Additionally though this function is also `unsafe` because the file 338 /// referenced must remain unchanged and a valid precompiled module for the 339 /// entire lifetime of the [`Module`] returned. Any changes to the file on 340 /// disk may change future instantiations of the module to be incorrect. 341 /// This is because the file is mapped into memory and lazily loaded pages 342 /// reflect the current state of the file, not necessarily the original 343 /// state of the file. 344 #[cfg(all(feature = "std", any(feature = "cranelift", feature = "winch")))] 345 pub unsafe fn from_trusted_file(engine: &Engine, file: impl AsRef<Path>) -> Result<Module> { 346 let open_file = open_file_for_mmap(file.as_ref())?; 347 let mmap = MmapVec::from_file(open_file)?; 348 if &mmap[0..4] == b"\x7fELF" { 349 let code = engine.load_code(mmap, ObjectKind::Module)?; 350 return Module::from_parts(engine, code, None); 351 } 352 353 crate::CodeBuilder::new(engine) 354 .wasm_binary_or_text(&mmap[..], Some(file.as_ref()))? 355 .compile_module() 356 } 357 358 /// Deserializes an in-memory compiled module previously created with 359 /// [`Module::serialize`] or [`Engine::precompile_module`]. 360 /// 361 /// This function will deserialize the binary blobs emitted by 362 /// [`Module::serialize`] and [`Engine::precompile_module`] back into an 363 /// in-memory [`Module`] that's ready to be instantiated. 364 /// 365 /// Note that the [`Module::deserialize_file`] method is more optimized than 366 /// this function, so if the serialized module is already present in a file 367 /// it's recommended to use that method instead. 368 /// 369 /// # Unsafety 370 /// 371 /// This function is marked as `unsafe` because if fed invalid input or used 372 /// improperly this could lead to memory safety vulnerabilities. This method 373 /// should not, for example, be exposed to arbitrary user input. 374 /// 375 /// The structure of the binary blob read here is only lightly validated 376 /// internally in `wasmtime`. This is intended to be an efficient 377 /// "rehydration" for a [`Module`] which has very few runtime checks beyond 378 /// deserialization. Arbitrary input could, for example, replace valid 379 /// compiled code with any other valid compiled code, meaning that this can 380 /// trivially be used to execute arbitrary code otherwise. 381 /// 382 /// For these reasons this function is `unsafe`. This function is only 383 /// designed to receive the previous input from [`Module::serialize`] and 384 /// [`Engine::precompile_module`]. If the exact output of those functions 385 /// (unmodified) is passed to this function then calls to this function can 386 /// be considered safe. It is the caller's responsibility to provide the 387 /// guarantee that only previously-serialized bytes are being passed in 388 /// here. 389 /// 390 /// Note that this function is designed to be safe receiving output from 391 /// *any* compiled version of `wasmtime` itself. This means that it is safe 392 /// to feed output from older versions of Wasmtime into this function, in 393 /// addition to newer versions of wasmtime (from the future!). These inputs 394 /// will deterministically and safely produce an `Err`. This function only 395 /// successfully accepts inputs from the same version of `wasmtime`, but the 396 /// safety guarantee only applies to externally-defined blobs of bytes, not 397 /// those defined by any version of wasmtime. (this means that if you cache 398 /// blobs across versions of wasmtime you can be safely guaranteed that 399 /// future versions of wasmtime will reject old cache entries). 400 pub unsafe fn deserialize(engine: &Engine, bytes: impl AsRef<[u8]>) -> Result<Module> { 401 let code = engine.load_code_bytes(bytes.as_ref(), ObjectKind::Module)?; 402 Module::from_parts(engine, code, None) 403 } 404 405 /// Same as [`deserialize`], except that the contents of `path` are read to 406 /// deserialize into a [`Module`]. 407 /// 408 /// This method is provided because it can be faster than [`deserialize`] 409 /// since the data doesn't need to be copied around, but rather the module 410 /// can be used directly from an mmap'd view of the file provided. 411 /// 412 /// [`deserialize`]: Module::deserialize 413 /// 414 /// # Unsafety 415 /// 416 /// All of the reasons that [`deserialize`] is `unsafe` applies to this 417 /// function as well. Arbitrary data loaded from a file may trick Wasmtime 418 /// into arbitrary code execution since the contents of the file are not 419 /// validated to be a valid precompiled module. 420 /// 421 /// Additionally though this function is also `unsafe` because the file 422 /// referenced must remain unchanged and a valid precompiled module for the 423 /// entire lifetime of the [`Module`] returned. Any changes to the file on 424 /// disk may change future instantiations of the module to be incorrect. 425 /// This is because the file is mapped into memory and lazily loaded pages 426 /// reflect the current state of the file, not necessarily the original 427 /// state of the file. 428 #[cfg(feature = "std")] 429 pub unsafe fn deserialize_file(engine: &Engine, path: impl AsRef<Path>) -> Result<Module> { 430 let file = open_file_for_mmap(path.as_ref())?; 431 Self::deserialize_open_file(engine, file) 432 .with_context(|| format!("failed deserialization for: {}", path.as_ref().display())) 433 } 434 435 /// Same as [`deserialize_file`], except that it takes an open `File` 436 /// instead of a path. 437 /// 438 /// This method is provided because it can be used instead of 439 /// [`deserialize_file`] in situations where `wasmtime` is running with 440 /// limited file system permissions. In that case a process 441 /// with file system access can pass already opened files to `wasmtime`. 442 /// 443 /// [`deserialize_file`]: Module::deserialize_file 444 /// 445 /// Note that the corresponding will be mapped as private writeable 446 /// (copy-on-write) and executable. For `windows` this means the file needs 447 /// to be opened with at least `FILE_GENERIC_READ | FILE_GENERIC_EXECUTE` 448 /// [`access_mode`]. 449 /// 450 /// [`access_mode`]: https://doc.rust-lang.org/std/os/windows/fs/trait.OpenOptionsExt.html#tymethod.access_mode 451 /// 452 /// # Unsafety 453 /// 454 /// All of the reasons that [`deserialize_file`] is `unsafe` applies to this 455 /// function as well. 456 #[cfg(feature = "std")] 457 pub unsafe fn deserialize_open_file(engine: &Engine, file: File) -> Result<Module> { 458 let code = engine.load_code_file(file, ObjectKind::Module)?; 459 Module::from_parts(engine, code, None) 460 } 461 462 /// Entrypoint for creating a `Module` for all above functions, both 463 /// of the AOT and jit-compiled categories. 464 /// 465 /// In all cases the compilation artifact, `code_memory`, is provided here. 466 /// The `info_and_types` argument is `None` when a module is being 467 /// deserialized from a precompiled artifact or it's `Some` if it was just 468 /// compiled and the values are already available. 469 pub(crate) fn from_parts( 470 engine: &Engine, 471 code_memory: Arc<CodeMemory>, 472 info_and_types: Option<(CompiledModuleInfo, ModuleTypes)>, 473 ) -> Result<Self> { 474 // Acquire this module's metadata and type information, deserializing 475 // it from the provided artifact if it wasn't otherwise provided 476 // already. 477 let (info, types) = match info_and_types { 478 Some((info, types)) => (info, types), 479 None => postcard::from_bytes(code_memory.wasmtime_info())?, 480 }; 481 482 // Register function type signatures into the engine for the lifetime 483 // of the `Module` that will be returned. This notably also builds up 484 // maps for trampolines to be used for this module when inserted into 485 // stores. 486 // 487 // Note that the unsafety here should be ok since the `trampolines` 488 // field should only point to valid trampoline function pointers 489 // within the text section. 490 let signatures = TypeCollection::new_for_module(engine, &types); 491 492 // Package up all our data into a `CodeObject` and delegate to the final 493 // step of module compilation. 494 let code = Arc::new(CodeObject::new(code_memory, signatures, types.into())); 495 Module::from_parts_raw(engine, code, info, true) 496 } 497 498 pub(crate) fn from_parts_raw( 499 engine: &Engine, 500 code: Arc<CodeObject>, 501 info: CompiledModuleInfo, 502 serializable: bool, 503 ) -> Result<Self> { 504 let module = 505 CompiledModule::from_artifacts(code.code_memory().clone(), info, engine.profiler())?; 506 507 // Validate the module can be used with the current instance allocator. 508 let offsets = VMOffsets::new(HostPtr, module.module()); 509 engine 510 .allocator() 511 .validate_module(module.module(), &offsets)?; 512 513 Ok(Self { 514 inner: Arc::new(ModuleInner { 515 engine: engine.clone(), 516 code, 517 memory_images: OnceLock::new(), 518 module, 519 serializable, 520 offsets, 521 }), 522 }) 523 } 524 525 /// Validates `binary` input data as a WebAssembly binary given the 526 /// configuration in `engine`. 527 /// 528 /// This function will perform a speedy validation of the `binary` input 529 /// WebAssembly module (which is in [binary form][binary], the text format 530 /// is not accepted by this function) and return either `Ok` or `Err` 531 /// depending on the results of validation. The `engine` argument indicates 532 /// configuration for WebAssembly features, for example, which are used to 533 /// indicate what should be valid and what shouldn't be. 534 /// 535 /// Validation automatically happens as part of [`Module::new`]. 536 /// 537 /// # Errors 538 /// 539 /// If validation fails for any reason (type check error, usage of a feature 540 /// that wasn't enabled, etc) then an error with a description of the 541 /// validation issue will be returned. 542 /// 543 /// [binary]: https://webassembly.github.io/spec/core/binary/index.html 544 pub fn validate(engine: &Engine, binary: &[u8]) -> Result<()> { 545 let mut validator = Validator::new_with_features(engine.features()); 546 547 let mut functions = Vec::new(); 548 for payload in Parser::new(0).parse_all(binary) { 549 let payload = payload?; 550 if let ValidPayload::Func(a, b) = validator.payload(&payload)? { 551 functions.push((a, b)); 552 } 553 if let wasmparser::Payload::Version { encoding, .. } = &payload { 554 if let wasmparser::Encoding::Component = encoding { 555 bail!("component passed to module validation"); 556 } 557 } 558 } 559 560 engine.run_maybe_parallel(functions, |(validator, body)| { 561 // FIXME: it would be best here to use a rayon-specific parallel 562 // iterator that maintains state-per-thread to share the function 563 // validator allocations (`Default::default` here) across multiple 564 // functions. 565 validator.into_validator(Default::default()).validate(&body) 566 })?; 567 Ok(()) 568 } 569 570 /// Serializes this module to a vector of bytes. 571 /// 572 /// This function is similar to the [`Engine::precompile_module`] method 573 /// where it produces an artifact of Wasmtime which is suitable to later 574 /// pass into [`Module::deserialize`]. If a module is never instantiated 575 /// then it's recommended to use [`Engine::precompile_module`] instead of 576 /// this method, but if a module is both instantiated and serialized then 577 /// this method can be useful to get the serialized version without 578 /// compiling twice. 579 #[cfg(any(feature = "cranelift", feature = "winch"))] 580 pub fn serialize(&self) -> Result<Vec<u8>> { 581 // The current representation of compiled modules within a compiled 582 // component means that it cannot be serialized. The mmap returned here 583 // is the mmap for the entire component and while it contains all 584 // necessary data to deserialize this particular module it's all 585 // embedded within component-specific information. 586 // 587 // It's not the hardest thing in the world to support this but it's 588 // expected that there's not much of a use case at this time. In theory 589 // all that needs to be done is to edit the `.wasmtime.info` section 590 // to contains this module's metadata instead of the metadata for the 591 // whole component. The metadata itself is fairly trivially 592 // recreateable here it's more that there's no easy one-off API for 593 // editing the sections of an ELF object to use here. 594 // 595 // Overall for now this simply always returns an error in this 596 // situation. If you're reading this and feel that the situation should 597 // be different please feel free to open an issue. 598 if !self.inner.serializable { 599 bail!("cannot serialize a module exported from a component"); 600 } 601 Ok(self.compiled_module().mmap().to_vec()) 602 } 603 604 pub(crate) fn compiled_module(&self) -> &CompiledModule { 605 &self.inner.module 606 } 607 608 pub(crate) fn code_object(&self) -> &Arc<CodeObject> { 609 &self.inner.code 610 } 611 612 pub(crate) fn env_module(&self) -> &Arc<wasmtime_environ::Module> { 613 self.compiled_module().module() 614 } 615 616 pub(crate) fn types(&self) -> &ModuleTypes { 617 self.inner.code.module_types() 618 } 619 620 pub(crate) fn signatures(&self) -> &TypeCollection { 621 self.inner.code.signatures() 622 } 623 624 /// Returns identifier/name that this [`Module`] has. This name 625 /// is used in traps/backtrace details. 626 /// 627 /// Note that most LLVM/clang/Rust-produced modules do not have a name 628 /// associated with them, but other wasm tooling can be used to inject or 629 /// add a name. 630 /// 631 /// # Examples 632 /// 633 /// ``` 634 /// # use wasmtime::*; 635 /// # fn main() -> anyhow::Result<()> { 636 /// # let engine = Engine::default(); 637 /// let module = Module::new(&engine, "(module $foo)")?; 638 /// assert_eq!(module.name(), Some("foo")); 639 /// 640 /// let module = Module::new(&engine, "(module)")?; 641 /// assert_eq!(module.name(), None); 642 /// 643 /// # Ok(()) 644 /// # } 645 /// ``` 646 pub fn name(&self) -> Option<&str> { 647 self.compiled_module().module().name.as_deref() 648 } 649 650 /// Returns the list of imports that this [`Module`] has and must be 651 /// satisfied. 652 /// 653 /// This function returns the list of imports that the wasm module has, but 654 /// only the types of each import. The type of each import is used to 655 /// typecheck the [`Instance::new`](crate::Instance::new) method's `imports` 656 /// argument. The arguments to that function must match up 1-to-1 with the 657 /// entries in the array returned here. 658 /// 659 /// The imports returned reflect the order of the imports in the wasm module 660 /// itself, and note that no form of deduplication happens. 661 /// 662 /// # Examples 663 /// 664 /// Modules with no imports return an empty list here: 665 /// 666 /// ``` 667 /// # use wasmtime::*; 668 /// # fn main() -> anyhow::Result<()> { 669 /// # let engine = Engine::default(); 670 /// let module = Module::new(&engine, "(module)")?; 671 /// assert_eq!(module.imports().len(), 0); 672 /// # Ok(()) 673 /// # } 674 /// ``` 675 /// 676 /// and modules with imports will have a non-empty list: 677 /// 678 /// ``` 679 /// # use wasmtime::*; 680 /// # fn main() -> anyhow::Result<()> { 681 /// # let engine = Engine::default(); 682 /// let wat = r#" 683 /// (module 684 /// (import "host" "foo" (func)) 685 /// ) 686 /// "#; 687 /// let module = Module::new(&engine, wat)?; 688 /// assert_eq!(module.imports().len(), 1); 689 /// let import = module.imports().next().unwrap(); 690 /// assert_eq!(import.module(), "host"); 691 /// assert_eq!(import.name(), "foo"); 692 /// match import.ty() { 693 /// ExternType::Func(_) => { /* ... */ } 694 /// _ => panic!("unexpected import type!"), 695 /// } 696 /// # Ok(()) 697 /// # } 698 /// ``` 699 pub fn imports<'module>( 700 &'module self, 701 ) -> impl ExactSizeIterator<Item = ImportType<'module>> + 'module { 702 let module = self.compiled_module().module(); 703 let types = self.types(); 704 let engine = self.engine(); 705 module 706 .imports() 707 .map(move |(imp_mod, imp_field, mut ty)| { 708 ty.canonicalize_for_runtime_usage(&mut |i| { 709 self.signatures().shared_type(i).unwrap() 710 }); 711 ImportType::new(imp_mod, imp_field, ty, types, engine) 712 }) 713 .collect::<Vec<_>>() 714 .into_iter() 715 } 716 717 /// Returns the list of exports that this [`Module`] has and will be 718 /// available after instantiation. 719 /// 720 /// This function will return the type of each item that will be returned 721 /// from [`Instance::exports`](crate::Instance::exports). Each entry in this 722 /// list corresponds 1-to-1 with that list, and the entries here will 723 /// indicate the name of the export along with the type of the export. 724 /// 725 /// # Examples 726 /// 727 /// Modules might not have any exports: 728 /// 729 /// ``` 730 /// # use wasmtime::*; 731 /// # fn main() -> anyhow::Result<()> { 732 /// # let engine = Engine::default(); 733 /// let module = Module::new(&engine, "(module)")?; 734 /// assert!(module.exports().next().is_none()); 735 /// # Ok(()) 736 /// # } 737 /// ``` 738 /// 739 /// When the exports are not empty, you can inspect each export: 740 /// 741 /// ``` 742 /// # use wasmtime::*; 743 /// # fn main() -> anyhow::Result<()> { 744 /// # let engine = Engine::default(); 745 /// let wat = r#" 746 /// (module 747 /// (func (export "foo")) 748 /// (memory (export "memory") 1) 749 /// ) 750 /// "#; 751 /// let module = Module::new(&engine, wat)?; 752 /// assert_eq!(module.exports().len(), 2); 753 /// 754 /// let mut exports = module.exports(); 755 /// let foo = exports.next().unwrap(); 756 /// assert_eq!(foo.name(), "foo"); 757 /// match foo.ty() { 758 /// ExternType::Func(_) => { /* ... */ } 759 /// _ => panic!("unexpected export type!"), 760 /// } 761 /// 762 /// let memory = exports.next().unwrap(); 763 /// assert_eq!(memory.name(), "memory"); 764 /// match memory.ty() { 765 /// ExternType::Memory(_) => { /* ... */ } 766 /// _ => panic!("unexpected export type!"), 767 /// } 768 /// # Ok(()) 769 /// # } 770 /// ``` 771 pub fn exports<'module>( 772 &'module self, 773 ) -> impl ExactSizeIterator<Item = ExportType<'module>> + 'module { 774 let module = self.compiled_module().module(); 775 let types = self.types(); 776 let engine = self.engine(); 777 module.exports.iter().map(move |(name, entity_index)| { 778 ExportType::new(name, module.type_of(*entity_index), types, engine) 779 }) 780 } 781 782 /// Looks up an export in this [`Module`] by name. 783 /// 784 /// This function will return the type of an export with the given name. 785 /// 786 /// # Examples 787 /// 788 /// There may be no export with that name: 789 /// 790 /// ``` 791 /// # use wasmtime::*; 792 /// # fn main() -> anyhow::Result<()> { 793 /// # let engine = Engine::default(); 794 /// let module = Module::new(&engine, "(module)")?; 795 /// assert!(module.get_export("foo").is_none()); 796 /// # Ok(()) 797 /// # } 798 /// ``` 799 /// 800 /// When there is an export with that name, it is returned: 801 /// 802 /// ``` 803 /// # use wasmtime::*; 804 /// # fn main() -> anyhow::Result<()> { 805 /// # let engine = Engine::default(); 806 /// let wat = r#" 807 /// (module 808 /// (func (export "foo")) 809 /// (memory (export "memory") 1) 810 /// ) 811 /// "#; 812 /// let module = Module::new(&engine, wat)?; 813 /// let foo = module.get_export("foo"); 814 /// assert!(foo.is_some()); 815 /// 816 /// let foo = foo.unwrap(); 817 /// match foo { 818 /// ExternType::Func(_) => { /* ... */ } 819 /// _ => panic!("unexpected export type!"), 820 /// } 821 /// 822 /// # Ok(()) 823 /// # } 824 /// ``` 825 pub fn get_export(&self, name: &str) -> Option<ExternType> { 826 let module = self.compiled_module().module(); 827 let entity_index = module.exports.get(name)?; 828 Some(ExternType::from_wasmtime( 829 self.engine(), 830 self.types(), 831 &module.type_of(*entity_index), 832 )) 833 } 834 835 /// Looks up an export in this [`Module`] by name to get its index. 836 /// 837 /// This function will return the index of an export with the given name. This can be useful 838 /// to avoid the cost of looking up the export by name multiple times. Instead the 839 /// [`ModuleExport`] can be stored and used to look up the export on the 840 /// [`Instance`](crate::Instance) later. 841 pub fn get_export_index(&self, name: &str) -> Option<ModuleExport> { 842 let compiled_module = self.compiled_module(); 843 let module = compiled_module.module(); 844 module 845 .exports 846 .get_full(name) 847 .map(|(export_name_index, _, &entity)| ModuleExport { 848 module: self.id(), 849 entity, 850 export_name_index, 851 }) 852 } 853 854 /// Returns the [`Engine`] that this [`Module`] was compiled by. 855 pub fn engine(&self) -> &Engine { 856 &self.inner.engine 857 } 858 859 /// Returns a summary of the resources required to instantiate this 860 /// [`Module`]. 861 /// 862 /// Potential uses of the returned information: 863 /// 864 /// * Determining whether your pooling allocator configuration supports 865 /// instantiating this module. 866 /// 867 /// * Deciding how many of which `Module` you want to instantiate within a 868 /// fixed amount of resources, e.g. determining whether to create 5 869 /// instances of module X or 10 instances of module Y. 870 /// 871 /// # Example 872 /// 873 /// ``` 874 /// # fn main() -> wasmtime::Result<()> { 875 /// use wasmtime::{Config, Engine, Module}; 876 /// 877 /// let mut config = Config::new(); 878 /// config.wasm_multi_memory(true); 879 /// let engine = Engine::new(&config)?; 880 /// 881 /// let module = Module::new(&engine, r#" 882 /// (module 883 /// ;; Import a memory. Doesn't count towards required resources. 884 /// (import "a" "b" (memory 10)) 885 /// ;; Define two local memories. These count towards the required 886 /// ;; resources. 887 /// (memory 1) 888 /// (memory 6) 889 /// ) 890 /// "#)?; 891 /// 892 /// let resources = module.resources_required(); 893 /// 894 /// // Instantiating the module will require allocating two memories, and 895 /// // the maximum initial memory size is six Wasm pages. 896 /// assert_eq!(resources.num_memories, 2); 897 /// assert_eq!(resources.max_initial_memory_size, Some(6)); 898 /// 899 /// // The module doesn't need any tables. 900 /// assert_eq!(resources.num_tables, 0); 901 /// assert_eq!(resources.max_initial_table_size, None); 902 /// # Ok(()) } 903 /// ``` 904 pub fn resources_required(&self) -> ResourcesRequired { 905 let em = self.env_module(); 906 let num_memories = u32::try_from(em.num_defined_memories()).unwrap(); 907 let max_initial_memory_size = em 908 .memories 909 .values() 910 .skip(em.num_imported_memories) 911 .map(|memory| memory.limits.min) 912 .max(); 913 let num_tables = u32::try_from(em.num_defined_tables()).unwrap(); 914 let max_initial_table_size = em 915 .tables 916 .values() 917 .skip(em.num_imported_tables) 918 .map(|table| table.limits.min) 919 .max(); 920 ResourcesRequired { 921 num_memories, 922 max_initial_memory_size, 923 num_tables, 924 max_initial_table_size, 925 } 926 } 927 928 /// Returns the range of bytes in memory where this module's compilation 929 /// image resides. 930 /// 931 /// The compilation image for a module contains executable code, data, debug 932 /// information, etc. This is roughly the same as the `Module::serialize` 933 /// but not the exact same. 934 /// 935 /// The range of memory reported here is exposed to allow low-level 936 /// manipulation of the memory in platform-specific manners such as using 937 /// `mlock` to force the contents to be paged in immediately or keep them 938 /// paged in after they're loaded. 939 /// 940 /// It is not safe to modify the memory in this range, nor is it safe to 941 /// modify the protections of memory in this range. 942 pub fn image_range(&self) -> Range<*const u8> { 943 self.compiled_module().mmap().image_range() 944 } 945 946 /// Force initialization of copy-on-write images to happen here-and-now 947 /// instead of when they're requested during first instantiation. 948 /// 949 /// When [copy-on-write memory 950 /// initialization](crate::Config::memory_init_cow) is enabled then Wasmtime 951 /// will lazily create the initialization image for a module. This method 952 /// can be used to explicitly dictate when this initialization happens. 953 /// 954 /// Note that this largely only matters on Linux when memfd is used. 955 /// Otherwise the copy-on-write image typically comes from disk and in that 956 /// situation the creation of the image is trivial as the image is always 957 /// sourced from disk. On Linux, though, when memfd is used a memfd is 958 /// created and the initialization image is written to it. 959 /// 960 /// Also note that this method is not required to be called, it's available 961 /// as a performance optimization if required but is otherwise handled 962 /// automatically. 963 pub fn initialize_copy_on_write_image(&self) -> Result<()> { 964 self.memory_images()?; 965 Ok(()) 966 } 967 968 /// Get the map from `.text` section offsets to Wasm binary offsets for this 969 /// module. 970 /// 971 /// Each entry is a (`.text` section offset, Wasm binary offset) pair. 972 /// 973 /// Entries are yielded in order of `.text` section offset. 974 /// 975 /// Some entries are missing a Wasm binary offset. This is for code that is 976 /// not associated with any single location in the Wasm binary, or for when 977 /// source information was optimized away. 978 /// 979 /// Not every module has an address map, since address map generation can be 980 /// turned off on `Config`. 981 /// 982 /// There is not an entry for every `.text` section offset. Every offset 983 /// after an entry's offset, but before the next entry's offset, is 984 /// considered to map to the same Wasm binary offset as the original 985 /// entry. For example, the address map will not contain the following 986 /// sequence of entries: 987 /// 988 /// ```ignore 989 /// [ 990 /// // ... 991 /// (10, Some(42)), 992 /// (11, Some(42)), 993 /// (12, Some(42)), 994 /// (13, Some(43)), 995 /// // ... 996 /// ] 997 /// ``` 998 /// 999 /// Instead, it will drop the entries for offsets `11` and `12` since they 1000 /// are the same as the entry for offset `10`: 1001 /// 1002 /// ```ignore 1003 /// [ 1004 /// // ... 1005 /// (10, Some(42)), 1006 /// (13, Some(43)), 1007 /// // ... 1008 /// ] 1009 /// ``` 1010 pub fn address_map<'a>(&'a self) -> Option<impl Iterator<Item = (usize, Option<u32>)> + 'a> { 1011 Some( 1012 wasmtime_environ::iterate_address_map( 1013 self.code_object().code_memory().address_map_data(), 1014 )? 1015 .map(|(offset, file_pos)| (offset as usize, file_pos.file_offset())), 1016 ) 1017 } 1018 1019 /// Get this module's code object's `.text` section, containing its compiled 1020 /// executable code. 1021 pub fn text(&self) -> &[u8] { 1022 self.code_object().code_memory().text() 1023 } 1024 1025 /// Get information about functions in this module's `.text` section: their 1026 /// index, name, and offset+length. 1027 /// 1028 /// Results are yielded in a ModuleFunction struct. 1029 pub fn functions<'a>(&'a self) -> impl ExactSizeIterator<Item = ModuleFunction> + 'a { 1030 let module = self.compiled_module(); 1031 module.finished_functions().map(|(idx, _)| { 1032 let loc = module.func_loc(idx); 1033 let idx = module.module().func_index(idx); 1034 ModuleFunction { 1035 index: idx, 1036 name: module.func_name(idx).map(|n| n.to_string()), 1037 offset: loc.start as usize, 1038 len: loc.length as usize, 1039 } 1040 }) 1041 } 1042 1043 pub(crate) fn id(&self) -> CompiledModuleId { 1044 self.inner.module.unique_id() 1045 } 1046 1047 pub(crate) fn offsets(&self) -> &VMOffsets<HostPtr> { 1048 &self.inner.offsets 1049 } 1050 1051 /// Return the address, in memory, of the trampoline that allows Wasm to 1052 /// call a array function of the given signature. 1053 pub(crate) fn wasm_to_array_trampoline( 1054 &self, 1055 signature: VMSharedTypeIndex, 1056 ) -> Option<NonNull<VMWasmCallFunction>> { 1057 log::trace!("Looking up trampoline for {signature:?}"); 1058 let trampoline_shared_ty = self.inner.engine.signatures().trampoline_type(signature); 1059 let trampoline_module_ty = self 1060 .inner 1061 .code 1062 .signatures() 1063 .trampoline_type(trampoline_shared_ty)?; 1064 debug_assert!(self 1065 .inner 1066 .engine 1067 .signatures() 1068 .borrow( 1069 self.inner 1070 .code 1071 .signatures() 1072 .shared_type(trampoline_module_ty) 1073 .unwrap() 1074 ) 1075 .unwrap() 1076 .unwrap_func() 1077 .is_trampoline_type()); 1078 1079 let ptr = self 1080 .compiled_module() 1081 .wasm_to_array_trampoline(trampoline_module_ty) 1082 .as_ptr() 1083 .cast::<VMWasmCallFunction>() 1084 .cast_mut(); 1085 Some(NonNull::new(ptr).unwrap()) 1086 } 1087 1088 pub(crate) fn memory_images(&self) -> Result<Option<&ModuleMemoryImages>> { 1089 let images = self 1090 .inner 1091 .memory_images 1092 .get_or_try_init(|| memory_images(&self.inner.engine, &self.inner.module))? 1093 .as_ref(); 1094 Ok(images) 1095 } 1096 1097 /// Lookup the stack map at a program counter value. 1098 pub(crate) fn lookup_stack_map(&self, pc: usize) -> Option<&wasmtime_environ::StackMap> { 1099 let text_offset = pc - self.inner.module.text().as_ptr() as usize; 1100 let (index, func_offset) = self.inner.module.func_by_text_offset(text_offset)?; 1101 let info = self.inner.module.wasm_func_info(index); 1102 1103 // Do a binary search to find the stack map for the given offset. 1104 let index = match info 1105 .stack_maps 1106 .binary_search_by_key(&func_offset, |i| i.code_offset) 1107 { 1108 // Found it. 1109 Ok(i) => i, 1110 1111 // No stack map associated with this PC. 1112 // 1113 // Because we know we are in Wasm code, and we must be at some kind 1114 // of call/safepoint, then the Cranelift backend must have avoided 1115 // emitting a stack map for this location because no refs were live. 1116 Err(_) => return None, 1117 }; 1118 1119 Some(&info.stack_maps[index].stack_map) 1120 } 1121 } 1122 1123 /// Describes a function for a given module. 1124 pub struct ModuleFunction { 1125 pub index: wasmtime_environ::FuncIndex, 1126 pub name: Option<String>, 1127 pub offset: usize, 1128 pub len: usize, 1129 } 1130 1131 impl Drop for ModuleInner { 1132 fn drop(&mut self) { 1133 // When a `Module` is being dropped that means that it's no longer 1134 // present in any `Store` and it's additionally not longer held by any 1135 // embedder. Take this opportunity to purge any lingering instantiations 1136 // within a pooling instance allocator, if applicable. 1137 self.engine 1138 .allocator() 1139 .purge_module(self.module.unique_id()); 1140 } 1141 } 1142 1143 /// Describes the location of an export in a module. 1144 #[derive(Copy, Clone)] 1145 pub struct ModuleExport { 1146 /// The module that this export is defined in. 1147 pub(crate) module: CompiledModuleId, 1148 /// A raw index into the wasm module. 1149 pub(crate) entity: EntityIndex, 1150 /// The index of the export name. 1151 pub(crate) export_name_index: usize, 1152 } 1153 1154 fn _assert_send_sync() { 1155 fn _assert<T: Send + Sync>() {} 1156 _assert::<Module>(); 1157 } 1158 1159 /// Helper method to construct a `ModuleMemoryImages` for an associated 1160 /// `CompiledModule`. 1161 fn memory_images(engine: &Engine, module: &CompiledModule) -> Result<Option<ModuleMemoryImages>> { 1162 // If initialization via copy-on-write is explicitly disabled in 1163 // configuration then this path is skipped entirely. 1164 if !engine.tunables().memory_init_cow { 1165 return Ok(None); 1166 } 1167 1168 // ... otherwise logic is delegated to the `ModuleMemoryImages::new` 1169 // constructor. 1170 let mmap = if engine.config().force_memory_init_memfd { 1171 None 1172 } else { 1173 Some(module.mmap()) 1174 }; 1175 ModuleMemoryImages::new(module.module(), module.code_memory().wasm_data(), mmap) 1176 } 1177 1178 #[cfg(test)] 1179 mod tests { 1180 use crate::{Engine, Module}; 1181 use wasmtime_environ::MemoryInitialization; 1182 1183 #[test] 1184 fn cow_on_by_default() { 1185 let engine = Engine::default(); 1186 let module = Module::new( 1187 &engine, 1188 r#" 1189 (module 1190 (memory 1) 1191 (data (i32.const 100) "abcd") 1192 ) 1193 "#, 1194 ) 1195 .unwrap(); 1196 1197 let init = &module.env_module().memory_initialization; 1198 assert!(matches!(init, MemoryInitialization::Static { .. })); 1199 } 1200 } 1201