wasmtime/compile/code_builder.rs
1use crate::Engine;
2use crate::prelude::*;
3use std::borrow::Cow;
4use std::path::Path;
5
6#[cfg(feature = "compile-time-builtins")]
7use crate::hash_map::HashMap;
8
9#[cfg(feature = "compile-time-builtins")]
10mod compile_time_builtins;
11
12/// Builder-style structure used to create a [`Module`](crate::module::Module) or
13/// pre-compile a module to a serialized list of bytes.
14///
15/// This structure can be used for more advanced configuration when compiling a
16/// WebAssembly module. Most configuration can use simpler constructors such as:
17///
18/// * [`Module::new`](crate::Module::new)
19/// * [`Module::from_file`](crate::Module::from_file)
20/// * [`Module::from_binary`](crate::Module::from_binary)
21///
22/// Note that a [`CodeBuilder`] always involves compiling WebAssembly bytes
23/// to machine code. To deserialize a list of bytes use
24/// [`Module::deserialize`](crate::Module::deserialize) instead.
25///
26/// A [`CodeBuilder`] requires a source of WebAssembly bytes to be configured
27/// before calling [`compile_module_serialized`] or [`compile_module`]. This can
28/// be provided with either the [`wasm_binary`] or [`wasm_binary_file`] method.
29/// Note that only a single source of bytes can be provided.
30///
31/// # WebAssembly Text Format
32///
33/// This builder supports the WebAssembly Text Format (`*.wat` files) through
34/// the [`CodeBuilder::wasm_binary_or_text`] and
35/// [`CodeBuilder::wasm_binary_or_text_file`] methods. These methods
36/// automatically convert WebAssembly text files to binary. Note though that
37/// this behavior is disabled if the `wat` crate feature is not enabled.
38///
39/// [`compile_module_serialized`]: CodeBuilder::compile_module_serialized
40/// [`compile_module`]: CodeBuilder::compile_module
41/// [`wasm_binary`]: CodeBuilder::wasm_binary
42/// [`wasm_binary_file`]: CodeBuilder::wasm_binary_file
43pub struct CodeBuilder<'a> {
44 pub(super) engine: &'a Engine,
45 wasm: Option<Cow<'a, [u8]>>,
46 wasm_path: Option<Cow<'a, Path>>,
47 dwarf_package: Option<Cow<'a, [u8]>>,
48 dwarf_package_path: Option<Cow<'a, Path>>,
49 unsafe_intrinsics_import: Option<String>,
50
51 /// A map from import name to the Wasm bytes of the associated compile-time
52 /// builtin and its file path, if any.
53 //
54 // XXX: we can't use `'a` here without forcing us to change a bunch of
55 // callers because `HashMap` has a `Drop` implementation, so `dropck` thinks
56 // that all `'a` borrows could be used by `CodeBuilder`'s `Drop`, which
57 // means that a bunch of the existing calls to `.wasm_bytes` and such would
58 // need to be reordered with the `CodeBuilder`'s construction.
59 #[cfg(feature = "compile-time-builtins")]
60 compile_time_builtins: HashMap<Cow<'a, str>, Cow<'a, [u8]>>,
61}
62
63/// Return value of [`CodeBuilder::hint`]
64pub enum CodeHint {
65 /// Hint that the code being compiled is a module.
66 Module,
67 /// Hint that the code being compiled is a component.
68 Component,
69}
70
71impl<'a> CodeBuilder<'a> {
72 /// Creates a new builder which will insert modules into the specified
73 /// [`Engine`].
74 pub fn new(engine: &'a Engine) -> Self {
75 CodeBuilder {
76 engine,
77 wasm: None,
78 wasm_path: None,
79 dwarf_package: None,
80 dwarf_package_path: None,
81 unsafe_intrinsics_import: None,
82 #[cfg(feature = "compile-time-builtins")]
83 compile_time_builtins: HashMap::default(),
84 }
85 }
86
87 /// Configures the WebAssembly binary that is being compiled.
88 ///
89 /// The `wasm_bytes` parameter must be a binary WebAssembly file.
90 /// This will be stored within the [`CodeBuilder`] for processing later when
91 /// compilation is finalized.
92 ///
93 /// The optional `wasm_path` parameter is the path to the `wasm_bytes` on
94 /// disk, if any. This may be used for diagnostics and other
95 /// debugging-related purposes, but this method will not read the path
96 /// specified.
97 ///
98 /// # Errors
99 ///
100 /// This method will return an error if WebAssembly bytes have already been
101 /// configured.
102 pub fn wasm_binary(
103 &mut self,
104 wasm_bytes: impl Into<Cow<'a, [u8]>>,
105 wasm_path: Option<&'a Path>,
106 ) -> Result<&mut Self> {
107 if self.wasm.is_some() {
108 bail!("cannot configure wasm bytes twice");
109 }
110 self.wasm = Some(wasm_bytes.into());
111 self.wasm_path = wasm_path.map(|p| p.into());
112
113 if self.wasm_path.is_some() {
114 self.dwarf_package_from_wasm_path()?;
115 }
116
117 Ok(self)
118 }
119
120 /// Equivalent of [`CodeBuilder::wasm_binary`] that also accepts the
121 /// WebAssembly text format.
122 ///
123 /// This method will configure the WebAssembly binary to be compiled. The
124 /// input `wasm_bytes` may either be the wasm text format or the binary
125 /// format. If the `wat` crate feature is enabled, which is enabled by
126 /// default, then the text format will automatically be converted to the
127 /// binary format.
128 ///
129 /// # Errors
130 ///
131 /// This method will return an error if WebAssembly bytes have already been
132 /// configured. This method will also return an error if `wasm_bytes` is the
133 /// wasm text format and the text syntax is not valid.
134 pub fn wasm_binary_or_text(
135 &mut self,
136 wasm_bytes: &'a [u8],
137 wasm_path: Option<&'a Path>,
138 ) -> Result<&mut Self> {
139 #[cfg(feature = "wat")]
140 let wasm_bytes = wat::parse_bytes(wasm_bytes).map_err(|mut e| {
141 if let Some(path) = wasm_path {
142 e.set_path(path);
143 }
144 e
145 })?;
146 self.wasm_binary(wasm_bytes, wasm_path)
147 }
148
149 /// Reads the `file` specified for the WebAssembly bytes that are going to
150 /// be compiled.
151 ///
152 /// This method will read `file` from the filesystem and interpret it
153 /// as a WebAssembly binary.
154 ///
155 /// A DWARF package file will be probed using the root of `file` and with a
156 /// `.dwp` extension. If found, it will be loaded and DWARF fusion
157 /// performed.
158 ///
159 /// # Errors
160 ///
161 /// This method will return an error if WebAssembly bytes have already been
162 /// configured.
163 ///
164 /// If `file` can't be read or an error happens reading it then that will
165 /// also be returned.
166 ///
167 /// If DWARF fusion is performed and the DWARF packaged file cannot be read
168 /// then an error will be returned.
169 pub fn wasm_binary_file(&mut self, file: &'a Path) -> Result<&mut Self> {
170 let wasm = std::fs::read(file)
171 .with_context(|| format!("failed to read input file: {}", file.display()))?;
172 self.wasm_binary(wasm, Some(file))
173 }
174
175 /// Equivalent of [`CodeBuilder::wasm_binary_file`] that also accepts the
176 /// WebAssembly text format.
177 ///
178 /// This method is will read the file at `path` and interpret the contents
179 /// to determine if it's the wasm text format or binary format. The file
180 /// extension of `file` is not consulted. The text format is automatically
181 /// converted to the binary format if the crate feature `wat` is active.
182 ///
183 /// # Errors
184 ///
185 /// In addition to the errors returned by [`CodeBuilder::wasm_binary_file`]
186 /// this may also fail if the text format is read and the syntax is invalid.
187 pub fn wasm_binary_or_text_file(&mut self, file: &'a Path) -> Result<&mut Self> {
188 #[cfg(feature = "wat")]
189 {
190 let wasm = wat::parse_file(file)?;
191 self.wasm_binary(wasm, Some(file))
192 }
193 #[cfg(not(feature = "wat"))]
194 {
195 self.wasm_binary_file(file)
196 }
197 }
198
199 /// Get the Wasm to be compiled.
200 ///
201 /// When using compile-time builtins, compose the builtins and the guest
202 /// Wasm together, before returning the Wasm.
203 pub(super) fn get_wasm(&self) -> Result<Cow<'_, [u8]>> {
204 let wasm = self
205 .wasm
206 .as_deref()
207 .ok_or_else(|| anyhow!("no wasm bytes have been configured"))?;
208
209 #[cfg(not(feature = "compile-time-builtins"))]
210 {
211 Ok(wasm.into())
212 }
213
214 #[cfg(feature = "compile-time-builtins")]
215 {
216 self.compose_compile_time_builtins(wasm)
217 .context("failed to compose compile-time builtins with the main Wasm")
218 }
219 }
220
221 /// Expose Wasmtime's unsafe intrinsics under the given import name.
222 ///
223 /// These intrinsics provide native memory loads and stores to Wasm; they
224 /// are *extremely* unsafe! If you are not absolutely sure that you need
225 /// these unsafe intrinsics, *do not use them!* See the safety section below
226 /// for details.
227 ///
228 /// This functionality is intended to be used when implementing
229 /// [compile-time builtins][CodeBuilder::compile_time_builtins_binary]; that
230 /// is, satisfying a Wasm import via special-cased, embedder-specific code
231 /// at compile time. You should never use these intrinsics to intentionally
232 /// subvert the Wasm sandbox. You should strive to implement safe functions
233 /// that encapsulate your uses of these intrinsics such that, regardless of
234 /// any value given as arguments, your functions *cannot* result in loading
235 /// from or storing to invalid pointers, or any other kind of unsafety. See
236 /// below for an example of the intended use cases.
237 ///
238 /// Wasmtime's unsafe intrinsics can only be exposed to Wasm components, not
239 /// core modules, currently.
240 ///
241 /// Note that when compile-time builtins are defined on a `CodeBuilder`,
242 /// only the compile-time builtins can import the unsafe intrinsics, and the
243 /// main guest program cannot import them.
244 ///
245 /// # Safety
246 ///
247 /// Extreme care must be taken when using these intrinsics.
248 ///
249 /// All loads of or stores to pointers derived from `store-data-address` are
250 /// inherently tied to a particular `T` type in a `Store<T>`. It is wildly
251 /// unsafe to run a Wasm program that uses unsafe intrinsics to access the
252 /// store's `T` inside a `Store<U>`. You must only run Wasm that uses unsafe
253 /// intrinsics in a `Store<T>` where the `T` is the type expected by the
254 /// Wasm's unsafe-intrinsics usage.
255 ///
256 /// Furthermore, usage of these intrinsics is not only tied to a particular
257 /// `T` type, but also to `T`'s layout on the host platform. The size and
258 /// alignment of `T`, the offsets of its fields, and those fields' size and
259 /// alignment can all vary across not only architecture but also operating
260 /// system. With care, you can define your `T` type such that its layout is
261 /// identical across the platforms that you run Wasm on, allowing you to
262 /// reuse the same Wasm binary and its unsafe-intrinsics usage on all your
263 /// platforms. Failing that, you must only run a Wasm program that uses
264 /// unsafe intrinsics on the host platform that its unsafe-intrinsic usage
265 /// is specialized to. See the portability section and example below for
266 /// more details.
267 ///
268 /// You are *strongly* encouraged to add assertions for the layout
269 /// properties that your unsafe-intrinsic usage's safety relies upon:
270 ///
271 /// ```rust
272 /// /// This type is used as `wasmtime::Store<MyData>` and accessed by Wasm via
273 /// /// unsafe intrinsics.
274 /// #[repr(C, align(8))]
275 /// struct MyData {
276 /// id: u64,
277 /// counter: u32,
278 /// buf: [u8; 4],
279 /// }
280 ///
281 /// // Assert that the layout is what our Wasm's unsafe-intrinsics usage expects.
282 /// static _MY_DATA_LAYOUT_ASSERTIONS: () = {
283 /// assert!(core::mem::size_of::<MyData>() == 16);
284 /// assert!(core::mem::align_of::<MyData>() == 8);
285 /// assert!(core::mem::offset_of!(MyData, id) == 0);
286 /// assert!(core::mem::offset_of!(MyData, counter) == 8);
287 /// assert!(core::mem::offset_of!(MyData, buf) == 12);
288 /// };
289 /// ```
290 ///
291 /// Finally, every pointer loaded from or stored to must:
292 ///
293 /// * Be non-null
294 ///
295 /// * Be aligned to the access type's natural alignment (e.g. 8-byte alignment
296 /// for `u64`, 4-byte alignment for `u32`, etc...)
297 ///
298 /// * Point to a memory block that is valid to read from (for loads) or
299 /// valid to write to (for stores) under Rust's pointer provenance rules
300 ///
301 /// * Point to a memory block that is at least as large as the access type's
302 /// natural size (e.g. 1 byte for `u8`, 2 bytes for `u16`, etc...)
303 ///
304 /// * Point to a memory block that is not accessed concurrently by any other
305 /// threads
306 ///
307 /// Failure to uphold any of these invariants will lead to unsafety,
308 /// undefined behavior, and/or data races.
309 ///
310 /// # Intrinsics
311 ///
312 /// | Name | Parameters | Results |
313 /// |----------------------|--------------|---------|
314 /// | `u8-native-load` | `u64` | `u8` |
315 /// | `u16-native-load` | `u64` | `u16` |
316 /// | `u32-native-load` | `u64` | `u32` |
317 /// | `u64-native-load` | `u64` | `u64` |
318 /// | `u8-native-store` | `u64`, `u8` | - |
319 /// | `u16-native-load` | `u64`, `u16` | - |
320 /// | `u32-native-load` | `u64`, `u32` | - |
321 /// | `u64-native-load` | `u64`, `u64` | - |
322 /// | `store-data-address` | - | `u64` |
323 ///
324 /// ## `*-native-load`
325 ///
326 /// These intrinsics perform an unsandboxed, unsynchronized load from native
327 /// memory, using the native endianness.
328 ///
329 /// ## `*-native-store`
330 ///
331 /// These intrinsics perform an unsandboxed, unsynchronized store to native
332 /// memory, using the native endianness.
333 ///
334 /// ## `store-data-address`
335 ///
336 /// This intrinsic function returns the pointer to the embedder's `T` data
337 /// inside a `Store<T>`.
338 ///
339 /// In general, all native load and store intinsics should operate on memory
340 /// addresses that are derived from a call to this intrinsic. If you want to
341 /// expose data for raw memory access by Wasm, put it inside the `T` in your
342 /// `Store<T>` and Wasm's access to that data should derive from this
343 /// intrinsic.
344 ///
345 /// # Portability
346 ///
347 /// Loads and stores are always performed using the architecture's native
348 /// endianness.
349 ///
350 /// Addresses passed to and returned from these intrinsics are always
351 /// 64-bits large. The upper half of the value is simply ignored on 32-bit
352 /// architectures.
353 ///
354 /// With care, you can design your store's `T` type such that accessing it
355 /// via these intrinsics is portable, and you can reuse a single Wasm binary
356 /// (and its set of intrinsic calls) across all of the platforms, with the
357 /// following rules of thumb:
358 ///
359 /// * Only access `u8`, `u16`, `u32`, and `u64` data via these intrinsics.
360 ///
361 /// * If you need to access other types of data, encode it into those types
362 /// and then access the encoded data from the intrinsics.
363 ///
364 /// * Use `union`s to encode pointers and pointer-sized data as a `u64` and
365 /// then access it via the `u64-native-{load,store}` intrinsics. See
366 /// `ExposedPointer` in the example below.
367 ///
368 /// # Example
369 ///
370 /// The following example shows how you can use unsafe intrinsics and
371 /// compile-time builtins to give Wasm direct zero-copy access to a host
372 /// buffer.
373 ///
374 /// ```rust
375 /// use std::mem;
376 /// use wasmtime::*;
377 ///
378 /// // A `*mut u8` pointer that is exposed directly to Wasm via unsafe intrinsics.
379 /// #[repr(align(8))]
380 /// union ExposedPointer {
381 /// pointer: *mut u8,
382 /// padding: u64,
383 /// }
384 ///
385 /// static _EXPOSED_POINTER_LAYOUT_ASSERTIONS: () = {
386 /// assert!(mem::size_of::<ExposedPointer>() == 8);
387 /// assert!(mem::align_of::<ExposedPointer>() == 8);
388 /// };
389 ///
390 /// impl ExposedPointer {
391 /// /// Wrap the given pointer into an `ExposedPointer`.
392 /// fn new(pointer: *mut u8) -> Self {
393 /// // NB: Zero-initialize to avoid potential footguns with accessing
394 /// // undefined bytes.
395 /// let mut p = Self { padding: 0 };
396 /// p.pointer = pointer;
397 /// p
398 /// }
399 ///
400 /// /// Get the wrapped pointer.
401 /// fn get(&self) -> *mut u8 {
402 /// unsafe { self.pointer }
403 /// }
404 /// }
405 ///
406 /// /// This is the `T` type we will put inside our
407 /// /// `wasmtime::Store<T>`s. It contains a pointer to a heap-allocated buffer
408 /// /// in host memory, which we will give Wasm zero-copy access to via unsafe
409 /// /// intrinsics.
410 /// #[repr(C)]
411 /// struct StoreData {
412 /// buf_ptr: ExposedPointer,
413 /// buf_len: u64,
414 /// }
415 ///
416 /// static _STORE_DATA_LAYOUT_ASSERTIONS: () = {
417 /// assert!(mem::size_of::<StoreData>() == 16);
418 /// assert!(mem::align_of::<StoreData>() == 8);
419 /// assert!(mem::offset_of!(StoreData, buf_ptr) == 0);
420 /// assert!(mem::offset_of!(StoreData, buf_len) == 8);
421 /// };
422 ///
423 /// impl Drop for StoreData {
424 /// fn drop(&mut self) {
425 /// let len = usize::try_from(self.buf_len).unwrap();
426 /// let ptr = std::ptr::slice_from_raw_parts_mut(self.buf_ptr.get(), len);
427 /// unsafe {
428 /// let _ = Box::from_raw(ptr);
429 /// }
430 /// }
431 /// }
432 ///
433 /// impl StoreData {
434 /// /// Create a new `StoreData`, allocating an inner buffer containing
435 /// /// `bytes`.
436 /// fn new(bytes: impl IntoIterator<Item = u8>) -> Self {
437 /// let buf: Box<[u8]> = bytes.into_iter().collect();
438 /// let ptr = Box::into_raw(buf);
439 /// Self {
440 /// buf_ptr: ExposedPointer::new(ptr.cast::<u8>()),
441 /// buf_len: u64::try_from(ptr.len()).unwrap(),
442 /// }
443 /// }
444 ///
445 /// /// Get the inner buffer as a shared slice.
446 /// fn buf(&self) -> &[u8] {
447 /// let ptr = self.buf_ptr.get().cast_const();
448 /// let len = usize::try_from(self.buf_len).unwrap();
449 /// unsafe {
450 /// std::slice::from_raw_parts(ptr, len)
451 /// }
452 /// }
453 /// }
454 ///
455 /// # fn main() -> Result<()> {
456 /// // Enable function inlining during compilation. If you are using unsafe intrinsics, you
457 /// // almost assuredly want them inlined to avoid function call overheads.
458 /// let mut config = Config::new();
459 /// config.compiler_inlining(true);
460 ///
461 /// let engine = Engine::new(&config)?;
462 /// let linker = wasmtime::component::Linker::new(&engine);
463 ///
464 /// // Create a new builder for configuring a Wasm compilation.
465 /// let mut builder = CodeBuilder::new(&engine);
466 ///
467 /// // Allow the code we are building to use Wasmtime's unsafe intrinsics.
468 /// //
469 /// // SAFETY: we wrap all usage of the intrinsics in safe APIs and only instantiate the code
470 /// // within a `Store<T>` where `T = StoreData`, as the code expects.
471 /// unsafe {
472 /// builder.expose_unsafe_intrinsics("unsafe-intrinsics");
473 /// }
474 ///
475 /// // Define the compile-time builtin that encapsulates the
476 /// // intrinsics' unsafety and builds a safe API on top of them.
477 /// unsafe {
478 /// builder.compile_time_builtins_binary_or_text(
479 /// "safe-api",
480 /// r#"
481 /// (component
482 /// (import "unsafe-intrinsics"
483 /// (instance $intrinsics
484 /// (export "store-data-address" (func (result u64)))
485 /// (export "u64-native-load" (func (param "pointer" u64) (result u64)))
486 /// (export "u8-native-load" (func (param "pointer" u64) (result u8)))
487 /// (export "u8-native-store" (func (param "pointer" u64) (param "value" u8)))
488 /// )
489 /// )
490 ///
491 /// ;; The core Wasm module that implements the safe API.
492 /// (core module $safe-api-impl
493 /// (import "" "store-data-address" (func $store-data-address (result i64)))
494 /// (import "" "u64-native-load" (func $u64-native-load (param i64) (result i64)))
495 /// (import "" "u8-native-load" (func $u8-native-load (param i64) (result i32)))
496 /// (import "" "u8-native-store" (func $u8-native-store (param i64 i32)))
497 ///
498 /// ;; Load the `StoreData::buf_ptr` field
499 /// (func $get-buf-ptr (result i64)
500 /// (call $u64-native-load (i64.add (call $store-data-address) (i64.const 0)))
501 /// )
502 ///
503 /// ;; Load the `StoreData::buf_len` field
504 /// (func $get-buf-len (result i64)
505 /// (call $u64-native-load (i64.add (call $store-data-address) (i64.const 8)))
506 /// )
507 ///
508 /// ;; Check that `$i` is within `StoreData` buffer's bounds, raising a trap
509 /// ;; otherwise.
510 /// (func $bounds-check (param $i i64)
511 /// (if (i64.lt_u (local.get $i) (call $get-buf-len))
512 /// (then (return))
513 /// (else (unreachable))
514 /// )
515 /// )
516 ///
517 /// ;; A safe function to get the `i`th byte from `StoreData`'s buffer,
518 /// ;; raising a trap on out-of-bounds accesses.
519 /// (func (export "get") (param $i i64) (result i32)
520 /// (call $bounds-check (local.get $i))
521 /// (call $u8-native-load (i64.add (call $get-buf-ptr) (local.get $i)))
522 /// )
523 ///
524 /// ;; A safe function to set the `i`th byte in `StoreData`'s buffer,
525 /// ;; raising a trap on out-of-bounds accesses.
526 /// (func (export "set") (param $i i64) (param $value i32)
527 /// (call $bounds-check (local.get $i))
528 /// (call $u8-native-store (i64.add (call $get-buf-ptr) (local.get $i))
529 /// (local.get $value))
530 /// )
531 ///
532 /// ;; A safe function to get the length of the `StoreData` buffer.
533 /// (func (export "len") (result i64)
534 /// (call $get-buf-len)
535 /// )
536 /// )
537 ///
538 /// ;; Lower the imported intrinsics from component functions to core functions.
539 /// (core func $store-data-address' (canon lower (func $intrinsics "store-data-address")))
540 /// (core func $u64-native-load' (canon lower (func $intrinsics "u64-native-load")))
541 /// (core func $u8-native-load' (canon lower (func $intrinsics "u8-native-load")))
542 /// (core func $u8-native-store' (canon lower (func $intrinsics "u8-native-store")))
543 ///
544 /// ;; Instantiate our safe API implementation, passing in the lowered unsafe
545 /// ;; intrinsics as its imports.
546 /// (core instance $instance
547 /// (instantiate $safe-api-impl
548 /// (with "" (instance
549 /// (export "store-data-address" (func $store-data-address'))
550 /// (export "u64-native-load" (func $u64-native-load'))
551 /// (export "u8-native-load" (func $u8-native-load'))
552 /// (export "u8-native-store" (func $u8-native-store'))
553 /// ))
554 /// )
555 /// )
556 ///
557 /// ;; Lift the safe API's exports from core functions to component functions
558 /// ;; and export them.
559 /// (func (export "get") (param "i" u64) (result u8)
560 /// (canon lift (core func $instance "get"))
561 /// )
562 /// (func (export "set") (param "i" u64) (param "value" u8)
563 /// (canon lift (core func $instance "set"))
564 /// )
565 /// (func (export "len") (result u64)
566 /// (canon lift (core func $instance "len"))
567 /// )
568 /// )
569 /// "#.as_bytes(),
570 /// None,
571 /// )?;
572 /// }
573 ///
574 /// // Provide the guest Wasm that we are compiling, which uses the safe API we
575 /// // implemented as a compile-time builtin.
576 /// builder.wasm_binary_or_text(
577 /// r#"
578 /// (component
579 /// ;; Import the safe API.
580 /// (import "safe-api"
581 /// (instance $safe-api
582 /// (export "get" (func (param "i" u64) (result u8)))
583 /// (export "set" (func (param "i" u64) (param "value" u8)))
584 /// (export "len" (func (result u64)))
585 /// )
586 /// )
587 ///
588 /// ;; Define this component's core module implementation.
589 /// (core module $main-impl
590 /// (import "" "get" (func $get (param i64) (result i32)))
591 /// (import "" "set" (func $set (param i64 i32)))
592 /// (import "" "len" (func $len (result i64)))
593 ///
594 /// (func (export "main")
595 /// (local $i i64)
596 /// (local $n i64)
597 ///
598 /// (local.set $i (i64.const 0))
599 /// (local.set $n (call $len))
600 ///
601 /// (loop $loop
602 /// ;; When we have iterated over every byte in the
603 /// ;; buffer, exit.
604 /// (if (i64.ge_u (local.get $i) (local.get $n))
605 /// (then (return)))
606 ///
607 /// ;; Increment the `i`th byte in the buffer.
608 /// (call $set (local.get $i)
609 /// (i32.add (call $get (local.get $i))
610 /// (i32.const 1)))
611 ///
612 /// ;; Increment `i` and continue to the next iteration
613 /// ;; of the loop.
614 /// (local.set $i (i64.add (local.get $i) (i64.const 1)))
615 /// (br $loop)
616 /// )
617 /// )
618 /// )
619 ///
620 /// ;; Lower the imported safe APIs from component functions to core functions.
621 /// (core func $get' (canon lower (func $safe-api "get")))
622 /// (core func $set' (canon lower (func $safe-api "set")))
623 /// (core func $len' (canon lower (func $safe-api "len")))
624 ///
625 /// ;; Instantiate our module, providing the lowered safe APIs as imports.
626 /// (core instance $instance
627 /// (instantiate $main-impl
628 /// (with "" (instance
629 /// (export "get" (func $get'))
630 /// (export "set" (func $set'))
631 /// (export "len" (func $len'))
632 /// ))
633 /// )
634 /// )
635 ///
636 /// ;; Lift the implementation's `main` from a core function to a component function
637 /// ;; and export it!
638 /// (func (export "main")
639 /// (canon lift (core func $instance "main"))
640 /// )
641 /// )
642 /// "#.as_bytes(),
643 /// None,
644 /// )?;
645 ///
646 /// // Finish the builder and compile the component.
647 /// let component = builder.compile_component()?;
648 ///
649 /// // Create a new `Store<StoreData>`, wrapping a buffer of the given elements.
650 /// let mut store = Store::new(&engine, StoreData::new([0, 10, 20, 30, 40, 50]));
651 ///
652 /// // Instantiate our component into the store.
653 /// let instance = linker.instantiate(&mut store, &component)?;
654 ///
655 /// // Get the instance's exported `main` function and call it.
656 /// instance
657 /// .get_typed_func::<(), ()>(&mut store, "main")?
658 /// .call(&mut store, ())?;
659 ///
660 /// // Our `StoreData`'s buffer had each element incremented directly from Wasm!
661 /// assert_eq!(store.data().buf(), &[1, 11, 21, 31, 41, 51]);
662 /// # Ok(())
663 /// # }
664 /// ```
665 pub unsafe fn expose_unsafe_intrinsics(&mut self, import_name: impl Into<String>) -> &mut Self {
666 self.unsafe_intrinsics_import = Some(import_name.into());
667 self
668 }
669
670 /// Explicitly specify DWARF `.dwp` path.
671 ///
672 /// # Errors
673 ///
674 /// This method will return an error if the `.dwp` file has already been set
675 /// through [`CodeBuilder::dwarf_package`] or auto-detection in
676 /// [`CodeBuilder::wasm_binary_file`].
677 ///
678 /// This method will also return an error if `file` cannot be read.
679 pub fn dwarf_package_file(&mut self, file: &Path) -> Result<&mut Self> {
680 if self.dwarf_package.is_some() {
681 bail!("cannot call `dwarf_package` or `dwarf_package_file` twice");
682 }
683
684 let dwarf_package = std::fs::read(file)
685 .with_context(|| format!("failed to read dwarf input file: {}", file.display()))?;
686 self.dwarf_package_path = Some(Cow::Owned(file.to_owned()));
687 self.dwarf_package = Some(dwarf_package.into());
688
689 Ok(self)
690 }
691
692 fn dwarf_package_from_wasm_path(&mut self) -> Result<&mut Self> {
693 let dwarf_package_path_buf = self.wasm_path.as_ref().unwrap().with_extension("dwp");
694 if dwarf_package_path_buf.exists() {
695 return self.dwarf_package_file(dwarf_package_path_buf.as_path());
696 }
697
698 Ok(self)
699 }
700
701 /// Gets the DWARF package.
702 pub(super) fn get_dwarf_package(&self) -> Option<&[u8]> {
703 self.dwarf_package.as_deref()
704 }
705
706 /// Set the DWARF package binary.
707 ///
708 /// Initializes `dwarf_package` from `dwp_bytes` in preparation for
709 /// DWARF fusion. Allows the DWARF package to be supplied as a byte array
710 /// when the file probing performed in `wasm_file` is not appropriate.
711 ///
712 /// # Errors
713 ///
714 /// Returns an error if the `*.dwp` file is already set via auto-probing in
715 /// [`CodeBuilder::wasm_binary_file`] or explicitly via
716 /// [`CodeBuilder::dwarf_package_file`].
717 pub fn dwarf_package(&mut self, dwp_bytes: &'a [u8]) -> Result<&mut Self> {
718 if self.dwarf_package.is_some() {
719 bail!("cannot call `dwarf_package` or `dwarf_package_file` twice");
720 }
721 self.dwarf_package = Some(dwp_bytes.into());
722 Ok(self)
723 }
724
725 /// Returns a hint, if possible, of what the provided bytes are.
726 ///
727 /// This method can be use to detect what the previously supplied bytes to
728 /// methods such as [`CodeBuilder::wasm_binary_or_text`] are. This will
729 /// return whether a module or a component was found in the provided bytes.
730 ///
731 /// This method will return `None` if wasm bytes have not been configured
732 /// or if the provided bytes don't look like either a component or a
733 /// module.
734 pub fn hint(&self) -> Option<CodeHint> {
735 let wasm = self.wasm.as_ref()?;
736 if wasmparser::Parser::is_component(wasm) {
737 Some(CodeHint::Component)
738 } else if wasmparser::Parser::is_core_wasm(wasm) {
739 Some(CodeHint::Module)
740 } else {
741 None
742 }
743 }
744
745 /// Finishes this compilation and produces a serialized list of bytes.
746 ///
747 /// This method requires that either [`CodeBuilder::wasm_binary`] or
748 /// related methods were invoked prior to indicate what is being compiled.
749 ///
750 /// This method will block the current thread until compilation has
751 /// finished, and when done the serialized artifact will be returned.
752 ///
753 /// Note that this method will never cache compilations, even if the
754 /// `cache` feature is enabled.
755 ///
756 /// # Errors
757 ///
758 /// This can fail if the input wasm module was not valid or if another
759 /// compilation-related error is encountered.
760 pub fn compile_module_serialized(&self) -> Result<Vec<u8>> {
761 ensure!(
762 self.unsafe_intrinsics_import.is_none(),
763 "`CodeBuilder::expose_unsafe_intrinsics` can only be used with components"
764 );
765
766 #[cfg(feature = "compile-time-builtins")]
767 ensure!(
768 self.get_compile_time_builtins().is_empty(),
769 "compile-time builtins can only be used with components"
770 );
771
772 let wasm = self.get_wasm()?;
773 let dwarf_package = self.get_dwarf_package();
774 let (v, _) =
775 super::build_module_artifacts(self.engine, &wasm, dwarf_package.as_deref(), &())?;
776 Ok(v)
777 }
778
779 /// Same as [`CodeBuilder::compile_module_serialized`] except that it
780 /// compiles a serialized [`Component`](crate::component::Component)
781 /// instead of a module.
782 #[cfg(feature = "component-model")]
783 pub fn compile_component_serialized(&self) -> Result<Vec<u8>> {
784 let wasm = self.get_wasm()?;
785 let (v, _) = super::build_component_artifacts(
786 self.engine,
787 &wasm,
788 None,
789 self.get_unsafe_intrinsics_import(),
790 &(),
791 )?;
792 Ok(v)
793 }
794
795 pub(super) fn get_unsafe_intrinsics_import(&self) -> Option<&str> {
796 self.unsafe_intrinsics_import.as_deref()
797 }
798}
799
800/// This is a helper struct used when caching to hash the state of an `Engine`
801/// used for module compilation.
802///
803/// The hash computed for this structure is used to key the global wasmtime
804/// cache and dictates whether artifacts are reused. Consequently the contents
805/// of this hash dictate when artifacts are or aren't re-used.
806pub struct HashedEngineCompileEnv<'a>(pub &'a Engine);
807
808impl std::hash::Hash for HashedEngineCompileEnv<'_> {
809 fn hash<H: std::hash::Hasher>(&self, hasher: &mut H) {
810 // Hash the compiler's state based on its target and configuration.
811 let compiler = self.0.compiler();
812 compiler.triple().hash(hasher);
813 compiler.flags().hash(hasher);
814 compiler.isa_flags().hash(hasher);
815
816 // Hash configuration state read for compilation
817 let config = self.0.config();
818 self.0.tunables().hash(hasher);
819 self.0.features().hash(hasher);
820 config.wmemcheck.hash(hasher);
821
822 // Catch accidental bugs of reusing across crate versions.
823 config.module_version.hash(hasher);
824 }
825}