wasmtime_environ/
gc.rs

1//! Target- and pointer-width-agnostic definitions of GC-related types and
2//! constants.
3//!
4//! These definitions are suitable for use both during compilation and at
5//! runtime.
6//!
7//! Note: We don't bother gating these on `cfg(feature = "gc")` because that
8//! makes downstream uses pretty annoying, and the primary thing we want to gate
9//! on our various `gc` cargo features is the actual garbage collection
10//! functions and their associated impact on binary size anyways.
11
12#[cfg(feature = "gc-drc")]
13pub mod drc;
14
15#[cfg(feature = "gc-null")]
16pub mod null;
17
18use crate::prelude::*;
19use crate::{
20    WasmArrayType, WasmCompositeInnerType, WasmCompositeType, WasmStorageType, WasmStructType,
21    WasmValType,
22};
23use core::alloc::Layout;
24
25/// Discriminant to check whether GC reference is an `i31ref` or not.
26pub const I31_DISCRIMINANT: u32 = 1;
27
28/// The size of the `VMGcHeader` in bytes.
29pub const VM_GC_HEADER_SIZE: u32 = 8;
30
31/// The minimum alignment of the `VMGcHeader` in bytes.
32pub const VM_GC_HEADER_ALIGN: u32 = 8;
33
34/// The offset of the `VMGcKind` field in the `VMGcHeader`.
35pub const VM_GC_HEADER_KIND_OFFSET: u32 = 0;
36
37/// The offset of the `VMSharedTypeIndex` field in the `VMGcHeader`.
38pub const VM_GC_HEADER_TYPE_INDEX_OFFSET: u32 = 4;
39
40/// Get the byte size of the given Wasm type when it is stored inside the GC
41/// heap.
42pub fn byte_size_of_wasm_ty_in_gc_heap(ty: &WasmStorageType) -> u32 {
43    match ty {
44        WasmStorageType::I8 => 1,
45        WasmStorageType::I16 => 2,
46        WasmStorageType::Val(ty) => match ty {
47            WasmValType::I32 | WasmValType::F32 | WasmValType::Ref(_) => 4,
48            WasmValType::I64 | WasmValType::F64 => 8,
49            WasmValType::V128 => 16,
50        },
51    }
52}
53
54/// Align `offset` up to `bytes`, updating `max_align` if `align` is the
55/// new maximum alignment, and returning the aligned offset.
56#[cfg(any(feature = "gc-drc", feature = "gc-null"))]
57fn align_up(offset: &mut u32, max_align: &mut u32, align: u32) -> u32 {
58    debug_assert!(max_align.is_power_of_two());
59    debug_assert!(align.is_power_of_two());
60    *offset = offset.checked_add(align - 1).unwrap() & !(align - 1);
61    *max_align = core::cmp::max(*max_align, align);
62    *offset
63}
64
65/// Define a new field of size and alignment `bytes`, updating the object's
66/// total `size` and `align` as necessary. The offset of the new field is
67/// returned.
68#[cfg(any(feature = "gc-drc", feature = "gc-null"))]
69fn field(size: &mut u32, align: &mut u32, bytes: u32) -> u32 {
70    let offset = align_up(size, align, bytes);
71    *size += bytes;
72    offset
73}
74
75/// Common code to define a GC array's layout, given the size and alignment of
76/// the collector's GC header and its expected offset of the array length field.
77#[cfg(any(feature = "gc-drc", feature = "gc-null"))]
78fn common_array_layout(
79    ty: &WasmArrayType,
80    header_size: u32,
81    header_align: u32,
82    expected_array_length_offset: u32,
83) -> GcArrayLayout {
84    use core::mem;
85
86    assert!(header_size >= crate::VM_GC_HEADER_SIZE);
87    assert!(header_align >= crate::VM_GC_HEADER_ALIGN);
88
89    let mut size = header_size;
90    let mut align = header_align;
91
92    let length_field_size = u32::try_from(mem::size_of::<u32>()).unwrap();
93    let length_field_offset = field(&mut size, &mut align, length_field_size);
94    assert_eq!(length_field_offset, expected_array_length_offset);
95
96    let elem_size = byte_size_of_wasm_ty_in_gc_heap(&ty.0.element_type);
97    let elems_offset = align_up(&mut size, &mut align, elem_size);
98    assert_eq!(elems_offset, size);
99
100    let elems_are_gc_refs = ty.0.element_type.is_vmgcref_type_and_not_i31();
101    if elems_are_gc_refs {
102        debug_assert_eq!(
103            length_field_offset + length_field_size,
104            elems_offset,
105            "DRC collector relies on GC ref elements appearing directly after the length field, without any padding",
106        );
107    }
108
109    GcArrayLayout {
110        base_size: size,
111        align,
112        elem_size,
113        elems_are_gc_refs,
114    }
115}
116
117/// Common code to define a GC struct's layout, given the size and alignment of
118/// the collector's GC header and its expected offset of the array length field.
119#[cfg(any(feature = "gc-null", feature = "gc-drc"))]
120fn common_struct_layout(
121    ty: &WasmStructType,
122    header_size: u32,
123    header_align: u32,
124) -> GcStructLayout {
125    assert!(header_size >= crate::VM_GC_HEADER_SIZE);
126    assert!(header_align >= crate::VM_GC_HEADER_ALIGN);
127
128    // Process each field, aligning it to its natural alignment.
129    //
130    // We don't try and do any fancy field reordering to minimize padding (yet?)
131    // because (a) the toolchain probably already did that and (b) we're just
132    // doing the simple thing first, and (c) this is tricky in the presence of
133    // subtyping where we need a subtype's fields to be assigned the same
134    // offsets as its supertype's fields. We can come back and improve things
135    // here if we find that (a) isn't actually holding true in practice.
136    let mut size = header_size;
137    let mut align = header_align;
138
139    let fields = ty
140        .fields
141        .iter()
142        .map(|f| {
143            let field_size = byte_size_of_wasm_ty_in_gc_heap(&f.element_type);
144            let offset = field(&mut size, &mut align, field_size);
145            let is_gc_ref = f.element_type.is_vmgcref_type_and_not_i31();
146            GcStructLayoutField { offset, is_gc_ref }
147        })
148        .collect();
149
150    // Ensure that the final size is a multiple of the alignment, for
151    // simplicity.
152    let align_size_to = align;
153    align_up(&mut size, &mut align, align_size_to);
154
155    GcStructLayout {
156        size,
157        align,
158        fields,
159    }
160}
161
162/// A trait for getting the layout of a Wasm GC struct or array inside a
163/// particular collector.
164pub trait GcTypeLayouts {
165    /// The offset of an array's length field.
166    ///
167    /// This must be the same for all arrays in the heap, regardless of their
168    /// element type.
169    fn array_length_field_offset(&self) -> u32;
170
171    /// Get this collector's layout for the given composite type.
172    ///
173    /// Returns `None` if the type is a function type, as functions are not
174    /// managed by the GC.
175    fn gc_layout(&self, ty: &WasmCompositeType) -> Option<GcLayout> {
176        assert!(!ty.shared);
177        match &ty.inner {
178            WasmCompositeInnerType::Array(ty) => Some(self.array_layout(ty).into()),
179            WasmCompositeInnerType::Struct(ty) => Some(self.struct_layout(ty).into()),
180            WasmCompositeInnerType::Func(_) => None,
181            WasmCompositeInnerType::Cont(_) => None,
182        }
183    }
184
185    /// Get this collector's layout for the given array type.
186    fn array_layout(&self, ty: &WasmArrayType) -> GcArrayLayout;
187
188    /// Get this collector's layout for the given struct type.
189    fn struct_layout(&self, ty: &WasmStructType) -> GcStructLayout;
190}
191
192/// The layout of a GC-managed object.
193#[derive(Clone, Debug)]
194pub enum GcLayout {
195    /// The layout of a GC-managed array object.
196    Array(GcArrayLayout),
197
198    /// The layout of a GC-managed struct object.
199    Struct(GcStructLayout),
200}
201
202impl From<GcArrayLayout> for GcLayout {
203    fn from(layout: GcArrayLayout) -> Self {
204        Self::Array(layout)
205    }
206}
207
208impl From<GcStructLayout> for GcLayout {
209    fn from(layout: GcStructLayout) -> Self {
210        Self::Struct(layout)
211    }
212}
213
214impl GcLayout {
215    /// Get the underlying `GcStructLayout`, or panic.
216    #[track_caller]
217    pub fn unwrap_struct(&self) -> &GcStructLayout {
218        match self {
219            Self::Struct(s) => s,
220            _ => panic!("GcLayout::unwrap_struct on non-struct GC layout"),
221        }
222    }
223
224    /// Get the underlying `GcArrayLayout`, or panic.
225    #[track_caller]
226    pub fn unwrap_array(&self) -> &GcArrayLayout {
227        match self {
228            Self::Array(a) => a,
229            _ => panic!("GcLayout::unwrap_array on non-array GC layout"),
230        }
231    }
232}
233
234/// The layout of a GC-managed array.
235///
236/// This layout is only valid for use with the GC runtime that created it. It is
237/// not valid to use one GC runtime's layout with another GC runtime, doing so
238/// is memory safe but will lead to general incorrectness like panics and wrong
239/// results.
240///
241/// All offsets are from the start of the object; that is, the size of the GC
242/// header (for example) is included in the offset.
243///
244/// All arrays are composed of the generic `VMGcHeader`, followed by
245/// collector-specific fields, followed by the contiguous array elements
246/// themselves. The array elements must be aligned to the element type's natural
247/// alignment.
248#[derive(Clone, Debug)]
249pub struct GcArrayLayout {
250    /// The size of this array object, without any elements.
251    ///
252    /// The array's elements, if any, must begin at exactly this offset.
253    pub base_size: u32,
254
255    /// The alignment of this array.
256    pub align: u32,
257
258    /// The size and natural alignment of each element in this array.
259    pub elem_size: u32,
260
261    /// Whether or not the elements of this array are GC references or not.
262    pub elems_are_gc_refs: bool,
263}
264
265impl GcArrayLayout {
266    /// Get the total size of this array for a given length of elements.
267    #[inline]
268    pub fn size_for_len(&self, len: u32) -> u32 {
269        self.elem_offset(len)
270    }
271
272    /// Get the offset of the `i`th element in an array with this layout.
273    #[inline]
274    pub fn elem_offset(&self, i: u32) -> u32 {
275        self.base_size + i * self.elem_size
276    }
277
278    /// Get a `core::alloc::Layout` for an array of this type with the given
279    /// length.
280    pub fn layout(&self, len: u32) -> Layout {
281        let size = self.size_for_len(len);
282        let size = usize::try_from(size).unwrap();
283        let align = usize::try_from(self.align).unwrap();
284        Layout::from_size_align(size, align).unwrap()
285    }
286}
287
288/// The layout for a GC-managed struct type.
289///
290/// This layout is only valid for use with the GC runtime that created it. It is
291/// not valid to use one GC runtime's layout with another GC runtime, doing so
292/// is memory safe but will lead to general incorrectness like panics and wrong
293/// results.
294///
295/// All offsets are from the start of the object; that is, the size of the GC
296/// header (for example) is included in the offset.
297#[derive(Clone, Debug)]
298pub struct GcStructLayout {
299    /// The size (in bytes) of this struct.
300    pub size: u32,
301
302    /// The alignment (in bytes) of this struct.
303    pub align: u32,
304
305    /// The fields of this struct. The `i`th entry contains information about
306    /// the `i`th struct field's layout.
307    pub fields: Vec<GcStructLayoutField>,
308}
309
310impl GcStructLayout {
311    /// Get a `core::alloc::Layout` for a struct of this type.
312    pub fn layout(&self) -> Layout {
313        let size = usize::try_from(self.size).unwrap();
314        let align = usize::try_from(self.align).unwrap();
315        Layout::from_size_align(size, align).unwrap()
316    }
317}
318
319/// A field in a `GcStructLayout`.
320#[derive(Clone, Copy, Debug)]
321pub struct GcStructLayoutField {
322    /// The offset (in bytes) of this field inside instances of this type.
323    pub offset: u32,
324
325    /// Whether or not this field might contain a reference to another GC
326    /// object.
327    ///
328    /// Note: it is okay for this to be `false` for `i31ref`s, since they never
329    /// actually reference another GC object.
330    pub is_gc_ref: bool,
331}
332
333/// The kind of an object in a GC heap.
334///
335/// Note that this type is accessed from Wasm JIT code.
336///
337/// `VMGcKind` is a bitset where to test if `a` is a subtype of an
338/// "abstract-ish" type `b`, we can simply use a single bitwise-and operation:
339///
340/// ```ignore
341/// a <: b   iff   a & b == b
342/// ```
343///
344/// For example, because `VMGcKind::AnyRef` has the high bit set, every kind
345/// representing some subtype of `anyref` also has its high bit set.
346///
347/// We say "abstract-ish" type because in addition to the abstract heap types
348/// (other than `i31`) we also have variants for `externref`s that have been
349/// converted into an `anyref` via `extern.convert_any` and `externref`s that
350/// have been converted into an `anyref` via `any.convert_extern`. Note that in
351/// the latter case, because `any.convert_extern $foo` produces a value that is
352/// not an instance of `eqref`, `VMGcKind::AnyOfExternRef & VMGcKind::EqRef !=
353/// VMGcKind::EqRef`.
354///
355/// Furthermore, this type only uses the highest 6 bits of its `u32`
356/// representation, allowing the lower 27 bytes to be bitpacked with other stuff
357/// as users see fit.
358#[repr(u32)]
359#[derive(Clone, Copy, Debug, PartialEq, Eq)]
360#[rustfmt::skip]
361#[expect(missing_docs, reason = "self-describing variants")]
362pub enum VMGcKind {
363    ExternRef      = 0b01000 << 27,
364    AnyRef         = 0b10000 << 27,
365    EqRef          = 0b10100 << 27,
366    ArrayRef       = 0b10101 << 27,
367    StructRef      = 0b10110 << 27,
368}
369
370impl VMGcKind {
371    /// Mask this value with a `u32` to get just the bits that `VMGcKind` uses.
372    pub const MASK: u32 = 0b11111 << 27;
373
374    /// Mask this value with a `u32` that potentially contains a `VMGcKind` to
375    /// get the bits that `VMGcKind` doesn't use.
376    pub const UNUSED_MASK: u32 = !Self::MASK;
377
378    /// Does the given value fit in the unused bits of a `VMGcKind`?
379    #[inline]
380    pub fn value_fits_in_unused_bits(value: u32) -> bool {
381        (value & Self::UNUSED_MASK) == value
382    }
383
384    /// Convert the given value into a `VMGcKind` by masking off the unused
385    /// bottom bits.
386    #[inline]
387    pub fn from_high_bits_of_u32(val: u32) -> VMGcKind {
388        let masked = val & Self::MASK;
389        match masked {
390            x if x == Self::ExternRef.as_u32() => Self::ExternRef,
391            x if x == Self::AnyRef.as_u32() => Self::AnyRef,
392            x if x == Self::EqRef.as_u32() => Self::EqRef,
393            x if x == Self::ArrayRef.as_u32() => Self::ArrayRef,
394            x if x == Self::StructRef.as_u32() => Self::StructRef,
395            _ => panic!("invalid `VMGcKind`: {masked:#032b}"),
396        }
397    }
398
399    /// Does this kind match the other kind?
400    ///
401    /// That is, is this kind a subtype of the other kind?
402    #[inline]
403    pub fn matches(self, other: Self) -> bool {
404        (self.as_u32() & other.as_u32()) == other.as_u32()
405    }
406
407    /// Get this `VMGcKind` as a raw `u32`.
408    #[inline]
409    pub fn as_u32(self) -> u32 {
410        self as u32
411    }
412}
413
414#[cfg(test)]
415mod tests {
416    use super::VMGcKind::*;
417    use crate::prelude::*;
418
419    #[test]
420    fn kind_matches() {
421        let all = [ExternRef, AnyRef, EqRef, ArrayRef, StructRef];
422
423        for (sup, subs) in [
424            (ExternRef, vec![]),
425            (AnyRef, vec![EqRef, ArrayRef, StructRef]),
426            (EqRef, vec![ArrayRef, StructRef]),
427            (ArrayRef, vec![]),
428            (StructRef, vec![]),
429        ] {
430            assert!(sup.matches(sup));
431            for sub in &subs {
432                assert!(sub.matches(sup));
433            }
434            for kind in all.iter().filter(|k| **k != sup && !subs.contains(k)) {
435                assert!(!kind.matches(sup));
436            }
437        }
438    }
439}