wasmtime_environ/gc.rs
1//! Target- and pointer-width-agnostic definitions of GC-related types and
2//! constants.
3//!
4//! These definitions are suitable for use both during compilation and at
5//! runtime.
6//!
7//! Note: We don't bother gating these on `cfg(feature = "gc")` because that
8//! makes downstream uses pretty annoying, and the primary thing we want to gate
9//! on our various `gc` cargo features is the actual garbage collection
10//! functions and their associated impact on binary size anyways.
11
12#[cfg(feature = "gc-drc")]
13pub mod drc;
14
15#[cfg(feature = "gc-null")]
16pub mod null;
17
18use crate::prelude::*;
19use crate::{
20 WasmArrayType, WasmCompositeInnerType, WasmCompositeType, WasmStorageType, WasmStructType,
21 WasmValType,
22};
23use core::alloc::Layout;
24
25/// Discriminant to check whether GC reference is an `i31ref` or not.
26pub const I31_DISCRIMINANT: u32 = 1;
27
28/// The size of the `VMGcHeader` in bytes.
29pub const VM_GC_HEADER_SIZE: u32 = 8;
30
31/// The minimum alignment of the `VMGcHeader` in bytes.
32pub const VM_GC_HEADER_ALIGN: u32 = 8;
33
34/// The offset of the `VMGcKind` field in the `VMGcHeader`.
35pub const VM_GC_HEADER_KIND_OFFSET: u32 = 0;
36
37/// The offset of the `VMSharedTypeIndex` field in the `VMGcHeader`.
38pub const VM_GC_HEADER_TYPE_INDEX_OFFSET: u32 = 4;
39
40/// Get the byte size of the given Wasm type when it is stored inside the GC
41/// heap.
42pub fn byte_size_of_wasm_ty_in_gc_heap(ty: &WasmStorageType) -> u32 {
43 match ty {
44 WasmStorageType::I8 => 1,
45 WasmStorageType::I16 => 2,
46 WasmStorageType::Val(ty) => match ty {
47 WasmValType::I32 | WasmValType::F32 | WasmValType::Ref(_) => 4,
48 WasmValType::I64 | WasmValType::F64 => 8,
49 WasmValType::V128 => 16,
50 },
51 }
52}
53
54/// Align `offset` up to `bytes`, updating `max_align` if `align` is the
55/// new maximum alignment, and returning the aligned offset.
56#[cfg(any(feature = "gc-drc", feature = "gc-null"))]
57fn align_up(offset: &mut u32, max_align: &mut u32, align: u32) -> u32 {
58 debug_assert!(max_align.is_power_of_two());
59 debug_assert!(align.is_power_of_two());
60 *offset = offset.checked_add(align - 1).unwrap() & !(align - 1);
61 *max_align = core::cmp::max(*max_align, align);
62 *offset
63}
64
65/// Define a new field of size and alignment `bytes`, updating the object's
66/// total `size` and `align` as necessary. The offset of the new field is
67/// returned.
68#[cfg(any(feature = "gc-drc", feature = "gc-null"))]
69fn field(size: &mut u32, align: &mut u32, bytes: u32) -> u32 {
70 let offset = align_up(size, align, bytes);
71 *size += bytes;
72 offset
73}
74
75/// Common code to define a GC array's layout, given the size and alignment of
76/// the collector's GC header and its expected offset of the array length field.
77#[cfg(any(feature = "gc-drc", feature = "gc-null"))]
78fn common_array_layout(
79 ty: &WasmArrayType,
80 header_size: u32,
81 header_align: u32,
82 expected_array_length_offset: u32,
83) -> GcArrayLayout {
84 use core::mem;
85
86 assert!(header_size >= crate::VM_GC_HEADER_SIZE);
87 assert!(header_align >= crate::VM_GC_HEADER_ALIGN);
88
89 let mut size = header_size;
90 let mut align = header_align;
91
92 let length_field_size = u32::try_from(mem::size_of::<u32>()).unwrap();
93 let length_field_offset = field(&mut size, &mut align, length_field_size);
94 assert_eq!(length_field_offset, expected_array_length_offset);
95
96 let elem_size = byte_size_of_wasm_ty_in_gc_heap(&ty.0.element_type);
97 let elems_offset = align_up(&mut size, &mut align, elem_size);
98 assert_eq!(elems_offset, size);
99
100 let elems_are_gc_refs = ty.0.element_type.is_vmgcref_type_and_not_i31();
101 if elems_are_gc_refs {
102 debug_assert_eq!(
103 length_field_offset + length_field_size,
104 elems_offset,
105 "DRC collector relies on GC ref elements appearing directly after the length field, without any padding",
106 );
107 }
108
109 GcArrayLayout {
110 base_size: size,
111 align,
112 elem_size,
113 elems_are_gc_refs,
114 }
115}
116
117/// Common code to define a GC struct's layout, given the size and alignment of
118/// the collector's GC header and its expected offset of the array length field.
119#[cfg(any(feature = "gc-null", feature = "gc-drc"))]
120fn common_struct_layout(
121 ty: &WasmStructType,
122 header_size: u32,
123 header_align: u32,
124) -> GcStructLayout {
125 assert!(header_size >= crate::VM_GC_HEADER_SIZE);
126 assert!(header_align >= crate::VM_GC_HEADER_ALIGN);
127
128 // Process each field, aligning it to its natural alignment.
129 //
130 // We don't try and do any fancy field reordering to minimize padding (yet?)
131 // because (a) the toolchain probably already did that and (b) we're just
132 // doing the simple thing first, and (c) this is tricky in the presence of
133 // subtyping where we need a subtype's fields to be assigned the same
134 // offsets as its supertype's fields. We can come back and improve things
135 // here if we find that (a) isn't actually holding true in practice.
136 let mut size = header_size;
137 let mut align = header_align;
138
139 let fields = ty
140 .fields
141 .iter()
142 .map(|f| {
143 let field_size = byte_size_of_wasm_ty_in_gc_heap(&f.element_type);
144 let offset = field(&mut size, &mut align, field_size);
145 let is_gc_ref = f.element_type.is_vmgcref_type_and_not_i31();
146 GcStructLayoutField { offset, is_gc_ref }
147 })
148 .collect();
149
150 // Ensure that the final size is a multiple of the alignment, for
151 // simplicity.
152 let align_size_to = align;
153 align_up(&mut size, &mut align, align_size_to);
154
155 GcStructLayout {
156 size,
157 align,
158 fields,
159 }
160}
161
162/// A trait for getting the layout of a Wasm GC struct or array inside a
163/// particular collector.
164pub trait GcTypeLayouts {
165 /// The offset of an array's length field.
166 ///
167 /// This must be the same for all arrays in the heap, regardless of their
168 /// element type.
169 fn array_length_field_offset(&self) -> u32;
170
171 /// Get this collector's layout for the given composite type.
172 ///
173 /// Returns `None` if the type is a function type, as functions are not
174 /// managed by the GC.
175 fn gc_layout(&self, ty: &WasmCompositeType) -> Option<GcLayout> {
176 assert!(!ty.shared);
177 match &ty.inner {
178 WasmCompositeInnerType::Array(ty) => Some(self.array_layout(ty).into()),
179 WasmCompositeInnerType::Struct(ty) => Some(self.struct_layout(ty).into()),
180 WasmCompositeInnerType::Func(_) => None,
181 WasmCompositeInnerType::Cont(_) => None,
182 }
183 }
184
185 /// Get this collector's layout for the given array type.
186 fn array_layout(&self, ty: &WasmArrayType) -> GcArrayLayout;
187
188 /// Get this collector's layout for the given struct type.
189 fn struct_layout(&self, ty: &WasmStructType) -> GcStructLayout;
190}
191
192/// The layout of a GC-managed object.
193#[derive(Clone, Debug)]
194pub enum GcLayout {
195 /// The layout of a GC-managed array object.
196 Array(GcArrayLayout),
197
198 /// The layout of a GC-managed struct object.
199 Struct(GcStructLayout),
200}
201
202impl From<GcArrayLayout> for GcLayout {
203 fn from(layout: GcArrayLayout) -> Self {
204 Self::Array(layout)
205 }
206}
207
208impl From<GcStructLayout> for GcLayout {
209 fn from(layout: GcStructLayout) -> Self {
210 Self::Struct(layout)
211 }
212}
213
214impl GcLayout {
215 /// Get the underlying `GcStructLayout`, or panic.
216 #[track_caller]
217 pub fn unwrap_struct(&self) -> &GcStructLayout {
218 match self {
219 Self::Struct(s) => s,
220 _ => panic!("GcLayout::unwrap_struct on non-struct GC layout"),
221 }
222 }
223
224 /// Get the underlying `GcArrayLayout`, or panic.
225 #[track_caller]
226 pub fn unwrap_array(&self) -> &GcArrayLayout {
227 match self {
228 Self::Array(a) => a,
229 _ => panic!("GcLayout::unwrap_array on non-array GC layout"),
230 }
231 }
232}
233
234/// The layout of a GC-managed array.
235///
236/// This layout is only valid for use with the GC runtime that created it. It is
237/// not valid to use one GC runtime's layout with another GC runtime, doing so
238/// is memory safe but will lead to general incorrectness like panics and wrong
239/// results.
240///
241/// All offsets are from the start of the object; that is, the size of the GC
242/// header (for example) is included in the offset.
243///
244/// All arrays are composed of the generic `VMGcHeader`, followed by
245/// collector-specific fields, followed by the contiguous array elements
246/// themselves. The array elements must be aligned to the element type's natural
247/// alignment.
248#[derive(Clone, Debug)]
249pub struct GcArrayLayout {
250 /// The size of this array object, without any elements.
251 ///
252 /// The array's elements, if any, must begin at exactly this offset.
253 pub base_size: u32,
254
255 /// The alignment of this array.
256 pub align: u32,
257
258 /// The size and natural alignment of each element in this array.
259 pub elem_size: u32,
260
261 /// Whether or not the elements of this array are GC references or not.
262 pub elems_are_gc_refs: bool,
263}
264
265impl GcArrayLayout {
266 /// Get the total size of this array for a given length of elements.
267 #[inline]
268 pub fn size_for_len(&self, len: u32) -> u32 {
269 self.elem_offset(len)
270 }
271
272 /// Get the offset of the `i`th element in an array with this layout.
273 #[inline]
274 pub fn elem_offset(&self, i: u32) -> u32 {
275 self.base_size + i * self.elem_size
276 }
277
278 /// Get a `core::alloc::Layout` for an array of this type with the given
279 /// length.
280 pub fn layout(&self, len: u32) -> Layout {
281 let size = self.size_for_len(len);
282 let size = usize::try_from(size).unwrap();
283 let align = usize::try_from(self.align).unwrap();
284 Layout::from_size_align(size, align).unwrap()
285 }
286}
287
288/// The layout for a GC-managed struct type.
289///
290/// This layout is only valid for use with the GC runtime that created it. It is
291/// not valid to use one GC runtime's layout with another GC runtime, doing so
292/// is memory safe but will lead to general incorrectness like panics and wrong
293/// results.
294///
295/// All offsets are from the start of the object; that is, the size of the GC
296/// header (for example) is included in the offset.
297#[derive(Clone, Debug)]
298pub struct GcStructLayout {
299 /// The size (in bytes) of this struct.
300 pub size: u32,
301
302 /// The alignment (in bytes) of this struct.
303 pub align: u32,
304
305 /// The fields of this struct. The `i`th entry contains information about
306 /// the `i`th struct field's layout.
307 pub fields: Vec<GcStructLayoutField>,
308}
309
310impl GcStructLayout {
311 /// Get a `core::alloc::Layout` for a struct of this type.
312 pub fn layout(&self) -> Layout {
313 let size = usize::try_from(self.size).unwrap();
314 let align = usize::try_from(self.align).unwrap();
315 Layout::from_size_align(size, align).unwrap()
316 }
317}
318
319/// A field in a `GcStructLayout`.
320#[derive(Clone, Copy, Debug)]
321pub struct GcStructLayoutField {
322 /// The offset (in bytes) of this field inside instances of this type.
323 pub offset: u32,
324
325 /// Whether or not this field might contain a reference to another GC
326 /// object.
327 ///
328 /// Note: it is okay for this to be `false` for `i31ref`s, since they never
329 /// actually reference another GC object.
330 pub is_gc_ref: bool,
331}
332
333/// The kind of an object in a GC heap.
334///
335/// Note that this type is accessed from Wasm JIT code.
336///
337/// `VMGcKind` is a bitset where to test if `a` is a subtype of an
338/// "abstract-ish" type `b`, we can simply use a single bitwise-and operation:
339///
340/// ```ignore
341/// a <: b iff a & b == b
342/// ```
343///
344/// For example, because `VMGcKind::AnyRef` has the high bit set, every kind
345/// representing some subtype of `anyref` also has its high bit set.
346///
347/// We say "abstract-ish" type because in addition to the abstract heap types
348/// (other than `i31`) we also have variants for `externref`s that have been
349/// converted into an `anyref` via `extern.convert_any` and `externref`s that
350/// have been converted into an `anyref` via `any.convert_extern`. Note that in
351/// the latter case, because `any.convert_extern $foo` produces a value that is
352/// not an instance of `eqref`, `VMGcKind::AnyOfExternRef & VMGcKind::EqRef !=
353/// VMGcKind::EqRef`.
354///
355/// Furthermore, this type only uses the highest 6 bits of its `u32`
356/// representation, allowing the lower 27 bytes to be bitpacked with other stuff
357/// as users see fit.
358#[repr(u32)]
359#[derive(Clone, Copy, Debug, PartialEq, Eq)]
360#[rustfmt::skip]
361#[expect(missing_docs, reason = "self-describing variants")]
362pub enum VMGcKind {
363 ExternRef = 0b01000 << 27,
364 AnyRef = 0b10000 << 27,
365 EqRef = 0b10100 << 27,
366 ArrayRef = 0b10101 << 27,
367 StructRef = 0b10110 << 27,
368}
369
370impl VMGcKind {
371 /// Mask this value with a `u32` to get just the bits that `VMGcKind` uses.
372 pub const MASK: u32 = 0b11111 << 27;
373
374 /// Mask this value with a `u32` that potentially contains a `VMGcKind` to
375 /// get the bits that `VMGcKind` doesn't use.
376 pub const UNUSED_MASK: u32 = !Self::MASK;
377
378 /// Does the given value fit in the unused bits of a `VMGcKind`?
379 #[inline]
380 pub fn value_fits_in_unused_bits(value: u32) -> bool {
381 (value & Self::UNUSED_MASK) == value
382 }
383
384 /// Convert the given value into a `VMGcKind` by masking off the unused
385 /// bottom bits.
386 #[inline]
387 pub fn from_high_bits_of_u32(val: u32) -> VMGcKind {
388 let masked = val & Self::MASK;
389 match masked {
390 x if x == Self::ExternRef.as_u32() => Self::ExternRef,
391 x if x == Self::AnyRef.as_u32() => Self::AnyRef,
392 x if x == Self::EqRef.as_u32() => Self::EqRef,
393 x if x == Self::ArrayRef.as_u32() => Self::ArrayRef,
394 x if x == Self::StructRef.as_u32() => Self::StructRef,
395 _ => panic!("invalid `VMGcKind`: {masked:#032b}"),
396 }
397 }
398
399 /// Does this kind match the other kind?
400 ///
401 /// That is, is this kind a subtype of the other kind?
402 #[inline]
403 pub fn matches(self, other: Self) -> bool {
404 (self.as_u32() & other.as_u32()) == other.as_u32()
405 }
406
407 /// Get this `VMGcKind` as a raw `u32`.
408 #[inline]
409 pub fn as_u32(self) -> u32 {
410 self as u32
411 }
412}
413
414#[cfg(test)]
415mod tests {
416 use super::VMGcKind::*;
417 use crate::prelude::*;
418
419 #[test]
420 fn kind_matches() {
421 let all = [ExternRef, AnyRef, EqRef, ArrayRef, StructRef];
422
423 for (sup, subs) in [
424 (ExternRef, vec![]),
425 (AnyRef, vec![EqRef, ArrayRef, StructRef]),
426 (EqRef, vec![ArrayRef, StructRef]),
427 (ArrayRef, vec![]),
428 (StructRef, vec![]),
429 ] {
430 assert!(sup.matches(sup));
431 for sub in &subs {
432 assert!(sub.matches(sup));
433 }
434 for kind in all.iter().filter(|k| **k != sup && !subs.contains(k)) {
435 assert!(!kind.matches(sup));
436 }
437 }
438 }
439}