1use crate::cdsl::settings::{SettingGroup, SettingGroupBuilder};
2
3pub(crate) fn define() -> SettingGroup {
4 let mut settings = SettingGroupBuilder::new("shared");
5
6 settings.add_bool(
7 "regalloc_checker",
8 "Enable the symbolic checker for register allocation.",
9 r#"
10 This performs a verification that the register allocator preserves
11 equivalent dataflow with respect to the original (pre-regalloc)
12 program. This analysis is somewhat expensive. However, if it succeeds,
13 it provides independent evidence (by a carefully-reviewed, from-first-principles
14 analysis) that no regalloc bugs were triggered for the particular compilations
15 performed. This is a valuable assurance to have as regalloc bugs can be
16 very dangerous and difficult to debug.
17 "#,
18 false,
19 );
20
21 settings.add_bool(
22 "regalloc_verbose_logs",
23 "Enable verbose debug logs for regalloc2.",
24 r#"
25 This adds extra logging for regalloc2 output, that is quite valuable to understand
26 decisions taken by the register allocator as well as debugging it. It is disabled by
27 default, as it can cause many log calls which can slow down compilation by a large
28 amount.
29 "#,
30 false,
31 );
32
33 settings.add_enum(
34 "regalloc_algorithm",
35 "Algorithm to use in register allocator.",
36 r#"
37 Supported options:
38
39 - `backtracking`: A backtracking allocator with range splitting; more expensive
40 but generates better code.
41
42 Note that the `single_pass` option is currently disabled because it does not
43 have adequate support for the kinds of allocations required by exception
44 handling (https://github.com/bytecodealliance/regalloc2/issues/217).
45 "#,
46 vec!["backtracking"],
47 );
48
49 settings.add_enum(
50 "opt_level",
51 "Optimization level for generated code.",
52 r#"
53 Supported levels:
54
55 - `none`: Minimise compile time by disabling most optimizations.
56 - `speed`: Generate the fastest possible code
57 - `speed_and_size`: like "speed", but also perform transformations aimed at reducing code size.
58 "#,
59 vec!["none", "speed", "speed_and_size"],
60 );
61
62 settings.add_bool(
63 "enable_alias_analysis",
64 "Do redundant-load optimizations with alias analysis.",
65 r#"
66 This enables the use of a simple alias analysis to optimize away redundant loads.
67 Only effective when `opt_level` is `speed` or `speed_and_size`.
68 "#,
69 true,
70 );
71
72 settings.add_bool(
73 "enable_verifier",
74 "Run the Cranelift IR verifier at strategic times during compilation.",
75 r#"
76 This makes compilation slower but catches many bugs. The verifier is always enabled by
77 default, which is useful during development.
78 "#,
79 true,
80 );
81
82 settings.add_bool(
83 "enable_pcc",
84 "Enable proof-carrying code translation validation.",
85 r#"
86 This adds a proof-carrying-code mode. Proof-carrying code (PCC) is a strategy to verify
87 that the compiler preserves certain properties or invariants in the compiled code.
88 For example, a frontend that translates WebAssembly to CLIF can embed PCC facts in
89 the CLIF, and Cranelift will verify that the final machine code satisfies the stated
90 facts at each intermediate computed value. Loads and stores can be marked as "checked"
91 and their memory effects can be verified as safe.
92 "#,
93 false,
94 );
95
96 settings.add_bool(
100 "is_pic",
101 "Enable Position-Independent Code generation.",
102 "",
103 false,
104 );
105
106 settings.add_bool(
107 "use_colocated_libcalls",
108 "Use colocated libcalls.",
109 r#"
110 Generate code that assumes that libcalls can be declared "colocated",
111 meaning they will be defined along with the current function, such that
112 they can use more efficient addressing.
113 "#,
114 false,
115 );
116
117 settings.add_bool(
118 "enable_float",
119 "Enable the use of floating-point instructions.",
120 r#"
121 Disabling use of floating-point instructions is not yet implemented.
122 "#,
123 true,
124 );
125
126 settings.add_bool(
127 "enable_nan_canonicalization",
128 "Enable NaN canonicalization.",
129 r#"
130 This replaces NaNs with a single canonical value, for users requiring
131 entirely deterministic WebAssembly computation. This is not required
132 by the WebAssembly spec, so it is not enabled by default.
133 "#,
134 false,
135 );
136
137 settings.add_bool(
138 "enable_pinned_reg",
139 "Enable the use of the pinned register.",
140 r#"
141 This register is excluded from register allocation, and is completely under the control of
142 the end-user. It is possible to read it via the get_pinned_reg instruction, and to set it
143 with the set_pinned_reg instruction.
144 "#,
145 false,
146 );
147
148 settings.add_bool(
149 "enable_atomics",
150 "Enable the use of atomic instructions",
151 "",
152 true,
153 );
154
155 settings.add_bool(
156 "enable_safepoints",
157 "Enable safepoint instruction insertions.",
158 r#"
159 This will allow the emit_stack_maps() function to insert the safepoint
160 instruction on top of calls and interrupt traps in order to display the
161 live reference values at that point in the program.
162 "#,
163 false,
164 );
165
166 settings.add_enum(
167 "tls_model",
168 "Defines the model used to perform TLS accesses.",
169 "",
170 vec!["none", "elf_gd", "macho", "coff"],
171 );
172
173 settings.add_enum(
174 "stack_switch_model",
175 "Defines the model used to performing stack switching.",
176 r#"
177 This determines the compilation of `stack_switch` instructions. If
178 set to `basic`, we simply save all registers, update stack pointer
179 and frame pointer (if needed), and jump to the target IP.
180 If set to `update_windows_tib`, we *additionally* update information
181 about the active stack in Windows' Thread Information Block.
182 "#,
183 vec!["none", "basic", "update_windows_tib"],
184 );
185
186 settings.add_enum(
187 "libcall_call_conv",
188 "Defines the calling convention to use for LibCalls call expansion.",
189 r#"
190 This may be different from the ISA default calling convention.
191
192 The default value is to use the same calling convention as the ISA
193 default calling convention.
194
195 This list should be kept in sync with the list of calling
196 conventions available in isa/call_conv.rs.
197 "#,
198 vec![
199 "isa_default",
200 "fast",
201 "cold",
202 "system_v",
203 "windows_fastcall",
204 "apple_aarch64",
205 "probestack",
206 ],
207 );
208
209 settings.add_bool(
210 "enable_llvm_abi_extensions",
211 "Enable various ABI extensions defined by LLVM's behavior.",
212 r#"
213 In some cases, LLVM's implementation of an ABI (calling convention)
214 goes beyond a standard and supports additional argument types or
215 behavior. This option instructs Cranelift codegen to follow LLVM's
216 behavior where applicable.
217
218 Currently, this applies only to Windows Fastcall on x86-64, and
219 allows an `i128` argument to be spread across two 64-bit integer
220 registers. The Fastcall implementation otherwise does not support
221 `i128` arguments, and will panic if they are present and this
222 option is not set.
223 "#,
224 false,
225 );
226
227 settings.add_bool(
228 "enable_multi_ret_implicit_sret",
229 "Enable support for sret arg introduction when there are too many ret vals.",
230 r#"
231 When there are more returns than available return registers, the
232 return value has to be returned through the introduction of a
233 return area pointer. Normally this return area pointer has to be
234 introduced as `ArgumentPurpose::StructReturn` parameter, but for
235 backward compatibility reasons Cranelift also supports implicitly
236 introducing this parameter and writing the return values through it.
237
238 **This option currently does not conform to platform ABIs and the
239 used ABI should not be assumed to remain the same between Cranelift
240 versions.**
241
242 This option is **deprecated** and will be removed in the future.
243
244 Because of the above issues, and complexities of native ABI support
245 for the concept in general, Cranelift's support for multiple return
246 values may also be removed in the future (#9510). For the most
247 robust solution, it is recommended to build a convention on top of
248 Cranelift's primitives for passing multiple return values, for
249 example by allocating a stackslot in the caller, passing it as an
250 explicit StructReturn argument, storing return values in the callee,
251 and loading results in the caller.
252 "#,
253 false,
254 );
255
256 settings.add_bool(
257 "unwind_info",
258 "Generate unwind information.",
259 r#"
260 This increases metadata size and compile time, but allows for the
261 debugger to trace frames, is needed for GC tracing that relies on
262 libunwind (such as in Wasmtime), and is unconditionally needed on
263 certain platforms (such as Windows) that must always be able to unwind.
264 "#,
265 true,
266 );
267
268 settings.add_bool(
269 "preserve_frame_pointers",
270 "Preserve frame pointers",
271 r#"
272 Preserving frame pointers -- even inside leaf functions -- makes it
273 easy to capture the stack of a running program, without requiring any
274 side tables or metadata (like `.eh_frame` sections). Many sampling
275 profilers and similar tools walk frame pointers to capture stacks.
276 Enabling this option will play nice with those tools.
277 "#,
278 false,
279 );
280
281 settings.add_bool(
282 "machine_code_cfg_info",
283 "Generate CFG metadata for machine code.",
284 r#"
285 This increases metadata size and compile time, but allows for the
286 embedder to more easily post-process or analyze the generated
287 machine code. It provides code offsets for the start of each
288 basic block in the generated machine code, and a list of CFG
289 edges (with blocks identified by start offsets) between them.
290 This is useful for, e.g., machine-code analyses that verify certain
291 properties of the generated code.
292 "#,
293 false,
294 );
295
296 settings.add_bool(
299 "enable_probestack",
300 "Enable the use of stack probes for supported calling conventions.",
301 "",
302 false,
303 );
304
305 settings.add_num(
306 "probestack_size_log2",
307 "The log2 of the size of the stack guard region.",
308 r#"
309 Stack frames larger than this size will have stack overflow checked
310 by calling the probestack function.
311
312 The default is 12, which translates to a size of 4096.
313 "#,
314 12,
315 );
316
317 settings.add_enum(
318 "probestack_strategy",
319 "Controls what kinds of stack probes are emitted.",
320 r#"
321 Supported strategies:
322
323 - `outline`: Always emits stack probes as calls to a probe stack function.
324 - `inline`: Always emits inline stack probes.
325 "#,
326 vec!["outline", "inline"],
327 );
328
329 settings.add_bool(
332 "enable_jump_tables",
333 "Enable the use of jump tables in generated machine code.",
334 "",
335 true,
336 );
337
338 settings.add_bool(
341 "enable_heap_access_spectre_mitigation",
342 "Enable Spectre mitigation on heap bounds checks.",
343 r#"
344 This is a no-op for any heap that needs no bounds checks; e.g.,
345 if the limit is static and the guard region is large enough that
346 the index cannot reach past it.
347
348 This option is enabled by default because it is highly
349 recommended for secure sandboxing. The embedder should consider
350 the security implications carefully before disabling this option.
351 "#,
352 true,
353 );
354
355 settings.add_bool(
356 "enable_table_access_spectre_mitigation",
357 "Enable Spectre mitigation on table bounds checks.",
358 r#"
359 This option uses a conditional move to ensure that when a table
360 access index is bounds-checked and a conditional branch is used
361 for the out-of-bounds case, a misspeculation of that conditional
362 branch (falsely predicted in-bounds) will select an in-bounds
363 index to load on the speculative path.
364
365 This option is enabled by default because it is highly
366 recommended for secure sandboxing. The embedder should consider
367 the security implications carefully before disabling this option.
368 "#,
369 true,
370 );
371
372 settings.add_bool(
373 "enable_incremental_compilation_cache_checks",
374 "Enable additional checks for debugging the incremental compilation cache.",
375 r#"
376 Enables additional checks that are useful during development of the incremental
377 compilation cache. This should be mostly useful for Cranelift hackers, as well as for
378 helping to debug false incremental cache positives for embedders.
379
380 This option is disabled by default and requires enabling the "incremental-cache" Cargo
381 feature in cranelift-codegen.
382 "#,
383 false,
384 );
385
386 settings.add_num(
387 "bb_padding_log2_minus_one",
388 "The log2 of the size to insert dummy padding between basic blocks",
389 r#"
390 This is a debugging option for stressing various cases during code
391 generation without requiring large functions. This will insert
392 0-byte padding between basic blocks of the specified size.
393
394 The amount of padding inserted two raised to the power of this value
395 minus one. If this value is 0 then no padding is inserted.
396
397 The default for this option is 0 to insert no padding as it's only
398 intended for testing and development.
399 "#,
400 0,
401 );
402
403 settings.add_num(
404 "log2_min_function_alignment",
405 "The log2 of the minimum alignment of functions",
406 "The bigger of this value and the default alignment will be used as actual alignment.",
407 0,
408 );
409
410 settings.build()
413}