1 use crate::cdsl::settings::{SettingGroup, SettingGroupBuilder};
2 
3 pub(crate) fn define() -> SettingGroup {
4     let mut settings = SettingGroupBuilder::new("shared");
5 
6     settings.add_bool(
7         "regalloc_checker",
8         "Enable the symbolic checker for register allocation.",
9         r#"
10             This performs a verification that the register allocator preserves
11             equivalent dataflow with respect to the original (pre-regalloc)
12             program. This analysis is somewhat expensive. However, if it succeeds,
13             it provides independent evidence (by a carefully-reviewed, from-first-principles
14             analysis) that no regalloc bugs were triggered for the particular compilations
15             performed. This is a valuable assurance to have as regalloc bugs can be
16             very dangerous and difficult to debug.
17         "#,
18         false,
19     );
20 
21     settings.add_bool(
22         "regalloc_verbose_logs",
23         "Enable verbose debug logs for regalloc2.",
24         r#"
25             This adds extra logging for regalloc2 output, that is quite valuable to understand
26             decisions taken by the register allocator as well as debugging it. It is disabled by
27             default, as it can cause many log calls which can slow down compilation by a large
28             amount.
29         "#,
30         false,
31     );
32 
33     settings.add_enum(
34         "regalloc_algorithm",
35         "Algorithm to use in register allocator.",
36         r#"
37             Supported options:
38 
39             - `backtracking`: A backtracking allocator with range splitting; more expensive
40                               but generates better code.
41             - `single_pass`: A single-pass algorithm that yields quick compilation but
42                              results in code with more register spills and moves.
43         "#,
44         vec!["backtracking", "single_pass"],
45     );
46 
47     settings.add_enum(
48         "opt_level",
49         "Optimization level for generated code.",
50         r#"
51             Supported levels:
52 
53             - `none`: Minimise compile time by disabling most optimizations.
54             - `speed`: Generate the fastest possible code
55             - `speed_and_size`: like "speed", but also perform transformations aimed at reducing code size.
56         "#,
57         vec!["none", "speed", "speed_and_size"],
58     );
59 
60     settings.add_bool(
61         "enable_alias_analysis",
62         "Do redundant-load optimizations with alias analysis.",
63         r#"
64             This enables the use of a simple alias analysis to optimize away redundant loads.
65             Only effective when `opt_level` is `speed` or `speed_and_size`.
66         "#,
67         true,
68     );
69 
70     settings.add_bool(
71         "enable_verifier",
72         "Run the Cranelift IR verifier at strategic times during compilation.",
73         r#"
74             This makes compilation slower but catches many bugs. The verifier is always enabled by
75             default, which is useful during development.
76         "#,
77         true,
78     );
79 
80     settings.add_bool(
81         "enable_pcc",
82         "Enable proof-carrying code translation validation.",
83         r#"
84             This adds a proof-carrying-code mode. Proof-carrying code (PCC) is a strategy to verify
85             that the compiler preserves certain properties or invariants in the compiled code.
86             For example, a frontend that translates WebAssembly to CLIF can embed PCC facts in
87             the CLIF, and Cranelift will verify that the final machine code satisfies the stated
88             facts at each intermediate computed value. Loads and stores can be marked as "checked"
89             and their memory effects can be verified as safe.
90         "#,
91         false,
92     );
93 
94     // Note that Cranelift doesn't currently need an is_pie flag, because PIE is
95     // just PIC where symbols can't be pre-empted, which can be expressed with the
96     // `colocated` flag on external functions and global values.
97     settings.add_bool(
98         "is_pic",
99         "Enable Position-Independent Code generation.",
100         "",
101         false,
102     );
103 
104     settings.add_bool(
105         "use_colocated_libcalls",
106         "Use colocated libcalls.",
107         r#"
108             Generate code that assumes that libcalls can be declared "colocated",
109             meaning they will be defined along with the current function, such that
110             they can use more efficient addressing.
111         "#,
112         false,
113     );
114 
115     settings.add_bool(
116         "enable_float",
117         "Enable the use of floating-point instructions.",
118         r#"
119             Disabling use of floating-point instructions is not yet implemented.
120         "#,
121         true,
122     );
123 
124     settings.add_bool(
125         "enable_nan_canonicalization",
126         "Enable NaN canonicalization.",
127         r#"
128             This replaces NaNs with a single canonical value, for users requiring
129             entirely deterministic WebAssembly computation. This is not required
130             by the WebAssembly spec, so it is not enabled by default.
131         "#,
132         false,
133     );
134 
135     settings.add_bool(
136         "enable_pinned_reg",
137         "Enable the use of the pinned register.",
138         r#"
139             This register is excluded from register allocation, and is completely under the control of
140             the end-user. It is possible to read it via the get_pinned_reg instruction, and to set it
141             with the set_pinned_reg instruction.
142         "#,
143         false,
144     );
145 
146     settings.add_bool(
147         "enable_atomics",
148         "Enable the use of atomic instructions",
149         "",
150         true,
151     );
152 
153     settings.add_bool(
154         "enable_safepoints",
155         "Enable safepoint instruction insertions.",
156         r#"
157             This will allow the emit_stack_maps() function to insert the safepoint
158             instruction on top of calls and interrupt traps in order to display the
159             live reference values at that point in the program.
160         "#,
161         false,
162     );
163 
164     settings.add_enum(
165         "tls_model",
166         "Defines the model used to perform TLS accesses.",
167         "",
168         vec!["none", "elf_gd", "macho", "coff"],
169     );
170 
171     settings.add_enum(
172         "stack_switch_model",
173         "Defines the model used to performing stack switching.",
174         r#"
175            This determines the compilation of `stack_switch` instructions. If
176            set to `basic`, we simply save all registers, update stack pointer
177            and frame pointer (if needed), and jump to the target IP.
178            If set to `update_windows_tib`, we *additionally* update information
179            about the active stack in Windows' Thread Information Block.
180         "#,
181         vec!["none", "basic", "update_windows_tib"],
182     );
183 
184     settings.add_enum(
185         "libcall_call_conv",
186         "Defines the calling convention to use for LibCalls call expansion.",
187         r#"
188             This may be different from the ISA default calling convention.
189 
190             The default value is to use the same calling convention as the ISA
191             default calling convention.
192 
193             This list should be kept in sync with the list of calling
194             conventions available in isa/call_conv.rs.
195         "#,
196         vec![
197             "isa_default",
198             "fast",
199             "cold",
200             "system_v",
201             "windows_fastcall",
202             "apple_aarch64",
203             "probestack",
204         ],
205     );
206 
207     settings.add_bool(
208         "enable_llvm_abi_extensions",
209         "Enable various ABI extensions defined by LLVM's behavior.",
210         r#"
211             In some cases, LLVM's implementation of an ABI (calling convention)
212             goes beyond a standard and supports additional argument types or
213             behavior. This option instructs Cranelift codegen to follow LLVM's
214             behavior where applicable.
215 
216             Currently, this applies only to Windows Fastcall on x86-64, and
217             allows an `i128` argument to be spread across two 64-bit integer
218             registers. The Fastcall implementation otherwise does not support
219             `i128` arguments, and will panic if they are present and this
220             option is not set.
221         "#,
222         false,
223     );
224 
225     settings.add_bool(
226         "enable_multi_ret_implicit_sret",
227         "Enable support for sret arg introduction when there are too many ret vals.",
228         r#"
229             When there are more returns than available return registers, the
230             return value has to be returned through the introduction of a
231             return area pointer. Normally this return area pointer has to be
232             introduced as `ArgumentPurpose::StructReturn` parameter, but for
233             backward compatibility reasons Cranelift also supports implicitly
234             introducing this parameter and writing the return values through it.
235 
236             **This option currently does not conform to platform ABIs and the
237             used ABI should not be assumed to remain the same between Cranelift
238             versions.**
239 
240             This option is **deprecated** and will be removed in the future.
241 
242             Because of the above issues, and complexities of native ABI support
243             for the concept in general, Cranelift's support for multiple return
244             values may also be removed in the future (#9510). For the most
245             robust solution, it is recommended to build a convention on top of
246             Cranelift's primitives for passing multiple return values, for
247             example by allocating a stackslot in the caller, passing it as an
248             explicit StructReturn argument, storing return values in the callee,
249             and loading results in the caller.
250         "#,
251         false,
252     );
253 
254     settings.add_bool(
255         "unwind_info",
256         "Generate unwind information.",
257         r#"
258             This increases metadata size and compile time, but allows for the
259             debugger to trace frames, is needed for GC tracing that relies on
260             libunwind (such as in Wasmtime), and is unconditionally needed on
261             certain platforms (such as Windows) that must always be able to unwind.
262           "#,
263         true,
264     );
265 
266     settings.add_bool(
267         "preserve_frame_pointers",
268         "Preserve frame pointers",
269         r#"
270             Preserving frame pointers -- even inside leaf functions -- makes it
271             easy to capture the stack of a running program, without requiring any
272             side tables or metadata (like `.eh_frame` sections). Many sampling
273             profilers and similar tools walk frame pointers to capture stacks.
274             Enabling this option will play nice with those tools.
275         "#,
276         false,
277     );
278 
279     settings.add_bool(
280         "machine_code_cfg_info",
281         "Generate CFG metadata for machine code.",
282         r#"
283             This increases metadata size and compile time, but allows for the
284             embedder to more easily post-process or analyze the generated
285             machine code. It provides code offsets for the start of each
286             basic block in the generated machine code, and a list of CFG
287             edges (with blocks identified by start offsets) between them.
288             This is useful for, e.g., machine-code analyses that verify certain
289             properties of the generated code.
290         "#,
291         false,
292     );
293 
294     // Stack probing options.
295 
296     settings.add_bool(
297         "enable_probestack",
298         "Enable the use of stack probes for supported calling conventions.",
299         "",
300         false,
301     );
302 
303     settings.add_num(
304         "probestack_size_log2",
305         "The log2 of the size of the stack guard region.",
306         r#"
307             Stack frames larger than this size will have stack overflow checked
308             by calling the probestack function.
309 
310             The default is 12, which translates to a size of 4096.
311         "#,
312         12,
313     );
314 
315     settings.add_enum(
316         "probestack_strategy",
317         "Controls what kinds of stack probes are emitted.",
318         r#"
319             Supported strategies:
320 
321             - `outline`: Always emits stack probes as calls to a probe stack function.
322             - `inline`: Always emits inline stack probes.
323         "#,
324         vec!["outline", "inline"],
325     );
326 
327     // Jump table options.
328 
329     settings.add_bool(
330         "enable_jump_tables",
331         "Enable the use of jump tables in generated machine code.",
332         "",
333         true,
334     );
335 
336     // Spectre options.
337 
338     settings.add_bool(
339         "enable_heap_access_spectre_mitigation",
340         "Enable Spectre mitigation on heap bounds checks.",
341         r#"
342             This is a no-op for any heap that needs no bounds checks; e.g.,
343             if the limit is static and the guard region is large enough that
344             the index cannot reach past it.
345 
346             This option is enabled by default because it is highly
347             recommended for secure sandboxing. The embedder should consider
348             the security implications carefully before disabling this option.
349         "#,
350         true,
351     );
352 
353     settings.add_bool(
354         "enable_table_access_spectre_mitigation",
355         "Enable Spectre mitigation on table bounds checks.",
356         r#"
357             This option uses a conditional move to ensure that when a table
358             access index is bounds-checked and a conditional branch is used
359             for the out-of-bounds case, a misspeculation of that conditional
360             branch (falsely predicted in-bounds) will select an in-bounds
361             index to load on the speculative path.
362 
363             This option is enabled by default because it is highly
364             recommended for secure sandboxing. The embedder should consider
365             the security implications carefully before disabling this option.
366         "#,
367         true,
368     );
369 
370     settings.add_bool(
371         "enable_incremental_compilation_cache_checks",
372         "Enable additional checks for debugging the incremental compilation cache.",
373         r#"
374             Enables additional checks that are useful during development of the incremental
375             compilation cache. This should be mostly useful for Cranelift hackers, as well as for
376             helping to debug false incremental cache positives for embedders.
377 
378             This option is disabled by default and requires enabling the "incremental-cache" Cargo
379             feature in cranelift-codegen.
380         "#,
381         false,
382     );
383 
384     settings.add_num(
385         "bb_padding_log2_minus_one",
386         "The log2 of the size to insert dummy padding between basic blocks",
387         r#"
388             This is a debugging option for stressing various cases during code
389             generation without requiring large functions. This will insert
390             0-byte padding between basic blocks of the specified size.
391 
392             The amount of padding inserted two raised to the power of this value
393             minus one. If this value is 0 then no padding is inserted.
394 
395             The default for this option is 0 to insert no padding as it's only
396             intended for testing and development.
397         "#,
398         0,
399     );
400 
401     settings.add_num(
402         "log2_min_function_alignment",
403         "The log2 of the minimum alignment of functions",
404         "The bigger of this value and the default alignment will be used as actual alignment.",
405         0,
406     );
407 
408     // When adding new settings please check if they can also be added
409     // in cranelift/fuzzgen/src/lib.rs for fuzzing.
410     settings.build()
411 }
412