CoCalc -- settings.rs

GitHub Repository: bytecodealliance/wasmtime
Path: blob/main/cranelift/codegen/meta/src/shared/settings.rs
¹⁶⁹³ views
1
use crate::cdsl::settings::{SettingGroup, SettingGroupBuilder};
2

3
pub(crate) fn define() -> SettingGroup {
4
    let mut settings = SettingGroupBuilder::new("shared");
5

6
    settings.add_bool(
7
        "regalloc_checker",
8
        "Enable the symbolic checker for register allocation.",
9
        r#"
10
            This performs a verification that the register allocator preserves
11
            equivalent dataflow with respect to the original (pre-regalloc)
12
            program. This analysis is somewhat expensive. However, if it succeeds,
13
            it provides independent evidence (by a carefully-reviewed, from-first-principles
14
            analysis) that no regalloc bugs were triggered for the particular compilations
15
            performed. This is a valuable assurance to have as regalloc bugs can be
16
            very dangerous and difficult to debug.
17
        "#,
18
        false,
19
    );
20

21
    settings.add_bool(
22
        "regalloc_verbose_logs",
23
        "Enable verbose debug logs for regalloc2.",
24
        r#"
25
            This adds extra logging for regalloc2 output, that is quite valuable to understand
26
            decisions taken by the register allocator as well as debugging it. It is disabled by
27
            default, as it can cause many log calls which can slow down compilation by a large
28
            amount.
29
        "#,
30
        false,
31
    );
32

33
    settings.add_enum(
34
        "regalloc_algorithm",
35
        "Algorithm to use in register allocator.",
36
        r#"
37
            Supported options:
38

39
            - `backtracking`: A backtracking allocator with range splitting; more expensive
40
                              but generates better code.
41
            - `single_pass`: A single-pass algorithm that yields quick compilation but
42
                             results in code with more register spills and moves.
43
        "#,
44
        vec!["backtracking", "single_pass"],
45
    );
46

47
    settings.add_enum(
48
        "opt_level",
49
        "Optimization level for generated code.",
50
        r#"
51
            Supported levels:
52

53
            - `none`: Minimise compile time by disabling most optimizations.
54
            - `speed`: Generate the fastest possible code
55
            - `speed_and_size`: like "speed", but also perform transformations aimed at reducing code size.
56
        "#,
57
        vec!["none", "speed", "speed_and_size"],
58
    );
59

60
    settings.add_bool(
61
        "enable_alias_analysis",
62
        "Do redundant-load optimizations with alias analysis.",
63
        r#"
64
            This enables the use of a simple alias analysis to optimize away redundant loads.
65
            Only effective when `opt_level` is `speed` or `speed_and_size`.
66
        "#,
67
        true,
68
    );
69

70
    settings.add_bool(
71
        "enable_verifier",
72
        "Run the Cranelift IR verifier at strategic times during compilation.",
73
        r#"
74
            This makes compilation slower but catches many bugs. The verifier is always enabled by
75
            default, which is useful during development.
76
        "#,
77
        true,
78
    );
79

80
    settings.add_bool(
81
        "enable_pcc",
82
        "Enable proof-carrying code translation validation.",
83
        r#"
84
            This adds a proof-carrying-code mode. Proof-carrying code (PCC) is a strategy to verify
85
            that the compiler preserves certain properties or invariants in the compiled code.
86
            For example, a frontend that translates WebAssembly to CLIF can embed PCC facts in
87
            the CLIF, and Cranelift will verify that the final machine code satisfies the stated
88
            facts at each intermediate computed value. Loads and stores can be marked as "checked"
89
            and their memory effects can be verified as safe.
90
        "#,
91
        false,
92
    );
93

94
    // Note that Cranelift doesn't currently need an is_pie flag, because PIE is
95
    // just PIC where symbols can't be pre-empted, which can be expressed with the
96
    // `colocated` flag on external functions and global values.
97
    settings.add_bool(
98
        "is_pic",
99
        "Enable Position-Independent Code generation.",
100
        "",
101
        false,
102
    );
103

104
    settings.add_bool(
105
        "use_colocated_libcalls",
106
        "Use colocated libcalls.",
107
        r#"
108
            Generate code that assumes that libcalls can be declared "colocated",
109
            meaning they will be defined along with the current function, such that
110
            they can use more efficient addressing.
111
        "#,
112
        false,
113
    );
114

115
    settings.add_bool(
116
        "enable_float",
117
        "Enable the use of floating-point instructions.",
118
        r#"
119
            Disabling use of floating-point instructions is not yet implemented.
120
        "#,
121
        true,
122
    );
123

124
    settings.add_bool(
125
        "enable_nan_canonicalization",
126
        "Enable NaN canonicalization.",
127
        r#"
128
            This replaces NaNs with a single canonical value, for users requiring
129
            entirely deterministic WebAssembly computation. This is not required
130
            by the WebAssembly spec, so it is not enabled by default.
131
        "#,
132
        false,
133
    );
134

135
    settings.add_bool(
136
        "enable_pinned_reg",
137
        "Enable the use of the pinned register.",
138
        r#"
139
            This register is excluded from register allocation, and is completely under the control of
140
            the end-user. It is possible to read it via the get_pinned_reg instruction, and to set it
141
            with the set_pinned_reg instruction.
142
        "#,
143
        false,
144
    );
145

146
    settings.add_bool(
147
        "enable_atomics",
148
        "Enable the use of atomic instructions",
149
        "",
150
        true,
151
    );
152

153
    settings.add_bool(
154
        "enable_safepoints",
155
        "Enable safepoint instruction insertions.",
156
        r#"
157
            This will allow the emit_stack_maps() function to insert the safepoint
158
            instruction on top of calls and interrupt traps in order to display the
159
            live reference values at that point in the program.
160
        "#,
161
        false,
162
    );
163

164
    settings.add_enum(
165
        "tls_model",
166
        "Defines the model used to perform TLS accesses.",
167
        "",
168
        vec!["none", "elf_gd", "macho", "coff"],
169
    );
170

171
    settings.add_enum(
172
        "stack_switch_model",
173
        "Defines the model used to performing stack switching.",
174
        r#"
175
           This determines the compilation of `stack_switch` instructions. If
176
           set to `basic`, we simply save all registers, update stack pointer
177
           and frame pointer (if needed), and jump to the target IP.
178
           If set to `update_windows_tib`, we *additionally* update information
179
           about the active stack in Windows' Thread Information Block.
180
        "#,
181
        vec!["none", "basic", "update_windows_tib"],
182
    );
183

184
    settings.add_enum(
185
        "libcall_call_conv",
186
        "Defines the calling convention to use for LibCalls call expansion.",
187
        r#"
188
            This may be different from the ISA default calling convention.
189

190
            The default value is to use the same calling convention as the ISA
191
            default calling convention.
192

193
            This list should be kept in sync with the list of calling
194
            conventions available in isa/call_conv.rs.
195
        "#,
196
        vec![
197
            "isa_default",
198
            "fast",
199
            "cold",
200
            "system_v",
201
            "windows_fastcall",
202
            "apple_aarch64",
203
            "probestack",
204
        ],
205
    );
206

207
    settings.add_bool(
208
        "enable_llvm_abi_extensions",
209
        "Enable various ABI extensions defined by LLVM's behavior.",
210
        r#"
211
            In some cases, LLVM's implementation of an ABI (calling convention)
212
            goes beyond a standard and supports additional argument types or
213
            behavior. This option instructs Cranelift codegen to follow LLVM's
214
            behavior where applicable.
215

216
            Currently, this applies only to Windows Fastcall on x86-64, and
217
            allows an `i128` argument to be spread across two 64-bit integer
218
            registers. The Fastcall implementation otherwise does not support
219
            `i128` arguments, and will panic if they are present and this
220
            option is not set.
221
        "#,
222
        false,
223
    );
224

225
    settings.add_bool(
226
        "enable_multi_ret_implicit_sret",
227
        "Enable support for sret arg introduction when there are too many ret vals.",
228
        r#"
229
            When there are more returns than available return registers, the
230
            return value has to be returned through the introduction of a
231
            return area pointer. Normally this return area pointer has to be
232
            introduced as `ArgumentPurpose::StructReturn` parameter, but for
233
            backward compatibility reasons Cranelift also supports implicitly
234
            introducing this parameter and writing the return values through it.
235

236
            **This option currently does not conform to platform ABIs and the
237
            used ABI should not be assumed to remain the same between Cranelift
238
            versions.**
239

240
            This option is **deprecated** and will be removed in the future.
241

242
            Because of the above issues, and complexities of native ABI support
243
            for the concept in general, Cranelift's support for multiple return
244
            values may also be removed in the future (#9510). For the most
245
            robust solution, it is recommended to build a convention on top of
246
            Cranelift's primitives for passing multiple return values, for
247
            example by allocating a stackslot in the caller, passing it as an
248
            explicit StructReturn argument, storing return values in the callee,
249
            and loading results in the caller.
250
        "#,
251
        false,
252
    );
253

254
    settings.add_bool(
255
        "unwind_info",
256
        "Generate unwind information.",
257
        r#"
258
            This increases metadata size and compile time, but allows for the
259
            debugger to trace frames, is needed for GC tracing that relies on
260
            libunwind (such as in Wasmtime), and is unconditionally needed on
261
            certain platforms (such as Windows) that must always be able to unwind.
262
          "#,
263
        true,
264
    );
265

266
    settings.add_bool(
267
        "preserve_frame_pointers",
268
        "Preserve frame pointers",
269
        r#"
270
            Preserving frame pointers -- even inside leaf functions -- makes it
271
            easy to capture the stack of a running program, without requiring any
272
            side tables or metadata (like `.eh_frame` sections). Many sampling
273
            profilers and similar tools walk frame pointers to capture stacks.
274
            Enabling this option will play nice with those tools.
275
        "#,
276
        false,
277
    );
278

279
    settings.add_bool(
280
        "machine_code_cfg_info",
281
        "Generate CFG metadata for machine code.",
282
        r#"
283
            This increases metadata size and compile time, but allows for the
284
            embedder to more easily post-process or analyze the generated
285
            machine code. It provides code offsets for the start of each
286
            basic block in the generated machine code, and a list of CFG
287
            edges (with blocks identified by start offsets) between them.
288
            This is useful for, e.g., machine-code analyses that verify certain
289
            properties of the generated code.
290
        "#,
291
        false,
292
    );
293

294
    // Stack probing options.
295

296
    settings.add_bool(
297
        "enable_probestack",
298
        "Enable the use of stack probes for supported calling conventions.",
299
        "",
300
        false,
301
    );
302

303
    settings.add_num(
304
        "probestack_size_log2",
305
        "The log2 of the size of the stack guard region.",
306
        r#"
307
            Stack frames larger than this size will have stack overflow checked
308
            by calling the probestack function.
309

310
            The default is 12, which translates to a size of 4096.
311
        "#,
312
        12,
313
    );
314

315
    settings.add_enum(
316
        "probestack_strategy",
317
        "Controls what kinds of stack probes are emitted.",
318
        r#"
319
            Supported strategies:
320

321
            - `outline`: Always emits stack probes as calls to a probe stack function.
322
            - `inline`: Always emits inline stack probes.
323
        "#,
324
        vec!["outline", "inline"],
325
    );
326

327
    // Jump table options.
328

329
    settings.add_bool(
330
        "enable_jump_tables",
331
        "Enable the use of jump tables in generated machine code.",
332
        "",
333
        true,
334
    );
335

336
    // Spectre options.
337

338
    settings.add_bool(
339
        "enable_heap_access_spectre_mitigation",
340
        "Enable Spectre mitigation on heap bounds checks.",
341
        r#"
342
            This is a no-op for any heap that needs no bounds checks; e.g.,
343
            if the limit is static and the guard region is large enough that
344
            the index cannot reach past it.
345

346
            This option is enabled by default because it is highly
347
            recommended for secure sandboxing. The embedder should consider
348
            the security implications carefully before disabling this option.
349
        "#,
350
        true,
351
    );
352

353
    settings.add_bool(
354
        "enable_table_access_spectre_mitigation",
355
        "Enable Spectre mitigation on table bounds checks.",
356
        r#"
357
            This option uses a conditional move to ensure that when a table
358
            access index is bounds-checked and a conditional branch is used
359
            for the out-of-bounds case, a misspeculation of that conditional
360
            branch (falsely predicted in-bounds) will select an in-bounds
361
            index to load on the speculative path.
362

363
            This option is enabled by default because it is highly
364
            recommended for secure sandboxing. The embedder should consider
365
            the security implications carefully before disabling this option.
366
        "#,
367
        true,
368
    );
369

370
    settings.add_bool(
371
        "enable_incremental_compilation_cache_checks",
372
        "Enable additional checks for debugging the incremental compilation cache.",
373
        r#"
374
            Enables additional checks that are useful during development of the incremental
375
            compilation cache. This should be mostly useful for Cranelift hackers, as well as for
376
            helping to debug false incremental cache positives for embedders.
377

378
            This option is disabled by default and requires enabling the "incremental-cache" Cargo
379
            feature in cranelift-codegen.
380
        "#,
381
        false,
382
    );
383

384
    settings.add_num(
385
        "bb_padding_log2_minus_one",
386
        "The log2 of the size to insert dummy padding between basic blocks",
387
        r#"
388
            This is a debugging option for stressing various cases during code
389
            generation without requiring large functions. This will insert
390
            0-byte padding between basic blocks of the specified size.
391

392
            The amount of padding inserted two raised to the power of this value
393
            minus one. If this value is 0 then no padding is inserted.
394

395
            The default for this option is 0 to insert no padding as it's only
396
            intended for testing and development.
397
        "#,
398
        0,
399
    );
400

401
    settings.add_num(
402
        "log2_min_function_alignment",
403
        "The log2 of the minimum alignment of functions",
404
        "The bigger of this value and the default alignment will be used as actual alignment.",
405
        0,
406
    );
407

408
    // When adding new settings please check if they can also be added
409
    // in cranelift/fuzzgen/src/lib.rs for fuzzing.
410
    settings.build()
411
}
412

413
Product

Resources

Company