CoCalc -- instructions.rs

GitHub Repository: bytecodealliance/wasmtime
Path: blob/main/cranelift/codegen/meta/src/shared/instructions.rs
¹⁶⁹³ views
1
#![expect(non_snake_case, reason = "DSL style here")]
2

3
use crate::cdsl::instructions::{
4
    AllInstructions, InstructionBuilder as Inst, InstructionGroupBuilder,
5
};
6
use crate::cdsl::operands::Operand;
7
use crate::cdsl::types::{LaneType, ValueType};
8
use crate::cdsl::typevar::{Interval, TypeSetBuilder, TypeVar};
9
use crate::shared::formats::Formats;
10
use crate::shared::types;
11
use crate::shared::{entities::EntityRefs, immediates::Immediates};
12

13
#[inline(never)]
14
fn define_control_flow(
15
    ig: &mut InstructionGroupBuilder,
16
    formats: &Formats,
17
    imm: &Immediates,
18
    entities: &EntityRefs,
19
) {
20
    ig.push(
21
        Inst::new(
22
            "jump",
23
            r#"
24
        Jump.
25

26
        Unconditionally jump to a basic block, passing the specified
27
        block arguments. The number and types of arguments must match the
28
        destination block.
29
        "#,
30
            &formats.jump,
31
        )
32
        .operands_in(vec![
33
            Operand::new("block_call", &entities.block_call)
34
                .with_doc("Destination basic block, with its arguments provided"),
35
        ])
36
        .branches(),
37
    );
38

39
    let ScalarTruthy = &TypeVar::new(
40
        "ScalarTruthy",
41
        "A scalar truthy type",
42
        TypeSetBuilder::new().ints(Interval::All).build(),
43
    );
44

45
    ig.push(
46
        Inst::new(
47
            "brif",
48
            r#"
49
        Conditional branch when cond is non-zero.
50

51
        Take the ``then`` branch when ``c != 0``, and the ``else`` branch otherwise.
52
        "#,
53
            &formats.brif,
54
        )
55
        .operands_in(vec![
56
            Operand::new("c", ScalarTruthy).with_doc("Controlling value to test"),
57
            Operand::new("block_then", &entities.block_then).with_doc("Then block"),
58
            Operand::new("block_else", &entities.block_else).with_doc("Else block"),
59
        ])
60
        .branches(),
61
    );
62

63
    {
64
        let _i32 = &TypeVar::new(
65
            "i32",
66
            "A 32 bit scalar integer type",
67
            TypeSetBuilder::new().ints(32..32).build(),
68
        );
69

70
        ig.push(
71
            Inst::new(
72
                "br_table",
73
                r#"
74
        Indirect branch via jump table.
75

76
        Use ``x`` as an unsigned index into the jump table ``JT``. If a jump
77
        table entry is found, branch to the corresponding block. If no entry was
78
        found or the index is out-of-bounds, branch to the default block of the
79
        table.
80

81
        Note that this branch instruction can't pass arguments to the targeted
82
        blocks. Split critical edges as needed to work around this.
83

84
        Do not confuse this with "tables" in WebAssembly. ``br_table`` is for
85
        jump tables with destinations within the current function only -- think
86
        of a ``match`` in Rust or a ``switch`` in C.  If you want to call a
87
        function in a dynamic library, that will typically use
88
        ``call_indirect``.
89
        "#,
90
                &formats.branch_table,
91
            )
92
            .operands_in(vec![
93
                Operand::new("x", _i32).with_doc("i32 index into jump table"),
94
                Operand::new("JT", &entities.jump_table),
95
            ])
96
            .branches(),
97
        );
98
    }
99

100
    let iAddr = &TypeVar::new(
101
        "iAddr",
102
        "An integer address type",
103
        TypeSetBuilder::new().ints(32..64).build(),
104
    );
105

106
    ig.push(
107
        Inst::new(
108
            "debugtrap",
109
            r#"
110
        Encodes an assembly debug trap.
111
        "#,
112
            &formats.nullary,
113
        )
114
        .other_side_effects()
115
        .can_load()
116
        .can_store(),
117
    );
118

119
    ig.push(
120
        Inst::new(
121
            "trap",
122
            r#"
123
        Terminate execution unconditionally.
124
        "#,
125
            &formats.trap,
126
        )
127
        .operands_in(vec![Operand::new("code", &imm.trapcode)])
128
        .can_trap()
129
        .terminates_block(),
130
    );
131

132
    ig.push(
133
        Inst::new(
134
            "trapz",
135
            r#"
136
        Trap when zero.
137

138
        if ``c`` is non-zero, execution continues at the following instruction.
139
        "#,
140
            &formats.cond_trap,
141
        )
142
        .operands_in(vec![
143
            Operand::new("c", ScalarTruthy).with_doc("Controlling value to test"),
144
            Operand::new("code", &imm.trapcode),
145
        ])
146
        .can_trap()
147
        // When one `trapz` dominates another `trapz` and they have identical
148
        // conditions and trap codes, it is safe to deduplicate them (like GVN,
149
        // although there is not actually any value being numbered). Either the
150
        // first `trapz` raised a trap and execution halted, or it didn't and
151
        // therefore the dominated `trapz` will not raise a trap either.
152
        .side_effects_idempotent(),
153
    );
154

155
    ig.push(
156
        Inst::new(
157
            "trapnz",
158
            r#"
159
        Trap when non-zero.
160

161
        If ``c`` is zero, execution continues at the following instruction.
162
        "#,
163
            &formats.cond_trap,
164
        )
165
        .operands_in(vec![
166
            Operand::new("c", ScalarTruthy).with_doc("Controlling value to test"),
167
            Operand::new("code", &imm.trapcode),
168
        ])
169
        .can_trap()
170
        // See the above comment for `trapz` and idempotent side effects.
171
        .side_effects_idempotent(),
172
    );
173

174
    ig.push(
175
        Inst::new(
176
            "return",
177
            r#"
178
        Return from the function.
179

180
        Unconditionally transfer control to the calling function, passing the
181
        provided return values. The list of return values must match the
182
        function signature's return types.
183
        "#,
184
            &formats.multiary,
185
        )
186
        .operands_in(vec![
187
            Operand::new("rvals", &entities.varargs).with_doc("return values"),
188
        ])
189
        .returns(),
190
    );
191

192
    ig.push(
193
        Inst::new(
194
            "call",
195
            r#"
196
        Direct function call.
197

198
        Call a function which has been declared in the preamble. The argument
199
        types must match the function's signature.
200
        "#,
201
            &formats.call,
202
        )
203
        .operands_in(vec![
204
            Operand::new("FN", &entities.func_ref)
205
                .with_doc("function to call, declared by `function`"),
206
            Operand::new("args", &entities.varargs).with_doc("call arguments"),
207
        ])
208
        .operands_out(vec![
209
            Operand::new("rvals", &entities.varargs).with_doc("return values"),
210
        ])
211
        .call(),
212
    );
213

214
    ig.push(
215
        Inst::new(
216
            "call_indirect",
217
            r#"
218
        Indirect function call.
219

220
        Call the function pointed to by `callee` with the given arguments. The
221
        called function must match the specified signature.
222

223
        Note that this is different from WebAssembly's ``call_indirect``; the
224
        callee is a native address, rather than a table index. For WebAssembly,
225
        `table_addr` and `load` are used to obtain a native address
226
        from a table.
227
        "#,
228
            &formats.call_indirect,
229
        )
230
        .operands_in(vec![
231
            Operand::new("SIG", &entities.sig_ref).with_doc("function signature"),
232
            Operand::new("callee", iAddr).with_doc("address of function to call"),
233
            Operand::new("args", &entities.varargs).with_doc("call arguments"),
234
        ])
235
        .operands_out(vec![
236
            Operand::new("rvals", &entities.varargs).with_doc("return values"),
237
        ])
238
        .call(),
239
    );
240

241
    ig.push(
242
        Inst::new(
243
            "return_call",
244
            r#"
245
        Direct tail call.
246

247
        Tail call a function which has been declared in the preamble. The
248
        argument types must match the function's signature, the caller and
249
        callee calling conventions must be the same, and must be a calling
250
        convention that supports tail calls.
251

252
        This instruction is a block terminator.
253
        "#,
254
            &formats.call,
255
        )
256
        .operands_in(vec![
257
            Operand::new("FN", &entities.func_ref)
258
                .with_doc("function to call, declared by `function`"),
259
            Operand::new("args", &entities.varargs).with_doc("call arguments"),
260
        ])
261
        .returns()
262
        .call(),
263
    );
264

265
    ig.push(
266
        Inst::new(
267
            "return_call_indirect",
268
            r#"
269
        Indirect tail call.
270

271
        Call the function pointed to by `callee` with the given arguments. The
272
        argument types must match the function's signature, the caller and
273
        callee calling conventions must be the same, and must be a calling
274
        convention that supports tail calls.
275

276
        This instruction is a block terminator.
277

278
        Note that this is different from WebAssembly's ``tail_call_indirect``;
279
        the callee is a native address, rather than a table index. For
280
        WebAssembly, `table_addr` and `load` are used to obtain a native address
281
        from a table.
282
        "#,
283
            &formats.call_indirect,
284
        )
285
        .operands_in(vec![
286
            Operand::new("SIG", &entities.sig_ref).with_doc("function signature"),
287
            Operand::new("callee", iAddr).with_doc("address of function to call"),
288
            Operand::new("args", &entities.varargs).with_doc("call arguments"),
289
        ])
290
        .returns()
291
        .call(),
292
    );
293

294
    ig.push(
295
        Inst::new(
296
            "func_addr",
297
            r#"
298
        Get the address of a function.
299

300
        Compute the absolute address of a function declared in the preamble.
301
        The returned address can be used as a ``callee`` argument to
302
        `call_indirect`. This is also a method for calling functions that
303
        are too far away to be addressable by a direct `call`
304
        instruction.
305
        "#,
306
            &formats.func_addr,
307
        )
308
        .operands_in(vec![
309
            Operand::new("FN", &entities.func_ref)
310
                .with_doc("function to call, declared by `function`"),
311
        ])
312
        .operands_out(vec![Operand::new("addr", iAddr)]),
313
    );
314

315
    ig.push(
316
        Inst::new(
317
            "try_call",
318
            r#"
319
        Call a function, catching the specified exceptions.
320

321
        Call the function pointed to by `callee` with the given arguments. On
322
        normal return, branch to the first target, with function returns
323
        available as `retN` block arguments. On exceptional return,
324
        look up the thrown exception tag in the provided exception table;
325
        if the tag matches one of the targets, branch to the matching
326
        target with the exception payloads available as `exnN` block arguments.
327
        If no tag matches, then propagate the exception up the stack.
328

329
        It is the Cranelift embedder's responsibility to define the meaning
330
        of tags: they are accepted by this instruction and passed through
331
        to unwind metadata tables in Cranelift's output. Actual unwinding is
332
        outside the purview of the core Cranelift compiler.
333

334
        Payload values on exception are passed in fixed register(s) that are
335
        defined by the platform and ABI. See the documentation on `CallConv`
336
        for details.
337
        "#,
338
            &formats.try_call,
339
        )
340
        .operands_in(vec![
341
            Operand::new("callee", &entities.func_ref)
342
                .with_doc("function to call, declared by `function`"),
343
            Operand::new("args", &entities.varargs).with_doc("call arguments"),
344
            Operand::new("ET", &entities.exception_table).with_doc("exception table"),
345
        ])
346
        .call()
347
        .branches(),
348
    );
349

350
    ig.push(
351
        Inst::new(
352
            "try_call_indirect",
353
            r#"
354
        Call a function, catching the specified exceptions.
355

356
        Call the function pointed to by `callee` with the given arguments. On
357
        normal return, branch to the first target, with function returns
358
        available as `retN` block arguments. On exceptional return,
359
        look up the thrown exception tag in the provided exception table;
360
        if the tag matches one of the targets, branch to the matching
361
        target with the exception payloads available as `exnN` block arguments.
362
        If no tag matches, then propagate the exception up the stack.
363

364
        It is the Cranelift embedder's responsibility to define the meaning
365
        of tags: they are accepted by this instruction and passed through
366
        to unwind metadata tables in Cranelift's output. Actual unwinding is
367
        outside the purview of the core Cranelift compiler.
368

369
        Payload values on exception are passed in fixed register(s) that are
370
        defined by the platform and ABI. See the documentation on `CallConv`
371
        for details.
372
        "#,
373
            &formats.try_call_indirect,
374
        )
375
        .operands_in(vec![
376
            Operand::new("callee", iAddr).with_doc("address of function to call"),
377
            Operand::new("args", &entities.varargs).with_doc("call arguments"),
378
            Operand::new("ET", &entities.exception_table).with_doc("exception table"),
379
        ])
380
        .call()
381
        .branches(),
382
    );
383
}
384

385
#[inline(never)]
386
fn define_simd_lane_access(
387
    ig: &mut InstructionGroupBuilder,
388
    formats: &Formats,
389
    imm: &Immediates,
390
    _: &EntityRefs,
391
) {
392
    let TxN = &TypeVar::new(
393
        "TxN",
394
        "A SIMD vector type",
395
        TypeSetBuilder::new()
396
            .ints(Interval::All)
397
            .floats(Interval::All)
398
            .simd_lanes(Interval::All)
399
            .dynamic_simd_lanes(Interval::All)
400
            .includes_scalars(false)
401
            .build(),
402
    );
403

404
    ig.push(
405
        Inst::new(
406
            "splat",
407
            r#"
408
        Vector splat.
409

410
        Return a vector whose lanes are all ``x``.
411
        "#,
412
            &formats.unary,
413
        )
414
        .operands_in(vec![
415
            Operand::new("x", &TxN.lane_of()).with_doc("Value to splat to all lanes"),
416
        ])
417
        .operands_out(vec![Operand::new("a", TxN)]),
418
    );
419

420
    let I8x16 = &TypeVar::new(
421
        "I8x16",
422
        "A SIMD vector type consisting of 16 lanes of 8-bit integers",
423
        TypeSetBuilder::new()
424
            .ints(8..8)
425
            .simd_lanes(16..16)
426
            .includes_scalars(false)
427
            .build(),
428
    );
429

430
    ig.push(
431
        Inst::new(
432
            "swizzle",
433
            r#"
434
        Vector swizzle.
435

436
        Returns a new vector with byte-width lanes selected from the lanes of the first input
437
        vector ``x`` specified in the second input vector ``s``. The indices ``i`` in range
438
        ``[0, 15]`` select the ``i``-th element of ``x``. For indices outside of the range the
439
        resulting lane is 0. Note that this operates on byte-width lanes.
440
        "#,
441
            &formats.binary,
442
        )
443
        .operands_in(vec![
444
            Operand::new("x", I8x16).with_doc("Vector to modify by re-arranging lanes"),
445
            Operand::new("y", I8x16).with_doc("Mask for re-arranging lanes"),
446
        ])
447
        .operands_out(vec![Operand::new("a", I8x16)]),
448
    );
449

450
    ig.push(
451
        Inst::new(
452
            "x86_pshufb",
453
            r#"
454
        A vector swizzle lookalike which has the semantics of `pshufb` on x64.
455

456
        This instruction will permute the 8-bit lanes of `x` with the indices
457
        specified in `y`. Each lane in the mask, `y`, uses the bottom four
458
        bits for selecting the lane from `x` unless the most significant bit
459
        is set, in which case the lane is zeroed. The output vector will have
460
        the following contents when the element of `y` is in these ranges:
461

462
        * `[0, 127]` -> `x[y[i] % 16]`
463
        * `[128, 255]` -> 0
464
        "#,
465
            &formats.binary,
466
        )
467
        .operands_in(vec![
468
            Operand::new("x", I8x16).with_doc("Vector to modify by re-arranging lanes"),
469
            Operand::new("y", I8x16).with_doc("Mask for re-arranging lanes"),
470
        ])
471
        .operands_out(vec![Operand::new("a", I8x16)]),
472
    );
473

474
    ig.push(
475
        Inst::new(
476
            "insertlane",
477
            r#"
478
        Insert ``y`` as lane ``Idx`` in x.
479

480
        The lane index, ``Idx``, is an immediate value, not an SSA value. It
481
        must indicate a valid lane index for the type of ``x``.
482
        "#,
483
            &formats.ternary_imm8,
484
        )
485
        .operands_in(vec![
486
            Operand::new("x", TxN).with_doc("The vector to modify"),
487
            Operand::new("y", &TxN.lane_of()).with_doc("New lane value"),
488
            Operand::new("Idx", &imm.uimm8).with_doc("Lane index"),
489
        ])
490
        .operands_out(vec![Operand::new("a", TxN)]),
491
    );
492

493
    ig.push(
494
        Inst::new(
495
            "extractlane",
496
            r#"
497
        Extract lane ``Idx`` from ``x``.
498

499
        The lane index, ``Idx``, is an immediate value, not an SSA value. It
500
        must indicate a valid lane index for the type of ``x``. Note that the upper bits of ``a``
501
        may or may not be zeroed depending on the ISA but the type system should prevent using
502
        ``a`` as anything other than the extracted value.
503
        "#,
504
            &formats.binary_imm8,
505
        )
506
        .operands_in(vec![
507
            Operand::new("x", TxN),
508
            Operand::new("Idx", &imm.uimm8).with_doc("Lane index"),
509
        ])
510
        .operands_out(vec![Operand::new("a", &TxN.lane_of())]),
511
    );
512
}
513

514
#[inline(never)]
515
fn define_simd_arithmetic(
516
    ig: &mut InstructionGroupBuilder,
517
    formats: &Formats,
518
    _: &Immediates,
519
    _: &EntityRefs,
520
) {
521
    let Int = &TypeVar::new(
522
        "Int",
523
        "A scalar or vector integer type",
524
        TypeSetBuilder::new()
525
            .ints(Interval::All)
526
            .simd_lanes(Interval::All)
527
            .build(),
528
    );
529

530
    ig.push(
531
        Inst::new(
532
            "smin",
533
            r#"
534
        Signed integer minimum.
535
        "#,
536
            &formats.binary,
537
        )
538
        .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)])
539
        .operands_out(vec![Operand::new("a", Int)]),
540
    );
541

542
    ig.push(
543
        Inst::new(
544
            "umin",
545
            r#"
546
        Unsigned integer minimum.
547
        "#,
548
            &formats.binary,
549
        )
550
        .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)])
551
        .operands_out(vec![Operand::new("a", Int)]),
552
    );
553

554
    ig.push(
555
        Inst::new(
556
            "smax",
557
            r#"
558
        Signed integer maximum.
559
        "#,
560
            &formats.binary,
561
        )
562
        .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)])
563
        .operands_out(vec![Operand::new("a", Int)]),
564
    );
565

566
    ig.push(
567
        Inst::new(
568
            "umax",
569
            r#"
570
        Unsigned integer maximum.
571
        "#,
572
            &formats.binary,
573
        )
574
        .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)])
575
        .operands_out(vec![Operand::new("a", Int)]),
576
    );
577

578
    let IxN = &TypeVar::new(
579
        "IxN",
580
        "A SIMD vector type containing integers",
581
        TypeSetBuilder::new()
582
            .ints(Interval::All)
583
            .simd_lanes(Interval::All)
584
            .includes_scalars(false)
585
            .build(),
586
    );
587

588
    ig.push(
589
        Inst::new(
590
            "avg_round",
591
            r#"
592
        Unsigned average with rounding: `a := (x + y + 1) // 2`
593

594
        The addition does not lose any information (such as from overflow).
595
        "#,
596
            &formats.binary,
597
        )
598
        .operands_in(vec![Operand::new("x", IxN), Operand::new("y", IxN)])
599
        .operands_out(vec![Operand::new("a", IxN)]),
600
    );
601

602
    ig.push(
603
        Inst::new(
604
            "uadd_sat",
605
            r#"
606
        Add with unsigned saturation.
607

608
        This is similar to `iadd` but the operands are interpreted as unsigned integers and their
609
        summed result, instead of wrapping, will be saturated to the highest unsigned integer for
610
        the controlling type (e.g. `0xFF` for i8).
611
        "#,
612
            &formats.binary,
613
        )
614
        .operands_in(vec![Operand::new("x", IxN), Operand::new("y", IxN)])
615
        .operands_out(vec![Operand::new("a", IxN)]),
616
    );
617

618
    ig.push(
619
        Inst::new(
620
            "sadd_sat",
621
            r#"
622
        Add with signed saturation.
623

624
        This is similar to `iadd` but the operands are interpreted as signed integers and their
625
        summed result, instead of wrapping, will be saturated to the lowest or highest
626
        signed integer for the controlling type (e.g. `0x80` or `0x7F` for i8). For example,
627
        since an `sadd_sat.i8` of `0x70` and `0x70` is greater than `0x7F`, the result will be
628
        clamped to `0x7F`.
629
        "#,
630
            &formats.binary,
631
        )
632
        .operands_in(vec![Operand::new("x", IxN), Operand::new("y", IxN)])
633
        .operands_out(vec![Operand::new("a", IxN)]),
634
    );
635

636
    ig.push(
637
        Inst::new(
638
            "usub_sat",
639
            r#"
640
        Subtract with unsigned saturation.
641

642
        This is similar to `isub` but the operands are interpreted as unsigned integers and their
643
        difference, instead of wrapping, will be saturated to the lowest unsigned integer for
644
        the controlling type (e.g. `0x00` for i8).
645
        "#,
646
            &formats.binary,
647
        )
648
        .operands_in(vec![Operand::new("x", IxN), Operand::new("y", IxN)])
649
        .operands_out(vec![Operand::new("a", IxN)]),
650
    );
651

652
    ig.push(
653
        Inst::new(
654
            "ssub_sat",
655
            r#"
656
        Subtract with signed saturation.
657

658
        This is similar to `isub` but the operands are interpreted as signed integers and their
659
        difference, instead of wrapping, will be saturated to the lowest or highest
660
        signed integer for the controlling type (e.g. `0x80` or `0x7F` for i8).
661
        "#,
662
            &formats.binary,
663
        )
664
        .operands_in(vec![Operand::new("x", IxN), Operand::new("y", IxN)])
665
        .operands_out(vec![Operand::new("a", IxN)]),
666
    );
667
}
668

669
pub(crate) fn define(
670
    all_instructions: &mut AllInstructions,
671
    formats: &Formats,
672
    imm: &Immediates,
673
    entities: &EntityRefs,
674
) {
675
    let mut ig = InstructionGroupBuilder::new(all_instructions);
676

677
    define_control_flow(&mut ig, formats, imm, entities);
678
    define_simd_lane_access(&mut ig, formats, imm, entities);
679
    define_simd_arithmetic(&mut ig, formats, imm, entities);
680

681
    // Operand kind shorthands.
682
    let i8: &TypeVar = &ValueType::from(LaneType::from(types::Int::I8)).into();
683
    let f16_: &TypeVar = &ValueType::from(LaneType::from(types::Float::F16)).into();
684
    let f32_: &TypeVar = &ValueType::from(LaneType::from(types::Float::F32)).into();
685
    let f64_: &TypeVar = &ValueType::from(LaneType::from(types::Float::F64)).into();
686
    let f128_: &TypeVar = &ValueType::from(LaneType::from(types::Float::F128)).into();
687

688
    // Starting definitions.
689
    let Int = &TypeVar::new(
690
        "Int",
691
        "A scalar or vector integer type",
692
        TypeSetBuilder::new()
693
            .ints(Interval::All)
694
            .simd_lanes(Interval::All)
695
            .dynamic_simd_lanes(Interval::All)
696
            .build(),
697
    );
698

699
    let NarrowInt = &TypeVar::new(
700
        "NarrowInt",
701
        "An integer type of width up to `i64`",
702
        TypeSetBuilder::new().ints(8..64).build(),
703
    );
704

705
    let ScalarTruthy = &TypeVar::new(
706
        "ScalarTruthy",
707
        "A scalar truthy type",
708
        TypeSetBuilder::new().ints(Interval::All).build(),
709
    );
710

711
    let iB = &TypeVar::new(
712
        "iB",
713
        "A scalar integer type",
714
        TypeSetBuilder::new().ints(Interval::All).build(),
715
    );
716

717
    let iSwappable = &TypeVar::new(
718
        "iSwappable",
719
        "A multi byte scalar integer type",
720
        TypeSetBuilder::new().ints(16..128).build(),
721
    );
722

723
    let iAddr = &TypeVar::new(
724
        "iAddr",
725
        "An integer address type",
726
        TypeSetBuilder::new().ints(32..64).build(),
727
    );
728

729
    let TxN = &TypeVar::new(
730
        "TxN",
731
        "A SIMD vector type",
732
        TypeSetBuilder::new()
733
            .ints(Interval::All)
734
            .floats(Interval::All)
735
            .simd_lanes(Interval::All)
736
            .includes_scalars(false)
737
            .build(),
738
    );
739
    let Any = &TypeVar::new(
740
        "Any",
741
        "Any integer, float, or reference scalar or vector type",
742
        TypeSetBuilder::new()
743
            .ints(Interval::All)
744
            .floats(Interval::All)
745
            .simd_lanes(Interval::All)
746
            .includes_scalars(true)
747
            .build(),
748
    );
749

750
    let Mem = &TypeVar::new(
751
        "Mem",
752
        "Any type that can be stored in memory",
753
        TypeSetBuilder::new()
754
            .ints(Interval::All)
755
            .floats(Interval::All)
756
            .simd_lanes(Interval::All)
757
            .dynamic_simd_lanes(Interval::All)
758
            .build(),
759
    );
760

761
    let MemTo = &TypeVar::copy_from(Mem, "MemTo".to_string());
762

763
    ig.push(
764
        Inst::new(
765
            "load",
766
            r#"
767
        Load from memory at ``p + Offset``.
768

769
        This is a polymorphic instruction that can load any value type which
770
        has a memory representation.
771
        "#,
772
            &formats.load,
773
        )
774
        .operands_in(vec![
775
            Operand::new("MemFlags", &imm.memflags),
776
            Operand::new("p", iAddr),
777
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
778
        ])
779
        .operands_out(vec![Operand::new("a", Mem).with_doc("Value loaded")])
780
        .can_load(),
781
    );
782

783
    ig.push(
784
        Inst::new(
785
            "store",
786
            r#"
787
        Store ``x`` to memory at ``p + Offset``.
788

789
        This is a polymorphic instruction that can store any value type with a
790
        memory representation.
791
        "#,
792
            &formats.store,
793
        )
794
        .operands_in(vec![
795
            Operand::new("MemFlags", &imm.memflags),
796
            Operand::new("x", Mem).with_doc("Value to be stored"),
797
            Operand::new("p", iAddr),
798
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
799
        ])
800
        .can_store(),
801
    );
802

803
    let iExt8 = &TypeVar::new(
804
        "iExt8",
805
        "An integer type with more than 8 bits",
806
        TypeSetBuilder::new().ints(16..64).build(),
807
    );
808

809
    ig.push(
810
        Inst::new(
811
            "uload8",
812
            r#"
813
        Load 8 bits from memory at ``p + Offset`` and zero-extend.
814

815
        This is equivalent to ``load.i8`` followed by ``uextend``.
816
        "#,
817
            &formats.load,
818
        )
819
        .operands_in(vec![
820
            Operand::new("MemFlags", &imm.memflags),
821
            Operand::new("p", iAddr),
822
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
823
        ])
824
        .operands_out(vec![Operand::new("a", iExt8)])
825
        .can_load(),
826
    );
827

828
    ig.push(
829
        Inst::new(
830
            "sload8",
831
            r#"
832
        Load 8 bits from memory at ``p + Offset`` and sign-extend.
833

834
        This is equivalent to ``load.i8`` followed by ``sextend``.
835
        "#,
836
            &formats.load,
837
        )
838
        .operands_in(vec![
839
            Operand::new("MemFlags", &imm.memflags),
840
            Operand::new("p", iAddr),
841
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
842
        ])
843
        .operands_out(vec![Operand::new("a", iExt8)])
844
        .can_load(),
845
    );
846

847
    ig.push(
848
        Inst::new(
849
            "istore8",
850
            r#"
851
        Store the low 8 bits of ``x`` to memory at ``p + Offset``.
852

853
        This is equivalent to ``ireduce.i8`` followed by ``store.i8``.
854
        "#,
855
            &formats.store,
856
        )
857
        .operands_in(vec![
858
            Operand::new("MemFlags", &imm.memflags),
859
            Operand::new("x", iExt8),
860
            Operand::new("p", iAddr),
861
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
862
        ])
863
        .can_store(),
864
    );
865

866
    let iExt16 = &TypeVar::new(
867
        "iExt16",
868
        "An integer type with more than 16 bits",
869
        TypeSetBuilder::new().ints(32..64).build(),
870
    );
871

872
    ig.push(
873
        Inst::new(
874
            "uload16",
875
            r#"
876
        Load 16 bits from memory at ``p + Offset`` and zero-extend.
877

878
        This is equivalent to ``load.i16`` followed by ``uextend``.
879
        "#,
880
            &formats.load,
881
        )
882
        .operands_in(vec![
883
            Operand::new("MemFlags", &imm.memflags),
884
            Operand::new("p", iAddr),
885
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
886
        ])
887
        .operands_out(vec![Operand::new("a", iExt16)])
888
        .can_load(),
889
    );
890

891
    ig.push(
892
        Inst::new(
893
            "sload16",
894
            r#"
895
        Load 16 bits from memory at ``p + Offset`` and sign-extend.
896

897
        This is equivalent to ``load.i16`` followed by ``sextend``.
898
        "#,
899
            &formats.load,
900
        )
901
        .operands_in(vec![
902
            Operand::new("MemFlags", &imm.memflags),
903
            Operand::new("p", iAddr),
904
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
905
        ])
906
        .operands_out(vec![Operand::new("a", iExt16)])
907
        .can_load(),
908
    );
909

910
    ig.push(
911
        Inst::new(
912
            "istore16",
913
            r#"
914
        Store the low 16 bits of ``x`` to memory at ``p + Offset``.
915

916
        This is equivalent to ``ireduce.i16`` followed by ``store.i16``.
917
        "#,
918
            &formats.store,
919
        )
920
        .operands_in(vec![
921
            Operand::new("MemFlags", &imm.memflags),
922
            Operand::new("x", iExt16),
923
            Operand::new("p", iAddr),
924
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
925
        ])
926
        .can_store(),
927
    );
928

929
    let iExt32 = &TypeVar::new(
930
        "iExt32",
931
        "An integer type with more than 32 bits",
932
        TypeSetBuilder::new().ints(64..64).build(),
933
    );
934

935
    ig.push(
936
        Inst::new(
937
            "uload32",
938
            r#"
939
        Load 32 bits from memory at ``p + Offset`` and zero-extend.
940

941
        This is equivalent to ``load.i32`` followed by ``uextend``.
942
        "#,
943
            &formats.load,
944
        )
945
        .operands_in(vec![
946
            Operand::new("MemFlags", &imm.memflags),
947
            Operand::new("p", iAddr),
948
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
949
        ])
950
        .operands_out(vec![Operand::new("a", iExt32)])
951
        .can_load(),
952
    );
953

954
    ig.push(
955
        Inst::new(
956
            "sload32",
957
            r#"
958
        Load 32 bits from memory at ``p + Offset`` and sign-extend.
959

960
        This is equivalent to ``load.i32`` followed by ``sextend``.
961
        "#,
962
            &formats.load,
963
        )
964
        .operands_in(vec![
965
            Operand::new("MemFlags", &imm.memflags),
966
            Operand::new("p", iAddr),
967
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
968
        ])
969
        .operands_out(vec![Operand::new("a", iExt32)])
970
        .can_load(),
971
    );
972

973
    ig.push(
974
        Inst::new(
975
            "istore32",
976
            r#"
977
        Store the low 32 bits of ``x`` to memory at ``p + Offset``.
978

979
        This is equivalent to ``ireduce.i32`` followed by ``store.i32``.
980
        "#,
981
            &formats.store,
982
        )
983
        .operands_in(vec![
984
            Operand::new("MemFlags", &imm.memflags),
985
            Operand::new("x", iExt32),
986
            Operand::new("p", iAddr),
987
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
988
        ])
989
        .can_store(),
990
    );
991
    ig.push(
992
        Inst::new(
993
            "stack_switch",
994
            r#"
995
        Suspends execution of the current stack and resumes execution of another
996
        one.
997

998
        The target stack to switch to is identified by the data stored at
999
        ``load_context_ptr``. Before switching, this instruction stores
1000
        analogous information about the
1001
        current (i.e., original) stack at ``store_context_ptr``, to
1002
        enabled switching back to the original stack at a later point.
1003

1004
        The size, alignment and layout of the information stored at
1005
        ``load_context_ptr`` and ``store_context_ptr`` is platform-dependent.
1006
        The instruction assumes that ``load_context_ptr`` and
1007
        ``store_context_ptr`` are valid pointers to memory with said layout and
1008
        alignment, and does not perform any checks on these pointers or the data
1009
        stored there.
1010

1011
        The instruction is experimental and only supported on x64 Linux at the
1012
        moment.
1013

1014
        When switching from a stack A to a stack B, one of the following cases
1015
        must apply:
1016
        1. Stack B was previously suspended using a ``stack_switch`` instruction.
1017
        2. Stack B is a newly initialized stack. The necessary initialization is
1018
        platform-dependent and will generally involve running some kind of
1019
        trampoline to start execution of a function on the new stack.
1020

1021
        In both cases, the ``in_payload`` argument of the ``stack_switch``
1022
        instruction executed on A is passed to stack B. In the first case above,
1023
        it will be the result value of the earlier ``stack_switch`` instruction
1024
        executed on stack B. In the second case, the value will be accessible to
1025
        the trampoline in a platform-dependent register.
1026

1027
        The pointers ``load_context_ptr`` and ``store_context_ptr`` are allowed
1028
        to be equal; the instruction ensures that all data is loaded from the
1029
        former before writing to the latter.
1030

1031
        Stack switching is one-shot in the sense that each ``stack_switch``
1032
        operation effectively consumes the context identified by
1033
        ``load_context_ptr``. In other words, performing two ``stack_switches``
1034
        using the same ``load_context_ptr`` causes undefined behavior, unless
1035
        the context at ``load_context_ptr`` is overwritten by another
1036
        `stack_switch` in between.
1037
        "#,
1038
            &formats.ternary,
1039
        )
1040
        .operands_in(vec![
1041
            Operand::new("store_context_ptr", iAddr),
1042
            Operand::new("load_context_ptr", iAddr),
1043
            Operand::new("in_payload0", iAddr),
1044
        ])
1045
        .operands_out(vec![Operand::new("out_payload0", iAddr)])
1046
        .other_side_effects()
1047
        .can_load()
1048
        .can_store()
1049
        .call(),
1050
    );
1051

1052
    let I16x8 = &TypeVar::new(
1053
        "I16x8",
1054
        "A SIMD vector with exactly 8 lanes of 16-bit values",
1055
        TypeSetBuilder::new()
1056
            .ints(16..16)
1057
            .simd_lanes(8..8)
1058
            .includes_scalars(false)
1059
            .build(),
1060
    );
1061

1062
    ig.push(
1063
        Inst::new(
1064
            "uload8x8",
1065
            r#"
1066
        Load an 8x8 vector (64 bits) from memory at ``p + Offset`` and zero-extend into an i16x8
1067
        vector.
1068
        "#,
1069
            &formats.load,
1070
        )
1071
        .operands_in(vec![
1072
            Operand::new("MemFlags", &imm.memflags),
1073
            Operand::new("p", iAddr),
1074
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
1075
        ])
1076
        .operands_out(vec![Operand::new("a", I16x8).with_doc("Value loaded")])
1077
        .can_load(),
1078
    );
1079

1080
    ig.push(
1081
        Inst::new(
1082
            "sload8x8",
1083
            r#"
1084
        Load an 8x8 vector (64 bits) from memory at ``p + Offset`` and sign-extend into an i16x8
1085
        vector.
1086
        "#,
1087
            &formats.load,
1088
        )
1089
        .operands_in(vec![
1090
            Operand::new("MemFlags", &imm.memflags),
1091
            Operand::new("p", iAddr),
1092
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
1093
        ])
1094
        .operands_out(vec![Operand::new("a", I16x8).with_doc("Value loaded")])
1095
        .can_load(),
1096
    );
1097

1098
    let I32x4 = &TypeVar::new(
1099
        "I32x4",
1100
        "A SIMD vector with exactly 4 lanes of 32-bit values",
1101
        TypeSetBuilder::new()
1102
            .ints(32..32)
1103
            .simd_lanes(4..4)
1104
            .includes_scalars(false)
1105
            .build(),
1106
    );
1107

1108
    ig.push(
1109
        Inst::new(
1110
            "uload16x4",
1111
            r#"
1112
        Load a 16x4 vector (64 bits) from memory at ``p + Offset`` and zero-extend into an i32x4
1113
        vector.
1114
        "#,
1115
            &formats.load,
1116
        )
1117
        .operands_in(vec![
1118
            Operand::new("MemFlags", &imm.memflags),
1119
            Operand::new("p", iAddr),
1120
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
1121
        ])
1122
        .operands_out(vec![Operand::new("a", I32x4).with_doc("Value loaded")])
1123
        .can_load(),
1124
    );
1125

1126
    ig.push(
1127
        Inst::new(
1128
            "sload16x4",
1129
            r#"
1130
        Load a 16x4 vector (64 bits) from memory at ``p + Offset`` and sign-extend into an i32x4
1131
        vector.
1132
        "#,
1133
            &formats.load,
1134
        )
1135
        .operands_in(vec![
1136
            Operand::new("MemFlags", &imm.memflags),
1137
            Operand::new("p", iAddr),
1138
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
1139
        ])
1140
        .operands_out(vec![Operand::new("a", I32x4).with_doc("Value loaded")])
1141
        .can_load(),
1142
    );
1143

1144
    let I64x2 = &TypeVar::new(
1145
        "I64x2",
1146
        "A SIMD vector with exactly 2 lanes of 64-bit values",
1147
        TypeSetBuilder::new()
1148
            .ints(64..64)
1149
            .simd_lanes(2..2)
1150
            .includes_scalars(false)
1151
            .build(),
1152
    );
1153

1154
    ig.push(
1155
        Inst::new(
1156
            "uload32x2",
1157
            r#"
1158
        Load an 32x2 vector (64 bits) from memory at ``p + Offset`` and zero-extend into an i64x2
1159
        vector.
1160
        "#,
1161
            &formats.load,
1162
        )
1163
        .operands_in(vec![
1164
            Operand::new("MemFlags", &imm.memflags),
1165
            Operand::new("p", iAddr),
1166
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
1167
        ])
1168
        .operands_out(vec![Operand::new("a", I64x2).with_doc("Value loaded")])
1169
        .can_load(),
1170
    );
1171

1172
    ig.push(
1173
        Inst::new(
1174
            "sload32x2",
1175
            r#"
1176
        Load a 32x2 vector (64 bits) from memory at ``p + Offset`` and sign-extend into an i64x2
1177
        vector.
1178
        "#,
1179
            &formats.load,
1180
        )
1181
        .operands_in(vec![
1182
            Operand::new("MemFlags", &imm.memflags),
1183
            Operand::new("p", iAddr),
1184
            Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"),
1185
        ])
1186
        .operands_out(vec![Operand::new("a", I64x2).with_doc("Value loaded")])
1187
        .can_load(),
1188
    );
1189

1190
    ig.push(
1191
        Inst::new(
1192
            "stack_load",
1193
            r#"
1194
        Load a value from a stack slot at the constant offset.
1195

1196
        This is a polymorphic instruction that can load any value type which
1197
        has a memory representation.
1198

1199
        The offset is an immediate constant, not an SSA value. The memory
1200
        access cannot go out of bounds, i.e.
1201
        `sizeof(a) + Offset <= sizeof(SS)`.
1202
        "#,
1203
            &formats.stack_load,
1204
        )
1205
        .operands_in(vec![
1206
            Operand::new("SS", &entities.stack_slot),
1207
            Operand::new("Offset", &imm.offset32).with_doc("In-bounds offset into stack slot"),
1208
        ])
1209
        .operands_out(vec![Operand::new("a", Mem).with_doc("Value loaded")])
1210
        .can_load(),
1211
    );
1212

1213
    ig.push(
1214
        Inst::new(
1215
            "stack_store",
1216
            r#"
1217
        Store a value to a stack slot at a constant offset.
1218

1219
        This is a polymorphic instruction that can store any value type with a
1220
        memory representation.
1221

1222
        The offset is an immediate constant, not an SSA value. The memory
1223
        access cannot go out of bounds, i.e.
1224
        `sizeof(a) + Offset <= sizeof(SS)`.
1225
        "#,
1226
            &formats.stack_store,
1227
        )
1228
        .operands_in(vec![
1229
            Operand::new("x", Mem).with_doc("Value to be stored"),
1230
            Operand::new("SS", &entities.stack_slot),
1231
            Operand::new("Offset", &imm.offset32).with_doc("In-bounds offset into stack slot"),
1232
        ])
1233
        .can_store(),
1234
    );
1235

1236
    ig.push(
1237
        Inst::new(
1238
            "stack_addr",
1239
            r#"
1240
        Get the address of a stack slot.
1241

1242
        Compute the absolute address of a byte in a stack slot. The offset must
1243
        refer to a byte inside the stack slot:
1244
        `0 <= Offset < sizeof(SS)`.
1245
        "#,
1246
            &formats.stack_load,
1247
        )
1248
        .operands_in(vec![
1249
            Operand::new("SS", &entities.stack_slot),
1250
            Operand::new("Offset", &imm.offset32).with_doc("In-bounds offset into stack slot"),
1251
        ])
1252
        .operands_out(vec![Operand::new("addr", iAddr)]),
1253
    );
1254

1255
    ig.push(
1256
        Inst::new(
1257
            "dynamic_stack_load",
1258
            r#"
1259
        Load a value from a dynamic stack slot.
1260

1261
        This is a polymorphic instruction that can load any value type which
1262
        has a memory representation.
1263
        "#,
1264
            &formats.dynamic_stack_load,
1265
        )
1266
        .operands_in(vec![Operand::new("DSS", &entities.dynamic_stack_slot)])
1267
        .operands_out(vec![Operand::new("a", Mem).with_doc("Value loaded")])
1268
        .can_load(),
1269
    );
1270

1271
    ig.push(
1272
        Inst::new(
1273
            "dynamic_stack_store",
1274
            r#"
1275
        Store a value to a dynamic stack slot.
1276

1277
        This is a polymorphic instruction that can store any dynamic value type with a
1278
        memory representation.
1279
        "#,
1280
            &formats.dynamic_stack_store,
1281
        )
1282
        .operands_in(vec![
1283
            Operand::new("x", Mem).with_doc("Value to be stored"),
1284
            Operand::new("DSS", &entities.dynamic_stack_slot),
1285
        ])
1286
        .can_store(),
1287
    );
1288

1289
    ig.push(
1290
        Inst::new(
1291
            "dynamic_stack_addr",
1292
            r#"
1293
        Get the address of a dynamic stack slot.
1294

1295
        Compute the absolute address of the first byte of a dynamic stack slot.
1296
        "#,
1297
            &formats.dynamic_stack_load,
1298
        )
1299
        .operands_in(vec![Operand::new("DSS", &entities.dynamic_stack_slot)])
1300
        .operands_out(vec![Operand::new("addr", iAddr)]),
1301
    );
1302

1303
    ig.push(
1304
        Inst::new(
1305
            "global_value",
1306
            r#"
1307
        Compute the value of global GV.
1308
        "#,
1309
            &formats.unary_global_value,
1310
        )
1311
        .operands_in(vec![Operand::new("GV", &entities.global_value)])
1312
        .operands_out(vec![Operand::new("a", Mem).with_doc("Value loaded")]),
1313
    );
1314

1315
    ig.push(
1316
        Inst::new(
1317
            "symbol_value",
1318
            r#"
1319
        Compute the value of global GV, which is a symbolic value.
1320
        "#,
1321
            &formats.unary_global_value,
1322
        )
1323
        .operands_in(vec![Operand::new("GV", &entities.global_value)])
1324
        .operands_out(vec![Operand::new("a", Mem).with_doc("Value loaded")]),
1325
    );
1326

1327
    ig.push(
1328
        Inst::new(
1329
            "tls_value",
1330
            r#"
1331
        Compute the value of global GV, which is a TLS (thread local storage) value.
1332
        "#,
1333
            &formats.unary_global_value,
1334
        )
1335
        .operands_in(vec![Operand::new("GV", &entities.global_value)])
1336
        .operands_out(vec![Operand::new("a", Mem).with_doc("Value loaded")]),
1337
    );
1338

1339
    // Note this instruction is marked as having other side-effects, so GVN won't try to hoist it,
1340
    // which would result in it being subject to spilling. While not hoisting would generally hurt
1341
    // performance, since a computed value used many times may need to be regenerated before each
1342
    // use, it is not the case here: this instruction doesn't generate any code.  That's because,
1343
    // by definition the pinned register is never used by the register allocator, but is written to
1344
    // and read explicitly and exclusively by set_pinned_reg and get_pinned_reg.
1345
    ig.push(
1346
        Inst::new(
1347
            "get_pinned_reg",
1348
            r#"
1349
            Gets the content of the pinned register, when it's enabled.
1350
        "#,
1351
            &formats.nullary,
1352
        )
1353
        .operands_out(vec![Operand::new("addr", iAddr)])
1354
        .other_side_effects(),
1355
    );
1356

1357
    ig.push(
1358
        Inst::new(
1359
            "set_pinned_reg",
1360
            r#"
1361
        Sets the content of the pinned register, when it's enabled.
1362
        "#,
1363
            &formats.unary,
1364
        )
1365
        .operands_in(vec![Operand::new("addr", iAddr)])
1366
        .other_side_effects(),
1367
    );
1368

1369
    ig.push(
1370
        Inst::new(
1371
            "get_frame_pointer",
1372
            r#"
1373
        Get the address in the frame pointer register.
1374

1375
        Usage of this instruction requires setting `preserve_frame_pointers` to `true`.
1376
        "#,
1377
            &formats.nullary,
1378
        )
1379
        .operands_out(vec![Operand::new("addr", iAddr)]),
1380
    );
1381

1382
    ig.push(
1383
        Inst::new(
1384
            "get_stack_pointer",
1385
            r#"
1386
        Get the address in the stack pointer register.
1387
        "#,
1388
            &formats.nullary,
1389
        )
1390
        .operands_out(vec![Operand::new("addr", iAddr)]),
1391
    );
1392

1393
    ig.push(
1394
        Inst::new(
1395
            "get_return_address",
1396
            r#"
1397
        Get the PC where this function will transfer control to when it returns.
1398

1399
        Usage of this instruction requires setting `preserve_frame_pointers` to `true`.
1400
        "#,
1401
            &formats.nullary,
1402
        )
1403
        .operands_out(vec![Operand::new("addr", iAddr)]),
1404
    );
1405

1406
    ig.push(
1407
        Inst::new(
1408
            "get_exception_handler_address",
1409
            r#"
1410
        Get the handler PC for the given exceptional edge for an
1411
        exception return from the given `try_call`-terminated block.
1412

1413
        This instruction provides the PC for the handler resume point,
1414
        as defined by the exception-handling aspect of the given
1415
        callee ABI, for a return from the given calling block.  It can
1416
        be used when the exception unwind mechanism requires manual
1417
        plumbing for this information which must be set up before the call
1418
        itself: for example, if the resume address needs to be stored in
1419
        some context structure for a runtime to resume to on error.
1420

1421
        The given caller block must end in a `try_call` and the given
1422
        exception-handling block must be one of its exceptional
1423
        successors in the associated exception-handling table. The
1424
        returned PC is *only* valid to resume to when the `try_call`
1425
        is on the stack having called the callee; in other words, when
1426
        a normal exception unwinder might otherwise resume to that
1427
        handler.
1428
        "#,
1429
            &formats.exception_handler_address,
1430
        )
1431
        .operands_in(vec![
1432
            Operand::new("block", &entities.raw_block),
1433
            Operand::new("index", &imm.imm64),
1434
        ])
1435
        .operands_out(vec![Operand::new("addr", iAddr)]),
1436
    );
1437

1438
    ig.push(
1439
        Inst::new(
1440
            "iconst",
1441
            r#"
1442
        Integer constant.
1443

1444
        Create a scalar integer SSA value with an immediate constant value, or
1445
        an integer vector where all the lanes have the same value.
1446
        "#,
1447
            &formats.unary_imm,
1448
        )
1449
        .operands_in(vec![Operand::new("N", &imm.imm64)])
1450
        .operands_out(vec![
1451
            Operand::new("a", NarrowInt).with_doc("A constant integer scalar or vector value"),
1452
        ]),
1453
    );
1454

1455
    ig.push(
1456
        Inst::new(
1457
            "f16const",
1458
            r#"
1459
        Floating point constant.
1460

1461
        Create a `f16` SSA value with an immediate constant value.
1462
        "#,
1463
            &formats.unary_ieee16,
1464
        )
1465
        .operands_in(vec![Operand::new("N", &imm.ieee16)])
1466
        .operands_out(vec![
1467
            Operand::new("a", f16_).with_doc("A constant f16 scalar value"),
1468
        ]),
1469
    );
1470

1471
    ig.push(
1472
        Inst::new(
1473
            "f32const",
1474
            r#"
1475
        Floating point constant.
1476

1477
        Create a `f32` SSA value with an immediate constant value.
1478
        "#,
1479
            &formats.unary_ieee32,
1480
        )
1481
        .operands_in(vec![Operand::new("N", &imm.ieee32)])
1482
        .operands_out(vec![
1483
            Operand::new("a", f32_).with_doc("A constant f32 scalar value"),
1484
        ]),
1485
    );
1486

1487
    ig.push(
1488
        Inst::new(
1489
            "f64const",
1490
            r#"
1491
        Floating point constant.
1492

1493
        Create a `f64` SSA value with an immediate constant value.
1494
        "#,
1495
            &formats.unary_ieee64,
1496
        )
1497
        .operands_in(vec![Operand::new("N", &imm.ieee64)])
1498
        .operands_out(vec![
1499
            Operand::new("a", f64_).with_doc("A constant f64 scalar value"),
1500
        ]),
1501
    );
1502

1503
    ig.push(
1504
        Inst::new(
1505
            "f128const",
1506
            r#"
1507
        Floating point constant.
1508

1509
        Create a `f128` SSA value with an immediate constant value.
1510
        "#,
1511
            &formats.unary_const,
1512
        )
1513
        .operands_in(vec![Operand::new("N", &entities.pool_constant)])
1514
        .operands_out(vec![
1515
            Operand::new("a", f128_).with_doc("A constant f128 scalar value"),
1516
        ]),
1517
    );
1518

1519
    ig.push(
1520
        Inst::new(
1521
            "vconst",
1522
            r#"
1523
        SIMD vector constant.
1524

1525
        Construct a vector with the given immediate bytes.
1526
        "#,
1527
            &formats.unary_const,
1528
        )
1529
        .operands_in(vec![
1530
            Operand::new("N", &entities.pool_constant)
1531
                .with_doc("The 16 immediate bytes of a 128-bit vector"),
1532
        ])
1533
        .operands_out(vec![
1534
            Operand::new("a", TxN).with_doc("A constant vector value"),
1535
        ]),
1536
    );
1537

1538
    let Tx16 = &TypeVar::new(
1539
        "Tx16",
1540
        "A SIMD vector with exactly 16 lanes of 8-bit values; eventually this may support other \
1541
         lane counts and widths",
1542
        TypeSetBuilder::new()
1543
            .ints(8..8)
1544
            .simd_lanes(16..16)
1545
            .includes_scalars(false)
1546
            .build(),
1547
    );
1548

1549
    ig.push(
1550
        Inst::new(
1551
            "shuffle",
1552
            r#"
1553
        SIMD vector shuffle.
1554

1555
        Shuffle two vectors using the given immediate bytes. For each of the 16 bytes of the
1556
        immediate, a value i of 0-15 selects the i-th element of the first vector and a value i of
1557
        16-31 selects the (i-16)th element of the second vector. Immediate values outside of the
1558
        0-31 range are not valid.
1559
        "#,
1560
            &formats.shuffle,
1561
        )
1562
        .operands_in(vec![
1563
            Operand::new("a", Tx16).with_doc("A vector value"),
1564
            Operand::new("b", Tx16).with_doc("A vector value"),
1565
            Operand::new("mask", &entities.uimm128)
1566
                .with_doc("The 16 immediate bytes used for selecting the elements to shuffle"),
1567
        ])
1568
        .operands_out(vec![Operand::new("a", Tx16).with_doc("A vector value")]),
1569
    );
1570

1571
    ig.push(Inst::new(
1572
        "nop",
1573
        r#"
1574
        Just a dummy instruction.
1575

1576
        Note: this doesn't compile to a machine code nop.
1577
        "#,
1578
        &formats.nullary,
1579
    ));
1580

1581
    ig.push(
1582
        Inst::new(
1583
            "select",
1584
            r#"
1585
        Conditional select.
1586

1587
        This instruction selects whole values. Use `bitselect` to choose each
1588
        bit according to a mask.
1589
        "#,
1590
            &formats.ternary,
1591
        )
1592
        .operands_in(vec![
1593
            Operand::new("c", ScalarTruthy).with_doc("Controlling value to test"),
1594
            Operand::new("x", Any).with_doc("Value to use when `c` is true"),
1595
            Operand::new("y", Any).with_doc("Value to use when `c` is false"),
1596
        ])
1597
        .operands_out(vec![Operand::new("a", Any)]),
1598
    );
1599

1600
    ig.push(
1601
        Inst::new(
1602
            "select_spectre_guard",
1603
            r#"
1604
            Conditional select intended for Spectre guards.
1605

1606
            This operation is semantically equivalent to a select instruction.
1607
            However, this instruction prohibits all speculation on the
1608
            controlling value when determining which input to use as the result.
1609
            As such, it is suitable for use in Spectre guards.
1610

1611
            For example, on a target which may speculatively execute branches,
1612
            the lowering of this instruction is guaranteed to not conditionally
1613
            branch. Instead it will typically lower to a conditional move
1614
            instruction. (No Spectre-vulnerable processors are known to perform
1615
            value speculation on conditional move instructions.)
1616

1617
            Ensure that the instruction you're trying to protect from Spectre
1618
            attacks has a data dependency on the result of this instruction.
1619
            That prevents an out-of-order CPU from evaluating that instruction
1620
            until the result of this one is known, which in turn will be blocked
1621
            until the controlling value is known.
1622

1623
            Typical usage is to use a bounds-check as the controlling value,
1624
            and select between either a null pointer if the bounds-check
1625
            fails, or an in-bounds address otherwise, so that dereferencing
1626
            the resulting address with a load or store instruction will trap if
1627
            the bounds-check failed. When this instruction is used in this way,
1628
            any microarchitectural side effects of the memory access will only
1629
            occur after the bounds-check finishes, which ensures that no Spectre
1630
            vulnerability will exist.
1631

1632
            Optimization opportunities for this instruction are limited compared
1633
            to a normal select instruction, but it is allowed to be replaced
1634
            by other values which are functionally equivalent as long as doing
1635
            so does not introduce any new opportunities to speculate on the
1636
            controlling value.
1637
            "#,
1638
            &formats.ternary,
1639
        )
1640
        .operands_in(vec![
1641
            Operand::new("c", ScalarTruthy).with_doc("Controlling value to test"),
1642
            Operand::new("x", Any).with_doc("Value to use when `c` is true"),
1643
            Operand::new("y", Any).with_doc("Value to use when `c` is false"),
1644
        ])
1645
        .operands_out(vec![Operand::new("a", Any)]),
1646
    );
1647

1648
    ig.push(
1649
        Inst::new(
1650
            "bitselect",
1651
            r#"
1652
        Conditional select of bits.
1653

1654
        For each bit in `c`, this instruction selects the corresponding bit from `x` if the bit
1655
        in `x` is 1 and the corresponding bit from `y` if the bit in `c` is 0. See also:
1656
        `select`.
1657
        "#,
1658
            &formats.ternary,
1659
        )
1660
        .operands_in(vec![
1661
            Operand::new("c", Any).with_doc("Controlling value to test"),
1662
            Operand::new("x", Any).with_doc("Value to use when `c` is true"),
1663
            Operand::new("y", Any).with_doc("Value to use when `c` is false"),
1664
        ])
1665
        .operands_out(vec![Operand::new("a", Any)]),
1666
    );
1667

1668
    ig.push(
1669
        Inst::new(
1670
            "x86_blendv",
1671
            r#"
1672
        A bitselect-lookalike instruction except with the semantics of
1673
        `blendv`-related instructions on x86.
1674

1675
        This instruction will use the top bit of each lane in `c`, the condition
1676
        mask. If the bit is 1 then the corresponding lane from `x` is chosen.
1677
        Otherwise the corresponding lane from `y` is chosen.
1678

1679
            "#,
1680
            &formats.ternary,
1681
        )
1682
        .operands_in(vec![
1683
            Operand::new("c", Any).with_doc("Controlling value to test"),
1684
            Operand::new("x", Any).with_doc("Value to use when `c` is true"),
1685
            Operand::new("y", Any).with_doc("Value to use when `c` is false"),
1686
        ])
1687
        .operands_out(vec![Operand::new("a", Any)]),
1688
    );
1689

1690
    ig.push(
1691
        Inst::new(
1692
            "vany_true",
1693
            r#"
1694
        Reduce a vector to a scalar boolean.
1695

1696
        Return a scalar boolean true if any lane in ``a`` is non-zero, false otherwise.
1697
        "#,
1698
            &formats.unary,
1699
        )
1700
        .operands_in(vec![Operand::new("a", TxN)])
1701
        .operands_out(vec![Operand::new("s", i8)]),
1702
    );
1703

1704
    ig.push(
1705
        Inst::new(
1706
            "vall_true",
1707
            r#"
1708
        Reduce a vector to a scalar boolean.
1709

1710
        Return a scalar boolean true if all lanes in ``i`` are non-zero, false otherwise.
1711
        "#,
1712
            &formats.unary,
1713
        )
1714
        .operands_in(vec![Operand::new("a", TxN)])
1715
        .operands_out(vec![Operand::new("s", i8)]),
1716
    );
1717

1718
    ig.push(
1719
        Inst::new(
1720
            "vhigh_bits",
1721
            r#"
1722
        Reduce a vector to a scalar integer.
1723

1724
        Return a scalar integer, consisting of the concatenation of the most significant bit
1725
        of each lane of ``a``.
1726
        "#,
1727
            &formats.unary,
1728
        )
1729
        .operands_in(vec![Operand::new("a", TxN)])
1730
        .operands_out(vec![Operand::new("x", NarrowInt)]),
1731
    );
1732

1733
    ig.push(
1734
        Inst::new(
1735
            "icmp",
1736
            r#"
1737
        Integer comparison.
1738

1739
        The condition code determines if the operands are interpreted as signed
1740
        or unsigned integers.
1741

1742
        | Signed | Unsigned | Condition             |
1743
        |--------|----------|-----------------------|
1744
        | eq     | eq       | Equal                 |
1745
        | ne     | ne       | Not equal             |
1746
        | slt    | ult      | Less than             |
1747
        | sge    | uge      | Greater than or equal |
1748
        | sgt    | ugt      | Greater than          |
1749
        | sle    | ule      | Less than or equal    |
1750

1751
        When this instruction compares integer vectors, it returns a vector of
1752
        lane-wise comparisons.
1753

1754
        When comparing scalars, the result is:
1755
            - `1` if the condition holds.
1756
            - `0` if the condition does not hold.
1757

1758
        When comparing vectors, the result is:
1759
            - `-1` (i.e. all ones) in each lane where the condition holds.
1760
            - `0` in each lane where the condition does not hold.
1761
        "#,
1762
            &formats.int_compare,
1763
        )
1764
        .operands_in(vec![
1765
            Operand::new("Cond", &imm.intcc),
1766
            Operand::new("x", Int),
1767
            Operand::new("y", Int),
1768
        ])
1769
        .operands_out(vec![Operand::new("a", &Int.as_truthy())]),
1770
    );
1771

1772
    ig.push(
1773
        Inst::new(
1774
            "icmp_imm",
1775
            r#"
1776
        Compare scalar integer to a constant.
1777

1778
        This is the same as the `icmp` instruction, except one operand is
1779
        a sign extended 64 bit immediate constant.
1780

1781
        This instruction can only compare scalars. Use `icmp` for
1782
        lane-wise vector comparisons.
1783
        "#,
1784
            &formats.int_compare_imm,
1785
        )
1786
        .operands_in(vec![
1787
            Operand::new("Cond", &imm.intcc),
1788
            Operand::new("x", iB),
1789
            Operand::new("Y", &imm.imm64),
1790
        ])
1791
        .operands_out(vec![Operand::new("a", i8)]),
1792
    );
1793

1794
    ig.push(
1795
        Inst::new(
1796
            "iadd",
1797
            r#"
1798
        Wrapping integer addition: `a := x + y \pmod{2^B}`.
1799

1800
        This instruction does not depend on the signed/unsigned interpretation
1801
        of the operands.
1802
        "#,
1803
            &formats.binary,
1804
        )
1805
        .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)])
1806
        .operands_out(vec![Operand::new("a", Int)]),
1807
    );
1808

1809
    ig.push(
1810
        Inst::new(
1811
            "isub",
1812
            r#"
1813
        Wrapping integer subtraction: `a := x - y \pmod{2^B}`.
1814

1815
        This instruction does not depend on the signed/unsigned interpretation
1816
        of the operands.
1817
        "#,
1818
            &formats.binary,
1819
        )
1820
        .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)])
1821
        .operands_out(vec![Operand::new("a", Int)]),
1822
    );
1823

1824
    ig.push(
1825
        Inst::new(
1826
            "ineg",
1827
            r#"
1828
        Integer negation: `a := -x \pmod{2^B}`.
1829
        "#,
1830
            &formats.unary,
1831
        )
1832
        .operands_in(vec![Operand::new("x", Int)])
1833
        .operands_out(vec![Operand::new("a", Int)]),
1834
    );
1835

1836
    ig.push(
1837
        Inst::new(
1838
            "iabs",
1839
            r#"
1840
        Integer absolute value with wrapping: `a := |x|`.
1841
        "#,
1842
            &formats.unary,
1843
        )
1844
        .operands_in(vec![Operand::new("x", Int)])
1845
        .operands_out(vec![Operand::new("a", Int)]),
1846
    );
1847

1848
    ig.push(
1849
        Inst::new(
1850
            "imul",
1851
            r#"
1852
        Wrapping integer multiplication: `a := x y \pmod{2^B}`.
1853

1854
        This instruction does not depend on the signed/unsigned interpretation
1855
        of the operands.
1856

1857
        Polymorphic over all integer types (vector and scalar).
1858
        "#,
1859
            &formats.binary,
1860
        )
1861
        .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)])
1862
        .operands_out(vec![Operand::new("a", Int)]),
1863
    );
1864

1865
    ig.push(
1866
        Inst::new(
1867
            "umulhi",
1868
            r#"
1869
        Unsigned integer multiplication, producing the high half of a
1870
        double-length result.
1871

1872
        Polymorphic over all integer types (vector and scalar).
1873
        "#,
1874
            &formats.binary,
1875
        )
1876
        .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)])
1877
        .operands_out(vec![Operand::new("a", Int)]),
1878
    );
1879

1880
    ig.push(
1881
        Inst::new(
1882
            "smulhi",
1883
            r#"
1884
        Signed integer multiplication, producing the high half of a
1885
        double-length result.
1886

1887
        Polymorphic over all integer types (vector and scalar).
1888
        "#,
1889
            &formats.binary,
1890
        )
1891
        .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)])
1892
        .operands_out(vec![Operand::new("a", Int)]),
1893
    );
1894

1895
    let I16or32 = &TypeVar::new(
1896
        "I16or32",
1897
        "A vector integer type with 16- or 32-bit numbers",
1898
        TypeSetBuilder::new().ints(16..32).simd_lanes(4..8).build(),
1899
    );
1900

1901
    ig.push(
1902
        Inst::new(
1903
            "sqmul_round_sat",
1904
            r#"
1905
        Fixed-point multiplication of numbers in the QN format, where N + 1
1906
        is the number bitwidth:
1907
        `a := signed_saturate((x * y + (1 << (Q - 1))) >> Q)`
1908

1909
        Polymorphic over all integer vector types with 16- or 32-bit numbers.
1910
        "#,
1911
            &formats.binary,
1912
        )
1913
        .operands_in(vec![Operand::new("x", I16or32), Operand::new("y", I16or32)])
1914
        .operands_out(vec![Operand::new("a", I16or32)]),
1915
    );
1916

1917
    ig.push(
1918
        Inst::new(
1919
            "x86_pmulhrsw",
1920
            r#"
1921
        A similar instruction to `sqmul_round_sat` except with the semantics
1922
        of x86's `pmulhrsw` instruction.
1923

1924
        This is the same as `sqmul_round_sat` except when both input lanes are
1925
        `i16::MIN`.
1926
        "#,
1927
            &formats.binary,
1928
        )
1929
        .operands_in(vec![Operand::new("x", I16or32), Operand::new("y", I16or32)])
1930
        .operands_out(vec![Operand::new("a", I16or32)]),
1931
    );
1932

1933
    // Integer division and remainder are scalar-only; most
1934
    // hardware does not directly support vector integer division.
1935

1936
    ig.push(
1937
        Inst::new(
1938
            "udiv",
1939
            r#"
1940
        Unsigned integer division: `a := \lfloor {x \over y} \rfloor`.
1941

1942
        This operation traps if the divisor is zero.
1943
        "#,
1944
            &formats.binary,
1945
        )
1946
        .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)])
1947
        .operands_out(vec![Operand::new("a", iB)])
1948
        .can_trap()
1949
        .side_effects_idempotent(),
1950
    );
1951

1952
    ig.push(
1953
        Inst::new(
1954
            "sdiv",
1955
            r#"
1956
        Signed integer division rounded toward zero: `a := sign(xy)
1957
        \lfloor {|x| \over |y|}\rfloor`.
1958

1959
        This operation traps if the divisor is zero, or if the result is not
1960
        representable in `B` bits two's complement. This only happens
1961
        when `x = -2^{B-1}, y = -1`.
1962
        "#,
1963
            &formats.binary,
1964
        )
1965
        .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)])
1966
        .operands_out(vec![Operand::new("a", iB)])
1967
        .can_trap()
1968
        .side_effects_idempotent(),
1969
    );
1970

1971
    ig.push(
1972
        Inst::new(
1973
            "urem",
1974
            r#"
1975
        Unsigned integer remainder.
1976

1977
        This operation traps if the divisor is zero.
1978
        "#,
1979
            &formats.binary,
1980
        )
1981
        .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)])
1982
        .operands_out(vec![Operand::new("a", iB)])
1983
        .can_trap()
1984
        .side_effects_idempotent(),
1985
    );
1986

1987
    ig.push(
1988
        Inst::new(
1989
            "srem",
1990
            r#"
1991
        Signed integer remainder. The result has the sign of the dividend.
1992

1993
        This operation traps if the divisor is zero.
1994
        "#,
1995
            &formats.binary,
1996
        )
1997
        .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)])
1998
        .operands_out(vec![Operand::new("a", iB)])
1999
        .can_trap()
2000
        .side_effects_idempotent(),
2001
    );
2002

2003
    ig.push(
2004
        Inst::new(
2005
            "iadd_imm",
2006
            r#"
2007
        Add immediate integer.
2008

2009
        Same as `iadd`, but one operand is a sign extended 64 bit immediate constant.
2010

2011
        Polymorphic over all scalar integer types, but does not support vector
2012
        types.
2013
        "#,
2014
            &formats.binary_imm64,
2015
        )
2016
        .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)])
2017
        .operands_out(vec![Operand::new("a", iB)]),
2018
    );
2019

2020
    ig.push(
2021
        Inst::new(
2022
            "imul_imm",
2023
            r#"
2024
        Integer multiplication by immediate constant.
2025

2026
        Same as `imul`, but one operand is a sign extended 64 bit immediate constant.
2027

2028
        Polymorphic over all scalar integer types, but does not support vector
2029
        types.
2030
        "#,
2031
            &formats.binary_imm64,
2032
        )
2033
        .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)])
2034
        .operands_out(vec![Operand::new("a", iB)]),
2035
    );
2036

2037
    ig.push(
2038
        Inst::new(
2039
            "udiv_imm",
2040
            r#"
2041
        Unsigned integer division by an immediate constant.
2042

2043
        Same as `udiv`, but one operand is a zero extended 64 bit immediate constant.
2044

2045
        This operation traps if the divisor is zero.
2046
        "#,
2047
            &formats.binary_imm64,
2048
        )
2049
        .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)])
2050
        .operands_out(vec![Operand::new("a", iB)]),
2051
    );
2052

2053
    ig.push(
2054
        Inst::new(
2055
            "sdiv_imm",
2056
            r#"
2057
        Signed integer division by an immediate constant.
2058

2059
        Same as `sdiv`, but one operand is a sign extended 64 bit immediate constant.
2060

2061
        This operation traps if the divisor is zero, or if the result is not
2062
        representable in `B` bits two's complement. This only happens
2063
        when `x = -2^{B-1}, Y = -1`.
2064
        "#,
2065
            &formats.binary_imm64,
2066
        )
2067
        .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)])
2068
        .operands_out(vec![Operand::new("a", iB)]),
2069
    );
2070

2071
    ig.push(
2072
        Inst::new(
2073
            "urem_imm",
2074
            r#"
2075
        Unsigned integer remainder with immediate divisor.
2076

2077
        Same as `urem`, but one operand is a zero extended 64 bit immediate constant.
2078

2079
        This operation traps if the divisor is zero.
2080
        "#,
2081
            &formats.binary_imm64,
2082
        )
2083
        .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)])
2084
        .operands_out(vec![Operand::new("a", iB)]),
2085
    );
2086

2087
    ig.push(
2088
        Inst::new(
2089
            "srem_imm",
2090
            r#"
2091
        Signed integer remainder with immediate divisor.
2092

2093
        Same as `srem`, but one operand is a sign extended 64 bit immediate constant.
2094

2095
        This operation traps if the divisor is zero.
2096
        "#,
2097
            &formats.binary_imm64,
2098
        )
2099
        .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)])
2100
        .operands_out(vec![Operand::new("a", iB)]),
2101
    );
2102

2103
    ig.push(
2104
        Inst::new(
2105
            "irsub_imm",
2106
            r#"
2107
        Immediate reverse wrapping subtraction: `a := Y - x \pmod{2^B}`.
2108

2109
        The immediate operand is a sign extended 64 bit constant.
2110

2111
        Also works as integer negation when `Y = 0`. Use `iadd_imm`
2112
        with a negative immediate operand for the reverse immediate
2113
        subtraction.
2114

2115
        Polymorphic over all scalar integer types, but does not support vector
2116
        types.
2117
        "#,
2118
            &formats.binary_imm64,
2119
        )
2120
        .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)])
2121
        .operands_out(vec![Operand::new("a", iB)]),
2122
    );
2123

2124
    ig.push(
2125
        Inst::new(
2126
            "sadd_overflow_cin",
2127
            r#"
2128
        Add signed integers with carry in and overflow out.
2129

2130
        Same as `sadd_overflow` with an additional carry input. The `c_in` type
2131
        is interpreted as 1 if it's nonzero or 0 if it's zero.
2132
        "#,
2133
            &formats.ternary,
2134
        )
2135
        .operands_in(vec![
2136
            Operand::new("x", iB),
2137
            Operand::new("y", iB),
2138
            Operand::new("c_in", i8).with_doc("Input carry flag"),
2139
        ])
2140
        .operands_out(vec![
2141
            Operand::new("a", iB),
2142
            Operand::new("c_out", i8).with_doc("Output carry flag"),
2143
        ]),
2144
    );
2145

2146
    ig.push(
2147
        Inst::new(
2148
            "uadd_overflow_cin",
2149
            r#"
2150
        Add unsigned integers with carry in and overflow out.
2151

2152
        Same as `uadd_overflow` with an additional carry input. The `c_in` type
2153
        is interpreted as 1 if it's nonzero or 0 if it's zero.
2154
        "#,
2155
            &formats.ternary,
2156
        )
2157
        .operands_in(vec![
2158
            Operand::new("x", iB),
2159
            Operand::new("y", iB),
2160
            Operand::new("c_in", i8).with_doc("Input carry flag"),
2161
        ])
2162
        .operands_out(vec![
2163
            Operand::new("a", iB),
2164
            Operand::new("c_out", i8).with_doc("Output carry flag"),
2165
        ]),
2166
    );
2167

2168
    {
2169
        let of_out = Operand::new("of", i8).with_doc("Overflow flag");
2170
        ig.push(
2171
            Inst::new(
2172
                "uadd_overflow",
2173
                r#"
2174
            Add integers unsigned with overflow out.
2175
            ``of`` is set when the addition overflowed.
2176
            ```text
2177
                a &= x + y \pmod 2^B \\
2178
                of &= x+y >= 2^B
2179
            ```
2180
            Polymorphic over all scalar integer types, but does not support vector
2181
            types.
2182
            "#,
2183
                &formats.binary,
2184
            )
2185
            .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)])
2186
            .operands_out(vec![Operand::new("a", iB), of_out.clone()]),
2187
        );
2188

2189
        ig.push(
2190
            Inst::new(
2191
                "sadd_overflow",
2192
                r#"
2193
            Add integers signed with overflow out.
2194
            ``of`` is set when the addition over- or underflowed.
2195
            Polymorphic over all scalar integer types, but does not support vector
2196
            types.
2197
            "#,
2198
                &formats.binary,
2199
            )
2200
            .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)])
2201
            .operands_out(vec![Operand::new("a", iB), of_out.clone()]),
2202
        );
2203

2204
        ig.push(
2205
            Inst::new(
2206
                "usub_overflow",
2207
                r#"
2208
            Subtract integers unsigned with overflow out.
2209
            ``of`` is set when the subtraction underflowed.
2210
            ```text
2211
                a &= x - y \pmod 2^B \\
2212
                of &= x - y < 0
2213
            ```
2214
            Polymorphic over all scalar integer types, but does not support vector
2215
            types.
2216
            "#,
2217
                &formats.binary,
2218
            )
2219
            .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)])
2220
            .operands_out(vec![Operand::new("a", iB), of_out.clone()]),
2221
        );
2222

2223
        ig.push(
2224
            Inst::new(
2225
                "ssub_overflow",
2226
                r#"
2227
            Subtract integers signed with overflow out.
2228
            ``of`` is set when the subtraction over- or underflowed.
2229
            Polymorphic over all scalar integer types, but does not support vector
2230
            types.
2231
            "#,
2232
                &formats.binary,
2233
            )
2234
            .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)])
2235
            .operands_out(vec![Operand::new("a", iB), of_out.clone()]),
2236
        );
2237

2238
        {
2239
            let NarrowScalar = &TypeVar::new(
2240
                "NarrowScalar",
2241
                "A scalar integer type up to 64 bits",
2242
                TypeSetBuilder::new().ints(8..64).build(),
2243
            );
2244

2245
            ig.push(
2246
                Inst::new(
2247
                    "umul_overflow",
2248
                    r#"
2249
                Multiply integers unsigned with overflow out.
2250
                ``of`` is set when the multiplication overflowed.
2251
                ```text
2252
                    a &= x * y \pmod 2^B \\
2253
                    of &= x * y > 2^B
2254
                ```
2255
                Polymorphic over all scalar integer types except i128, but does not support vector
2256
                types.
2257
                "#,
2258
                    &formats.binary,
2259
                )
2260
                .operands_in(vec![
2261
                    Operand::new("x", NarrowScalar),
2262
                    Operand::new("y", NarrowScalar),
2263
                ])
2264
                .operands_out(vec![Operand::new("a", NarrowScalar), of_out.clone()]),
2265
            );
2266

2267
            ig.push(
2268
                Inst::new(
2269
                    "smul_overflow",
2270
                    r#"
2271
                Multiply integers signed with overflow out.
2272
                ``of`` is set when the multiplication over- or underflowed.
2273
                Polymorphic over all scalar integer types except i128, but does not support vector
2274
                types.
2275
                "#,
2276
                    &formats.binary,
2277
                )
2278
                .operands_in(vec![
2279
                    Operand::new("x", NarrowScalar),
2280
                    Operand::new("y", NarrowScalar),
2281
                ])
2282
                .operands_out(vec![Operand::new("a", NarrowScalar), of_out.clone()]),
2283
            );
2284
        }
2285
    }
2286

2287
    let i32_64 = &TypeVar::new(
2288
        "i32_64",
2289
        "A 32 or 64-bit scalar integer type",
2290
        TypeSetBuilder::new().ints(32..64).build(),
2291
    );
2292

2293
    ig.push(
2294
        Inst::new(
2295
            "uadd_overflow_trap",
2296
            r#"
2297
        Unsigned addition of x and y, trapping if the result overflows.
2298

2299
        Accepts 32 or 64-bit integers, and does not support vector types.
2300
        "#,
2301
            &formats.int_add_trap,
2302
        )
2303
        .operands_in(vec![
2304
            Operand::new("x", i32_64),
2305
            Operand::new("y", i32_64),
2306
            Operand::new("code", &imm.trapcode),
2307
        ])
2308
        .operands_out(vec![Operand::new("a", i32_64)])
2309
        .can_trap()
2310
        .side_effects_idempotent(),
2311
    );
2312

2313
    ig.push(
2314
        Inst::new(
2315
            "ssub_overflow_bin",
2316
            r#"
2317
        Subtract signed integers with borrow in and overflow out.
2318

2319
        Same as `ssub_overflow` with an additional borrow input. The `b_in` type
2320
        is interpreted as 1 if it's nonzero or 0 if it's zero. The computation
2321
        performed here is `x - (y + (b_in != 0))`.
2322
        "#,
2323
            &formats.ternary,
2324
        )
2325
        .operands_in(vec![
2326
            Operand::new("x", iB),
2327
            Operand::new("y", iB),
2328
            Operand::new("b_in", i8).with_doc("Input borrow flag"),
2329
        ])
2330
        .operands_out(vec![
2331
            Operand::new("a", iB),
2332
            Operand::new("b_out", i8).with_doc("Output borrow flag"),
2333
        ]),
2334
    );
2335

2336
    ig.push(
2337
        Inst::new(
2338
            "usub_overflow_bin",
2339
            r#"
2340
        Subtract unsigned integers with borrow in and overflow out.
2341

2342
        Same as `usub_overflow` with an additional borrow input. The `b_in` type
2343
        is interpreted as 1 if it's nonzero or 0 if it's zero. The computation
2344
        performed here is `x - (y + (b_in != 0))`.
2345
        "#,
2346
            &formats.ternary,
2347
        )
2348
        .operands_in(vec![
2349
            Operand::new("x", iB),
2350
            Operand::new("y", iB),
2351
            Operand::new("b_in", i8).with_doc("Input borrow flag"),
2352
        ])
2353
        .operands_out(vec![
2354
            Operand::new("a", iB),
2355
            Operand::new("b_out", i8).with_doc("Output borrow flag"),
2356
        ]),
2357
    );
2358

2359
    let bits = &TypeVar::new(
2360
        "bits",
2361
        "Any integer, float, or vector type",
2362
        TypeSetBuilder::new()
2363
            .ints(Interval::All)
2364
            .floats(Interval::All)
2365
            .simd_lanes(Interval::All)
2366
            .includes_scalars(true)
2367
            .build(),
2368
    );
2369

2370
    ig.push(
2371
        Inst::new(
2372
            "band",
2373
            r#"
2374
        Bitwise and.
2375
        "#,
2376
            &formats.binary,
2377
        )
2378
        .operands_in(vec![Operand::new("x", bits), Operand::new("y", bits)])
2379
        .operands_out(vec![Operand::new("a", bits)]),
2380
    );
2381

2382
    ig.push(
2383
        Inst::new(
2384
            "bor",
2385
            r#"
2386
        Bitwise or.
2387
        "#,
2388
            &formats.binary,
2389
        )
2390
        .operands_in(vec![Operand::new("x", bits), Operand::new("y", bits)])
2391
        .operands_out(vec![Operand::new("a", bits)]),
2392
    );
2393

2394
    ig.push(
2395
        Inst::new(
2396
            "bxor",
2397
            r#"
2398
        Bitwise xor.
2399
        "#,
2400
            &formats.binary,
2401
        )
2402
        .operands_in(vec![Operand::new("x", bits), Operand::new("y", bits)])
2403
        .operands_out(vec![Operand::new("a", bits)]),
2404
    );
2405

2406
    ig.push(
2407
        Inst::new(
2408
            "bnot",
2409
            r#"
2410
        Bitwise not.
2411
        "#,
2412
            &formats.unary,
2413
        )
2414
        .operands_in(vec![Operand::new("x", bits)])
2415
        .operands_out(vec![Operand::new("a", bits)]),
2416
    );
2417

2418
    ig.push(
2419
        Inst::new(
2420
            "band_not",
2421
            r#"
2422
        Bitwise and not.
2423

2424
        Computes `x & ~y`.
2425
        "#,
2426
            &formats.binary,
2427
        )
2428
        .operands_in(vec![Operand::new("x", bits), Operand::new("y", bits)])
2429
        .operands_out(vec![Operand::new("a", bits)]),
2430
    );
2431

2432
    ig.push(
2433
        Inst::new(
2434
            "bor_not",
2435
            r#"
2436
        Bitwise or not.
2437

2438
        Computes `x | ~y`.
2439
        "#,
2440
            &formats.binary,
2441
        )
2442
        .operands_in(vec![Operand::new("x", bits), Operand::new("y", bits)])
2443
        .operands_out(vec![Operand::new("a", bits)]),
2444
    );
2445

2446
    ig.push(
2447
        Inst::new(
2448
            "bxor_not",
2449
            r#"
2450
        Bitwise xor not.
2451

2452
        Computes `x ^ ~y`.
2453
        "#,
2454
            &formats.binary,
2455
        )
2456
        .operands_in(vec![Operand::new("x", bits), Operand::new("y", bits)])
2457
        .operands_out(vec![Operand::new("a", bits)]),
2458
    );
2459

2460
    ig.push(
2461
        Inst::new(
2462
            "band_imm",
2463
            r#"
2464
        Bitwise and with immediate.
2465

2466
        Same as `band`, but one operand is a zero extended 64 bit immediate constant.
2467

2468
        Polymorphic over all scalar integer types, but does not support vector
2469
        types.
2470
        "#,
2471
            &formats.binary_imm64,
2472
        )
2473
        .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)])
2474
        .operands_out(vec![Operand::new("a", iB)]),
2475
    );
2476

2477
    ig.push(
2478
        Inst::new(
2479
            "bor_imm",
2480
            r#"
2481
        Bitwise or with immediate.
2482

2483
        Same as `bor`, but one operand is a zero extended 64 bit immediate constant.
2484

2485
        Polymorphic over all scalar integer types, but does not support vector
2486
        types.
2487
        "#,
2488
            &formats.binary_imm64,
2489
        )
2490
        .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)])
2491
        .operands_out(vec![Operand::new("a", iB)]),
2492
    );
2493

2494
    ig.push(
2495
        Inst::new(
2496
            "bxor_imm",
2497
            r#"
2498
        Bitwise xor with immediate.
2499

2500
        Same as `bxor`, but one operand is a zero extended 64 bit immediate constant.
2501

2502
        Polymorphic over all scalar integer types, but does not support vector
2503
        types.
2504
        "#,
2505
            &formats.binary_imm64,
2506
        )
2507
        .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)])
2508
        .operands_out(vec![Operand::new("a", iB)]),
2509
    );
2510

2511
    ig.push(
2512
        Inst::new(
2513
            "rotl",
2514
            r#"
2515
        Rotate left.
2516

2517
        Rotate the bits in ``x`` by ``y`` places.
2518
        "#,
2519
            &formats.binary,
2520
        )
2521
        .operands_in(vec![
2522
            Operand::new("x", Int).with_doc("Scalar or vector value to shift"),
2523
            Operand::new("y", iB).with_doc("Number of bits to shift"),
2524
        ])
2525
        .operands_out(vec![Operand::new("a", Int)]),
2526
    );
2527

2528
    ig.push(
2529
        Inst::new(
2530
            "rotr",
2531
            r#"
2532
        Rotate right.
2533

2534
        Rotate the bits in ``x`` by ``y`` places.
2535
        "#,
2536
            &formats.binary,
2537
        )
2538
        .operands_in(vec![
2539
            Operand::new("x", Int).with_doc("Scalar or vector value to shift"),
2540
            Operand::new("y", iB).with_doc("Number of bits to shift"),
2541
        ])
2542
        .operands_out(vec![Operand::new("a", Int)]),
2543
    );
2544

2545
    ig.push(
2546
        Inst::new(
2547
            "rotl_imm",
2548
            r#"
2549
        Rotate left by immediate.
2550

2551
        Same as `rotl`, but one operand is a zero extended 64 bit immediate constant.
2552
        "#,
2553
            &formats.binary_imm64,
2554
        )
2555
        .operands_in(vec![
2556
            Operand::new("x", Int).with_doc("Scalar or vector value to shift"),
2557
            Operand::new("Y", &imm.imm64),
2558
        ])
2559
        .operands_out(vec![Operand::new("a", Int)]),
2560
    );
2561

2562
    ig.push(
2563
        Inst::new(
2564
            "rotr_imm",
2565
            r#"
2566
        Rotate right by immediate.
2567

2568
        Same as `rotr`, but one operand is a zero extended 64 bit immediate constant.
2569
        "#,
2570
            &formats.binary_imm64,
2571
        )
2572
        .operands_in(vec![
2573
            Operand::new("x", Int).with_doc("Scalar or vector value to shift"),
2574
            Operand::new("Y", &imm.imm64),
2575
        ])
2576
        .operands_out(vec![Operand::new("a", Int)]),
2577
    );
2578

2579
    ig.push(
2580
        Inst::new(
2581
            "ishl",
2582
            r#"
2583
        Integer shift left. Shift the bits in ``x`` towards the MSB by ``y``
2584
        places. Shift in zero bits to the LSB.
2585

2586
        The shift amount is masked to the size of ``x``.
2587

2588
        When shifting a B-bits integer type, this instruction computes:
2589

2590
        ```text
2591
            s &:= y \pmod B,
2592
            a &:= x \cdot 2^s \pmod{2^B}.
2593
        ```
2594
        "#,
2595
            &formats.binary,
2596
        )
2597
        .operands_in(vec![
2598
            Operand::new("x", Int).with_doc("Scalar or vector value to shift"),
2599
            Operand::new("y", iB).with_doc("Number of bits to shift"),
2600
        ])
2601
        .operands_out(vec![Operand::new("a", Int)]),
2602
    );
2603

2604
    ig.push(
2605
        Inst::new(
2606
            "ushr",
2607
            r#"
2608
        Unsigned shift right. Shift bits in ``x`` towards the LSB by ``y``
2609
        places, shifting in zero bits to the MSB. Also called a *logical
2610
        shift*.
2611

2612
        The shift amount is masked to the size of ``x``.
2613

2614
        When shifting a B-bits integer type, this instruction computes:
2615

2616
        ```text
2617
            s &:= y \pmod B,
2618
            a &:= \lfloor x \cdot 2^{-s} \rfloor.
2619
        ```
2620
        "#,
2621
            &formats.binary,
2622
        )
2623
        .operands_in(vec![
2624
            Operand::new("x", Int).with_doc("Scalar or vector value to shift"),
2625
            Operand::new("y", iB).with_doc("Number of bits to shift"),
2626
        ])
2627
        .operands_out(vec![Operand::new("a", Int)]),
2628
    );
2629

2630
    ig.push(
2631
        Inst::new(
2632
            "sshr",
2633
            r#"
2634
        Signed shift right. Shift bits in ``x`` towards the LSB by ``y``
2635
        places, shifting in sign bits to the MSB. Also called an *arithmetic
2636
        shift*.
2637

2638
        The shift amount is masked to the size of ``x``.
2639
        "#,
2640
            &formats.binary,
2641
        )
2642
        .operands_in(vec![
2643
            Operand::new("x", Int).with_doc("Scalar or vector value to shift"),
2644
            Operand::new("y", iB).with_doc("Number of bits to shift"),
2645
        ])
2646
        .operands_out(vec![Operand::new("a", Int)]),
2647
    );
2648

2649
    ig.push(
2650
        Inst::new(
2651
            "ishl_imm",
2652
            r#"
2653
        Integer shift left by immediate.
2654

2655
        The shift amount is masked to the size of ``x``.
2656
        "#,
2657
            &formats.binary_imm64,
2658
        )
2659
        .operands_in(vec![
2660
            Operand::new("x", Int).with_doc("Scalar or vector value to shift"),
2661
            Operand::new("Y", &imm.imm64),
2662
        ])
2663
        .operands_out(vec![Operand::new("a", Int)]),
2664
    );
2665

2666
    ig.push(
2667
        Inst::new(
2668
            "ushr_imm",
2669
            r#"
2670
        Unsigned shift right by immediate.
2671

2672
        The shift amount is masked to the size of ``x``.
2673
        "#,
2674
            &formats.binary_imm64,
2675
        )
2676
        .operands_in(vec![
2677
            Operand::new("x", Int).with_doc("Scalar or vector value to shift"),
2678
            Operand::new("Y", &imm.imm64),
2679
        ])
2680
        .operands_out(vec![Operand::new("a", Int)]),
2681
    );
2682

2683
    ig.push(
2684
        Inst::new(
2685
            "sshr_imm",
2686
            r#"
2687
        Signed shift right by immediate.
2688

2689
        The shift amount is masked to the size of ``x``.
2690
        "#,
2691
            &formats.binary_imm64,
2692
        )
2693
        .operands_in(vec![
2694
            Operand::new("x", Int).with_doc("Scalar or vector value to shift"),
2695
            Operand::new("Y", &imm.imm64),
2696
        ])
2697
        .operands_out(vec![Operand::new("a", Int)]),
2698
    );
2699

2700
    ig.push(
2701
        Inst::new(
2702
            "bitrev",
2703
            r#"
2704
        Reverse the bits of a integer.
2705

2706
        Reverses the bits in ``x``.
2707
        "#,
2708
            &formats.unary,
2709
        )
2710
        .operands_in(vec![Operand::new("x", iB)])
2711
        .operands_out(vec![Operand::new("a", iB)]),
2712
    );
2713

2714
    ig.push(
2715
        Inst::new(
2716
            "clz",
2717
            r#"
2718
        Count leading zero bits.
2719

2720
        Starting from the MSB in ``x``, count the number of zero bits before
2721
        reaching the first one bit. When ``x`` is zero, returns the size of x
2722
        in bits.
2723
        "#,
2724
            &formats.unary,
2725
        )
2726
        .operands_in(vec![Operand::new("x", iB)])
2727
        .operands_out(vec![Operand::new("a", iB)]),
2728
    );
2729

2730
    ig.push(
2731
        Inst::new(
2732
            "cls",
2733
            r#"
2734
        Count leading sign bits.
2735

2736
        Starting from the MSB after the sign bit in ``x``, count the number of
2737
        consecutive bits identical to the sign bit. When ``x`` is 0 or -1,
2738
        returns one less than the size of x in bits.
2739
        "#,
2740
            &formats.unary,
2741
        )
2742
        .operands_in(vec![Operand::new("x", iB)])
2743
        .operands_out(vec![Operand::new("a", iB)]),
2744
    );
2745

2746
    ig.push(
2747
        Inst::new(
2748
            "ctz",
2749
            r#"
2750
        Count trailing zeros.
2751

2752
        Starting from the LSB in ``x``, count the number of zero bits before
2753
        reaching the first one bit. When ``x`` is zero, returns the size of x
2754
        in bits.
2755
        "#,
2756
            &formats.unary,
2757
        )
2758
        .operands_in(vec![Operand::new("x", iB)])
2759
        .operands_out(vec![Operand::new("a", iB)]),
2760
    );
2761

2762
    ig.push(
2763
        Inst::new(
2764
            "bswap",
2765
            r#"
2766
        Reverse the byte order of an integer.
2767

2768
        Reverses the bytes in ``x``.
2769
        "#,
2770
            &formats.unary,
2771
        )
2772
        .operands_in(vec![Operand::new("x", iSwappable)])
2773
        .operands_out(vec![Operand::new("a", iSwappable)]),
2774
    );
2775

2776
    ig.push(
2777
        Inst::new(
2778
            "popcnt",
2779
            r#"
2780
        Population count
2781

2782
        Count the number of one bits in ``x``.
2783
        "#,
2784
            &formats.unary,
2785
        )
2786
        .operands_in(vec![Operand::new("x", Int)])
2787
        .operands_out(vec![Operand::new("a", Int)]),
2788
    );
2789

2790
    let Float = &TypeVar::new(
2791
        "Float",
2792
        "A scalar or vector floating point number",
2793
        TypeSetBuilder::new()
2794
            .floats(Interval::All)
2795
            .simd_lanes(Interval::All)
2796
            .dynamic_simd_lanes(Interval::All)
2797
            .build(),
2798
    );
2799

2800
    ig.push(
2801
        Inst::new(
2802
            "fcmp",
2803
            r#"
2804
        Floating point comparison.
2805

2806
        Two IEEE 754-2008 floating point numbers, `x` and `y`, relate to each
2807
        other in exactly one of four ways:
2808

2809
        ```text
2810
        == ==========================================
2811
        UN Unordered when one or both numbers is NaN.
2812
        EQ When `x = y`. (And `0.0 = -0.0`).
2813
        LT When `x < y`.
2814
        GT When `x > y`.
2815
        == ==========================================
2816
        ```
2817

2818
        The 14 `floatcc` condition codes each correspond to a subset of
2819
        the four relations, except for the empty set which would always be
2820
        false, and the full set which would always be true.
2821

2822
        The condition codes are divided into 7 'ordered' conditions which don't
2823
        include UN, and 7 unordered conditions which all include UN.
2824

2825
        ```text
2826
        +-------+------------+---------+------------+-------------------------+
2827
        |Ordered             |Unordered             |Condition                |
2828
        +=======+============+=========+============+=========================+
2829
        |ord    |EQ | LT | GT|uno      |UN          |NaNs absent / present.   |
2830
        +-------+------------+---------+------------+-------------------------+
2831
        |eq     |EQ          |ueq      |UN | EQ     |Equal                    |
2832
        +-------+------------+---------+------------+-------------------------+
2833
        |one    |LT | GT     |ne       |UN | LT | GT|Not equal                |
2834
        +-------+------------+---------+------------+-------------------------+
2835
        |lt     |LT          |ult      |UN | LT     |Less than                |
2836
        +-------+------------+---------+------------+-------------------------+
2837
        |le     |LT | EQ     |ule      |UN | LT | EQ|Less than or equal       |
2838
        +-------+------------+---------+------------+-------------------------+
2839
        |gt     |GT          |ugt      |UN | GT     |Greater than             |
2840
        +-------+------------+---------+------------+-------------------------+
2841
        |ge     |GT | EQ     |uge      |UN | GT | EQ|Greater than or equal    |
2842
        +-------+------------+---------+------------+-------------------------+
2843
        ```
2844

2845
        The standard C comparison operators, `<, <=, >, >=`, are all ordered,
2846
        so they are false if either operand is NaN. The C equality operator,
2847
        `==`, is ordered, and since inequality is defined as the logical
2848
        inverse it is *unordered*. They map to the `floatcc` condition
2849
        codes as follows:
2850

2851
        ```text
2852
        ==== ====== ============
2853
        C    `Cond` Subset
2854
        ==== ====== ============
2855
        `==` eq     EQ
2856
        `!=` ne     UN | LT | GT
2857
        `<`  lt     LT
2858
        `<=` le     LT | EQ
2859
        `>`  gt     GT
2860
        `>=` ge     GT | EQ
2861
        ==== ====== ============
2862
        ```
2863

2864
        This subset of condition codes also corresponds to the WebAssembly
2865
        floating point comparisons of the same name.
2866

2867
        When this instruction compares floating point vectors, it returns a
2868
        vector with the results of lane-wise comparisons.
2869

2870
        When comparing scalars, the result is:
2871
            - `1` if the condition holds.
2872
            - `0` if the condition does not hold.
2873

2874
        When comparing vectors, the result is:
2875
            - `-1` (i.e. all ones) in each lane where the condition holds.
2876
            - `0` in each lane where the condition does not hold.
2877
        "#,
2878
            &formats.float_compare,
2879
        )
2880
        .operands_in(vec![
2881
            Operand::new("Cond", &imm.floatcc),
2882
            Operand::new("x", Float),
2883
            Operand::new("y", Float),
2884
        ])
2885
        .operands_out(vec![Operand::new("a", &Float.as_truthy())]),
2886
    );
2887

2888
    ig.push(
2889
        Inst::new(
2890
            "fadd",
2891
            r#"
2892
        Floating point addition.
2893
        "#,
2894
            &formats.binary,
2895
        )
2896
        .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)])
2897
        .operands_out(vec![
2898
            Operand::new("a", Float).with_doc("Result of applying operator to each lane"),
2899
        ]),
2900
    );
2901

2902
    ig.push(
2903
        Inst::new(
2904
            "fsub",
2905
            r#"
2906
        Floating point subtraction.
2907
        "#,
2908
            &formats.binary,
2909
        )
2910
        .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)])
2911
        .operands_out(vec![
2912
            Operand::new("a", Float).with_doc("Result of applying operator to each lane"),
2913
        ]),
2914
    );
2915

2916
    ig.push(
2917
        Inst::new(
2918
            "fmul",
2919
            r#"
2920
        Floating point multiplication.
2921
        "#,
2922
            &formats.binary,
2923
        )
2924
        .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)])
2925
        .operands_out(vec![
2926
            Operand::new("a", Float).with_doc("Result of applying operator to each lane"),
2927
        ]),
2928
    );
2929

2930
    ig.push(
2931
        Inst::new(
2932
            "fdiv",
2933
            r#"
2934
        Floating point division.
2935

2936
        Unlike the integer division instructions ` and
2937
        `udiv`, this can't trap. Division by zero is infinity or
2938
        NaN, depending on the dividend.
2939
        "#,
2940
            &formats.binary,
2941
        )
2942
        .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)])
2943
        .operands_out(vec![
2944
            Operand::new("a", Float).with_doc("Result of applying operator to each lane"),
2945
        ]),
2946
    );
2947

2948
    ig.push(
2949
        Inst::new(
2950
            "sqrt",
2951
            r#"
2952
        Floating point square root.
2953
        "#,
2954
            &formats.unary,
2955
        )
2956
        .operands_in(vec![Operand::new("x", Float)])
2957
        .operands_out(vec![
2958
            Operand::new("a", Float).with_doc("Result of applying operator to each lane"),
2959
        ]),
2960
    );
2961

2962
    ig.push(
2963
        Inst::new(
2964
            "fma",
2965
            r#"
2966
        Floating point fused multiply-and-add.
2967

2968
        Computes `a := xy+z` without any intermediate rounding of the
2969
        product.
2970
        "#,
2971
            &formats.ternary,
2972
        )
2973
        .operands_in(vec![
2974
            Operand::new("x", Float),
2975
            Operand::new("y", Float),
2976
            Operand::new("z", Float),
2977
        ])
2978
        .operands_out(vec![
2979
            Operand::new("a", Float).with_doc("Result of applying operator to each lane"),
2980
        ]),
2981
    );
2982

2983
    ig.push(
2984
        Inst::new(
2985
            "fneg",
2986
            r#"
2987
        Floating point negation.
2988

2989
        Note that this is a pure bitwise operation.
2990
        "#,
2991
            &formats.unary,
2992
        )
2993
        .operands_in(vec![Operand::new("x", Float)])
2994
        .operands_out(vec![
2995
            Operand::new("a", Float).with_doc("``x`` with its sign bit inverted"),
2996
        ]),
2997
    );
2998

2999
    ig.push(
3000
        Inst::new(
3001
            "fabs",
3002
            r#"
3003
        Floating point absolute value.
3004

3005
        Note that this is a pure bitwise operation.
3006
        "#,
3007
            &formats.unary,
3008
        )
3009
        .operands_in(vec![Operand::new("x", Float)])
3010
        .operands_out(vec![
3011
            Operand::new("a", Float).with_doc("``x`` with its sign bit cleared"),
3012
        ]),
3013
    );
3014

3015
    ig.push(
3016
        Inst::new(
3017
            "fcopysign",
3018
            r#"
3019
        Floating point copy sign.
3020

3021
        Note that this is a pure bitwise operation. The sign bit from ``y`` is
3022
        copied to the sign bit of ``x``.
3023
        "#,
3024
            &formats.binary,
3025
        )
3026
        .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)])
3027
        .operands_out(vec![
3028
            Operand::new("a", Float).with_doc("``x`` with its sign bit changed to that of ``y``"),
3029
        ]),
3030
    );
3031

3032
    ig.push(
3033
        Inst::new(
3034
            "fmin",
3035
            r#"
3036
        Floating point minimum, propagating NaNs using the WebAssembly rules.
3037

3038
        If either operand is NaN, this returns NaN with an unspecified sign. Furthermore, if
3039
        each input NaN consists of a mantissa whose most significant bit is 1 and the rest is
3040
        0, then the output has the same form. Otherwise, the output mantissa's most significant
3041
        bit is 1 and the rest is unspecified.
3042
        "#,
3043
            &formats.binary,
3044
        )
3045
        .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)])
3046
        .operands_out(vec![
3047
            Operand::new("a", Float).with_doc("The smaller of ``x`` and ``y``"),
3048
        ]),
3049
    );
3050

3051
    ig.push(
3052
        Inst::new(
3053
            "fmax",
3054
            r#"
3055
        Floating point maximum, propagating NaNs using the WebAssembly rules.
3056

3057
        If either operand is NaN, this returns NaN with an unspecified sign. Furthermore, if
3058
        each input NaN consists of a mantissa whose most significant bit is 1 and the rest is
3059
        0, then the output has the same form. Otherwise, the output mantissa's most significant
3060
        bit is 1 and the rest is unspecified.
3061
        "#,
3062
            &formats.binary,
3063
        )
3064
        .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)])
3065
        .operands_out(vec![
3066
            Operand::new("a", Float).with_doc("The larger of ``x`` and ``y``"),
3067
        ]),
3068
    );
3069

3070
    ig.push(
3071
        Inst::new(
3072
            "ceil",
3073
            r#"
3074
        Round floating point round to integral, towards positive infinity.
3075
        "#,
3076
            &formats.unary,
3077
        )
3078
        .operands_in(vec![Operand::new("x", Float)])
3079
        .operands_out(vec![
3080
            Operand::new("a", Float).with_doc("``x`` rounded to integral value"),
3081
        ]),
3082
    );
3083

3084
    ig.push(
3085
        Inst::new(
3086
            "floor",
3087
            r#"
3088
        Round floating point round to integral, towards negative infinity.
3089
        "#,
3090
            &formats.unary,
3091
        )
3092
        .operands_in(vec![Operand::new("x", Float)])
3093
        .operands_out(vec![
3094
            Operand::new("a", Float).with_doc("``x`` rounded to integral value"),
3095
        ]),
3096
    );
3097

3098
    ig.push(
3099
        Inst::new(
3100
            "trunc",
3101
            r#"
3102
        Round floating point round to integral, towards zero.
3103
        "#,
3104
            &formats.unary,
3105
        )
3106
        .operands_in(vec![Operand::new("x", Float)])
3107
        .operands_out(vec![
3108
            Operand::new("a", Float).with_doc("``x`` rounded to integral value"),
3109
        ]),
3110
    );
3111

3112
    ig.push(
3113
        Inst::new(
3114
            "nearest",
3115
            r#"
3116
        Round floating point round to integral, towards nearest with ties to
3117
        even.
3118
        "#,
3119
            &formats.unary,
3120
        )
3121
        .operands_in(vec![Operand::new("x", Float)])
3122
        .operands_out(vec![
3123
            Operand::new("a", Float).with_doc("``x`` rounded to integral value"),
3124
        ]),
3125
    );
3126

3127
    ig.push(
3128
        Inst::new(
3129
            "bitcast",
3130
            r#"
3131
        Reinterpret the bits in `x` as a different type.
3132

3133
        The input and output types must be storable to memory and of the same
3134
        size. A bitcast is equivalent to storing one type and loading the other
3135
        type from the same address, both using the specified MemFlags.
3136

3137
        Note that this operation only supports the `big` or `little` MemFlags.
3138
        The specified byte order only affects the result in the case where
3139
        input and output types differ in lane count/size.  In this case, the
3140
        operation is only valid if a byte order specifier is provided.
3141
        "#,
3142
            &formats.load_no_offset,
3143
        )
3144
        .operands_in(vec![
3145
            Operand::new("MemFlags", &imm.memflags),
3146
            Operand::new("x", Mem),
3147
        ])
3148
        .operands_out(vec![
3149
            Operand::new("a", MemTo).with_doc("Bits of `x` reinterpreted"),
3150
        ]),
3151
    );
3152

3153
    ig.push(
3154
        Inst::new(
3155
            "scalar_to_vector",
3156
            r#"
3157
            Copies a scalar value to a vector value.  The scalar is copied into the
3158
            least significant lane of the vector, and all other lanes will be zero.
3159
            "#,
3160
            &formats.unary,
3161
        )
3162
        .operands_in(vec![
3163
            Operand::new("s", &TxN.lane_of()).with_doc("A scalar value"),
3164
        ])
3165
        .operands_out(vec![Operand::new("a", TxN).with_doc("A vector value")]),
3166
    );
3167

3168
    let Truthy = &TypeVar::new(
3169
        "Truthy",
3170
        "A scalar whose values are truthy",
3171
        TypeSetBuilder::new().ints(Interval::All).build(),
3172
    );
3173
    let IntTo = &TypeVar::new(
3174
        "IntTo",
3175
        "An integer type",
3176
        TypeSetBuilder::new().ints(Interval::All).build(),
3177
    );
3178

3179
    ig.push(
3180
        Inst::new(
3181
            "bmask",
3182
            r#"
3183
        Convert `x` to an integer mask.
3184

3185
        Non-zero maps to all 1s and zero maps to all 0s.
3186
        "#,
3187
            &formats.unary,
3188
        )
3189
        .operands_in(vec![Operand::new("x", Truthy)])
3190
        .operands_out(vec![Operand::new("a", IntTo)]),
3191
    );
3192

3193
    let Int = &TypeVar::new(
3194
        "Int",
3195
        "A scalar integer type",
3196
        TypeSetBuilder::new().ints(Interval::All).build(),
3197
    );
3198

3199
    ig.push(
3200
        Inst::new(
3201
            "ireduce",
3202
            r#"
3203
        Convert `x` to a smaller integer type by discarding
3204
        the most significant bits.
3205

3206
        This is the same as reducing modulo `2^n`.
3207
        "#,
3208
            &formats.unary,
3209
        )
3210
        .operands_in(vec![
3211
            Operand::new("x", &Int.wider())
3212
                .with_doc("A scalar integer type, wider than the controlling type"),
3213
        ])
3214
        .operands_out(vec![Operand::new("a", Int)]),
3215
    );
3216

3217
    let I16or32or64xN = &TypeVar::new(
3218
        "I16or32or64xN",
3219
        "A SIMD vector type containing integer lanes 16, 32, or 64 bits wide",
3220
        TypeSetBuilder::new()
3221
            .ints(16..64)
3222
            .simd_lanes(2..8)
3223
            .dynamic_simd_lanes(2..8)
3224
            .includes_scalars(false)
3225
            .build(),
3226
    );
3227

3228
    ig.push(
3229
        Inst::new(
3230
            "snarrow",
3231
            r#"
3232
        Combine `x` and `y` into a vector with twice the lanes but half the integer width while
3233
        saturating overflowing values to the signed maximum and minimum.
3234

3235
        The lanes will be concatenated after narrowing. For example, when `x` and `y` are `i32x4`
3236
        and `x = [x3, x2, x1, x0]` and `y = [y3, y2, y1, y0]`, then after narrowing the value
3237
        returned is an `i16x8`: `a = [y3', y2', y1', y0', x3', x2', x1', x0']`.
3238
            "#,
3239
            &formats.binary,
3240
        )
3241
        .operands_in(vec![
3242
            Operand::new("x", I16or32or64xN),
3243
            Operand::new("y", I16or32or64xN),
3244
        ])
3245
        .operands_out(vec![Operand::new("a", &I16or32or64xN.split_lanes())]),
3246
    );
3247

3248
    ig.push(
3249
        Inst::new(
3250
            "unarrow",
3251
            r#"
3252
        Combine `x` and `y` into a vector with twice the lanes but half the integer width while
3253
        saturating overflowing values to the unsigned maximum and minimum.
3254

3255
        Note that all input lanes are considered signed: any negative lanes will overflow and be
3256
        replaced with the unsigned minimum, `0x00`.
3257

3258
        The lanes will be concatenated after narrowing. For example, when `x` and `y` are `i32x4`
3259
        and `x = [x3, x2, x1, x0]` and `y = [y3, y2, y1, y0]`, then after narrowing the value
3260
        returned is an `i16x8`: `a = [y3', y2', y1', y0', x3', x2', x1', x0']`.
3261
            "#,
3262
            &formats.binary,
3263
        )
3264
        .operands_in(vec![
3265
            Operand::new("x", I16or32or64xN),
3266
            Operand::new("y", I16or32or64xN),
3267
        ])
3268
        .operands_out(vec![Operand::new("a", &I16or32or64xN.split_lanes())]),
3269
    );
3270

3271
    ig.push(
3272
        Inst::new(
3273
            "uunarrow",
3274
            r#"
3275
        Combine `x` and `y` into a vector with twice the lanes but half the integer width while
3276
        saturating overflowing values to the unsigned maximum and minimum.
3277

3278
        Note that all input lanes are considered unsigned: any negative values will be interpreted as unsigned, overflowing and being replaced with the unsigned maximum.
3279

3280
        The lanes will be concatenated after narrowing. For example, when `x` and `y` are `i32x4`
3281
        and `x = [x3, x2, x1, x0]` and `y = [y3, y2, y1, y0]`, then after narrowing the value
3282
        returned is an `i16x8`: `a = [y3', y2', y1', y0', x3', x2', x1', x0']`.
3283
            "#,
3284
            &formats.binary,
3285
        )
3286
        .operands_in(vec![Operand::new("x", I16or32or64xN), Operand::new("y", I16or32or64xN)])
3287
        .operands_out(vec![Operand::new("a", &I16or32or64xN.split_lanes())]),
3288
    );
3289

3290
    let I8or16or32xN = &TypeVar::new(
3291
        "I8or16or32xN",
3292
        "A SIMD vector type containing integer lanes 8, 16, or 32 bits wide.",
3293
        TypeSetBuilder::new()
3294
            .ints(8..32)
3295
            .simd_lanes(2..16)
3296
            .dynamic_simd_lanes(2..16)
3297
            .includes_scalars(false)
3298
            .build(),
3299
    );
3300

3301
    ig.push(
3302
        Inst::new(
3303
            "swiden_low",
3304
            r#"
3305
        Widen the low lanes of `x` using signed extension.
3306

3307
        This will double the lane width and halve the number of lanes.
3308
            "#,
3309
            &formats.unary,
3310
        )
3311
        .operands_in(vec![Operand::new("x", I8or16or32xN)])
3312
        .operands_out(vec![Operand::new("a", &I8or16or32xN.merge_lanes())]),
3313
    );
3314

3315
    ig.push(
3316
        Inst::new(
3317
            "swiden_high",
3318
            r#"
3319
        Widen the high lanes of `x` using signed extension.
3320

3321
        This will double the lane width and halve the number of lanes.
3322
            "#,
3323
            &formats.unary,
3324
        )
3325
        .operands_in(vec![Operand::new("x", I8or16or32xN)])
3326
        .operands_out(vec![Operand::new("a", &I8or16or32xN.merge_lanes())]),
3327
    );
3328

3329
    ig.push(
3330
        Inst::new(
3331
            "uwiden_low",
3332
            r#"
3333
        Widen the low lanes of `x` using unsigned extension.
3334

3335
        This will double the lane width and halve the number of lanes.
3336
            "#,
3337
            &formats.unary,
3338
        )
3339
        .operands_in(vec![Operand::new("x", I8or16or32xN)])
3340
        .operands_out(vec![Operand::new("a", &I8or16or32xN.merge_lanes())]),
3341
    );
3342

3343
    ig.push(
3344
        Inst::new(
3345
            "uwiden_high",
3346
            r#"
3347
            Widen the high lanes of `x` using unsigned extension.
3348

3349
            This will double the lane width and halve the number of lanes.
3350
            "#,
3351
            &formats.unary,
3352
        )
3353
        .operands_in(vec![Operand::new("x", I8or16or32xN)])
3354
        .operands_out(vec![Operand::new("a", &I8or16or32xN.merge_lanes())]),
3355
    );
3356

3357
    ig.push(
3358
        Inst::new(
3359
            "iadd_pairwise",
3360
            r#"
3361
        Does lane-wise integer pairwise addition on two operands, putting the
3362
        combined results into a single vector result. Here a pair refers to adjacent
3363
        lanes in a vector, i.e. i*2 + (i*2+1) for i == num_lanes/2. The first operand
3364
        pairwise add results will make up the low half of the resulting vector while
3365
        the second operand pairwise add results will make up the upper half of the
3366
        resulting vector.
3367
            "#,
3368
            &formats.binary,
3369
        )
3370
        .operands_in(vec![
3371
            Operand::new("x", I8or16or32xN),
3372
            Operand::new("y", I8or16or32xN),
3373
        ])
3374
        .operands_out(vec![Operand::new("a", I8or16or32xN)]),
3375
    );
3376

3377
    let I8x16 = &TypeVar::new(
3378
        "I8x16",
3379
        "A SIMD vector type consisting of 16 lanes of 8-bit integers",
3380
        TypeSetBuilder::new()
3381
            .ints(8..8)
3382
            .simd_lanes(16..16)
3383
            .includes_scalars(false)
3384
            .build(),
3385
    );
3386

3387
    ig.push(
3388
        Inst::new(
3389
            "x86_pmaddubsw",
3390
            r#"
3391
        An instruction with equivalent semantics to `pmaddubsw` on x86.
3392

3393
        This instruction will take signed bytes from the first argument and
3394
        multiply them against unsigned bytes in the second argument. Adjacent
3395
        pairs are then added, with saturating, to a 16-bit value and are packed
3396
        into the result.
3397
            "#,
3398
            &formats.binary,
3399
        )
3400
        .operands_in(vec![Operand::new("x", I8x16), Operand::new("y", I8x16)])
3401
        .operands_out(vec![Operand::new("a", I16x8)]),
3402
    );
3403

3404
    ig.push(
3405
        Inst::new(
3406
            "uextend",
3407
            r#"
3408
        Convert `x` to a larger integer type by zero-extending.
3409

3410
        Each lane in `x` is converted to a larger integer type by adding
3411
        zeroes. The result has the same numerical value as `x` when both are
3412
        interpreted as unsigned integers.
3413

3414
        The result type must have the same number of vector lanes as the input,
3415
        and each lane must not have fewer bits that the input lanes. If the
3416
        input and output types are the same, this is a no-op.
3417
        "#,
3418
            &formats.unary,
3419
        )
3420
        .operands_in(vec![Operand::new("x", &Int.narrower()).with_doc(
3421
            "A scalar integer type, narrower than the controlling type",
3422
        )])
3423
        .operands_out(vec![Operand::new("a", Int)]),
3424
    );
3425

3426
    ig.push(
3427
        Inst::new(
3428
            "sextend",
3429
            r#"
3430
        Convert `x` to a larger integer type by sign-extending.
3431

3432
        Each lane in `x` is converted to a larger integer type by replicating
3433
        the sign bit. The result has the same numerical value as `x` when both
3434
        are interpreted as signed integers.
3435

3436
        The result type must have the same number of vector lanes as the input,
3437
        and each lane must not have fewer bits that the input lanes. If the
3438
        input and output types are the same, this is a no-op.
3439
        "#,
3440
            &formats.unary,
3441
        )
3442
        .operands_in(vec![Operand::new("x", &Int.narrower()).with_doc(
3443
            "A scalar integer type, narrower than the controlling type",
3444
        )])
3445
        .operands_out(vec![Operand::new("a", Int)]),
3446
    );
3447

3448
    let FloatScalar = &TypeVar::new(
3449
        "FloatScalar",
3450
        "A scalar only floating point number",
3451
        TypeSetBuilder::new().floats(Interval::All).build(),
3452
    );
3453

3454
    ig.push(
3455
        Inst::new(
3456
            "fpromote",
3457
            r#"
3458
        Convert `x` to a larger floating point format.
3459

3460
        Each lane in `x` is converted to the destination floating point format.
3461
        This is an exact operation.
3462

3463
        Cranelift currently only supports two floating point formats
3464
        - `f32` and `f64`. This may change in the future.
3465

3466
        The result type must have the same number of vector lanes as the input,
3467
        and the result lanes must not have fewer bits than the input lanes.
3468
        "#,
3469
            &formats.unary,
3470
        )
3471
        .operands_in(vec![Operand::new("x", &FloatScalar.narrower()).with_doc(
3472
            "A scalar only floating point number, narrower than the controlling type",
3473
        )])
3474
        .operands_out(vec![Operand::new("a", FloatScalar)]),
3475
    );
3476

3477
    ig.push(
3478
        Inst::new(
3479
            "fdemote",
3480
            r#"
3481
        Convert `x` to a smaller floating point format.
3482

3483
        Each lane in `x` is converted to the destination floating point format
3484
        by rounding to nearest, ties to even.
3485

3486
        Cranelift currently only supports two floating point formats
3487
        - `f32` and `f64`. This may change in the future.
3488

3489
        The result type must have the same number of vector lanes as the input,
3490
        and the result lanes must not have more bits than the input lanes.
3491
        "#,
3492
            &formats.unary,
3493
        )
3494
        .operands_in(vec![Operand::new("x", &FloatScalar.wider()).with_doc(
3495
            "A scalar only floating point number, wider than the controlling type",
3496
        )])
3497
        .operands_out(vec![Operand::new("a", FloatScalar)]),
3498
    );
3499

3500
    let F64x2 = &TypeVar::new(
3501
        "F64x2",
3502
        "A SIMD vector type consisting of 2 lanes of 64-bit floats",
3503
        TypeSetBuilder::new()
3504
            .floats(64..64)
3505
            .simd_lanes(2..2)
3506
            .includes_scalars(false)
3507
            .build(),
3508
    );
3509
    let F32x4 = &TypeVar::new(
3510
        "F32x4",
3511
        "A SIMD vector type consisting of 4 lanes of 32-bit floats",
3512
        TypeSetBuilder::new()
3513
            .floats(32..32)
3514
            .simd_lanes(4..4)
3515
            .includes_scalars(false)
3516
            .build(),
3517
    );
3518

3519
    ig.push(
3520
        Inst::new(
3521
            "fvdemote",
3522
            r#"
3523
                Convert `x` to a smaller floating point format.
3524

3525
                Each lane in `x` is converted to the destination floating point format
3526
                by rounding to nearest, ties to even.
3527

3528
                Cranelift currently only supports two floating point formats
3529
                - `f32` and `f64`. This may change in the future.
3530

3531
                Fvdemote differs from fdemote in that with fvdemote it targets vectors.
3532
                Fvdemote is constrained to having the input type being F64x2 and the result
3533
                type being F32x4. The result lane that was the upper half of the input lane
3534
                is initialized to zero.
3535
                "#,
3536
            &formats.unary,
3537
        )
3538
        .operands_in(vec![Operand::new("x", F64x2)])
3539
        .operands_out(vec![Operand::new("a", F32x4)]),
3540
    );
3541

3542
    ig.push(
3543
        Inst::new(
3544
            "fvpromote_low",
3545
            r#"
3546
        Converts packed single precision floating point to packed double precision floating point.
3547

3548
        Considering only the lower half of the register, the low lanes in `x` are interpreted as
3549
        single precision floats that are then converted to a double precision floats.
3550

3551
        The result type will have half the number of vector lanes as the input. Fvpromote_low is
3552
        constrained to input F32x4 with a result type of F64x2.
3553
        "#,
3554
            &formats.unary,
3555
        )
3556
        .operands_in(vec![Operand::new("a", F32x4)])
3557
        .operands_out(vec![Operand::new("x", F64x2)]),
3558
    );
3559

3560
    let IntTo = &TypeVar::new(
3561
        "IntTo",
3562
        "An scalar only integer type",
3563
        TypeSetBuilder::new().ints(Interval::All).build(),
3564
    );
3565

3566
    ig.push(
3567
        Inst::new(
3568
            "fcvt_to_uint",
3569
            r#"
3570
        Converts floating point scalars to unsigned integer.
3571

3572
        Only operates on `x` if it is a scalar. If `x` is NaN or if
3573
        the unsigned integral value cannot be represented in the result
3574
        type, this instruction traps.
3575

3576
        "#,
3577
            &formats.unary,
3578
        )
3579
        .operands_in(vec![Operand::new("x", FloatScalar)])
3580
        .operands_out(vec![Operand::new("a", IntTo)])
3581
        .can_trap()
3582
        .side_effects_idempotent(),
3583
    );
3584

3585
    ig.push(
3586
        Inst::new(
3587
            "fcvt_to_sint",
3588
            r#"
3589
        Converts floating point scalars to signed integer.
3590

3591
        Only operates on `x` if it is a scalar. If `x` is NaN or if
3592
        the unsigned integral value cannot be represented in the result
3593
        type, this instruction traps.
3594

3595
        "#,
3596
            &formats.unary,
3597
        )
3598
        .operands_in(vec![Operand::new("x", FloatScalar)])
3599
        .operands_out(vec![Operand::new("a", IntTo)])
3600
        .can_trap()
3601
        .side_effects_idempotent(),
3602
    );
3603

3604
    let IntTo = &TypeVar::new(
3605
        "IntTo",
3606
        "A larger integer type with the same number of lanes",
3607
        TypeSetBuilder::new()
3608
            .ints(Interval::All)
3609
            .simd_lanes(Interval::All)
3610
            .build(),
3611
    );
3612

3613
    ig.push(
3614
        Inst::new(
3615
            "fcvt_to_uint_sat",
3616
            r#"
3617
        Convert floating point to unsigned integer as fcvt_to_uint does, but
3618
        saturates the input instead of trapping. NaN and negative values are
3619
        converted to 0.
3620
        "#,
3621
            &formats.unary,
3622
        )
3623
        .operands_in(vec![Operand::new("x", Float)])
3624
        .operands_out(vec![Operand::new("a", IntTo)]),
3625
    );
3626

3627
    ig.push(
3628
        Inst::new(
3629
            "fcvt_to_sint_sat",
3630
            r#"
3631
        Convert floating point to signed integer as fcvt_to_sint does, but
3632
        saturates the input instead of trapping. NaN values are converted to 0.
3633
        "#,
3634
            &formats.unary,
3635
        )
3636
        .operands_in(vec![Operand::new("x", Float)])
3637
        .operands_out(vec![Operand::new("a", IntTo)]),
3638
    );
3639

3640
    ig.push(
3641
        Inst::new(
3642
            "x86_cvtt2dq",
3643
            r#"
3644
        A float-to-integer conversion instruction for vectors-of-floats which
3645
        has the same semantics as `cvttp{s,d}2dq` on x86. This specifically
3646
        returns `INT_MIN` for NaN or out-of-bounds lanes.
3647
        "#,
3648
            &formats.unary,
3649
        )
3650
        .operands_in(vec![Operand::new("x", Float)])
3651
        .operands_out(vec![Operand::new("a", IntTo)]),
3652
    );
3653

3654
    let Int = &TypeVar::new(
3655
        "Int",
3656
        "A scalar or vector integer type",
3657
        TypeSetBuilder::new()
3658
            .ints(Interval::All)
3659
            .simd_lanes(Interval::All)
3660
            .build(),
3661
    );
3662

3663
    let FloatTo = &TypeVar::new(
3664
        "FloatTo",
3665
        "A scalar or vector floating point number",
3666
        TypeSetBuilder::new()
3667
            .floats(Interval::All)
3668
            .simd_lanes(Interval::All)
3669
            .build(),
3670
    );
3671

3672
    ig.push(
3673
        Inst::new(
3674
            "fcvt_from_uint",
3675
            r#"
3676
        Convert unsigned integer to floating point.
3677

3678
        Each lane in `x` is interpreted as an unsigned integer and converted to
3679
        floating point using round to nearest, ties to even.
3680

3681
        The result type must have the same number of vector lanes as the input.
3682
        "#,
3683
            &formats.unary,
3684
        )
3685
        .operands_in(vec![Operand::new("x", Int)])
3686
        .operands_out(vec![Operand::new("a", FloatTo)]),
3687
    );
3688

3689
    ig.push(
3690
        Inst::new(
3691
            "fcvt_from_sint",
3692
            r#"
3693
        Convert signed integer to floating point.
3694

3695
        Each lane in `x` is interpreted as a signed integer and converted to
3696
        floating point using round to nearest, ties to even.
3697

3698
        The result type must have the same number of vector lanes as the input.
3699
        "#,
3700
            &formats.unary,
3701
        )
3702
        .operands_in(vec![Operand::new("x", Int)])
3703
        .operands_out(vec![Operand::new("a", FloatTo)]),
3704
    );
3705

3706
    let WideInt = &TypeVar::new(
3707
        "WideInt",
3708
        "An integer type of width `i16` upwards",
3709
        TypeSetBuilder::new().ints(16..128).build(),
3710
    );
3711

3712
    ig.push(
3713
        Inst::new(
3714
            "isplit",
3715
            r#"
3716
        Split an integer into low and high parts.
3717

3718
        Vectors of integers are split lane-wise, so the results have the same
3719
        number of lanes as the input, but the lanes are half the size.
3720

3721
        Returns the low half of `x` and the high half of `x` as two independent
3722
        values.
3723
        "#,
3724
            &formats.unary,
3725
        )
3726
        .operands_in(vec![Operand::new("x", WideInt)])
3727
        .operands_out(vec![
3728
            Operand::new("lo", &WideInt.half_width()).with_doc("The low bits of `x`"),
3729
            Operand::new("hi", &WideInt.half_width()).with_doc("The high bits of `x`"),
3730
        ]),
3731
    );
3732

3733
    ig.push(
3734
        Inst::new(
3735
            "iconcat",
3736
            r#"
3737
        Concatenate low and high bits to form a larger integer type.
3738

3739
        Vectors of integers are concatenated lane-wise such that the result has
3740
        the same number of lanes as the inputs, but the lanes are twice the
3741
        size.
3742
        "#,
3743
            &formats.binary,
3744
        )
3745
        .operands_in(vec![
3746
            Operand::new("lo", NarrowInt),
3747
            Operand::new("hi", NarrowInt),
3748
        ])
3749
        .operands_out(vec![
3750
            Operand::new("a", &NarrowInt.double_width())
3751
                .with_doc("The concatenation of `lo` and `hi`"),
3752
        ]),
3753
    );
3754

3755
    // Instructions relating to atomic memory accesses and fences
3756
    let AtomicMem = &TypeVar::new(
3757
        "AtomicMem",
3758
        "Any type that can be stored in memory, which can be used in an atomic operation",
3759
        TypeSetBuilder::new().ints(8..128).build(),
3760
    );
3761

3762
    ig.push(
3763
        Inst::new(
3764
            "atomic_rmw",
3765
            r#"
3766
        Atomically read-modify-write memory at `p`, with second operand `x`.  The old value is
3767
        returned.  `p` has the type of the target word size, and `x` may be any integer type; note
3768
        that some targets require specific target features to be enabled in order to support 128-bit
3769
        integer atomics.  The type of the returned value is the same as the type of `x`.  This
3770
        operation is sequentially consistent and creates happens-before edges that order normal
3771
        (non-atomic) loads and stores.
3772
        "#,
3773
            &formats.atomic_rmw,
3774
        )
3775
        .operands_in(vec![
3776
            Operand::new("MemFlags", &imm.memflags),
3777
            Operand::new("AtomicRmwOp", &imm.atomic_rmw_op),
3778
            Operand::new("p", iAddr),
3779
            Operand::new("x", AtomicMem).with_doc("Value to be atomically stored"),
3780
        ])
3781
        .operands_out(vec![
3782
            Operand::new("a", AtomicMem).with_doc("Value atomically loaded"),
3783
        ])
3784
        .can_load()
3785
        .can_store()
3786
        .other_side_effects(),
3787
    );
3788

3789
    ig.push(
3790
        Inst::new(
3791
            "atomic_cas",
3792
            r#"
3793
        Perform an atomic compare-and-swap operation on memory at `p`, with expected value `e`,
3794
        storing `x` if the value at `p` equals `e`.  The old value at `p` is returned,
3795
        regardless of whether the operation succeeds or fails.  `p` has the type of the target
3796
        word size, and `x` and `e` must have the same type and the same size, which may be any
3797
        integer type; note that some targets require specific target features to be enabled in order
3798
        to support 128-bit integer atomics.  The type of the returned value is the same as the type
3799
        of `x` and `e`.  This operation is sequentially consistent and creates happens-before edges
3800
        that order normal (non-atomic) loads and stores.
3801
        "#,
3802
            &formats.atomic_cas,
3803
        )
3804
        .operands_in(vec![
3805
            Operand::new("MemFlags", &imm.memflags),
3806
            Operand::new("p", iAddr),
3807
            Operand::new("e", AtomicMem).with_doc("Expected value in CAS"),
3808
            Operand::new("x", AtomicMem).with_doc("Value to be atomically stored"),
3809
        ])
3810
        .operands_out(vec![
3811
            Operand::new("a", AtomicMem).with_doc("Value atomically loaded"),
3812
        ])
3813
        .can_load()
3814
        .can_store()
3815
        .other_side_effects(),
3816
    );
3817

3818
    ig.push(
3819
        Inst::new(
3820
            "atomic_load",
3821
            r#"
3822
        Atomically load from memory at `p`.
3823

3824
        This is a polymorphic instruction that can load any value type which has a memory
3825
        representation.  It can only be used for integer types; note that some targets require
3826
        specific target features to be enabled in order to support 128-bit integer atomics. This
3827
        operation is sequentially consistent and creates happens-before edges that order normal
3828
        (non-atomic) loads and stores.
3829
        "#,
3830
            &formats.load_no_offset,
3831
        )
3832
        .operands_in(vec![
3833
            Operand::new("MemFlags", &imm.memflags),
3834
            Operand::new("p", iAddr),
3835
        ])
3836
        .operands_out(vec![
3837
            Operand::new("a", AtomicMem).with_doc("Value atomically loaded"),
3838
        ])
3839
        .can_load()
3840
        .other_side_effects(),
3841
    );
3842

3843
    ig.push(
3844
        Inst::new(
3845
            "atomic_store",
3846
            r#"
3847
        Atomically store `x` to memory at `p`.
3848

3849
        This is a polymorphic instruction that can store any value type with a memory
3850
        representation.  It can only be used for integer types; note that some targets require
3851
        specific target features to be enabled in order to support 128-bit integer atomics This
3852
        operation is sequentially consistent and creates happens-before edges that order normal
3853
        (non-atomic) loads and stores.
3854
        "#,
3855
            &formats.store_no_offset,
3856
        )
3857
        .operands_in(vec![
3858
            Operand::new("MemFlags", &imm.memflags),
3859
            Operand::new("x", AtomicMem).with_doc("Value to be atomically stored"),
3860
            Operand::new("p", iAddr),
3861
        ])
3862
        .can_store()
3863
        .other_side_effects(),
3864
    );
3865

3866
    ig.push(
3867
        Inst::new(
3868
            "fence",
3869
            r#"
3870
        A memory fence.  This must provide ordering to ensure that, at a minimum, neither loads
3871
        nor stores of any kind may move forwards or backwards across the fence.  This operation
3872
        is sequentially consistent.
3873
        "#,
3874
            &formats.nullary,
3875
        )
3876
        .other_side_effects(),
3877
    );
3878

3879
    let TxN = &TypeVar::new(
3880
        "TxN",
3881
        "A dynamic vector type",
3882
        TypeSetBuilder::new()
3883
            .ints(Interval::All)
3884
            .floats(Interval::All)
3885
            .dynamic_simd_lanes(Interval::All)
3886
            .build(),
3887
    );
3888

3889
    ig.push(
3890
        Inst::new(
3891
            "extract_vector",
3892
            r#"
3893
        Return a fixed length sub vector, extracted from a dynamic vector.
3894
        "#,
3895
            &formats.binary_imm8,
3896
        )
3897
        .operands_in(vec![
3898
            Operand::new("x", TxN).with_doc("The dynamic vector to extract from"),
3899
            Operand::new("y", &imm.uimm8).with_doc("128-bit vector index"),
3900
        ])
3901
        .operands_out(vec![
3902
            Operand::new("a", &TxN.dynamic_to_vector()).with_doc("New fixed vector"),
3903
        ]),
3904
    );
3905
}
3906

3907
Product

Resources

Company