// Path: cranelift/codegen/src/isa/aarch64/inst/mod.rs
//! This module defines aarch64-specific machine instruction types.

use crate::binemit::{Addend, CodeOffset, Reloc};
use crate::ir::types::{F16, F32, F64, F128, I8, I8X16, I16, I32, I64, I128};
use crate::ir::{MemFlags, Type, types};
use crate::isa::{CallConv, FunctionAlignment};
use crate::machinst::*;
use crate::{CodegenError, CodegenResult, settings};

use crate::machinst::{PrettyPrint, Reg, RegClass, Writable};

use alloc::string::{String, ToString};
use alloc::vec::Vec;
use core::fmt::Write;
use core::slice;
use smallvec::{SmallVec, smallvec};

pub(crate) mod regs;
pub(crate) use self::regs::*;
pub mod imms;
pub use self::imms::*;
pub mod args;
pub use self::args::*;
pub mod emit;
pub(crate) use self::emit::*;
use crate::isa::aarch64::abi::AArch64MachineDeps;

pub(crate) mod unwind;

#[cfg(test)]
mod emit_tests;

//=============================================================================
// Instructions (top level): definition

pub use crate::isa::aarch64::lower::isle::generated_code::{
    ALUOp, ALUOp3, AMode, APIKey, AtomicRMWLoopOp, AtomicRMWOp, BitOp, BranchTargetType, FPUOp1,
    FPUOp2, FPUOp3, FpuRoundMode, FpuToIntOp, IntToFpuOp, MInst as Inst, MoveWideOp, VecALUModOp,
    VecALUOp, VecExtendOp, VecLanesOp, VecMisc2, VecPairOp, VecRRLongOp, VecRRNarrowOp,
    VecRRPairLongOp, VecRRRLongModOp, VecRRRLongOp, VecShiftImmModOp, VecShiftImmOp,
};

/// A floating-point unit (FPU) operation with two args, a register and an immediate.
#[derive(Copy, Clone, Debug)]
pub enum FPUOpRI {
    /// Unsigned right shift. Rd = Rn >> #imm
    UShr32(FPURightShiftImm),
    /// Unsigned right shift. Rd = Rn >> #imm
    UShr64(FPURightShiftImm),
}

/// A floating-point unit (FPU) operation with two args, a register and
/// an immediate that modifies its dest (so takes that input value as a
/// separate virtual register).
#[derive(Copy, Clone, Debug)]
pub enum FPUOpRIMod {
    /// Shift left and insert. Rd |= Rn << #imm
    Sli32(FPULeftShiftImm),
    /// Shift left and insert. Rd |= Rn << #imm
    Sli64(FPULeftShiftImm),
}

impl BitOp {
    /// Get the assembly mnemonic for this opcode.
    pub fn op_str(&self) -> &'static str {
        match self {
            BitOp::RBit => "rbit",
            BitOp::Clz => "clz",
            BitOp::Cls => "cls",
            BitOp::Rev16 => "rev16",
            BitOp::Rev32 => "rev32",
            BitOp::Rev64 => "rev64",
        }
    }
}

/// Additional information for `return_call[_ind]` instructions, left out of
/// line to lower the size of the `Inst` enum.
#[derive(Clone, Debug)]
pub struct ReturnCallInfo<T> {
    /// Where this call is going to
    pub dest: T,
    /// Arguments to the call instruction.
    pub uses: CallArgList,
    /// The size of the new stack frame's stack arguments. This is necessary
    /// for copying the frame over our current frame. It must already be
    /// allocated on the stack.
    pub new_stack_arg_size: u32,
    /// API key to use to restore the return address, if any.
    pub key: Option<APIKey>,
}

/// Count how many of the low `num_half_words` 16-bit half-words of `value`
/// are zero. Used to decide whether MOVZ or MOVN needs fewer instructions.
fn count_zero_half_words(mut value: u64, num_half_words: u8) -> usize {
    let mut count = 0;
    for _ in 0..num_half_words {
        if value & 0xffff == 0 {
            count += 1;
        }
        value >>= 16;
    }

    count
}

impl Inst {
    /// Create an instruction that loads a constant, using one of several options (MOVZ, MOVN,
    /// logical immediate, or constant pool).
    pub fn load_constant(rd: Writable<Reg>, value: u64) -> SmallVec<[Inst; 4]> {
        // NB: this is duplicated in `lower/isle.rs` and `inst.isle` right now,
        // if modifications are made here before this is deleted after moving to
        // ISLE then those locations should be updated as well.

        if let Some(imm) = MoveWideConst::maybe_from_u64(value) {
            // 16-bit immediate (shifted by 0, 16, 32 or 48 bits) in MOVZ
            smallvec![Inst::MovWide {
                op: MoveWideOp::MovZ,
                rd,
                imm,
                size: OperandSize::Size64
            }]
        } else if let Some(imm) = MoveWideConst::maybe_from_u64(!value) {
            // 16-bit immediate (shifted by 0, 16, 32 or 48 bits) in MOVN
            smallvec![Inst::MovWide {
                op: MoveWideOp::MovN,
                rd,
                imm,
                size: OperandSize::Size64
            }]
        } else if let Some(imml) = ImmLogic::maybe_from_u64(value, I64) {
            // Weird logical-instruction immediate in ORI using zero register
            smallvec![Inst::AluRRImmLogic {
                alu_op: ALUOp::Orr,
                size: OperandSize::Size64,
                rd,
                rn: zero_reg(),
                imml,
            }]
        } else {
            let mut insts = smallvec![];

            // If the top 32 bits are zero, use 32-bit `mov` operations.
            let (num_half_words, size, negated) = if value >> 32 == 0 {
                (2, OperandSize::Size32, (!value << 32) >> 32)
            } else {
                (4, OperandSize::Size64, !value)
            };

            // If the number of 0xffff half words is greater than the number of 0x0000 half words
            // it is more efficient to use `movn` for the first instruction.
            let first_is_inverted = count_zero_half_words(negated, num_half_words)
                > count_zero_half_words(value, num_half_words);

            // Either 0xffff or 0x0000 half words can be skipped, depending on the first
            // instruction used.
            let ignored_halfword = if first_is_inverted { 0xffff } else { 0 };

            let halfwords: SmallVec<[_; 4]> = (0..num_half_words)
                .filter_map(|i| {
                    let imm16 = (value >> (16 * i)) & 0xffff;
                    if imm16 == ignored_halfword {
                        None
                    } else {
                        Some((i, imm16))
                    }
                })
                .collect();

            let mut prev_result = None;
            for (i, imm16) in halfwords {
                let shift = i * 16;

                if let Some(rn) = prev_result {
                    // Subsequent half-words are merged in with MOVK.
                    let imm = MoveWideConst::maybe_with_shift(imm16 as u16, shift).unwrap();
                    insts.push(Inst::MovK { rd, rn, imm, size });
                } else {
                    if first_is_inverted {
                        let imm =
                            MoveWideConst::maybe_with_shift(((!imm16) & 0xffff) as u16, shift)
                                .unwrap();
                        insts.push(Inst::MovWide {
                            op: MoveWideOp::MovN,
                            rd,
                            imm,
                            size,
                        });
                    } else {
                        let imm = MoveWideConst::maybe_with_shift(imm16 as u16, shift).unwrap();
                        insts.push(Inst::MovWide {
                            op: MoveWideOp::MovZ,
                            rd,
                            imm,
                            size,
                        });
                    }
                }

                prev_result = Some(rd.to_reg());
            }

            assert!(prev_result.is_some());

            insts
        }
    }

    /// Generic constructor for a load (zero-extending where appropriate).
    pub fn gen_load(into_reg: Writable<Reg>, mem: AMode, ty: Type, flags: MemFlags) -> Inst {
        match ty {
            I8 => Inst::ULoad8 {
                rd: into_reg,
                mem,
                flags,
            },
            I16 => Inst::ULoad16 {
                rd: into_reg,
                mem,
                flags,
            },
            I32 => Inst::ULoad32 {
                rd: into_reg,
                mem,
                flags,
            },
            I64 => Inst::ULoad64 {
                rd: into_reg,
                mem,
                flags,
            },
            _ => {
                if ty.is_vector() || ty.is_float() {
                    let bits = ty_bits(ty);
                    let rd = into_reg;

                    match bits {
                        128 => Inst::FpuLoad128 { rd, mem, flags },
                        64 => Inst::FpuLoad64 { rd, mem, flags },
                        32 => Inst::FpuLoad32 { rd, mem, flags },
                        16 => Inst::FpuLoad16 { rd, mem, flags },
                        _ => unimplemented!("gen_load({})", ty),
                    }
                } else {
                    unimplemented!("gen_load({})", ty);
                }
            }
        }
    }

    /// Generic constructor for a store.
    pub fn gen_store(mem: AMode, from_reg: Reg, ty: Type, flags: MemFlags) -> Inst {
        match ty {
            I8 => Inst::Store8 {
                rd: from_reg,
                mem,
                flags,
            },
            I16 => Inst::Store16 {
                rd: from_reg,
                mem,
                flags,
            },
            I32 => Inst::Store32 {
                rd: from_reg,
                mem,
                flags,
            },
            I64 => Inst::Store64 {
                rd: from_reg,
                mem,
                flags,
            },
            _ => {
                if ty.is_vector() || ty.is_float() {
                    let bits = ty_bits(ty);
                    let rd = from_reg;

                    match bits {
                        128 => Inst::FpuStore128 { rd, mem, flags },
                        64 => Inst::FpuStore64 { rd, mem, flags },
                        32 => Inst::FpuStore32 { rd, mem, flags },
                        16 => Inst::FpuStore16 { rd, mem, flags },
                        _ => unimplemented!("gen_store({})", ty),
                    }
                } else {
                    unimplemented!("gen_store({})", ty);
                }
            }
        }
    }

    /// What type does this load or store instruction access in memory? When
    /// uimm12 encoding is used, the size of this type is the amount that
    /// immediate offsets are scaled by.
    pub fn mem_type(&self) -> Option<Type> {
        match self {
            Inst::ULoad8 { .. } => Some(I8),
            Inst::SLoad8 { .. } => Some(I8),
            Inst::ULoad16 { .. } => Some(I16),
            Inst::SLoad16 { .. } => Some(I16),
            Inst::ULoad32 { .. } => Some(I32),
            Inst::SLoad32 { .. } => Some(I32),
            Inst::ULoad64 { .. } => Some(I64),
            Inst::FpuLoad16 { .. } => Some(F16),
            Inst::FpuLoad32 { .. } => Some(F32),
            Inst::FpuLoad64 { .. } => Some(F64),
            Inst::FpuLoad128 { .. } => Some(I8X16),
            Inst::Store8 { .. } => Some(I8),
            Inst::Store16 { .. } => Some(I16),
            Inst::Store32 { .. } => Some(I32),
            Inst::Store64 { .. } => Some(I64),
            Inst::FpuStore16 { .. } => Some(F16),
            Inst::FpuStore32 { .. } => Some(F32),
            Inst::FpuStore64 { .. } => Some(F64),
            Inst::FpuStore128 { .. } => Some(I8X16),
            _ => None,
        }
    }
}

//=============================================================================
// Instructions: get_regs

/// Report the registers read by an addressing mode to the operand collector.
fn memarg_operands(memarg: &mut AMode, collector: &mut impl OperandVisitor) {
    match memarg {
        AMode::Unscaled { rn, .. } | AMode::UnsignedOffset { rn, .. } => {
            collector.reg_use(rn);
        }
        AMode::RegReg { rn, rm, .. }
        | AMode::RegScaled { rn, rm, .. }
        | AMode::RegScaledExtended { rn, rm, .. }
        | AMode::RegExtended { rn, rm, .. } => {
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        AMode::Label { .. } => {}
        AMode::SPPreIndexed { .. } | AMode::SPPostIndexed { .. } => {}
        AMode::FPOffset { .. } | AMode::IncomingArg { .. } => {}
        AMode::SPOffset { .. } | AMode::SlotOffset { .. } => {}
        AMode::RegOffset { rn, .. } => {
            collector.reg_use(rn);
        }
        AMode::Const { .. } => {}
    }
}

/// Report the registers read by a pair-addressing mode to the operand collector.
fn pairmemarg_operands(pairmemarg: &mut PairAMode, collector: &mut impl OperandVisitor) {
    match pairmemarg {
        PairAMode::SignedOffset { reg, .. } => {
            collector.reg_use(reg);
        }
        PairAMode::SPPreIndexed { .. } | PairAMode::SPPostIndexed { .. } => {}
    }
}

/// Visit every register operand of `inst` (defs, uses, fixed-register
/// constraints, reuse constraints, and clobbers) for register allocation.
fn aarch64_get_operands(inst: &mut Inst, collector: &mut impl OperandVisitor) {
    match inst {
        Inst::AluRRR { rd, rn, rm, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::AluRRRR { rd, rn, rm, ra, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
            collector.reg_use(ra);
        }
        Inst::AluRRImm12 { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::AluRRImmLogic { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::AluRRImmShift { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::AluRRRShift { rd, rn, rm, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::AluRRRExtend { rd, rn, rm, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::BitRR { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::ULoad8 { rd, mem, .. }
        | Inst::SLoad8 { rd, mem, .. }
        | Inst::ULoad16 { rd, mem, .. }
        | Inst::SLoad16 { rd, mem, .. }
        | Inst::ULoad32 { rd, mem, .. }
        | Inst::SLoad32 { rd, mem, .. }
        | Inst::ULoad64 { rd, mem, .. } => {
            collector.reg_def(rd);
            memarg_operands(mem, collector);
        }
        Inst::Store8 { rd, mem, .. }
        | Inst::Store16 { rd, mem, .. }
        | Inst::Store32 { rd, mem, .. }
        | Inst::Store64 { rd, mem, .. } => {
            collector.reg_use(rd);
            memarg_operands(mem, collector);
        }
        Inst::StoreP64 { rt, rt2, mem, .. } => {
            collector.reg_use(rt);
            collector.reg_use(rt2);
            pairmemarg_operands(mem, collector);
        }
        Inst::LoadP64 { rt, rt2, mem, .. } => {
            collector.reg_def(rt);
            collector.reg_def(rt2);
            pairmemarg_operands(mem, collector);
        }
        Inst::Mov { rd, rm, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rm);
        }
        Inst::MovFromPReg { rd, rm } => {
            debug_assert!(rd.to_reg().is_virtual());
            collector.reg_def(rd);
            collector.reg_fixed_nonallocatable(*rm);
        }
        Inst::MovToPReg { rd, rm } => {
            debug_assert!(rm.is_virtual());
            collector.reg_fixed_nonallocatable(*rd);
            collector.reg_use(rm);
        }
        Inst::MovK { rd, rn, .. } => {
            collector.reg_use(rn);
            collector.reg_reuse_def(rd, 0); // `rn` == `rd`.
        }
        Inst::MovWide { rd, .. } => {
            collector.reg_def(rd);
        }
        Inst::CSel { rd, rn, rm, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::CSNeg { rd, rn, rm, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::CSet { rd, .. } | Inst::CSetm { rd, .. } => {
            collector.reg_def(rd);
        }
        Inst::CCmp { rn, rm, .. } => {
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::CCmpImm { rn, .. } => {
            collector.reg_use(rn);
        }
        Inst::AtomicRMWLoop {
            op,
            addr,
            operand,
            oldval,
            scratch1,
            scratch2,
            ..
        } => {
            collector.reg_fixed_use(addr, xreg(25));
            collector.reg_fixed_use(operand, xreg(26));
            collector.reg_fixed_def(oldval, xreg(27));
            collector.reg_fixed_def(scratch1, xreg(24));
            if *op != AtomicRMWLoopOp::Xchg {
                collector.reg_fixed_def(scratch2, xreg(28));
            }
        }
        Inst::AtomicRMW { rs, rt, rn, .. } => {
            collector.reg_use(rs);
            collector.reg_def(rt);
            collector.reg_use(rn);
        }
        Inst::AtomicCAS { rd, rs, rt, rn, .. } => {
            collector.reg_reuse_def(rd, 1); // reuse `rs`.
            collector.reg_use(rs);
            collector.reg_use(rt);
            collector.reg_use(rn);
        }
        Inst::AtomicCASLoop {
            addr,
            expected,
            replacement,
            oldval,
            scratch,
            ..
        } => {
            collector.reg_fixed_use(addr, xreg(25));
            collector.reg_fixed_use(expected, xreg(26));
            collector.reg_fixed_use(replacement, xreg(28));
            collector.reg_fixed_def(oldval, xreg(27));
            collector.reg_fixed_def(scratch, xreg(24));
        }
        Inst::LoadAcquire { rt, rn, .. } => {
            collector.reg_use(rn);
            collector.reg_def(rt);
        }
        Inst::StoreRelease { rt, rn, .. } => {
            collector.reg_use(rn);
            collector.reg_use(rt);
        }
        Inst::Fence {} | Inst::Csdb {} => {}
        Inst::FpuMove32 { rd, rn } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::FpuMove64 { rd, rn } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::FpuMove128 { rd, rn } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::FpuMoveFromVec { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::FpuExtend { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::FpuRR { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::FpuRRR { rd, rn, rm, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::FpuRRI { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::FpuRRIMod { rd, ri, rn, .. } => {
            collector.reg_reuse_def(rd, 1); // reuse `ri`.
            collector.reg_use(ri);
            collector.reg_use(rn);
        }
        Inst::FpuRRRR { rd, rn, rm, ra, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
            collector.reg_use(ra);
        }
        Inst::VecMisc { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }

        Inst::VecLanes { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::VecShiftImm { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::VecShiftImmMod { rd, ri, rn, .. } => {
            collector.reg_reuse_def(rd, 1); // `rd` == `ri`.
            collector.reg_use(ri);
            collector.reg_use(rn);
        }
        Inst::VecExtract { rd, rn, rm, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::VecTbl { rd, rn, rm } => {
            collector.reg_use(rn);
            collector.reg_use(rm);
            collector.reg_def(rd);
        }
        Inst::VecTblExt { rd, ri, rn, rm } => {
            collector.reg_use(rn);
            collector.reg_use(rm);
            collector.reg_reuse_def(rd, 3); // `rd` == `ri`.
            collector.reg_use(ri);
        }

        Inst::VecTbl2 { rd, rn, rn2, rm } => {
            // Constrain to v30 / v31 so that we satisfy the "adjacent
            // registers" constraint without use of pinned vregs in
            // lowering.
            collector.reg_fixed_use(rn, vreg(30));
            collector.reg_fixed_use(rn2, vreg(31));
            collector.reg_use(rm);
            collector.reg_def(rd);
        }
        Inst::VecTbl2Ext {
            rd,
            ri,
            rn,
            rn2,
            rm,
        } => {
            // Constrain to v30 / v31 so that we satisfy the "adjacent
            // registers" constraint without use of pinned vregs in
            // lowering.
            collector.reg_fixed_use(rn, vreg(30));
            collector.reg_fixed_use(rn2, vreg(31));
            collector.reg_use(rm);
            collector.reg_reuse_def(rd, 4); // `rd` == `ri`.
            collector.reg_use(ri);
        }
        Inst::VecLoadReplicate { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::VecCSel { rd, rn, rm, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::FpuCmp { rn, rm, .. } => {
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::FpuLoad16 { rd, mem, .. } => {
            collector.reg_def(rd);
            memarg_operands(mem, collector);
        }
        Inst::FpuLoad32 { rd, mem, .. } => {
            collector.reg_def(rd);
            memarg_operands(mem, collector);
        }
        Inst::FpuLoad64 { rd, mem, .. } => {
            collector.reg_def(rd);
            memarg_operands(mem, collector);
        }
        Inst::FpuLoad128 { rd, mem, .. } => {
            collector.reg_def(rd);
            memarg_operands(mem, collector);
        }
        Inst::FpuStore16 { rd, mem, .. } => {
            collector.reg_use(rd);
            memarg_operands(mem, collector);
        }
        Inst::FpuStore32 { rd, mem, .. } => {
            collector.reg_use(rd);
            memarg_operands(mem, collector);
        }
        Inst::FpuStore64 { rd, mem, .. } => {
            collector.reg_use(rd);
            memarg_operands(mem, collector);
        }
        Inst::FpuStore128 { rd, mem, .. } => {
            collector.reg_use(rd);
            memarg_operands(mem, collector);
        }
        Inst::FpuLoadP64 { rt, rt2, mem, .. } => {
            collector.reg_def(rt);
            collector.reg_def(rt2);
            pairmemarg_operands(mem, collector);
        }
        Inst::FpuStoreP64 { rt, rt2, mem, .. } => {
            collector.reg_use(rt);
            collector.reg_use(rt2);
            pairmemarg_operands(mem, collector);
        }
        Inst::FpuLoadP128 { rt, rt2, mem, .. } => {
            collector.reg_def(rt);
            collector.reg_def(rt2);
            pairmemarg_operands(mem, collector);
        }
        Inst::FpuStoreP128 { rt, rt2, mem, .. } => {
            collector.reg_use(rt);
            collector.reg_use(rt2);
            pairmemarg_operands(mem, collector);
        }
        Inst::FpuToInt { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::IntToFpu { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::FpuCSel16 { rd, rn, rm, .. }
        | Inst::FpuCSel32 { rd, rn, rm, .. }
        | Inst::FpuCSel64 { rd, rn, rm, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::FpuRound { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::MovToFpu { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::FpuMoveFPImm { rd, .. } => {
            collector.reg_def(rd);
        }
        Inst::MovToVec { rd, ri, rn, .. } => {
            collector.reg_reuse_def(rd, 1); // `rd` == `ri`.
            collector.reg_use(ri);
            collector.reg_use(rn);
        }
        Inst::MovFromVec { rd, rn, .. } | Inst::MovFromVecSigned { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::VecDup { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::VecDupFromFpu { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::VecDupFPImm { rd, .. } => {
            collector.reg_def(rd);
        }
        Inst::VecDupImm { rd, .. } => {
            collector.reg_def(rd);
        }
        Inst::VecExtend { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::VecMovElement { rd, ri, rn, .. } => {
            collector.reg_reuse_def(rd, 1); // `rd` == `ri`.
            collector.reg_use(ri);
            collector.reg_use(rn);
        }
        Inst::VecRRLong { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::VecRRNarrowLow { rd, rn, .. } => {
            collector.reg_use(rn);
            collector.reg_def(rd);
        }
        Inst::VecRRNarrowHigh { rd, ri, rn, .. } => {
            collector.reg_use(rn);
            collector.reg_reuse_def(rd, 2); // `rd` == `ri`.
            collector.reg_use(ri);
        }
        Inst::VecRRPair { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::VecRRRLong { rd, rn, rm, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::VecRRRLongMod { rd, ri, rn, rm, .. } => {
            collector.reg_reuse_def(rd, 1); // `rd` == `ri`.
            collector.reg_use(ri);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::VecRRPairLong { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::VecRRR { rd, rn, rm, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::VecRRRMod { rd, ri, rn, rm, .. } | Inst::VecFmlaElem { rd, ri, rn, rm, .. } => {
            collector.reg_reuse_def(rd, 1); // `rd` == `ri`.
            collector.reg_use(ri);
            collector.reg_use(rn);
            collector.reg_use(rm);
        }
        Inst::MovToNZCV { rn } => {
            collector.reg_use(rn);
        }
        Inst::MovFromNZCV { rd } => {
            collector.reg_def(rd);
        }
        Inst::Extend { rd, rn, .. } => {
            collector.reg_def(rd);
            collector.reg_use(rn);
        }
        Inst::Args { args } => {
            for ArgPair { vreg, preg } in args {
                collector.reg_fixed_def(vreg, *preg);
            }
        }
        Inst::Rets { rets } => {
            for RetPair { vreg, preg } in rets {
                collector.reg_fixed_use(vreg, *preg);
            }
        }
        Inst::Ret { .. } | Inst::AuthenticatedRet { .. } => {}
        Inst::Jump { .. } => {}
        Inst::Call { info, .. } => {
            let CallInfo { uses, defs, .. } = &mut **info;
            for CallArgPair { vreg, preg } in uses {
                collector.reg_fixed_use(vreg, *preg);
            }
            for CallRetPair { vreg, location } in defs {
                match location {
                    RetLocation::Reg(preg, ..) => collector.reg_fixed_def(vreg, *preg),
                    RetLocation::Stack(..) => collector.any_def(vreg),
                }
            }
            collector.reg_clobbers(info.clobbers);
            if let Some(try_call_info) = &mut info.try_call_info {
                try_call_info.collect_operands(collector);
            }
        }
        Inst::CallInd { info, .. } => {
            let CallInfo {
                dest, uses, defs, ..
            } = &mut **info;
            collector.reg_use(dest);
            for CallArgPair { vreg, preg } in uses {
                collector.reg_fixed_use(vreg, *preg);
            }
            for CallRetPair { vreg, location } in defs {
                match location {
                    RetLocation::Reg(preg, ..) => collector.reg_fixed_def(vreg, *preg),
                    RetLocation::Stack(..) => collector.any_def(vreg),
                }
            }
            collector.reg_clobbers(info.clobbers);
            if let Some(try_call_info) = &mut info.try_call_info {
                try_call_info.collect_operands(collector);
            }
        }
        Inst::ReturnCall { info } => {
            for CallArgPair { vreg, preg } in &mut info.uses {
                collector.reg_fixed_use(vreg, *preg);
            }
        }
        Inst::ReturnCallInd { info } => {
            // TODO(https://github.com/bytecodealliance/regalloc2/issues/145):
            // This shouldn't be a fixed register constraint, but it's not clear how to pick a
            // register that won't be clobbered by the callee-save restore code emitted with a
            // return_call_indirect.
            collector.reg_fixed_use(&mut info.dest, xreg(1));
            for CallArgPair { vreg, preg } in &mut info.uses {
                collector.reg_fixed_use(vreg, *preg);
            }
        }
        Inst::CondBr { kind, .. } => match kind {
            CondBrKind::Zero(rt, _) | CondBrKind::NotZero(rt, _) => collector.reg_use(rt),
            CondBrKind::Cond(_) => {}
        },
        Inst::TestBitAndBranch { rn, .. } => {
            collector.reg_use(rn);
        }
        Inst::IndirectBr { rn, .. } => {
            collector.reg_use(rn);
        }
        Inst::Nop0 | Inst::Nop4 => {}
        Inst::Brk => {}
        Inst::Udf { .. } => {}
        Inst::TrapIf { kind, .. } => match kind {
            CondBrKind::Zero(rt, _) | CondBrKind::NotZero(rt, _) => collector.reg_use(rt),
            CondBrKind::Cond(_) => {}
        },
        Inst::Adr { rd, .. } | Inst::Adrp { rd, .. } => {
            collector.reg_def(rd);
        }
        Inst::Word4 { .. } | Inst::Word8 { .. } => {}
        Inst::JTSequence {
            ridx, rtmp1, rtmp2, ..
        } => {
            collector.reg_use(ridx);
            collector.reg_early_def(rtmp1);
            collector.reg_early_def(rtmp2);
        }
        Inst::LoadExtNameGot { rd, .. }
        | Inst::LoadExtNameNear { rd, .. }
        | Inst::LoadExtNameFar { rd, .. } => {
            collector.reg_def(rd);
        }
        Inst::LoadAddr { rd, mem } => {
            collector.reg_def(rd);
            memarg_operands(mem, collector);
        }
        Inst::Paci { .. } | Inst::Xpaclri => {
            // Neither LR nor SP is an allocatable register, so there is no need
            // to do anything.
        }
        Inst::Bti { .. } => {}

        Inst::ElfTlsGetAddr { rd, tmp, .. } => {
            // TLSDESC has a very neat calling convention. It is required to preserve
            // all registers except x0 and x30. X30 is non allocatable in cranelift since
            // its the link register.
            //
            // Additionally we need a second register as a temporary register for the
            // TLSDESC sequence. This register can be any register other than x0 (and x30).
            collector.reg_fixed_def(rd, regs::xreg(0));
            collector.reg_early_def(tmp);
        }
        Inst::MachOTlsGetAddr { rd, .. } => {
            collector.reg_fixed_def(rd, regs::xreg(0));
            let mut clobbers =
                AArch64MachineDeps::get_regs_clobbered_by_call(CallConv::AppleAarch64, false);
            clobbers.remove(regs::xreg_preg(0));
            collector.reg_clobbers(clobbers);
        }
        Inst::Unwind { .. } => {}
        Inst::EmitIsland { .. } => {}
        Inst::DummyUse { reg } => {
            collector.reg_use(reg);
        }
        Inst::LabelAddress { dst, .. } => {
            collector.reg_def(dst);
        }
        Inst::SequencePoint { .. } => {}
        Inst::StackProbeLoop { start, end, .. } => {
            collector.reg_early_def(start);
            collector.reg_use(end);
        }
    }
}

//=============================================================================
// Instructions: misc functions and external interface

impl MachInst for Inst {
    type ABIMachineSpec = AArch64MachineDeps;
    type LabelUse = LabelUse;

    // "CLIF" in hex, to make the trap recognizable during
    // debugging.
    const TRAP_OPCODE: &'static [u8] = &0xc11f_u32.to_le_bytes();

    fn get_operands(&mut self, collector: &mut impl OperandVisitor) {
        aarch64_get_operands(self, collector);
    }

    fn is_move(&self) -> Option<(Writable<Reg>, Reg)> {
        match self {
            &Inst::Mov {
                size: OperandSize::Size64,
                rd,
                rm,
            } => Some((rd, rm)),
            &Inst::FpuMove64 { rd, rn } => Some((rd, rn)),
            &Inst::FpuMove128 { rd, rn } => Some((rd, rn)),
            _ => None,
        }
    }

    fn is_included_in_clobbers(&self) -> bool {
        let (caller, callee, is_exception) = match self {
            Inst::Args { .. } => return false,
            Inst::Call { info } => (
                info.caller_conv,
                info.callee_conv,
                info.try_call_info.is_some(),
            ),
            Inst::CallInd { info } => (
                info.caller_conv,
                info.callee_conv,
                info.try_call_info.is_some(),
            ),
            _ => return true,
        };

        // We exclude call instructions from the clobber-set when they are calls
        // from caller to callee that both clobber the same register (such as
        // using the same or similar ABIs). Such calls cannot possibly force any
        // new registers to be saved in the prologue, because anything that the
        // callee clobbers, the caller is also allowed to clobber. This both
        // saves work and enables us to more precisely follow the
        // half-caller-save, half-callee-save SysV ABI for some vector
        // registers.
        //
        // See the note in [crate::isa::aarch64::abi::is_caller_save_reg] for
        // more information on this ABI-implementation hack.
        let caller_clobbers = AArch64MachineDeps::get_regs_clobbered_by_call(caller, false);
        let callee_clobbers = AArch64MachineDeps::get_regs_clobbered_by_call(callee, is_exception);

        let mut all_clobbers = caller_clobbers;
        all_clobbers.union_from(callee_clobbers);
        all_clobbers != caller_clobbers
    }

    fn is_trap(&self) -> bool {
        match self {
            Self::Udf { .. } => true,
            _ => false,
        }
    }

    fn is_args(&self) -> bool {
        match self {
            Self::Args { .. } => true,
            _ => false,
        }
    }

    fn call_type(&self) -> CallType {
        match self {
            Inst::Call { .. }
            | Inst::CallInd { .. }
            | Inst::ElfTlsGetAddr { .. }
            | Inst::MachOTlsGetAddr { .. } => CallType::Regular,

            Inst::ReturnCall { .. } | Inst::ReturnCallInd { .. } => CallType::TailCall,

            _ => CallType::None,
        }
    }

    fn is_term(&self) -> MachTerminator {
        match self {
            &Inst::Rets { .. } => MachTerminator::Ret,
            &Inst::ReturnCall { .. } | &Inst::ReturnCallInd { .. } => MachTerminator::RetCall,
            &Inst::Jump { .. } => MachTerminator::Branch,
            &Inst::CondBr { .. } => MachTerminator::Branch,
            &Inst::TestBitAndBranch { .. } => MachTerminator::Branch,
            &Inst::IndirectBr { .. } => MachTerminator::Branch,
            &Inst::JTSequence { .. } => MachTerminator::Branch,
            &Inst::Call { ref info } if info.try_call_info.is_some() => MachTerminator::Branch,
            &Inst::CallInd { ref info } if info.try_call_info.is_some() => MachTerminator::Branch,
            _ => MachTerminator::None,
        }
    }

    fn is_mem_access(&self) -> bool {
        match self {
            &Inst::ULoad8 { .. }
            | &Inst::SLoad8 { .. }
            | &Inst::ULoad16 { .. }
            | &Inst::SLoad16 { .. }
            | &Inst::ULoad32 { .. }
            | &Inst::SLoad32 { .. }
            | &Inst::ULoad64 { .. }
            | &Inst::LoadP64 { .. }
            | &Inst::FpuLoad16 { .. }
            | &Inst::FpuLoad32 { .. }
            | &Inst::FpuLoad64 { .. }
            | &Inst::FpuLoad128 { .. }
            | &Inst::FpuLoadP64 { .. }
            | &Inst::FpuLoadP128 { .. }
            | &Inst::Store8 { .. }
            | &Inst::Store16 { .. }
            | &Inst::Store32 { .. }
            | &Inst::Store64 { .. }
            | &Inst::StoreP64 { .. }
            | &Inst::FpuStore16 { .. }
            | &Inst::FpuStore32 { .. }
            | &Inst::FpuStore64 { .. }
            | &Inst::FpuStore128 { .. } => true,
            // TODO: verify this carefully
            _ => false,
        }
    }

    fn gen_move(to_reg: Writable<Reg>, from_reg: Reg, ty: Type) -> Inst {
        let bits = ty.bits();

        assert!(bits <= 128);
        assert!(to_reg.to_reg().class() == from_reg.class());
        match from_reg.class() {
            RegClass::Int => Inst::Mov {
                size: OperandSize::Size64,
                rd: to_reg,
                rm: from_reg,
            },
            RegClass::Float => {
                if bits > 64 {
                    Inst::FpuMove128 {
                        rd: to_reg,
                        rn: from_reg,
                    }
                } else {
                    Inst::FpuMove64 {
                        rd: to_reg,
                        rn: from_reg,
                    }
                }
            }
            RegClass::Vector => unreachable!(),
        }
    }

    fn is_safepoint(&self) -> bool {
        match self {
            Inst::Call { .. } | Inst::CallInd { .. } => true,
            _ => false,
        }
    }

    fn gen_dummy_use(reg: Reg) -> Inst {
        Inst::DummyUse { reg }
    }

    fn gen_nop(preferred_size: usize) -> Inst {
        if preferred_size == 0 {
            return Inst::Nop0;
        }
        // We can't give a NOP (or any insn) < 4 bytes.
        assert!(preferred_size >= 4);
        Inst::Nop4
    }

    fn gen_nop_units() -> Vec<Vec<u8>> {
        vec![vec![0x1f, 0x20, 0x03, 0xd5]]
    }

    fn rc_for_type(ty: Type) -> CodegenResult<(&'static [RegClass], &'static [Type])> {
        match ty {
            I8 => Ok((&[RegClass::Int], &[I8])),
            I16 => Ok((&[RegClass::Int], &[I16])),
            I32 => Ok((&[RegClass::Int], &[I32])),
            I64 => Ok((&[RegClass::Int], &[I64])),
            F16 => Ok((&[RegClass::Float], &[F16])),
            F32 => Ok((&[RegClass::Float], &[F32])),
            F64 => Ok((&[RegClass::Float], &[F64])),
            F128 => Ok((&[RegClass::Float], &[F128])),
            I128 => Ok((&[RegClass::Int, RegClass::Int], &[I64, I64])),
            _ if ty.is_vector() && ty.bits() <= 128 => {
                let types = &[types::I8X2, types::I8X4, types::I8X8, types::I8X16];
                Ok((
                    &[RegClass::Float],
                    slice::from_ref(&types[ty.bytes().ilog2() as usize - 1]),
                ))
            }
            _ if ty.is_dynamic_vector() => Ok((&[RegClass::Float], &[I8X16])),
            _ => Err(CodegenError::Unsupported(format!(
                "Unexpected SSA-value type: {ty}"
            ))),
        }
    }

    fn canonical_type_for_rc(rc: RegClass) -> Type {
        match rc {
            RegClass::Float => types::I8X16,
            RegClass::Int => types::I64,
            RegClass::Vector => unreachable!(),
        }
    }

    fn gen_jump(target: MachLabel) -> Inst {
        Inst::Jump {
            dest: BranchTarget::Label(target),
        }
    }

    fn worst_case_size() -> CodeOffset {
        // The maximum size, in bytes, of any `Inst`'s emitted code. We have at least one case of
        // an 8-instruction sequence (saturating int-to-float conversions) with three embedded
        // 64-bit f64 constants.
        //
        // Note that inline jump-tables handle island/pool insertion separately, so we do not need
        // to account for them here (otherwise the worst case would be 2^31 * 4, clearly not
        // feasible for other reasons).
        44
    }

    fn ref_type_regclass(_: &settings::Flags) -> RegClass {
        RegClass::Int
    }

    fn gen_block_start(
        is_indirect_branch_target: bool,
        is_forward_edge_cfi_enabled: bool,
    ) -> Option<Self> {
        if is_indirect_branch_target && is_forward_edge_cfi_enabled {
            Some(Inst::Bti {
                targets: BranchTargetType::J,
            })
        } else {
            None
        }
    }

    fn function_alignment() -> FunctionAlignment {
        // We use 32-byte alignment for performance reasons, but for correctness
        // we would only need 4-byte alignment.
        FunctionAlignment {
            minimum: 4,
            preferred: 32,
        }
    }
}

//=============================================================================
// Pretty-printing of instructions.

/// Finalize `mem` for display: returns the pretty-printed preamble
/// instructions (if any) and the finalized addressing-mode string.
fn mem_finalize_for_show(mem: &AMode, access_ty: Type, state: &EmitState) -> (String, String) {
    let (mem_insts, mem) = mem_finalize(None, mem, access_ty, state);
    let mut mem_str = mem_insts
        .into_iter()
        .map(|inst| inst.print_with_state(&mut EmitState::default()))
        .collect::<Vec<_>>()
        .join(" ; ");
    if !mem_str.is_empty() {
        mem_str += " ; ";
    }

    let mem = mem.pretty_print(access_ty.bytes() as u8);
    (mem_str, mem)
}

/// Render the try-call continuation/catch suffix appended to `call` text.
fn pretty_print_try_call(info: &TryCallInfo) -> String {
    format!(
        "; b {:?}; catch [{}]",
        info.continuation,
        info.pretty_print_dests()
    )
}

impl Inst {
    /// Pretty-print this instruction as assembly-like text, using `state`
    /// for address-mode finalization.
    fn print_with_state(&self, state: &mut EmitState) -> String {
        // Assembly mnemonic for a two-/three-register integer ALU opcode.
        fn op_name(alu_op: ALUOp) -> &'static str {
            match alu_op {
                ALUOp::Add => "add",
                ALUOp::Sub => "sub",
                ALUOp::Orr => "orr",
                ALUOp::And => "and",
                ALUOp::AndS => "ands",
                ALUOp::Eor => "eor",
                ALUOp::AddS => "adds",
                ALUOp::SubS => "subs",
                ALUOp::SMulH => "smulh",
                ALUOp::UMulH => "umulh",
                ALUOp::SDiv => "sdiv",
                ALUOp::UDiv => "udiv",
                ALUOp::AndNot => "bic",
                ALUOp::OrrNot => "orn",
                ALUOp::EorNot => "eon",
                ALUOp::Extr => "extr",
                ALUOp::Lsr => "lsr",
                ALUOp::Asr => "asr",
                ALUOp::Lsl => "lsl",
                ALUOp::Adc => "adc",
                ALUOp::AdcS => "adcs",
                ALUOp::Sbc => "sbc",
                ALUOp::SbcS => "sbcs",
            }
        }

        match self {
            &Inst::Nop0 => "nop-zero-len".to_string(),
            &Inst::Nop4 => "nop".to_string(),
            &Inst::AluRRR {
                alu_op,
                size,
                rd,
                rn,
                rm,
            } => {
                let op = op_name(alu_op);
                let rd = pretty_print_ireg(rd.to_reg(), size);
                let rn = pretty_print_ireg(rn, size);
                let rm = pretty_print_ireg(rm, size);
                format!("{op} {rd}, {rn}, {rm}")
            }
            &Inst::AluRRRR {
                alu_op,
                size,
                rd,
                rn,
                rm,
                ra,
            } => {
                let (op, da_size) = match alu_op {
                    ALUOp3::MAdd => ("madd", size),
                    ALUOp3::MSub => ("msub", size),
                    ALUOp3::UMAddL => ("umaddl", OperandSize::Size64),
                    ALUOp3::SMAddL => ("smaddl", OperandSize::Size64),
                };
                let rd = pretty_print_ireg(rd.to_reg(), da_size);
                let rn = pretty_print_ireg(rn, size);
                let rm = pretty_print_ireg(rm, size);
                let ra = pretty_print_ireg(ra, da_size);

                format!("{op} {rd}, {rn}, {rm}, {ra}")
            }
            &Inst::AluRRImm12 {
                alu_op,
                size,
                rd,
                rn,
                ref imm12,
            } => {
                let op = op_name(alu_op);
                let rd = pretty_print_ireg(rd.to_reg(), size);
                let rn = pretty_print_ireg(rn, size);

                if imm12.bits == 0 && alu_op == ALUOp::Add && size.is64() {
                    // special-case MOV (used for moving into SP).
                    format!("mov {rd}, {rn}")
                } else {
                    let imm12 = imm12.pretty_print(0);
                    format!("{op} {rd}, {rn}, {imm12}")
                }
            }
            &Inst::AluRRImmLogic {
                alu_op,
                size,
                rd,
                rn,
                ref imml,
            } => {
                let op = op_name(alu_op);
                let rd = pretty_print_ireg(rd.to_reg(), size);
                let rn = pretty_print_ireg(rn, size);
                let imml = imml.pretty_print(0);
                format!("{op} {rd}, {rn}, {imml}")
            }
            &Inst::AluRRImmShift {
                alu_op,
                size,
                rd,
                rn,
                ref immshift,
            } => {
                let op = op_name(alu_op);
                let rd = pretty_print_ireg(rd.to_reg(), size);
                let rn = pretty_print_ireg(rn, size);
                let immshift = immshift.pretty_print(0);
                format!("{op} {rd}, {rn}, {immshift}")
            }
            &Inst::AluRRRShift {
                alu_op,
                size,
                rd,
                rn,
                rm,
                ref shiftop,
            } => {
                let op = op_name(alu_op);
                let rd = pretty_print_ireg(rd.to_reg(), size);
                let rn = pretty_print_ireg(rn, size);
                let rm = pretty_print_ireg(rm, size);
                let shiftop = shiftop.pretty_print(0);
                format!("{op} {rd}, {rn}, {rm}, {shiftop}")
            }
            &Inst::AluRRRExtend {
                alu_op,
                size,
                rd,
                rn,
                rm,
                ref extendop,
            } => {
                let op = op_name(alu_op);
                let rd = pretty_print_ireg(rd.to_reg(), size);
                let rn = pretty_print_ireg(rn, size);
                let rm = pretty_print_ireg(rm, size);
                let extendop = extendop.pretty_print(0);
                format!("{op} {rd}, {rn}, {rm}, {extendop}")
            }
            &Inst::BitRR { op, size, rd, rn } => {
                let op = op.op_str();
                let rd = pretty_print_ireg(rd.to_reg(), size);
                let rn = pretty_print_ireg(rn, size);
                format!("{op} {rd}, {rn}")
            }
            &Inst::ULoad8 { rd, ref mem, .. }
            | &Inst::SLoad8 { rd, ref mem, .. }
            | &Inst::ULoad16 { rd, ref mem, .. }
            | &Inst::SLoad16 { rd, ref mem, .. }
            | &Inst::ULoad32 { rd, ref mem, .. }
            | &Inst::SLoad32 { rd, ref mem, .. }
            | &Inst::ULoad64 { rd, ref mem, .. } => {
                let is_unscaled = match &mem {
                    &AMode::Unscaled { .. } => true,
                    _ => false,
                };
                let (op, size) = match (self, is_unscaled) {
                    (&Inst::ULoad8 { .. }, false) => ("ldrb", OperandSize::Size32),
                    (&Inst::ULoad8 { .. }, true) => ("ldurb", OperandSize::Size32),
                    (&Inst::SLoad8 { .. }, false) => ("ldrsb", OperandSize::Size64),
                    (&Inst::SLoad8 { ..
}, true) => ("ldursb", OperandSize::Size64),1383(&Inst::ULoad16 { .. }, false) => ("ldrh", OperandSize::Size32),1384(&Inst::ULoad16 { .. }, true) => ("ldurh", OperandSize::Size32),1385(&Inst::SLoad16 { .. }, false) => ("ldrsh", OperandSize::Size64),1386(&Inst::SLoad16 { .. }, true) => ("ldursh", OperandSize::Size64),1387(&Inst::ULoad32 { .. }, false) => ("ldr", OperandSize::Size32),1388(&Inst::ULoad32 { .. }, true) => ("ldur", OperandSize::Size32),1389(&Inst::SLoad32 { .. }, false) => ("ldrsw", OperandSize::Size64),1390(&Inst::SLoad32 { .. }, true) => ("ldursw", OperandSize::Size64),1391(&Inst::ULoad64 { .. }, false) => ("ldr", OperandSize::Size64),1392(&Inst::ULoad64 { .. }, true) => ("ldur", OperandSize::Size64),1393_ => unreachable!(),1394};13951396let rd = pretty_print_ireg(rd.to_reg(), size);1397let mem = mem.clone();1398let access_ty = self.mem_type().unwrap();1399let (mem_str, mem) = mem_finalize_for_show(&mem, access_ty, state);14001401format!("{mem_str}{op} {rd}, {mem}")1402}1403&Inst::Store8 { rd, ref mem, .. }1404| &Inst::Store16 { rd, ref mem, .. }1405| &Inst::Store32 { rd, ref mem, .. }1406| &Inst::Store64 { rd, ref mem, .. } => {1407let is_unscaled = match &mem {1408&AMode::Unscaled { .. } => true,1409_ => false,1410};1411let (op, size) = match (self, is_unscaled) {1412(&Inst::Store8 { .. }, false) => ("strb", OperandSize::Size32),1413(&Inst::Store8 { .. }, true) => ("sturb", OperandSize::Size32),1414(&Inst::Store16 { .. }, false) => ("strh", OperandSize::Size32),1415(&Inst::Store16 { .. }, true) => ("sturh", OperandSize::Size32),1416(&Inst::Store32 { .. }, false) => ("str", OperandSize::Size32),1417(&Inst::Store32 { .. }, true) => ("stur", OperandSize::Size32),1418(&Inst::Store64 { .. }, false) => ("str", OperandSize::Size64),1419(&Inst::Store64 { .. 
}, true) => ("stur", OperandSize::Size64),1420_ => unreachable!(),1421};14221423let rd = pretty_print_ireg(rd, size);1424let mem = mem.clone();1425let access_ty = self.mem_type().unwrap();1426let (mem_str, mem) = mem_finalize_for_show(&mem, access_ty, state);14271428format!("{mem_str}{op} {rd}, {mem}")1429}1430&Inst::StoreP64 {1431rt, rt2, ref mem, ..1432} => {1433let rt = pretty_print_ireg(rt, OperandSize::Size64);1434let rt2 = pretty_print_ireg(rt2, OperandSize::Size64);1435let mem = mem.clone();1436let mem = mem.pretty_print_default();1437format!("stp {rt}, {rt2}, {mem}")1438}1439&Inst::LoadP64 {1440rt, rt2, ref mem, ..1441} => {1442let rt = pretty_print_ireg(rt.to_reg(), OperandSize::Size64);1443let rt2 = pretty_print_ireg(rt2.to_reg(), OperandSize::Size64);1444let mem = mem.clone();1445let mem = mem.pretty_print_default();1446format!("ldp {rt}, {rt2}, {mem}")1447}1448&Inst::Mov { size, rd, rm } => {1449let rd = pretty_print_ireg(rd.to_reg(), size);1450let rm = pretty_print_ireg(rm, size);1451format!("mov {rd}, {rm}")1452}1453&Inst::MovFromPReg { rd, rm } => {1454let rd = pretty_print_ireg(rd.to_reg(), OperandSize::Size64);1455let rm = show_ireg_sized(rm.into(), OperandSize::Size64);1456format!("mov {rd}, {rm}")1457}1458&Inst::MovToPReg { rd, rm } => {1459let rd = show_ireg_sized(rd.into(), OperandSize::Size64);1460let rm = pretty_print_ireg(rm, OperandSize::Size64);1461format!("mov {rd}, {rm}")1462}1463&Inst::MovWide {1464op,1465rd,1466ref imm,1467size,1468} => {1469let op_str = match op {1470MoveWideOp::MovZ => "movz",1471MoveWideOp::MovN => "movn",1472};1473let rd = pretty_print_ireg(rd.to_reg(), size);1474let imm = imm.pretty_print(0);1475format!("{op_str} {rd}, {imm}")1476}1477&Inst::MovK {1478rd,1479rn,1480ref imm,1481size,1482} => {1483let rn = pretty_print_ireg(rn, size);1484let rd = pretty_print_ireg(rd.to_reg(), size);1485let imm = imm.pretty_print(0);1486format!("movk {rd}, {rn}, {imm}")1487}1488&Inst::CSel { rd, rn, rm, cond } => {1489let rd = 
pretty_print_ireg(rd.to_reg(), OperandSize::Size64);1490let rn = pretty_print_ireg(rn, OperandSize::Size64);1491let rm = pretty_print_ireg(rm, OperandSize::Size64);1492let cond = cond.pretty_print(0);1493format!("csel {rd}, {rn}, {rm}, {cond}")1494}1495&Inst::CSNeg { rd, rn, rm, cond } => {1496let rd = pretty_print_ireg(rd.to_reg(), OperandSize::Size64);1497let rn = pretty_print_ireg(rn, OperandSize::Size64);1498let rm = pretty_print_ireg(rm, OperandSize::Size64);1499let cond = cond.pretty_print(0);1500format!("csneg {rd}, {rn}, {rm}, {cond}")1501}1502&Inst::CSet { rd, cond } => {1503let rd = pretty_print_ireg(rd.to_reg(), OperandSize::Size64);1504let cond = cond.pretty_print(0);1505format!("cset {rd}, {cond}")1506}1507&Inst::CSetm { rd, cond } => {1508let rd = pretty_print_ireg(rd.to_reg(), OperandSize::Size64);1509let cond = cond.pretty_print(0);1510format!("csetm {rd}, {cond}")1511}1512&Inst::CCmp {1513size,1514rn,1515rm,1516nzcv,1517cond,1518} => {1519let rn = pretty_print_ireg(rn, size);1520let rm = pretty_print_ireg(rm, size);1521let nzcv = nzcv.pretty_print(0);1522let cond = cond.pretty_print(0);1523format!("ccmp {rn}, {rm}, {nzcv}, {cond}")1524}1525&Inst::CCmpImm {1526size,1527rn,1528imm,1529nzcv,1530cond,1531} => {1532let rn = pretty_print_ireg(rn, size);1533let imm = imm.pretty_print(0);1534let nzcv = nzcv.pretty_print(0);1535let cond = cond.pretty_print(0);1536format!("ccmp {rn}, {imm}, {nzcv}, {cond}")1537}1538&Inst::AtomicRMW {1539rs, rt, rn, ty, op, ..1540} => {1541let op = match op {1542AtomicRMWOp::Add => "ldaddal",1543AtomicRMWOp::Clr => "ldclral",1544AtomicRMWOp::Eor => "ldeoral",1545AtomicRMWOp::Set => "ldsetal",1546AtomicRMWOp::Smax => "ldsmaxal",1547AtomicRMWOp::Umax => "ldumaxal",1548AtomicRMWOp::Smin => "ldsminal",1549AtomicRMWOp::Umin => "lduminal",1550AtomicRMWOp::Swp => "swpal",1551};15521553let size = OperandSize::from_ty(ty);1554let rs = pretty_print_ireg(rs, size);1555let rt = pretty_print_ireg(rt.to_reg(), size);1556let rn = 
pretty_print_ireg(rn, OperandSize::Size64);15571558let ty_suffix = match ty {1559I8 => "b",1560I16 => "h",1561_ => "",1562};1563format!("{op}{ty_suffix} {rs}, {rt}, [{rn}]")1564}1565&Inst::AtomicRMWLoop {1566ty,1567op,1568addr,1569operand,1570oldval,1571scratch1,1572scratch2,1573..1574} => {1575let op = match op {1576AtomicRMWLoopOp::Add => "add",1577AtomicRMWLoopOp::Sub => "sub",1578AtomicRMWLoopOp::Eor => "eor",1579AtomicRMWLoopOp::Orr => "orr",1580AtomicRMWLoopOp::And => "and",1581AtomicRMWLoopOp::Nand => "nand",1582AtomicRMWLoopOp::Smin => "smin",1583AtomicRMWLoopOp::Smax => "smax",1584AtomicRMWLoopOp::Umin => "umin",1585AtomicRMWLoopOp::Umax => "umax",1586AtomicRMWLoopOp::Xchg => "xchg",1587};1588let addr = pretty_print_ireg(addr, OperandSize::Size64);1589let operand = pretty_print_ireg(operand, OperandSize::Size64);1590let oldval = pretty_print_ireg(oldval.to_reg(), OperandSize::Size64);1591let scratch1 = pretty_print_ireg(scratch1.to_reg(), OperandSize::Size64);1592let scratch2 = pretty_print_ireg(scratch2.to_reg(), OperandSize::Size64);1593format!(1594"atomic_rmw_loop_{}_{} addr={} operand={} oldval={} scratch1={} scratch2={}",1595op,1596ty.bits(),1597addr,1598operand,1599oldval,1600scratch1,1601scratch2,1602)1603}1604&Inst::AtomicCAS {1605rd, rs, rt, rn, ty, ..1606} => {1607let op = match ty {1608I8 => "casalb",1609I16 => "casalh",1610I32 | I64 => "casal",1611_ => panic!("Unsupported type: {ty}"),1612};1613let size = OperandSize::from_ty(ty);1614let rd = pretty_print_ireg(rd.to_reg(), size);1615let rs = pretty_print_ireg(rs, size);1616let rt = pretty_print_ireg(rt, size);1617let rn = pretty_print_ireg(rn, OperandSize::Size64);16181619format!("{op} {rd}, {rs}, {rt}, [{rn}]")1620}1621&Inst::AtomicCASLoop {1622ty,1623addr,1624expected,1625replacement,1626oldval,1627scratch,1628..1629} => {1630let addr = pretty_print_ireg(addr, OperandSize::Size64);1631let expected = pretty_print_ireg(expected, OperandSize::Size64);1632let replacement = 
pretty_print_ireg(replacement, OperandSize::Size64);1633let oldval = pretty_print_ireg(oldval.to_reg(), OperandSize::Size64);1634let scratch = pretty_print_ireg(scratch.to_reg(), OperandSize::Size64);1635format!(1636"atomic_cas_loop_{} addr={}, expect={}, replacement={}, oldval={}, scratch={}",1637ty.bits(),1638addr,1639expected,1640replacement,1641oldval,1642scratch,1643)1644}1645&Inst::LoadAcquire {1646access_ty, rt, rn, ..1647} => {1648let (op, ty) = match access_ty {1649I8 => ("ldarb", I32),1650I16 => ("ldarh", I32),1651I32 => ("ldar", I32),1652I64 => ("ldar", I64),1653_ => panic!("Unsupported type: {access_ty}"),1654};1655let size = OperandSize::from_ty(ty);1656let rn = pretty_print_ireg(rn, OperandSize::Size64);1657let rt = pretty_print_ireg(rt.to_reg(), size);1658format!("{op} {rt}, [{rn}]")1659}1660&Inst::StoreRelease {1661access_ty, rt, rn, ..1662} => {1663let (op, ty) = match access_ty {1664I8 => ("stlrb", I32),1665I16 => ("stlrh", I32),1666I32 => ("stlr", I32),1667I64 => ("stlr", I64),1668_ => panic!("Unsupported type: {access_ty}"),1669};1670let size = OperandSize::from_ty(ty);1671let rn = pretty_print_ireg(rn, OperandSize::Size64);1672let rt = pretty_print_ireg(rt, size);1673format!("{op} {rt}, [{rn}]")1674}1675&Inst::Fence {} => {1676format!("dmb ish")1677}1678&Inst::Csdb {} => {1679format!("csdb")1680}1681&Inst::FpuMove32 { rd, rn } => {1682let rd = pretty_print_vreg_scalar(rd.to_reg(), ScalarSize::Size32);1683let rn = pretty_print_vreg_scalar(rn, ScalarSize::Size32);1684format!("fmov {rd}, {rn}")1685}1686&Inst::FpuMove64 { rd, rn } => {1687let rd = pretty_print_vreg_scalar(rd.to_reg(), ScalarSize::Size64);1688let rn = pretty_print_vreg_scalar(rn, ScalarSize::Size64);1689format!("fmov {rd}, {rn}")1690}1691&Inst::FpuMove128 { rd, rn } => {1692let rd = pretty_print_reg(rd.to_reg());1693let rn = pretty_print_reg(rn);1694format!("mov {rd}.16b, {rn}.16b")1695}1696&Inst::FpuMoveFromVec { rd, rn, idx, size } => {1697let rd = 
pretty_print_vreg_scalar(rd.to_reg(), size.lane_size());1698let rn = pretty_print_vreg_element(rn, idx as usize, size.lane_size());1699format!("mov {rd}, {rn}")1700}1701&Inst::FpuExtend { rd, rn, size } => {1702let rd = pretty_print_vreg_scalar(rd.to_reg(), size);1703let rn = pretty_print_vreg_scalar(rn, size);1704format!("fmov {rd}, {rn}")1705}1706&Inst::FpuRR {1707fpu_op,1708size,1709rd,1710rn,1711} => {1712let op = match fpu_op {1713FPUOp1::Abs => "fabs",1714FPUOp1::Neg => "fneg",1715FPUOp1::Sqrt => "fsqrt",1716FPUOp1::Cvt32To64 | FPUOp1::Cvt64To32 => "fcvt",1717};1718let dst_size = match fpu_op {1719FPUOp1::Cvt32To64 => ScalarSize::Size64,1720FPUOp1::Cvt64To32 => ScalarSize::Size32,1721_ => size,1722};1723let rd = pretty_print_vreg_scalar(rd.to_reg(), dst_size);1724let rn = pretty_print_vreg_scalar(rn, size);1725format!("{op} {rd}, {rn}")1726}1727&Inst::FpuRRR {1728fpu_op,1729size,1730rd,1731rn,1732rm,1733} => {1734let op = match fpu_op {1735FPUOp2::Add => "fadd",1736FPUOp2::Sub => "fsub",1737FPUOp2::Mul => "fmul",1738FPUOp2::Div => "fdiv",1739FPUOp2::Max => "fmax",1740FPUOp2::Min => "fmin",1741};1742let rd = pretty_print_vreg_scalar(rd.to_reg(), size);1743let rn = pretty_print_vreg_scalar(rn, size);1744let rm = pretty_print_vreg_scalar(rm, size);1745format!("{op} {rd}, {rn}, {rm}")1746}1747&Inst::FpuRRI { fpu_op, rd, rn } => {1748let (op, imm, vector) = match fpu_op {1749FPUOpRI::UShr32(imm) => ("ushr", imm.pretty_print(0), true),1750FPUOpRI::UShr64(imm) => ("ushr", imm.pretty_print(0), false),1751};17521753let (rd, rn) = if vector {1754(1755pretty_print_vreg_vector(rd.to_reg(), VectorSize::Size32x2),1756pretty_print_vreg_vector(rn, VectorSize::Size32x2),1757)1758} else {1759(1760pretty_print_vreg_scalar(rd.to_reg(), ScalarSize::Size64),1761pretty_print_vreg_scalar(rn, ScalarSize::Size64),1762)1763};1764format!("{op} {rd}, {rn}, {imm}")1765}1766&Inst::FpuRRIMod { fpu_op, rd, ri, rn } => {1767let (op, imm, vector) = match fpu_op {1768FPUOpRIMod::Sli32(imm) => 
("sli", imm.pretty_print(0), true),1769FPUOpRIMod::Sli64(imm) => ("sli", imm.pretty_print(0), false),1770};17711772let (rd, ri, rn) = if vector {1773(1774pretty_print_vreg_vector(rd.to_reg(), VectorSize::Size32x2),1775pretty_print_vreg_vector(ri, VectorSize::Size32x2),1776pretty_print_vreg_vector(rn, VectorSize::Size32x2),1777)1778} else {1779(1780pretty_print_vreg_scalar(rd.to_reg(), ScalarSize::Size64),1781pretty_print_vreg_scalar(ri, ScalarSize::Size64),1782pretty_print_vreg_scalar(rn, ScalarSize::Size64),1783)1784};1785format!("{op} {rd}, {ri}, {rn}, {imm}")1786}1787&Inst::FpuRRRR {1788fpu_op,1789size,1790rd,1791rn,1792rm,1793ra,1794} => {1795let op = match fpu_op {1796FPUOp3::MAdd => "fmadd",1797FPUOp3::MSub => "fmsub",1798FPUOp3::NMAdd => "fnmadd",1799FPUOp3::NMSub => "fnmsub",1800};1801let rd = pretty_print_vreg_scalar(rd.to_reg(), size);1802let rn = pretty_print_vreg_scalar(rn, size);1803let rm = pretty_print_vreg_scalar(rm, size);1804let ra = pretty_print_vreg_scalar(ra, size);1805format!("{op} {rd}, {rn}, {rm}, {ra}")1806}1807&Inst::FpuCmp { size, rn, rm } => {1808let rn = pretty_print_vreg_scalar(rn, size);1809let rm = pretty_print_vreg_scalar(rm, size);1810format!("fcmp {rn}, {rm}")1811}1812&Inst::FpuLoad16 { rd, ref mem, .. } => {1813let rd = pretty_print_vreg_scalar(rd.to_reg(), ScalarSize::Size16);1814let mem = mem.clone();1815let access_ty = self.mem_type().unwrap();1816let (mem_str, mem) = mem_finalize_for_show(&mem, access_ty, state);1817format!("{mem_str}ldr {rd}, {mem}")1818}1819&Inst::FpuLoad32 { rd, ref mem, .. } => {1820let rd = pretty_print_vreg_scalar(rd.to_reg(), ScalarSize::Size32);1821let mem = mem.clone();1822let access_ty = self.mem_type().unwrap();1823let (mem_str, mem) = mem_finalize_for_show(&mem, access_ty, state);1824format!("{mem_str}ldr {rd}, {mem}")1825}1826&Inst::FpuLoad64 { rd, ref mem, .. 
} => {1827let rd = pretty_print_vreg_scalar(rd.to_reg(), ScalarSize::Size64);1828let mem = mem.clone();1829let access_ty = self.mem_type().unwrap();1830let (mem_str, mem) = mem_finalize_for_show(&mem, access_ty, state);1831format!("{mem_str}ldr {rd}, {mem}")1832}1833&Inst::FpuLoad128 { rd, ref mem, .. } => {1834let rd = pretty_print_reg(rd.to_reg());1835let rd = "q".to_string() + &rd[1..];1836let mem = mem.clone();1837let access_ty = self.mem_type().unwrap();1838let (mem_str, mem) = mem_finalize_for_show(&mem, access_ty, state);1839format!("{mem_str}ldr {rd}, {mem}")1840}1841&Inst::FpuStore16 { rd, ref mem, .. } => {1842let rd = pretty_print_vreg_scalar(rd, ScalarSize::Size16);1843let mem = mem.clone();1844let access_ty = self.mem_type().unwrap();1845let (mem_str, mem) = mem_finalize_for_show(&mem, access_ty, state);1846format!("{mem_str}str {rd}, {mem}")1847}1848&Inst::FpuStore32 { rd, ref mem, .. } => {1849let rd = pretty_print_vreg_scalar(rd, ScalarSize::Size32);1850let mem = mem.clone();1851let access_ty = self.mem_type().unwrap();1852let (mem_str, mem) = mem_finalize_for_show(&mem, access_ty, state);1853format!("{mem_str}str {rd}, {mem}")1854}1855&Inst::FpuStore64 { rd, ref mem, .. } => {1856let rd = pretty_print_vreg_scalar(rd, ScalarSize::Size64);1857let mem = mem.clone();1858let access_ty = self.mem_type().unwrap();1859let (mem_str, mem) = mem_finalize_for_show(&mem, access_ty, state);1860format!("{mem_str}str {rd}, {mem}")1861}1862&Inst::FpuStore128 { rd, ref mem, .. 
} => {1863let rd = pretty_print_reg(rd);1864let rd = "q".to_string() + &rd[1..];1865let mem = mem.clone();1866let access_ty = self.mem_type().unwrap();1867let (mem_str, mem) = mem_finalize_for_show(&mem, access_ty, state);1868format!("{mem_str}str {rd}, {mem}")1869}1870&Inst::FpuLoadP64 {1871rt, rt2, ref mem, ..1872} => {1873let rt = pretty_print_vreg_scalar(rt.to_reg(), ScalarSize::Size64);1874let rt2 = pretty_print_vreg_scalar(rt2.to_reg(), ScalarSize::Size64);1875let mem = mem.clone();1876let mem = mem.pretty_print_default();18771878format!("ldp {rt}, {rt2}, {mem}")1879}1880&Inst::FpuStoreP64 {1881rt, rt2, ref mem, ..1882} => {1883let rt = pretty_print_vreg_scalar(rt, ScalarSize::Size64);1884let rt2 = pretty_print_vreg_scalar(rt2, ScalarSize::Size64);1885let mem = mem.clone();1886let mem = mem.pretty_print_default();18871888format!("stp {rt}, {rt2}, {mem}")1889}1890&Inst::FpuLoadP128 {1891rt, rt2, ref mem, ..1892} => {1893let rt = pretty_print_vreg_scalar(rt.to_reg(), ScalarSize::Size128);1894let rt2 = pretty_print_vreg_scalar(rt2.to_reg(), ScalarSize::Size128);1895let mem = mem.clone();1896let mem = mem.pretty_print_default();18971898format!("ldp {rt}, {rt2}, {mem}")1899}1900&Inst::FpuStoreP128 {1901rt, rt2, ref mem, ..1902} => {1903let rt = pretty_print_vreg_scalar(rt, ScalarSize::Size128);1904let rt2 = pretty_print_vreg_scalar(rt2, ScalarSize::Size128);1905let mem = mem.clone();1906let mem = mem.pretty_print_default();19071908format!("stp {rt}, {rt2}, {mem}")1909}1910&Inst::FpuToInt { op, rd, rn } => {1911let (op, sizesrc, sizedest) = match op {1912FpuToIntOp::F32ToI32 => ("fcvtzs", ScalarSize::Size32, OperandSize::Size32),1913FpuToIntOp::F32ToU32 => ("fcvtzu", ScalarSize::Size32, OperandSize::Size32),1914FpuToIntOp::F32ToI64 => ("fcvtzs", ScalarSize::Size32, OperandSize::Size64),1915FpuToIntOp::F32ToU64 => ("fcvtzu", ScalarSize::Size32, OperandSize::Size64),1916FpuToIntOp::F64ToI32 => ("fcvtzs", ScalarSize::Size64, 
OperandSize::Size32),1917FpuToIntOp::F64ToU32 => ("fcvtzu", ScalarSize::Size64, OperandSize::Size32),1918FpuToIntOp::F64ToI64 => ("fcvtzs", ScalarSize::Size64, OperandSize::Size64),1919FpuToIntOp::F64ToU64 => ("fcvtzu", ScalarSize::Size64, OperandSize::Size64),1920};1921let rd = pretty_print_ireg(rd.to_reg(), sizedest);1922let rn = pretty_print_vreg_scalar(rn, sizesrc);1923format!("{op} {rd}, {rn}")1924}1925&Inst::IntToFpu { op, rd, rn } => {1926let (op, sizesrc, sizedest) = match op {1927IntToFpuOp::I32ToF32 => ("scvtf", OperandSize::Size32, ScalarSize::Size32),1928IntToFpuOp::U32ToF32 => ("ucvtf", OperandSize::Size32, ScalarSize::Size32),1929IntToFpuOp::I64ToF32 => ("scvtf", OperandSize::Size64, ScalarSize::Size32),1930IntToFpuOp::U64ToF32 => ("ucvtf", OperandSize::Size64, ScalarSize::Size32),1931IntToFpuOp::I32ToF64 => ("scvtf", OperandSize::Size32, ScalarSize::Size64),1932IntToFpuOp::U32ToF64 => ("ucvtf", OperandSize::Size32, ScalarSize::Size64),1933IntToFpuOp::I64ToF64 => ("scvtf", OperandSize::Size64, ScalarSize::Size64),1934IntToFpuOp::U64ToF64 => ("ucvtf", OperandSize::Size64, ScalarSize::Size64),1935};1936let rd = pretty_print_vreg_scalar(rd.to_reg(), sizedest);1937let rn = pretty_print_ireg(rn, sizesrc);1938format!("{op} {rd}, {rn}")1939}1940&Inst::FpuCSel16 { rd, rn, rm, cond } => {1941let rd = pretty_print_vreg_scalar(rd.to_reg(), ScalarSize::Size16);1942let rn = pretty_print_vreg_scalar(rn, ScalarSize::Size16);1943let rm = pretty_print_vreg_scalar(rm, ScalarSize::Size16);1944let cond = cond.pretty_print(0);1945format!("fcsel {rd}, {rn}, {rm}, {cond}")1946}1947&Inst::FpuCSel32 { rd, rn, rm, cond } => {1948let rd = pretty_print_vreg_scalar(rd.to_reg(), ScalarSize::Size32);1949let rn = pretty_print_vreg_scalar(rn, ScalarSize::Size32);1950let rm = pretty_print_vreg_scalar(rm, ScalarSize::Size32);1951let cond = cond.pretty_print(0);1952format!("fcsel {rd}, {rn}, {rm}, {cond}")1953}1954&Inst::FpuCSel64 { rd, rn, rm, cond } => {1955let rd = 
pretty_print_vreg_scalar(rd.to_reg(), ScalarSize::Size64);1956let rn = pretty_print_vreg_scalar(rn, ScalarSize::Size64);1957let rm = pretty_print_vreg_scalar(rm, ScalarSize::Size64);1958let cond = cond.pretty_print(0);1959format!("fcsel {rd}, {rn}, {rm}, {cond}")1960}1961&Inst::FpuRound { op, rd, rn } => {1962let (inst, size) = match op {1963FpuRoundMode::Minus32 => ("frintm", ScalarSize::Size32),1964FpuRoundMode::Minus64 => ("frintm", ScalarSize::Size64),1965FpuRoundMode::Plus32 => ("frintp", ScalarSize::Size32),1966FpuRoundMode::Plus64 => ("frintp", ScalarSize::Size64),1967FpuRoundMode::Zero32 => ("frintz", ScalarSize::Size32),1968FpuRoundMode::Zero64 => ("frintz", ScalarSize::Size64),1969FpuRoundMode::Nearest32 => ("frintn", ScalarSize::Size32),1970FpuRoundMode::Nearest64 => ("frintn", ScalarSize::Size64),1971};1972let rd = pretty_print_vreg_scalar(rd.to_reg(), size);1973let rn = pretty_print_vreg_scalar(rn, size);1974format!("{inst} {rd}, {rn}")1975}1976&Inst::MovToFpu { rd, rn, size } => {1977let operand_size = size.operand_size();1978let rd = pretty_print_vreg_scalar(rd.to_reg(), size);1979let rn = pretty_print_ireg(rn, operand_size);1980format!("fmov {rd}, {rn}")1981}1982&Inst::FpuMoveFPImm { rd, imm, size } => {1983let imm = imm.pretty_print(0);1984let rd = pretty_print_vreg_scalar(rd.to_reg(), size);19851986format!("fmov {rd}, {imm}")1987}1988&Inst::MovToVec {1989rd,1990ri,1991rn,1992idx,1993size,1994} => {1995let rd = pretty_print_vreg_element(rd.to_reg(), idx as usize, size.lane_size());1996let ri = pretty_print_vreg_element(ri, idx as usize, size.lane_size());1997let rn = pretty_print_ireg(rn, size.operand_size());1998format!("mov {rd}, {ri}, {rn}")1999}2000&Inst::MovFromVec { rd, rn, idx, size } => {2001let op = match size {2002ScalarSize::Size8 => "umov",2003ScalarSize::Size16 => "umov",2004ScalarSize::Size32 => "mov",2005ScalarSize::Size64 => "mov",2006_ => unimplemented!(),2007};2008let rd = pretty_print_ireg(rd.to_reg(), 
size.operand_size());2009let rn = pretty_print_vreg_element(rn, idx as usize, size);2010format!("{op} {rd}, {rn}")2011}2012&Inst::MovFromVecSigned {2013rd,2014rn,2015idx,2016size,2017scalar_size,2018} => {2019let rd = pretty_print_ireg(rd.to_reg(), scalar_size);2020let rn = pretty_print_vreg_element(rn, idx as usize, size.lane_size());2021format!("smov {rd}, {rn}")2022}2023&Inst::VecDup { rd, rn, size } => {2024let rd = pretty_print_vreg_vector(rd.to_reg(), size);2025let rn = pretty_print_ireg(rn, size.operand_size());2026format!("dup {rd}, {rn}")2027}2028&Inst::VecDupFromFpu { rd, rn, size, lane } => {2029let rd = pretty_print_vreg_vector(rd.to_reg(), size);2030let rn = pretty_print_vreg_element(rn, lane.into(), size.lane_size());2031format!("dup {rd}, {rn}")2032}2033&Inst::VecDupFPImm { rd, imm, size } => {2034let imm = imm.pretty_print(0);2035let rd = pretty_print_vreg_vector(rd.to_reg(), size);20362037format!("fmov {rd}, {imm}")2038}2039&Inst::VecDupImm {2040rd,2041imm,2042invert,2043size,2044} => {2045let imm = imm.pretty_print(0);2046let op = if invert { "mvni" } else { "movi" };2047let rd = pretty_print_vreg_vector(rd.to_reg(), size);20482049format!("{op} {rd}, {imm}")2050}2051&Inst::VecExtend {2052t,2053rd,2054rn,2055high_half,2056lane_size,2057} => {2058let vec64 = VectorSize::from_lane_size(lane_size.narrow(), false);2059let vec128 = VectorSize::from_lane_size(lane_size.narrow(), true);2060let rd_size = VectorSize::from_lane_size(lane_size, true);2061let (op, rn_size) = match (t, high_half) {2062(VecExtendOp::Sxtl, false) => ("sxtl", vec64),2063(VecExtendOp::Sxtl, true) => ("sxtl2", vec128),2064(VecExtendOp::Uxtl, false) => ("uxtl", vec64),2065(VecExtendOp::Uxtl, true) => ("uxtl2", vec128),2066};2067let rd = pretty_print_vreg_vector(rd.to_reg(), rd_size);2068let rn = pretty_print_vreg_vector(rn, rn_size);2069format!("{op} {rd}, {rn}")2070}2071&Inst::VecMovElement {2072rd,2073ri,2074rn,2075dest_idx,2076src_idx,2077size,2078} => {2079let rd 
=2080pretty_print_vreg_element(rd.to_reg(), dest_idx as usize, size.lane_size());2081let ri = pretty_print_vreg_element(ri, dest_idx as usize, size.lane_size());2082let rn = pretty_print_vreg_element(rn, src_idx as usize, size.lane_size());2083format!("mov {rd}, {ri}, {rn}")2084}2085&Inst::VecRRLong {2086op,2087rd,2088rn,2089high_half,2090} => {2091let (op, rd_size, size, suffix) = match (op, high_half) {2092(VecRRLongOp::Fcvtl16, false) => {2093("fcvtl", VectorSize::Size32x4, VectorSize::Size16x4, "")2094}2095(VecRRLongOp::Fcvtl16, true) => {2096("fcvtl2", VectorSize::Size32x4, VectorSize::Size16x8, "")2097}2098(VecRRLongOp::Fcvtl32, false) => {2099("fcvtl", VectorSize::Size64x2, VectorSize::Size32x2, "")2100}2101(VecRRLongOp::Fcvtl32, true) => {2102("fcvtl2", VectorSize::Size64x2, VectorSize::Size32x4, "")2103}2104(VecRRLongOp::Shll8, false) => {2105("shll", VectorSize::Size16x8, VectorSize::Size8x8, ", #8")2106}2107(VecRRLongOp::Shll8, true) => {2108("shll2", VectorSize::Size16x8, VectorSize::Size8x16, ", #8")2109}2110(VecRRLongOp::Shll16, false) => {2111("shll", VectorSize::Size32x4, VectorSize::Size16x4, ", #16")2112}2113(VecRRLongOp::Shll16, true) => {2114("shll2", VectorSize::Size32x4, VectorSize::Size16x8, ", #16")2115}2116(VecRRLongOp::Shll32, false) => {2117("shll", VectorSize::Size64x2, VectorSize::Size32x2, ", #32")2118}2119(VecRRLongOp::Shll32, true) => {2120("shll2", VectorSize::Size64x2, VectorSize::Size32x4, ", #32")2121}2122};2123let rd = pretty_print_vreg_vector(rd.to_reg(), rd_size);2124let rn = pretty_print_vreg_vector(rn, size);21252126format!("{op} {rd}, {rn}{suffix}")2127}2128&Inst::VecRRNarrowLow {2129op,2130rd,2131rn,2132lane_size,2133..2134}2135| &Inst::VecRRNarrowHigh {2136op,2137rd,2138rn,2139lane_size,2140..2141} => {2142let vec64 = VectorSize::from_lane_size(lane_size, false);2143let vec128 = VectorSize::from_lane_size(lane_size, true);2144let rn_size = VectorSize::from_lane_size(lane_size.widen(), true);2145let high_half = match self 
{2146&Inst::VecRRNarrowLow { .. } => false,2147&Inst::VecRRNarrowHigh { .. } => true,2148_ => unreachable!(),2149};2150let (op, rd_size) = match (op, high_half) {2151(VecRRNarrowOp::Xtn, false) => ("xtn", vec64),2152(VecRRNarrowOp::Xtn, true) => ("xtn2", vec128),2153(VecRRNarrowOp::Sqxtn, false) => ("sqxtn", vec64),2154(VecRRNarrowOp::Sqxtn, true) => ("sqxtn2", vec128),2155(VecRRNarrowOp::Sqxtun, false) => ("sqxtun", vec64),2156(VecRRNarrowOp::Sqxtun, true) => ("sqxtun2", vec128),2157(VecRRNarrowOp::Uqxtn, false) => ("uqxtn", vec64),2158(VecRRNarrowOp::Uqxtn, true) => ("uqxtn2", vec128),2159(VecRRNarrowOp::Fcvtn, false) => ("fcvtn", vec64),2160(VecRRNarrowOp::Fcvtn, true) => ("fcvtn2", vec128),2161};2162let rn = pretty_print_vreg_vector(rn, rn_size);2163let rd = pretty_print_vreg_vector(rd.to_reg(), rd_size);2164let ri = match self {2165&Inst::VecRRNarrowLow { .. } => "".to_string(),2166&Inst::VecRRNarrowHigh { ri, .. } => {2167format!("{}, ", pretty_print_vreg_vector(ri, rd_size))2168}2169_ => unreachable!(),2170};21712172format!("{op} {rd}, {ri}{rn}")2173}2174&Inst::VecRRPair { op, rd, rn } => {2175let op = match op {2176VecPairOp::Addp => "addp",2177};2178let rd = pretty_print_vreg_scalar(rd.to_reg(), ScalarSize::Size64);2179let rn = pretty_print_vreg_vector(rn, VectorSize::Size64x2);21802181format!("{op} {rd}, {rn}")2182}2183&Inst::VecRRPairLong { op, rd, rn } => {2184let (op, dest, src) = match op {2185VecRRPairLongOp::Saddlp8 => {2186("saddlp", VectorSize::Size16x8, VectorSize::Size8x16)2187}2188VecRRPairLongOp::Saddlp16 => {2189("saddlp", VectorSize::Size32x4, VectorSize::Size16x8)2190}2191VecRRPairLongOp::Uaddlp8 => {2192("uaddlp", VectorSize::Size16x8, VectorSize::Size8x16)2193}2194VecRRPairLongOp::Uaddlp16 => {2195("uaddlp", VectorSize::Size32x4, VectorSize::Size16x8)2196}2197};2198let rd = pretty_print_vreg_vector(rd.to_reg(), dest);2199let rn = pretty_print_vreg_vector(rn, src);22002201format!("{op} {rd}, {rn}")2202}2203&Inst::VecRRR 
{2204rd,2205rn,2206rm,2207alu_op,2208size,2209} => {2210let (op, size) = match alu_op {2211VecALUOp::Sqadd => ("sqadd", size),2212VecALUOp::Uqadd => ("uqadd", size),2213VecALUOp::Sqsub => ("sqsub", size),2214VecALUOp::Uqsub => ("uqsub", size),2215VecALUOp::Cmeq => ("cmeq", size),2216VecALUOp::Cmge => ("cmge", size),2217VecALUOp::Cmgt => ("cmgt", size),2218VecALUOp::Cmhs => ("cmhs", size),2219VecALUOp::Cmhi => ("cmhi", size),2220VecALUOp::Fcmeq => ("fcmeq", size),2221VecALUOp::Fcmgt => ("fcmgt", size),2222VecALUOp::Fcmge => ("fcmge", size),2223VecALUOp::Umaxp => ("umaxp", size),2224VecALUOp::Add => ("add", size),2225VecALUOp::Sub => ("sub", size),2226VecALUOp::Mul => ("mul", size),2227VecALUOp::Sshl => ("sshl", size),2228VecALUOp::Ushl => ("ushl", size),2229VecALUOp::Umin => ("umin", size),2230VecALUOp::Smin => ("smin", size),2231VecALUOp::Umax => ("umax", size),2232VecALUOp::Smax => ("smax", size),2233VecALUOp::Urhadd => ("urhadd", size),2234VecALUOp::Fadd => ("fadd", size),2235VecALUOp::Fsub => ("fsub", size),2236VecALUOp::Fdiv => ("fdiv", size),2237VecALUOp::Fmax => ("fmax", size),2238VecALUOp::Fmin => ("fmin", size),2239VecALUOp::Fmul => ("fmul", size),2240VecALUOp::Addp => ("addp", size),2241VecALUOp::Zip1 => ("zip1", size),2242VecALUOp::Zip2 => ("zip2", size),2243VecALUOp::Sqrdmulh => ("sqrdmulh", size),2244VecALUOp::Uzp1 => ("uzp1", size),2245VecALUOp::Uzp2 => ("uzp2", size),2246VecALUOp::Trn1 => ("trn1", size),2247VecALUOp::Trn2 => ("trn2", size),22482249// Lane division does not affect bitwise operations.2250// However, when printing, use 8-bit lane division to conform to ARM formatting.2251VecALUOp::And => ("and", size.as_scalar8_vector()),2252VecALUOp::Bic => ("bic", size.as_scalar8_vector()),2253VecALUOp::Orr => ("orr", size.as_scalar8_vector()),2254VecALUOp::Orn => ("orn", size.as_scalar8_vector()),2255VecALUOp::Eor => ("eor", size.as_scalar8_vector()),2256};2257let rd = pretty_print_vreg_vector(rd.to_reg(), size);2258let rn = 
pretty_print_vreg_vector(rn, size);2259let rm = pretty_print_vreg_vector(rm, size);2260format!("{op} {rd}, {rn}, {rm}")2261}2262&Inst::VecRRRMod {2263rd,2264ri,2265rn,2266rm,2267alu_op,2268size,2269} => {2270let (op, size) = match alu_op {2271VecALUModOp::Bsl => ("bsl", VectorSize::Size8x16),2272VecALUModOp::Fmla => ("fmla", size),2273VecALUModOp::Fmls => ("fmls", size),2274};2275let rd = pretty_print_vreg_vector(rd.to_reg(), size);2276let ri = pretty_print_vreg_vector(ri, size);2277let rn = pretty_print_vreg_vector(rn, size);2278let rm = pretty_print_vreg_vector(rm, size);2279format!("{op} {rd}, {ri}, {rn}, {rm}")2280}2281&Inst::VecFmlaElem {2282rd,2283ri,2284rn,2285rm,2286alu_op,2287size,2288idx,2289} => {2290let (op, size) = match alu_op {2291VecALUModOp::Fmla => ("fmla", size),2292VecALUModOp::Fmls => ("fmls", size),2293_ => unreachable!(),2294};2295let rd = pretty_print_vreg_vector(rd.to_reg(), size);2296let ri = pretty_print_vreg_vector(ri, size);2297let rn = pretty_print_vreg_vector(rn, size);2298let rm = pretty_print_vreg_element(rm, idx.into(), size.lane_size());2299format!("{op} {rd}, {ri}, {rn}, {rm}")2300}2301&Inst::VecRRRLong {2302rd,2303rn,2304rm,2305alu_op,2306high_half,2307} => {2308let (op, dest_size, src_size) = match (alu_op, high_half) {2309(VecRRRLongOp::Smull8, false) => {2310("smull", VectorSize::Size16x8, VectorSize::Size8x8)2311}2312(VecRRRLongOp::Smull8, true) => {2313("smull2", VectorSize::Size16x8, VectorSize::Size8x16)2314}2315(VecRRRLongOp::Smull16, false) => {2316("smull", VectorSize::Size32x4, VectorSize::Size16x4)2317}2318(VecRRRLongOp::Smull16, true) => {2319("smull2", VectorSize::Size32x4, VectorSize::Size16x8)2320}2321(VecRRRLongOp::Smull32, false) => {2322("smull", VectorSize::Size64x2, VectorSize::Size32x2)2323}2324(VecRRRLongOp::Smull32, true) => {2325("smull2", VectorSize::Size64x2, VectorSize::Size32x4)2326}2327(VecRRRLongOp::Umull8, false) => {2328("umull", VectorSize::Size16x8, 
VectorSize::Size8x8)2329}2330(VecRRRLongOp::Umull8, true) => {2331("umull2", VectorSize::Size16x8, VectorSize::Size8x16)2332}2333(VecRRRLongOp::Umull16, false) => {2334("umull", VectorSize::Size32x4, VectorSize::Size16x4)2335}2336(VecRRRLongOp::Umull16, true) => {2337("umull2", VectorSize::Size32x4, VectorSize::Size16x8)2338}2339(VecRRRLongOp::Umull32, false) => {2340("umull", VectorSize::Size64x2, VectorSize::Size32x2)2341}2342(VecRRRLongOp::Umull32, true) => {2343("umull2", VectorSize::Size64x2, VectorSize::Size32x4)2344}2345};2346let rd = pretty_print_vreg_vector(rd.to_reg(), dest_size);2347let rn = pretty_print_vreg_vector(rn, src_size);2348let rm = pretty_print_vreg_vector(rm, src_size);2349format!("{op} {rd}, {rn}, {rm}")2350}2351&Inst::VecRRRLongMod {2352rd,2353ri,2354rn,2355rm,2356alu_op,2357high_half,2358} => {2359let (op, dest_size, src_size) = match (alu_op, high_half) {2360(VecRRRLongModOp::Umlal8, false) => {2361("umlal", VectorSize::Size16x8, VectorSize::Size8x8)2362}2363(VecRRRLongModOp::Umlal8, true) => {2364("umlal2", VectorSize::Size16x8, VectorSize::Size8x16)2365}2366(VecRRRLongModOp::Umlal16, false) => {2367("umlal", VectorSize::Size32x4, VectorSize::Size16x4)2368}2369(VecRRRLongModOp::Umlal16, true) => {2370("umlal2", VectorSize::Size32x4, VectorSize::Size16x8)2371}2372(VecRRRLongModOp::Umlal32, false) => {2373("umlal", VectorSize::Size64x2, VectorSize::Size32x2)2374}2375(VecRRRLongModOp::Umlal32, true) => {2376("umlal2", VectorSize::Size64x2, VectorSize::Size32x4)2377}2378};2379let rd = pretty_print_vreg_vector(rd.to_reg(), dest_size);2380let ri = pretty_print_vreg_vector(ri, dest_size);2381let rn = pretty_print_vreg_vector(rn, src_size);2382let rm = pretty_print_vreg_vector(rm, src_size);2383format!("{op} {rd}, {ri}, {rn}, {rm}")2384}2385&Inst::VecMisc { op, rd, rn, size } => {2386let (op, size, suffix) = match op {2387VecMisc2::Neg => ("neg", size, ""),2388VecMisc2::Abs => ("abs", size, ""),2389VecMisc2::Fabs => ("fabs", size, 
""),2390VecMisc2::Fneg => ("fneg", size, ""),2391VecMisc2::Fsqrt => ("fsqrt", size, ""),2392VecMisc2::Rev16 => ("rev16", size, ""),2393VecMisc2::Rev32 => ("rev32", size, ""),2394VecMisc2::Rev64 => ("rev64", size, ""),2395VecMisc2::Fcvtzs => ("fcvtzs", size, ""),2396VecMisc2::Fcvtzu => ("fcvtzu", size, ""),2397VecMisc2::Scvtf => ("scvtf", size, ""),2398VecMisc2::Ucvtf => ("ucvtf", size, ""),2399VecMisc2::Frintn => ("frintn", size, ""),2400VecMisc2::Frintz => ("frintz", size, ""),2401VecMisc2::Frintm => ("frintm", size, ""),2402VecMisc2::Frintp => ("frintp", size, ""),2403VecMisc2::Cnt => ("cnt", size, ""),2404VecMisc2::Cmeq0 => ("cmeq", size, ", #0"),2405VecMisc2::Cmge0 => ("cmge", size, ", #0"),2406VecMisc2::Cmgt0 => ("cmgt", size, ", #0"),2407VecMisc2::Cmle0 => ("cmle", size, ", #0"),2408VecMisc2::Cmlt0 => ("cmlt", size, ", #0"),2409VecMisc2::Fcmeq0 => ("fcmeq", size, ", #0.0"),2410VecMisc2::Fcmge0 => ("fcmge", size, ", #0.0"),2411VecMisc2::Fcmgt0 => ("fcmgt", size, ", #0.0"),2412VecMisc2::Fcmle0 => ("fcmle", size, ", #0.0"),2413VecMisc2::Fcmlt0 => ("fcmlt", size, ", #0.0"),24142415// Lane division does not affect bitwise operations.2416// However, when printing, use 8-bit lane division to conform to ARM formatting.2417VecMisc2::Not => ("mvn", size.as_scalar8_vector(), ""),2418};2419let rd = pretty_print_vreg_vector(rd.to_reg(), size);2420let rn = pretty_print_vreg_vector(rn, size);2421format!("{op} {rd}, {rn}{suffix}")2422}2423&Inst::VecLanes { op, rd, rn, size } => {2424let op = match op {2425VecLanesOp::Uminv => "uminv",2426VecLanesOp::Addv => "addv",2427};2428let rd = pretty_print_vreg_scalar(rd.to_reg(), size.lane_size());2429let rn = pretty_print_vreg_vector(rn, size);2430format!("{op} {rd}, {rn}")2431}2432&Inst::VecShiftImm {2433op,2434rd,2435rn,2436size,2437imm,2438} => {2439let op = match op {2440VecShiftImmOp::Shl => "shl",2441VecShiftImmOp::Ushr => "ushr",2442VecShiftImmOp::Sshr => "sshr",2443};2444let rd = pretty_print_vreg_vector(rd.to_reg(), 
size);2445let rn = pretty_print_vreg_vector(rn, size);2446format!("{op} {rd}, {rn}, #{imm}")2447}2448&Inst::VecShiftImmMod {2449op,2450rd,2451ri,2452rn,2453size,2454imm,2455} => {2456let op = match op {2457VecShiftImmModOp::Sli => "sli",2458};2459let rd = pretty_print_vreg_vector(rd.to_reg(), size);2460let ri = pretty_print_vreg_vector(ri, size);2461let rn = pretty_print_vreg_vector(rn, size);2462format!("{op} {rd}, {ri}, {rn}, #{imm}")2463}2464&Inst::VecExtract { rd, rn, rm, imm4 } => {2465let rd = pretty_print_vreg_vector(rd.to_reg(), VectorSize::Size8x16);2466let rn = pretty_print_vreg_vector(rn, VectorSize::Size8x16);2467let rm = pretty_print_vreg_vector(rm, VectorSize::Size8x16);2468format!("ext {rd}, {rn}, {rm}, #{imm4}")2469}2470&Inst::VecTbl { rd, rn, rm } => {2471let rn = pretty_print_vreg_vector(rn, VectorSize::Size8x16);2472let rm = pretty_print_vreg_vector(rm, VectorSize::Size8x16);2473let rd = pretty_print_vreg_vector(rd.to_reg(), VectorSize::Size8x16);2474format!("tbl {rd}, {{ {rn} }}, {rm}")2475}2476&Inst::VecTblExt { rd, ri, rn, rm } => {2477let rn = pretty_print_vreg_vector(rn, VectorSize::Size8x16);2478let rm = pretty_print_vreg_vector(rm, VectorSize::Size8x16);2479let rd = pretty_print_vreg_vector(rd.to_reg(), VectorSize::Size8x16);2480let ri = pretty_print_vreg_vector(ri, VectorSize::Size8x16);2481format!("tbx {rd}, {ri}, {{ {rn} }}, {rm}")2482}2483&Inst::VecTbl2 { rd, rn, rn2, rm } => {2484let rn = pretty_print_vreg_vector(rn, VectorSize::Size8x16);2485let rn2 = pretty_print_vreg_vector(rn2, VectorSize::Size8x16);2486let rm = pretty_print_vreg_vector(rm, VectorSize::Size8x16);2487let rd = pretty_print_vreg_vector(rd.to_reg(), VectorSize::Size8x16);2488format!("tbl {rd}, {{ {rn}, {rn2} }}, {rm}")2489}2490&Inst::VecTbl2Ext {2491rd,2492ri,2493rn,2494rn2,2495rm,2496} => {2497let rn = pretty_print_vreg_vector(rn, VectorSize::Size8x16);2498let rn2 = pretty_print_vreg_vector(rn2, VectorSize::Size8x16);2499let rm = pretty_print_vreg_vector(rm, 
VectorSize::Size8x16);2500let rd = pretty_print_vreg_vector(rd.to_reg(), VectorSize::Size8x16);2501let ri = pretty_print_vreg_vector(ri, VectorSize::Size8x16);2502format!("tbx {rd}, {ri}, {{ {rn}, {rn2} }}, {rm}")2503}2504&Inst::VecLoadReplicate { rd, rn, size, .. } => {2505let rd = pretty_print_vreg_vector(rd.to_reg(), size);2506let rn = pretty_print_reg(rn);25072508format!("ld1r {{ {rd} }}, [{rn}]")2509}2510&Inst::VecCSel { rd, rn, rm, cond } => {2511let rd = pretty_print_vreg_vector(rd.to_reg(), VectorSize::Size8x16);2512let rn = pretty_print_vreg_vector(rn, VectorSize::Size8x16);2513let rm = pretty_print_vreg_vector(rm, VectorSize::Size8x16);2514let cond = cond.pretty_print(0);2515format!("vcsel {rd}, {rn}, {rm}, {cond} (if-then-else diamond)")2516}2517&Inst::MovToNZCV { rn } => {2518let rn = pretty_print_reg(rn);2519format!("msr nzcv, {rn}")2520}2521&Inst::MovFromNZCV { rd } => {2522let rd = pretty_print_reg(rd.to_reg());2523format!("mrs {rd}, nzcv")2524}2525&Inst::Extend {2526rd,2527rn,2528signed: false,2529from_bits: 1,2530..2531} => {2532let rd = pretty_print_ireg(rd.to_reg(), OperandSize::Size32);2533let rn = pretty_print_ireg(rn, OperandSize::Size32);2534format!("and {rd}, {rn}, #1")2535}2536&Inst::Extend {2537rd,2538rn,2539signed: false,2540from_bits: 32,2541to_bits: 64,2542} => {2543// The case of a zero extension from 32 to 64 bits, is implemented2544// with a "mov" to a 32-bit (W-reg) dest, because this zeroes2545// the top 32 bits.2546let rd = pretty_print_ireg(rd.to_reg(), OperandSize::Size32);2547let rn = pretty_print_ireg(rn, OperandSize::Size32);2548format!("mov {rd}, {rn}")2549}2550&Inst::Extend {2551rd,2552rn,2553signed,2554from_bits,2555to_bits,2556} => {2557assert!(from_bits <= to_bits);2558let op = match (signed, from_bits) {2559(false, 8) => "uxtb",2560(true, 8) => "sxtb",2561(false, 16) => "uxth",2562(true, 16) => "sxth",2563(true, 32) => "sxtw",2564(true, _) => "sbfx",2565(false, _) => "ubfx",2566};2567if op == "sbfx" || op == "ubfx" 
{2568let dest_size = OperandSize::from_bits(to_bits);2569let rd = pretty_print_ireg(rd.to_reg(), dest_size);2570let rn = pretty_print_ireg(rn, dest_size);2571format!("{op} {rd}, {rn}, #0, #{from_bits}")2572} else {2573let dest_size = if signed {2574OperandSize::from_bits(to_bits)2575} else {2576OperandSize::Size322577};2578let rd = pretty_print_ireg(rd.to_reg(), dest_size);2579let rn = pretty_print_ireg(rn, OperandSize::from_bits(from_bits));2580format!("{op} {rd}, {rn}")2581}2582}2583&Inst::Call { ref info } => {2584let try_call = info2585.try_call_info2586.as_ref()2587.map(|tci| pretty_print_try_call(tci))2588.unwrap_or_default();2589format!("bl 0{try_call}")2590}2591&Inst::CallInd { ref info } => {2592let rn = pretty_print_reg(info.dest);2593let try_call = info2594.try_call_info2595.as_ref()2596.map(|tci| pretty_print_try_call(tci))2597.unwrap_or_default();2598format!("blr {rn}{try_call}")2599}2600&Inst::ReturnCall { ref info } => {2601let mut s = format!(2602"return_call {:?} new_stack_arg_size:{}",2603info.dest, info.new_stack_arg_size2604);2605for ret in &info.uses {2606let preg = pretty_print_reg(ret.preg);2607let vreg = pretty_print_reg(ret.vreg);2608write!(&mut s, " {vreg}={preg}").unwrap();2609}2610s2611}2612&Inst::ReturnCallInd { ref info } => {2613let callee = pretty_print_reg(info.dest);2614let mut s = format!(2615"return_call_ind {callee} new_stack_arg_size:{}",2616info.new_stack_arg_size2617);2618for ret in &info.uses {2619let preg = pretty_print_reg(ret.preg);2620let vreg = pretty_print_reg(ret.vreg);2621write!(&mut s, " {vreg}={preg}").unwrap();2622}2623s2624}2625&Inst::Args { ref args } => {2626let mut s = "args".to_string();2627for arg in args {2628let preg = pretty_print_reg(arg.preg);2629let def = pretty_print_reg(arg.vreg.to_reg());2630write!(&mut s, " {def}={preg}").unwrap();2631}2632s2633}2634&Inst::Rets { ref rets } => {2635let mut s = "rets".to_string();2636for ret in rets {2637let preg = pretty_print_reg(ret.preg);2638let vreg = 
pretty_print_reg(ret.vreg);2639write!(&mut s, " {vreg}={preg}").unwrap();2640}2641s2642}2643&Inst::Ret {} => "ret".to_string(),2644&Inst::AuthenticatedRet { key, is_hint } => {2645let key = match key {2646APIKey::AZ => "az",2647APIKey::BZ => "bz",2648APIKey::ASP => "asp",2649APIKey::BSP => "bsp",2650};2651match is_hint {2652false => format!("reta{key}"),2653true => format!("auti{key} ; ret"),2654}2655}2656&Inst::Jump { ref dest } => {2657let dest = dest.pretty_print(0);2658format!("b {dest}")2659}2660&Inst::CondBr {2661ref taken,2662ref not_taken,2663ref kind,2664} => {2665let taken = taken.pretty_print(0);2666let not_taken = not_taken.pretty_print(0);2667match kind {2668&CondBrKind::Zero(reg, size) => {2669let reg = pretty_print_reg_sized(reg, size);2670format!("cbz {reg}, {taken} ; b {not_taken}")2671}2672&CondBrKind::NotZero(reg, size) => {2673let reg = pretty_print_reg_sized(reg, size);2674format!("cbnz {reg}, {taken} ; b {not_taken}")2675}2676&CondBrKind::Cond(c) => {2677let c = c.pretty_print(0);2678format!("b.{c} {taken} ; b {not_taken}")2679}2680}2681}2682&Inst::TestBitAndBranch {2683kind,2684ref taken,2685ref not_taken,2686rn,2687bit,2688} => {2689let cond = match kind {2690TestBitAndBranchKind::Z => "z",2691TestBitAndBranchKind::NZ => "nz",2692};2693let taken = taken.pretty_print(0);2694let not_taken = not_taken.pretty_print(0);2695let rn = pretty_print_reg(rn);2696format!("tb{cond} {rn}, #{bit}, {taken} ; b {not_taken}")2697}2698&Inst::IndirectBr { rn, .. } => {2699let rn = pretty_print_reg(rn);2700format!("br {rn}")2701}2702&Inst::Brk => "brk #0xf000".to_string(),2703&Inst::Udf { .. 
} => "udf #0xc11f".to_string(),2704&Inst::TrapIf {2705ref kind,2706trap_code,2707} => match kind {2708&CondBrKind::Zero(reg, size) => {2709let reg = pretty_print_reg_sized(reg, size);2710format!("cbz {reg}, #trap={trap_code}")2711}2712&CondBrKind::NotZero(reg, size) => {2713let reg = pretty_print_reg_sized(reg, size);2714format!("cbnz {reg}, #trap={trap_code}")2715}2716&CondBrKind::Cond(c) => {2717let c = c.pretty_print(0);2718format!("b.{c} #trap={trap_code}")2719}2720},2721&Inst::Adr { rd, off } => {2722let rd = pretty_print_reg(rd.to_reg());2723format!("adr {rd}, pc+{off}")2724}2725&Inst::Adrp { rd, off } => {2726let rd = pretty_print_reg(rd.to_reg());2727// This instruction addresses 4KiB pages, so multiply it by the page size.2728let byte_offset = off * 4096;2729format!("adrp {rd}, pc+{byte_offset}")2730}2731&Inst::Word4 { data } => format!("data.i32 {data}"),2732&Inst::Word8 { data } => format!("data.i64 {data}"),2733&Inst::JTSequence {2734default,2735ref targets,2736ridx,2737rtmp1,2738rtmp2,2739..2740} => {2741let ridx = pretty_print_reg(ridx);2742let rtmp1 = pretty_print_reg(rtmp1.to_reg());2743let rtmp2 = pretty_print_reg(rtmp2.to_reg());2744let default_target = BranchTarget::Label(default).pretty_print(0);2745format!(2746concat!(2747"b.hs {} ; ",2748"csel {}, xzr, {}, hs ; ",2749"csdb ; ",2750"adr {}, pc+16 ; ",2751"ldrsw {}, [{}, {}, uxtw #2] ; ",2752"add {}, {}, {} ; ",2753"br {} ; ",2754"jt_entries {:?}"2755),2756default_target,2757rtmp2,2758ridx,2759rtmp1,2760rtmp2,2761rtmp1,2762rtmp2,2763rtmp1,2764rtmp1,2765rtmp2,2766rtmp1,2767targets2768)2769}2770&Inst::LoadExtNameGot { rd, ref name } => {2771let rd = pretty_print_reg(rd.to_reg());2772format!("load_ext_name_got {rd}, {name:?}")2773}2774&Inst::LoadExtNameNear {2775rd,2776ref name,2777offset,2778} => {2779let rd = pretty_print_reg(rd.to_reg());2780format!("load_ext_name_near {rd}, {name:?}+{offset}")2781}2782&Inst::LoadExtNameFar {2783rd,2784ref name,2785offset,2786} => {2787let rd = 
pretty_print_reg(rd.to_reg());2788format!("load_ext_name_far {rd}, {name:?}+{offset}")2789}2790&Inst::LoadAddr { rd, ref mem } => {2791// TODO: we really should find a better way to avoid duplication of2792// this logic between `emit()` and `show_rru()` -- a separate 1-to-N2793// expansion stage (i.e., legalization, but without the slow edit-in-place2794// of the existing legalization framework).2795let mem = mem.clone();2796let (mem_insts, mem) = mem_finalize(None, &mem, I8, state);2797let mut ret = String::new();2798for inst in mem_insts.into_iter() {2799ret.push_str(&inst.print_with_state(&mut EmitState::default()));2800}2801let (reg, index_reg, offset) = match mem {2802AMode::RegExtended { rn, rm, extendop } => (rn, Some((rm, extendop)), 0),2803AMode::Unscaled { rn, simm9 } => (rn, None, simm9.value()),2804AMode::UnsignedOffset { rn, uimm12 } => (rn, None, uimm12.value() as i32),2805_ => panic!("Unsupported case for LoadAddr: {mem:?}"),2806};2807let abs_offset = if offset < 0 {2808-offset as u642809} else {2810offset as u642811};2812let alu_op = if offset < 0 { ALUOp::Sub } else { ALUOp::Add };28132814if let Some((idx, extendop)) = index_reg {2815let add = Inst::AluRRRExtend {2816alu_op: ALUOp::Add,2817size: OperandSize::Size64,2818rd,2819rn: reg,2820rm: idx,2821extendop,2822};28232824ret.push_str(&add.print_with_state(&mut EmitState::default()));2825} else if offset == 0 {2826let mov = Inst::gen_move(rd, reg, I64);2827ret.push_str(&mov.print_with_state(&mut EmitState::default()));2828} else if let Some(imm12) = Imm12::maybe_from_u64(abs_offset) {2829let add = Inst::AluRRImm12 {2830alu_op,2831size: OperandSize::Size64,2832rd,2833rn: reg,2834imm12,2835};2836ret.push_str(&add.print_with_state(&mut EmitState::default()));2837} else {2838let tmp = writable_spilltmp_reg();2839for inst in Inst::load_constant(tmp, abs_offset).into_iter() {2840ret.push_str(&inst.print_with_state(&mut EmitState::default()));2841}2842let add = Inst::AluRRR {2843alu_op,2844size: 
OperandSize::Size64,2845rd,2846rn: reg,2847rm: tmp.to_reg(),2848};2849ret.push_str(&add.print_with_state(&mut EmitState::default()));2850}2851ret2852}2853&Inst::Paci { key } => {2854let key = match key {2855APIKey::AZ => "az",2856APIKey::BZ => "bz",2857APIKey::ASP => "asp",2858APIKey::BSP => "bsp",2859};28602861"paci".to_string() + key2862}2863&Inst::Xpaclri => "xpaclri".to_string(),2864&Inst::Bti { targets } => {2865let targets = match targets {2866BranchTargetType::None => "",2867BranchTargetType::C => " c",2868BranchTargetType::J => " j",2869BranchTargetType::JC => " jc",2870};28712872"bti".to_string() + targets2873}2874&Inst::EmitIsland { needed_space } => format!("emit_island {needed_space}"),28752876&Inst::ElfTlsGetAddr {2877ref symbol,2878rd,2879tmp,2880} => {2881let rd = pretty_print_reg(rd.to_reg());2882let tmp = pretty_print_reg(tmp.to_reg());2883format!("elf_tls_get_addr {}, {}, {}", rd, tmp, symbol.display(None))2884}2885&Inst::MachOTlsGetAddr { ref symbol, rd } => {2886let rd = pretty_print_reg(rd.to_reg());2887format!("macho_tls_get_addr {}, {}", rd, symbol.display(None))2888}2889&Inst::Unwind { ref inst } => {2890format!("unwind {inst:?}")2891}2892&Inst::DummyUse { reg } => {2893let reg = pretty_print_reg(reg);2894format!("dummy_use {reg}")2895}2896&Inst::LabelAddress { dst, label } => {2897let dst = pretty_print_reg(dst.to_reg());2898format!("label_address {dst}, {label:?}")2899}2900&Inst::SequencePoint {} => {2901format!("sequence_point")2902}2903&Inst::StackProbeLoop { start, end, step } => {2904let start = pretty_print_reg(start.to_reg());2905let end = pretty_print_reg(end);2906let step = step.pretty_print(0);2907format!("stack_probe_loop {start}, {end}, {step}")2908}2909}2910}2911}29122913//=============================================================================2914// Label fixups and jump veneers.29152916/// Different forms of label references for different instruction formats.2917#[derive(Clone, Copy, Debug, PartialEq, Eq)]2918pub enum 
LabelUse {
    /// 14-bit branch offset (conditional branches). PC-rel, offset is imm <<
    /// 2. Immediate is 14 signed bits, in bits 18:5. Used by tbz and tbnz.
    Branch14,
    /// 19-bit branch offset (conditional branches). PC-rel, offset is imm << 2. Immediate is 19
    /// signed bits, in bits 23:5. Used by cbz, cbnz, b.cond.
    Branch19,
    /// 26-bit branch offset (unconditional branches). PC-rel, offset is imm << 2. Immediate is 26
    /// signed bits, in bits 25:0. Used by b, bl.
    Branch26,
    /// 19-bit offset for LDR (load literal). PC-rel, offset is imm << 2. Immediate is 19 signed bits,
    /// in bits 23:5.
    Ldr19,
    /// 21-bit offset for ADR (get address of label). PC-rel, offset is not shifted. Immediate is
    /// 21 signed bits, with high 19 bits in bits 23:5 and low 2 bits in bits 30:29.
    Adr21,
    /// 32-bit PC relative constant offset (from address of constant itself),
    /// signed. Used in jump tables.
    PCRel32,
}

impl MachInstLabelUse for LabelUse {
    /// Alignment for veneer code. Every AArch64 instruction must be 4-byte-aligned.
    const ALIGN: CodeOffset = 4;

    /// Maximum PC-relative range (positive), inclusive.
    fn max_pos_range(self) -> CodeOffset {
        match self {
            // N-bit immediate, left-shifted by 2, for (N+2) bits of total
            // range. Signed, so +2^(N+1) from zero. Likewise for two other
            // shifted cases below.
            LabelUse::Branch14 => (1 << 15) - 1,
            LabelUse::Branch19 => (1 << 20) - 1,
            LabelUse::Branch26 => (1 << 27) - 1,
            LabelUse::Ldr19 => (1 << 20) - 1,
            // Adr does not shift its immediate, so the 21-bit immediate gives 21 bits of total
            // range.
            LabelUse::Adr21 => (1 << 20) - 1,
            LabelUse::PCRel32 => 0x7fffffff,
        }
    }

    /// Maximum PC-relative range (negative).
    fn max_neg_range(self) -> CodeOffset {
        // All forms are twos-complement signed offsets, so negative limit is one more than
        // positive limit.
        self.max_pos_range() + 1
    }

    /// Size of window into code needed to do the patch.
    fn patch_size(self) -> CodeOffset {
        // Patch is on one instruction (4 bytes) only for all of these label reference types.
        4
    }

    /// Perform the patch: splice the PC-relative offset into the 32-bit
    /// instruction word at `buffer[0..4]` (little-endian), according to this
    /// label-use kind's bitfield layout.
    fn patch(self, buffer: &mut [u8], use_offset: CodeOffset, label_offset: CodeOffset) {
        let pc_rel = (label_offset as i64) - (use_offset as i64);
        debug_assert!(pc_rel <= self.max_pos_range() as i64);
        debug_assert!(pc_rel >= -(self.max_neg_range() as i64));
        let pc_rel = pc_rel as u32;
        let insn_word = u32::from_le_bytes([buffer[0], buffer[1], buffer[2], buffer[3]]);
        // Bits of the instruction word occupied by the immediate for each form.
        let mask = match self {
            LabelUse::Branch14 => 0x0007ffe0, // bits 18..5 inclusive
            LabelUse::Branch19 => 0x00ffffe0, // bits 23..5 inclusive
            LabelUse::Branch26 => 0x03ffffff, // bits 25..0 inclusive
            LabelUse::Ldr19 => 0x00ffffe0,    // bits 23..5 inclusive
            LabelUse::Adr21 => 0x60ffffe0,    // bits 30..29 and 23..5 inclusive
            LabelUse::PCRel32 => 0xffffffff,
        };
        // All branch/load-literal forms encode the offset divided by 4; Adr21
        // and PCRel32 use the byte offset directly.
        let pc_rel_shifted = match self {
            LabelUse::Adr21 | LabelUse::PCRel32 => pc_rel,
            _ => {
                debug_assert!(pc_rel & 3 == 0);
                pc_rel >> 2
            }
        };
        let pc_rel_inserted = match self {
            LabelUse::Branch14 => (pc_rel_shifted & 0x3fff) << 5,
            LabelUse::Branch19 | LabelUse::Ldr19 => (pc_rel_shifted & 0x7ffff) << 5,
            LabelUse::Branch26 => pc_rel_shifted & 0x3ffffff,
            // Note: the *low* two bits of offset are put in the
            // *high* bits (30, 29).
            LabelUse::Adr21 => (pc_rel_shifted & 0x1ffffc) << 3 | (pc_rel_shifted & 3) << 29,
            LabelUse::PCRel32 => pc_rel_shifted,
        };
        // PCRel32 words hold a plain 32-bit value (jump-table entry), so the
        // offset is added to the existing word rather than masked in.
        let is_add = match self {
            LabelUse::PCRel32 => true,
            _ => false,
        };
        let insn_word = if is_add {
            insn_word.wrapping_add(pc_rel_inserted)
        } else {
            (insn_word & !mask) | pc_rel_inserted
        };
        buffer[0..4].clone_from_slice(&u32::to_le_bytes(insn_word));
    }

    /// Is a veneer supported for this label reference type?
    fn supports_veneer(self) -> bool {
        match self {
            LabelUse::Branch14 | LabelUse::Branch19 => true, // veneer is a Branch26
            LabelUse::Branch26 => true,                      // veneer is a PCRel32
            _ => false,
        }
    }

    /// How large is the veneer, if supported?
    fn veneer_size(self) -> CodeOffset {
        match self {
            LabelUse::Branch14 | LabelUse::Branch19 => 4,
            LabelUse::Branch26 => 20,
            _ => unreachable!(),
        }
    }

    fn worst_case_veneer_size() -> CodeOffset {
        // The largest veneer emitted by `generate_veneer` is the 20-byte
        // Branch26 -> PCRel32 sequence below.
        20
    }

    /// Generate a veneer into the buffer, given that this veneer is at `veneer_offset`, and return
    /// an offset and label-use for the veneer's use of the original label.
    fn generate_veneer(
        self,
        buffer: &mut [u8],
        veneer_offset: CodeOffset,
    ) -> (CodeOffset, LabelUse) {
        match self {
            LabelUse::Branch14 | LabelUse::Branch19 => {
                // veneer is a Branch26 (unconditional branch). Just encode directly here -- don't
                // bother with constructing an Inst.
                let insn_word = 0b000101 << 26;
                buffer[0..4].clone_from_slice(&u32::to_le_bytes(insn_word));
                (veneer_offset, LabelUse::Branch26)
            }

            // This is promoting a 26-bit call/jump to a 32-bit call/jump to
            // get a further range. This jump translates to a jump to a
            // relative location based on the address of the constant loaded
            // from here.
            //
            // If this path is taken from a call instruction then caller-saved
            // registers are available (minus arguments), so x16/x17 are
            // available. Otherwise for intra-function jumps we also reserve
            // x16/x17 as spill-style registers. In both cases these are
            // available for us to use.
            LabelUse::Branch26 => {
                let tmp1 = regs::spilltmp_reg();
                let tmp1_w = regs::writable_spilltmp_reg();
                let tmp2 = regs::tmp2_reg();
                let tmp2_w = regs::writable_tmp2_reg();
                // ldrsw x16, 16
                let ldr = emit::enc_ldst_imm19(0b1001_1000, 16 / 4, tmp1);
                // adr x17, 12
                let adr = emit::enc_adr(12, tmp2_w);
                // add x16, x16, x17
                let add = emit::enc_arith_rrr(0b10001011_000, 0, tmp1_w, tmp1, tmp2);
                // br x16
                let br = emit::enc_br(tmp1);
                buffer[0..4].clone_from_slice(&u32::to_le_bytes(ldr));
                buffer[4..8].clone_from_slice(&u32::to_le_bytes(adr));
                buffer[8..12].clone_from_slice(&u32::to_le_bytes(add));
                buffer[12..16].clone_from_slice(&u32::to_le_bytes(br));
                // the 4-byte signed immediate we'll load is after these
                // instructions, 16-bytes in.
                (veneer_offset + 16, LabelUse::PCRel32)
            }

            _ => panic!("Unsupported label-reference type for veneer generation!"),
        }
    }

    /// Map an external relocation to the label-use kind that implements it;
    /// only `Arm64Call` with a zero addend is supported (it is a Branch26).
    fn from_reloc(reloc: Reloc, addend: Addend) -> Option<LabelUse> {
        match (reloc, addend) {
            (Reloc::Arm64Call, 0) => Some(LabelUse::Branch26),
            _ => None,
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn inst_size_test() {
        // This test will help with unintentionally growing the size
        // of the Inst enum.
        let expected = if cfg!(target_pointer_width = "32") && !cfg!(target_arch = "arm") {
            28
        } else {
            32
        };
        assert_eq!(expected, core::mem::size_of::<Inst>());
    }
}