CoCalc -- PPCInstructionSelector.cpp

GitHub Repository: freebsd/freebsd-src
Path: blob/main/contrib/llvm-project/llvm/lib/Target/PowerPC/GISel/PPCInstructionSelector.cpp
35294 views
1
//===- PPCInstructionSelector.cpp --------------------------------*- C++ -*-==//
2
//
3
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4
// See https://llvm.org/LICENSE.txt for license information.
5
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6
//
7
//===----------------------------------------------------------------------===//
8
/// \file
9
/// This file implements the targeting of the InstructionSelector class for
10
/// PowerPC.
11
//===----------------------------------------------------------------------===//
12

13
#include "PPC.h"
14
#include "PPCInstrInfo.h"
15
#include "PPCMachineFunctionInfo.h"
16
#include "PPCRegisterBankInfo.h"
17
#include "PPCSubtarget.h"
18
#include "PPCTargetMachine.h"
19
#include "llvm/CodeGen/GlobalISel/GIMatchTableExecutorImpl.h"
20
#include "llvm/CodeGen/GlobalISel/GenericMachineInstrs.h"
21
#include "llvm/CodeGen/GlobalISel/InstructionSelector.h"
22
#include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h"
23
#include "llvm/CodeGen/MachineConstantPool.h"
24
#include "llvm/CodeGen/MachineFunction.h"
25
#include "llvm/IR/IntrinsicsPowerPC.h"
26
#include "llvm/Support/Debug.h"
27

28
#define DEBUG_TYPE "ppc-gisel"
29

30
using namespace llvm;
31

32
namespace {

#define GET_GLOBALISEL_PREDICATE_BITSET
#include "PPCGenGlobalISel.inc"
#undef GET_GLOBALISEL_PREDICATE_BITSET

/// PowerPC implementation of the GlobalISel InstructionSelector.
///
/// select() first tries the tblgen-generated matcher (selectImpl) and only
/// then falls back to the hand-written helpers declared below.
class PPCInstructionSelector : public InstructionSelector {
public:
  PPCInstructionSelector(const PPCTargetMachine &TM, const PPCSubtarget &STI,
                         const PPCRegisterBankInfo &RBI);

  /// Name of this selector; identical to the debug type of this file.
  static const char *getName() { return DEBUG_TYPE; }

  /// Entry point: select \p I, returning true on success.
  bool select(MachineInstr &I) override;

private:
  /// tblgen generated 'select' implementation that is used as the initial
  /// selector for the patterns that do not require complex C++.
  bool selectImpl(MachineInstr &I, CodeGenCoverage &CoverageInfo) const;

  /// Hand-written selection of G_SITOFP / G_UITOFP.
  bool selectIntToFP(MachineInstr &I, MachineBasicBlock &MBB,
                     MachineRegisterInfo &MRI) const;
  /// Hand-written selection of G_FPTOSI / G_FPTOUI.
  bool selectFPToInt(MachineInstr &I, MachineBasicBlock &MBB,
                     MachineRegisterInfo &MRI) const;

  /// Hand-written selection of G_ZEXT.
  bool selectZExt(MachineInstr &I, MachineBasicBlock &MBB,
                  MachineRegisterInfo &MRI) const;
  /// Hand-written selection of G_CONSTANT_POOL.
  bool selectConstantPool(MachineInstr &I, MachineBasicBlock &MBB,
                          MachineRegisterInfo &MRI) const;

  /// Hand-written selection of G_CONSTANT.
  bool selectI64Imm(MachineInstr &I, MachineBasicBlock &MBB,
                    MachineRegisterInfo &MRI) const;
  /// Tries to materialize \p Imm into \p Reg with one of a fixed set of short
  /// instruction sequences inserted before \p I. Returns std::nullopt when no
  /// pattern applied (nothing was inserted); otherwise the success of
  /// constraining the emitted instructions.
  std::optional<bool> selectI64ImmDirect(MachineInstr &I,
                                         MachineBasicBlock &MBB,
                                         MachineRegisterInfo &MRI, Register Reg,
                                         uint64_t Imm) const;

  // Target description objects. The declaration order is also the
  // initialization order used by the constructor.
  const PPCTargetMachine &TM;
  const PPCSubtarget &STI;
  const PPCInstrInfo &TII;
  const PPCRegisterInfo &TRI;
  const PPCRegisterBankInfo &RBI;

#define GET_GLOBALISEL_PREDICATES_DECL
#include "PPCGenGlobalISel.inc"
#undef GET_GLOBALISEL_PREDICATES_DECL

#define GET_GLOBALISEL_TEMPORARIES_DECL
#include "PPCGenGlobalISel.inc"
#undef GET_GLOBALISEL_TEMPORARIES_DECL
};

} // end anonymous namespace
84

85
#define GET_GLOBALISEL_IMPL
86
#include "PPCGenGlobalISel.inc"
87
#undef GET_GLOBALISEL_IMPL
88

89
/// Stores the target machine, subtarget and register bank info, and takes the
/// instruction and register info from the subtarget. The trailing initializers
/// for predicates and temporaries come from the tblgen-generated include.
PPCInstructionSelector::PPCInstructionSelector(const PPCTargetMachine &TM,
                                               const PPCSubtarget &STI,
                                               const PPCRegisterBankInfo &RBI)
    : TM(TM), STI(STI), TII(*STI.getInstrInfo()), TRI(*STI.getRegisterInfo()),
      RBI(RBI),
#define GET_GLOBALISEL_PREDICATES_INIT
#include "PPCGenGlobalISel.inc"
#undef GET_GLOBALISEL_PREDICATES_INIT
#define GET_GLOBALISEL_TEMPORARIES_INIT
#include "PPCGenGlobalISel.inc"
#undef GET_GLOBALISEL_TEMPORARIES_INIT
{
  // Nothing else to set up.
}
102

103
/// Picks the register class used for a value of type \p Ty that lives in
/// register bank \p RB:
///   GPR: 64 bits -> G8RC, up to 32 bits -> GPRC
///   FPR: 32 bits -> F4RC, 64 bits -> F8RC
///   VEC: 128 bits -> VSRC
///   CR:  1 bit -> CRBITRC, 4 bits -> CRRC
/// Any other bank/size combination is treated as unreachable.
static const TargetRegisterClass *getRegClass(LLT Ty, const RegisterBank *RB) {
  switch (RB->getID()) {
  case PPC::GPRRegBankID: {
    const auto Bits = Ty.getSizeInBits();
    if (Bits == 64)
      return &PPC::G8RCRegClass;
    if (Bits <= 32)
      return &PPC::GPRCRegClass;
    break;
  }
  case PPC::FPRRegBankID: {
    const auto Bits = Ty.getSizeInBits();
    if (Bits == 32)
      return &PPC::F4RCRegClass;
    if (Bits == 64)
      return &PPC::F8RCRegClass;
    break;
  }
  case PPC::VECRegBankID: {
    if (Ty.getSizeInBits() == 128)
      return &PPC::VSRCRegClass;
    break;
  }
  case PPC::CRRegBankID: {
    const auto Bits = Ty.getSizeInBits();
    if (Bits == 1)
      return &PPC::CRBITRCRegClass;
    if (Bits == 4)
      return &PPC::CRRCRegClass;
    break;
  }
  default:
    break;
  }

  llvm_unreachable("Unknown RegBank!");
}
129

130
static bool selectCopy(MachineInstr &I, const TargetInstrInfo &TII,
131
                       MachineRegisterInfo &MRI, const TargetRegisterInfo &TRI,
132
                       const RegisterBankInfo &RBI) {
133
  Register DstReg = I.getOperand(0).getReg();
134

135
  if (DstReg.isPhysical())
136
    return true;
137

138
  const RegisterBank *DstRegBank = RBI.getRegBank(DstReg, MRI, TRI);
139
  const TargetRegisterClass *DstRC =
140
      getRegClass(MRI.getType(DstReg), DstRegBank);
141

142
  // No need to constrain SrcReg. It will get constrained when we hit another of
143
  // its use or its defs.
144
  // Copies do not have constraints.
145
  if (!RBI.constrainGenericRegister(DstReg, *DstRC, MRI)) {
146
    LLVM_DEBUG(dbgs() << "Failed to constrain " << TII.getName(I.getOpcode())
147
                      << " operand\n");
148
    return false;
149
  }
150

151
  return true;
152
}
153

154
static unsigned selectLoadStoreOp(unsigned GenericOpc, unsigned RegBankID,
155
                                  unsigned OpSize) {
156
  const bool IsStore = GenericOpc == TargetOpcode::G_STORE;
157
  switch (RegBankID) {
158
  case PPC::GPRRegBankID:
159
    switch (OpSize) {
160
    case 32:
161
      return IsStore ? PPC::STW : PPC::LWZ;
162
    case 64:
163
      return IsStore ? PPC::STD : PPC::LD;
164
    default:
165
      llvm_unreachable("Unexpected size!");
166
    }
167
    break;
168
  case PPC::FPRRegBankID:
169
    switch (OpSize) {
170
    case 32:
171
      return IsStore ? PPC::STFS : PPC::LFS;
172
    case 64:
173
      return IsStore ? PPC::STFD : PPC::LFD;
174
    default:
175
      llvm_unreachable("Unexpected size!");
176
    }
177
    break;
178
  default:
179
    llvm_unreachable("Unexpected register bank!");
180
  }
181
  return GenericOpc;
182
}
183

184
bool PPCInstructionSelector::selectIntToFP(MachineInstr &I,
185
                                           MachineBasicBlock &MBB,
186
                                           MachineRegisterInfo &MRI) const {
187
  if (!STI.hasDirectMove() || !STI.isPPC64() || !STI.hasFPCVT())
188
    return false;
189

190
  const DebugLoc &DbgLoc = I.getDebugLoc();
191
  const Register DstReg = I.getOperand(0).getReg();
192
  const Register SrcReg = I.getOperand(1).getReg();
193

194
  Register MoveReg = MRI.createVirtualRegister(&PPC::VSFRCRegClass);
195

196
  // For now, only handle the case for 64 bit integer.
197
  BuildMI(MBB, I, DbgLoc, TII.get(PPC::MTVSRD), MoveReg).addReg(SrcReg);
198

199
  bool IsSingle = MRI.getType(DstReg).getSizeInBits() == 32;
200
  bool IsSigned = I.getOpcode() == TargetOpcode::G_SITOFP;
201
  unsigned ConvOp = IsSingle ? (IsSigned ? PPC::XSCVSXDSP : PPC::XSCVUXDSP)
202
                             : (IsSigned ? PPC::XSCVSXDDP : PPC::XSCVUXDDP);
203

204
  MachineInstr *MI =
205
      BuildMI(MBB, I, DbgLoc, TII.get(ConvOp), DstReg).addReg(MoveReg);
206

207
  I.eraseFromParent();
208
  return constrainSelectedInstRegOperands(*MI, TII, TRI, RBI);
209
}
210

211
bool PPCInstructionSelector::selectFPToInt(MachineInstr &I,
212
                                           MachineBasicBlock &MBB,
213
                                           MachineRegisterInfo &MRI) const {
214
  if (!STI.hasDirectMove() || !STI.isPPC64() || !STI.hasFPCVT())
215
    return false;
216

217
  const DebugLoc &DbgLoc = I.getDebugLoc();
218
  const Register DstReg = I.getOperand(0).getReg();
219
  const Register SrcReg = I.getOperand(1).getReg();
220

221
  Register CopyReg = MRI.createVirtualRegister(&PPC::VSFRCRegClass);
222
  BuildMI(MBB, I, DbgLoc, TII.get(TargetOpcode::COPY), CopyReg).addReg(SrcReg);
223

224
  Register ConvReg = MRI.createVirtualRegister(&PPC::VSFRCRegClass);
225

226
  bool IsSigned = I.getOpcode() == TargetOpcode::G_FPTOSI;
227

228
  // single-precision is stored as double-precision on PPC in registers, so
229
  // always use double-precision convertions.
230
  unsigned ConvOp = IsSigned ? PPC::XSCVDPSXDS : PPC::XSCVDPUXDS;
231

232
  BuildMI(MBB, I, DbgLoc, TII.get(ConvOp), ConvReg).addReg(CopyReg);
233

234
  MachineInstr *MI =
235
      BuildMI(MBB, I, DbgLoc, TII.get(PPC::MFVSRD), DstReg).addReg(ConvReg);
236

237
  I.eraseFromParent();
238
  return constrainSelectedInstRegOperands(*MI, TII, TRI, RBI);
239
}
240

241
bool PPCInstructionSelector::selectZExt(MachineInstr &I, MachineBasicBlock &MBB,
242
                                        MachineRegisterInfo &MRI) const {
243
  const Register DstReg = I.getOperand(0).getReg();
244
  const LLT DstTy = MRI.getType(DstReg);
245
  const RegisterBank *DstRegBank = RBI.getRegBank(DstReg, MRI, TRI);
246

247
  const Register SrcReg = I.getOperand(1).getReg();
248

249
  assert(DstTy.getSizeInBits() == 64 && "Unexpected dest size!");
250
  assert(MRI.getType(SrcReg).getSizeInBits() == 32 && "Unexpected src size!");
251

252
  Register ImpDefReg =
253
      MRI.createVirtualRegister(getRegClass(DstTy, DstRegBank));
254
  BuildMI(MBB, I, I.getDebugLoc(), TII.get(TargetOpcode::IMPLICIT_DEF),
255
          ImpDefReg);
256

257
  Register NewDefReg =
258
      MRI.createVirtualRegister(getRegClass(DstTy, DstRegBank));
259
  BuildMI(MBB, I, I.getDebugLoc(), TII.get(TargetOpcode::INSERT_SUBREG),
260
          NewDefReg)
261
      .addReg(ImpDefReg)
262
      .addReg(SrcReg)
263
      .addImm(PPC::sub_32);
264

265
  MachineInstr *MI =
266
      BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), DstReg)
267
          .addReg(NewDefReg)
268
          .addImm(0)
269
          .addImm(32);
270

271
  I.eraseFromParent();
272
  return constrainSelectedInstRegOperands(*MI, TII, TRI, RBI);
273
}
274

275
// For any 32 < Num < 64, check if the Imm contains at least Num consecutive
276
// zeros and return the number of bits by the left of these consecutive zeros.
277
static uint32_t findContiguousZerosAtLeast(uint64_t Imm, unsigned Num) {
278
  uint32_t HiTZ = llvm::countr_zero<uint32_t>(Hi_32(Imm));
279
  uint32_t LoLZ = llvm::countl_zero<uint32_t>(Lo_32(Imm));
280
  if ((HiTZ + LoLZ) >= Num)
281
    return (32 + HiTZ);
282
  return 0;
283
}
284

285
// Direct materialization of 64-bit constants by enumerated patterns.
286
// Similar to PPCISelDAGToDAG::selectI64ImmDirect().
287
std::optional<bool> PPCInstructionSelector::selectI64ImmDirect(MachineInstr &I,
288
                                                MachineBasicBlock &MBB,
289
                                                MachineRegisterInfo &MRI,
290
                                                Register Reg,
291
                                                uint64_t Imm) const {
292
  unsigned TZ = llvm::countr_zero<uint64_t>(Imm);
293
  unsigned LZ = llvm::countl_zero<uint64_t>(Imm);
294
  unsigned TO = llvm::countr_one<uint64_t>(Imm);
295
  unsigned LO = llvm::countl_one<uint64_t>(Imm);
296
  uint32_t Hi32 = Hi_32(Imm);
297
  uint32_t Lo32 = Lo_32(Imm);
298
  uint32_t Shift = 0;
299

300
  // Following patterns use 1 instructions to materialize the Imm.
301

302
  // 1-1) Patterns : {zeros}{15-bit valve}
303
  //                 {ones}{15-bit valve}
304
  if (isInt<16>(Imm))
305
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LI8), Reg)
306
        .addImm(Imm)
307
        .constrainAllUses(TII, TRI, RBI);
308
  // 1-2) Patterns : {zeros}{15-bit valve}{16 zeros}
309
  //                 {ones}{15-bit valve}{16 zeros}
310
  if (TZ > 15 && (LZ > 32 || LO > 32))
311
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LIS8), Reg)
312
        .addImm((Imm >> 16) & 0xffff)
313
        .constrainAllUses(TII, TRI, RBI);
314

315
  // Following patterns use 2 instructions to materialize the Imm.
316

317
  assert(LZ < 64 && "Unexpected leading zeros here.");
318
  // Count of ones follwing the leading zeros.
319
  unsigned FO = llvm::countl_one<uint64_t>(Imm << LZ);
320
  // 2-1) Patterns : {zeros}{31-bit value}
321
  //                 {ones}{31-bit value}
322
  if (isInt<32>(Imm)) {
323
    uint64_t ImmHi16 = (Imm >> 16) & 0xffff;
324
    unsigned Opcode = ImmHi16 ? PPC::LIS8 : PPC::LI8;
325
    Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
326
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(Opcode), TmpReg)
327
             .addImm((Imm >> 16) & 0xffff)
328
             .constrainAllUses(TII, TRI, RBI))
329
      return false;
330
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), Reg)
331
        .addReg(TmpReg, RegState::Kill)
332
        .addImm(Imm & 0xffff)
333
        .constrainAllUses(TII, TRI, RBI);
334
  }
335
  // 2-2) Patterns : {zeros}{ones}{15-bit value}{zeros}
336
  //                 {zeros}{15-bit value}{zeros}
337
  //                 {zeros}{ones}{15-bit value}
338
  //                 {ones}{15-bit value}{zeros}
339
  // We can take advantage of LI's sign-extension semantics to generate leading
340
  // ones, and then use RLDIC to mask off the ones in both sides after rotation.
341
  if ((LZ + FO + TZ) > 48) {
342
    Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
343
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LI8), TmpReg)
344
             .addImm((Imm >> TZ) & 0xffff)
345
             .constrainAllUses(TII, TRI, RBI))
346
      return false;
347
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDIC), Reg)
348
        .addReg(TmpReg, RegState::Kill)
349
        .addImm(TZ)
350
        .addImm(LZ)
351
        .constrainAllUses(TII, TRI, RBI);
352
  }
353
  // 2-3) Pattern : {zeros}{15-bit value}{ones}
354
  // Shift right the Imm by (48 - LZ) bits to construct a negtive 16 bits value,
355
  // therefore we can take advantage of LI's sign-extension semantics, and then
356
  // mask them off after rotation.
357
  //
358
  // +--LZ--||-15-bit-||--TO--+     +-------------|--16-bit--+
359
  // |00000001bbbbbbbbb1111111| ->  |00000000000001bbbbbbbbb1|
360
  // +------------------------+     +------------------------+
361
  // 63                      0      63                      0
362
  //          Imm                   (Imm >> (48 - LZ) & 0xffff)
363
  // +----sext-----|--16-bit--+     +clear-|-----------------+
364
  // |11111111111111bbbbbbbbb1| ->  |00000001bbbbbbbbb1111111|
365
  // +------------------------+     +------------------------+
366
  // 63                      0      63                      0
367
  // LI8: sext many leading zeros   RLDICL: rotate left (48 - LZ), clear left LZ
368
  if ((LZ + TO) > 48) {
369
    // Since the immediates with (LZ > 32) have been handled by previous
370
    // patterns, here we have (LZ <= 32) to make sure we will not shift right
371
    // the Imm by a negative value.
372
    assert(LZ <= 32 && "Unexpected shift value.");
373
    Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
374
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LI8), TmpReg)
375
             .addImm(Imm >> (48 - LZ) & 0xffff)
376
             .constrainAllUses(TII, TRI, RBI))
377
      return false;
378
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), Reg)
379
        .addReg(TmpReg, RegState::Kill)
380
        .addImm(48 - LZ)
381
        .addImm(LZ)
382
        .constrainAllUses(TII, TRI, RBI);
383
  }
384
  // 2-4) Patterns : {zeros}{ones}{15-bit value}{ones}
385
  //                 {ones}{15-bit value}{ones}
386
  // We can take advantage of LI's sign-extension semantics to generate leading
387
  // ones, and then use RLDICL to mask off the ones in left sides (if required)
388
  // after rotation.
389
  //
390
  // +-LZ-FO||-15-bit-||--TO--+     +-------------|--16-bit--+
391
  // |00011110bbbbbbbbb1111111| ->  |000000000011110bbbbbbbbb|
392
  // +------------------------+     +------------------------+
393
  // 63                      0      63                      0
394
  //            Imm                    (Imm >> TO) & 0xffff
395
  // +----sext-----|--16-bit--+     +LZ|---------------------+
396
  // |111111111111110bbbbbbbbb| ->  |00011110bbbbbbbbb1111111|
397
  // +------------------------+     +------------------------+
398
  // 63                      0      63                      0
399
  // LI8: sext many leading zeros   RLDICL: rotate left TO, clear left LZ
400
  if ((LZ + FO + TO) > 48) {
401
    Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
402
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LI8), TmpReg)
403
             .addImm((Imm >> TO) & 0xffff)
404
             .constrainAllUses(TII, TRI, RBI))
405
      return false;
406
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), Reg)
407
        .addReg(TmpReg, RegState::Kill)
408
        .addImm(TO)
409
        .addImm(LZ)
410
        .constrainAllUses(TII, TRI, RBI);
411
  }
412
  // 2-5) Pattern : {32 zeros}{****}{0}{15-bit value}
413
  // If Hi32 is zero and the Lo16(in Lo32) can be presented as a positive 16 bit
414
  // value, we can use LI for Lo16 without generating leading ones then add the
415
  // Hi16(in Lo32).
416
  if (LZ == 32 && ((Lo32 & 0x8000) == 0)) {
417
    Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
418
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LI8), TmpReg)
419
             .addImm(Lo32 & 0xffff)
420
             .constrainAllUses(TII, TRI, RBI))
421
      return false;
422
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORIS8), Reg)
423
        .addReg(TmpReg, RegState::Kill)
424
        .addImm(Lo32 >> 16)
425
        .constrainAllUses(TII, TRI, RBI);
426
  }
427
  // 2-6) Patterns : {******}{49 zeros}{******}
428
  //                 {******}{49 ones}{******}
429
  // If the Imm contains 49 consecutive zeros/ones, it means that a total of 15
430
  // bits remain on both sides. Rotate right the Imm to construct an int<16>
431
  // value, use LI for int<16> value and then use RLDICL without mask to rotate
432
  // it back.
433
  //
434
  // 1) findContiguousZerosAtLeast(Imm, 49)
435
  // +------|--zeros-|------+     +---ones--||---15 bit--+
436
  // |bbbbbb0000000000aaaaaa| ->  |0000000000aaaaaabbbbbb|
437
  // +----------------------+     +----------------------+
438
  // 63                    0      63                    0
439
  //
440
  // 2) findContiguousZerosAtLeast(~Imm, 49)
441
  // +------|--ones--|------+     +---ones--||---15 bit--+
442
  // |bbbbbb1111111111aaaaaa| ->  |1111111111aaaaaabbbbbb|
443
  // +----------------------+     +----------------------+
444
  // 63                    0      63                    0
445
  if ((Shift = findContiguousZerosAtLeast(Imm, 49)) ||
446
      (Shift = findContiguousZerosAtLeast(~Imm, 49))) {
447
    uint64_t RotImm = APInt(64, Imm).rotr(Shift).getZExtValue();
448
    Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
449
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LI8), TmpReg)
450
             .addImm(RotImm & 0xffff)
451
             .constrainAllUses(TII, TRI, RBI))
452
      return false;
453
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), Reg)
454
        .addReg(TmpReg, RegState::Kill)
455
        .addImm(Shift)
456
        .addImm(0)
457
        .constrainAllUses(TII, TRI, RBI);
458
  }
459

460
  // Following patterns use 3 instructions to materialize the Imm.
461

462
  // 3-1) Patterns : {zeros}{ones}{31-bit value}{zeros}
463
  //                 {zeros}{31-bit value}{zeros}
464
  //                 {zeros}{ones}{31-bit value}
465
  //                 {ones}{31-bit value}{zeros}
466
  // We can take advantage of LIS's sign-extension semantics to generate leading
467
  // ones, add the remaining bits with ORI, and then use RLDIC to mask off the
468
  // ones in both sides after rotation.
469
  if ((LZ + FO + TZ) > 32) {
470
    uint64_t ImmHi16 = (Imm >> (TZ + 16)) & 0xffff;
471
    unsigned Opcode = ImmHi16 ? PPC::LIS8 : PPC::LI8;
472
    Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
473
    Register Tmp2Reg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
474
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(Opcode), TmpReg)
475
             .addImm(ImmHi16)
476
             .constrainAllUses(TII, TRI, RBI))
477
      return false;
478
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), Tmp2Reg)
479
             .addReg(TmpReg, RegState::Kill)
480
             .addImm((Imm >> TZ) & 0xffff)
481
             .constrainAllUses(TII, TRI, RBI))
482
      return false;
483
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDIC), Reg)
484
        .addReg(Tmp2Reg, RegState::Kill)
485
        .addImm(TZ)
486
        .addImm(LZ)
487
        .constrainAllUses(TII, TRI, RBI);
488
  }
489
  // 3-2) Pattern : {zeros}{31-bit value}{ones}
490
  // Shift right the Imm by (32 - LZ) bits to construct a negative 32 bits
491
  // value, therefore we can take advantage of LIS's sign-extension semantics,
492
  // add the remaining bits with ORI, and then mask them off after rotation.
493
  // This is similar to Pattern 2-3, please refer to the diagram there.
494
  if ((LZ + TO) > 32) {
495
    // Since the immediates with (LZ > 32) have been handled by previous
496
    // patterns, here we have (LZ <= 32) to make sure we will not shift right
497
    // the Imm by a negative value.
498
    assert(LZ <= 32 && "Unexpected shift value.");
499
    Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
500
    Register Tmp2Reg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
501
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LIS8), TmpReg)
502
            .addImm((Imm >> (48 - LZ)) & 0xffff)
503
            .constrainAllUses(TII, TRI, RBI))
504
      return false;
505
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), Tmp2Reg)
506
             .addReg(TmpReg, RegState::Kill)
507
             .addImm((Imm >> (32 - LZ)) & 0xffff)
508
             .constrainAllUses(TII, TRI, RBI))
509
      return false;
510
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), Reg)
511
        .addReg(Tmp2Reg, RegState::Kill)
512
        .addImm(32 - LZ)
513
        .addImm(LZ)
514
        .constrainAllUses(TII, TRI, RBI);
515
  }
516
  // 3-3) Patterns : {zeros}{ones}{31-bit value}{ones}
517
  //                 {ones}{31-bit value}{ones}
518
  // We can take advantage of LIS's sign-extension semantics to generate leading
519
  // ones, add the remaining bits with ORI, and then use RLDICL to mask off the
520
  // ones in left sides (if required) after rotation.
521
  // This is similar to Pattern 2-4, please refer to the diagram there.
522
  if ((LZ + FO + TO) > 32) {
523
    Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
524
    Register Tmp2Reg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
525
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LIS8), TmpReg)
526
             .addImm((Imm >> (TO + 16)) & 0xffff)
527
             .constrainAllUses(TII, TRI, RBI))
528
      return false;
529
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), Tmp2Reg)
530
             .addReg(TmpReg, RegState::Kill)
531
             .addImm((Imm >> TO) & 0xffff)
532
             .constrainAllUses(TII, TRI, RBI))
533
      return false;
534
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), Reg)
535
        .addReg(Tmp2Reg, RegState::Kill)
536
        .addImm(TO)
537
        .addImm(LZ)
538
        .constrainAllUses(TII, TRI, RBI);
539
  }
540
  // 3-4) Patterns : High word == Low word
541
  if (Hi32 == Lo32) {
542
    // Handle the first 32 bits.
543
    uint64_t ImmHi16 = (Lo32 >> 16) & 0xffff;
544
    unsigned Opcode = ImmHi16 ? PPC::LIS8 : PPC::LI8;
545
    Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
546
    Register Tmp2Reg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
547
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(Opcode), TmpReg)
548
             .addImm(ImmHi16)
549
             .constrainAllUses(TII, TRI, RBI))
550
      return false;
551
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), Tmp2Reg)
552
             .addReg(TmpReg, RegState::Kill)
553
             .addImm(Lo32 & 0xffff)
554
             .constrainAllUses(TII, TRI, RBI))
555
      return false;
556
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDIMI), Reg)
557
        .addReg(Tmp2Reg)
558
        .addReg(Tmp2Reg, RegState::Kill)
559
        .addImm(32)
560
        .addImm(0)
561
        .constrainAllUses(TII, TRI, RBI);
562
  }
563
  // 3-5) Patterns : {******}{33 zeros}{******}
564
  //                 {******}{33 ones}{******}
565
  // If the Imm contains 33 consecutive zeros/ones, it means that a total of 31
566
  // bits remain on both sides. Rotate right the Imm to construct an int<32>
567
  // value, use LIS + ORI for int<32> value and then use RLDICL without mask to
568
  // rotate it back.
569
  // This is similar to Pattern 2-6, please refer to the diagram there.
570
  if ((Shift = findContiguousZerosAtLeast(Imm, 33)) ||
571
      (Shift = findContiguousZerosAtLeast(~Imm, 33))) {
572
    uint64_t RotImm = APInt(64, Imm).rotr(Shift).getZExtValue();
573
    uint64_t ImmHi16 = (RotImm >> 16) & 0xffff;
574
    unsigned Opcode = ImmHi16 ? PPC::LIS8 : PPC::LI8;
575
    Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
576
    Register Tmp2Reg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
577
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(Opcode), TmpReg)
578
             .addImm(ImmHi16)
579
             .constrainAllUses(TII, TRI, RBI))
580
      return false;
581
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), Tmp2Reg)
582
             .addReg(TmpReg, RegState::Kill)
583
             .addImm(RotImm & 0xffff)
584
             .constrainAllUses(TII, TRI, RBI))
585
      return false;
586
    return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), Reg)
587
        .addReg(Tmp2Reg, RegState::Kill)
588
        .addImm(Shift)
589
        .addImm(0)
590
        .constrainAllUses(TII, TRI, RBI);
591
  }
592

593
  // If we end up here then no instructions were inserted.
594
  return std::nullopt;
595
}
596

597
// Derived from PPCISelDAGToDAG::selectI64Imm().
598
// TODO: Add support for prefixed instructions.
599
bool PPCInstructionSelector::selectI64Imm(MachineInstr &I,
600
                                          MachineBasicBlock &MBB,
601
                                          MachineRegisterInfo &MRI) const {
602
  assert(I.getOpcode() == TargetOpcode::G_CONSTANT && "Unexpected G code");
603

604
  Register DstReg = I.getOperand(0).getReg();
605
  int64_t Imm = I.getOperand(1).getCImm()->getValue().getZExtValue();
606
  // No more than 3 instructions are used if we can select the i64 immediate
607
  // directly.
608
  if (std::optional<bool> Res = selectI64ImmDirect(I, MBB, MRI, DstReg, Imm)) {
609
    I.eraseFromParent();
610
    return *Res;
611
  }
612

613
  // Calculate the last bits as required.
614
  uint32_t Hi16 = (Lo_32(Imm) >> 16) & 0xffff;
615
  uint32_t Lo16 = Lo_32(Imm) & 0xffff;
616

617
  Register Reg =
618
      (Hi16 || Lo16) ? MRI.createVirtualRegister(&PPC::G8RCRegClass) : DstReg;
619

620
  // Handle the upper 32 bit value.
621
  std::optional<bool> Res =
622
      selectI64ImmDirect(I, MBB, MRI, Reg, Imm & 0xffffffff00000000);
623
  if (!Res || !*Res)
624
    return false;
625

626
  // Add in the last bits as required.
627
  if (Hi16) {
628
    Register TmpReg =
629
        Lo16 ? MRI.createVirtualRegister(&PPC::G8RCRegClass) : DstReg;
630
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORIS8), TmpReg)
631
             .addReg(Reg, RegState::Kill)
632
             .addImm(Hi16)
633
             .constrainAllUses(TII, TRI, RBI))
634
      return false;
635
    Reg = TmpReg;
636
  }
637
  if (Lo16) {
638
    if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), DstReg)
639
             .addReg(Reg, RegState::Kill)
640
             .addImm(Lo16)
641
             .constrainAllUses(TII, TRI, RBI))
642
      return false;
643
  }
644
  I.eraseFromParent();
645
  return true;
646
}
647

648
bool PPCInstructionSelector::selectConstantPool(
649
    MachineInstr &I, MachineBasicBlock &MBB, MachineRegisterInfo &MRI) const {
650
  const DebugLoc &DbgLoc = I.getDebugLoc();
651
  MachineFunction *MF = MBB.getParent();
652

653
  // TODO: handle 32-bit.
654
  // TODO: Enabling floating point constant pool selection on AIX requires
655
  // global isel on big endian target enabled first.
656
  // See CallLowering::enableBigEndian().
657
  if (!STI.isPPC64() || !STI.isLittleEndian())
658
    return false;
659

660
  MF->getInfo<PPCFunctionInfo>()->setUsesTOCBasePtr();
661

662
  const Register DstReg = I.getOperand(0).getReg();
663
  unsigned CPI = I.getOperand(1).getIndex();
664

665
  // Address stored in the TOC entry. This is related to code model and the ABI
666
  // we are currently using. For now we only handle 64-bit Linux LE. PowerPC
667
  // only supports small, medium and large code model.
668
  const CodeModel::Model CModel = TM.getCodeModel();
669
  assert(!(CModel == CodeModel::Tiny || CModel == CodeModel::Kernel) &&
670
         "PowerPC doesn't support tiny or kernel code models.");
671

672
  const MCRegister TOCReg = STI.getTOCPointerRegister();
673
  MachineMemOperand *MMO = MF->getMachineMemOperand(
674
      MachinePointerInfo::getGOT(*MF), MachineMemOperand::MOLoad,
675
      MRI.getType(DstReg), MF->getDataLayout().getPointerABIAlignment(0));
676

677
  MachineInstr *MI = nullptr;
678
  // For now we only handle 64-bit Linux.
679
  if (CModel == CodeModel::Small) {
680
    // For small code model, generate LDtocCPT(CPI, X2).
681
    MI = BuildMI(MBB, I, DbgLoc, TII.get(PPC::LDtocCPT), DstReg)
682
             .addConstantPoolIndex(CPI)
683
             .addReg(TOCReg)
684
             .addMemOperand(MMO);
685
  } else {
686
    Register HaAddrReg = MRI.createVirtualRegister(&PPC::G8RCRegClass);
687
    BuildMI(MBB, I, DbgLoc, TII.get(PPC::ADDIStocHA8), HaAddrReg)
688
        .addReg(TOCReg)
689
        .addConstantPoolIndex(CPI);
690

691
    if (CModel == CodeModel::Large)
692
      // For large code model, generate LDtocL(CPI, ADDIStocHA8(X2, CPI))
693
      MI = BuildMI(MBB, I, DbgLoc, TII.get(PPC::LDtocL), DstReg)
694
               .addConstantPoolIndex(CPI)
695
               .addReg(HaAddrReg)
696
               .addMemOperand(MMO);
697
    else
698
      // For medium code model, generate ADDItocL8(CPI, ADDIStocHA8(X2, CPI))
699
      MI = BuildMI(MBB, I, DbgLoc, TII.get(PPC::ADDItocL8), DstReg)
700
               .addReg(HaAddrReg)
701
               .addConstantPoolIndex(CPI);
702
  }
703

704
  I.eraseFromParent();
705
  return constrainSelectedInstRegOperands(*MI, TII, TRI, RBI);
706
}
707

708
/// Selects \p I. Non-generic instructions are accepted as they are, except
/// that copies get their destination constrained. Generic instructions are
/// first offered to the tblgen-generated selectImpl() and, if that fails,
/// dispatched by opcode to the hand-written selectors. Returns false when the
/// instruction could not be selected.
bool PPCInstructionSelector::select(MachineInstr &I) {
  MachineBasicBlock &MBB = *I.getParent();
  MachineFunction &MF = *MBB.getParent();
  MachineRegisterInfo &MRI = MF.getRegInfo();

  if (!isPreISelGenericOpcode(I.getOpcode()))
    return I.isCopy() ? selectCopy(I, TII, MRI, TRI, RBI) : true;

  if (selectImpl(I, *CoverageInfo))
    return true;

  switch (I.getOpcode()) {
  case TargetOpcode::G_LOAD:
  case TargetOpcode::G_STORE: {
    GLoadStore &LdSt = cast<GLoadStore>(I);
    const LLT PtrTy = MRI.getType(LdSt.getPointerReg());

    if (PtrTy != LLT::pointer(0, 64)) {
      LLVM_DEBUG(dbgs() << "Load/Store pointer has type: " << PtrTy
                        << ", expected: " << LLT::pointer(0, 64) << '\n');
      return false;
    }

    const unsigned GenericOpc = I.getOpcode();
    const unsigned NewOpc = selectLoadStoreOp(
        GenericOpc, RBI.getRegBank(LdSt.getReg(0), MRI, TRI)->getID(),
        LdSt.getMemSizeInBits().getValue());
    // The helper hands the generic opcode back when it found no replacement.
    if (NewOpc == GenericOpc)
      return false;

    // For now, simply use DForm with load/store addr as base and 0 as imm.
    // FIXME: optimize load/store with some specific address patterns.
    I.setDesc(TII.get(NewOpc));
    MachineOperand &AddrOp = I.getOperand(1);
    const Register AddrReg = AddrOp.getReg();
    const bool IsKill = AddrOp.isKill();
    // Operand 1 becomes the zero displacement; the address register is
    // re-added as a trailing operand.
    AddrOp.ChangeToImmediate(0);
    I.addOperand(MF, MachineOperand::CreateReg(AddrReg, /* isDef */ false,
                                               /* isImp */ false, IsKill));

    return constrainSelectedInstRegOperands(I, TII, TRI, RBI);
  }
  case TargetOpcode::G_SITOFP:
  case TargetOpcode::G_UITOFP:
    return selectIntToFP(I, MBB, MRI);
  case TargetOpcode::G_FPTOSI:
  case TargetOpcode::G_FPTOUI:
    return selectFPToInt(I, MBB, MRI);
  // G_SEXT will be selected in tb-gen pattern.
  case TargetOpcode::G_ZEXT:
    return selectZExt(I, MBB, MRI);
  case TargetOpcode::G_CONSTANT:
    return selectI64Imm(I, MBB, MRI);
  case TargetOpcode::G_CONSTANT_POOL:
    return selectConstantPool(I, MBB, MRI);
  default:
    break;
  }
  // No hand-written selector for this opcode.
  return false;
}
781

782
namespace llvm {
783
InstructionSelector *
784
createPPCInstructionSelector(const PPCTargetMachine &TM,
785
                             const PPCSubtarget &Subtarget,
786
                             const PPCRegisterBankInfo &RBI) {
787
  return new PPCInstructionSelector(TM, Subtarget, RBI);
788
}
789
} // end namespace llvm
790

791
Product

Resources

Company