Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
freebsd
GitHub Repository: freebsd/freebsd-src
Path: blob/main/contrib/llvm-project/lld/ELF/Thunks.cpp
34878 views
1
//===- Thunks.cpp --------------------------------------------------------===//
2
//
3
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4
// See https://llvm.org/LICENSE.txt for license information.
5
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6
//
7
//===---------------------------------------------------------------------===//
8
//
9
// This file contains Thunk subclasses.
10
//
11
// A thunk is a small piece of code written after an input section
12
// which is used to jump between "incompatible" functions
13
// such as MIPS PIC and non-PIC or ARM non-Thumb and Thumb functions.
14
//
15
// If a jump target is too far and its address doesn't fit to a
16
// short jump instruction, we need to create a thunk too, but we
17
// haven't supported it yet.
18
//
19
// i386 and x86-64 don't need thunks.
20
//
21
//===---------------------------------------------------------------------===//
22
23
#include "Thunks.h"
24
#include "Config.h"
25
#include "InputFiles.h"
26
#include "InputSection.h"
27
#include "OutputSections.h"
28
#include "Symbols.h"
29
#include "SyntheticSections.h"
30
#include "Target.h"
31
#include "lld/Common/CommonLinkerContext.h"
32
#include "llvm/BinaryFormat/ELF.h"
33
#include "llvm/Support/Casting.h"
34
#include "llvm/Support/ErrorHandling.h"
35
#include "llvm/Support/MathExtras.h"
36
#include <cstdint>
37
#include <cstring>
38
39
using namespace llvm;
40
using namespace llvm::object;
41
using namespace llvm::ELF;
42
using namespace lld;
43
using namespace lld::elf;
44
45
namespace {
46
47
// Base class for AArch64 thunks.
48
//
49
// An AArch64 thunk may be either short or long. A short thunk is simply a
50
// branch (B) instruction, and it may be used to call AArch64 functions when the
51
// distance from the thunk to the target is less than 128MB. Long thunks can
52
// branch to any virtual address and they are implemented in the derived
53
// classes. This class tries to create a short thunk if the target is in range,
54
// otherwise it creates a long thunk.
55
class AArch64Thunk : public Thunk {
56
public:
57
AArch64Thunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {}
58
bool getMayUseShortThunk();
59
void writeTo(uint8_t *buf) override;
60
61
private:
62
bool mayUseShortThunk = true;
63
virtual void writeLong(uint8_t *buf) = 0;
64
};
65
66
// AArch64 long range Thunks.
67
class AArch64ABSLongThunk final : public AArch64Thunk {
68
public:
69
AArch64ABSLongThunk(Symbol &dest, int64_t addend)
70
: AArch64Thunk(dest, addend) {}
71
uint32_t size() override { return getMayUseShortThunk() ? 4 : 16; }
72
void addSymbols(ThunkSection &isec) override;
73
74
private:
75
void writeLong(uint8_t *buf) override;
76
};
77
78
class AArch64ADRPThunk final : public AArch64Thunk {
79
public:
80
AArch64ADRPThunk(Symbol &dest, int64_t addend) : AArch64Thunk(dest, addend) {}
81
uint32_t size() override { return getMayUseShortThunk() ? 4 : 12; }
82
void addSymbols(ThunkSection &isec) override;
83
84
private:
85
void writeLong(uint8_t *buf) override;
86
};
87
88
// Base class for ARM thunks.
89
//
90
// An ARM thunk may be either short or long. A short thunk is simply a branch
91
// (B) instruction, and it may be used to call ARM functions when the distance
92
// from the thunk to the target is less than 32MB. Long thunks can branch to any
93
// virtual address and can switch between ARM and Thumb, and they are
94
// implemented in the derived classes. This class tries to create a short thunk
95
// if the target is in range, otherwise it creates a long thunk.
96
class ARMThunk : public Thunk {
97
public:
98
ARMThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {}
99
100
bool getMayUseShortThunk();
101
uint32_t size() override { return getMayUseShortThunk() ? 4 : sizeLong(); }
102
void writeTo(uint8_t *buf) override;
103
bool isCompatibleWith(const InputSection &isec,
104
const Relocation &rel) const override;
105
106
// Returns the size of a long thunk.
107
virtual uint32_t sizeLong() = 0;
108
109
// Writes a long thunk to Buf.
110
virtual void writeLong(uint8_t *buf) = 0;
111
112
private:
113
// This field tracks whether all previously considered layouts would allow
114
// this thunk to be short. If we have ever needed a long thunk, we always
115
// create a long thunk, even if the thunk may be short given the current
116
// distance to the target. We do this because transitioning from long to short
117
// can create layout oscillations in certain corner cases which would prevent
118
// the layout from converging.
119
bool mayUseShortThunk = true;
120
};
121
122
// Base class for Thumb-2 thunks.
123
//
124
// This class is similar to ARMThunk, but it uses the Thumb-2 B.W instruction
125
// which has a range of 16MB.
126
class ThumbThunk : public Thunk {
127
public:
128
ThumbThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {
129
alignment = 2;
130
}
131
132
bool getMayUseShortThunk();
133
uint32_t size() override { return getMayUseShortThunk() ? 4 : sizeLong(); }
134
void writeTo(uint8_t *buf) override;
135
bool isCompatibleWith(const InputSection &isec,
136
const Relocation &rel) const override;
137
138
// Returns the size of a long thunk.
139
virtual uint32_t sizeLong() = 0;
140
141
// Writes a long thunk to Buf.
142
virtual void writeLong(uint8_t *buf) = 0;
143
144
private:
145
// See comment in ARMThunk above.
146
bool mayUseShortThunk = true;
147
};
148
149
// Specific ARM Thunk implementations. The naming convention is:
150
// Source State, TargetState, Target Requirement, ABS or PI, Range
151
class ARMV7ABSLongThunk final : public ARMThunk {
152
public:
153
ARMV7ABSLongThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {}
154
155
uint32_t sizeLong() override { return 12; }
156
void writeLong(uint8_t *buf) override;
157
void addSymbols(ThunkSection &isec) override;
158
};
159
160
class ARMV7PILongThunk final : public ARMThunk {
161
public:
162
ARMV7PILongThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {}
163
164
uint32_t sizeLong() override { return 16; }
165
void writeLong(uint8_t *buf) override;
166
void addSymbols(ThunkSection &isec) override;
167
};
168
169
class ThumbV7ABSLongThunk final : public ThumbThunk {
170
public:
171
ThumbV7ABSLongThunk(Symbol &dest, int64_t addend)
172
: ThumbThunk(dest, addend) {}
173
174
uint32_t sizeLong() override { return 10; }
175
void writeLong(uint8_t *buf) override;
176
void addSymbols(ThunkSection &isec) override;
177
};
178
179
class ThumbV7PILongThunk final : public ThumbThunk {
180
public:
181
ThumbV7PILongThunk(Symbol &dest, int64_t addend) : ThumbThunk(dest, addend) {}
182
183
uint32_t sizeLong() override { return 12; }
184
void writeLong(uint8_t *buf) override;
185
void addSymbols(ThunkSection &isec) override;
186
};
187
188
// Implementations of Thunks for Arm v6-M. Only Thumb instructions are permitted
189
class ThumbV6MABSLongThunk final : public ThumbThunk {
190
public:
191
ThumbV6MABSLongThunk(Symbol &dest, int64_t addend)
192
: ThumbThunk(dest, addend) {}
193
194
uint32_t sizeLong() override { return 12; }
195
void writeLong(uint8_t *buf) override;
196
void addSymbols(ThunkSection &isec) override;
197
};
198
199
class ThumbV6MABSXOLongThunk final : public ThumbThunk {
200
public:
201
ThumbV6MABSXOLongThunk(Symbol &dest, int64_t addend)
202
: ThumbThunk(dest, addend) {}
203
204
uint32_t sizeLong() override { return 20; }
205
void writeLong(uint8_t *buf) override;
206
void addSymbols(ThunkSection &isec) override;
207
};
208
209
class ThumbV6MPILongThunk final : public ThumbThunk {
210
public:
211
ThumbV6MPILongThunk(Symbol &dest, int64_t addend)
212
: ThumbThunk(dest, addend) {}
213
214
uint32_t sizeLong() override { return 16; }
215
void writeLong(uint8_t *buf) override;
216
void addSymbols(ThunkSection &isec) override;
217
};
218
219
// Architectures v4, v5 and v6 do not support the movt/movw instructions. v5 and
220
// v6 support BLX to which BL instructions can be rewritten inline. There are no
221
// Thumb entrypoints for v5 and v6 as there is no Thumb branch instruction on
222
// these architecture that can result in a thunk.
223
224
// LDR on v5 and v6 can switch processor state, so for v5 and v6,
225
// ARMV5LongLdrPcThunk can be used for both Arm->Arm and Arm->Thumb calls. v4
226
// can also use this thunk, but only for Arm->Arm calls.
227
class ARMV5LongLdrPcThunk final : public ARMThunk {
228
public:
229
ARMV5LongLdrPcThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {}
230
231
uint32_t sizeLong() override { return 8; }
232
void writeLong(uint8_t *buf) override;
233
void addSymbols(ThunkSection &isec) override;
234
};
235
236
// Implementations of Thunks for v4. BLX is not supported, and loads
237
// will not invoke Arm/Thumb state changes.
238
class ARMV4PILongBXThunk final : public ARMThunk {
239
public:
240
ARMV4PILongBXThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {}
241
242
uint32_t sizeLong() override { return 16; }
243
void writeLong(uint8_t *buf) override;
244
void addSymbols(ThunkSection &isec) override;
245
};
246
247
class ARMV4PILongThunk final : public ARMThunk {
248
public:
249
ARMV4PILongThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {}
250
251
uint32_t sizeLong() override { return 12; }
252
void writeLong(uint8_t *buf) override;
253
void addSymbols(ThunkSection &isec) override;
254
};
255
256
class ThumbV4PILongBXThunk final : public ThumbThunk {
257
public:
258
ThumbV4PILongBXThunk(Symbol &dest, int64_t addend)
259
: ThumbThunk(dest, addend) {}
260
261
uint32_t sizeLong() override { return 16; }
262
void writeLong(uint8_t *buf) override;
263
void addSymbols(ThunkSection &isec) override;
264
};
265
266
class ThumbV4PILongThunk final : public ThumbThunk {
267
public:
268
ThumbV4PILongThunk(Symbol &dest, int64_t addend)
269
: ThumbThunk(dest, addend) {}
270
271
uint32_t sizeLong() override { return 20; }
272
void writeLong(uint8_t *buf) override;
273
void addSymbols(ThunkSection &isec) override;
274
};
275
276
class ARMV4ABSLongBXThunk final : public ARMThunk {
277
public:
278
ARMV4ABSLongBXThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {}
279
280
uint32_t sizeLong() override { return 12; }
281
void writeLong(uint8_t *buf) override;
282
void addSymbols(ThunkSection &isec) override;
283
};
284
285
class ThumbV4ABSLongBXThunk final : public ThumbThunk {
286
public:
287
ThumbV4ABSLongBXThunk(Symbol &dest, int64_t addend)
288
: ThumbThunk(dest, addend) {}
289
290
uint32_t sizeLong() override { return 12; }
291
void writeLong(uint8_t *buf) override;
292
void addSymbols(ThunkSection &isec) override;
293
};
294
295
class ThumbV4ABSLongThunk final : public ThumbThunk {
296
public:
297
ThumbV4ABSLongThunk(Symbol &dest, int64_t addend)
298
: ThumbThunk(dest, addend) {}
299
300
uint32_t sizeLong() override { return 16; }
301
void writeLong(uint8_t *buf) override;
302
void addSymbols(ThunkSection &isec) override;
303
};
304
305
// The AVR devices need thunks for R_AVR_LO8_LDI_GS/R_AVR_HI8_LDI_GS
306
// when their destination is out of range [0, 0x1ffff].
307
class AVRThunk : public Thunk {
308
public:
309
AVRThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {}
310
uint32_t size() override { return 4; }
311
void writeTo(uint8_t *buf) override;
312
void addSymbols(ThunkSection &isec) override;
313
};
314
315
// MIPS LA25 thunk
316
class MipsThunk final : public Thunk {
317
public:
318
MipsThunk(Symbol &dest) : Thunk(dest, 0) {}
319
320
uint32_t size() override { return 16; }
321
void writeTo(uint8_t *buf) override;
322
void addSymbols(ThunkSection &isec) override;
323
InputSection *getTargetInputSection() const override;
324
};
325
326
// microMIPS R2-R5 LA25 thunk
327
class MicroMipsThunk final : public Thunk {
328
public:
329
MicroMipsThunk(Symbol &dest) : Thunk(dest, 0) {}
330
331
uint32_t size() override { return 14; }
332
void writeTo(uint8_t *buf) override;
333
void addSymbols(ThunkSection &isec) override;
334
InputSection *getTargetInputSection() const override;
335
};
336
337
// microMIPS R6 LA25 thunk
338
class MicroMipsR6Thunk final : public Thunk {
339
public:
340
MicroMipsR6Thunk(Symbol &dest) : Thunk(dest, 0) {}
341
342
uint32_t size() override { return 12; }
343
void writeTo(uint8_t *buf) override;
344
void addSymbols(ThunkSection &isec) override;
345
InputSection *getTargetInputSection() const override;
346
};
347
348
class PPC32PltCallStub final : public Thunk {
349
public:
350
// For R_PPC_PLTREL24, Thunk::addend records the addend which will be used to
351
// decide the offsets in the call stub.
352
PPC32PltCallStub(const InputSection &isec, const Relocation &rel,
353
Symbol &dest)
354
: Thunk(dest, rel.addend), file(isec.file) {}
355
uint32_t size() override { return 16; }
356
void writeTo(uint8_t *buf) override;
357
void addSymbols(ThunkSection &isec) override;
358
bool isCompatibleWith(const InputSection &isec, const Relocation &rel) const override;
359
360
private:
361
// Records the call site of the call stub.
362
const InputFile *file;
363
};
364
365
class PPC32LongThunk final : public Thunk {
366
public:
367
PPC32LongThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {}
368
uint32_t size() override { return config->isPic ? 32 : 16; }
369
void writeTo(uint8_t *buf) override;
370
void addSymbols(ThunkSection &isec) override;
371
};
372
373
// PPC64 Plt call stubs.
374
// Any call site that needs to call through a plt entry needs a call stub in
375
// the .text section. The call stub is responsible for:
376
// 1) Saving the toc-pointer to the stack.
377
// 2) Loading the target functions address from the procedure linkage table into
378
// r12 for use by the target functions global entry point, and into the count
379
// register.
380
// 3) Transferring control to the target function through an indirect branch.
381
class PPC64PltCallStub final : public Thunk {
382
public:
383
PPC64PltCallStub(Symbol &dest) : Thunk(dest, 0) {}
384
uint32_t size() override { return 20; }
385
void writeTo(uint8_t *buf) override;
386
void addSymbols(ThunkSection &isec) override;
387
bool isCompatibleWith(const InputSection &isec,
388
const Relocation &rel) const override;
389
};
390
391
// PPC64 R2 Save Stub
392
// When the caller requires a valid R2 TOC pointer but the callee does not
393
// require a TOC pointer and the callee cannot guarantee that it doesn't
394
// clobber R2 then we need to save R2. This stub:
395
// 1) Saves the TOC pointer to the stack.
396
// 2) Tail calls the callee.
397
class PPC64R2SaveStub final : public Thunk {
398
public:
399
PPC64R2SaveStub(Symbol &dest, int64_t addend) : Thunk(dest, addend) {
400
alignment = 16;
401
}
402
403
// To prevent oscillations in layout when moving from short to long thunks
404
// we make sure that once a thunk has been set to long it cannot go back.
405
bool getMayUseShortThunk() {
406
if (!mayUseShortThunk)
407
return false;
408
if (!isInt<26>(computeOffset())) {
409
mayUseShortThunk = false;
410
return false;
411
}
412
return true;
413
}
414
uint32_t size() override { return getMayUseShortThunk() ? 8 : 32; }
415
void writeTo(uint8_t *buf) override;
416
void addSymbols(ThunkSection &isec) override;
417
bool isCompatibleWith(const InputSection &isec,
418
const Relocation &rel) const override;
419
420
private:
421
// Transitioning from long to short can create layout oscillations in
422
// certain corner cases which would prevent the layout from converging.
423
// This is similar to the handling for ARMThunk.
424
bool mayUseShortThunk = true;
425
int64_t computeOffset() const {
426
return destination.getVA() - (getThunkTargetSym()->getVA() + 4);
427
}
428
};
429
430
// PPC64 R12 Setup Stub
431
// When a caller that does not maintain TOC calls a target which may possibly
432
// use TOC (either non-preemptible with localentry>1 or preemptible), we need to
433
// set r12 to satisfy the requirement of the global entry point.
434
class PPC64R12SetupStub final : public Thunk {
435
public:
436
PPC64R12SetupStub(Symbol &dest, bool gotPlt)
437
: Thunk(dest, 0), gotPlt(gotPlt) {
438
alignment = 16;
439
}
440
uint32_t size() override { return 32; }
441
void writeTo(uint8_t *buf) override;
442
void addSymbols(ThunkSection &isec) override;
443
bool isCompatibleWith(const InputSection &isec,
444
const Relocation &rel) const override;
445
446
private:
447
bool gotPlt;
448
};
449
450
// A bl instruction uses a signed 24 bit offset, with an implicit 4 byte
451
// alignment. This gives a possible 26 bits of 'reach'. If the call offset is
452
// larger than that we need to emit a long-branch thunk. The target address
453
// of the callee is stored in a table to be accessed TOC-relative. Since the
454
// call must be local (a non-local call will have a PltCallStub instead) the
455
// table stores the address of the callee's local entry point. For
456
// position-independent code a corresponding relative dynamic relocation is
457
// used.
458
class PPC64LongBranchThunk : public Thunk {
459
public:
460
uint32_t size() override { return 32; }
461
void writeTo(uint8_t *buf) override;
462
void addSymbols(ThunkSection &isec) override;
463
bool isCompatibleWith(const InputSection &isec,
464
const Relocation &rel) const override;
465
466
protected:
467
PPC64LongBranchThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {}
468
};
469
470
class PPC64PILongBranchThunk final : public PPC64LongBranchThunk {
471
public:
472
PPC64PILongBranchThunk(Symbol &dest, int64_t addend)
473
: PPC64LongBranchThunk(dest, addend) {
474
assert(!dest.isPreemptible);
475
if (std::optional<uint32_t> index =
476
in.ppc64LongBranchTarget->addEntry(&dest, addend)) {
477
mainPart->relaDyn->addRelativeReloc(
478
target->relativeRel, *in.ppc64LongBranchTarget, *index * UINT64_C(8),
479
dest, addend + getPPC64GlobalEntryToLocalEntryOffset(dest.stOther),
480
target->symbolicRel, R_ABS);
481
}
482
}
483
};
484
485
class PPC64PDLongBranchThunk final : public PPC64LongBranchThunk {
486
public:
487
PPC64PDLongBranchThunk(Symbol &dest, int64_t addend)
488
: PPC64LongBranchThunk(dest, addend) {
489
in.ppc64LongBranchTarget->addEntry(&dest, addend);
490
}
491
};
492
493
} // end anonymous namespace
494
495
Defined *Thunk::addSymbol(StringRef name, uint8_t type, uint64_t value,
496
InputSectionBase &section) {
497
Defined *d = addSyntheticLocal(name, type, value, /*size=*/0, section);
498
syms.push_back(d);
499
return d;
500
}
501
502
void Thunk::setOffset(uint64_t newOffset) {
503
for (Defined *d : syms)
504
d->value = d->value - offset + newOffset;
505
offset = newOffset;
506
}
507
508
// AArch64 Thunk base class.
509
static uint64_t getAArch64ThunkDestVA(const Symbol &s, int64_t a) {
510
uint64_t v = s.isInPlt() ? s.getPltVA() : s.getVA(a);
511
return v;
512
}
513
514
bool AArch64Thunk::getMayUseShortThunk() {
515
if (!mayUseShortThunk)
516
return false;
517
uint64_t s = getAArch64ThunkDestVA(destination, addend);
518
uint64_t p = getThunkTargetSym()->getVA();
519
mayUseShortThunk = llvm::isInt<28>(s - p);
520
return mayUseShortThunk;
521
}
522
523
void AArch64Thunk::writeTo(uint8_t *buf) {
524
if (!getMayUseShortThunk()) {
525
writeLong(buf);
526
return;
527
}
528
uint64_t s = getAArch64ThunkDestVA(destination, addend);
529
uint64_t p = getThunkTargetSym()->getVA();
530
write32(buf, 0x14000000); // b S
531
target->relocateNoSym(buf, R_AARCH64_CALL26, s - p);
532
}
533
534
// AArch64 long range Thunks.
535
void AArch64ABSLongThunk::writeLong(uint8_t *buf) {
536
const uint8_t data[] = {
537
0x50, 0x00, 0x00, 0x58, // ldr x16, L0
538
0x00, 0x02, 0x1f, 0xd6, // br x16
539
0x00, 0x00, 0x00, 0x00, // L0: .xword S
540
0x00, 0x00, 0x00, 0x00,
541
};
542
uint64_t s = getAArch64ThunkDestVA(destination, addend);
543
memcpy(buf, data, sizeof(data));
544
target->relocateNoSym(buf + 8, R_AARCH64_ABS64, s);
545
}
546
547
void AArch64ABSLongThunk::addSymbols(ThunkSection &isec) {
548
addSymbol(saver().save("__AArch64AbsLongThunk_" + destination.getName()),
549
STT_FUNC, 0, isec);
550
addSymbol("$x", STT_NOTYPE, 0, isec);
551
if (!getMayUseShortThunk())
552
addSymbol("$d", STT_NOTYPE, 8, isec);
553
}
554
555
// This Thunk has a maximum range of 4Gb, this is sufficient for all programs
556
// using the small code model, including pc-relative ones. At time of writing
557
// clang and gcc do not support the large code model for position independent
558
// code so it is safe to use this for position independent thunks without
559
// worrying about the destination being more than 4Gb away.
560
void AArch64ADRPThunk::writeLong(uint8_t *buf) {
561
const uint8_t data[] = {
562
0x10, 0x00, 0x00, 0x90, // adrp x16, Dest R_AARCH64_ADR_PREL_PG_HI21(Dest)
563
0x10, 0x02, 0x00, 0x91, // add x16, x16, R_AARCH64_ADD_ABS_LO12_NC(Dest)
564
0x00, 0x02, 0x1f, 0xd6, // br x16
565
};
566
uint64_t s = getAArch64ThunkDestVA(destination, addend);
567
uint64_t p = getThunkTargetSym()->getVA();
568
memcpy(buf, data, sizeof(data));
569
target->relocateNoSym(buf, R_AARCH64_ADR_PREL_PG_HI21,
570
getAArch64Page(s) - getAArch64Page(p));
571
target->relocateNoSym(buf + 4, R_AARCH64_ADD_ABS_LO12_NC, s);
572
}
573
574
void AArch64ADRPThunk::addSymbols(ThunkSection &isec) {
575
addSymbol(saver().save("__AArch64ADRPThunk_" + destination.getName()),
576
STT_FUNC, 0, isec);
577
addSymbol("$x", STT_NOTYPE, 0, isec);
578
}
579
580
// ARM Target Thunks
581
static uint64_t getARMThunkDestVA(const Symbol &s) {
582
uint64_t v = s.isInPlt() ? s.getPltVA() : s.getVA();
583
return SignExtend64<32>(v);
584
}
585
586
// This function returns true if the target is not Thumb and is within 2^26, and
587
// it has not previously returned false (see comment for mayUseShortThunk).
588
bool ARMThunk::getMayUseShortThunk() {
589
if (!mayUseShortThunk)
590
return false;
591
uint64_t s = getARMThunkDestVA(destination);
592
if (s & 1) {
593
mayUseShortThunk = false;
594
return false;
595
}
596
uint64_t p = getThunkTargetSym()->getVA();
597
int64_t offset = s - p - 8;
598
mayUseShortThunk = llvm::isInt<26>(offset);
599
return mayUseShortThunk;
600
}
601
602
void ARMThunk::writeTo(uint8_t *buf) {
603
if (!getMayUseShortThunk()) {
604
writeLong(buf);
605
return;
606
}
607
608
uint64_t s = getARMThunkDestVA(destination);
609
uint64_t p = getThunkTargetSym()->getVA();
610
int64_t offset = s - p - 8;
611
write32(buf, 0xea000000); // b S
612
target->relocateNoSym(buf, R_ARM_JUMP24, offset);
613
}
614
615
bool ARMThunk::isCompatibleWith(const InputSection &isec,
616
const Relocation &rel) const {
617
// v4T does not have BLX, so also deny R_ARM_THM_CALL
618
if (!config->armHasBlx && rel.type == R_ARM_THM_CALL)
619
return false;
620
621
// Thumb branch relocations can't use BLX
622
return rel.type != R_ARM_THM_JUMP19 && rel.type != R_ARM_THM_JUMP24;
623
}
624
625
// This function returns true if:
626
// the target is Thumb
627
// && is within branch range
628
// && this function has not previously returned false
629
// (see comment for mayUseShortThunk)
630
// && the arch supports Thumb branch range extension.
631
bool ThumbThunk::getMayUseShortThunk() {
632
if (!mayUseShortThunk || !config->armJ1J2BranchEncoding)
633
return false;
634
uint64_t s = getARMThunkDestVA(destination);
635
if ((s & 1) == 0) {
636
mayUseShortThunk = false;
637
return false;
638
}
639
uint64_t p = getThunkTargetSym()->getVA() & ~1;
640
int64_t offset = s - p - 4;
641
mayUseShortThunk = llvm::isInt<25>(offset);
642
return mayUseShortThunk;
643
}
644
645
void ThumbThunk::writeTo(uint8_t *buf) {
646
if (!getMayUseShortThunk()) {
647
writeLong(buf);
648
return;
649
}
650
651
uint64_t s = getARMThunkDestVA(destination);
652
uint64_t p = getThunkTargetSym()->getVA();
653
int64_t offset = s - p - 4;
654
write16(buf + 0, 0xf000); // b.w S
655
write16(buf + 2, 0xb000);
656
target->relocateNoSym(buf, R_ARM_THM_JUMP24, offset);
657
}
658
659
bool ThumbThunk::isCompatibleWith(const InputSection &isec,
660
const Relocation &rel) const {
661
// v4T does not have BLX, so also deny R_ARM_CALL
662
if (!config->armHasBlx && rel.type == R_ARM_CALL)
663
return false;
664
665
// ARM branch relocations can't use BLX
666
return rel.type != R_ARM_JUMP24 && rel.type != R_ARM_PC24 && rel.type != R_ARM_PLT32;
667
}
668
669
void ARMV7ABSLongThunk::writeLong(uint8_t *buf) {
670
write32(buf + 0, 0xe300c000); // movw ip,:lower16:S
671
write32(buf + 4, 0xe340c000); // movt ip,:upper16:S
672
write32(buf + 8, 0xe12fff1c); // bx ip
673
uint64_t s = getARMThunkDestVA(destination);
674
target->relocateNoSym(buf, R_ARM_MOVW_ABS_NC, s);
675
target->relocateNoSym(buf + 4, R_ARM_MOVT_ABS, s);
676
}
677
678
void ARMV7ABSLongThunk::addSymbols(ThunkSection &isec) {
679
addSymbol(saver().save("__ARMv7ABSLongThunk_" + destination.getName()),
680
STT_FUNC, 0, isec);
681
addSymbol("$a", STT_NOTYPE, 0, isec);
682
}
683
684
void ThumbV7ABSLongThunk::writeLong(uint8_t *buf) {
685
write16(buf + 0, 0xf240); // movw ip, :lower16:S
686
write16(buf + 2, 0x0c00);
687
write16(buf + 4, 0xf2c0); // movt ip, :upper16:S
688
write16(buf + 6, 0x0c00);
689
write16(buf + 8, 0x4760); // bx ip
690
uint64_t s = getARMThunkDestVA(destination);
691
target->relocateNoSym(buf, R_ARM_THM_MOVW_ABS_NC, s);
692
target->relocateNoSym(buf + 4, R_ARM_THM_MOVT_ABS, s);
693
}
694
695
void ThumbV7ABSLongThunk::addSymbols(ThunkSection &isec) {
696
addSymbol(saver().save("__Thumbv7ABSLongThunk_" + destination.getName()),
697
STT_FUNC, 1, isec);
698
addSymbol("$t", STT_NOTYPE, 0, isec);
699
}
700
701
void ARMV7PILongThunk::writeLong(uint8_t *buf) {
702
write32(buf + 0, 0xe30fcff0); // P: movw ip,:lower16:S - (P + (L1-P) + 8)
703
write32(buf + 4, 0xe340c000); // movt ip,:upper16:S - (P + (L1-P) + 8)
704
write32(buf + 8, 0xe08cc00f); // L1: add ip, ip, pc
705
write32(buf + 12, 0xe12fff1c); // bx ip
706
uint64_t s = getARMThunkDestVA(destination);
707
uint64_t p = getThunkTargetSym()->getVA();
708
int64_t offset = s - p - 16;
709
target->relocateNoSym(buf, R_ARM_MOVW_PREL_NC, offset);
710
target->relocateNoSym(buf + 4, R_ARM_MOVT_PREL, offset);
711
}
712
713
void ARMV7PILongThunk::addSymbols(ThunkSection &isec) {
714
addSymbol(saver().save("__ARMV7PILongThunk_" + destination.getName()),
715
STT_FUNC, 0, isec);
716
addSymbol("$a", STT_NOTYPE, 0, isec);
717
}
718
719
void ThumbV7PILongThunk::writeLong(uint8_t *buf) {
720
write16(buf + 0, 0xf64f); // P: movw ip,:lower16:S - (P + (L1-P) + 4)
721
write16(buf + 2, 0x7cf4);
722
write16(buf + 4, 0xf2c0); // movt ip,:upper16:S - (P + (L1-P) + 4)
723
write16(buf + 6, 0x0c00);
724
write16(buf + 8, 0x44fc); // L1: add ip, pc
725
write16(buf + 10, 0x4760); // bx ip
726
uint64_t s = getARMThunkDestVA(destination);
727
uint64_t p = getThunkTargetSym()->getVA() & ~0x1;
728
int64_t offset = s - p - 12;
729
target->relocateNoSym(buf, R_ARM_THM_MOVW_PREL_NC, offset);
730
target->relocateNoSym(buf + 4, R_ARM_THM_MOVT_PREL, offset);
731
}
732
733
void ThumbV7PILongThunk::addSymbols(ThunkSection &isec) {
734
addSymbol(saver().save("__ThumbV7PILongThunk_" + destination.getName()),
735
STT_FUNC, 1, isec);
736
addSymbol("$t", STT_NOTYPE, 0, isec);
737
}
738
739
void ThumbV6MABSLongThunk::writeLong(uint8_t *buf) {
740
// Most Thumb instructions cannot access the high registers r8 - r15. As the
741
// only register we can corrupt is r12 we must instead spill a low register
742
// to the stack to use as a scratch register. We push r1 even though we
743
// don't need to get some space to use for the return address.
744
write16(buf + 0, 0xb403); // push {r0, r1} ; Obtain scratch registers
745
write16(buf + 2, 0x4801); // ldr r0, [pc, #4] ; L1
746
write16(buf + 4, 0x9001); // str r0, [sp, #4] ; SP + 4 = S
747
write16(buf + 6, 0xbd01); // pop {r0, pc} ; restore r0 and branch to dest
748
write32(buf + 8, 0x00000000); // L1: .word S
749
uint64_t s = getARMThunkDestVA(destination);
750
target->relocateNoSym(buf + 8, R_ARM_ABS32, s);
751
}
752
753
void ThumbV6MABSLongThunk::addSymbols(ThunkSection &isec) {
754
addSymbol(saver().save("__Thumbv6MABSLongThunk_" + destination.getName()),
755
STT_FUNC, 1, isec);
756
addSymbol("$t", STT_NOTYPE, 0, isec);
757
if (!getMayUseShortThunk())
758
addSymbol("$d", STT_NOTYPE, 8, isec);
759
}
760
761
void ThumbV6MABSXOLongThunk::writeLong(uint8_t *buf) {
762
// Most Thumb instructions cannot access the high registers r8 - r15. As the
763
// only register we can corrupt is r12 we must instead spill a low register
764
// to the stack to use as a scratch register. We push r1 even though we
765
// don't need to get some space to use for the return address.
766
write16(buf + 0, 0xb403); // push {r0, r1} ; Obtain scratch registers
767
write16(buf + 2, 0x2000); // movs r0, :upper8_15:S
768
write16(buf + 4, 0x0200); // lsls r0, r0, #8
769
write16(buf + 6, 0x3000); // adds r0, :upper0_7:S
770
write16(buf + 8, 0x0200); // lsls r0, r0, #8
771
write16(buf + 10, 0x3000); // adds r0, :lower8_15:S
772
write16(buf + 12, 0x0200); // lsls r0, r0, #8
773
write16(buf + 14, 0x3000); // adds r0, :lower0_7:S
774
write16(buf + 16, 0x9001); // str r0, [sp, #4] ; SP + 4 = S
775
write16(buf + 18, 0xbd01); // pop {r0, pc} ; restore r0 and branch to dest
776
uint64_t s = getARMThunkDestVA(destination);
777
target->relocateNoSym(buf + 2, R_ARM_THM_ALU_ABS_G3, s);
778
target->relocateNoSym(buf + 6, R_ARM_THM_ALU_ABS_G2_NC, s);
779
target->relocateNoSym(buf + 10, R_ARM_THM_ALU_ABS_G1_NC, s);
780
target->relocateNoSym(buf + 14, R_ARM_THM_ALU_ABS_G0_NC, s);
781
}
782
783
void ThumbV6MABSXOLongThunk::addSymbols(ThunkSection &isec) {
784
addSymbol(saver().save("__Thumbv6MABSXOLongThunk_" + destination.getName()),
785
STT_FUNC, 1, isec);
786
addSymbol("$t", STT_NOTYPE, 0, isec);
787
}
788
789
void ThumbV6MPILongThunk::writeLong(uint8_t *buf) {
790
// Most Thumb instructions cannot access the high registers r8 - r15. As the
791
// only register we can corrupt is ip (r12) we must instead spill a low
792
// register to the stack to use as a scratch register.
793
write16(buf + 0, 0xb401); // P: push {r0} ; Obtain scratch register
794
write16(buf + 2, 0x4802); // ldr r0, [pc, #8] ; L2
795
write16(buf + 4, 0x4684); // mov ip, r0 ; high to low register
796
write16(buf + 6, 0xbc01); // pop {r0} ; restore scratch register
797
write16(buf + 8, 0x44e7); // L1: add pc, ip ; transfer control
798
write16(buf + 10, 0x46c0); // nop ; pad to 4-byte boundary
799
write32(buf + 12, 0x00000000); // L2: .word S - (P + (L1 - P) + 4)
800
uint64_t s = getARMThunkDestVA(destination);
801
uint64_t p = getThunkTargetSym()->getVA() & ~0x1;
802
target->relocateNoSym(buf + 12, R_ARM_REL32, s - p - 12);
803
}
804
805
void ThumbV6MPILongThunk::addSymbols(ThunkSection &isec) {
806
addSymbol(saver().save("__Thumbv6MPILongThunk_" + destination.getName()),
807
STT_FUNC, 1, isec);
808
addSymbol("$t", STT_NOTYPE, 0, isec);
809
if (!getMayUseShortThunk())
810
addSymbol("$d", STT_NOTYPE, 12, isec);
811
}
812
813
void ARMV5LongLdrPcThunk::writeLong(uint8_t *buf) {
814
write32(buf + 0, 0xe51ff004); // ldr pc, [pc,#-4] ; L1
815
write32(buf + 4, 0x00000000); // L1: .word S
816
target->relocateNoSym(buf + 4, R_ARM_ABS32, getARMThunkDestVA(destination));
817
}
818
819
void ARMV5LongLdrPcThunk::addSymbols(ThunkSection &isec) {
820
addSymbol(saver().save("__ARMv5LongLdrPcThunk_" + destination.getName()),
821
STT_FUNC, 0, isec);
822
addSymbol("$a", STT_NOTYPE, 0, isec);
823
if (!getMayUseShortThunk())
824
addSymbol("$d", STT_NOTYPE, 4, isec);
825
}
826
827
void ARMV4ABSLongBXThunk::writeLong(uint8_t *buf) {
828
write32(buf + 0, 0xe59fc000); // ldr r12, [pc] ; L1
829
write32(buf + 4, 0xe12fff1c); // bx r12
830
write32(buf + 8, 0x00000000); // L1: .word S
831
target->relocateNoSym(buf + 8, R_ARM_ABS32, getARMThunkDestVA(destination));
832
}
833
834
void ARMV4ABSLongBXThunk::addSymbols(ThunkSection &isec) {
835
addSymbol(saver().save("__ARMv4ABSLongBXThunk_" + destination.getName()),
836
STT_FUNC, 0, isec);
837
addSymbol("$a", STT_NOTYPE, 0, isec);
838
if (!getMayUseShortThunk())
839
addSymbol("$d", STT_NOTYPE, 8, isec);
840
}
841
842
void ThumbV4ABSLongBXThunk::writeLong(uint8_t *buf) {
843
write16(buf + 0, 0x4778); // bx pc
844
write16(buf + 2, 0xe7fd); // b #-6 ; Arm recommended sequence to follow bx pc
845
write32(buf + 4, 0xe51ff004); // ldr pc, [pc, #-4] ; L1
846
write32(buf + 8, 0x00000000); // L1: .word S
847
target->relocateNoSym(buf + 8, R_ARM_ABS32, getARMThunkDestVA(destination));
848
}
849
850
void ThumbV4ABSLongBXThunk::addSymbols(ThunkSection &isec) {
851
addSymbol(saver().save("__Thumbv4ABSLongBXThunk_" + destination.getName()),
852
STT_FUNC, 1, isec);
853
addSymbol("$t", STT_NOTYPE, 0, isec);
854
addSymbol("$a", STT_NOTYPE, 4, isec);
855
if (!getMayUseShortThunk())
856
addSymbol("$d", STT_NOTYPE, 8, isec);
857
}
858
859
void ThumbV4ABSLongThunk::writeLong(uint8_t *buf) {
860
write16(buf + 0, 0x4778); // bx pc
861
write16(buf + 2, 0xe7fd); // b #-6 ; Arm recommended sequence to follow bx pc
862
write32(buf + 4, 0xe59fc000); // ldr r12, [pc] ; L1
863
write32(buf + 8, 0xe12fff1c); // bx r12
864
write32(buf + 12, 0x00000000); // L1: .word S
865
target->relocateNoSym(buf + 12, R_ARM_ABS32, getARMThunkDestVA(destination));
866
}
867
868
void ThumbV4ABSLongThunk::addSymbols(ThunkSection &isec) {
869
addSymbol(saver().save("__Thumbv4ABSLongThunk_" + destination.getName()),
870
STT_FUNC, 1, isec);
871
addSymbol("$t", STT_NOTYPE, 0, isec);
872
addSymbol("$a", STT_NOTYPE, 4, isec);
873
if (!getMayUseShortThunk())
874
addSymbol("$d", STT_NOTYPE, 12, isec);
875
}
876
877
void ARMV4PILongBXThunk::writeLong(uint8_t *buf) {
878
write32(buf + 0, 0xe59fc004); // P: ldr ip, [pc,#4] ; L2
879
write32(buf + 4, 0xe08fc00c); // L1: add ip, pc, ip
880
write32(buf + 8, 0xe12fff1c); // bx ip
881
write32(buf + 12, 0x00000000); // L2: .word S - (P + (L1 - P) + 8)
882
uint64_t s = getARMThunkDestVA(destination);
883
uint64_t p = getThunkTargetSym()->getVA() & ~0x1;
884
target->relocateNoSym(buf + 12, R_ARM_REL32, s - p - 12);
885
}
886
887
void ARMV4PILongBXThunk::addSymbols(ThunkSection &isec) {
888
addSymbol(saver().save("__ARMv4PILongBXThunk_" + destination.getName()),
889
STT_FUNC, 0, isec);
890
addSymbol("$a", STT_NOTYPE, 0, isec);
891
if (!getMayUseShortThunk())
892
addSymbol("$d", STT_NOTYPE, 12, isec);
893
}
894
895
void ARMV4PILongThunk::writeLong(uint8_t *buf) {
896
write32(buf + 0, 0xe59fc000); // P: ldr ip, [pc] ; L2
897
write32(buf + 4, 0xe08ff00c); // L1: add pc, pc, r12
898
write32(buf + 8, 0x00000000); // L2: .word S - (P + (L1 - P) + 8)
899
uint64_t s = getARMThunkDestVA(destination);
900
uint64_t p = getThunkTargetSym()->getVA() & ~0x1;
901
target->relocateNoSym(buf + 8, R_ARM_REL32, s - p - 12);
902
}
903
904
void ARMV4PILongThunk::addSymbols(ThunkSection &isec) {
905
addSymbol(saver().save("__ARMv4PILongThunk_" + destination.getName()),
906
STT_FUNC, 0, isec);
907
addSymbol("$a", STT_NOTYPE, 0, isec);
908
if (!getMayUseShortThunk())
909
addSymbol("$d", STT_NOTYPE, 8, isec);
910
}
911
912
void ThumbV4PILongBXThunk::writeLong(uint8_t *buf) {
913
write16(buf + 0, 0x4778); // P: bx pc
914
write16(buf + 2, 0xe7fd); // b #-6 ; Arm recommended sequence to follow bx pc
915
write32(buf + 4, 0xe59fc000); // ldr r12, [pc] ; L2
916
write32(buf + 8, 0xe08cf00f); // L1: add pc, r12, pc
917
write32(buf + 12, 0x00000000); // L2: .word S - (P + (L1 - P) + 8)
918
uint64_t s = getARMThunkDestVA(destination);
919
uint64_t p = getThunkTargetSym()->getVA() & ~0x1;
920
target->relocateNoSym(buf + 12, R_ARM_REL32, s - p - 16);
921
}
922
923
void ThumbV4PILongBXThunk::addSymbols(ThunkSection &isec) {
924
addSymbol(saver().save("__Thumbv4PILongBXThunk_" + destination.getName()),
925
STT_FUNC, 1, isec);
926
addSymbol("$t", STT_NOTYPE, 0, isec);
927
addSymbol("$a", STT_NOTYPE, 4, isec);
928
if (!getMayUseShortThunk())
929
addSymbol("$d", STT_NOTYPE, 12, isec);
930
}
931
932
void ThumbV4PILongThunk::writeLong(uint8_t *buf) {
933
write16(buf + 0, 0x4778); // P: bx pc
934
write16(buf + 2, 0xe7fd); // b #-6 ; Arm recommended sequence to follow bx pc
935
write32(buf + 4, 0xe59fc004); // ldr ip, [pc,#4] ; L2
936
write32(buf + 8, 0xe08fc00c); // L1: add ip, pc, ip
937
write32(buf + 12, 0xe12fff1c); // bx ip
938
write32(buf + 16, 0x00000000); // L2: .word S - (P + (L1 - P) + 8)
939
uint64_t s = getARMThunkDestVA(destination);
940
uint64_t p = getThunkTargetSym()->getVA() & ~0x1;
941
target->relocateNoSym(buf + 16, R_ARM_REL32, s - p - 16);
942
}
943
944
void ThumbV4PILongThunk::addSymbols(ThunkSection &isec) {
945
addSymbol(saver().save("__Thumbv4PILongThunk_" + destination.getName()),
946
STT_FUNC, 1, isec);
947
addSymbol("$t", STT_NOTYPE, 0, isec);
948
addSymbol("$a", STT_NOTYPE, 4, isec);
949
if (!getMayUseShortThunk())
950
addSymbol("$d", STT_NOTYPE, 16, isec);
951
}
952
953
// Use the long jump which covers a range up to 8MiB.
954
void AVRThunk::writeTo(uint8_t *buf) {
955
write32(buf, 0x940c); // jmp func
956
target->relocateNoSym(buf, R_AVR_CALL, destination.getVA());
957
}
958
959
void AVRThunk::addSymbols(ThunkSection &isec) {
960
addSymbol(saver().save("__AVRThunk_" + destination.getName()), STT_FUNC, 0,
961
isec);
962
}
963
964
// Write MIPS LA25 thunk code to call PIC function from the non-PIC one.
965
void MipsThunk::writeTo(uint8_t *buf) {
966
uint64_t s = destination.getVA();
967
write32(buf, 0x3c190000); // lui $25, %hi(func)
968
write32(buf + 4, 0x08000000 | (s >> 2)); // j func
969
write32(buf + 8, 0x27390000); // addiu $25, $25, %lo(func)
970
write32(buf + 12, 0x00000000); // nop
971
target->relocateNoSym(buf, R_MIPS_HI16, s);
972
target->relocateNoSym(buf + 8, R_MIPS_LO16, s);
973
}
974
975
void MipsThunk::addSymbols(ThunkSection &isec) {
976
addSymbol(saver().save("__LA25Thunk_" + destination.getName()), STT_FUNC, 0,
977
isec);
978
}
979
980
InputSection *MipsThunk::getTargetInputSection() const {
981
auto &dr = cast<Defined>(destination);
982
return dyn_cast<InputSection>(dr.section);
983
}
984
985
// Write microMIPS R2-R5 LA25 thunk code
986
// to call PIC function from the non-PIC one.
987
void MicroMipsThunk::writeTo(uint8_t *buf) {
988
uint64_t s = destination.getVA();
989
write16(buf, 0x41b9); // lui $25, %hi(func)
990
write16(buf + 4, 0xd400); // j func
991
write16(buf + 8, 0x3339); // addiu $25, $25, %lo(func)
992
write16(buf + 12, 0x0c00); // nop
993
target->relocateNoSym(buf, R_MICROMIPS_HI16, s);
994
target->relocateNoSym(buf + 4, R_MICROMIPS_26_S1, s);
995
target->relocateNoSym(buf + 8, R_MICROMIPS_LO16, s);
996
}
997
998
void MicroMipsThunk::addSymbols(ThunkSection &isec) {
999
Defined *d =
1000
addSymbol(saver().save("__microLA25Thunk_" + destination.getName()),
1001
STT_FUNC, 0, isec);
1002
d->stOther |= STO_MIPS_MICROMIPS;
1003
}
1004
1005
InputSection *MicroMipsThunk::getTargetInputSection() const {
1006
auto &dr = cast<Defined>(destination);
1007
return dyn_cast<InputSection>(dr.section);
1008
}
1009
1010
// Write microMIPS R6 LA25 thunk code
1011
// to call PIC function from the non-PIC one.
1012
void MicroMipsR6Thunk::writeTo(uint8_t *buf) {
1013
uint64_t s = destination.getVA();
1014
uint64_t p = getThunkTargetSym()->getVA();
1015
write16(buf, 0x1320); // lui $25, %hi(func)
1016
write16(buf + 4, 0x3339); // addiu $25, $25, %lo(func)
1017
write16(buf + 8, 0x9400); // bc func
1018
target->relocateNoSym(buf, R_MICROMIPS_HI16, s);
1019
target->relocateNoSym(buf + 4, R_MICROMIPS_LO16, s);
1020
target->relocateNoSym(buf + 8, R_MICROMIPS_PC26_S1, s - p - 12);
1021
}
1022
1023
void MicroMipsR6Thunk::addSymbols(ThunkSection &isec) {
1024
Defined *d =
1025
addSymbol(saver().save("__microLA25Thunk_" + destination.getName()),
1026
STT_FUNC, 0, isec);
1027
d->stOther |= STO_MIPS_MICROMIPS;
1028
}
1029
1030
InputSection *MicroMipsR6Thunk::getTargetInputSection() const {
1031
auto &dr = cast<Defined>(destination);
1032
return dyn_cast<InputSection>(dr.section);
1033
}
1034
1035
void elf::writePPC32PltCallStub(uint8_t *buf, uint64_t gotPltVA,
1036
const InputFile *file, int64_t addend) {
1037
if (!config->isPic) {
1038
write32(buf + 0, 0x3d600000 | (gotPltVA + 0x8000) >> 16); // lis r11,ha
1039
write32(buf + 4, 0x816b0000 | (uint16_t)gotPltVA); // lwz r11,l(r11)
1040
write32(buf + 8, 0x7d6903a6); // mtctr r11
1041
write32(buf + 12, 0x4e800420); // bctr
1042
return;
1043
}
1044
uint32_t offset;
1045
if (addend >= 0x8000) {
1046
// The stub loads an address relative to r30 (.got2+Addend). Addend is
1047
// almost always 0x8000. The address of .got2 is different in another object
1048
// file, so a stub cannot be shared.
1049
offset = gotPltVA -
1050
(in.ppc32Got2->getParent()->getVA() +
1051
(file->ppc32Got2 ? file->ppc32Got2->outSecOff : 0) + addend);
1052
} else {
1053
// The stub loads an address relative to _GLOBAL_OFFSET_TABLE_ (which is
1054
// currently the address of .got).
1055
offset = gotPltVA - in.got->getVA();
1056
}
1057
uint16_t ha = (offset + 0x8000) >> 16, l = (uint16_t)offset;
1058
if (ha == 0) {
1059
write32(buf + 0, 0x817e0000 | l); // lwz r11,l(r30)
1060
write32(buf + 4, 0x7d6903a6); // mtctr r11
1061
write32(buf + 8, 0x4e800420); // bctr
1062
write32(buf + 12, 0x60000000); // nop
1063
} else {
1064
write32(buf + 0, 0x3d7e0000 | ha); // addis r11,r30,ha
1065
write32(buf + 4, 0x816b0000 | l); // lwz r11,l(r11)
1066
write32(buf + 8, 0x7d6903a6); // mtctr r11
1067
write32(buf + 12, 0x4e800420); // bctr
1068
}
1069
}
1070
1071
void PPC32PltCallStub::writeTo(uint8_t *buf) {
1072
writePPC32PltCallStub(buf, destination.getGotPltVA(), file, addend);
1073
}
1074
1075
void PPC32PltCallStub::addSymbols(ThunkSection &isec) {
1076
std::string buf;
1077
raw_string_ostream os(buf);
1078
os << format_hex_no_prefix(addend, 8);
1079
if (!config->isPic)
1080
os << ".plt_call32.";
1081
else if (addend >= 0x8000)
1082
os << ".got2.plt_pic32.";
1083
else
1084
os << ".plt_pic32.";
1085
os << destination.getName();
1086
addSymbol(saver().save(os.str()), STT_FUNC, 0, isec);
1087
}
1088
1089
bool PPC32PltCallStub::isCompatibleWith(const InputSection &isec,
1090
const Relocation &rel) const {
1091
return !config->isPic || (isec.file == file && rel.addend == addend);
1092
}
1093
1094
void PPC32LongThunk::addSymbols(ThunkSection &isec) {
1095
addSymbol(saver().save("__LongThunk_" + destination.getName()), STT_FUNC, 0,
1096
isec);
1097
}
1098
1099
void PPC32LongThunk::writeTo(uint8_t *buf) {
1100
auto ha = [](uint32_t v) -> uint16_t { return (v + 0x8000) >> 16; };
1101
auto lo = [](uint32_t v) -> uint16_t { return v; };
1102
uint32_t d = destination.getVA(addend);
1103
if (config->isPic) {
1104
uint32_t off = d - (getThunkTargetSym()->getVA() + 8);
1105
write32(buf + 0, 0x7c0802a6); // mflr r12,0
1106
write32(buf + 4, 0x429f0005); // bcl r20,r31,.+4
1107
write32(buf + 8, 0x7d8802a6); // mtctr r12
1108
write32(buf + 12, 0x3d8c0000 | ha(off)); // addis r12,r12,off@ha
1109
write32(buf + 16, 0x398c0000 | lo(off)); // addi r12,r12,off@l
1110
write32(buf + 20, 0x7c0803a6); // mtlr r0
1111
buf += 24;
1112
} else {
1113
write32(buf + 0, 0x3d800000 | ha(d)); // lis r12,d@ha
1114
write32(buf + 4, 0x398c0000 | lo(d)); // addi r12,r12,d@l
1115
buf += 8;
1116
}
1117
write32(buf + 0, 0x7d8903a6); // mtctr r12
1118
write32(buf + 4, 0x4e800420); // bctr
1119
}
1120
1121
void elf::writePPC64LoadAndBranch(uint8_t *buf, int64_t offset) {
1122
uint16_t offHa = (offset + 0x8000) >> 16;
1123
uint16_t offLo = offset & 0xffff;
1124
1125
write32(buf + 0, 0x3d820000 | offHa); // addis r12, r2, OffHa
1126
write32(buf + 4, 0xe98c0000 | offLo); // ld r12, OffLo(r12)
1127
write32(buf + 8, 0x7d8903a6); // mtctr r12
1128
write32(buf + 12, 0x4e800420); // bctr
1129
}
1130
1131
void PPC64PltCallStub::writeTo(uint8_t *buf) {
1132
int64_t offset = destination.getGotPltVA() - getPPC64TocBase();
1133
// Save the TOC pointer to the save-slot reserved in the call frame.
1134
write32(buf + 0, 0xf8410018); // std r2,24(r1)
1135
writePPC64LoadAndBranch(buf + 4, offset);
1136
}
1137
1138
void PPC64PltCallStub::addSymbols(ThunkSection &isec) {
1139
Defined *s = addSymbol(saver().save("__plt_" + destination.getName()),
1140
STT_FUNC, 0, isec);
1141
s->setNeedsTocRestore(true);
1142
s->file = destination.file;
1143
}
1144
1145
bool PPC64PltCallStub::isCompatibleWith(const InputSection &isec,
1146
const Relocation &rel) const {
1147
return rel.type == R_PPC64_REL24 || rel.type == R_PPC64_REL14;
1148
}
1149
1150
void PPC64R2SaveStub::writeTo(uint8_t *buf) {
1151
const int64_t offset = computeOffset();
1152
write32(buf + 0, 0xf8410018); // std r2,24(r1)
1153
// The branch offset needs to fit in 26 bits.
1154
if (getMayUseShortThunk()) {
1155
write32(buf + 4, 0x48000000 | (offset & 0x03fffffc)); // b <offset>
1156
} else if (isInt<34>(offset)) {
1157
int nextInstOffset;
1158
uint64_t tocOffset = destination.getVA() - getPPC64TocBase();
1159
if (tocOffset >> 16 > 0) {
1160
const uint64_t addi = ADDI_R12_TO_R12_NO_DISP | (tocOffset & 0xffff);
1161
const uint64_t addis =
1162
ADDIS_R12_TO_R2_NO_DISP | ((tocOffset >> 16) & 0xffff);
1163
write32(buf + 4, addis); // addis r12, r2 , top of offset
1164
write32(buf + 8, addi); // addi r12, r12, bottom of offset
1165
nextInstOffset = 12;
1166
} else {
1167
const uint64_t addi = ADDI_R12_TO_R2_NO_DISP | (tocOffset & 0xffff);
1168
write32(buf + 4, addi); // addi r12, r2, offset
1169
nextInstOffset = 8;
1170
}
1171
write32(buf + nextInstOffset, MTCTR_R12); // mtctr r12
1172
write32(buf + nextInstOffset + 4, BCTR); // bctr
1173
} else {
1174
in.ppc64LongBranchTarget->addEntry(&destination, addend);
1175
const int64_t offsetFromTOC =
1176
in.ppc64LongBranchTarget->getEntryVA(&destination, addend) -
1177
getPPC64TocBase();
1178
writePPC64LoadAndBranch(buf + 4, offsetFromTOC);
1179
}
1180
}
1181
1182
void PPC64R2SaveStub::addSymbols(ThunkSection &isec) {
1183
Defined *s = addSymbol(saver().save("__toc_save_" + destination.getName()),
1184
STT_FUNC, 0, isec);
1185
s->setNeedsTocRestore(true);
1186
}
1187
1188
bool PPC64R2SaveStub::isCompatibleWith(const InputSection &isec,
1189
const Relocation &rel) const {
1190
return rel.type == R_PPC64_REL24 || rel.type == R_PPC64_REL14;
1191
}
1192
1193
void PPC64R12SetupStub::writeTo(uint8_t *buf) {
1194
int64_t offset = (gotPlt ? destination.getGotPltVA() : destination.getVA()) -
1195
getThunkTargetSym()->getVA();
1196
if (!isInt<34>(offset))
1197
reportRangeError(buf, offset, 34, destination, "R12 setup stub offset");
1198
1199
int nextInstOffset;
1200
if (config->power10Stubs) {
1201
const uint64_t imm = (((offset >> 16) & 0x3ffff) << 32) | (offset & 0xffff);
1202
// pld 12, func@plt@pcrel or paddi r12, 0, func@pcrel
1203
writePrefixedInstruction(
1204
buf, (gotPlt ? PLD_R12_NO_DISP : PADDI_R12_NO_DISP) | imm);
1205
nextInstOffset = 8;
1206
} else {
1207
uint32_t off = offset - 8;
1208
write32(buf + 0, 0x7d8802a6); // mflr 12
1209
write32(buf + 4, 0x429f0005); // bcl 20,31,.+4
1210
write32(buf + 8, 0x7d6802a6); // mflr 11
1211
write32(buf + 12, 0x7d8803a6); // mtlr 12
1212
write32(buf + 16,
1213
0x3d8b0000 | ((off + 0x8000) >> 16)); // addis 12,11,off@ha
1214
if (gotPlt)
1215
write32(buf + 20, 0xe98c0000 | (off & 0xffff)); // ld 12, off@l(12)
1216
else
1217
write32(buf + 20, 0x398c0000 | (off & 0xffff)); // addi 12,12,off@l
1218
nextInstOffset = 24;
1219
}
1220
write32(buf + nextInstOffset, MTCTR_R12); // mtctr r12
1221
write32(buf + nextInstOffset + 4, BCTR); // bctr
1222
}
1223
1224
void PPC64R12SetupStub::addSymbols(ThunkSection &isec) {
1225
addSymbol(saver().save((gotPlt ? "__plt_pcrel_" : "__gep_setup_") +
1226
destination.getName()),
1227
STT_FUNC, 0, isec);
1228
}
1229
1230
bool PPC64R12SetupStub::isCompatibleWith(const InputSection &isec,
1231
const Relocation &rel) const {
1232
return rel.type == R_PPC64_REL24_NOTOC;
1233
}
1234
1235
void PPC64LongBranchThunk::writeTo(uint8_t *buf) {
1236
int64_t offset = in.ppc64LongBranchTarget->getEntryVA(&destination, addend) -
1237
getPPC64TocBase();
1238
writePPC64LoadAndBranch(buf, offset);
1239
}
1240
1241
void PPC64LongBranchThunk::addSymbols(ThunkSection &isec) {
1242
addSymbol(saver().save("__long_branch_" + destination.getName()), STT_FUNC, 0,
1243
isec);
1244
}
1245
1246
bool PPC64LongBranchThunk::isCompatibleWith(const InputSection &isec,
1247
const Relocation &rel) const {
1248
return rel.type == R_PPC64_REL24 || rel.type == R_PPC64_REL14;
1249
}
1250
1251
Thunk::Thunk(Symbol &d, int64_t a) : destination(d), addend(a), offset(0) {
1252
destination.thunkAccessed = true;
1253
}
1254
1255
Thunk::~Thunk() = default;
1256
1257
static Thunk *addThunkAArch64(RelType type, Symbol &s, int64_t a) {
1258
if (type != R_AARCH64_CALL26 && type != R_AARCH64_JUMP26 &&
1259
type != R_AARCH64_PLT32)
1260
fatal("unrecognized relocation type");
1261
if (config->picThunk)
1262
return make<AArch64ADRPThunk>(s, a);
1263
return make<AArch64ABSLongThunk>(s, a);
1264
}
1265
1266
// Creates a thunk for long branches or Thumb-ARM interworking.
1267
// Arm Architectures v4t does not support Thumb2 technology, and does not
1268
// support BLX or LDR Arm/Thumb state switching. This means that
1269
// - MOVT and MOVW instructions cannot be used.
1270
// - We can't rewrite BL in place to BLX. We will need thunks.
1271
//
1272
// TODO: use B for short Thumb->Arm thunks instead of LDR (this doesn't work for
1273
// Arm->Thumb, as in Arm state no BX PC trick; it doesn't switch state).
1274
static Thunk *addThunkArmv4(RelType reloc, Symbol &s, int64_t a) {
1275
bool thumb_target = s.getVA(a) & 1;
1276
1277
switch (reloc) {
1278
case R_ARM_PC24:
1279
case R_ARM_PLT32:
1280
case R_ARM_JUMP24:
1281
case R_ARM_CALL:
1282
if (config->picThunk) {
1283
if (thumb_target)
1284
return make<ARMV4PILongBXThunk>(s, a);
1285
return make<ARMV4PILongThunk>(s, a);
1286
}
1287
if (thumb_target)
1288
return make<ARMV4ABSLongBXThunk>(s, a);
1289
return make<ARMV5LongLdrPcThunk>(s, a);
1290
case R_ARM_THM_CALL:
1291
if (config->picThunk) {
1292
if (thumb_target)
1293
return make<ThumbV4PILongThunk>(s, a);
1294
return make<ThumbV4PILongBXThunk>(s, a);
1295
}
1296
if (thumb_target)
1297
return make<ThumbV4ABSLongThunk>(s, a);
1298
return make<ThumbV4ABSLongBXThunk>(s, a);
1299
}
1300
fatal("relocation " + toString(reloc) + " to " + toString(s) +
1301
" not supported for Armv4 or Armv4T target");
1302
}
1303
1304
// Creates a thunk for Thumb-ARM interworking compatible with Armv5 and Armv6.
1305
// Arm Architectures v5 and v6 do not support Thumb2 technology. This means that
1306
// - MOVT and MOVW instructions cannot be used
1307
// - Only Thumb relocation that can generate a Thunk is a BL, this can always
1308
// be transformed into a BLX
1309
static Thunk *addThunkArmv5v6(RelType reloc, Symbol &s, int64_t a) {
1310
switch (reloc) {
1311
case R_ARM_PC24:
1312
case R_ARM_PLT32:
1313
case R_ARM_JUMP24:
1314
case R_ARM_CALL:
1315
case R_ARM_THM_CALL:
1316
if (config->picThunk)
1317
return make<ARMV4PILongBXThunk>(s, a);
1318
return make<ARMV5LongLdrPcThunk>(s, a);
1319
}
1320
fatal("relocation " + toString(reloc) + " to " + toString(s) +
1321
" not supported for Armv5 or Armv6 targets");
1322
}
1323
1324
// Create a thunk for Thumb long branch on V6-M.
1325
// Arm Architecture v6-M only supports Thumb instructions. This means
1326
// - MOVT and MOVW instructions cannot be used.
1327
// - Only a limited number of instructions can access registers r8 and above
1328
// - No interworking support is needed (all Thumb).
1329
static Thunk *addThunkV6M(const InputSection &isec, RelType reloc, Symbol &s,
1330
int64_t a) {
1331
const bool isPureCode = isec.getParent()->flags & SHF_ARM_PURECODE;
1332
switch (reloc) {
1333
case R_ARM_THM_JUMP19:
1334
case R_ARM_THM_JUMP24:
1335
case R_ARM_THM_CALL:
1336
if (config->isPic) {
1337
if (!isPureCode)
1338
return make<ThumbV6MPILongThunk>(s, a);
1339
1340
fatal("relocation " + toString(reloc) + " to " + toString(s) +
1341
" not supported for Armv6-M targets for position independent"
1342
" and execute only code");
1343
}
1344
if (isPureCode)
1345
return make<ThumbV6MABSXOLongThunk>(s, a);
1346
return make<ThumbV6MABSLongThunk>(s, a);
1347
}
1348
fatal("relocation " + toString(reloc) + " to " + toString(s) +
1349
" not supported for Armv6-M targets");
1350
}
1351
1352
// Creates a thunk for Thumb-ARM interworking or branch range extension.
1353
static Thunk *addThunkArm(const InputSection &isec, RelType reloc, Symbol &s,
1354
int64_t a) {
1355
// Decide which Thunk is needed based on:
1356
// Available instruction set
1357
// - An Arm Thunk can only be used if Arm state is available.
1358
// - A Thumb Thunk can only be used if Thumb state is available.
1359
// - Can only use a Thunk if it uses instructions that the Target supports.
1360
// Relocation is branch or branch and link
1361
// - Branch instructions cannot change state, can only select Thunk that
1362
// starts in the same state as the caller.
1363
// - Branch and link relocations can change state, can select Thunks from
1364
// either Arm or Thumb.
1365
// Position independent Thunks if we require position independent code.
1366
// Execute Only Thunks if the output section is execute only code.
1367
1368
// Handle architectures that have restrictions on the instructions that they
1369
// can use in Thunks. The flags below are set by reading the BuildAttributes
1370
// of the input objects. InputFiles.cpp contains the mapping from ARM
1371
// architecture to flag.
1372
if (!config->armHasMovtMovw) {
1373
if (config->armJ1J2BranchEncoding)
1374
return addThunkV6M(isec, reloc, s, a);
1375
if (config->armHasBlx)
1376
return addThunkArmv5v6(reloc, s, a);
1377
return addThunkArmv4(reloc, s, a);
1378
}
1379
1380
switch (reloc) {
1381
case R_ARM_PC24:
1382
case R_ARM_PLT32:
1383
case R_ARM_JUMP24:
1384
case R_ARM_CALL:
1385
if (config->picThunk)
1386
return make<ARMV7PILongThunk>(s, a);
1387
return make<ARMV7ABSLongThunk>(s, a);
1388
case R_ARM_THM_JUMP19:
1389
case R_ARM_THM_JUMP24:
1390
case R_ARM_THM_CALL:
1391
if (config->picThunk)
1392
return make<ThumbV7PILongThunk>(s, a);
1393
return make<ThumbV7ABSLongThunk>(s, a);
1394
}
1395
fatal("unrecognized relocation type");
1396
}
1397
1398
static Thunk *addThunkAVR(RelType type, Symbol &s, int64_t a) {
1399
switch (type) {
1400
case R_AVR_LO8_LDI_GS:
1401
case R_AVR_HI8_LDI_GS:
1402
return make<AVRThunk>(s, a);
1403
default:
1404
fatal("unrecognized relocation type " + toString(type));
1405
}
1406
}
1407
1408
static Thunk *addThunkMips(RelType type, Symbol &s) {
1409
if ((s.stOther & STO_MIPS_MICROMIPS) && isMipsR6())
1410
return make<MicroMipsR6Thunk>(s);
1411
if (s.stOther & STO_MIPS_MICROMIPS)
1412
return make<MicroMipsThunk>(s);
1413
return make<MipsThunk>(s);
1414
}
1415
1416
static Thunk *addThunkPPC32(const InputSection &isec, const Relocation &rel,
1417
Symbol &s) {
1418
assert((rel.type == R_PPC_LOCAL24PC || rel.type == R_PPC_REL24 ||
1419
rel.type == R_PPC_PLTREL24) &&
1420
"unexpected relocation type for thunk");
1421
if (s.isInPlt())
1422
return make<PPC32PltCallStub>(isec, rel, s);
1423
return make<PPC32LongThunk>(s, rel.addend);
1424
}
1425
1426
static Thunk *addThunkPPC64(RelType type, Symbol &s, int64_t a) {
1427
assert((type == R_PPC64_REL14 || type == R_PPC64_REL24 ||
1428
type == R_PPC64_REL24_NOTOC) &&
1429
"unexpected relocation type for thunk");
1430
1431
// If we are emitting stubs for NOTOC relocations, we need to tell
1432
// the PLT resolver that there can be multiple TOCs.
1433
if (type == R_PPC64_REL24_NOTOC)
1434
getPPC64TargetInfo()->ppc64DynamicSectionOpt = 0x2;
1435
1436
if (s.isInPlt())
1437
return type == R_PPC64_REL24_NOTOC
1438
? (Thunk *)make<PPC64R12SetupStub>(s, /*gotPlt=*/true)
1439
: (Thunk *)make<PPC64PltCallStub>(s);
1440
1441
// This check looks at the st_other bits of the callee. If the value is 1
1442
// then the callee clobbers the TOC and we need an R2 save stub when RelType
1443
// is R_PPC64_REL14 or R_PPC64_REL24.
1444
if ((type == R_PPC64_REL14 || type == R_PPC64_REL24) && (s.stOther >> 5) == 1)
1445
return make<PPC64R2SaveStub>(s, a);
1446
1447
if (type == R_PPC64_REL24_NOTOC)
1448
return make<PPC64R12SetupStub>(s, /*gotPlt=*/false);
1449
1450
if (config->picThunk)
1451
return make<PPC64PILongBranchThunk>(s, a);
1452
1453
return make<PPC64PDLongBranchThunk>(s, a);
1454
}
1455
1456
Thunk *elf::addThunk(const InputSection &isec, Relocation &rel) {
1457
Symbol &s = *rel.sym;
1458
int64_t a = rel.addend;
1459
1460
switch (config->emachine) {
1461
case EM_AARCH64:
1462
return addThunkAArch64(rel.type, s, a);
1463
case EM_ARM:
1464
return addThunkArm(isec, rel.type, s, a);
1465
case EM_AVR:
1466
return addThunkAVR(rel.type, s, a);
1467
case EM_MIPS:
1468
return addThunkMips(rel.type, s);
1469
case EM_PPC:
1470
return addThunkPPC32(isec, rel, s);
1471
case EM_PPC64:
1472
return addThunkPPC64(rel.type, s, a);
1473
default:
1474
llvm_unreachable("add Thunk only supported for ARM, AVR, Mips and PowerPC");
1475
}
1476
}
1477
1478