Path: blob/main/contrib/llvm-project/llvm/lib/ExecutionEngine/Orc/OrcABISupport.cpp
35269 views
//===------------- OrcABISupport.cpp - ABI specific support code ----------===//1//2// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.3// See https://llvm.org/LICENSE.txt for license information.4// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception5//6//===----------------------------------------------------------------------===//78#include "llvm/ExecutionEngine/Orc/OrcABISupport.h"9#include "llvm/Support/FormatVariadic.h"10#include "llvm/Support/Process.h"11#include "llvm/Support/raw_ostream.h"1213#define DEBUG_TYPE "orc"1415using namespace llvm;16using namespace llvm::orc;1718template <typename ORCABI>19static bool stubAndPointerRangesOk(ExecutorAddr StubBlockAddr,20ExecutorAddr PointerBlockAddr,21unsigned NumStubs) {22constexpr unsigned MaxDisp = ORCABI::StubToPointerMaxDisplacement;23ExecutorAddr FirstStub = StubBlockAddr;24ExecutorAddr LastStub = FirstStub + ((NumStubs - 1) * ORCABI::StubSize);25ExecutorAddr FirstPointer = PointerBlockAddr;26ExecutorAddr LastPointer = FirstPointer + ((NumStubs - 1) * ORCABI::StubSize);2728if (FirstStub < FirstPointer) {29if (LastStub >= FirstPointer)30return false; // Ranges overlap.31return (FirstPointer - FirstStub <= MaxDisp) &&32(LastPointer - LastStub <= MaxDisp); // out-of-range.33}3435if (LastPointer >= FirstStub)36return false; // Ranges overlap.3738return (FirstStub - FirstPointer <= MaxDisp) &&39(LastStub - LastPointer <= MaxDisp);40}4142namespace llvm {43namespace orc {4445void OrcAArch64::writeResolverCode(char *ResolverWorkingMem,46ExecutorAddr ResolverTargetAddress,47ExecutorAddr ReentryFnAddr,48ExecutorAddr ReentryCtxAddr) {4950const uint32_t ResolverCode[] = {51// resolver_entry:520xa9bf47fd, // 0x000: stp x29, x17, [sp, #-16]!530x910003fd, // 0x004: mov x29, sp540xa9bf73fb, // 0x008: stp x27, x28, [sp, #-16]!550xa9bf6bf9, // 0x00c: stp x25, x26, [sp, #-16]!560xa9bf63f7, // 0x010: stp x23, x24, [sp, #-16]!570xa9bf5bf5, // 0x014: stp x21, x22, [sp, #-16]!580xa9bf53f3, // 0x018: stp x19, x20, [sp, #-16]!590xa9bf3fee, // 0x01c: stp x14, x15, [sp, #-16]!600xa9bf37ec, // 0x020: stp x12, x13, [sp, #-16]!610xa9bf2fea, // 0x024: stp x10, x11, [sp, #-16]!620xa9bf27e8, // 0x028: stp x8, x9, [sp, #-16]!630xa9bf1fe6, // 0x02c: stp x6, x7, [sp, #-16]!640xa9bf17e4, // 0x030: stp x4, x5, [sp, #-16]!650xa9bf0fe2, // 0x034: stp x2, x3, [sp, #-16]!660xa9bf07e0, // 0x038: stp x0, x1, [sp, #-16]!670xadbf7ffe, // 0x03c: stp q30, q31, [sp, #-32]!680xadbf77fc, // 0x040: stp q28, q29, [sp, #-32]!690xadbf6ffa, // 0x044: stp q26, q27, [sp, #-32]!700xadbf67f8, // 0x048: stp q24, q25, [sp, #-32]!710xadbf5ff6, // 0x04c: stp q22, q23, [sp, #-32]!720xadbf57f4, // 0x050: stp q20, q21, [sp, #-32]!730xadbf4ff2, // 0x054: stp q18, q19, [sp, #-32]!740xadbf47f0, // 0x058: stp q16, q17, [sp, #-32]!750xadbf3fee, // 0x05c: stp q14, q15, [sp, #-32]!760xadbf37ec, // 0x060: stp q12, q13, [sp, #-32]!770xadbf2fea, // 0x064: stp q10, q11, [sp, #-32]!780xadbf27e8, // 0x068: stp q8, q9, [sp, #-32]!790xadbf1fe6, // 0x06c: stp q6, q7, [sp, #-32]!800xadbf17e4, // 0x070: stp q4, q5, [sp, #-32]!810xadbf0fe2, // 0x074: stp q2, q3, [sp, #-32]!820xadbf07e0, // 0x078: stp q0, q1, [sp, #-32]!830x580004e0, // 0x07c: ldr x0, Lreentry_ctx_ptr840xaa1e03e1, // 0x080: mov x1, x30850xd1003021, // 0x084: sub x1, x1, #12860x58000442, // 0x088: ldr x2, Lreentry_fn_ptr870xd63f0040, // 0x08c: blr x2880xaa0003f1, // 0x090: mov x17, x0890xacc107e0, // 0x094: ldp q0, q1, [sp], #32900xacc10fe2, // 0x098: ldp q2, q3, [sp], #32910xacc117e4, // 0x09c: ldp q4, q5, [sp], #32920xacc11fe6, // 0x0a0: ldp q6, q7, [sp], #32930xacc127e8, // 0x0a4: ldp q8, q9, [sp], #32940xacc12fea, // 0x0a8: ldp q10, q11, [sp], #32950xacc137ec, // 0x0ac: ldp q12, q13, [sp], #32960xacc13fee, // 0x0b0: ldp q14, q15, [sp], #32970xacc147f0, // 0x0b4: ldp q16, q17, [sp], #32980xacc14ff2, // 0x0b8: ldp q18, q19, [sp], #32990xacc157f4, // 0x0bc: ldp q20, q21, [sp], #321000xacc15ff6, // 0x0c0: ldp q22, q23, [sp], #321010xacc167f8, // 0x0c4: ldp q24, q25, [sp], #321020xacc16ffa, // 0x0c8: ldp q26, q27, [sp], #321030xacc177fc, // 0x0cc: ldp q28, q29, [sp], #321040xacc17ffe, // 0x0d0: ldp q30, q31, [sp], #321050xa8c107e0, // 0x0d4: ldp x0, x1, [sp], #161060xa8c10fe2, // 0x0d8: ldp x2, x3, [sp], #161070xa8c117e4, // 0x0dc: ldp x4, x5, [sp], #161080xa8c11fe6, // 0x0e0: ldp x6, x7, [sp], #161090xa8c127e8, // 0x0e4: ldp x8, x9, [sp], #161100xa8c12fea, // 0x0e8: ldp x10, x11, [sp], #161110xa8c137ec, // 0x0ec: ldp x12, x13, [sp], #161120xa8c13fee, // 0x0f0: ldp x14, x15, [sp], #161130xa8c153f3, // 0x0f4: ldp x19, x20, [sp], #161140xa8c15bf5, // 0x0f8: ldp x21, x22, [sp], #161150xa8c163f7, // 0x0fc: ldp x23, x24, [sp], #161160xa8c16bf9, // 0x100: ldp x25, x26, [sp], #161170xa8c173fb, // 0x104: ldp x27, x28, [sp], #161180xa8c17bfd, // 0x108: ldp x29, x30, [sp], #161190xd65f0220, // 0x10c: ret x171200x01234567, // 0x110: Lreentry_fn_ptr:1210xdeadbeef, // 0x114: .quad 01220x98765432, // 0x118: Lreentry_ctx_ptr:1230xcafef00d // 0x11c: .quad 0124};125126const unsigned ReentryFnAddrOffset = 0x110;127const unsigned ReentryCtxAddrOffset = 0x118;128129memcpy(ResolverWorkingMem, ResolverCode, sizeof(ResolverCode));130memcpy(ResolverWorkingMem + ReentryFnAddrOffset, &ReentryFnAddr,131sizeof(uint64_t));132memcpy(ResolverWorkingMem + ReentryCtxAddrOffset, &ReentryCtxAddr,133sizeof(uint64_t));134}135136void OrcAArch64::writeTrampolines(char *TrampolineBlockWorkingMem,137ExecutorAddr TrampolineBlockTargetAddress,138ExecutorAddr ResolverAddr,139unsigned NumTrampolines) {140141unsigned OffsetToPtr = alignTo(NumTrampolines * TrampolineSize, 8);142143memcpy(TrampolineBlockWorkingMem + OffsetToPtr, &ResolverAddr,144sizeof(uint64_t));145146// OffsetToPtr is actually the offset from the PC for the 2nd instruction, so147// subtract 32-bits.148OffsetToPtr -= 4;149150uint32_t *Trampolines =151reinterpret_cast<uint32_t *>(TrampolineBlockWorkingMem);152153for (unsigned I = 0; I < NumTrampolines; ++I, OffsetToPtr -= TrampolineSize) {154Trampolines[3 * I + 0] = 0xaa1e03f1; // mov x17, x30155Trampolines[3 * I + 1] = 0x58000010 | (OffsetToPtr << 3); // adr x16, Lptr156Trampolines[3 * I + 2] = 0xd63f0200; // blr x16157}158}159160void OrcAArch64::writeIndirectStubsBlock(161char *StubsBlockWorkingMem, ExecutorAddr StubsBlockTargetAddress,162ExecutorAddr PointersBlockTargetAddress, unsigned NumStubs) {163// Stub format is:164//165// .section __orc_stubs166// stub1:167// ldr x16, ptr1 ; PC-rel load of ptr1168// br x16 ; Jump to resolver169// stub2:170// ldr x16, ptr2 ; PC-rel load of ptr2171// br x16 ; Jump to resolver172//173// ...174//175// .section __orc_ptrs176// ptr1:177// .quad 0x0178// ptr2:179// .quad 0x0180//181// ...182183static_assert(StubSize == PointerSize,184"Pointer and stub size must match for algorithm below");185assert(stubAndPointerRangesOk<OrcAArch64>(186StubsBlockTargetAddress, PointersBlockTargetAddress, NumStubs) &&187"PointersBlock is out of range");188uint64_t PtrDisplacement =189PointersBlockTargetAddress - StubsBlockTargetAddress;190assert((PtrDisplacement % 8 == 0) &&191"Displacement to pointer is not a multiple of 8");192uint64_t *Stub = reinterpret_cast<uint64_t *>(StubsBlockWorkingMem);193uint64_t PtrOffsetField = ((PtrDisplacement >> 2) & 0x7ffff) << 5;194195for (unsigned I = 0; I < NumStubs; ++I)196Stub[I] = 0xd61f020058000010 | PtrOffsetField;197}198199void OrcX86_64_Base::writeTrampolines(char *TrampolineBlockWorkingMem,200ExecutorAddr TrampolineBlockTargetAddress,201ExecutorAddr ResolverAddr,202unsigned NumTrampolines) {203204unsigned OffsetToPtr = NumTrampolines * TrampolineSize;205206memcpy(TrampolineBlockWorkingMem + OffsetToPtr, &ResolverAddr,207sizeof(uint64_t));208209uint64_t *Trampolines =210reinterpret_cast<uint64_t *>(TrampolineBlockWorkingMem);211uint64_t CallIndirPCRel = 0xf1c40000000015ff;212213for (unsigned I = 0; I < NumTrampolines; ++I, OffsetToPtr -= TrampolineSize)214Trampolines[I] = CallIndirPCRel | ((OffsetToPtr - 6) << 16);215}216217void OrcX86_64_Base::writeIndirectStubsBlock(218char *StubsBlockWorkingMem, ExecutorAddr StubsBlockTargetAddress,219ExecutorAddr PointersBlockTargetAddress, unsigned NumStubs) {220// Stub format is:221//222// .section __orc_stubs223// stub1:224// jmpq *ptr1(%rip)225// .byte 0xC4 ; <- Invalid opcode padding.226// .byte 0xF1227// stub2:228// jmpq *ptr2(%rip)229//230// ...231//232// .section __orc_ptrs233// ptr1:234// .quad 0x0235// ptr2:236// .quad 0x0237//238// ...239240// Populate the stubs page stubs and mark it executable.241static_assert(StubSize == PointerSize,242"Pointer and stub size must match for algorithm below");243assert(stubAndPointerRangesOk<OrcX86_64_Base>(244StubsBlockTargetAddress, PointersBlockTargetAddress, NumStubs) &&245"PointersBlock is out of range");246uint64_t *Stub = reinterpret_cast<uint64_t *>(StubsBlockWorkingMem);247uint64_t PtrOffsetField =248(PointersBlockTargetAddress - StubsBlockTargetAddress - 6) << 16;249for (unsigned I = 0; I < NumStubs; ++I)250Stub[I] = 0xF1C40000000025ff | PtrOffsetField;251}252253void OrcX86_64_SysV::writeResolverCode(char *ResolverWorkingMem,254ExecutorAddr ResolverTargetAddress,255ExecutorAddr ReentryFnAddr,256ExecutorAddr ReentryCtxAddr) {257258LLVM_DEBUG({259dbgs() << "Writing resolver code to "260<< formatv("{0:x16}", ResolverTargetAddress) << "\n";261});262263const uint8_t ResolverCode[] = {264// resolver_entry:2650x55, // 0x00: pushq %rbp2660x48, 0x89, 0xe5, // 0x01: movq %rsp, %rbp2670x50, // 0x04: pushq %rax2680x53, // 0x05: pushq %rbx2690x51, // 0x06: pushq %rcx2700x52, // 0x07: pushq %rdx2710x56, // 0x08: pushq %rsi2720x57, // 0x09: pushq %rdi2730x41, 0x50, // 0x0a: pushq %r82740x41, 0x51, // 0x0c: pushq %r92750x41, 0x52, // 0x0e: pushq %r102760x41, 0x53, // 0x10: pushq %r112770x41, 0x54, // 0x12: pushq %r122780x41, 0x55, // 0x14: pushq %r132790x41, 0x56, // 0x16: pushq %r142800x41, 0x57, // 0x18: pushq %r152810x48, 0x81, 0xec, 0x08, 0x02, 0x00, 0x00, // 0x1a: subq 0x208, %rsp2820x48, 0x0f, 0xae, 0x04, 0x24, // 0x21: fxsave64 (%rsp)2830x48, 0xbf, // 0x26: movabsq <CBMgr>, %rdi284285// 0x28: JIT re-entry ctx addr.2860x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,2872880x48, 0x8b, 0x75, 0x08, // 0x30: movq 8(%rbp), %rsi2890x48, 0x83, 0xee, 0x06, // 0x34: subq $6, %rsi2900x48, 0xb8, // 0x38: movabsq <REntry>, %rax291292// 0x3a: JIT re-entry fn addr:2930x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,2942950xff, 0xd0, // 0x42: callq *%rax2960x48, 0x89, 0x45, 0x08, // 0x44: movq %rax, 8(%rbp)2970x48, 0x0f, 0xae, 0x0c, 0x24, // 0x48: fxrstor64 (%rsp)2980x48, 0x81, 0xc4, 0x08, 0x02, 0x00, 0x00, // 0x4d: addq 0x208, %rsp2990x41, 0x5f, // 0x54: popq %r153000x41, 0x5e, // 0x56: popq %r143010x41, 0x5d, // 0x58: popq %r133020x41, 0x5c, // 0x5a: popq %r123030x41, 0x5b, // 0x5c: popq %r113040x41, 0x5a, // 0x5e: popq %r103050x41, 0x59, // 0x60: popq %r93060x41, 0x58, // 0x62: popq %r83070x5f, // 0x64: popq %rdi3080x5e, // 0x65: popq %rsi3090x5a, // 0x66: popq %rdx3100x59, // 0x67: popq %rcx3110x5b, // 0x68: popq %rbx3120x58, // 0x69: popq %rax3130x5d, // 0x6a: popq %rbp3140xc3, // 0x6b: retq315};316317const unsigned ReentryFnAddrOffset = 0x3a;318const unsigned ReentryCtxAddrOffset = 0x28;319320memcpy(ResolverWorkingMem, ResolverCode, sizeof(ResolverCode));321memcpy(ResolverWorkingMem + ReentryFnAddrOffset, &ReentryFnAddr,322sizeof(uint64_t));323memcpy(ResolverWorkingMem + ReentryCtxAddrOffset, &ReentryCtxAddr,324sizeof(uint64_t));325}326327void OrcX86_64_Win32::writeResolverCode(char *ResolverWorkingMem,328ExecutorAddr ResolverTargetAddress,329ExecutorAddr ReentryFnAddr,330ExecutorAddr ReentryCtxAddr) {331332// resolverCode is similar to OrcX86_64 with differences specific to windows333// x64 calling convention: arguments go into rcx, rdx and come in reverse334// order, shadow space allocation on stack335const uint8_t ResolverCode[] = {336// resolver_entry:3370x55, // 0x00: pushq %rbp3380x48, 0x89, 0xe5, // 0x01: movq %rsp, %rbp3390x50, // 0x04: pushq %rax3400x53, // 0x05: pushq %rbx3410x51, // 0x06: pushq %rcx3420x52, // 0x07: pushq %rdx3430x56, // 0x08: pushq %rsi3440x57, // 0x09: pushq %rdi3450x41, 0x50, // 0x0a: pushq %r83460x41, 0x51, // 0x0c: pushq %r93470x41, 0x52, // 0x0e: pushq %r103480x41, 0x53, // 0x10: pushq %r113490x41, 0x54, // 0x12: pushq %r123500x41, 0x55, // 0x14: pushq %r133510x41, 0x56, // 0x16: pushq %r143520x41, 0x57, // 0x18: pushq %r153530x48, 0x81, 0xec, 0x08, 0x02, 0x00, 0x00, // 0x1a: subq 0x208, %rsp3540x48, 0x0f, 0xae, 0x04, 0x24, // 0x21: fxsave64 (%rsp)3553560x48, 0xb9, // 0x26: movabsq <CBMgr>, %rcx357// 0x28: JIT re-entry ctx addr.3580x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,3593600x48, 0x8B, 0x55, 0x08, // 0x30: mov rdx, [rbp+0x8]3610x48, 0x83, 0xea, 0x06, // 0x34: sub rdx, 0x63623630x48, 0xb8, // 0x38: movabsq <REntry>, %rax364// 0x3a: JIT re-entry fn addr:3650x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,366367// 0x42: sub rsp, 0x20 (Allocate shadow space)3680x48, 0x83, 0xEC, 0x20,3690xff, 0xd0, // 0x46: callq *%rax370371// 0x48: add rsp, 0x20 (Free shadow space)3720x48, 0x83, 0xC4, 0x20,3733740x48, 0x89, 0x45, 0x08, // 0x4C: movq %rax, 8(%rbp)3750x48, 0x0f, 0xae, 0x0c, 0x24, // 0x50: fxrstor64 (%rsp)3760x48, 0x81, 0xc4, 0x08, 0x02, 0x00, 0x00, // 0x55: addq 0x208, %rsp3770x41, 0x5f, // 0x5C: popq %r153780x41, 0x5e, // 0x5E: popq %r143790x41, 0x5d, // 0x60: popq %r133800x41, 0x5c, // 0x62: popq %r123810x41, 0x5b, // 0x64: popq %r113820x41, 0x5a, // 0x66: popq %r103830x41, 0x59, // 0x68: popq %r93840x41, 0x58, // 0x6a: popq %r83850x5f, // 0x6c: popq %rdi3860x5e, // 0x6d: popq %rsi3870x5a, // 0x6e: popq %rdx3880x59, // 0x6f: popq %rcx3890x5b, // 0x70: popq %rbx3900x58, // 0x71: popq %rax3910x5d, // 0x72: popq %rbp3920xc3, // 0x73: retq393};394395const unsigned ReentryFnAddrOffset = 0x3a;396const unsigned ReentryCtxAddrOffset = 0x28;397398memcpy(ResolverWorkingMem, ResolverCode, sizeof(ResolverCode));399memcpy(ResolverWorkingMem + ReentryFnAddrOffset, &ReentryFnAddr,400sizeof(uint64_t));401memcpy(ResolverWorkingMem + ReentryCtxAddrOffset, &ReentryCtxAddr,402sizeof(uint64_t));403}404405void OrcI386::writeResolverCode(char *ResolverWorkingMem,406ExecutorAddr ResolverTargetAddress,407ExecutorAddr ReentryFnAddr,408ExecutorAddr ReentryCtxAddr) {409410assert((ReentryFnAddr.getValue() >> 32) == 0 && "ReentryFnAddr out of range");411assert((ReentryCtxAddr.getValue() >> 32) == 0 &&412"ReentryCtxAddr out of range");413414const uint8_t ResolverCode[] = {415// resolver_entry:4160x55, // 0x00: pushl %ebp4170x89, 0xe5, // 0x01: movl %esp, %ebp4180x54, // 0x03: pushl %esp4190x83, 0xe4, 0xf0, // 0x04: andl $-0x10, %esp4200x50, // 0x07: pushl %eax4210x53, // 0x08: pushl %ebx4220x51, // 0x09: pushl %ecx4230x52, // 0x0a: pushl %edx4240x56, // 0x0b: pushl %esi4250x57, // 0x0c: pushl %edi4260x81, 0xec, 0x18, 0x02, 0x00, 0x00, // 0x0d: subl $0x218, %esp4270x0f, 0xae, 0x44, 0x24, 0x10, // 0x13: fxsave 0x10(%esp)4280x8b, 0x75, 0x04, // 0x18: movl 0x4(%ebp), %esi4290x83, 0xee, 0x05, // 0x1b: subl $0x5, %esi4300x89, 0x74, 0x24, 0x04, // 0x1e: movl %esi, 0x4(%esp)4310xc7, 0x04, 0x24, 0x00, 0x00, 0x00,4320x00, // 0x22: movl <cbmgr>, (%esp)4330xb8, 0x00, 0x00, 0x00, 0x00, // 0x29: movl <reentry>, %eax4340xff, 0xd0, // 0x2e: calll *%eax4350x89, 0x45, 0x04, // 0x30: movl %eax, 0x4(%ebp)4360x0f, 0xae, 0x4c, 0x24, 0x10, // 0x33: fxrstor 0x10(%esp)4370x81, 0xc4, 0x18, 0x02, 0x00, 0x00, // 0x38: addl $0x218, %esp4380x5f, // 0x3e: popl %edi4390x5e, // 0x3f: popl %esi4400x5a, // 0x40: popl %edx4410x59, // 0x41: popl %ecx4420x5b, // 0x42: popl %ebx4430x58, // 0x43: popl %eax4440x8b, 0x65, 0xfc, // 0x44: movl -0x4(%ebp), %esp4450x5d, // 0x48: popl %ebp4460xc3 // 0x49: retl447};448449const unsigned ReentryFnAddrOffset = 0x2a;450const unsigned ReentryCtxAddrOffset = 0x25;451452memcpy(ResolverWorkingMem, ResolverCode, sizeof(ResolverCode));453memcpy(ResolverWorkingMem + ReentryFnAddrOffset, &ReentryFnAddr,454sizeof(uint32_t));455memcpy(ResolverWorkingMem + ReentryCtxAddrOffset, &ReentryCtxAddr,456sizeof(uint32_t));457}458459void OrcI386::writeTrampolines(char *TrampolineWorkingMem,460ExecutorAddr TrampolineBlockTargetAddress,461ExecutorAddr ResolverAddr,462unsigned NumTrampolines) {463assert((ResolverAddr.getValue() >> 32) == 0 && "ResolverAddr out of range");464465uint64_t CallRelImm = 0xF1C4C400000000e8;466uint64_t ResolverRel = ResolverAddr - TrampolineBlockTargetAddress - 5;467468uint64_t *Trampolines = reinterpret_cast<uint64_t *>(TrampolineWorkingMem);469for (unsigned I = 0; I < NumTrampolines; ++I, ResolverRel -= TrampolineSize)470Trampolines[I] = CallRelImm | (ResolverRel << 8);471}472473void OrcI386::writeIndirectStubsBlock(char *StubsBlockWorkingMem,474ExecutorAddr StubsBlockTargetAddress,475ExecutorAddr PointersBlockTargetAddress,476unsigned NumStubs) {477assert((StubsBlockTargetAddress.getValue() >> 32) == 0 &&478"StubsBlockTargetAddress is out of range");479assert((PointersBlockTargetAddress.getValue() >> 32) == 0 &&480"PointersBlockTargetAddress is out of range");481482// Stub format is:483//484// .section __orc_stubs485// stub1:486// jmpq *ptr1487// .byte 0xC4 ; <- Invalid opcode padding.488// .byte 0xF1489// stub2:490// jmpq *ptr2491//492// ...493//494// .section __orc_ptrs495// ptr1:496// .quad 0x0497// ptr2:498// .quad 0x0499//500// ...501502assert(stubAndPointerRangesOk<OrcI386>(503StubsBlockTargetAddress, PointersBlockTargetAddress, NumStubs) &&504"PointersBlock is out of range");505506uint64_t *Stub = reinterpret_cast<uint64_t *>(StubsBlockWorkingMem);507uint64_t PtrAddr = PointersBlockTargetAddress.getValue();508for (unsigned I = 0; I < NumStubs; ++I, PtrAddr += 4)509Stub[I] = 0xF1C40000000025ff | (PtrAddr << 16);510}511512void OrcMips32_Base::writeResolverCode(char *ResolverWorkingMem,513ExecutorAddr ResolverTargetAddress,514ExecutorAddr ReentryFnAddr,515ExecutorAddr ReentryCtxAddr,516bool isBigEndian) {517518const uint32_t ResolverCode[] = {519// resolver_entry:5200x27bdff98, // 0x00: addiu $sp,$sp,-1045210xafa20000, // 0x04: sw $v0,0($sp)5220xafa30004, // 0x08: sw $v1,4($sp)5230xafa40008, // 0x0c: sw $a0,8($sp)5240xafa5000c, // 0x10: sw $a1,12($sp)5250xafa60010, // 0x14: sw $a2,16($sp)5260xafa70014, // 0x18: sw $a3,20($sp)5270xafb00018, // 0x1c: sw $s0,24($sp)5280xafb1001c, // 0x20: sw $s1,28($sp)5290xafb20020, // 0x24: sw $s2,32($sp)5300xafb30024, // 0x28: sw $s3,36($sp)5310xafb40028, // 0x2c: sw $s4,40($sp)5320xafb5002c, // 0x30: sw $s5,44($sp)5330xafb60030, // 0x34: sw $s6,48($sp)5340xafb70034, // 0x38: sw $s7,52($sp)5350xafa80038, // 0x3c: sw $t0,56($sp)5360xafa9003c, // 0x40: sw $t1,60($sp)5370xafaa0040, // 0x44: sw $t2,64($sp)5380xafab0044, // 0x48: sw $t3,68($sp)5390xafac0048, // 0x4c: sw $t4,72($sp)5400xafad004c, // 0x50: sw $t5,76($sp)5410xafae0050, // 0x54: sw $t6,80($sp)5420xafaf0054, // 0x58: sw $t7,84($sp)5430xafb80058, // 0x5c: sw $t8,88($sp)5440xafb9005c, // 0x60: sw $t9,92($sp)5450xafbe0060, // 0x64: sw $fp,96($sp)5460xafbf0064, // 0x68: sw $ra,100($sp)547548// JIT re-entry ctx addr.5490x00000000, // 0x6c: lui $a0,ctx5500x00000000, // 0x70: addiu $a0,$a0,ctx5515520x03e02825, // 0x74: move $a1, $ra5530x24a5ffec, // 0x78: addiu $a1,$a1,-20554555// JIT re-entry fn addr:5560x00000000, // 0x7c: lui $t9,reentry5570x00000000, // 0x80: addiu $t9,$t9,reentry5585590x0320f809, // 0x84: jalr $t95600x00000000, // 0x88: nop5610x8fbf0064, // 0x8c: lw $ra,100($sp)5620x8fbe0060, // 0x90: lw $fp,96($sp)5630x8fb9005c, // 0x94: lw $t9,92($sp)5640x8fb80058, // 0x98: lw $t8,88($sp)5650x8faf0054, // 0x9c: lw $t7,84($sp)5660x8fae0050, // 0xa0: lw $t6,80($sp)5670x8fad004c, // 0xa4: lw $t5,76($sp)5680x8fac0048, // 0xa8: lw $t4,72($sp)5690x8fab0044, // 0xac: lw $t3,68($sp)5700x8faa0040, // 0xb0: lw $t2,64($sp)5710x8fa9003c, // 0xb4: lw $t1,60($sp)5720x8fa80038, // 0xb8: lw $t0,56($sp)5730x8fb70034, // 0xbc: lw $s7,52($sp)5740x8fb60030, // 0xc0: lw $s6,48($sp)5750x8fb5002c, // 0xc4: lw $s5,44($sp)5760x8fb40028, // 0xc8: lw $s4,40($sp)5770x8fb30024, // 0xcc: lw $s3,36($sp)5780x8fb20020, // 0xd0: lw $s2,32($sp)5790x8fb1001c, // 0xd4: lw $s1,28($sp)5800x8fb00018, // 0xd8: lw $s0,24($sp)5810x8fa70014, // 0xdc: lw $a3,20($sp)5820x8fa60010, // 0xe0: lw $a2,16($sp)5830x8fa5000c, // 0xe4: lw $a1,12($sp)5840x8fa40008, // 0xe8: lw $a0,8($sp)5850x27bd0068, // 0xec: addiu $sp,$sp,1045860x0300f825, // 0xf0: move $ra, $t85870x03200008, // 0xf4: jr $t95880x00000000, // 0xf8: move $t9, $v0/v1589};590591const unsigned ReentryFnAddrOffset = 0x7c; // JIT re-entry fn addr lui592const unsigned ReentryCtxAddrOffset = 0x6c; // JIT re-entry context addr lui593const unsigned Offsett = 0xf8;594595memcpy(ResolverWorkingMem, ResolverCode, sizeof(ResolverCode));596597// Depending on endian return value will be in v0 or v1.598uint32_t MoveVxT9 = isBigEndian ? 0x0060c825 : 0x0040c825;599memcpy(ResolverWorkingMem + Offsett, &MoveVxT9, sizeof(MoveVxT9));600601uint32_t ReentryCtxLUi =6020x3c040000 | (((ReentryCtxAddr.getValue() + 0x8000) >> 16) & 0xFFFF);603uint32_t ReentryCtxADDiu = 0x24840000 | (ReentryCtxAddr.getValue() & 0xFFFF);604memcpy(ResolverWorkingMem + ReentryCtxAddrOffset, &ReentryCtxLUi,605sizeof(ReentryCtxLUi));606memcpy(ResolverWorkingMem + ReentryCtxAddrOffset + 4, &ReentryCtxADDiu,607sizeof(ReentryCtxADDiu));608609uint32_t ReentryFnLUi =6100x3c190000 | (((ReentryFnAddr.getValue() + 0x8000) >> 16) & 0xFFFF);611uint32_t ReentryFnADDiu = 0x27390000 | (ReentryFnAddr.getValue() & 0xFFFF);612memcpy(ResolverWorkingMem + ReentryFnAddrOffset, &ReentryFnLUi,613sizeof(ReentryFnLUi));614memcpy(ResolverWorkingMem + ReentryFnAddrOffset + 4, &ReentryFnADDiu,615sizeof(ReentryFnADDiu));616}617618void OrcMips32_Base::writeTrampolines(char *TrampolineBlockWorkingMem,619ExecutorAddr TrampolineBlockTargetAddress,620ExecutorAddr ResolverAddr,621unsigned NumTrampolines) {622623assert((ResolverAddr.getValue() >> 32) == 0 && "ResolverAddr out of range");624625uint32_t *Trampolines =626reinterpret_cast<uint32_t *>(TrampolineBlockWorkingMem);627uint32_t RHiAddr = ((ResolverAddr.getValue() + 0x8000) >> 16);628629for (unsigned I = 0; I < NumTrampolines; ++I) {630// move $t8,$ra631// lui $t9,ResolverAddr632// addiu $t9,$t9,ResolverAddr633// jalr $t9634// nop635Trampolines[5 * I + 0] = 0x03e0c025;636Trampolines[5 * I + 1] = 0x3c190000 | (RHiAddr & 0xFFFF);637Trampolines[5 * I + 2] = 0x27390000 | (ResolverAddr.getValue() & 0xFFFF);638Trampolines[5 * I + 3] = 0x0320f809;639Trampolines[5 * I + 4] = 0x00000000;640}641}642643void OrcMips32_Base::writeIndirectStubsBlock(644char *StubsBlockWorkingMem, ExecutorAddr StubsBlockTargetAddress,645ExecutorAddr PointersBlockTargetAddress, unsigned NumStubs) {646assert((StubsBlockTargetAddress.getValue() >> 32) == 0 &&647"InitialPtrVal is out of range");648649// Stub format is:650//651// .section __orc_stubs652// stub1:653// lui $t9, ptr1654// lw $t9, %lo(ptr1)($t9)655// jr $t9656// stub2:657// lui $t9, ptr2658// lw $t9,%lo(ptr1)($t9)659// jr $t9660//661// ...662//663// .section __orc_ptrs664// ptr1:665// .word 0x0666// ptr2:667// .word 0x0668//669// i..670671assert(stubAndPointerRangesOk<OrcMips32_Base>(672StubsBlockTargetAddress, PointersBlockTargetAddress, NumStubs) &&673"PointersBlock is out of range");674675// Populate the stubs page stubs and mark it executable.676uint32_t *Stub = reinterpret_cast<uint32_t *>(StubsBlockWorkingMem);677uint64_t PtrAddr = PointersBlockTargetAddress.getValue();678679for (unsigned I = 0; I < NumStubs; ++I) {680uint32_t HiAddr = ((PtrAddr + 0x8000) >> 16);681Stub[4 * I + 0] = 0x3c190000 | (HiAddr & 0xFFFF); // lui $t9,ptr1682Stub[4 * I + 1] = 0x8f390000 | (PtrAddr & 0xFFFF); // lw $t9,%lo(ptr1)($t9)683Stub[4 * I + 2] = 0x03200008; // jr $t9684Stub[4 * I + 3] = 0x00000000; // nop685PtrAddr += 4;686}687}688689void OrcMips64::writeResolverCode(char *ResolverWorkingMem,690ExecutorAddr ResolverTargetAddress,691ExecutorAddr ReentryFnAddr,692ExecutorAddr ReentryCtxAddr) {693694const uint32_t ResolverCode[] = {695//resolver_entry:6960x67bdff30, // 0x00: daddiu $sp,$sp,-2086970xffa20000, // 0x04: sd v0,0(sp)6980xffa30008, // 0x08: sd v1,8(sp)6990xffa40010, // 0x0c: sd a0,16(sp)7000xffa50018, // 0x10: sd a1,24(sp)7010xffa60020, // 0x14: sd a2,32(sp)7020xffa70028, // 0x18: sd a3,40(sp)7030xffa80030, // 0x1c: sd a4,48(sp)7040xffa90038, // 0x20: sd a5,56(sp)7050xffaa0040, // 0x24: sd a6,64(sp)7060xffab0048, // 0x28: sd a7,72(sp)7070xffac0050, // 0x2c: sd t0,80(sp)7080xffad0058, // 0x30: sd t1,88(sp)7090xffae0060, // 0x34: sd t2,96(sp)7100xffaf0068, // 0x38: sd t3,104(sp)7110xffb00070, // 0x3c: sd s0,112(sp)7120xffb10078, // 0x40: sd s1,120(sp)7130xffb20080, // 0x44: sd s2,128(sp)7140xffb30088, // 0x48: sd s3,136(sp)7150xffb40090, // 0x4c: sd s4,144(sp)7160xffb50098, // 0x50: sd s5,152(sp)7170xffb600a0, // 0x54: sd s6,160(sp)7180xffb700a8, // 0x58: sd s7,168(sp)7190xffb800b0, // 0x5c: sd t8,176(sp)7200xffb900b8, // 0x60: sd t9,184(sp)7210xffbe00c0, // 0x64: sd fp,192(sp)7220xffbf00c8, // 0x68: sd ra,200(sp)723724// JIT re-entry ctx addr.7250x00000000, // 0x6c: lui $a0,heighest(ctx)7260x00000000, // 0x70: daddiu $a0,$a0,heigher(ctx)7270x00000000, // 0x74: dsll $a0,$a0,167280x00000000, // 0x78: daddiu $a0,$a0,hi(ctx)7290x00000000, // 0x7c: dsll $a0,$a0,167300x00000000, // 0x80: daddiu $a0,$a0,lo(ctx)7317320x03e02825, // 0x84: move $a1, $ra7330x64a5ffdc, // 0x88: daddiu $a1,$a1,-36734735// JIT re-entry fn addr:7360x00000000, // 0x8c: lui $t9,reentry7370x00000000, // 0x90: daddiu $t9,$t9,reentry7380x00000000, // 0x94: dsll $t9,$t9,7390x00000000, // 0x98: daddiu $t9,$t9,7400x00000000, // 0x9c: dsll $t9,$t9,7410x00000000, // 0xa0: daddiu $t9,$t9,7420x0320f809, // 0xa4: jalr $t97430x00000000, // 0xa8: nop7440xdfbf00c8, // 0xac: ld ra, 200(sp)7450xdfbe00c0, // 0xb0: ld fp, 192(sp)7460xdfb900b8, // 0xb4: ld t9, 184(sp)7470xdfb800b0, // 0xb8: ld t8, 176(sp)7480xdfb700a8, // 0xbc: ld s7, 168(sp)7490xdfb600a0, // 0xc0: ld s6, 160(sp)7500xdfb50098, // 0xc4: ld s5, 152(sp)7510xdfb40090, // 0xc8: ld s4, 144(sp)7520xdfb30088, // 0xcc: ld s3, 136(sp)7530xdfb20080, // 0xd0: ld s2, 128(sp)7540xdfb10078, // 0xd4: ld s1, 120(sp)7550xdfb00070, // 0xd8: ld s0, 112(sp)7560xdfaf0068, // 0xdc: ld t3, 104(sp)7570xdfae0060, // 0xe0: ld t2, 96(sp)7580xdfad0058, // 0xe4: ld t1, 88(sp)7590xdfac0050, // 0xe8: ld t0, 80(sp)7600xdfab0048, // 0xec: ld a7, 72(sp)7610xdfaa0040, // 0xf0: ld a6, 64(sp)7620xdfa90038, // 0xf4: ld a5, 56(sp)7630xdfa80030, // 0xf8: ld a4, 48(sp)7640xdfa70028, // 0xfc: ld a3, 40(sp)7650xdfa60020, // 0x100: ld a2, 32(sp)7660xdfa50018, // 0x104: ld a1, 24(sp)7670xdfa40010, // 0x108: ld a0, 16(sp)7680xdfa30008, // 0x10c: ld v1, 8(sp)7690x67bd00d0, // 0x110: daddiu $sp,$sp,2087700x0300f825, // 0x114: move $ra, $t87710x03200008, // 0x118: jr $t97720x0040c825, // 0x11c: move $t9, $v0773};774775const unsigned ReentryFnAddrOffset = 0x8c; // JIT re-entry fn addr lui776const unsigned ReentryCtxAddrOffset = 0x6c; // JIT re-entry ctx addr lui777778memcpy(ResolverWorkingMem, ResolverCode, sizeof(ResolverCode));779780uint32_t ReentryCtxLUi =7810x3c040000 |782(((ReentryCtxAddr.getValue() + 0x800080008000) >> 48) & 0xFFFF);783uint32_t ReentryCtxDADDiu =7840x64840000 | (((ReentryCtxAddr.getValue() + 0x80008000) >> 32) & 0xFFFF);785uint32_t ReentryCtxDSLL = 0x00042438;786uint32_t ReentryCtxDADDiu2 =7870x64840000 | ((((ReentryCtxAddr.getValue() + 0x8000) >> 16) & 0xFFFF));788uint32_t ReentryCtxDSLL2 = 0x00042438;789uint32_t ReentryCtxDADDiu3 =7900x64840000 | (ReentryCtxAddr.getValue() & 0xFFFF);791792memcpy(ResolverWorkingMem + ReentryCtxAddrOffset, &ReentryCtxLUi,793sizeof(ReentryCtxLUi));794memcpy(ResolverWorkingMem + (ReentryCtxAddrOffset + 4), &ReentryCtxDADDiu,795sizeof(ReentryCtxDADDiu));796memcpy(ResolverWorkingMem + (ReentryCtxAddrOffset + 8), &ReentryCtxDSLL,797sizeof(ReentryCtxDSLL));798memcpy(ResolverWorkingMem + (ReentryCtxAddrOffset + 12), &ReentryCtxDADDiu2,799sizeof(ReentryCtxDADDiu2));800memcpy(ResolverWorkingMem + (ReentryCtxAddrOffset + 16), &ReentryCtxDSLL2,801sizeof(ReentryCtxDSLL2));802memcpy(ResolverWorkingMem + (ReentryCtxAddrOffset + 20), &ReentryCtxDADDiu3,803sizeof(ReentryCtxDADDiu3));804805uint32_t ReentryFnLUi =8060x3c190000 |807(((ReentryFnAddr.getValue() + 0x800080008000) >> 48) & 0xFFFF);808809uint32_t ReentryFnDADDiu =8100x67390000 | (((ReentryFnAddr.getValue() + 0x80008000) >> 32) & 0xFFFF);811812uint32_t ReentryFnDSLL = 0x0019cc38;813814uint32_t ReentryFnDADDiu2 =8150x67390000 | (((ReentryFnAddr.getValue() + 0x8000) >> 16) & 0xFFFF);816817uint32_t ReentryFnDSLL2 = 0x0019cc38;818819uint32_t ReentryFnDADDiu3 = 0x67390000 | (ReentryFnAddr.getValue() & 0xFFFF);820821memcpy(ResolverWorkingMem + ReentryFnAddrOffset, &ReentryFnLUi,822sizeof(ReentryFnLUi));823memcpy(ResolverWorkingMem + (ReentryFnAddrOffset + 4), &ReentryFnDADDiu,824sizeof(ReentryFnDADDiu));825memcpy(ResolverWorkingMem + (ReentryFnAddrOffset + 8), &ReentryFnDSLL,826sizeof(ReentryFnDSLL));827memcpy(ResolverWorkingMem + (ReentryFnAddrOffset + 12), &ReentryFnDADDiu2,828sizeof(ReentryFnDADDiu2));829memcpy(ResolverWorkingMem + (ReentryFnAddrOffset + 16), &ReentryFnDSLL2,830sizeof(ReentryFnDSLL2));831memcpy(ResolverWorkingMem + (ReentryFnAddrOffset + 20), &ReentryFnDADDiu3,832sizeof(ReentryFnDADDiu3));833}834835void OrcMips64::writeTrampolines(char *TrampolineBlockWorkingMem,836ExecutorAddr TrampolineBlockTargetAddress,837ExecutorAddr ResolverAddr,838unsigned NumTrampolines) {839840uint32_t *Trampolines =841reinterpret_cast<uint32_t *>(TrampolineBlockWorkingMem);842843uint64_t HeighestAddr = ((ResolverAddr.getValue() + 0x800080008000) >> 48);844uint64_t HeigherAddr = ((ResolverAddr.getValue() + 0x80008000) >> 32);845uint64_t HiAddr = ((ResolverAddr.getValue() + 0x8000) >> 16);846847for (unsigned I = 0; I < NumTrampolines; ++I) {848Trampolines[10 * I + 0] = 0x03e0c025; // move $t8,$ra849Trampolines[10 * I + 1] = 0x3c190000 | (HeighestAddr & 0xFFFF); // lui $t9,resolveAddr850Trampolines[10 * I + 2] = 0x67390000 | (HeigherAddr & 0xFFFF); // daddiu $t9,$t9,%higher(resolveAddr)851Trampolines[10 * I + 3] = 0x0019cc38; // dsll $t9,$t9,16852Trampolines[10 * I + 4] = 0x67390000 | (HiAddr & 0xFFFF); // daddiu $t9,$t9,%hi(ptr)853Trampolines[10 * I + 5] = 0x0019cc38; // dsll $t9,$t9,16854Trampolines[10 * I + 6] = 0x67390000 | (ResolverAddr.getValue() &8550xFFFF); // daddiu $t9,$t9,%lo(ptr)856Trampolines[10 * I + 7] = 0x0320f809; // jalr $t9857Trampolines[10 * I + 8] = 0x00000000; // nop858Trampolines[10 * I + 9] = 0x00000000; // nop859}860}861862void OrcMips64::writeIndirectStubsBlock(char *StubsBlockWorkingMem,863ExecutorAddr StubsBlockTargetAddress,864ExecutorAddr PointersBlockTargetAddress,865unsigned NumStubs) {866// Stub format is:867//868// .section __orc_stubs869// stub1:870// lui $t9,ptr1871// dsll $t9,$t9,16872// daddiu $t9,$t9,%hi(ptr)873// dsll $t9,$t9,16874// ld $t9,%lo(ptr)875// jr $t9876// stub2:877// lui $t9,ptr1878// dsll $t9,$t9,16879// daddiu $t9,$t9,%hi(ptr)880// dsll $t9,$t9,16881// ld $t9,%lo(ptr)882// jr $t9883//884// ...885//886// .section __orc_ptrs887// ptr1:888// .dword 0x0889// ptr2:890// .dword 0x0891//892// ...893894assert(stubAndPointerRangesOk<OrcMips64>(895StubsBlockTargetAddress, PointersBlockTargetAddress, NumStubs) &&896"PointersBlock is out of range");897898// Populate the stubs page stubs and mark it executable.899uint32_t *Stub = reinterpret_cast<uint32_t *>(StubsBlockWorkingMem);900uint64_t PtrAddr = PointersBlockTargetAddress.getValue();901902for (unsigned I = 0; I < NumStubs; ++I, PtrAddr += 8) {903uint64_t HeighestAddr = ((PtrAddr + 0x800080008000) >> 48);904uint64_t HeigherAddr = ((PtrAddr + 0x80008000) >> 32);905uint64_t HiAddr = ((PtrAddr + 0x8000) >> 16);906Stub[8 * I + 0] = 0x3c190000 | (HeighestAddr & 0xFFFF); // lui $t9,ptr1907Stub[8 * I + 1] = 0x67390000 | (HeigherAddr & 0xFFFF); // daddiu $t9,$t9,%higher(ptr)908Stub[8 * I + 2] = 0x0019cc38; // dsll $t9,$t9,16909Stub[8 * I + 3] = 0x67390000 | (HiAddr & 0xFFFF); // daddiu $t9,$t9,%hi(ptr)910Stub[8 * I + 4] = 0x0019cc38; // dsll $t9,$t9,16911Stub[8 * I + 5] = 0xdf390000 | (PtrAddr & 0xFFFF); // ld $t9,%lo(ptr)912Stub[8 * I + 6] = 0x03200008; // jr $t9913Stub[8 * I + 7] = 0x00000000; // nop914}915}916917void OrcRiscv64::writeResolverCode(char *ResolverWorkingMem,918ExecutorAddr ResolverTargetAddress,919ExecutorAddr ReentryFnAddr,920ExecutorAddr ReentryCtxAddr) {921922const uint32_t ResolverCode[] = {9230xef810113, // 0x00: addi sp,sp,-2649240x00813023, // 0x04: sd s0,0(sp)9250x00913423, // 0x08: sd s1,8(sp)9260x01213823, // 0x0c: sd s2,16(sp)9270x01313c23, // 0x10: sd s3,24(sp)9280x03413023, // 0x14: sd s4,32(sp)9290x03513423, // 0x18: sd s5,40(sp)9300x03613823, // 0x1c: sd s6,48(sp)9310x03713c23, // 0x20: sd s7,56(sp)9320x05813023, // 0x24: sd s8,64(sp)9330x05913423, // 0x28: sd s9,72(sp)9340x05a13823, // 0x2c: sd s10,80(sp)9350x05b13c23, // 0x30: sd s11,88(sp)9360x06113023, // 0x34: sd ra,96(sp)9370x06a13423, // 0x38: sd a0,104(sp)9380x06b13823, // 0x3c: sd a1,112(sp)9390x06c13c23, // 0x40: sd a2,120(sp)9400x08d13023, // 0x44: sd a3,128(sp)9410x08e13423, // 0x48: sd a4,136(sp)9420x08f13823, // 0x4c: sd a5,144(sp)9430x09013c23, // 0x50: sd a6,152(sp)9440x0b113023, // 0x54: sd a7,160(sp)9450x0a813427, // 0x58: fsd fs0,168(sp)9460x0a913827, // 0x5c: fsd fs1,176(sp)9470x0b213c27, // 0x60: fsd fs2,184(sp)9480x0d313027, // 0x64: fsd fs3,192(sp)9490x0d413427, // 0x68: fsd fs4,200(sp)9500x0d513827, // 0x6c: fsd fs5,208(sp)9510x0d613c27, // 0x70: fsd fs6,216(sp)9520x0f713027, // 0x74: fsd fs7,224(sp)9530x0f813427, // 0x78: fsd fs8,232(sp)9540x0f913827, // 0x7c: fsd fs9,240(sp)9550x0fa13c27, // 0x80: fsd fs10,248(sp)9560x11b13027, // 0x84: fsd fs11,256(sp)9570x00000517, // 0x88: auipc a0,0x09580x0b053503, // 0x8c: ld a0,176(a0) # 0x1389590x00030593, // 0x90: mv a1,t19600xff458593, // 0x94: addi a1,a1,-129610x00000617, // 0x98: auipc a2,0x09620x0a863603, // 0x9c: ld a2,168(a2) # 0x1409630x000600e7, // 0xa0: jalr a29640x00050293, // 0xa4: mv t0,a09650x00013403, // 0xa8: ld s0,0(sp)9660x00813483, // 0xac: ld s1,8(sp)9670x01013903, // 0xb0: ld s2,16(sp)9680x01813983, // 0xb4: ld s3,24(sp)9690x02013a03, // 0xb8: ld s4,32(sp)9700x02813a83, // 0xbc: ld s5,40(sp)9710x03013b03, // 0xc0: ld s6,48(sp)9720x03813b83, // 0xc4: ld s7,56(sp)9730x04013c03, // 0xc8: ld s8,64(sp)9740x04813c83, // 0xcc: ld s9,72(sp)9750x05013d03, // 0xd0: ld s10,80(sp)9760x05813d83, // 0xd4: ld s11,88(sp)9770x06013083, // 0xd8: ld ra,96(sp)9780x06813503, // 0xdc: ld a0,104(sp)9790x07013583, // 0xe0: ld a1,112(sp)9800x07813603, // 0xe4: ld a2,120(sp)9810x08013683, // 0xe8: ld a3,128(sp)9820x08813703, // 0xec: ld a4,136(sp)9830x09013783, // 0xf0: ld a5,144(sp)9840x09813803, // 0xf4: ld a6,152(sp)9850x0a013883, // 0xf8: ld a7,160(sp)9860x0a813407, // 0xfc: fld fs0,168(sp)9870x0b013487, // 0x100: fld fs1,176(sp)9880x0b813907, // 0x104: fld fs2,184(sp)9890x0c013987, // 0x108: fld fs3,192(sp)9900x0c813a07, // 0x10c: fld fs4,200(sp)9910x0d013a87, // 0x110: fld fs5,208(sp)9920x0d813b07, // 0x114: fld fs6,216(sp)9930x0e013b87, // 0x118: fld fs7,224(sp)9940x0e813c07, // 0x11c: fld fs8,232(sp)9950x0f013c87, // 0x120: fld fs9,240(sp)9960x0f813d07, // 0x124: fld fs10,248(sp)9970x10013d87, // 0x128: fld fs11,256(sp)9980x10810113, // 0x12c: addi sp,sp,2649990x00028067, // 0x130: jr t010000x12345678, // 0x134: padding to align at 8 byte10010x12345678, // 0x138: Lreentry_ctx_ptr:10020xdeadbeef, // 0x13c: .quad 010030x98765432, // 0x140: Lreentry_fn_ptr:10040xcafef00d // 0x144: .quad 01005};10061007const unsigned ReentryCtxAddrOffset = 0x138;1008const unsigned ReentryFnAddrOffset = 0x140;10091010memcpy(ResolverWorkingMem, ResolverCode, sizeof(ResolverCode));1011memcpy(ResolverWorkingMem + ReentryFnAddrOffset, &ReentryFnAddr,1012sizeof(uint64_t));1013memcpy(ResolverWorkingMem + ReentryCtxAddrOffset, &ReentryCtxAddr,1014sizeof(uint64_t));1015}10161017void OrcRiscv64::writeTrampolines(char *TrampolineBlockWorkingMem,1018ExecutorAddr TrampolineBlockTargetAddress,1019ExecutorAddr ResolverAddr,1020unsigned NumTrampolines) {10211022unsigned OffsetToPtr = alignTo(NumTrampolines * TrampolineSize, 8);10231024memcpy(TrampolineBlockWorkingMem + OffsetToPtr, &ResolverAddr,1025sizeof(uint64_t));10261027uint32_t *Trampolines =1028reinterpret_cast<uint32_t *>(TrampolineBlockWorkingMem);1029for (unsigned I = 0; I < NumTrampolines; ++I, OffsetToPtr -= TrampolineSize) {1030uint32_t Hi20 = (OffsetToPtr + 0x800) & 0xFFFFF000;1031uint32_t Lo12 = OffsetToPtr - Hi20;1032Trampolines[4 * I + 0] = 0x00000297 | Hi20; // auipc t0, %hi(Lptr)1033Trampolines[4 * I + 1] =10340x0002b283 | ((Lo12 & 0xFFF) << 20); // ld t0, %lo(Lptr)1035Trampolines[4 * I + 2] = 0x00028367; // jalr t1, t01036Trampolines[4 * I + 3] = 0xdeadface; // padding1037}1038}10391040void OrcRiscv64::writeIndirectStubsBlock(1041char *StubsBlockWorkingMem, ExecutorAddr StubsBlockTargetAddress,1042ExecutorAddr PointersBlockTargetAddress, unsigned NumStubs) {1043// Stub format is:1044//1045// .section __orc_stubs1046// stub1:1047// auipc t0, %hi(ptr1) ; PC-rel load of ptr11048// ld t0, %lo(t0)1049// jr t0 ; Jump to resolver1050// .quad 0 ; Pad to 16 bytes1051// stub2:1052// auipc t0, %hi(ptr1) ; PC-rel load of ptr11053// ld t0, %lo(t0)1054// jr t0 ; Jump to resolver1055// .quad 01056//1057// ...1058//1059// .section __orc_ptrs1060// ptr1:1061// .quad 0x01062// ptr2:1063// .quad 0x01064//1065// ...10661067assert(stubAndPointerRangesOk<OrcRiscv64>(1068StubsBlockTargetAddress, PointersBlockTargetAddress, NumStubs) &&1069"PointersBlock is out of range");10701071uint32_t *Stub = reinterpret_cast<uint32_t *>(StubsBlockWorkingMem);10721073for (unsigned I = 0; I < NumStubs; ++I) {1074uint64_t PtrDisplacement =1075PointersBlockTargetAddress - StubsBlockTargetAddress;1076uint32_t Hi20 = (PtrDisplacement + 0x800) & 0xFFFFF000;1077uint32_t Lo12 = PtrDisplacement - Hi20;1078Stub[4 * I + 0] = 0x00000297 | Hi20; // auipc t0, %hi(Lptr)1079Stub[4 * I + 1] = 0x0002b283 | ((Lo12 & 0xFFF) << 20); // ld t0, %lo(Lptr)1080Stub[4 * I + 2] = 0x00028067; // jr t01081Stub[4 * I + 3] = 0xfeedbeef; // padding1082PointersBlockTargetAddress += PointerSize;1083StubsBlockTargetAddress += StubSize;1084}1085}10861087void OrcLoongArch64::writeResolverCode(char *ResolverWorkingMem,1088ExecutorAddr ResolverTargetAddress,1089ExecutorAddr ReentryFnAddr,1090ExecutorAddr ReentryCtxAddr) {10911092LLVM_DEBUG({1093dbgs() << "Writing resolver code to "1094<< formatv("{0:x16}", ResolverTargetAddress) << "\n";1095});10961097const uint32_t ResolverCode[] = {10980x02fde063, // 0x0: addi.d $sp, $sp, -136(0xf78)10990x29c00061, // 0x4: st.d $ra, $sp, 011000x29c02064, // 0x8: st.d $a0, $sp, 8(0x8)11010x29c04065, // 0xc: st.d $a1, $sp, 16(0x10)11020x29c06066, // 0x10: st.d $a2, $sp, 24(0x18)11030x29c08067, // 0x14: st.d $a3, $sp, 32(0x20)11040x29c0a068, // 0x18: st.d $a4, $sp, 40(0x28)11050x29c0c069, // 0x1c: st.d $a5, $sp, 48(0x30)11060x29c0e06a, // 0x20: st.d $a6, $sp, 56(0x38)11070x29c1006b, // 0x24: st.d $a7, $sp, 64(0x40)11080x2bc12060, // 0x28: fst.d $fa0, $sp, 72(0x48)11090x2bc14061, // 0x2c: fst.d $fa1, $sp, 80(0x50)11100x2bc16062, // 0x30: fst.d $fa2, $sp, 88(0x58)11110x2bc18063, // 0x34: fst.d $fa3, $sp, 96(0x60)11120x2bc1a064, // 0x38: fst.d $fa4, $sp, 104(0x68)11130x2bc1c065, // 0x3c: fst.d $fa5, $sp, 112(0x70)11140x2bc1e066, // 0x40: fst.d $fa6, $sp, 120(0x78)11150x2bc20067, // 0x44: fst.d $fa7, $sp, 128(0x80)11160x1c000004, // 0x48: pcaddu12i $a0, 011170x28c1c084, // 0x4c: ld.d $a0, $a0, 112(0x70)11180x001501a5, // 0x50: move $a1, $t111190x02ffd0a5, // 0x54: addi.d $a1, $a1, -12(0xff4)11200x1c000006, // 0x58: pcaddu12i $a2, 011210x28c1a0c6, // 0x5c: ld.d $a2, $a2, 104(0x68)11220x4c0000c1, // 0x60: jirl $ra, $a2, 011230x0015008c, // 0x64: move $t0, $a011240x2b820067, // 0x68: fld.d $fa7, $sp, 128(0x80)11250x2b81e066, // 0x6c: fld.d $fa6, $sp, 120(0x78)11260x2b81c065, // 0x70: fld.d $fa5, $sp, 112(0x70)11270x2b81a064, // 0x74: fld.d $fa4, $sp, 104(0x68)11280x2b818063, // 0x78: fld.d $fa3, $sp, 96(0x60)11290x2b816062, // 0x7c: fld.d $fa2, $sp, 88(0x58)11300x2b814061, // 0x80: fld.d $fa1, $sp, 80(0x50)11310x2b812060, // 0x84: fld.d $fa0, $sp, 72(0x48)11320x28c1006b, // 0x88: ld.d $a7, $sp, 64(0x40)11330x28c0e06a, // 0x8c: ld.d $a6, $sp, 56(0x38)11340x28c0c069, // 0x90: ld.d $a5, $sp, 48(0x30)11350x28c0a068, // 0x94: ld.d $a4, $sp, 40(0x28)11360x28c08067, // 0x98: ld.d $a3, $sp, 32(0x20)11370x28c06066, // 0x9c: ld.d $a2, $sp, 24(0x18)11380x28c04065, // 0xa0: ld.d $a1, $sp, 16(0x10)11390x28c02064, // 0xa4: ld.d $a0, $sp, 8(0x8)11400x28c00061, // 0xa8: ld.d $ra, $sp, 011410x02c22063, // 0xac: addi.d $sp, $sp, 136(0x88)11420x4c000180, // 0xb0: jr $t011430x00000000, // 0xb4: padding to align at 8 bytes11440x01234567, // 0xb8: Lreentry_ctx_ptr:11450xdeedbeef, // 0xbc: .dword 011460x98765432, // 0xc0: Lreentry_fn_ptr:11470xcafef00d, // 0xc4: .dword 01148};11491150const unsigned ReentryCtxAddrOffset = 0xb8;1151const unsigned ReentryFnAddrOffset = 0xc0;11521153memcpy(ResolverWorkingMem, ResolverCode, sizeof(ResolverCode));1154memcpy(ResolverWorkingMem + ReentryFnAddrOffset, &ReentryFnAddr,1155sizeof(uint64_t));1156memcpy(ResolverWorkingMem + ReentryCtxAddrOffset, &ReentryCtxAddr,1157sizeof(uint64_t));1158}11591160void OrcLoongArch64::writeTrampolines(char *TrampolineBlockWorkingMem,1161ExecutorAddr TrampolineBlockTargetAddress,1162ExecutorAddr ResolverAddr,1163unsigned NumTrampolines) {11641165LLVM_DEBUG({1166dbgs() << "Writing trampoline code to "1167<< formatv("{0:x16}", TrampolineBlockTargetAddress) << "\n";1168});11691170unsigned OffsetToPtr = alignTo(NumTrampolines * TrampolineSize, 8);11711172memcpy(TrampolineBlockWorkingMem + OffsetToPtr, &ResolverAddr,1173sizeof(uint64_t));11741175uint32_t *Trampolines =1176reinterpret_cast<uint32_t *>(TrampolineBlockWorkingMem);1177for (unsigned I = 0; I < NumTrampolines; ++I, OffsetToPtr -= TrampolineSize) {1178uint32_t Hi20 = (OffsetToPtr + 0x800) & 0xfffff000;1179uint32_t Lo12 = OffsetToPtr - Hi20;1180Trampolines[4 * I + 0] =11810x1c00000c |1182(((Hi20 >> 12) & 0xfffff) << 5); // pcaddu12i $t0, %pc_hi20(Lptr)1183Trampolines[4 * I + 1] =11840x28c0018c | ((Lo12 & 0xfff) << 10); // ld.d $t0, $t0, %pc_lo12(Lptr)1185Trampolines[4 * I + 2] = 0x4c00018d; // jirl $t1, $t0, 01186Trampolines[4 * I + 3] = 0x0; // padding1187}1188}11891190void OrcLoongArch64::writeIndirectStubsBlock(1191char *StubsBlockWorkingMem, ExecutorAddr StubsBlockTargetAddress,1192ExecutorAddr PointersBlockTargetAddress, unsigned NumStubs) {1193// Stub format is:1194//1195// .section __orc_stubs1196// stub1:1197// pcaddu12i $t0, %pc_hi20(ptr1) ; PC-rel load of ptr11198// ld.d $t0, $t0, %pc_lo12(ptr1)1199// jr $t0 ; Jump to resolver1200// .dword 0 ; Pad to 16 bytes1201// stub2:1202// pcaddu12i $t0, %pc_hi20(ptr2) ; PC-rel load of ptr21203// ld.d $t0, $t0, %pc_lo12(ptr2)1204// jr $t0 ; Jump to resolver1205// .dword 0 ; Pad to 16 bytes1206// ...1207//1208// .section __orc_ptrs1209// ptr1:1210// .dword 0x01211// ptr2:1212// .dword 0x01213// ...1214LLVM_DEBUG({1215dbgs() << "Writing stubs code to "1216<< formatv("{0:x16}", StubsBlockTargetAddress) << "\n";1217});1218assert(stubAndPointerRangesOk<OrcLoongArch64>(1219StubsBlockTargetAddress, PointersBlockTargetAddress, NumStubs) &&1220"PointersBlock is out of range");12211222uint32_t *Stub = reinterpret_cast<uint32_t *>(StubsBlockWorkingMem);12231224for (unsigned I = 0; I < NumStubs; ++I) {1225uint64_t PtrDisplacement =1226PointersBlockTargetAddress - StubsBlockTargetAddress;1227uint32_t Hi20 = (PtrDisplacement + 0x800) & 0xfffff000;1228uint32_t Lo12 = PtrDisplacement - Hi20;1229Stub[4 * I + 0] = 0x1c00000c | (((Hi20 >> 12) & 0xfffff)1230<< 5); // pcaddu12i $t0, %pc_hi20(Lptr)1231Stub[4 * I + 1] =12320x28c0018c | ((Lo12 & 0xfff) << 10); // ld.d $t0, $t0, %pc_lo12(Lptr)1233Stub[4 * I + 2] = 0x4c000180; // jr $t01234Stub[4 * I + 3] = 0x0; // padding1235PointersBlockTargetAddress += PointerSize;1236StubsBlockTargetAddress += StubSize;1237}1238}12391240} // End namespace orc.1241} // End namespace llvm.124212431244