mirror of
https://github.com/RPCS3/llvm.git
synced 2025-05-18 19:36:36 +00:00

to reflect the new license. We understand that people may be surprised that we're moving the header entirely to discuss the new license. We checked this carefully with the Foundation's lawyer and we believe this is the correct approach. Essentially, all code in the project is now made available by the LLVM project under our new license, so you will see that the license headers include that license only. Some of our contributors have contributed code under our old license, and accordingly, we have retained a copy of our old license notice in the top-level files in each project and repository. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@351636 91177308-0d34-0410-b5e6-96231b3b80d8
984 lines
44 KiB
C++
984 lines
44 KiB
C++
//===------------- OrcABISupport.cpp - ABI specific support code ----------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "llvm/ExecutionEngine/Orc/OrcABISupport.h"
|
|
#include "llvm/Support/Process.h"
|
|
|
|
namespace llvm {
|
|
namespace orc {
|
|
|
|
void OrcAArch64::writeResolverCode(uint8_t *ResolverMem, JITReentryFn ReentryFn,
|
|
void *CallbackMgr) {
|
|
|
|
const uint32_t ResolverCode[] = {
|
|
// resolver_entry:
|
|
0xa9bf47fd, // 0x000: stp x29, x17, [sp, #-16]!
|
|
0x910003fd, // 0x004: mov x29, sp
|
|
0xa9bf73fb, // 0x008: stp x27, x28, [sp, #-16]!
|
|
0xa9bf6bf9, // 0x00c: stp x25, x26, [sp, #-16]!
|
|
0xa9bf63f7, // 0x010: stp x23, x24, [sp, #-16]!
|
|
0xa9bf5bf5, // 0x014: stp x21, x22, [sp, #-16]!
|
|
0xa9bf53f3, // 0x018: stp x19, x20, [sp, #-16]!
|
|
0xa9bf3fee, // 0x01c: stp x14, x15, [sp, #-16]!
|
|
0xa9bf37ec, // 0x020: stp x12, x13, [sp, #-16]!
|
|
0xa9bf2fea, // 0x024: stp x10, x11, [sp, #-16]!
|
|
0xa9bf27e8, // 0x028: stp x8, x9, [sp, #-16]!
|
|
0xa9bf1fe6, // 0x02c: stp x6, x7, [sp, #-16]!
|
|
0xa9bf17e4, // 0x030: stp x4, x5, [sp, #-16]!
|
|
0xa9bf0fe2, // 0x034: stp x2, x3, [sp, #-16]!
|
|
0xa9bf07e0, // 0x038: stp x0, x1, [sp, #-16]!
|
|
0xadbf7ffe, // 0x03c: stp q30, q31, [sp, #-32]!
|
|
0xadbf77fc, // 0x040: stp q28, q29, [sp, #-32]!
|
|
0xadbf6ffa, // 0x044: stp q26, q27, [sp, #-32]!
|
|
0xadbf67f8, // 0x048: stp q24, q25, [sp, #-32]!
|
|
0xadbf5ff6, // 0x04c: stp q22, q23, [sp, #-32]!
|
|
0xadbf57f4, // 0x050: stp q20, q21, [sp, #-32]!
|
|
0xadbf4ff2, // 0x054: stp q18, q19, [sp, #-32]!
|
|
0xadbf47f0, // 0x058: stp q16, q17, [sp, #-32]!
|
|
0xadbf3fee, // 0x05c: stp q14, q15, [sp, #-32]!
|
|
0xadbf37ec, // 0x060: stp q12, q13, [sp, #-32]!
|
|
0xadbf2fea, // 0x064: stp q10, q11, [sp, #-32]!
|
|
0xadbf27e8, // 0x068: stp q8, q9, [sp, #-32]!
|
|
0xadbf1fe6, // 0x06c: stp q6, q7, [sp, #-32]!
|
|
0xadbf17e4, // 0x070: stp q4, q5, [sp, #-32]!
|
|
0xadbf0fe2, // 0x074: stp q2, q3, [sp, #-32]!
|
|
0xadbf07e0, // 0x078: stp q0, q1, [sp, #-32]!
|
|
0x580004e0, // 0x07c: ldr x0, Lcallbackmgr
|
|
0xaa1e03e1, // 0x080: mov x1, x30
|
|
0xd1003021, // 0x084: sub x1, x1, #12
|
|
0x58000442, // 0x088: ldr x2, Lreentry_fn_ptr
|
|
0xd63f0040, // 0x08c: blr x2
|
|
0xaa0003f1, // 0x090: mov x17, x0
|
|
0xacc107e0, // 0x094: ldp q0, q1, [sp], #32
|
|
0xacc10fe2, // 0x098: ldp q2, q3, [sp], #32
|
|
0xacc117e4, // 0x09c: ldp q4, q5, [sp], #32
|
|
0xacc11fe6, // 0x0a0: ldp q6, q7, [sp], #32
|
|
0xacc127e8, // 0x0a4: ldp q8, q9, [sp], #32
|
|
0xacc12fea, // 0x0a8: ldp q10, q11, [sp], #32
|
|
0xacc137ec, // 0x0ac: ldp q12, q13, [sp], #32
|
|
0xacc13fee, // 0x0b0: ldp q14, q15, [sp], #32
|
|
0xacc147f0, // 0x0b4: ldp q16, q17, [sp], #32
|
|
0xacc14ff2, // 0x0b8: ldp q18, q19, [sp], #32
|
|
0xacc157f4, // 0x0bc: ldp q20, q21, [sp], #32
|
|
0xacc15ff6, // 0x0c0: ldp q22, q23, [sp], #32
|
|
0xacc167f8, // 0x0c4: ldp q24, q25, [sp], #32
|
|
0xacc16ffa, // 0x0c8: ldp q26, q27, [sp], #32
|
|
0xacc177fc, // 0x0cc: ldp q28, q29, [sp], #32
|
|
0xacc17ffe, // 0x0d0: ldp q30, q31, [sp], #32
|
|
0xa8c107e0, // 0x0d4: ldp x0, x1, [sp], #16
|
|
0xa8c10fe2, // 0x0d8: ldp x2, x3, [sp], #16
|
|
0xa8c117e4, // 0x0dc: ldp x4, x5, [sp], #16
|
|
0xa8c11fe6, // 0x0e0: ldp x6, x7, [sp], #16
|
|
0xa8c127e8, // 0x0e4: ldp x8, x9, [sp], #16
|
|
0xa8c12fea, // 0x0e8: ldp x10, x11, [sp], #16
|
|
0xa8c137ec, // 0x0ec: ldp x12, x13, [sp], #16
|
|
0xa8c13fee, // 0x0f0: ldp x14, x15, [sp], #16
|
|
0xa8c153f3, // 0x0f4: ldp x19, x20, [sp], #16
|
|
0xa8c15bf5, // 0x0f8: ldp x21, x22, [sp], #16
|
|
0xa8c163f7, // 0x0fc: ldp x23, x24, [sp], #16
|
|
0xa8c16bf9, // 0x100: ldp x25, x26, [sp], #16
|
|
0xa8c173fb, // 0x104: ldp x27, x28, [sp], #16
|
|
0xa8c17bfd, // 0x108: ldp x29, x30, [sp], #16
|
|
0xd65f0220, // 0x10c: ret x17
|
|
0x01234567, // 0x110: Lreentry_fn_ptr:
|
|
0xdeadbeef, // 0x114: .quad 0
|
|
0x98765432, // 0x118: Lcallbackmgr:
|
|
0xcafef00d // 0x11c: .quad 0
|
|
};
|
|
|
|
const unsigned ReentryFnAddrOffset = 0x110;
|
|
const unsigned CallbackMgrAddrOffset = 0x118;
|
|
|
|
memcpy(ResolverMem, ResolverCode, sizeof(ResolverCode));
|
|
memcpy(ResolverMem + ReentryFnAddrOffset, &ReentryFn, sizeof(ReentryFn));
|
|
memcpy(ResolverMem + CallbackMgrAddrOffset, &CallbackMgr,
|
|
sizeof(CallbackMgr));
|
|
}
|
|
|
|
void OrcAArch64::writeTrampolines(uint8_t *TrampolineMem, void *ResolverAddr,
|
|
unsigned NumTrampolines) {
|
|
|
|
unsigned OffsetToPtr = alignTo(NumTrampolines * TrampolineSize, 8);
|
|
|
|
memcpy(TrampolineMem + OffsetToPtr, &ResolverAddr, sizeof(void *));
|
|
|
|
// OffsetToPtr is actually the offset from the PC for the 2nd instruction, so
|
|
// subtract 32-bits.
|
|
OffsetToPtr -= 4;
|
|
|
|
uint32_t *Trampolines = reinterpret_cast<uint32_t *>(TrampolineMem);
|
|
|
|
for (unsigned I = 0; I < NumTrampolines; ++I, OffsetToPtr -= TrampolineSize) {
|
|
Trampolines[3 * I + 0] = 0xaa1e03f1; // mov x17, x30
|
|
Trampolines[3 * I + 1] = 0x58000010 | (OffsetToPtr << 3); // adr x16, Lptr
|
|
Trampolines[3 * I + 2] = 0xd63f0200; // blr x16
|
|
}
|
|
|
|
}
|
|
|
|
Error OrcAArch64::emitIndirectStubsBlock(IndirectStubsInfo &StubsInfo,
|
|
unsigned MinStubs,
|
|
void *InitialPtrVal) {
|
|
// Stub format is:
|
|
//
|
|
// .section __orc_stubs
|
|
// stub1:
|
|
// ldr x0, ptr1 ; PC-rel load of ptr1
|
|
// br x0 ; Jump to resolver
|
|
// stub2:
|
|
// ldr x0, ptr2 ; PC-rel load of ptr2
|
|
// br x0 ; Jump to resolver
|
|
//
|
|
// ...
|
|
//
|
|
// .section __orc_ptrs
|
|
// ptr1:
|
|
// .quad 0x0
|
|
// ptr2:
|
|
// .quad 0x0
|
|
//
|
|
// ...
|
|
|
|
const unsigned StubSize = IndirectStubsInfo::StubSize;
|
|
|
|
// Emit at least MinStubs, rounded up to fill the pages allocated.
|
|
unsigned PageSize = sys::Process::getPageSize();
|
|
unsigned NumPages = ((MinStubs * StubSize) + (PageSize - 1)) / PageSize;
|
|
unsigned NumStubs = (NumPages * PageSize) / StubSize;
|
|
|
|
// Allocate memory for stubs and pointers in one call.
|
|
std::error_code EC;
|
|
auto StubsMem = sys::OwningMemoryBlock(sys::Memory::allocateMappedMemory(
|
|
2 * NumPages * PageSize, nullptr,
|
|
sys::Memory::MF_READ | sys::Memory::MF_WRITE, EC));
|
|
|
|
if (EC)
|
|
return errorCodeToError(EC);
|
|
|
|
// Create separate MemoryBlocks representing the stubs and pointers.
|
|
sys::MemoryBlock StubsBlock(StubsMem.base(), NumPages * PageSize);
|
|
sys::MemoryBlock PtrsBlock(static_cast<char *>(StubsMem.base()) +
|
|
NumPages * PageSize,
|
|
NumPages * PageSize);
|
|
|
|
// Populate the stubs page stubs and mark it executable.
|
|
uint64_t *Stub = reinterpret_cast<uint64_t *>(StubsBlock.base());
|
|
uint64_t PtrOffsetField = static_cast<uint64_t>(NumPages * PageSize)
|
|
<< 3;
|
|
|
|
for (unsigned I = 0; I < NumStubs; ++I)
|
|
Stub[I] = 0xd61f020058000010 | PtrOffsetField;
|
|
|
|
if (auto EC = sys::Memory::protectMappedMemory(
|
|
StubsBlock, sys::Memory::MF_READ | sys::Memory::MF_EXEC))
|
|
return errorCodeToError(EC);
|
|
|
|
// Initialize all pointers to point at FailureAddress.
|
|
void **Ptr = reinterpret_cast<void **>(PtrsBlock.base());
|
|
for (unsigned I = 0; I < NumStubs; ++I)
|
|
Ptr[I] = InitialPtrVal;
|
|
|
|
StubsInfo = IndirectStubsInfo(NumStubs, std::move(StubsMem));
|
|
|
|
return Error::success();
|
|
}
|
|
|
|
void OrcX86_64_Base::writeTrampolines(uint8_t *TrampolineMem,
|
|
void *ResolverAddr,
|
|
unsigned NumTrampolines) {
|
|
|
|
unsigned OffsetToPtr = NumTrampolines * TrampolineSize;
|
|
|
|
memcpy(TrampolineMem + OffsetToPtr, &ResolverAddr, sizeof(void *));
|
|
|
|
uint64_t *Trampolines = reinterpret_cast<uint64_t *>(TrampolineMem);
|
|
uint64_t CallIndirPCRel = 0xf1c40000000015ff;
|
|
|
|
for (unsigned I = 0; I < NumTrampolines; ++I, OffsetToPtr -= TrampolineSize)
|
|
Trampolines[I] = CallIndirPCRel | ((OffsetToPtr - 6) << 16);
|
|
}
|
|
|
|
Error OrcX86_64_Base::emitIndirectStubsBlock(IndirectStubsInfo &StubsInfo,
|
|
unsigned MinStubs,
|
|
void *InitialPtrVal) {
|
|
// Stub format is:
|
|
//
|
|
// .section __orc_stubs
|
|
// stub1:
|
|
// jmpq *ptr1(%rip)
|
|
// .byte 0xC4 ; <- Invalid opcode padding.
|
|
// .byte 0xF1
|
|
// stub2:
|
|
// jmpq *ptr2(%rip)
|
|
//
|
|
// ...
|
|
//
|
|
// .section __orc_ptrs
|
|
// ptr1:
|
|
// .quad 0x0
|
|
// ptr2:
|
|
// .quad 0x0
|
|
//
|
|
// ...
|
|
|
|
const unsigned StubSize = IndirectStubsInfo::StubSize;
|
|
|
|
// Emit at least MinStubs, rounded up to fill the pages allocated.
|
|
unsigned PageSize = sys::Process::getPageSize();
|
|
unsigned NumPages = ((MinStubs * StubSize) + (PageSize - 1)) / PageSize;
|
|
unsigned NumStubs = (NumPages * PageSize) / StubSize;
|
|
|
|
// Allocate memory for stubs and pointers in one call.
|
|
std::error_code EC;
|
|
auto StubsMem = sys::OwningMemoryBlock(sys::Memory::allocateMappedMemory(
|
|
2 * NumPages * PageSize, nullptr,
|
|
sys::Memory::MF_READ | sys::Memory::MF_WRITE, EC));
|
|
|
|
if (EC)
|
|
return errorCodeToError(EC);
|
|
|
|
// Create separate MemoryBlocks representing the stubs and pointers.
|
|
sys::MemoryBlock StubsBlock(StubsMem.base(), NumPages * PageSize);
|
|
sys::MemoryBlock PtrsBlock(static_cast<char *>(StubsMem.base()) +
|
|
NumPages * PageSize,
|
|
NumPages * PageSize);
|
|
|
|
// Populate the stubs page stubs and mark it executable.
|
|
uint64_t *Stub = reinterpret_cast<uint64_t *>(StubsBlock.base());
|
|
uint64_t PtrOffsetField = static_cast<uint64_t>(NumPages * PageSize - 6)
|
|
<< 16;
|
|
for (unsigned I = 0; I < NumStubs; ++I)
|
|
Stub[I] = 0xF1C40000000025ff | PtrOffsetField;
|
|
|
|
if (auto EC = sys::Memory::protectMappedMemory(
|
|
StubsBlock, sys::Memory::MF_READ | sys::Memory::MF_EXEC))
|
|
return errorCodeToError(EC);
|
|
|
|
// Initialize all pointers to point at FailureAddress.
|
|
void **Ptr = reinterpret_cast<void **>(PtrsBlock.base());
|
|
for (unsigned I = 0; I < NumStubs; ++I)
|
|
Ptr[I] = InitialPtrVal;
|
|
|
|
StubsInfo = IndirectStubsInfo(NumStubs, std::move(StubsMem));
|
|
|
|
return Error::success();
|
|
}
|
|
|
|
void OrcX86_64_SysV::writeResolverCode(uint8_t *ResolverMem,
|
|
JITReentryFn ReentryFn,
|
|
void *CallbackMgr) {
|
|
|
|
const uint8_t ResolverCode[] = {
|
|
// resolver_entry:
|
|
0x55, // 0x00: pushq %rbp
|
|
0x48, 0x89, 0xe5, // 0x01: movq %rsp, %rbp
|
|
0x50, // 0x04: pushq %rax
|
|
0x53, // 0x05: pushq %rbx
|
|
0x51, // 0x06: pushq %rcx
|
|
0x52, // 0x07: pushq %rdx
|
|
0x56, // 0x08: pushq %rsi
|
|
0x57, // 0x09: pushq %rdi
|
|
0x41, 0x50, // 0x0a: pushq %r8
|
|
0x41, 0x51, // 0x0c: pushq %r9
|
|
0x41, 0x52, // 0x0e: pushq %r10
|
|
0x41, 0x53, // 0x10: pushq %r11
|
|
0x41, 0x54, // 0x12: pushq %r12
|
|
0x41, 0x55, // 0x14: pushq %r13
|
|
0x41, 0x56, // 0x16: pushq %r14
|
|
0x41, 0x57, // 0x18: pushq %r15
|
|
0x48, 0x81, 0xec, 0x08, 0x02, 0x00, 0x00, // 0x1a: subq 0x208, %rsp
|
|
0x48, 0x0f, 0xae, 0x04, 0x24, // 0x21: fxsave64 (%rsp)
|
|
0x48, 0xbf, // 0x26: movabsq <CBMgr>, %rdi
|
|
|
|
// 0x28: Callback manager addr.
|
|
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
|
|
|
|
0x48, 0x8b, 0x75, 0x08, // 0x30: movq 8(%rbp), %rsi
|
|
0x48, 0x83, 0xee, 0x06, // 0x34: subq $6, %rsi
|
|
0x48, 0xb8, // 0x38: movabsq <REntry>, %rax
|
|
|
|
// 0x3a: JIT re-entry fn addr:
|
|
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
|
|
|
|
0xff, 0xd0, // 0x42: callq *%rax
|
|
0x48, 0x89, 0x45, 0x08, // 0x44: movq %rax, 8(%rbp)
|
|
0x48, 0x0f, 0xae, 0x0c, 0x24, // 0x48: fxrstor64 (%rsp)
|
|
0x48, 0x81, 0xc4, 0x08, 0x02, 0x00, 0x00, // 0x4d: addq 0x208, %rsp
|
|
0x41, 0x5f, // 0x54: popq %r15
|
|
0x41, 0x5e, // 0x56: popq %r14
|
|
0x41, 0x5d, // 0x58: popq %r13
|
|
0x41, 0x5c, // 0x5a: popq %r12
|
|
0x41, 0x5b, // 0x5c: popq %r11
|
|
0x41, 0x5a, // 0x5e: popq %r10
|
|
0x41, 0x59, // 0x60: popq %r9
|
|
0x41, 0x58, // 0x62: popq %r8
|
|
0x5f, // 0x64: popq %rdi
|
|
0x5e, // 0x65: popq %rsi
|
|
0x5a, // 0x66: popq %rdx
|
|
0x59, // 0x67: popq %rcx
|
|
0x5b, // 0x68: popq %rbx
|
|
0x58, // 0x69: popq %rax
|
|
0x5d, // 0x6a: popq %rbp
|
|
0xc3, // 0x6b: retq
|
|
};
|
|
|
|
const unsigned ReentryFnAddrOffset = 0x3a;
|
|
const unsigned CallbackMgrAddrOffset = 0x28;
|
|
|
|
memcpy(ResolverMem, ResolverCode, sizeof(ResolverCode));
|
|
memcpy(ResolverMem + ReentryFnAddrOffset, &ReentryFn, sizeof(ReentryFn));
|
|
memcpy(ResolverMem + CallbackMgrAddrOffset, &CallbackMgr,
|
|
sizeof(CallbackMgr));
|
|
}
|
|
|
|
void OrcX86_64_Win32::writeResolverCode(uint8_t *ResolverMem,
|
|
JITReentryFn ReentryFn,
|
|
void *CallbackMgr) {
|
|
|
|
// resolverCode is similar to OrcX86_64 with differences specific to windows x64 calling convention:
|
|
// arguments go into rcx, rdx and come in reverse order, shadow space allocation on stack
|
|
const uint8_t ResolverCode[] = {
|
|
// resolver_entry:
|
|
0x55, // 0x00: pushq %rbp
|
|
0x48, 0x89, 0xe5, // 0x01: movq %rsp, %rbp
|
|
0x50, // 0x04: pushq %rax
|
|
0x53, // 0x05: pushq %rbx
|
|
0x51, // 0x06: pushq %rcx
|
|
0x52, // 0x07: pushq %rdx
|
|
0x56, // 0x08: pushq %rsi
|
|
0x57, // 0x09: pushq %rdi
|
|
0x41, 0x50, // 0x0a: pushq %r8
|
|
0x41, 0x51, // 0x0c: pushq %r9
|
|
0x41, 0x52, // 0x0e: pushq %r10
|
|
0x41, 0x53, // 0x10: pushq %r11
|
|
0x41, 0x54, // 0x12: pushq %r12
|
|
0x41, 0x55, // 0x14: pushq %r13
|
|
0x41, 0x56, // 0x16: pushq %r14
|
|
0x41, 0x57, // 0x18: pushq %r15
|
|
0x48, 0x81, 0xec, 0x08, 0x02, 0x00, 0x00, // 0x1a: subq 0x208, %rsp
|
|
0x48, 0x0f, 0xae, 0x04, 0x24, // 0x21: fxsave64 (%rsp)
|
|
|
|
0x48, 0xb9, // 0x26: movabsq <CBMgr>, %rcx
|
|
// 0x28: Callback manager addr.
|
|
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
|
|
|
|
0x48, 0x8B, 0x55, 0x08, // 0x30: mov rdx, [rbp+0x8]
|
|
0x48, 0x83, 0xea, 0x06, // 0x34: sub rdx, 0x6
|
|
|
|
0x48, 0xb8, // 0x38: movabsq <REntry>, %rax
|
|
// 0x3a: JIT re-entry fn addr:
|
|
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
|
|
|
|
// 0x42: sub rsp, 0x20 (Allocate shadow space)
|
|
0x48, 0x83, 0xEC, 0x20,
|
|
0xff, 0xd0, // 0x46: callq *%rax
|
|
|
|
// 0x48: add rsp, 0x20 (Free shadow space)
|
|
0x48, 0x83, 0xC4, 0x20,
|
|
|
|
0x48, 0x89, 0x45, 0x08, // 0x4C: movq %rax, 8(%rbp)
|
|
0x48, 0x0f, 0xae, 0x0c, 0x24, // 0x50: fxrstor64 (%rsp)
|
|
0x48, 0x81, 0xc4, 0x08, 0x02, 0x00, 0x00, // 0x55: addq 0x208, %rsp
|
|
0x41, 0x5f, // 0x5C: popq %r15
|
|
0x41, 0x5e, // 0x5E: popq %r14
|
|
0x41, 0x5d, // 0x60: popq %r13
|
|
0x41, 0x5c, // 0x62: popq %r12
|
|
0x41, 0x5b, // 0x64: popq %r11
|
|
0x41, 0x5a, // 0x66: popq %r10
|
|
0x41, 0x59, // 0x68: popq %r9
|
|
0x41, 0x58, // 0x6a: popq %r8
|
|
0x5f, // 0x6c: popq %rdi
|
|
0x5e, // 0x6d: popq %rsi
|
|
0x5a, // 0x6e: popq %rdx
|
|
0x59, // 0x6f: popq %rcx
|
|
0x5b, // 0x70: popq %rbx
|
|
0x58, // 0x71: popq %rax
|
|
0x5d, // 0x72: popq %rbp
|
|
0xc3, // 0x73: retq
|
|
};
|
|
|
|
|
|
const unsigned ReentryFnAddrOffset = 0x3a;
|
|
const unsigned CallbackMgrAddrOffset = 0x28;
|
|
|
|
memcpy(ResolverMem, ResolverCode, sizeof(ResolverCode));
|
|
memcpy(ResolverMem + ReentryFnAddrOffset, &ReentryFn, sizeof(ReentryFn));
|
|
memcpy(ResolverMem + CallbackMgrAddrOffset, &CallbackMgr,
|
|
sizeof(CallbackMgr));
|
|
}
|
|
|
|
void OrcI386::writeResolverCode(uint8_t *ResolverMem, JITReentryFn ReentryFn,
|
|
void *CallbackMgr) {
|
|
|
|
const uint8_t ResolverCode[] = {
|
|
// resolver_entry:
|
|
0x55, // 0x00: pushl %ebp
|
|
0x89, 0xe5, // 0x01: movl %esp, %ebp
|
|
0x54, // 0x03: pushl %esp
|
|
0x83, 0xe4, 0xf0, // 0x04: andl $-0x10, %esp
|
|
0x50, // 0x07: pushl %eax
|
|
0x53, // 0x08: pushl %ebx
|
|
0x51, // 0x09: pushl %ecx
|
|
0x52, // 0x0a: pushl %edx
|
|
0x56, // 0x0b: pushl %esi
|
|
0x57, // 0x0c: pushl %edi
|
|
0x81, 0xec, 0x18, 0x02, 0x00, 0x00, // 0x0d: subl $0x218, %esp
|
|
0x0f, 0xae, 0x44, 0x24, 0x10, // 0x13: fxsave 0x10(%esp)
|
|
0x8b, 0x75, 0x04, // 0x18: movl 0x4(%ebp), %esi
|
|
0x83, 0xee, 0x05, // 0x1b: subl $0x5, %esi
|
|
0x89, 0x74, 0x24, 0x04, // 0x1e: movl %esi, 0x4(%esp)
|
|
0xc7, 0x04, 0x24, 0x00, 0x00, 0x00,
|
|
0x00, // 0x22: movl <cbmgr>, (%esp)
|
|
0xb8, 0x00, 0x00, 0x00, 0x00, // 0x29: movl <reentry>, %eax
|
|
0xff, 0xd0, // 0x2e: calll *%eax
|
|
0x89, 0x45, 0x04, // 0x30: movl %eax, 0x4(%ebp)
|
|
0x0f, 0xae, 0x4c, 0x24, 0x10, // 0x33: fxrstor 0x10(%esp)
|
|
0x81, 0xc4, 0x18, 0x02, 0x00, 0x00, // 0x38: addl $0x218, %esp
|
|
0x5f, // 0x3e: popl %edi
|
|
0x5e, // 0x3f: popl %esi
|
|
0x5a, // 0x40: popl %edx
|
|
0x59, // 0x41: popl %ecx
|
|
0x5b, // 0x42: popl %ebx
|
|
0x58, // 0x43: popl %eax
|
|
0x8b, 0x65, 0xfc, // 0x44: movl -0x4(%ebp), %esp
|
|
0x5d, // 0x48: popl %ebp
|
|
0xc3 // 0x49: retl
|
|
};
|
|
|
|
const unsigned ReentryFnAddrOffset = 0x2a;
|
|
const unsigned CallbackMgrAddrOffset = 0x25;
|
|
|
|
memcpy(ResolverMem, ResolverCode, sizeof(ResolverCode));
|
|
memcpy(ResolverMem + ReentryFnAddrOffset, &ReentryFn, sizeof(ReentryFn));
|
|
memcpy(ResolverMem + CallbackMgrAddrOffset, &CallbackMgr,
|
|
sizeof(CallbackMgr));
|
|
}
|
|
|
|
void OrcI386::writeTrampolines(uint8_t *TrampolineMem, void *ResolverAddr,
|
|
unsigned NumTrampolines) {
|
|
|
|
uint64_t CallRelImm = 0xF1C4C400000000e8;
|
|
uint64_t Resolver = reinterpret_cast<uint64_t>(ResolverAddr);
|
|
uint64_t ResolverRel =
|
|
Resolver - reinterpret_cast<uint64_t>(TrampolineMem) - 5;
|
|
|
|
uint64_t *Trampolines = reinterpret_cast<uint64_t *>(TrampolineMem);
|
|
for (unsigned I = 0; I < NumTrampolines; ++I, ResolverRel -= TrampolineSize)
|
|
Trampolines[I] = CallRelImm | (ResolverRel << 8);
|
|
}
|
|
|
|
Error OrcI386::emitIndirectStubsBlock(IndirectStubsInfo &StubsInfo,
|
|
unsigned MinStubs, void *InitialPtrVal) {
|
|
// Stub format is:
|
|
//
|
|
// .section __orc_stubs
|
|
// stub1:
|
|
// jmpq *ptr1
|
|
// .byte 0xC4 ; <- Invalid opcode padding.
|
|
// .byte 0xF1
|
|
// stub2:
|
|
// jmpq *ptr2
|
|
//
|
|
// ...
|
|
//
|
|
// .section __orc_ptrs
|
|
// ptr1:
|
|
// .quad 0x0
|
|
// ptr2:
|
|
// .quad 0x0
|
|
//
|
|
// ...
|
|
|
|
const unsigned StubSize = IndirectStubsInfo::StubSize;
|
|
|
|
// Emit at least MinStubs, rounded up to fill the pages allocated.
|
|
unsigned PageSize = sys::Process::getPageSize();
|
|
unsigned NumPages = ((MinStubs * StubSize) + (PageSize - 1)) / PageSize;
|
|
unsigned NumStubs = (NumPages * PageSize) / StubSize;
|
|
|
|
// Allocate memory for stubs and pointers in one call.
|
|
std::error_code EC;
|
|
auto StubsMem = sys::OwningMemoryBlock(sys::Memory::allocateMappedMemory(
|
|
2 * NumPages * PageSize, nullptr,
|
|
sys::Memory::MF_READ | sys::Memory::MF_WRITE, EC));
|
|
|
|
if (EC)
|
|
return errorCodeToError(EC);
|
|
|
|
// Create separate MemoryBlocks representing the stubs and pointers.
|
|
sys::MemoryBlock StubsBlock(StubsMem.base(), NumPages * PageSize);
|
|
sys::MemoryBlock PtrsBlock(static_cast<char *>(StubsMem.base()) +
|
|
NumPages * PageSize,
|
|
NumPages * PageSize);
|
|
|
|
// Populate the stubs page stubs and mark it executable.
|
|
uint64_t *Stub = reinterpret_cast<uint64_t *>(StubsBlock.base());
|
|
uint64_t PtrAddr = reinterpret_cast<uint64_t>(PtrsBlock.base());
|
|
for (unsigned I = 0; I < NumStubs; ++I, PtrAddr += 4)
|
|
Stub[I] = 0xF1C40000000025ff | (PtrAddr << 16);
|
|
|
|
if (auto EC = sys::Memory::protectMappedMemory(
|
|
StubsBlock, sys::Memory::MF_READ | sys::Memory::MF_EXEC))
|
|
return errorCodeToError(EC);
|
|
|
|
// Initialize all pointers to point at FailureAddress.
|
|
void **Ptr = reinterpret_cast<void **>(PtrsBlock.base());
|
|
for (unsigned I = 0; I < NumStubs; ++I)
|
|
Ptr[I] = InitialPtrVal;
|
|
|
|
StubsInfo = IndirectStubsInfo(NumStubs, std::move(StubsMem));
|
|
|
|
return Error::success();
|
|
}
|
|
|
|
void OrcMips32_Base::writeResolverCode(uint8_t *ResolverMem,
|
|
JITReentryFn ReentryFn,
|
|
void *CallbackMgr, bool isBigEndian) {
|
|
|
|
const uint32_t ResolverCode[] = {
|
|
// resolver_entry:
|
|
0x27bdff98, // 0x00: addiu $sp,$sp,-104
|
|
0xafa20000, // 0x04: sw $v0,0($sp)
|
|
0xafa30004, // 0x08: sw $v1,4($sp)
|
|
0xafa40008, // 0x0c: sw $a0,8($sp)
|
|
0xafa5000c, // 0x10: sw $a1,12($sp)
|
|
0xafa60010, // 0x14: sw $a2,16($sp)
|
|
0xafa70014, // 0x18: sw $a3,20($sp)
|
|
0xafb00018, // 0x1c: sw $s0,24($sp)
|
|
0xafb1001c, // 0x20: sw $s1,28($sp)
|
|
0xafb20020, // 0x24: sw $s2,32($sp)
|
|
0xafb30024, // 0x28: sw $s3,36($sp)
|
|
0xafb40028, // 0x2c: sw $s4,40($sp)
|
|
0xafb5002c, // 0x30: sw $s5,44($sp)
|
|
0xafb60030, // 0x34: sw $s6,48($sp)
|
|
0xafb70034, // 0x38: sw $s7,52($sp)
|
|
0xafa80038, // 0x3c: sw $t0,56($sp)
|
|
0xafa9003c, // 0x40: sw $t1,60($sp)
|
|
0xafaa0040, // 0x44: sw $t2,64($sp)
|
|
0xafab0044, // 0x48: sw $t3,68($sp)
|
|
0xafac0048, // 0x4c: sw $t4,72($sp)
|
|
0xafad004c, // 0x50: sw $t5,76($sp)
|
|
0xafae0050, // 0x54: sw $t6,80($sp)
|
|
0xafaf0054, // 0x58: sw $t7,84($sp)
|
|
0xafb80058, // 0x5c: sw $t8,88($sp)
|
|
0xafb9005c, // 0x60: sw $t9,92($sp)
|
|
0xafbe0060, // 0x64: sw $fp,96($sp)
|
|
0xafbf0064, // 0x68: sw $ra,100($sp)
|
|
|
|
// Callback manager addr.
|
|
0x00000000, // 0x6c: lui $a0,callbackmgr
|
|
0x00000000, // 0x70: addiu $a0,$a0,callbackmgr
|
|
|
|
0x03e02825, // 0x74: move $a1, $ra
|
|
0x24a5ffec, // 0x78: addiu $a1,$a1,-20
|
|
|
|
// JIT re-entry fn addr:
|
|
0x00000000, // 0x7c: lui $t9,reentry
|
|
0x00000000, // 0x80: addiu $t9,$t9,reentry
|
|
|
|
0x0320f809, // 0x84: jalr $t9
|
|
0x00000000, // 0x88: nop
|
|
0x8fbf0064, // 0x8c: lw $ra,100($sp)
|
|
0x8fbe0060, // 0x90: lw $fp,96($sp)
|
|
0x8fb9005c, // 0x94: lw $t9,92($sp)
|
|
0x8fb80058, // 0x98: lw $t8,88($sp)
|
|
0x8faf0054, // 0x9c: lw $t7,84($sp)
|
|
0x8fae0050, // 0xa0: lw $t6,80($sp)
|
|
0x8fad004c, // 0xa4: lw $t5,76($sp)
|
|
0x8fac0048, // 0xa8: lw $t4,72($sp)
|
|
0x8fab0044, // 0xac: lw $t3,68($sp)
|
|
0x8faa0040, // 0xb0: lw $t2,64($sp)
|
|
0x8fa9003c, // 0xb4: lw $t1,60($sp)
|
|
0x8fa80038, // 0xb8: lw $t0,56($sp)
|
|
0x8fb70034, // 0xbc: lw $s7,52($sp)
|
|
0x8fb60030, // 0xc0: lw $s6,48($sp)
|
|
0x8fb5002c, // 0xc4: lw $s5,44($sp)
|
|
0x8fb40028, // 0xc8: lw $s4,40($sp)
|
|
0x8fb30024, // 0xcc: lw $s3,36($sp)
|
|
0x8fb20020, // 0xd0: lw $s2,32($sp)
|
|
0x8fb1001c, // 0xd4: lw $s1,28($sp)
|
|
0x8fb00018, // 0xd8: lw $s0,24($sp)
|
|
0x8fa70014, // 0xdc: lw $a3,20($sp)
|
|
0x8fa60010, // 0xe0: lw $a2,16($sp)
|
|
0x8fa5000c, // 0xe4: lw $a1,12($sp)
|
|
0x8fa40008, // 0xe8: lw $a0,8($sp)
|
|
0x27bd0068, // 0xec: addiu $sp,$sp,104
|
|
0x0300f825, // 0xf0: move $ra, $t8
|
|
0x03200008, // 0xf4: jr $t9
|
|
0x00000000, // 0xf8: move $t9, $v0/v1
|
|
};
|
|
|
|
const unsigned ReentryFnAddrOffset = 0x7c; // JIT re-entry fn addr lui
|
|
const unsigned CallbackMgrAddrOffset = 0x6c; // Callback manager addr lui
|
|
const unsigned Offsett = 0xf8;
|
|
|
|
memcpy(ResolverMem, ResolverCode, sizeof(ResolverCode));
|
|
|
|
// Depending on endian return value will be in v0 or v1.
|
|
uint32_t MoveVxT9 = isBigEndian ? 0x0060c825 : 0x0040c825;
|
|
memcpy(ResolverMem + Offsett, &MoveVxT9, sizeof(MoveVxT9));
|
|
|
|
uint64_t CallMgrAddr = reinterpret_cast<uint64_t>(CallbackMgr);
|
|
uint32_t CallMgrLUi = 0x3c040000 | (((CallMgrAddr + 0x8000) >> 16) & 0xFFFF);
|
|
uint32_t CallMgrADDiu = 0x24840000 | ((CallMgrAddr) & 0xFFFF);
|
|
memcpy(ResolverMem + CallbackMgrAddrOffset, &CallMgrLUi, sizeof(CallMgrLUi));
|
|
memcpy(ResolverMem + CallbackMgrAddrOffset + 4, &CallMgrADDiu,
|
|
sizeof(CallMgrADDiu));
|
|
|
|
uint64_t ReentryAddr = reinterpret_cast<uint64_t>(ReentryFn);
|
|
uint32_t ReentryLUi = 0x3c190000 | (((ReentryAddr + 0x8000) >> 16) & 0xFFFF);
|
|
uint32_t ReentryADDiu = 0x27390000 | ((ReentryAddr) & 0xFFFF);
|
|
memcpy(ResolverMem + ReentryFnAddrOffset, &ReentryLUi, sizeof(ReentryLUi));
|
|
memcpy(ResolverMem + ReentryFnAddrOffset + 4, &ReentryADDiu,
|
|
sizeof(ReentryADDiu));
|
|
}
|
|
|
|
void OrcMips32_Base::writeTrampolines(uint8_t *TrampolineMem,
|
|
void *ResolverAddr,
|
|
unsigned NumTrampolines) {
|
|
|
|
uint32_t *Trampolines = reinterpret_cast<uint32_t *>(TrampolineMem);
|
|
uint64_t ResolveAddr = reinterpret_cast<uint64_t>(ResolverAddr);
|
|
uint32_t RHiAddr = ((ResolveAddr + 0x8000) >> 16);
|
|
|
|
for (unsigned I = 0; I < NumTrampolines; ++I) {
|
|
Trampolines[5 * I + 0] = 0x03e0c025; // move $t8,$ra
|
|
Trampolines[5 * I + 1] = 0x3c190000 | (RHiAddr & 0xFFFF); // lui $t9,resolveAddr
|
|
Trampolines[5 * I + 2] = 0x27390000 | (ResolveAddr & 0xFFFF); // addiu $t9,$t9,resolveAddr
|
|
Trampolines[5 * I + 3] = 0x0320f809; // jalr $t9
|
|
Trampolines[5 * I + 4] = 0x00000000; // nop
|
|
}
|
|
}
|
|
|
|
Error OrcMips32_Base::emitIndirectStubsBlock(IndirectStubsInfo &StubsInfo,
|
|
unsigned MinStubs,
|
|
void *InitialPtrVal) {
|
|
// Stub format is:
|
|
//
|
|
// .section __orc_stubs
|
|
// stub1:
|
|
// lui $t9, ptr1
|
|
// lw $t9, %lo(ptr1)($t9)
|
|
// jr $t9
|
|
// stub2:
|
|
// lui $t9, ptr2
|
|
// lw $t9,%lo(ptr1)($t9)
|
|
// jr $t9
|
|
//
|
|
// ...
|
|
//
|
|
// .section __orc_ptrs
|
|
// ptr1:
|
|
// .word 0x0
|
|
// ptr2:
|
|
// .word 0x0
|
|
//
|
|
// ...
|
|
|
|
const unsigned StubSize = IndirectStubsInfo::StubSize;
|
|
|
|
// Emit at least MinStubs, rounded up to fill the pages allocated.
|
|
unsigned PageSize = sys::Process::getPageSize();
|
|
unsigned NumPages = ((MinStubs * StubSize) + (PageSize - 1)) / PageSize;
|
|
unsigned NumStubs = (NumPages * PageSize) / StubSize;
|
|
|
|
// Allocate memory for stubs and pointers in one call.
|
|
std::error_code EC;
|
|
auto StubsMem = sys::OwningMemoryBlock(sys::Memory::allocateMappedMemory(
|
|
2 * NumPages * PageSize, nullptr,
|
|
sys::Memory::MF_READ | sys::Memory::MF_WRITE, EC));
|
|
|
|
if (EC)
|
|
return errorCodeToError(EC);
|
|
|
|
// Create separate MemoryBlocks representing the stubs and pointers.
|
|
sys::MemoryBlock StubsBlock(StubsMem.base(), NumPages * PageSize);
|
|
sys::MemoryBlock PtrsBlock(static_cast<char *>(StubsMem.base()) +
|
|
NumPages * PageSize,
|
|
NumPages * PageSize);
|
|
|
|
// Populate the stubs page stubs and mark it executable.
|
|
uint32_t *Stub = reinterpret_cast<uint32_t *>(StubsBlock.base());
|
|
uint64_t PtrAddr = reinterpret_cast<uint64_t>(Stub) + NumPages * PageSize;
|
|
|
|
for (unsigned I = 0; I < NumStubs; ++I) {
|
|
uint32_t HiAddr = ((PtrAddr + 0x8000) >> 16);
|
|
Stub[4 * I + 0] = 0x3c190000 | (HiAddr & 0xFFFF); // lui $t9,ptr1
|
|
Stub[4 * I + 1] = 0x8f390000 | (PtrAddr & 0xFFFF); // lw $t9,%lo(ptr1)($t9)
|
|
Stub[4 * I + 2] = 0x03200008; // jr $t9
|
|
Stub[4 * I + 3] = 0x00000000; // nop
|
|
PtrAddr += 4;
|
|
}
|
|
|
|
if (auto EC = sys::Memory::protectMappedMemory(
|
|
StubsBlock, sys::Memory::MF_READ | sys::Memory::MF_EXEC))
|
|
return errorCodeToError(EC);
|
|
|
|
// Initialize all pointers to point at FailureAddress.
|
|
void **Ptr = reinterpret_cast<void **>(PtrsBlock.base());
|
|
for (unsigned I = 0; I < NumStubs; ++I)
|
|
Ptr[I] = InitialPtrVal;
|
|
|
|
StubsInfo = IndirectStubsInfo(NumStubs, std::move(StubsMem));
|
|
|
|
return Error::success();
|
|
}
|
|
|
|
void OrcMips64::writeResolverCode(uint8_t *ResolverMem, JITReentryFn ReentryFn,
|
|
void *CallbackMgr) {
|
|
|
|
const uint32_t ResolverCode[] = {
|
|
//resolver_entry:
|
|
0x67bdff30, // 0x00: daddiu $sp,$sp,-208
|
|
0xffa20000, // 0x04: sd v0,0(sp)
|
|
0xffa30008, // 0x08: sd v1,8(sp)
|
|
0xffa40010, // 0x0c: sd a0,16(sp)
|
|
0xffa50018, // 0x10: sd a1,24(sp)
|
|
0xffa60020, // 0x14: sd a2,32(sp)
|
|
0xffa70028, // 0x18: sd a3,40(sp)
|
|
0xffa80030, // 0x1c: sd a4,48(sp)
|
|
0xffa90038, // 0x20: sd a5,56(sp)
|
|
0xffaa0040, // 0x24: sd a6,64(sp)
|
|
0xffab0048, // 0x28: sd a7,72(sp)
|
|
0xffac0050, // 0x2c: sd t0,80(sp)
|
|
0xffad0058, // 0x30: sd t1,88(sp)
|
|
0xffae0060, // 0x34: sd t2,96(sp)
|
|
0xffaf0068, // 0x38: sd t3,104(sp)
|
|
0xffb00070, // 0x3c: sd s0,112(sp)
|
|
0xffb10078, // 0x40: sd s1,120(sp)
|
|
0xffb20080, // 0x44: sd s2,128(sp)
|
|
0xffb30088, // 0x48: sd s3,136(sp)
|
|
0xffb40090, // 0x4c: sd s4,144(sp)
|
|
0xffb50098, // 0x50: sd s5,152(sp)
|
|
0xffb600a0, // 0x54: sd s6,160(sp)
|
|
0xffb700a8, // 0x58: sd s7,168(sp)
|
|
0xffb800b0, // 0x5c: sd t8,176(sp)
|
|
0xffb900b8, // 0x60: sd t9,184(sp)
|
|
0xffbe00c0, // 0x64: sd fp,192(sp)
|
|
0xffbf00c8, // 0x68: sd ra,200(sp)
|
|
|
|
// Callback manager addr.
|
|
0x00000000, // 0x6c: lui $a0,heighest(callbackmgr)
|
|
0x00000000, // 0x70: daddiu $a0,$a0,heigher(callbackmgr)
|
|
0x00000000, // 0x74: dsll $a0,$a0,16
|
|
0x00000000, // 0x78: daddiu $a0,$a0,hi(callbackmgr)
|
|
0x00000000, // 0x7c: dsll $a0,$a0,16
|
|
0x00000000, // 0x80: daddiu $a0,$a0,lo(callbackmgr)
|
|
|
|
0x03e02825, // 0x84: move $a1, $ra
|
|
0x64a5ffdc, // 0x88: daddiu $a1,$a1,-36
|
|
|
|
// JIT re-entry fn addr:
|
|
0x00000000, // 0x8c: lui $t9,reentry
|
|
0x00000000, // 0x90: daddiu $t9,$t9,reentry
|
|
0x00000000, // 0x94: dsll $t9,$t9,
|
|
0x00000000, // 0x98: daddiu $t9,$t9,
|
|
0x00000000, // 0x9c: dsll $t9,$t9,
|
|
0x00000000, // 0xa0: daddiu $t9,$t9,
|
|
0x0320f809, // 0xa4: jalr $t9
|
|
0x00000000, // 0xa8: nop
|
|
0xdfbf00c8, // 0xac: ld ra, 200(sp)
|
|
0xdfbe00c0, // 0xb0: ld fp, 192(sp)
|
|
0xdfb900b8, // 0xb4: ld t9, 184(sp)
|
|
0xdfb800b0, // 0xb8: ld t8, 176(sp)
|
|
0xdfb700a8, // 0xbc: ld s7, 168(sp)
|
|
0xdfb600a0, // 0xc0: ld s6, 160(sp)
|
|
0xdfb50098, // 0xc4: ld s5, 152(sp)
|
|
0xdfb40090, // 0xc8: ld s4, 144(sp)
|
|
0xdfb30088, // 0xcc: ld s3, 136(sp)
|
|
0xdfb20080, // 0xd0: ld s2, 128(sp)
|
|
0xdfb10078, // 0xd4: ld s1, 120(sp)
|
|
0xdfb00070, // 0xd8: ld s0, 112(sp)
|
|
0xdfaf0068, // 0xdc: ld t3, 104(sp)
|
|
0xdfae0060, // 0xe0: ld t2, 96(sp)
|
|
0xdfad0058, // 0xe4: ld t1, 88(sp)
|
|
0xdfac0050, // 0xe8: ld t0, 80(sp)
|
|
0xdfab0048, // 0xec: ld a7, 72(sp)
|
|
0xdfaa0040, // 0xf0: ld a6, 64(sp)
|
|
0xdfa90038, // 0xf4: ld a5, 56(sp)
|
|
0xdfa80030, // 0xf8: ld a4, 48(sp)
|
|
0xdfa70028, // 0xfc: ld a3, 40(sp)
|
|
0xdfa60020, // 0x100: ld a2, 32(sp)
|
|
0xdfa50018, // 0x104: ld a1, 24(sp)
|
|
0xdfa40010, // 0x108: ld a0, 16(sp)
|
|
0xdfa30008, // 0x10c: ld v1, 8(sp)
|
|
0x67bd00d0, // 0x110: daddiu $sp,$sp,208
|
|
0x0300f825, // 0x114: move $ra, $t8
|
|
0x03200008, // 0x118: jr $t9
|
|
0x0040c825, // 0x11c: move $t9, $v0
|
|
};
|
|
|
|
const unsigned ReentryFnAddrOffset = 0x8c; // JIT re-entry fn addr lui
|
|
const unsigned CallbackMgrAddrOffset = 0x6c; // Callback manager addr lui
|
|
|
|
memcpy(ResolverMem, ResolverCode, sizeof(ResolverCode));
|
|
|
|
uint64_t CallMgrAddr = reinterpret_cast<uint64_t>(CallbackMgr);
|
|
|
|
uint32_t CallMgrLUi =
|
|
0x3c040000 | (((CallMgrAddr + 0x800080008000) >> 48) & 0xFFFF);
|
|
uint32_t CallMgrDADDiu =
|
|
0x64840000 | (((CallMgrAddr + 0x80008000) >> 32) & 0xFFFF);
|
|
uint32_t CallMgrDSLL = 0x00042438;
|
|
uint32_t CallMgrDADDiu2 =
|
|
0x64840000 | ((((CallMgrAddr + 0x8000) >> 16) & 0xFFFF));
|
|
uint32_t CallMgrDSLL2 = 0x00042438;
|
|
uint32_t CallMgrDADDiu3 = 0x64840000 | ((CallMgrAddr)&0xFFFF);
|
|
|
|
memcpy(ResolverMem + CallbackMgrAddrOffset, &CallMgrLUi, sizeof(CallMgrLUi));
|
|
memcpy(ResolverMem + (CallbackMgrAddrOffset + 4), &CallMgrDADDiu,
|
|
sizeof(CallMgrDADDiu));
|
|
memcpy(ResolverMem + (CallbackMgrAddrOffset + 8), &CallMgrDSLL,
|
|
sizeof(CallMgrDSLL));
|
|
memcpy(ResolverMem + (CallbackMgrAddrOffset + 12), &CallMgrDADDiu2,
|
|
sizeof(CallMgrDADDiu2));
|
|
memcpy(ResolverMem + (CallbackMgrAddrOffset + 16), &CallMgrDSLL2,
|
|
sizeof(CallMgrDSLL2));
|
|
memcpy(ResolverMem + (CallbackMgrAddrOffset + 20), &CallMgrDADDiu3,
|
|
sizeof(CallMgrDADDiu3));
|
|
|
|
uint64_t ReentryAddr = reinterpret_cast<uint64_t>(ReentryFn);
|
|
|
|
uint32_t ReentryLUi =
|
|
0x3c190000 | (((ReentryAddr + 0x800080008000) >> 48) & 0xFFFF);
|
|
|
|
uint32_t ReentryDADDiu =
|
|
0x67390000 | (((ReentryAddr + 0x80008000) >> 32) & 0xFFFF);
|
|
|
|
uint32_t ReentryDSLL = 0x0019cc38;
|
|
|
|
uint32_t ReentryDADDiu2 =
|
|
0x67390000 | (((ReentryAddr + 0x8000) >> 16) & 0xFFFF);
|
|
|
|
uint32_t ReentryDSLL2 = 0x0019cc38;
|
|
|
|
uint32_t ReentryDADDiu3 = 0x67390000 | ((ReentryAddr)&0xFFFF);
|
|
|
|
memcpy(ResolverMem + ReentryFnAddrOffset, &ReentryLUi, sizeof(ReentryLUi));
|
|
memcpy(ResolverMem + (ReentryFnAddrOffset + 4), &ReentryDADDiu,
|
|
sizeof(ReentryDADDiu));
|
|
memcpy(ResolverMem + (ReentryFnAddrOffset + 8), &ReentryDSLL,
|
|
sizeof(ReentryDSLL));
|
|
memcpy(ResolverMem + (ReentryFnAddrOffset + 12), &ReentryDADDiu2,
|
|
sizeof(ReentryDADDiu2));
|
|
memcpy(ResolverMem + (ReentryFnAddrOffset + 16), &ReentryDSLL2,
|
|
sizeof(ReentryDSLL2));
|
|
memcpy(ResolverMem + (ReentryFnAddrOffset + 20), &ReentryDADDiu3,
|
|
sizeof(ReentryDADDiu3));
|
|
}
|
|
|
|
void OrcMips64::writeTrampolines(uint8_t *TrampolineMem, void *ResolverAddr,
|
|
unsigned NumTrampolines) {
|
|
|
|
uint32_t *Trampolines = reinterpret_cast<uint32_t *>(TrampolineMem);
|
|
uint64_t ResolveAddr = reinterpret_cast<uint64_t>(ResolverAddr);
|
|
|
|
uint64_t HeighestAddr = ((ResolveAddr + 0x800080008000) >> 48);
|
|
uint64_t HeigherAddr = ((ResolveAddr + 0x80008000) >> 32);
|
|
uint64_t HiAddr = ((ResolveAddr + 0x8000) >> 16);
|
|
|
|
for (unsigned I = 0; I < NumTrampolines; ++I) {
|
|
Trampolines[10 * I + 0] = 0x03e0c025; // move $t8,$ra
|
|
Trampolines[10 * I + 1] = 0x3c190000 | (HeighestAddr & 0xFFFF); // lui $t9,resolveAddr
|
|
Trampolines[10 * I + 2] = 0x67390000 | (HeigherAddr & 0xFFFF); // daddiu $t9,$t9,%higher(resolveAddr)
|
|
Trampolines[10 * I + 3] = 0x0019cc38; // dsll $t9,$t9,16
|
|
Trampolines[10 * I + 4] = 0x67390000 | (HiAddr & 0xFFFF); // daddiu $t9,$t9,%hi(ptr)
|
|
Trampolines[10 * I + 5] = 0x0019cc38; // dsll $t9,$t9,16
|
|
Trampolines[10 * I + 6] = 0x67390000 | (ResolveAddr & 0xFFFF); // daddiu $t9,$t9,%lo(ptr)
|
|
Trampolines[10 * I + 7] = 0x0320f809; // jalr $t9
|
|
Trampolines[10 * I + 8] = 0x00000000; // nop
|
|
Trampolines[10 * I + 9] = 0x00000000; // nop
|
|
}
|
|
}
|
|
|
|
Error OrcMips64::emitIndirectStubsBlock(IndirectStubsInfo &StubsInfo,
|
|
unsigned MinStubs,
|
|
void *InitialPtrVal) {
|
|
// Stub format is:
|
|
//
|
|
// .section __orc_stubs
|
|
// stub1:
|
|
// lui $t9,ptr1
|
|
// dsll $t9,$t9,16
|
|
// daddiu $t9,$t9,%hi(ptr)
|
|
// dsll $t9,$t9,16
|
|
// ld $t9,%lo(ptr)
|
|
// jr $t9
|
|
// stub2:
|
|
// lui $t9,ptr1
|
|
// dsll $t9,$t9,16
|
|
// daddiu $t9,$t9,%hi(ptr)
|
|
// dsll $t9,$t9,16
|
|
// ld $t9,%lo(ptr)
|
|
// jr $t9
|
|
//
|
|
// ...
|
|
//
|
|
// .section __orc_ptrs
|
|
// ptr1:
|
|
// .dword 0x0
|
|
// ptr2:
|
|
// .dword 0x0
|
|
//
|
|
// ...
|
|
const unsigned StubSize = IndirectStubsInfo::StubSize;
|
|
|
|
// Emit at least MinStubs, rounded up to fill the pages allocated.
|
|
unsigned PageSize = sys::Process::getPageSize();
|
|
unsigned NumPages = ((MinStubs * StubSize) + (PageSize - 1)) / PageSize;
|
|
unsigned NumStubs = (NumPages * PageSize) / StubSize;
|
|
|
|
// Allocate memory for stubs and pointers in one call.
|
|
std::error_code EC;
|
|
auto StubsMem = sys::OwningMemoryBlock(sys::Memory::allocateMappedMemory(
|
|
2 * NumPages * PageSize, nullptr,
|
|
sys::Memory::MF_READ | sys::Memory::MF_WRITE, EC));
|
|
|
|
if (EC)
|
|
return errorCodeToError(EC);
|
|
|
|
// Create separate MemoryBlocks representing the stubs and pointers.
|
|
sys::MemoryBlock StubsBlock(StubsMem.base(), NumPages * PageSize);
|
|
sys::MemoryBlock PtrsBlock(static_cast<char *>(StubsMem.base()) +
|
|
NumPages * PageSize,
|
|
NumPages * PageSize);
|
|
|
|
// Populate the stubs page stubs and mark it executable.
|
|
uint32_t *Stub = reinterpret_cast<uint32_t *>(StubsBlock.base());
|
|
uint64_t PtrAddr = reinterpret_cast<uint64_t>(PtrsBlock.base());
|
|
|
|
for (unsigned I = 0; I < NumStubs; ++I, PtrAddr += 8) {
|
|
uint64_t HeighestAddr = ((PtrAddr + 0x800080008000) >> 48);
|
|
uint64_t HeigherAddr = ((PtrAddr + 0x80008000) >> 32);
|
|
uint64_t HiAddr = ((PtrAddr + 0x8000) >> 16);
|
|
Stub[8 * I + 0] = 0x3c190000 | (HeighestAddr & 0xFFFF); // lui $t9,ptr1
|
|
Stub[8 * I + 1] = 0x67390000 | (HeigherAddr & 0xFFFF); // daddiu $t9,$t9,%higher(ptr)
|
|
Stub[8 * I + 2] = 0x0019cc38; // dsll $t9,$t9,16
|
|
Stub[8 * I + 3] = 0x67390000 | (HiAddr & 0xFFFF); // daddiu $t9,$t9,%hi(ptr)
|
|
Stub[8 * I + 4] = 0x0019cc38; // dsll $t9,$t9,16
|
|
Stub[8 * I + 5] = 0xdf390000 | (PtrAddr & 0xFFFF); // ld $t9,%lo(ptr)
|
|
Stub[8 * I + 6] = 0x03200008; // jr $t9
|
|
Stub[8 * I + 7] = 0x00000000; // nop
|
|
}
|
|
|
|
if (auto EC = sys::Memory::protectMappedMemory(
|
|
StubsBlock, sys::Memory::MF_READ | sys::Memory::MF_EXEC))
|
|
return errorCodeToError(EC);
|
|
|
|
// Initialize all pointers to point at FailureAddress.
|
|
void **Ptr = reinterpret_cast<void **>(PtrsBlock.base());
|
|
for (unsigned I = 0; I < NumStubs; ++I)
|
|
Ptr[I] = InitialPtrVal;
|
|
|
|
StubsInfo = IndirectStubsInfo(NumStubs, std::move(StubsMem));
|
|
|
|
return Error::success();
|
|
}
|
|
} // End namespace orc.
|
|
} // End namespace llvm.
|