2023-03-17 19:20:37 +00:00
|
|
|
// This file is part of the Luau programming language and is licensed under MIT License; see LICENSE.txt for details
|
|
|
|
#include "CodeGenA64.h"
|
|
|
|
|
|
|
|
#include "Luau/AssemblyBuilderA64.h"
|
|
|
|
#include "Luau/UnwindBuilder.h"
|
|
|
|
|
2023-05-19 20:37:30 +01:00
|
|
|
#include "BitUtils.h"
|
2023-03-17 19:20:37 +00:00
|
|
|
#include "NativeState.h"
|
2023-03-24 18:03:04 +00:00
|
|
|
#include "EmitCommonA64.h"
|
2023-03-17 19:20:37 +00:00
|
|
|
|
|
|
|
#include "lstate.h"
|
|
|
|
|
|
|
|
namespace Luau
|
|
|
|
{
|
|
|
|
namespace CodeGen
|
|
|
|
{
|
|
|
|
namespace A64
|
|
|
|
{
|
|
|
|
|
2023-04-14 19:06:22 +01:00
|
|
|
struct EntryLocations
|
2023-03-17 19:20:37 +00:00
|
|
|
{
|
2023-04-14 19:06:22 +01:00
|
|
|
Label start;
|
|
|
|
Label prologueEnd;
|
|
|
|
Label epilogueStart;
|
|
|
|
};
|
|
|
|
|
|
|
|
// Emits an indirect jump to the address stored in NativeContext::gateExit.
// x0 is set to continueInVm before the jump; x1 is used as scratch for the target address.
static void emitExit(AssemblyBuilderA64& build, bool continueInVm)
{
    build.mov(x0, continueInVm);
    build.ldr(x1, mem(rNativeContext, offsetof(NativeContext, gateExit)));
    build.br(x1);
}
|
|
|
|
|
2023-08-11 15:42:37 +01:00
|
|
|
// Emits code that stores (rCode + x0) into L->ci->savedpc.
// Expects x0 = pcpos * sizeof(Instruction) on entry; x0 and x1 are overwritten.
// No branch is emitted, so execution continues with whatever code is emitted next.
static void emitUpdatePcForExit(AssemblyBuilderA64& build)
{
    // x0 = pcpos * sizeof(Instruction)
    build.add(x0, rCode, x0);
    build.ldr(x1, mem(rState, offsetof(lua_State, ci)));
    build.str(x0, mem(x1, offsetof(CallInfo, savedpc)));
}
|
2023-07-07 21:10:48 +01:00
|
|
|
|
2023-08-11 15:42:37 +01:00
|
|
|
// Emits code that clears the LUA_CALLINFO_NATIVE bit in L->ci->flags.
// Uses x0 (ci), w1 (flags) and w2 (mask) as scratch registers.
// No branch is emitted, so execution continues with whatever code is emitted next.
static void emitClearNativeFlag(AssemblyBuilderA64& build)
{
    build.ldr(x0, mem(rState, offsetof(lua_State, ci)));
    build.ldr(w1, mem(x0, offsetof(CallInfo, flags)));
    // flags &= ~LUA_CALLINFO_NATIVE
    build.mov(w2, ~LUA_CALLINFO_NATIVE);
    build.and_(w1, w1, w2);
    build.str(w1, mem(x0, offsetof(CallInfo, flags)));
}
|
|
|
|
|
2023-04-14 19:06:22 +01:00
|
|
|
// Emits the interrupt helper: calls the interrupt callback stored in global_State::cb.interrupt (if any)
// and then either returns to the native caller or leaves native code when L->status is non-zero.
// The instruction order below is significant; registers are reused deliberately.
static void emitInterrupt(AssemblyBuilderA64& build)
{
    // x0 = pc offset
    // x1 = return address in native code

    Label skip;

    // Stash return address in rBase; we need to reload rBase anyway
    build.mov(rBase, x1);

    // Load interrupt handler; it may be nullptr in case the update raced with the check before we got here
    build.ldr(x2, mem(rState, offsetof(lua_State, global)));
    build.ldr(x2, mem(x2, offsetof(global_State, cb.interrupt)));
    build.cbz(x2, skip);

    // Update savedpc; required in case interrupt errors
    build.add(x0, rCode, x0);
    build.ldr(x1, mem(rState, offsetof(lua_State, ci)));
    build.str(x0, mem(x1, offsetof(CallInfo, savedpc)));

    // Call interrupt with x0 = L and w1 = -1
    build.mov(x0, rState);
    build.mov(w1, -1);
    build.blr(x2);

    // Check if we need to exit: a zero L->status means we can keep running
    build.ldrb(w0, mem(rState, offsetof(lua_State, status)));
    build.cbz(w0, skip);

    // L->ci->savedpc--
    // note: recomputing this avoids having to stash x0
    build.ldr(x1, mem(rState, offsetof(lua_State, ci)));
    build.ldr(x0, mem(x1, offsetof(CallInfo, savedpc)));
    build.sub(x0, x0, sizeof(Instruction));
    build.str(x0, mem(x1, offsetof(CallInfo, savedpc)));

    emitExit(build, /* continueInVm */ false);

    build.setLabel(skip);

    // Return back to caller; rBase has stashed return address
    build.mov(x0, rBase);

    emitUpdateBase(build); // interrupt may have reallocated stack

    build.br(x0);
}
|
|
|
|
|
|
|
|
// Emits the reentry helper: resumes native execution of the closure in x0 at the location that
// corresponds to L->ci->savedpc, or leaves native code when that is not possible.
// The instruction order below is significant; registers are reused deliberately.
static void emitReentry(AssemblyBuilderA64& build, ModuleHelpers& helpers)
{
    // x0 = closure object to reentry (equal to clvalue(L->ci->func))

    // If the fallback requested an exit, we need to do this right away
    build.cbz(x0, helpers.exitNoContinueVm);

    emitUpdateBase(build);

    // Need to update state of the current function before we jump away
    build.ldr(x1, mem(x0, offsetof(Closure, l.p))); // cl->l.p aka proto

    build.ldr(x2, mem(rState, offsetof(lua_State, ci))); // L->ci

    // We need to check if the new frame can be executed natively
    // TODO: .flags and .savedpc load below can be fused with ldp
    build.ldr(w3, mem(x2, offsetof(CallInfo, flags)));
    // flags were loaded as a 32-bit value, so test the bit through the w view of the register (same form as in emitReturn)
    build.tbz(w3, countrz(LUA_CALLINFO_NATIVE), helpers.exitContinueVm);

    build.mov(rClosure, x0);

    // ldp below loads both fields at once, which requires them to be adjacent
    LUAU_ASSERT(offsetof(Proto, code) == offsetof(Proto, k) + 8);
    build.ldp(rConstants, rCode, mem(x1, offsetof(Proto, k))); // proto->k, proto->code

    // Get instruction index from instruction pointer
    // To get instruction index from instruction pointer, we need to divide byte offset by 4
    // But we will actually need to scale instruction index by 4 back to byte offset later so it cancels out
    build.ldr(x2, mem(x2, offsetof(CallInfo, savedpc))); // L->ci->savedpc
    build.sub(x2, x2, rCode);

    // Get new instruction location and jump to it
    LUAU_ASSERT(offsetof(Proto, exectarget) == offsetof(Proto, execdata) + 8);
    build.ldp(x3, x4, mem(x1, offsetof(Proto, execdata))); // x3 = proto->execdata, x4 = proto->exectarget
    build.ldr(w2, mem(x3, x2));                            // 32-bit entry of execdata at the byte offset in x2
    build.add(x4, x4, x2);                                 // exectarget + loaded entry
    build.br(x4);
}
|
|
|
|
|
2023-06-09 18:08:00 +01:00
|
|
|
// Emits the return helper: pads missing results with nil, pops the current CallInfo, syncs L->ci/base/top
// and then either leaves native code or jumps to the native location that corresponds to the caller's savedpc.
// The instruction order below is significant; registers are reused deliberately.
void emitReturn(AssemblyBuilderA64& build, ModuleHelpers& helpers)
{
    // x1 = res
    // w2 = number of written values

    // x0 = ci
    build.ldr(x0, mem(rState, offsetof(lua_State, ci)));
    // w3 = ci->nresults
    build.ldr(w3, mem(x0, offsetof(CallInfo, nresults)));

    Label skipResultCopy;

    // Fill the rest of the expected results (nresults - written) with 'nil'
    build.cmp(w2, w3);
    build.b(ConditionA64::GreaterEqual, skipResultCopy);

    // TODO: cmp above could compute this and flags using subs
    build.sub(w2, w3, w2); // counter = nresults - written
    build.mov(w4, LUA_TNIL);

    // Loop: write the nil tag at x1, advance x1 by one TValue, decrement the counter
    Label repeatNilLoop = build.setLabel();
    build.str(w4, mem(x1, offsetof(TValue, tt)));
    build.add(x1, x1, sizeof(TValue));
    build.sub(w2, w2, 1);
    build.cbnz(w2, repeatNilLoop);

    build.setLabel(skipResultCopy);

    // x2 = cip = ci - 1
    build.sub(x2, x0, sizeof(CallInfo));

    // res = cip->top when nresults >= 0
    Label skipFixedRetTop;
    build.tbnz(w3, 31, skipFixedRetTop); // bit 31 is the sign bit of the 32-bit nresults
    build.ldr(x1, mem(x2, offsetof(CallInfo, top))); // res = cip->top
    build.setLabel(skipFixedRetTop);

    // Update VM state (ci, base, top)
    build.str(x2, mem(rState, offsetof(lua_State, ci)));      // L->ci = cip
    build.ldr(rBase, mem(x2, offsetof(CallInfo, base)));      // sync base = L->base while we have a chance
    build.str(rBase, mem(rState, offsetof(lua_State, base))); // L->base = cip->base

    build.str(x1, mem(rState, offsetof(lua_State, top))); // L->top = res

    // Unlikely, but this might be the last return from VM
    build.ldr(w4, mem(x0, offsetof(CallInfo, flags)));
    build.tbnz(w4, countrz(LUA_CALLINFO_RETURN), helpers.exitNoContinueVm);

    // Continue in interpreter if function has no native data
    build.ldr(w4, mem(x2, offsetof(CallInfo, flags)));
    build.tbz(w4, countrz(LUA_CALLINFO_NATIVE), helpers.exitContinueVm);

    // Need to update state of the current function before we jump away
    build.ldr(rClosure, mem(x2, offsetof(CallInfo, func)));
    build.ldr(rClosure, mem(rClosure, offsetof(TValue, value.gc)));

    build.ldr(x1, mem(rClosure, offsetof(Closure, l.p))); // cl->l.p aka proto

    // ldp below loads both fields at once, which requires them to be adjacent
    LUAU_ASSERT(offsetof(Proto, code) == offsetof(Proto, k) + 8);
    build.ldp(rConstants, rCode, mem(x1, offsetof(Proto, k))); // proto->k, proto->code

    // Get instruction index from instruction pointer
    // To get instruction index from instruction pointer, we need to divide byte offset by 4
    // But we will actually need to scale instruction index by 4 back to byte offset later so it cancels out
    build.ldr(x2, mem(x2, offsetof(CallInfo, savedpc))); // cip->savedpc
    build.sub(x2, x2, rCode);

    // Get new instruction location and jump to it
    LUAU_ASSERT(offsetof(Proto, exectarget) == offsetof(Proto, execdata) + 8);
    build.ldp(x3, x4, mem(x1, offsetof(Proto, execdata))); // x3 = proto->execdata, x4 = proto->exectarget
    build.ldr(w2, mem(x3, x2));                            // 32-bit entry of execdata at the byte offset in x2
    build.add(x4, x4, x2);                                 // exectarget + loaded entry
    build.br(x4);
}
|
|
|
|
|
2023-04-14 19:06:22 +01:00
|
|
|
// Emits the entry (gate) function and registers its unwind information.
// The function saves x29/x30 and x19-x25 in a kStackSize-byte frame, sets up the native execution
// registers from its arguments and jumps to the requested native code address; the epilogue restores
// the saved registers and returns.
// Returns the labels for the start, the end of the prologue and the start of the epilogue.
static EntryLocations buildEntryFunction(AssemblyBuilderA64& build, UnwindBuilder& unwind)
{
    EntryLocations locations;

    // Arguments: x0 = lua_State*, x1 = Proto*, x2 = native code pointer to jump to, x3 = NativeContext*

    locations.start = build.setLabel();

    // prologue
    build.sub(sp, sp, kStackSize);
    build.stp(x29, x30, mem(sp)); // fp, lr

    // stash non-volatile registers used for execution environment
    build.stp(x19, x20, mem(sp, 16));
    build.stp(x21, x22, mem(sp, 32));
    build.stp(x23, x24, mem(sp, 48));
    build.str(x25, mem(sp, 64));

    build.mov(x29, sp); // this is only necessary if we maintain frame pointers, which we do in the JIT for now

    locations.prologueEnd = build.setLabel();

    // Size of the prologue as the distance between the two labels; passed to the unwind builder below
    uint32_t prologueSize = build.getLabelOffset(locations.prologueEnd) - build.getLabelOffset(locations.start);

    // Setup native execution environment
    build.mov(rState, x0);
    build.mov(rNativeContext, x3);
    build.ldr(rGlobalState, mem(x0, offsetof(lua_State, global)));

    build.ldr(rBase, mem(x0, offsetof(lua_State, base))); // L->base

    // ldp below loads both fields at once, which requires them to be adjacent
    LUAU_ASSERT(offsetof(Proto, code) == offsetof(Proto, k) + 8);
    build.ldp(rConstants, rCode, mem(x1, offsetof(Proto, k))); // proto->k, proto->code

    build.ldr(x9, mem(x0, offsetof(lua_State, ci)));          // L->ci
    build.ldr(x9, mem(x9, offsetof(CallInfo, func)));         // L->ci->func
    build.ldr(rClosure, mem(x9, offsetof(TValue, value.gc))); // L->ci->func->value.gc aka cl

    // Jump to the specified instruction; further control flow will be handled with custom ABI with register setup from EmitCommonA64.h
    build.br(x2);

    // Even though we jumped away, we will return here in the end
    locations.epilogueStart = build.setLabel();

    // Cleanup and exit: restore registers in the reverse order of the prologue
    build.ldr(x25, mem(sp, 64));
    build.ldp(x23, x24, mem(sp, 48));
    build.ldp(x21, x22, mem(sp, 32));
    build.ldp(x19, x20, mem(sp, 16));
    build.ldp(x29, x30, mem(sp)); // fp, lr
    build.add(sp, sp, kStackSize);

    build.ret();

    // Our entry function is special, it spans the whole remaining code area
    unwind.startFunction();
    // The register list is in the same order the prologue stores them (ascending stack offsets)
    unwind.prologueA64(prologueSize, kStackSize, {x29, x30, x19, x20, x21, x22, x23, x24, x25});
    unwind.finishFunction(build.getLabelOffset(locations.start), kFullBlockFuncton);

    return locations;
}
|
|
|
|
|
|
|
|
// Builds the entry function, copies it into memory obtained from data.codeAllocator and records
// the resulting gateEntry/gateExit addresses in data.context.
// Returns false if the code allocator fails to allocate, true otherwise.
bool initHeaderFunctions(NativeState& data)
{
    AssemblyBuilderA64 build(/* logText= */ false);
    UnwindBuilder& unwind = *data.unwindBuilder.get();

    unwind.startInfo(UnwindBuilder::A64);

    EntryLocations entryLocations = buildEntryFunction(build, unwind);

    build.finalize();

    unwind.finishInfo();

    // The entry function is expected to produce code only
    LUAU_ASSERT(build.data.empty());

    uint8_t* codeStart = nullptr;
    if (!data.codeAllocator.allocate(build.data.data(), int(build.data.size()), reinterpret_cast<const uint8_t*>(build.code.data()),
            int(build.code.size() * sizeof(build.code[0])), data.gateData, data.gateDataSize, codeStart))
    {
        LUAU_ASSERT(!"Failed to create entry function");
        return false;
    }

    // Set the offset at the beginning so that functions in new blocks will not overlay the locations
    // specified by the unwind information of the entry function
    unwind.setBeginOffset(build.getLabelOffset(entryLocations.prologueEnd));

    // Label offsets are relative to the start of the emitted code, so rebase them onto the allocated block
    data.context.gateEntry = codeStart + build.getLabelOffset(entryLocations.start);
    data.context.gateExit = codeStart + build.getLabelOffset(entryLocations.epilogueStart);

    return true;
}
|
|
|
|
|
2023-03-24 18:03:04 +00:00
|
|
|
// Emits all shared helper routines and binds the corresponding labels in 'helpers'.
// The emission order matters: updatePcAndContinueInVm and exitContinueVmClearNativeFlag do not end
// with a branch, so each of them falls through into the helper that is emitted right after it.
void assembleHelpers(AssemblyBuilderA64& build, ModuleHelpers& helpers)
{
    if (build.logText)
        build.logAppend("; updatePcAndContinueInVm\n");
    build.setLabel(helpers.updatePcAndContinueInVm);
    emitUpdatePcForExit(build); // falls through to exitContinueVmClearNativeFlag

    if (build.logText)
        build.logAppend("; exitContinueVmClearNativeFlag\n");
    build.setLabel(helpers.exitContinueVmClearNativeFlag);
    emitClearNativeFlag(build); // falls through to exitContinueVm

    if (build.logText)
        build.logAppend("; exitContinueVm\n");
    build.setLabel(helpers.exitContinueVm);
    emitExit(build, /* continueInVm */ true);

    if (build.logText)
        build.logAppend("; exitNoContinueVm\n");
    build.setLabel(helpers.exitNoContinueVm);
    emitExit(build, /* continueInVm */ false);

    if (build.logText)
        build.logAppend("; reentry\n");
    build.setLabel(helpers.reentry);
    emitReentry(build, helpers);

    if (build.logText)
        build.logAppend("; interrupt\n");
    build.setLabel(helpers.interrupt);
    emitInterrupt(build);

    if (build.logText)
        build.logAppend("; return\n");
    build.setLabel(helpers.return_);
    emitReturn(build, helpers);
}
|
|
|
|
|
2023-03-17 19:20:37 +00:00
|
|
|
} // namespace A64
|
|
|
|
} // namespace CodeGen
|
|
|
|
} // namespace Luau
|