mirror of
https://github.com/luau-lang/luau.git
synced 2025-01-08 12:29:09 +00:00
c7c986b996
* Fixed `Frontend::markDirty` not working on modules that were not typechecked yet * Fixed generic variadic function unification succeeding when it should have reported an error New Type Solver: * Implemented semantic subtyping check for function types Native Code Generation: * Improved performance of numerical loops with a constant step * Simplified IR for `bit32.extract` calls extracting first/last bits * Improved performance of NaN checks
225 lines
8.1 KiB
C++
225 lines
8.1 KiB
C++
// This file is part of the Luau programming language and is licensed under MIT License; see LICENSE.txt for details
|
|
#pragma once
|
|
|
|
#include "Luau/AssemblyBuilderX64.h"
|
|
|
|
#include "EmitCommon.h"
|
|
|
|
#include "lobject.h"
|
|
#include "ltm.h"
|
|
|
|
// MS x64 ABI reminder:
|
|
// Arguments: rcx, rdx, r8, r9 ('overlapped' with xmm0-xmm3)
|
|
// Return: rax, xmm0
|
|
// Nonvolatile: r12-r15, rdi, rsi, rbx, rbp
|
|
// SIMD: only xmm6-xmm15 are non-volatile, all ymm upper parts are volatile
|
|
|
|
// AMD64 ABI reminder:
|
|
// Arguments: rdi, rsi, rdx, rcx, r8, r9 (xmm0-xmm7)
|
|
// Return: rax, rdx, xmm0, xmm1
|
|
// Nonvolatile: r12-r15, rbx, rbp
|
|
// SIMD: all volatile
|
|
|
|
namespace Luau
|
|
{
|
|
namespace CodeGen
|
|
{
|
|
|
|
enum class IrCondition : uint8_t;
|
|
struct NativeState;
|
|
struct IrOp;
|
|
|
|
namespace X64
|
|
{
|
|
|
|
struct IrRegAllocX64;
|
|
|
|
constexpr uint32_t kFunctionAlignment = 32;
|
|
|
|
// Data that is very common to access is placed in non-volatile registers
|
|
constexpr RegisterX64 rState = r15; // lua_State* L
|
|
constexpr RegisterX64 rBase = r14; // StkId base
|
|
constexpr RegisterX64 rNativeContext = r13; // NativeContext* context
|
|
constexpr RegisterX64 rConstants = r12; // TValue* k
|
|
|
|
constexpr unsigned kExtraLocals = 3; // Number of 8 byte slots available for specialized local variables specified below
|
|
constexpr unsigned kSpillSlots = 5; // Number of 8 byte slots available for register allocator to spill data into
|
|
static_assert((kExtraLocals + kSpillSlots) * 8 % 16 == 0, "locals have to preserve 16 byte alignment");
|
|
|
|
constexpr uint8_t kWindowsFirstNonVolXmmReg = 6;
|
|
|
|
constexpr uint8_t kWindowsUsableXmmRegs = 10; // Some xmm regs are non-volatile, we have to balance how many we want to use/preserve
|
|
constexpr uint8_t kSystemVUsableXmmRegs = 16; // All xmm regs are volatile
|
|
|
|
inline uint8_t getXmmRegisterCount(ABIX64 abi)
|
|
{
|
|
return abi == ABIX64::SystemV ? kSystemVUsableXmmRegs : kWindowsUsableXmmRegs;
|
|
}
|
|
|
|
// Native code is as stackless as the interpreter, so we can place some data on the stack once and have it accessible at any point
|
|
// Stack is separated into sections for different data. See CodeGenX64.cpp for layout overview
|
|
constexpr unsigned kStackAlign = 8; // Bytes we need to align the stack for non-vol xmm register storage
|
|
constexpr unsigned kStackLocalStorage = 8 * kExtraLocals;
|
|
constexpr unsigned kStackSpillStorage = 8 * kSpillSlots;
|
|
constexpr unsigned kStackExtraArgumentStorage = 2 * 8; // Bytes for 5th and 6th function call arguments used under Windows ABI
|
|
constexpr unsigned kStackRegHomeStorage = 4 * 8; // Register 'home' locations that can be used by callees under Windows ABI
|
|
|
|
inline unsigned getNonVolXmmStorageSize(ABIX64 abi, uint8_t xmmRegCount)
|
|
{
|
|
if (abi == ABIX64::SystemV)
|
|
return 0;
|
|
|
|
// First 6 are volatile
|
|
if (xmmRegCount <= kWindowsFirstNonVolXmmReg)
|
|
return 0;
|
|
|
|
LUAU_ASSERT(xmmRegCount <= 16);
|
|
return (xmmRegCount - kWindowsFirstNonVolXmmReg) * 16;
|
|
}
|
|
|
|
// Useful offsets to specific parts
|
|
constexpr unsigned kStackOffsetToLocals = kStackExtraArgumentStorage + kStackRegHomeStorage;
|
|
constexpr unsigned kStackOffsetToSpillSlots = kStackOffsetToLocals + kStackLocalStorage;
|
|
|
|
inline unsigned getFullStackSize(ABIX64 abi, uint8_t xmmRegCount)
|
|
{
|
|
return kStackOffsetToSpillSlots + kStackSpillStorage + getNonVolXmmStorageSize(abi, xmmRegCount) + kStackAlign;
|
|
}
|
|
|
|
constexpr OperandX64 sClosure = qword[rsp + kStackOffsetToLocals + 0]; // Closure* cl
|
|
constexpr OperandX64 sCode = qword[rsp + kStackOffsetToLocals + 8]; // Instruction* code
|
|
constexpr OperandX64 sTemporarySlot = addr[rsp + kStackOffsetToLocals + 16];
|
|
|
|
constexpr OperandX64 sSpillArea = addr[rsp + kStackOffsetToSpillSlots];
|
|
|
|
inline OperandX64 luauReg(int ri)
|
|
{
|
|
return xmmword[rBase + ri * sizeof(TValue)];
|
|
}
|
|
|
|
inline OperandX64 luauRegAddress(int ri)
|
|
{
|
|
return addr[rBase + ri * sizeof(TValue)];
|
|
}
|
|
|
|
inline OperandX64 luauRegValue(int ri)
|
|
{
|
|
return qword[rBase + ri * sizeof(TValue) + offsetof(TValue, value)];
|
|
}
|
|
|
|
inline OperandX64 luauRegTag(int ri)
|
|
{
|
|
return dword[rBase + ri * sizeof(TValue) + offsetof(TValue, tt)];
|
|
}
|
|
|
|
inline OperandX64 luauRegValueInt(int ri)
|
|
{
|
|
return dword[rBase + ri * sizeof(TValue) + offsetof(TValue, value)];
|
|
}
|
|
|
|
inline OperandX64 luauRegValueVector(int ri, int index)
|
|
{
|
|
return dword[rBase + ri * sizeof(TValue) + offsetof(TValue, value) + (sizeof(float) * index)];
|
|
}
|
|
|
|
inline OperandX64 luauConstant(int ki)
|
|
{
|
|
return xmmword[rConstants + ki * sizeof(TValue)];
|
|
}
|
|
|
|
inline OperandX64 luauConstantAddress(int ki)
|
|
{
|
|
return addr[rConstants + ki * sizeof(TValue)];
|
|
}
|
|
|
|
inline OperandX64 luauConstantTag(int ki)
|
|
{
|
|
return dword[rConstants + ki * sizeof(TValue) + offsetof(TValue, tt)];
|
|
}
|
|
|
|
inline OperandX64 luauConstantValue(int ki)
|
|
{
|
|
return qword[rConstants + ki * sizeof(TValue) + offsetof(TValue, value)];
|
|
}
|
|
|
|
inline OperandX64 luauNodeKeyValue(RegisterX64 node)
|
|
{
|
|
return qword[node + offsetof(LuaNode, key) + offsetof(TKey, value)];
|
|
}
|
|
|
|
// Note: tag has dirty upper bits
|
|
inline OperandX64 luauNodeKeyTag(RegisterX64 node)
|
|
{
|
|
return dword[node + offsetof(LuaNode, key) + kOffsetOfTKeyTagNext];
|
|
}
|
|
|
|
inline void setLuauReg(AssemblyBuilderX64& build, RegisterX64 tmp, int ri, OperandX64 op)
|
|
{
|
|
LUAU_ASSERT(op.cat == CategoryX64::mem);
|
|
|
|
build.vmovups(tmp, op);
|
|
build.vmovups(luauReg(ri), tmp);
|
|
}
|
|
|
|
inline void jumpIfTagIs(AssemblyBuilderX64& build, int ri, lua_Type tag, Label& label)
|
|
{
|
|
build.cmp(luauRegTag(ri), tag);
|
|
build.jcc(ConditionX64::Equal, label);
|
|
}
|
|
|
|
inline void jumpIfTagIsNot(AssemblyBuilderX64& build, int ri, lua_Type tag, Label& label)
|
|
{
|
|
build.cmp(luauRegTag(ri), tag);
|
|
build.jcc(ConditionX64::NotEqual, label);
|
|
}
|
|
|
|
// Note: fallthrough label should be placed after this condition
|
|
inline void jumpIfFalsy(AssemblyBuilderX64& build, int ri, Label& target, Label& fallthrough)
|
|
{
|
|
jumpIfTagIs(build, ri, LUA_TNIL, target); // false if nil
|
|
jumpIfTagIsNot(build, ri, LUA_TBOOLEAN, fallthrough); // true if not nil or boolean
|
|
|
|
build.cmp(luauRegValueInt(ri), 0);
|
|
build.jcc(ConditionX64::Equal, target); // true if boolean value is 'true'
|
|
}
|
|
|
|
// Note: fallthrough label should be placed after this condition
|
|
inline void jumpIfTruthy(AssemblyBuilderX64& build, int ri, Label& target, Label& fallthrough)
|
|
{
|
|
jumpIfTagIs(build, ri, LUA_TNIL, fallthrough); // false if nil
|
|
jumpIfTagIsNot(build, ri, LUA_TBOOLEAN, target); // true if not nil or boolean
|
|
|
|
build.cmp(luauRegValueInt(ri), 0);
|
|
build.jcc(ConditionX64::NotEqual, target); // true if boolean value is 'true'
|
|
}
|
|
|
|
void jumpOnNumberCmp(AssemblyBuilderX64& build, RegisterX64 tmp, OperandX64 lhs, OperandX64 rhs, IrCondition cond, Label& label);
|
|
|
|
ConditionX64 getConditionInt(IrCondition cond);
|
|
|
|
void getTableNodeAtCachedSlot(AssemblyBuilderX64& build, RegisterX64 tmp, RegisterX64 node, RegisterX64 table, int pcpos);
|
|
void convertNumberToIndexOrJump(AssemblyBuilderX64& build, RegisterX64 tmp, RegisterX64 numd, RegisterX64 numi, Label& label);
|
|
|
|
void callArithHelper(IrRegAllocX64& regs, AssemblyBuilderX64& build, int ra, int rb, OperandX64 c, TMS tm);
|
|
void callLengthHelper(IrRegAllocX64& regs, AssemblyBuilderX64& build, int ra, int rb);
|
|
void callGetTable(IrRegAllocX64& regs, AssemblyBuilderX64& build, int rb, OperandX64 c, int ra);
|
|
void callSetTable(IrRegAllocX64& regs, AssemblyBuilderX64& build, int rb, OperandX64 c, int ra);
|
|
void checkObjectBarrierConditions(AssemblyBuilderX64& build, RegisterX64 tmp, RegisterX64 object, IrOp ra, int ratag, Label& skip);
|
|
void callBarrierObject(IrRegAllocX64& regs, AssemblyBuilderX64& build, RegisterX64 object, IrOp objectOp, IrOp ra, int ratag);
|
|
void callBarrierTableFast(IrRegAllocX64& regs, AssemblyBuilderX64& build, RegisterX64 table, IrOp tableOp);
|
|
void callStepGc(IrRegAllocX64& regs, AssemblyBuilderX64& build);
|
|
|
|
void emitClearNativeFlag(AssemblyBuilderX64& build);
|
|
void emitExit(AssemblyBuilderX64& build, bool continueInVm);
|
|
void emitUpdateBase(AssemblyBuilderX64& build);
|
|
void emitInterrupt(AssemblyBuilderX64& build);
|
|
void emitFallback(IrRegAllocX64& regs, AssemblyBuilderX64& build, int offset, int pcpos);
|
|
|
|
void emitUpdatePcForExit(AssemblyBuilderX64& build);
|
|
void emitContinueCallInVm(AssemblyBuilderX64& build);
|
|
|
|
void emitReturn(AssemblyBuilderX64& build, ModuleHelpers& helpers);
|
|
|
|
} // namespace X64
|
|
} // namespace CodeGen
|
|
} // namespace Luau
|