2022-10-13 23:59:53 +01:00
|
|
|
// This file is part of the Luau programming language and is licensed under MIT License; see LICENSE.txt for details
|
|
|
|
#include "Luau/CodeGen.h"
|
|
|
|
|
|
|
|
#include "Luau/Common.h"
|
|
|
|
#include "Luau/CodeAllocator.h"
|
|
|
|
#include "Luau/CodeBlockUnwind.h"
|
2023-02-03 12:34:12 +00:00
|
|
|
#include "Luau/IrAnalysis.h"
|
|
|
|
#include "Luau/IrBuilder.h"
|
2023-03-24 17:34:14 +00:00
|
|
|
#include "Luau/IrDump.h"
|
|
|
|
#include "Luau/IrUtils.h"
|
2023-02-24 18:24:22 +00:00
|
|
|
#include "Luau/OptimizeConstProp.h"
|
2023-02-10 18:50:54 +00:00
|
|
|
#include "Luau/OptimizeFinalX64.h"
|
2023-03-17 14:59:30 +00:00
|
|
|
|
2022-10-13 23:59:53 +01:00
|
|
|
#include "Luau/UnwindBuilder.h"
|
|
|
|
#include "Luau/UnwindBuilderDwarf2.h"
|
|
|
|
#include "Luau/UnwindBuilderWin.h"
|
|
|
|
|
2023-03-17 14:59:30 +00:00
|
|
|
#include "Luau/AssemblyBuilderA64.h"
|
2023-03-24 17:34:14 +00:00
|
|
|
#include "Luau/AssemblyBuilderX64.h"
|
2023-03-17 14:59:30 +00:00
|
|
|
|
2022-10-13 23:59:53 +01:00
|
|
|
#include "CustomExecUtils.h"
|
2023-03-24 17:34:14 +00:00
|
|
|
#include "NativeState.h"
|
|
|
|
|
2023-03-17 14:59:30 +00:00
|
|
|
#include "CodeGenA64.h"
|
2023-03-24 17:34:14 +00:00
|
|
|
#include "EmitCommonA64.h"
|
|
|
|
#include "IrLoweringA64.h"
|
|
|
|
|
|
|
|
#include "CodeGenX64.h"
|
2022-10-13 23:59:53 +01:00
|
|
|
#include "EmitCommonX64.h"
|
|
|
|
#include "EmitInstructionX64.h"
|
2023-01-27 21:28:45 +00:00
|
|
|
#include "IrLoweringX64.h"
|
2022-10-13 23:59:53 +01:00
|
|
|
|
|
|
|
#include "lapi.h"
|
|
|
|
|
2023-03-24 17:34:14 +00:00
|
|
|
#include <algorithm>
|
2022-10-13 23:59:53 +01:00
|
|
|
#include <memory>
|
|
|
|
|
|
|
|
#if defined(__x86_64__) || defined(_M_X64)
|
|
|
|
#ifdef _MSC_VER
|
|
|
|
#include <intrin.h> // __cpuid
|
|
|
|
#else
|
|
|
|
#include <cpuid.h> // __cpuid
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
|
2023-03-31 13:21:14 +01:00
|
|
|
#if defined(__aarch64__)
|
|
|
|
#ifdef __APPLE__
|
|
|
|
#include <sys/sysctl.h>
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
|
2023-02-24 18:24:22 +00:00
|
|
|
LUAU_FASTFLAGVARIABLE(DebugCodegenNoOpt, false)
|
2023-01-27 21:28:45 +00:00
|
|
|
|
2022-10-13 23:59:53 +01:00
|
|
|
namespace Luau
|
|
|
|
{
|
|
|
|
namespace CodeGen
|
|
|
|
{
|
|
|
|
|
2023-03-17 14:59:30 +00:00
|
|
|
static NativeProto* createNativeProto(Proto* proto, const IrBuilder& ir)
|
|
|
|
{
|
|
|
|
NativeProto* result = new NativeProto();
|
|
|
|
|
|
|
|
result->proto = proto;
|
|
|
|
result->instTargets = new uintptr_t[proto->sizecode];
|
|
|
|
|
|
|
|
for (int i = 0; i < proto->sizecode; i++)
|
|
|
|
{
|
|
|
|
auto [irLocation, asmLocation] = ir.function.bcMapping[i];
|
|
|
|
|
|
|
|
result->instTargets[i] = irLocation == ~0u ? 0 : asmLocation;
|
|
|
|
}
|
2022-10-21 18:33:43 +01:00
|
|
|
|
2023-03-17 14:59:30 +00:00
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2023-03-24 17:34:14 +00:00
|
|
|
template<typename AssemblyBuilder, typename IrLowering>
|
2023-04-07 20:56:27 +01:00
|
|
|
static bool lowerImpl(AssemblyBuilder& build, IrLowering& lowering, IrFunction& function, int bytecodeid, AssemblyOptions options)
|
2023-03-24 17:34:14 +00:00
|
|
|
{
|
|
|
|
// While we will need a better block ordering in the future, right now we want to mostly preserve build order with fallbacks outlined
|
|
|
|
std::vector<uint32_t> sortedBlocks;
|
|
|
|
sortedBlocks.reserve(function.blocks.size());
|
|
|
|
for (uint32_t i = 0; i < function.blocks.size(); i++)
|
|
|
|
sortedBlocks.push_back(i);
|
|
|
|
|
|
|
|
std::sort(sortedBlocks.begin(), sortedBlocks.end(), [&](uint32_t idxA, uint32_t idxB) {
|
|
|
|
const IrBlock& a = function.blocks[idxA];
|
|
|
|
const IrBlock& b = function.blocks[idxB];
|
|
|
|
|
|
|
|
// Place fallback blocks at the end
|
|
|
|
if ((a.kind == IrBlockKind::Fallback) != (b.kind == IrBlockKind::Fallback))
|
|
|
|
return (a.kind == IrBlockKind::Fallback) < (b.kind == IrBlockKind::Fallback);
|
|
|
|
|
|
|
|
// Try to order by instruction order
|
|
|
|
return a.start < b.start;
|
|
|
|
});
|
|
|
|
|
|
|
|
DenseHashMap<uint32_t, uint32_t> bcLocations{~0u};
|
|
|
|
|
|
|
|
// Create keys for IR assembly locations that original bytecode instruction are interested in
|
|
|
|
for (const auto& [irLocation, asmLocation] : function.bcMapping)
|
|
|
|
{
|
|
|
|
if (irLocation != ~0u)
|
|
|
|
bcLocations[irLocation] = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
DenseHashMap<uint32_t, uint32_t> indexIrToBc{~0u};
|
|
|
|
bool outputEnabled = options.includeAssembly || options.includeIr;
|
|
|
|
|
|
|
|
if (outputEnabled && options.annotator)
|
|
|
|
{
|
|
|
|
// Create reverse mapping from IR location to bytecode location
|
|
|
|
for (size_t i = 0; i < function.bcMapping.size(); ++i)
|
|
|
|
{
|
|
|
|
uint32_t irLocation = function.bcMapping[i].irLocation;
|
|
|
|
|
|
|
|
if (irLocation != ~0u)
|
|
|
|
indexIrToBc[irLocation] = uint32_t(i);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
IrToStringContext ctx{build.text, function.blocks, function.constants, function.cfg};
|
|
|
|
|
|
|
|
// We use this to skip outlined fallback blocks from IR/asm text output
|
|
|
|
size_t textSize = build.text.length();
|
|
|
|
uint32_t codeSize = build.getCodeSize();
|
|
|
|
bool seenFallback = false;
|
|
|
|
|
|
|
|
IrBlock dummy;
|
|
|
|
dummy.start = ~0u;
|
|
|
|
|
|
|
|
for (size_t i = 0; i < sortedBlocks.size(); ++i)
|
|
|
|
{
|
|
|
|
uint32_t blockIndex = sortedBlocks[i];
|
|
|
|
|
|
|
|
IrBlock& block = function.blocks[blockIndex];
|
|
|
|
|
|
|
|
if (block.kind == IrBlockKind::Dead)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
LUAU_ASSERT(block.start != ~0u);
|
|
|
|
LUAU_ASSERT(block.finish != ~0u);
|
|
|
|
|
|
|
|
// If we want to skip fallback code IR/asm, we'll record when those blocks start once we see them
|
|
|
|
if (block.kind == IrBlockKind::Fallback && !seenFallback)
|
|
|
|
{
|
|
|
|
textSize = build.text.length();
|
|
|
|
codeSize = build.getCodeSize();
|
|
|
|
seenFallback = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (options.includeIr)
|
|
|
|
{
|
|
|
|
build.logAppend("# ");
|
|
|
|
toStringDetailed(ctx, block, blockIndex, /* includeUseInfo */ true);
|
|
|
|
}
|
|
|
|
|
|
|
|
build.setLabel(block.label);
|
|
|
|
|
|
|
|
for (uint32_t index = block.start; index <= block.finish; index++)
|
|
|
|
{
|
|
|
|
LUAU_ASSERT(index < function.instructions.size());
|
|
|
|
|
|
|
|
// If IR instruction is the first one for the original bytecode, we can annotate it with source code text
|
|
|
|
if (outputEnabled && options.annotator)
|
|
|
|
{
|
|
|
|
if (uint32_t* bcIndex = indexIrToBc.find(index))
|
|
|
|
options.annotator(options.annotatorContext, build.text, bytecodeid, *bcIndex);
|
|
|
|
}
|
|
|
|
|
|
|
|
// If bytecode needs the location of this instruction for jumps, record it
|
|
|
|
if (uint32_t* bcLocation = bcLocations.find(index))
|
|
|
|
{
|
|
|
|
Label label = (index == block.start) ? block.label : build.setLabel();
|
|
|
|
*bcLocation = build.getLabelOffset(label);
|
|
|
|
}
|
|
|
|
|
|
|
|
IrInst& inst = function.instructions[index];
|
|
|
|
|
|
|
|
// Skip pseudo instructions, but make sure they are not used at this stage
|
|
|
|
// This also prevents them from getting into text output when that's enabled
|
|
|
|
if (isPseudo(inst.cmd))
|
|
|
|
{
|
|
|
|
LUAU_ASSERT(inst.useCount == 0);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (options.includeIr)
|
|
|
|
{
|
|
|
|
build.logAppend("# ");
|
|
|
|
toStringDetailed(ctx, inst, index, /* includeUseInfo */ true);
|
|
|
|
}
|
|
|
|
|
|
|
|
IrBlock& next = i + 1 < sortedBlocks.size() ? function.blocks[sortedBlocks[i + 1]] : dummy;
|
|
|
|
|
|
|
|
lowering.lowerInst(inst, index, next);
|
2023-04-07 20:56:27 +01:00
|
|
|
|
|
|
|
if (lowering.hasError())
|
|
|
|
return false;
|
2023-03-24 17:34:14 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if (options.includeIr)
|
|
|
|
build.logAppend("#\n");
|
|
|
|
}
|
|
|
|
|
|
|
|
if (outputEnabled && !options.includeOutlinedCode && seenFallback)
|
|
|
|
{
|
|
|
|
build.text.resize(textSize);
|
|
|
|
|
|
|
|
if (options.includeAssembly)
|
|
|
|
build.logAppend("; skipping %u bytes of outlined code\n", unsigned((build.getCodeSize() - codeSize) * sizeof(build.code[0])));
|
|
|
|
}
|
|
|
|
|
|
|
|
// Copy assembly locations of IR instructions that are mapped to bytecode instructions
|
|
|
|
for (auto& [irLocation, asmLocation] : function.bcMapping)
|
|
|
|
{
|
|
|
|
if (irLocation != ~0u)
|
|
|
|
asmLocation = bcLocations[irLocation];
|
|
|
|
}
|
2023-04-07 20:56:27 +01:00
|
|
|
|
|
|
|
return true;
|
2023-03-24 17:34:14 +00:00
|
|
|
}
|
|
|
|
|
2023-03-31 13:21:14 +01:00
|
|
|
[[maybe_unused]] static bool lowerIr(
|
2023-03-17 14:59:30 +00:00
|
|
|
X64::AssemblyBuilderX64& build, IrBuilder& ir, NativeState& data, ModuleHelpers& helpers, Proto* proto, AssemblyOptions options)
|
2022-10-27 23:22:49 +01:00
|
|
|
{
|
2023-03-17 14:59:30 +00:00
|
|
|
constexpr uint32_t kFunctionAlignment = 32;
|
2022-10-27 23:22:49 +01:00
|
|
|
|
2023-03-17 14:59:30 +00:00
|
|
|
optimizeMemoryOperandsX64(ir.function);
|
2022-11-04 17:02:37 +00:00
|
|
|
|
2023-03-17 14:59:30 +00:00
|
|
|
build.align(kFunctionAlignment, X64::AlignmentDataX64::Ud2);
|
|
|
|
|
2023-03-24 17:34:14 +00:00
|
|
|
X64::IrLoweringX64 lowering(build, helpers, data, ir.function);
|
2023-03-17 14:59:30 +00:00
|
|
|
|
2023-04-07 20:56:27 +01:00
|
|
|
return lowerImpl(build, lowering, ir.function, proto->bytecodeid, options);
|
2022-10-27 23:22:49 +01:00
|
|
|
}
|
|
|
|
|
2023-03-31 13:21:14 +01:00
|
|
|
[[maybe_unused]] static bool lowerIr(
|
2023-03-17 14:59:30 +00:00
|
|
|
A64::AssemblyBuilderA64& build, IrBuilder& ir, NativeState& data, ModuleHelpers& helpers, Proto* proto, AssemblyOptions options)
|
2022-10-13 23:59:53 +01:00
|
|
|
{
|
2023-03-31 13:21:14 +01:00
|
|
|
if (!A64::IrLoweringA64::canLower(ir.function))
|
|
|
|
return false;
|
2022-10-13 23:59:53 +01:00
|
|
|
|
2023-03-31 13:21:14 +01:00
|
|
|
A64::IrLoweringA64 lowering(build, helpers, data, proto, ir.function);
|
2022-10-13 23:59:53 +01:00
|
|
|
|
2023-04-07 20:56:27 +01:00
|
|
|
return lowerImpl(build, lowering, ir.function, proto->bytecodeid, options);
|
2023-03-17 14:59:30 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
template<typename AssemblyBuilder>
|
|
|
|
static NativeProto* assembleFunction(AssemblyBuilder& build, NativeState& data, ModuleHelpers& helpers, Proto* proto, AssemblyOptions options)
|
|
|
|
{
|
2023-01-27 21:28:45 +00:00
|
|
|
if (options.includeAssembly || options.includeIr)
|
2022-10-13 23:59:53 +01:00
|
|
|
{
|
|
|
|
if (proto->debugname)
|
2023-03-10 19:20:04 +00:00
|
|
|
build.logAppend("; function %s(", getstr(proto->debugname));
|
2022-10-13 23:59:53 +01:00
|
|
|
else
|
2023-03-10 19:20:04 +00:00
|
|
|
build.logAppend("; function(");
|
|
|
|
|
|
|
|
for (int i = 0; i < proto->numparams; i++)
|
|
|
|
{
|
|
|
|
LocVar* var = proto->locvars ? &proto->locvars[proto->sizelocvars - proto->numparams + i] : nullptr;
|
|
|
|
|
|
|
|
if (var && var->varname)
|
|
|
|
build.logAppend("%s%s", i == 0 ? "" : ", ", getstr(var->varname));
|
|
|
|
else
|
|
|
|
build.logAppend("%s$arg%d", i == 0 ? "" : ", ", i);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (proto->numparams != 0 && proto->is_vararg)
|
|
|
|
build.logAppend(", ...)");
|
|
|
|
else
|
|
|
|
build.logAppend(")");
|
2022-10-13 23:59:53 +01:00
|
|
|
|
|
|
|
if (proto->linedefined >= 0)
|
|
|
|
build.logAppend(" line %d\n", proto->linedefined);
|
|
|
|
else
|
|
|
|
build.logAppend("\n");
|
|
|
|
}
|
|
|
|
|
2023-03-17 14:59:30 +00:00
|
|
|
IrBuilder ir;
|
|
|
|
ir.buildFunctionIr(proto);
|
2022-10-21 18:33:43 +01:00
|
|
|
|
2023-03-24 17:34:14 +00:00
|
|
|
computeCfgInfo(ir.function);
|
|
|
|
|
2023-02-24 18:24:22 +00:00
|
|
|
if (!FFlag::DebugCodegenNoOpt)
|
2022-10-27 23:22:49 +01:00
|
|
|
{
|
2023-03-17 14:59:30 +00:00
|
|
|
constPropInBlockChains(ir);
|
2022-10-27 23:22:49 +01:00
|
|
|
}
|
|
|
|
|
2023-03-31 13:21:14 +01:00
|
|
|
if (!lowerIr(build, ir, data, helpers, proto, options))
|
|
|
|
{
|
|
|
|
if (build.logText)
|
|
|
|
build.logAppend("; skipping (can't lower)\n\n");
|
|
|
|
|
|
|
|
return nullptr;
|
|
|
|
}
|
2022-10-13 23:59:53 +01:00
|
|
|
|
|
|
|
if (build.logText)
|
|
|
|
build.logAppend("\n");
|
|
|
|
|
2023-03-17 14:59:30 +00:00
|
|
|
return createNativeProto(proto, ir);
|
2022-10-13 23:59:53 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
static void destroyNativeProto(NativeProto* nativeProto)
|
|
|
|
{
|
|
|
|
delete[] nativeProto->instTargets;
|
|
|
|
delete nativeProto;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void onCloseState(lua_State* L)
|
|
|
|
{
|
|
|
|
destroyNativeState(L);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void onDestroyFunction(lua_State* L, Proto* proto)
|
|
|
|
{
|
|
|
|
NativeProto* nativeProto = getProtoExecData(proto);
|
|
|
|
LUAU_ASSERT(nativeProto->proto == proto);
|
|
|
|
|
|
|
|
setProtoExecData(proto, nullptr);
|
|
|
|
destroyNativeProto(nativeProto);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int onEnter(lua_State* L, Proto* proto)
|
|
|
|
{
|
|
|
|
if (L->singlestep)
|
|
|
|
return 1;
|
|
|
|
|
|
|
|
NativeState* data = getNativeState(L);
|
|
|
|
|
|
|
|
if (!L->ci->savedpc)
|
|
|
|
L->ci->savedpc = proto->code;
|
|
|
|
|
|
|
|
// We will jump into native code through a gateway
|
|
|
|
bool (*gate)(lua_State*, Proto*, uintptr_t, NativeContext*) = (bool (*)(lua_State*, Proto*, uintptr_t, NativeContext*))data->context.gateEntry;
|
|
|
|
|
|
|
|
NativeProto* nativeProto = getProtoExecData(proto);
|
|
|
|
uintptr_t target = nativeProto->instTargets[L->ci->savedpc - proto->code];
|
|
|
|
|
|
|
|
// Returns 1 to finish the function in the VM
|
|
|
|
return gate(L, proto, target, &data->context);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void onSetBreakpoint(lua_State* L, Proto* proto, int instruction)
|
|
|
|
{
|
|
|
|
if (!getProtoExecData(proto))
|
|
|
|
return;
|
|
|
|
|
|
|
|
LUAU_ASSERT(!"native breakpoints are not implemented");
|
|
|
|
}
|
|
|
|
|
2023-03-31 13:21:14 +01:00
|
|
|
#if defined(__aarch64__)
|
|
|
|
static unsigned int getCpuFeaturesA64()
|
|
|
|
{
|
|
|
|
unsigned int result = 0;
|
|
|
|
|
|
|
|
#ifdef __APPLE__
|
|
|
|
int jscvt = 0;
|
|
|
|
size_t jscvtLen = sizeof(jscvt);
|
|
|
|
if (sysctlbyname("hw.optional.arm.FEAT_JSCVT", &jscvt, &jscvtLen, nullptr, 0) == 0 && jscvt == 1)
|
|
|
|
result |= A64::Feature_JSCVT;
|
|
|
|
#endif
|
|
|
|
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2022-10-13 23:59:53 +01:00
|
|
|
bool isSupported()
|
|
|
|
{
|
|
|
|
#if !LUA_CUSTOM_EXECUTION
|
|
|
|
return false;
|
|
|
|
#elif defined(__x86_64__) || defined(_M_X64)
|
|
|
|
if (LUA_EXTRA_SIZE != 1)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (sizeof(TValue) != 16)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (sizeof(LuaNode) != 32)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
int cpuinfo[4] = {};
|
|
|
|
#ifdef _MSC_VER
|
|
|
|
__cpuid(cpuinfo, 1);
|
|
|
|
#else
|
|
|
|
__cpuid(1, cpuinfo[0], cpuinfo[1], cpuinfo[2], cpuinfo[3]);
|
|
|
|
#endif
|
|
|
|
|
|
|
|
// We require AVX1 support for VEX encoded XMM operations
|
|
|
|
// We also requre SSE4.1 support for ROUNDSD but the AVX check below covers it
|
|
|
|
// https://en.wikipedia.org/wiki/CPUID#EAX=1:_Processor_Info_and_Feature_Bits
|
|
|
|
if ((cpuinfo[2] & (1 << 28)) == 0)
|
|
|
|
return false;
|
|
|
|
|
2023-03-17 14:59:30 +00:00
|
|
|
return true;
|
|
|
|
#elif defined(__aarch64__)
|
2023-03-31 13:21:14 +01:00
|
|
|
if (LUA_EXTRA_SIZE != 1)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (sizeof(TValue) != 16)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (sizeof(LuaNode) != 32)
|
|
|
|
return false;
|
|
|
|
|
2023-03-24 17:34:14 +00:00
|
|
|
// TODO: A64 codegen does not generate correct unwind info at the moment so it requires longjmp instead of C++ exceptions
|
2023-03-31 13:21:14 +01:00
|
|
|
if (!LUA_USE_LONGJMP)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
return true;
|
2022-10-13 23:59:53 +01:00
|
|
|
#else
|
|
|
|
return false;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
|
|
|
void create(lua_State* L)
|
|
|
|
{
|
|
|
|
LUAU_ASSERT(isSupported());
|
|
|
|
|
|
|
|
NativeState& data = *createNativeState(L);
|
|
|
|
|
|
|
|
#if defined(_WIN32)
|
|
|
|
data.unwindBuilder = std::make_unique<UnwindBuilderWin>();
|
|
|
|
#else
|
|
|
|
data.unwindBuilder = std::make_unique<UnwindBuilderDwarf2>();
|
|
|
|
#endif
|
|
|
|
|
|
|
|
data.codeAllocator.context = data.unwindBuilder.get();
|
|
|
|
data.codeAllocator.createBlockUnwindInfo = createBlockUnwindInfo;
|
|
|
|
data.codeAllocator.destroyBlockUnwindInfo = destroyBlockUnwindInfo;
|
|
|
|
|
|
|
|
initFallbackTable(data);
|
|
|
|
initHelperFunctions(data);
|
|
|
|
|
2023-03-17 14:59:30 +00:00
|
|
|
#if defined(__x86_64__) || defined(_M_X64)
|
2023-03-03 13:45:38 +00:00
|
|
|
if (!X64::initEntryFunction(data))
|
2022-10-13 23:59:53 +01:00
|
|
|
{
|
|
|
|
destroyNativeState(L);
|
|
|
|
return;
|
|
|
|
}
|
2023-03-17 14:59:30 +00:00
|
|
|
#elif defined(__aarch64__)
|
|
|
|
if (!A64::initEntryFunction(data))
|
|
|
|
{
|
|
|
|
destroyNativeState(L);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
#endif
|
2022-10-13 23:59:53 +01:00
|
|
|
|
|
|
|
lua_ExecutionCallbacks* ecb = getExecutionCallbacks(L);
|
|
|
|
|
|
|
|
ecb->close = onCloseState;
|
|
|
|
ecb->destroy = onDestroyFunction;
|
|
|
|
ecb->enter = onEnter;
|
|
|
|
ecb->setbreakpoint = onSetBreakpoint;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void gatherFunctions(std::vector<Proto*>& results, Proto* proto)
|
|
|
|
{
|
|
|
|
if (results.size() <= size_t(proto->bytecodeid))
|
|
|
|
results.resize(proto->bytecodeid + 1);
|
|
|
|
|
|
|
|
// Skip protos that we've already compiled in this run: this happens because at -O2, inlined functions get their protos reused
|
|
|
|
if (results[proto->bytecodeid])
|
|
|
|
return;
|
|
|
|
|
|
|
|
results[proto->bytecodeid] = proto;
|
|
|
|
|
|
|
|
for (int i = 0; i < proto->sizep; i++)
|
|
|
|
gatherFunctions(results, proto->p[i]);
|
|
|
|
}
|
|
|
|
|
|
|
|
void compile(lua_State* L, int idx)
|
|
|
|
{
|
|
|
|
LUAU_ASSERT(lua_isLfunction(L, idx));
|
|
|
|
const TValue* func = luaA_toobject(L, idx);
|
|
|
|
|
|
|
|
// If initialization has failed, do not compile any functions
|
|
|
|
if (!getNativeState(L))
|
|
|
|
return;
|
|
|
|
|
2023-03-17 14:59:30 +00:00
|
|
|
#if defined(__aarch64__)
|
2023-03-31 13:21:14 +01:00
|
|
|
A64::AssemblyBuilderA64 build(/* logText= */ false, getCpuFeaturesA64());
|
2023-03-17 14:59:30 +00:00
|
|
|
#else
|
2023-03-03 13:45:38 +00:00
|
|
|
X64::AssemblyBuilderX64 build(/* logText= */ false);
|
2023-03-17 14:59:30 +00:00
|
|
|
#endif
|
|
|
|
|
2022-10-13 23:59:53 +01:00
|
|
|
NativeState* data = getNativeState(L);
|
|
|
|
|
|
|
|
std::vector<Proto*> protos;
|
|
|
|
gatherFunctions(protos, clvalue(func)->l.p);
|
|
|
|
|
2022-10-27 23:22:49 +01:00
|
|
|
ModuleHelpers helpers;
|
2023-03-24 17:34:14 +00:00
|
|
|
#if defined(__aarch64__)
|
|
|
|
A64::assembleHelpers(build, helpers);
|
|
|
|
#else
|
2023-03-17 14:59:30 +00:00
|
|
|
X64::assembleHelpers(build, helpers);
|
|
|
|
#endif
|
2022-10-27 23:22:49 +01:00
|
|
|
|
2022-10-13 23:59:53 +01:00
|
|
|
std::vector<NativeProto*> results;
|
|
|
|
results.reserve(protos.size());
|
|
|
|
|
|
|
|
// Skip protos that have been compiled during previous invocations of CodeGen::compile
|
|
|
|
for (Proto* p : protos)
|
|
|
|
if (p && getProtoExecData(p) == nullptr)
|
2023-03-31 13:21:14 +01:00
|
|
|
if (NativeProto* np = assembleFunction(build, *data, helpers, p, {}))
|
|
|
|
results.push_back(np);
|
2022-10-13 23:59:53 +01:00
|
|
|
|
|
|
|
build.finalize();
|
|
|
|
|
2023-03-31 13:21:14 +01:00
|
|
|
// If no functions were assembled, we don't need to allocate/copy executable pages for helpers
|
|
|
|
if (results.empty())
|
|
|
|
return;
|
|
|
|
|
2022-10-13 23:59:53 +01:00
|
|
|
uint8_t* nativeData = nullptr;
|
|
|
|
size_t sizeNativeData = 0;
|
|
|
|
uint8_t* codeStart = nullptr;
|
2023-03-17 14:59:30 +00:00
|
|
|
if (!data->codeAllocator.allocate(build.data.data(), int(build.data.size()), reinterpret_cast<const uint8_t*>(build.code.data()),
|
|
|
|
int(build.code.size() * sizeof(build.code[0])), nativeData, sizeNativeData, codeStart))
|
2022-10-13 23:59:53 +01:00
|
|
|
{
|
|
|
|
for (NativeProto* result : results)
|
|
|
|
destroyNativeProto(result);
|
|
|
|
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Relocate instruction offsets
|
|
|
|
for (NativeProto* result : results)
|
|
|
|
{
|
|
|
|
for (int i = 0; i < result->proto->sizecode; i++)
|
2023-03-17 14:59:30 +00:00
|
|
|
result->instTargets[i] += uintptr_t(codeStart);
|
2022-11-04 17:02:37 +00:00
|
|
|
|
|
|
|
LUAU_ASSERT(result->proto->sizecode);
|
|
|
|
result->entryTarget = result->instTargets[0];
|
2022-10-13 23:59:53 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// Link native proto objects to Proto; the memory is now managed by VM and will be freed via onDestroyFunction
|
|
|
|
for (NativeProto* result : results)
|
|
|
|
setProtoExecData(result->proto, result);
|
|
|
|
}
|
|
|
|
|
2022-10-21 18:33:43 +01:00
|
|
|
std::string getAssembly(lua_State* L, int idx, AssemblyOptions options)
|
2022-10-13 23:59:53 +01:00
|
|
|
{
|
|
|
|
LUAU_ASSERT(lua_isLfunction(L, idx));
|
|
|
|
const TValue* func = luaA_toobject(L, idx);
|
|
|
|
|
2023-03-17 14:59:30 +00:00
|
|
|
#if defined(__aarch64__)
|
2023-03-31 13:21:14 +01:00
|
|
|
A64::AssemblyBuilderA64 build(/* logText= */ options.includeAssembly, getCpuFeaturesA64());
|
2023-03-17 14:59:30 +00:00
|
|
|
#else
|
2023-03-03 13:45:38 +00:00
|
|
|
X64::AssemblyBuilderX64 build(/* logText= */ options.includeAssembly);
|
2023-03-17 14:59:30 +00:00
|
|
|
#endif
|
2022-10-21 18:33:43 +01:00
|
|
|
|
2022-10-13 23:59:53 +01:00
|
|
|
NativeState data;
|
|
|
|
initFallbackTable(data);
|
|
|
|
|
|
|
|
std::vector<Proto*> protos;
|
|
|
|
gatherFunctions(protos, clvalue(func)->l.p);
|
|
|
|
|
2022-10-27 23:22:49 +01:00
|
|
|
ModuleHelpers helpers;
|
2023-03-24 17:34:14 +00:00
|
|
|
#if defined(__aarch64__)
|
|
|
|
A64::assembleHelpers(build, helpers);
|
|
|
|
#else
|
2023-03-17 14:59:30 +00:00
|
|
|
X64::assembleHelpers(build, helpers);
|
|
|
|
#endif
|
2022-10-27 23:22:49 +01:00
|
|
|
|
2022-10-13 23:59:53 +01:00
|
|
|
for (Proto* p : protos)
|
|
|
|
if (p)
|
2023-03-31 13:21:14 +01:00
|
|
|
if (NativeProto* np = assembleFunction(build, data, helpers, p, options))
|
|
|
|
destroyNativeProto(np);
|
2022-10-13 23:59:53 +01:00
|
|
|
|
|
|
|
build.finalize();
|
|
|
|
|
2022-10-21 18:33:43 +01:00
|
|
|
if (options.outputBinary)
|
2023-03-24 17:34:14 +00:00
|
|
|
return std::string(reinterpret_cast<const char*>(build.code.data()), reinterpret_cast<const char*>(build.code.data() + build.code.size())) +
|
2023-03-17 14:59:30 +00:00
|
|
|
std::string(build.data.begin(), build.data.end());
|
2022-10-21 18:33:43 +01:00
|
|
|
else
|
|
|
|
return build.text;
|
2022-10-13 23:59:53 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
} // namespace CodeGen
|
|
|
|
} // namespace Luau
|