2021-10-29 21:25:12 +01:00
|
|
|
// This file is part of the Luau programming language and is licensed under MIT License; see LICENSE.txt for details
|
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#include "Luau/Bytecode.h"
|
|
|
|
#include "Luau/DenseHash.h"
|
2022-04-21 22:44:27 +01:00
|
|
|
#include "Luau/StringUtils.h"
|
2021-10-29 21:25:12 +01:00
|
|
|
|
|
|
|
#include <string>
|
|
|
|
|
|
|
|
namespace Luau
|
|
|
|
{
|
|
|
|
|
|
|
|
class BytecodeEncoder
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
virtual ~BytecodeEncoder() {}
|
|
|
|
|
2023-08-18 19:15:41 +01:00
|
|
|
virtual void encode(uint32_t* data, size_t count) = 0;
|
2021-10-29 21:25:12 +01:00
|
|
|
};
|
|
|
|
|
|
|
|
class BytecodeBuilder
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
// BytecodeBuilder does *not* copy the data passed via StringRef; instead, it keeps the ref around until finalize()
|
|
|
|
// Please be careful with the lifetime of the data that's being passed because of this.
|
|
|
|
// The safe and correct pattern is to only build StringRefs out of pieces of AST (AstName or AstArray<>) that are backed by AstAllocator.
|
|
|
|
// Note that you must finalize() the builder before the Allocator backing the Ast is destroyed.
|
|
|
|
struct StringRef
|
|
|
|
{
|
|
|
|
// To construct a StringRef, use sref() from Compiler.cpp.
|
|
|
|
const char* data = nullptr;
|
|
|
|
size_t length = 0;
|
|
|
|
|
|
|
|
bool operator==(const StringRef& other) const;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct TableShape
|
|
|
|
{
|
|
|
|
static const unsigned int kMaxLength = 32;
|
|
|
|
|
|
|
|
int32_t keys[kMaxLength];
|
|
|
|
unsigned int length = 0;
|
|
|
|
|
|
|
|
bool operator==(const TableShape& other) const;
|
|
|
|
};
|
|
|
|
|
|
|
|
BytecodeBuilder(BytecodeEncoder* encoder = 0);
|
|
|
|
|
|
|
|
uint32_t beginFunction(uint8_t numparams, bool isvararg = false);
|
2023-07-14 19:08:53 +01:00
|
|
|
void endFunction(uint8_t maxstacksize, uint8_t numupvalues, uint8_t flags = 0);
|
2021-10-29 21:25:12 +01:00
|
|
|
|
|
|
|
void setMainFunction(uint32_t fid);
|
|
|
|
|
|
|
|
int32_t addConstantNil();
|
|
|
|
int32_t addConstantBoolean(bool value);
|
|
|
|
int32_t addConstantNumber(double value);
|
Optimize vector literals by storing them in the constant table (#1096)
With this optimization, built-in vector constructor calls with 3/4 arguments are detected by the compiler and turned into vector constants when the arguments are constant numbers.
Requires optimization level 2 because built-ins are not folded otherwise by the compiler.
Bytecode version is bumped because of the new constant type, but old bytecode versions can still be loaded.
The following synthetic benchmark shows ~6.6x improvement.
```
local v
for i = 1, 10000000 do
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
end
```
Also tried a more real world scenario and could see a few percent improvement.
Added a new fast flag LuauVectorLiterals for enabling the feature.
---------
Co-authored-by: Petri Häkkinen <petrih@rmd.remedy.fi>
Co-authored-by: vegorov-rbx <75688451+vegorov-rbx@users.noreply.github.com>
Co-authored-by: Arseny Kapoulkine <arseny.kapoulkine@gmail.com>
2023-11-17 12:54:32 +00:00
|
|
|
int32_t addConstantVector(float x, float y, float z, float w);
|
2021-10-29 21:25:12 +01:00
|
|
|
int32_t addConstantString(StringRef value);
|
|
|
|
int32_t addImport(uint32_t iid);
|
|
|
|
int32_t addConstantTable(const TableShape& shape);
|
|
|
|
int32_t addConstantClosure(uint32_t fid);
|
|
|
|
|
|
|
|
int16_t addChildFunction(uint32_t fid);
|
|
|
|
|
|
|
|
void emitABC(LuauOpcode op, uint8_t a, uint8_t b, uint8_t c);
|
|
|
|
void emitAD(LuauOpcode op, uint8_t a, int16_t d);
|
|
|
|
void emitE(LuauOpcode op, int32_t e);
|
|
|
|
void emitAux(uint32_t aux);
|
|
|
|
|
|
|
|
size_t emitLabel();
|
|
|
|
|
|
|
|
[[nodiscard]] bool patchJumpD(size_t jumpLabel, size_t targetLabel);
|
|
|
|
[[nodiscard]] bool patchSkipC(size_t jumpLabel, size_t targetLabel);
|
|
|
|
|
|
|
|
void foldJumps();
|
|
|
|
void expandJumps();
|
|
|
|
|
2023-06-16 18:35:18 +01:00
|
|
|
void setFunctionTypeInfo(std::string value);
|
|
|
|
|
2021-10-29 21:25:12 +01:00
|
|
|
void setDebugFunctionName(StringRef name);
|
2022-01-07 01:46:53 +00:00
|
|
|
void setDebugFunctionLineDefined(int line);
|
2021-10-29 21:25:12 +01:00
|
|
|
void setDebugLine(int line);
|
|
|
|
void pushDebugLocal(StringRef name, uint8_t reg, uint32_t startpc, uint32_t endpc);
|
|
|
|
void pushDebugUpval(StringRef name);
|
2023-04-28 20:55:13 +01:00
|
|
|
|
|
|
|
size_t getInstructionCount() const;
|
2023-11-03 23:45:04 +00:00
|
|
|
size_t getTotalInstructionCount() const;
|
2021-10-29 21:25:12 +01:00
|
|
|
uint32_t getDebugPC() const;
|
|
|
|
|
2022-04-21 22:44:27 +01:00
|
|
|
void addDebugRemark(const char* format, ...) LUAU_PRINTF_ATTR(2, 3);
|
|
|
|
|
2021-10-29 21:25:12 +01:00
|
|
|
void finalize();
|
|
|
|
|
|
|
|
enum DumpFlags
|
|
|
|
{
|
|
|
|
Dump_Code = 1 << 0,
|
|
|
|
Dump_Lines = 1 << 1,
|
|
|
|
Dump_Source = 1 << 2,
|
|
|
|
Dump_Locals = 1 << 3,
|
2022-04-21 22:44:27 +01:00
|
|
|
Dump_Remarks = 1 << 4,
|
2021-10-29 21:25:12 +01:00
|
|
|
};
|
|
|
|
|
|
|
|
void setDumpFlags(uint32_t flags)
|
|
|
|
{
|
|
|
|
dumpFlags = flags;
|
|
|
|
dumpFunctionPtr = &BytecodeBuilder::dumpCurrentFunction;
|
|
|
|
}
|
|
|
|
|
|
|
|
void setDumpSource(const std::string& source);
|
|
|
|
|
2022-10-14 20:48:41 +01:00
|
|
|
bool needsDebugRemarks() const
|
|
|
|
{
|
|
|
|
return (dumpFlags & Dump_Remarks) != 0;
|
|
|
|
}
|
|
|
|
|
2021-10-29 21:25:12 +01:00
|
|
|
const std::string& getBytecode() const
|
|
|
|
{
|
|
|
|
LUAU_ASSERT(!bytecode.empty()); // did you forget to call finalize?
|
|
|
|
return bytecode;
|
|
|
|
}
|
|
|
|
|
|
|
|
std::string dumpFunction(uint32_t id) const;
|
|
|
|
std::string dumpEverything() const;
|
2022-10-14 20:48:41 +01:00
|
|
|
std::string dumpSourceRemarks() const;
|
2023-06-16 18:35:18 +01:00
|
|
|
std::string dumpTypeInfo() const;
|
2021-10-29 21:25:12 +01:00
|
|
|
|
2022-10-28 11:37:29 +01:00
|
|
|
void annotateInstruction(std::string& result, uint32_t fid, uint32_t instpos) const;
|
2022-10-21 18:54:01 +01:00
|
|
|
|
2021-10-29 21:25:12 +01:00
|
|
|
static uint32_t getImportId(int32_t id0);
|
|
|
|
static uint32_t getImportId(int32_t id0, int32_t id1);
|
|
|
|
static uint32_t getImportId(int32_t id0, int32_t id1, int32_t id2);
|
|
|
|
|
2023-01-13 22:10:01 +00:00
|
|
|
static int decomposeImportId(uint32_t ids, int32_t& id0, int32_t& id1, int32_t& id2);
|
|
|
|
|
2021-10-29 21:25:12 +01:00
|
|
|
static uint32_t getStringHash(StringRef key);
|
|
|
|
|
|
|
|
static std::string getError(const std::string& message);
|
|
|
|
|
2022-06-24 02:56:00 +01:00
|
|
|
static uint8_t getVersion();
|
2023-06-16 18:35:18 +01:00
|
|
|
static uint8_t getTypeEncodingVersion();
|
2022-06-24 02:56:00 +01:00
|
|
|
|
2021-10-29 21:25:12 +01:00
|
|
|
private:
|
|
|
|
struct Constant
|
|
|
|
{
|
|
|
|
enum Type
|
|
|
|
{
|
|
|
|
Type_Nil,
|
|
|
|
Type_Boolean,
|
|
|
|
Type_Number,
|
Optimize vector literals by storing them in the constant table (#1096)
With this optimization, built-in vector constructor calls with 3/4 arguments are detected by the compiler and turned into vector constants when the arguments are constant numbers.
Requires optimization level 2 because built-ins are not folded otherwise by the compiler.
Bytecode version is bumped because of the new constant type, but old bytecode versions can still be loaded.
The following synthetic benchmark shows ~6.6x improvement.
```
local v
for i = 1, 10000000 do
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
end
```
Also tried a more real world scenario and could see a few percent improvement.
Added a new fast flag LuauVectorLiterals for enabling the feature.
---------
Co-authored-by: Petri Häkkinen <petrih@rmd.remedy.fi>
Co-authored-by: vegorov-rbx <75688451+vegorov-rbx@users.noreply.github.com>
Co-authored-by: Arseny Kapoulkine <arseny.kapoulkine@gmail.com>
2023-11-17 12:54:32 +00:00
|
|
|
Type_Vector,
|
2021-10-29 21:25:12 +01:00
|
|
|
Type_String,
|
|
|
|
Type_Import,
|
|
|
|
Type_Table,
|
|
|
|
Type_Closure,
|
|
|
|
};
|
|
|
|
|
|
|
|
Type type;
|
|
|
|
union
|
|
|
|
{
|
|
|
|
bool valueBoolean;
|
|
|
|
double valueNumber;
|
Optimize vector literals by storing them in the constant table (#1096)
With this optimization, built-in vector constructor calls with 3/4 arguments are detected by the compiler and turned into vector constants when the arguments are constant numbers.
Requires optimization level 2 because built-ins are not folded otherwise by the compiler.
Bytecode version is bumped because of the new constant type, but old bytecode versions can still be loaded.
The following synthetic benchmark shows ~6.6x improvement.
```
local v
for i = 1, 10000000 do
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
end
```
Also tried a more real world scenario and could see a few percent improvement.
Added a new fast flag LuauVectorLiterals for enabling the feature.
---------
Co-authored-by: Petri Häkkinen <petrih@rmd.remedy.fi>
Co-authored-by: vegorov-rbx <75688451+vegorov-rbx@users.noreply.github.com>
Co-authored-by: Arseny Kapoulkine <arseny.kapoulkine@gmail.com>
2023-11-17 12:54:32 +00:00
|
|
|
float valueVector[4];
|
2021-10-29 21:25:12 +01:00
|
|
|
unsigned int valueString; // index into string table
|
|
|
|
uint32_t valueImport; // 10-10-10-2 encoded import id
|
|
|
|
uint32_t valueTable; // index into tableShapes[]
|
|
|
|
uint32_t valueClosure; // index of function in global list
|
|
|
|
};
|
|
|
|
};
|
|
|
|
|
|
|
|
struct ConstantKey
|
|
|
|
{
|
|
|
|
Constant::Type type;
|
Optimize vector literals by storing them in the constant table (#1096)
With this optimization, built-in vector constructor calls with 3/4 arguments are detected by the compiler and turned into vector constants when the arguments are constant numbers.
Requires optimization level 2 because built-ins are not folded otherwise by the compiler.
Bytecode version is bumped because of the new constant type, but old bytecode versions can still be loaded.
The following synthetic benchmark shows ~6.6x improvement.
```
local v
for i = 1, 10000000 do
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
end
```
Also tried a more real world scenario and could see a few percent improvement.
Added a new fast flag LuauVectorLiterals for enabling the feature.
---------
Co-authored-by: Petri Häkkinen <petrih@rmd.remedy.fi>
Co-authored-by: vegorov-rbx <75688451+vegorov-rbx@users.noreply.github.com>
Co-authored-by: Arseny Kapoulkine <arseny.kapoulkine@gmail.com>
2023-11-17 12:54:32 +00:00
|
|
|
// Note: this stores value* from Constant; when type is Type_Number, this stores the same bits as double does but in uint64_t.
|
|
|
|
// For Type_Vector, x and y are stored in 'value' and z and w are stored in 'extra'.
|
2021-10-29 21:25:12 +01:00
|
|
|
uint64_t value;
|
Optimize vector literals by storing them in the constant table (#1096)
With this optimization, built-in vector constructor calls with 3/4 arguments are detected by the compiler and turned into vector constants when the arguments are constant numbers.
Requires optimization level 2 because built-ins are not folded otherwise by the compiler.
Bytecode version is bumped because of the new constant type, but old bytecode versions can still be loaded.
The following synthetic benchmark shows ~6.6x improvement.
```
local v
for i = 1, 10000000 do
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
end
```
Also tried a more real world scenario and could see a few percent improvement.
Added a new fast flag LuauVectorLiterals for enabling the feature.
---------
Co-authored-by: Petri Häkkinen <petrih@rmd.remedy.fi>
Co-authored-by: vegorov-rbx <75688451+vegorov-rbx@users.noreply.github.com>
Co-authored-by: Arseny Kapoulkine <arseny.kapoulkine@gmail.com>
2023-11-17 12:54:32 +00:00
|
|
|
uint64_t extra = 0;
|
2021-10-29 21:25:12 +01:00
|
|
|
|
|
|
|
bool operator==(const ConstantKey& key) const
|
|
|
|
{
|
Optimize vector literals by storing them in the constant table (#1096)
With this optimization, built-in vector constructor calls with 3/4 arguments are detected by the compiler and turned into vector constants when the arguments are constant numbers.
Requires optimization level 2 because built-ins are not folded otherwise by the compiler.
Bytecode version is bumped because of the new constant type, but old bytecode versions can still be loaded.
The following synthetic benchmark shows ~6.6x improvement.
```
local v
for i = 1, 10000000 do
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
v = vector(1, 2, 3)
end
```
Also tried a more real world scenario and could see a few percent improvement.
Added a new fast flag LuauVectorLiterals for enabling the feature.
---------
Co-authored-by: Petri Häkkinen <petrih@rmd.remedy.fi>
Co-authored-by: vegorov-rbx <75688451+vegorov-rbx@users.noreply.github.com>
Co-authored-by: Arseny Kapoulkine <arseny.kapoulkine@gmail.com>
2023-11-17 12:54:32 +00:00
|
|
|
return type == key.type && value == key.value && extra == key.extra;
|
2021-10-29 21:25:12 +01:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
struct Function
|
|
|
|
{
|
|
|
|
std::string data;
|
|
|
|
|
|
|
|
uint8_t maxstacksize = 0;
|
|
|
|
uint8_t numparams = 0;
|
|
|
|
uint8_t numupvalues = 0;
|
|
|
|
bool isvararg = false;
|
|
|
|
|
|
|
|
unsigned int debugname = 0;
|
2022-01-07 01:46:53 +00:00
|
|
|
int debuglinedefined = 0;
|
2021-10-29 21:25:12 +01:00
|
|
|
|
|
|
|
std::string dump;
|
|
|
|
std::string dumpname;
|
2022-10-21 18:54:01 +01:00
|
|
|
std::vector<int> dumpinstoffs;
|
2023-06-16 18:35:18 +01:00
|
|
|
std::string typeinfo;
|
2021-10-29 21:25:12 +01:00
|
|
|
};
|
|
|
|
|
|
|
|
struct DebugLocal
|
|
|
|
{
|
|
|
|
unsigned int name;
|
|
|
|
|
|
|
|
uint8_t reg;
|
|
|
|
uint32_t startpc;
|
|
|
|
uint32_t endpc;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct DebugUpval
|
|
|
|
{
|
|
|
|
unsigned int name;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct Jump
|
|
|
|
{
|
|
|
|
uint32_t source;
|
|
|
|
uint32_t target;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct StringRefHash
|
|
|
|
{
|
|
|
|
size_t operator()(const StringRef& v) const;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct ConstantKeyHash
|
|
|
|
{
|
|
|
|
size_t operator()(const ConstantKey& key) const;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct TableShapeHash
|
|
|
|
{
|
|
|
|
size_t operator()(const TableShape& v) const;
|
|
|
|
};
|
|
|
|
|
|
|
|
std::vector<Function> functions;
|
|
|
|
uint32_t currentFunction = ~0u;
|
|
|
|
uint32_t mainFunction = ~0u;
|
|
|
|
|
2023-11-03 23:45:04 +00:00
|
|
|
size_t totalInstructionCount = 0;
|
2021-10-29 21:25:12 +01:00
|
|
|
std::vector<uint32_t> insns;
|
|
|
|
std::vector<int> lines;
|
|
|
|
std::vector<Constant> constants;
|
|
|
|
std::vector<uint32_t> protos;
|
|
|
|
std::vector<Jump> jumps;
|
|
|
|
|
|
|
|
std::vector<TableShape> tableShapes;
|
|
|
|
|
|
|
|
bool hasLongJumps = false;
|
|
|
|
|
|
|
|
DenseHashMap<ConstantKey, int32_t, ConstantKeyHash> constantMap;
|
|
|
|
DenseHashMap<TableShape, int32_t, TableShapeHash> tableShapeMap;
|
2022-05-20 01:02:24 +01:00
|
|
|
DenseHashMap<uint32_t, int16_t> protoMap;
|
2021-10-29 21:25:12 +01:00
|
|
|
|
|
|
|
int debugLine = 0;
|
|
|
|
|
|
|
|
std::vector<DebugLocal> debugLocals;
|
|
|
|
std::vector<DebugUpval> debugUpvals;
|
|
|
|
|
|
|
|
DenseHashMap<StringRef, unsigned int, StringRefHash> stringTable;
|
2023-01-13 22:10:01 +00:00
|
|
|
std::vector<StringRef> debugStrings;
|
2021-10-29 21:25:12 +01:00
|
|
|
|
2022-04-29 02:24:24 +01:00
|
|
|
std::vector<std::pair<uint32_t, uint32_t>> debugRemarks;
|
2022-04-21 22:44:27 +01:00
|
|
|
std::string debugRemarkBuffer;
|
|
|
|
|
2021-10-29 21:25:12 +01:00
|
|
|
BytecodeEncoder* encoder = nullptr;
|
|
|
|
std::string bytecode;
|
|
|
|
|
|
|
|
uint32_t dumpFlags = 0;
|
|
|
|
std::vector<std::string> dumpSource;
|
2022-10-14 20:48:41 +01:00
|
|
|
std::vector<std::pair<int, std::string>> dumpRemarks;
|
2021-10-29 21:25:12 +01:00
|
|
|
|
2022-10-21 18:54:01 +01:00
|
|
|
std::string (BytecodeBuilder::*dumpFunctionPtr)(std::vector<int>&) const = nullptr;
|
2021-10-29 21:25:12 +01:00
|
|
|
|
|
|
|
void validate() const;
|
2022-10-21 18:54:01 +01:00
|
|
|
void validateInstructions() const;
|
|
|
|
void validateVariadic() const;
|
2021-10-29 21:25:12 +01:00
|
|
|
|
2022-10-21 18:54:01 +01:00
|
|
|
std::string dumpCurrentFunction(std::vector<int>& dumpinstoffs) const;
|
2023-01-13 22:10:01 +00:00
|
|
|
void dumpConstant(std::string& result, int k) const;
|
2022-05-26 23:08:16 +01:00
|
|
|
void dumpInstruction(const uint32_t* opcode, std::string& output, int targetLabel) const;
|
2021-10-29 21:25:12 +01:00
|
|
|
|
2023-07-14 19:08:53 +01:00
|
|
|
void writeFunction(std::string& ss, uint32_t id, uint8_t flags) const;
|
2021-10-29 21:25:12 +01:00
|
|
|
void writeLineInfo(std::string& ss) const;
|
|
|
|
void writeStringTable(std::string& ss) const;
|
|
|
|
|
|
|
|
int32_t addConstant(const ConstantKey& key, const Constant& value);
|
|
|
|
unsigned int addStringTableEntry(StringRef value);
|
|
|
|
};
|
|
|
|
|
|
|
|
} // namespace Luau
|