luau/Compiler/include/Luau/BytecodeBuilder.h

328 lines
8.8 KiB
C
Raw Normal View History

// This file is part of the Luau programming language and is licensed under MIT License; see LICENSE.txt for details
#pragma once
#include "Luau/Bytecode.h"
#include "Luau/DenseHash.h"
2022-04-21 22:04:22 +01:00
#include "Luau/StringUtils.h"
#include <string>
namespace Luau
{
class BytecodeEncoder
{
public:
virtual ~BytecodeEncoder() {}
2023-08-18 18:06:29 +01:00
virtual void encode(uint32_t* data, size_t count) = 0;
};
class BytecodeBuilder
{
public:
// BytecodeBuilder does *not* copy the data passed via StringRef; instead, it keeps the ref around until finalize()
// Please be careful with the lifetime of the data that's being passed because of this.
// The safe and correct pattern is to only build StringRefs out of pieces of AST (AstName or AstArray<>) that are backed by AstAllocator.
// Note that you must finalize() the builder before the Allocator backing the Ast is destroyed.
struct StringRef
{
// To construct a StringRef, use sref() from Compiler.cpp.
const char* data = nullptr;
size_t length = 0;
bool operator==(const StringRef& other) const;
};
struct TableShape
{
static const unsigned int kMaxLength = 32;
int32_t keys[kMaxLength];
unsigned int length = 0;
bool operator==(const TableShape& other) const;
};
BytecodeBuilder(BytecodeEncoder* encoder = 0);
uint32_t beginFunction(uint8_t numparams, bool isvararg = false);
2023-07-14 16:57:16 +01:00
void endFunction(uint8_t maxstacksize, uint8_t numupvalues, uint8_t flags = 0);
void setMainFunction(uint32_t fid);
int32_t addConstantNil();
int32_t addConstantBoolean(bool value);
int32_t addConstantNumber(double value);
int32_t addConstantVector(float x, float y, float z, float w);
int32_t addConstantString(StringRef value);
int32_t addImport(uint32_t iid);
int32_t addConstantTable(const TableShape& shape);
int32_t addConstantClosure(uint32_t fid);
int16_t addChildFunction(uint32_t fid);
void emitABC(LuauOpcode op, uint8_t a, uint8_t b, uint8_t c);
void emitAD(LuauOpcode op, uint8_t a, int16_t d);
void emitE(LuauOpcode op, int32_t e);
void emitAux(uint32_t aux);
size_t emitLabel();
[[nodiscard]] bool patchJumpD(size_t jumpLabel, size_t targetLabel);
[[nodiscard]] bool patchSkipC(size_t jumpLabel, size_t targetLabel);
void foldJumps();
void expandJumps();
2023-06-16 18:01:18 +01:00
void setFunctionTypeInfo(std::string value);
2024-04-25 21:57:23 +01:00
void pushLocalTypeInfo(LuauBytecodeType type, uint8_t reg, uint32_t startpc, uint32_t endpc);
void pushUpvalTypeInfo(LuauBytecodeType type);
2023-06-16 18:01:18 +01:00
2024-05-31 18:46:33 +01:00
uint32_t addUserdataType(const char* name);
void useUserdataType(uint32_t index);
void setDebugFunctionName(StringRef name);
2022-01-06 22:10:07 +00:00
void setDebugFunctionLineDefined(int line);
void setDebugLine(int line);
void pushDebugLocal(StringRef name, uint8_t reg, uint32_t startpc, uint32_t endpc);
void pushDebugUpval(StringRef name);
2023-04-28 12:55:55 +01:00
size_t getInstructionCount() const;
2023-11-03 19:47:28 +00:00
size_t getTotalInstructionCount() const;
uint32_t getDebugPC() const;
2022-04-21 22:04:22 +01:00
void addDebugRemark(const char* format, ...) LUAU_PRINTF_ATTR(2, 3);
void finalize();
enum DumpFlags
{
Dump_Code = 1 << 0,
Dump_Lines = 1 << 1,
Dump_Source = 1 << 2,
Dump_Locals = 1 << 3,
2022-04-21 22:04:22 +01:00
Dump_Remarks = 1 << 4,
2024-04-25 21:57:23 +01:00
Dump_Types = 1 << 5,
};
void setDumpFlags(uint32_t flags)
{
dumpFlags = flags;
dumpFunctionPtr = &BytecodeBuilder::dumpCurrentFunction;
}
void setDumpSource(const std::string& source);
2022-10-13 23:59:53 +01:00
bool needsDebugRemarks() const
{
return (dumpFlags & Dump_Remarks) != 0;
}
const std::string& getBytecode() const
{
LUAU_ASSERT(!bytecode.empty()); // did you forget to call finalize?
return bytecode;
}
std::string dumpFunction(uint32_t id) const;
std::string dumpEverything() const;
2022-10-13 23:59:53 +01:00
std::string dumpSourceRemarks() const;
2023-06-16 18:01:18 +01:00
std::string dumpTypeInfo() const;
2022-10-27 23:22:49 +01:00
void annotateInstruction(std::string& result, uint32_t fid, uint32_t instpos) const;
2022-10-21 18:33:43 +01:00
static uint32_t getImportId(int32_t id0);
static uint32_t getImportId(int32_t id0, int32_t id1);
static uint32_t getImportId(int32_t id0, int32_t id1, int32_t id2);
2023-01-13 20:36:28 +00:00
static int decomposeImportId(uint32_t ids, int32_t& id0, int32_t& id1, int32_t& id2);
static uint32_t getStringHash(StringRef key);
static std::string getError(const std::string& message);
2022-06-24 02:44:07 +01:00
static uint8_t getVersion();
2023-06-16 18:01:18 +01:00
static uint8_t getTypeEncodingVersion();
2022-06-24 02:44:07 +01:00
private:
struct Constant
{
enum Type
{
Type_Nil,
Type_Boolean,
Type_Number,
Type_Vector,
Type_String,
Type_Import,
Type_Table,
Type_Closure,
};
Type type;
union
{
bool valueBoolean;
double valueNumber;
float valueVector[4];
unsigned int valueString; // index into string table
uint32_t valueImport; // 10-10-10-2 encoded import id
uint32_t valueTable; // index into tableShapes[]
uint32_t valueClosure; // index of function in global list
};
};
struct ConstantKey
{
Constant::Type type;
// Note: this stores value* from Constant; when type is Type_Number, this stores the same bits as double does but in uint64_t.
// For Type_Vector, x and y are stored in 'value' and z and w are stored in 'extra'.
uint64_t value;
uint64_t extra = 0;
bool operator==(const ConstantKey& key) const
{
return type == key.type && value == key.value && extra == key.extra;
}
};
struct Function
{
std::string data;
uint8_t maxstacksize = 0;
uint8_t numparams = 0;
uint8_t numupvalues = 0;
bool isvararg = false;
unsigned int debugname = 0;
2022-01-06 22:10:07 +00:00
int debuglinedefined = 0;
std::string dump;
std::string dumpname;
2022-10-21 18:33:43 +01:00
std::vector<int> dumpinstoffs;
2023-06-16 18:01:18 +01:00
std::string typeinfo;
};
struct DebugLocal
{
unsigned int name;
uint8_t reg;
uint32_t startpc;
uint32_t endpc;
};
struct DebugUpval
{
unsigned int name;
};
2024-04-25 21:57:23 +01:00
struct TypedLocal
{
LuauBytecodeType type;
uint8_t reg;
uint32_t startpc;
uint32_t endpc;
};
struct TypedUpval
{
LuauBytecodeType type;
};
2024-05-31 18:46:33 +01:00
struct UserdataType
{
std::string name;
uint32_t nameRef = 0;
bool used = false;
};
struct Jump
{
uint32_t source;
uint32_t target;
};
struct StringRefHash
{
size_t operator()(const StringRef& v) const;
};
struct ConstantKeyHash
{
size_t operator()(const ConstantKey& key) const;
};
struct TableShapeHash
{
size_t operator()(const TableShape& v) const;
};
std::vector<Function> functions;
uint32_t currentFunction = ~0u;
uint32_t mainFunction = ~0u;
2023-11-03 19:47:28 +00:00
size_t totalInstructionCount = 0;
std::vector<uint32_t> insns;
std::vector<int> lines;
std::vector<Constant> constants;
std::vector<uint32_t> protos;
std::vector<Jump> jumps;
std::vector<TableShape> tableShapes;
bool hasLongJumps = false;
DenseHashMap<ConstantKey, int32_t, ConstantKeyHash> constantMap;
DenseHashMap<TableShape, int32_t, TableShapeHash> tableShapeMap;
2022-05-20 00:46:52 +01:00
DenseHashMap<uint32_t, int16_t> protoMap;
int debugLine = 0;
std::vector<DebugLocal> debugLocals;
std::vector<DebugUpval> debugUpvals;
2024-04-25 21:57:23 +01:00
std::vector<TypedLocal> typedLocals;
std::vector<TypedUpval> typedUpvals;
2024-05-31 18:46:33 +01:00
std::vector<UserdataType> userdataTypes;
DenseHashMap<StringRef, unsigned int, StringRefHash> stringTable;
2023-01-13 20:36:28 +00:00
std::vector<StringRef> debugStrings;
2022-04-29 02:04:52 +01:00
std::vector<std::pair<uint32_t, uint32_t>> debugRemarks;
2022-04-21 22:04:22 +01:00
std::string debugRemarkBuffer;
BytecodeEncoder* encoder = nullptr;
std::string bytecode;
uint32_t dumpFlags = 0;
std::vector<std::string> dumpSource;
2022-10-13 23:59:53 +01:00
std::vector<std::pair<int, std::string>> dumpRemarks;
2024-04-25 21:57:23 +01:00
std::string tempTypeInfo;
2022-10-21 18:33:43 +01:00
std::string (BytecodeBuilder::*dumpFunctionPtr)(std::vector<int>&) const = nullptr;
void validate() const;
2022-10-21 18:33:43 +01:00
void validateInstructions() const;
void validateVariadic() const;
2022-10-21 18:33:43 +01:00
std::string dumpCurrentFunction(std::vector<int>& dumpinstoffs) const;
2023-01-13 20:36:28 +00:00
void dumpConstant(std::string& result, int k) const;
2022-05-26 21:33:48 +01:00
void dumpInstruction(const uint32_t* opcode, std::string& output, int targetLabel) const;
2024-04-25 21:57:23 +01:00
void writeFunction(std::string& ss, uint32_t id, uint8_t flags);
void writeLineInfo(std::string& ss) const;
void writeStringTable(std::string& ss) const;
int32_t addConstant(const ConstantKey& key, const Constant& value);
unsigned int addStringTableEntry(StringRef value);
2024-05-31 18:46:33 +01:00
const char* tryGetUserdataTypeName(LuauBytecodeType type) const;
};
} // namespace Luau