// luau/CodeGen/include/Luau/AssemblyBuilderA64.h
// This file is part of the Luau programming language and is licensed under MIT License; see LICENSE.txt for details
#pragma once
#include "Luau/RegisterA64.h"
#include "Luau/AddressA64.h"
#include "Luau/ConditionA64.h"
#include "Luau/Label.h"
#include <string>
#include <vector>
namespace Luau
{
namespace CodeGen
{
// blame: 2023-03-03 13:45:38 +00:00
namespace A64
{
// blame: 2022-11-04 17:02:37 +00:00
// blame: 2023-03-31 13:21:14 +01:00
// Optional CPU capabilities, one bit per feature so that several can be OR-ed together.
// NOTE(review): presumably this is what the 'features' argument of AssemblyBuilderA64 is built from - confirm against callers.
enum FeaturesA64
{
    // Bit 0: JSCVT extension (see the comment on AssemblyBuilderA64::fjcvtzs)
    Feature_JSCVT = 0x1,
};
// blame: 2022-11-04 17:02:37 +00:00
class AssemblyBuilderA64
{
public:
2023-03-31 13:21:14 +01:00
explicit AssemblyBuilderA64(bool logText, unsigned int features = 0);
2022-11-04 17:02:37 +00:00
~AssemblyBuilderA64();
// Moves
void mov(RegisterA64 dst, RegisterA64 src);
2023-03-24 17:34:14 +00:00
void mov(RegisterA64 dst, int src); // macro
// Moves of 32-bit immediates get decomposed into one or more of these
void movz(RegisterA64 dst, uint16_t src, int shift = 0);
void movn(RegisterA64 dst, uint16_t src, int shift = 0);
2022-11-04 17:02:37 +00:00
void movk(RegisterA64 dst, uint16_t src, int shift = 0);
// Arithmetics
void add(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, int shift = 0);
2023-03-24 17:34:14 +00:00
void add(RegisterA64 dst, RegisterA64 src1, uint16_t src2);
2022-11-04 17:02:37 +00:00
void sub(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, int shift = 0);
2023-03-24 17:34:14 +00:00
void sub(RegisterA64 dst, RegisterA64 src1, uint16_t src2);
2022-11-04 17:02:37 +00:00
void neg(RegisterA64 dst, RegisterA64 src);
// Comparisons
// Note: some arithmetic instructions also have versions that update flags (ADDS etc) but we aren't using them atm
2022-11-10 22:04:44 +00:00
void cmp(RegisterA64 src1, RegisterA64 src2);
2023-03-24 17:34:14 +00:00
void cmp(RegisterA64 src1, uint16_t src2);
2023-03-31 13:21:14 +01:00
void csel(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, ConditionA64 cond);
2023-04-14 13:05:27 +01:00
void cset(RegisterA64 dst, ConditionA64 cond);
2022-11-04 17:02:37 +00:00
2022-11-10 22:04:44 +00:00
// Bitwise
2023-04-21 22:41:03 +01:00
void and_(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, int shift = 0);
void orr(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, int shift = 0);
void eor(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, int shift = 0);
void bic(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, int shift = 0);
void tst(RegisterA64 src1, RegisterA64 src2, int shift = 0);
2023-05-12 13:15:01 +01:00
void mvn_(RegisterA64 dst, RegisterA64 src);
2022-11-10 22:04:44 +00:00
2023-04-14 13:05:27 +01:00
// Bitwise with immediate
// Note: immediate must have a single contiguous sequence of 1 bits set of length 1..31
void and_(RegisterA64 dst, RegisterA64 src1, uint32_t src2);
void orr(RegisterA64 dst, RegisterA64 src1, uint32_t src2);
void eor(RegisterA64 dst, RegisterA64 src1, uint32_t src2);
void tst(RegisterA64 src1, uint32_t src2);
2022-11-10 22:04:44 +00:00
// Shifts
2022-11-04 17:02:37 +00:00
void lsl(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2);
void lsr(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2);
void asr(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2);
void ror(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2);
void clz(RegisterA64 dst, RegisterA64 src);
void rbit(RegisterA64 dst, RegisterA64 src);
2023-10-20 21:36:26 +01:00
void rev(RegisterA64 dst, RegisterA64 src);
2022-11-04 17:02:37 +00:00
2023-04-21 22:41:03 +01:00
// Shifts with immediates
// Note: immediate value must be in [0, 31] or [0, 63] range based on register type
void lsl(RegisterA64 dst, RegisterA64 src1, uint8_t src2);
void lsr(RegisterA64 dst, RegisterA64 src1, uint8_t src2);
void asr(RegisterA64 dst, RegisterA64 src1, uint8_t src2);
void ror(RegisterA64 dst, RegisterA64 src1, uint8_t src2);
2023-05-19 19:59:59 +01:00
// Bitfields
void ubfiz(RegisterA64 dst, RegisterA64 src, uint8_t f, uint8_t w);
void ubfx(RegisterA64 dst, RegisterA64 src, uint8_t f, uint8_t w);
void sbfiz(RegisterA64 dst, RegisterA64 src, uint8_t f, uint8_t w);
void sbfx(RegisterA64 dst, RegisterA64 src, uint8_t f, uint8_t w);
2022-11-04 17:02:37 +00:00
// Load
// Note: paired loads are currently omitted for simplicity
void ldr(RegisterA64 dst, AddressA64 src);
void ldrb(RegisterA64 dst, AddressA64 src);
void ldrh(RegisterA64 dst, AddressA64 src);
void ldrsb(RegisterA64 dst, AddressA64 src);
void ldrsh(RegisterA64 dst, AddressA64 src);
void ldrsw(RegisterA64 dst, AddressA64 src);
2023-03-24 17:34:14 +00:00
void ldp(RegisterA64 dst1, RegisterA64 dst2, AddressA64 src);
2022-11-04 17:02:37 +00:00
// Store
void str(RegisterA64 src, AddressA64 dst);
void strb(RegisterA64 src, AddressA64 dst);
void strh(RegisterA64 src, AddressA64 dst);
2023-03-24 17:34:14 +00:00
void stp(RegisterA64 src1, RegisterA64 src2, AddressA64 dst);
2022-11-04 17:02:37 +00:00
// Control flow
2022-11-10 22:04:44 +00:00
void b(Label& label);
2023-04-21 22:41:03 +01:00
void bl(Label& label);
2022-11-10 22:04:44 +00:00
void br(RegisterA64 src);
void blr(RegisterA64 src);
2022-11-04 17:02:37 +00:00
void ret();
2023-04-21 22:41:03 +01:00
// Conditional control flow
void b(ConditionA64 cond, Label& label);
void cbz(RegisterA64 src, Label& label);
void cbnz(RegisterA64 src, Label& label);
void tbz(RegisterA64 src, uint8_t bit, Label& label);
void tbnz(RegisterA64 src, uint8_t bit, Label& label);
2022-11-10 22:04:44 +00:00
// Address of embedded data
void adr(RegisterA64 dst, const void* ptr, size_t size);
void adr(RegisterA64 dst, uint64_t value);
void adr(RegisterA64 dst, double value);
2023-03-24 17:34:14 +00:00
// Address of code (label)
void adr(RegisterA64 dst, Label& label);
2024-03-15 21:01:00 +00:00
// Floating-point scalar/vector moves
2023-04-21 22:41:03 +01:00
// Note: constant must be compatible with immediate floating point moves (see isFmovSupported)
2023-03-31 13:21:14 +01:00
void fmov(RegisterA64 dst, RegisterA64 src);
2023-04-21 22:41:03 +01:00
void fmov(RegisterA64 dst, double src);
2023-03-31 13:21:14 +01:00
2024-03-15 21:01:00 +00:00
// Floating-point scalar/vector math
2023-03-31 13:21:14 +01:00
void fabs(RegisterA64 dst, RegisterA64 src);
void fadd(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2);
void fdiv(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2);
void fmul(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2);
void fneg(RegisterA64 dst, RegisterA64 src);
void fsqrt(RegisterA64 dst, RegisterA64 src);
void fsub(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2);
2024-03-15 21:01:00 +00:00
// Vector component manipulation
2024-01-27 02:30:40 +00:00
void ins_4s(RegisterA64 dst, RegisterA64 src, uint8_t index);
void ins_4s(RegisterA64 dst, uint8_t dstIndex, RegisterA64 src, uint8_t srcIndex);
void dup_4s(RegisterA64 dst, RegisterA64 src, uint8_t index);
2023-03-31 13:21:14 +01:00
// Floating-point rounding and conversions
void frinta(RegisterA64 dst, RegisterA64 src);
void frintm(RegisterA64 dst, RegisterA64 src);
void frintp(RegisterA64 dst, RegisterA64 src);
2023-04-28 12:55:55 +01:00
void fcvt(RegisterA64 dst, RegisterA64 src);
2023-03-31 13:21:14 +01:00
void fcvtzs(RegisterA64 dst, RegisterA64 src);
void fcvtzu(RegisterA64 dst, RegisterA64 src);
void scvtf(RegisterA64 dst, RegisterA64 src);
void ucvtf(RegisterA64 dst, RegisterA64 src);
// Floating-point conversion to integer using JS rules (wrap around 2^32) and set Z flag
// note: this is part of ARM8.3 (JSCVT feature); support of this instruction needs to be checked at runtime
void fjcvtzs(RegisterA64 dst, RegisterA64 src);
// Floating-point comparisons
void fcmp(RegisterA64 src1, RegisterA64 src2);
void fcmpz(RegisterA64 src);
void fcsel(RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, ConditionA64 cond);
2023-05-25 21:46:51 +01:00
void udf();
2022-11-04 17:02:37 +00:00
// Run final checks
bool finalize();
// Places a label at current location and returns it
Label setLabel();
// Assigns label position to the current location
void setLabel(Label& label);
2023-03-17 14:59:30 +00:00
// Extracts code offset (in bytes) from label
uint32_t getLabelOffset(const Label& label)
{
2024-02-16 01:25:31 +00:00
CODEGEN_ASSERT(label.location != ~0u);
2023-03-17 14:59:30 +00:00
return label.location * 4;
}
2022-11-04 17:02:37 +00:00
void logAppend(const char* fmt, ...) LUAU_PRINTF_ATTR(2, 3);
uint32_t getCodeSize() const;
2024-01-12 19:16:39 +00:00
unsigned getInstructionCount() const;
2022-11-04 17:02:37 +00:00
// Resulting data and code that need to be copied over one after the other
// The *end* of 'data' has to be aligned to 16 bytes, this will also align 'code'
std::vector<uint8_t> data;
std::vector<uint32_t> code;
std::string text;
const bool logText = false;
2023-03-31 13:21:14 +01:00
const unsigned int features = 0;
2022-11-04 17:02:37 +00:00
2023-03-24 17:34:14 +00:00
// Maximum immediate argument to functions like add/sub/cmp
static constexpr size_t kMaxImmediate = (1 << 12) - 1;
2023-04-21 22:41:03 +01:00
// Check if immediate mode mask is supported for bitwise operations (and/or/xor)
static bool isMaskSupported(uint32_t mask);
// Check if fmov can be used to synthesize a constant
static bool isFmovSupported(double value);
2022-11-04 17:02:37 +00:00
private:
// Instruction archetypes
void place0(const char* name, uint32_t word);
2023-04-14 13:05:27 +01:00
void placeSR3(const char* name, RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, uint8_t op, int shift = 0, int N = 0);
2022-11-10 22:04:44 +00:00
void placeSR2(const char* name, RegisterA64 dst, RegisterA64 src, uint8_t op, uint8_t op2 = 0);
2022-11-04 17:02:37 +00:00
void placeR3(const char* name, RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, uint8_t op, uint8_t op2);
void placeR1(const char* name, RegisterA64 dst, RegisterA64 src, uint32_t op);
void placeI12(const char* name, RegisterA64 dst, RegisterA64 src1, int src2, uint8_t op);
void placeI16(const char* name, RegisterA64 dst, int src, uint8_t op, int shift = 0);
2023-05-12 13:15:01 +01:00
void placeA(const char* name, RegisterA64 dst, AddressA64 src, uint16_t opsize, int sizelog);
2023-04-21 22:41:03 +01:00
void placeB(const char* name, Label& label, uint8_t op);
2022-11-04 17:02:37 +00:00
void placeBC(const char* name, Label& label, uint8_t op, uint8_t cond);
2022-11-10 22:04:44 +00:00
void placeBCR(const char* name, Label& label, uint8_t op, RegisterA64 cond);
void placeBR(const char* name, RegisterA64 src, uint32_t op);
2023-04-21 22:41:03 +01:00
void placeBTR(const char* name, Label& label, uint8_t op, RegisterA64 cond, uint8_t bit);
2022-11-10 22:04:44 +00:00
void placeADR(const char* name, RegisterA64 src, uint8_t op);
2023-03-24 17:34:14 +00:00
void placeADR(const char* name, RegisterA64 src, uint8_t op, Label& label);
2023-03-31 13:21:14 +01:00
void placeP(const char* name, RegisterA64 dst1, RegisterA64 dst2, AddressA64 src, uint8_t op, uint8_t opc, int sizelog);
2023-04-14 13:05:27 +01:00
void placeCS(const char* name, RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, ConditionA64 cond, uint8_t op, uint8_t opc, int invert = 0);
2023-03-31 13:21:14 +01:00
void placeFCMP(const char* name, RegisterA64 src1, RegisterA64 src2, uint8_t op, uint8_t opc);
2023-04-21 22:41:03 +01:00
void placeFMOV(const char* name, RegisterA64 dst, double src, uint32_t op);
2023-04-14 13:05:27 +01:00
void placeBM(const char* name, RegisterA64 dst, RegisterA64 src1, uint32_t src2, uint8_t op);
2023-05-19 19:59:59 +01:00
void placeBFM(const char* name, RegisterA64 dst, RegisterA64 src1, int src2, uint8_t op, int immr, int imms);
2023-09-01 17:38:53 +01:00
void placeER(const char* name, RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, uint8_t op, int shift);
2024-02-23 18:40:00 +00:00
void placeVR(const char* name, RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, uint16_t op, uint8_t op2);
2022-11-04 17:02:37 +00:00
void place(uint32_t word);
2022-11-10 22:04:44 +00:00
2023-04-21 22:41:03 +01:00
struct Patch
{
enum Kind
{
Imm26,
Imm19,
Imm14,
};
Kind kind : 2;
uint32_t label : 30;
uint32_t location;
};
void patchLabel(Label& label, Patch::Kind kind);
void patchOffset(uint32_t location, int value, Patch::Kind kind);
2022-11-04 17:02:37 +00:00
void commit();
LUAU_NOINLINE void extend();
// Data
size_t allocateData(size_t size, size_t align);
// Logging of assembly in text form
LUAU_NOINLINE void log(const char* opcode);
LUAU_NOINLINE void log(const char* opcode, RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, int shift = 0);
LUAU_NOINLINE void log(const char* opcode, RegisterA64 dst, RegisterA64 src1, int src2);
LUAU_NOINLINE void log(const char* opcode, RegisterA64 dst, RegisterA64 src);
LUAU_NOINLINE void log(const char* opcode, RegisterA64 dst, int src, int shift = 0);
2023-04-21 22:41:03 +01:00
LUAU_NOINLINE void log(const char* opcode, RegisterA64 dst, double src);
2022-11-04 17:02:37 +00:00
LUAU_NOINLINE void log(const char* opcode, RegisterA64 dst, AddressA64 src);
2023-03-24 17:34:14 +00:00
LUAU_NOINLINE void log(const char* opcode, RegisterA64 dst1, RegisterA64 dst2, AddressA64 src);
2023-04-21 22:41:03 +01:00
LUAU_NOINLINE void log(const char* opcode, RegisterA64 src, Label label, int imm = -1);
2022-11-10 22:04:44 +00:00
LUAU_NOINLINE void log(const char* opcode, RegisterA64 src);
2022-11-04 17:02:37 +00:00
LUAU_NOINLINE void log(const char* opcode, Label label);
2023-03-31 13:21:14 +01:00
LUAU_NOINLINE void log(const char* opcode, RegisterA64 dst, RegisterA64 src1, RegisterA64 src2, ConditionA64 cond);
2022-11-04 17:02:37 +00:00
LUAU_NOINLINE void log(Label label);
LUAU_NOINLINE void log(RegisterA64 reg);
LUAU_NOINLINE void log(AddressA64 addr);
uint32_t nextLabel = 1;
2023-04-21 22:41:03 +01:00
std::vector<Patch> pendingLabels;
2022-11-04 17:02:37 +00:00
std::vector<uint32_t> labelLocations;
bool finalized = false;
2022-11-10 22:04:44 +00:00
bool overflowed = false;
2022-11-04 17:02:37 +00:00
size_t dataPos = 0;
uint32_t* codePos = nullptr;
uint32_t* codeEnd = nullptr;
};
// blame: 2023-03-03 13:45:38 +00:00
} // namespace A64
// blame: 2022-11-04 17:02:37 +00:00
} // namespace CodeGen
} // namespace Luau