2021-10-29 21:25:12 +01:00
// This file is part of the Luau programming language and is licensed under MIT License; see LICENSE.txt for details
# include "Luau/Compiler.h"
# include "Luau/Parser.h"
# include "Luau/BytecodeBuilder.h"
# include "Luau/Common.h"
2021-11-05 02:07:18 +00:00
# include "Luau/TimeTrace.h"
2021-10-29 21:25:12 +01:00
2022-01-14 16:06:31 +00:00
# include "Builtins.h"
# include "ConstantFolding.h"
2022-04-21 22:04:22 +01:00
# include "CostModel.h"
2022-01-14 16:06:31 +00:00
# include "TableShape.h"
2023-06-16 18:01:18 +01:00
# include "Types.h"
2022-01-14 16:06:31 +00:00
# include "ValueTracking.h"
2021-10-29 21:25:12 +01:00
# include <algorithm>
# include <bitset>
2022-08-25 21:55:08 +01:00
# include <memory>
2021-10-29 21:25:12 +01:00
# include <math.h>
2022-04-21 22:04:22 +01:00
LUAU_FASTINTVARIABLE ( LuauCompileLoopUnrollThreshold , 25 )
LUAU_FASTINTVARIABLE ( LuauCompileLoopUnrollThresholdMaxBoost , 300 )
2021-10-29 21:25:12 +01:00
2022-05-06 00:52:48 +01:00
LUAU_FASTINTVARIABLE ( LuauCompileInlineThreshold , 25 )
LUAU_FASTINTVARIABLE ( LuauCompileInlineThresholdMaxBoost , 300 )
LUAU_FASTINTVARIABLE ( LuauCompileInlineDepth , 5 )
2023-09-01 17:38:53 +01:00
LUAU_FASTFLAG ( LuauFloorDivision )
2023-10-20 21:36:26 +01:00
LUAU_FASTFLAGVARIABLE ( LuauCompileIfElseAndOr , false )
2023-09-01 17:38:53 +01:00
2021-10-29 21:25:12 +01:00
namespace Luau
{
2022-01-14 16:06:31 +00:00
using namespace Luau : : Compile ;
2021-10-29 21:25:12 +01:00
static const uint32_t kMaxRegisterCount = 255 ;
static const uint32_t kMaxUpvalueCount = 200 ;
static const uint32_t kMaxLocalCount = 200 ;
2023-04-28 12:55:55 +01:00
static const uint32_t kMaxInstructionCount = 1'000'000'000 ;
2021-10-29 21:25:12 +01:00
2022-08-11 21:42:54 +01:00
static const uint8_t kInvalidReg = 255 ;
2021-10-29 21:25:12 +01:00
CompileError : : CompileError ( const Location & location , const std : : string & message )
: location ( location )
, message ( message )
{
}
CompileError : : ~ CompileError ( ) throw ( ) { }
const char * CompileError : : what ( ) const throw ( )
{
return message . c_str ( ) ;
}
const Location & CompileError : : getLocation ( ) const
{
return location ;
}
// NOINLINE is used to limit the stack cost of this function due to std::string object / exception plumbing
LUAU_NOINLINE void CompileError : : raise ( const Location & location , const char * format , . . . )
{
va_list args ;
va_start ( args , format ) ;
std : : string message = vformat ( format , args ) ;
va_end ( args ) ;
throw CompileError ( location , message ) ;
}
static BytecodeBuilder : : StringRef sref ( AstName name )
{
LUAU_ASSERT ( name . value ) ;
return { name . value , strlen ( name . value ) } ;
}
static BytecodeBuilder : : StringRef sref ( AstArray < char > data )
{
LUAU_ASSERT ( data . data ) ;
return { data . data , data . size } ;
}
2022-07-14 23:39:35 +01:00
static BytecodeBuilder : : StringRef sref ( AstArray < const char > data )
{
LUAU_ASSERT ( data . data ) ;
return { data . data , data . size } ;
}
2021-10-29 21:25:12 +01:00
struct Compiler
{
struct RegScope ;
Compiler ( BytecodeBuilder & bytecode , const CompileOptions & options )
: bytecode ( bytecode )
, options ( options )
, functions ( nullptr )
, locals ( nullptr )
, globals ( AstName ( ) )
2022-01-14 16:06:31 +00:00
, variables ( nullptr )
2021-10-29 21:25:12 +01:00
, constants ( nullptr )
2022-04-21 22:04:22 +01:00
, locstants ( nullptr )
2022-01-14 16:06:31 +00:00
, tableShapes ( nullptr )
2022-07-14 23:39:35 +01:00
, builtins ( nullptr )
2023-07-07 18:14:35 +01:00
, typeMap ( nullptr )
2021-10-29 21:25:12 +01:00
{
2022-04-21 22:04:22 +01:00
// preallocate some buffers that are very likely to grow anyway; this works around std::vector's inefficient growth policy for small arrays
localStack . reserve ( 16 ) ;
upvals . reserve ( 16 ) ;
2021-10-29 21:25:12 +01:00
}
2022-05-20 00:46:52 +01:00
int getLocalReg ( AstLocal * local )
2021-10-29 21:25:12 +01:00
{
Local * l = locals . find ( local ) ;
2022-05-20 00:46:52 +01:00
return l & & l - > allocated ? l - > reg : - 1 ;
2021-10-29 21:25:12 +01:00
}
uint8_t getUpval ( AstLocal * local )
{
for ( size_t uid = 0 ; uid < upvals . size ( ) ; + + uid )
if ( upvals [ uid ] = = local )
return uint8_t ( uid ) ;
if ( upvals . size ( ) > = kMaxUpvalueCount )
CompileError : : raise (
local - > location , " Out of upvalue registers when trying to allocate %s: exceeded limit %d " , local - > name . value , kMaxUpvalueCount ) ;
// mark local as captured so that closeLocals emits LOP_CLOSEUPVALS accordingly
2022-01-14 16:06:31 +00:00
Variable * v = variables . find ( local ) ;
if ( v & & v - > written )
locals [ local ] . captured = true ;
2021-10-29 21:25:12 +01:00
upvals . push_back ( local ) ;
return uint8_t ( upvals . size ( ) - 1 ) ;
}
2023-02-24 18:24:22 +00:00
// true iff all execution paths through node subtree result in return/break/continue
// note: because this function doesn't visit loop nodes, it (correctly) only detects break/continue that refer to the outer control flow
bool alwaysTerminates ( AstStat * node )
2021-10-29 21:25:12 +01:00
{
if ( AstStatBlock * stat = node - > as < AstStatBlock > ( ) )
2023-02-24 18:24:22 +00:00
return stat - > body . size > 0 & & alwaysTerminates ( stat - > body . data [ stat - > body . size - 1 ] ) ;
2021-10-29 21:25:12 +01:00
else if ( node - > is < AstStatReturn > ( ) )
return true ;
2023-03-17 14:59:30 +00:00
else if ( node - > is < AstStatBreak > ( ) | | node - > is < AstStatContinue > ( ) )
2023-02-24 18:24:22 +00:00
return true ;
2021-10-29 21:25:12 +01:00
else if ( AstStatIf * stat = node - > as < AstStatIf > ( ) )
2023-02-24 18:24:22 +00:00
return stat - > elsebody & & alwaysTerminates ( stat - > thenbody ) & & alwaysTerminates ( stat - > elsebody ) ;
2021-10-29 21:25:12 +01:00
else
return false ;
}
void emitLoadK ( uint8_t target , int32_t cid )
{
LUAU_ASSERT ( cid > = 0 ) ;
if ( cid < 32768 )
{
bytecode . emitAD ( LOP_LOADK , target , int16_t ( cid ) ) ;
}
else
{
bytecode . emitAD ( LOP_LOADKX , target , 0 ) ;
bytecode . emitAux ( cid ) ;
}
}
2022-05-06 00:52:48 +01:00
AstExprFunction * getFunctionExpr ( AstExpr * node )
{
2022-05-20 00:46:52 +01:00
if ( AstExprLocal * expr = node - > as < AstExprLocal > ( ) )
2022-05-06 00:52:48 +01:00
{
2022-05-20 00:46:52 +01:00
Variable * lv = variables . find ( expr - > local ) ;
2022-05-06 00:52:48 +01:00
if ( ! lv | | lv - > written | | ! lv - > init )
return nullptr ;
return getFunctionExpr ( lv - > init ) ;
}
2022-05-20 00:46:52 +01:00
else if ( AstExprGroup * expr = node - > as < AstExprGroup > ( ) )
return getFunctionExpr ( expr - > expr ) ;
else if ( AstExprTypeAssertion * expr = node - > as < AstExprTypeAssertion > ( ) )
return getFunctionExpr ( expr - > expr ) ;
2022-05-06 00:52:48 +01:00
else
return node - > as < AstExprFunction > ( ) ;
}
2023-07-28 12:37:00 +01:00
uint32_t compileFunction ( AstExprFunction * func , uint8_t protoflags )
2021-10-29 21:25:12 +01:00
{
2021-11-05 02:07:18 +00:00
LUAU_TIMETRACE_SCOPE ( " Compiler::compileFunction " , " Compiler " ) ;
if ( func - > debugname . value )
LUAU_TIMETRACE_ARGUMENT ( " name " , func - > debugname . value ) ;
2021-10-29 21:25:12 +01:00
LUAU_ASSERT ( ! functions . contains ( func ) ) ;
LUAU_ASSERT ( regTop = = 0 & & stackSize = = 0 & & localStack . empty ( ) & & upvals . empty ( ) ) ;
RegScope rs ( this ) ;
bool self = func - > self ! = 0 ;
uint32_t fid = bytecode . beginFunction ( uint8_t ( self + func - > args . size ) , func - > vararg ) ;
setDebugLine ( func ) ;
2023-08-11 13:55:30 +01:00
// note: we move types out of typeMap which is safe because compileFunction is only called once per function
if ( std : : string * funcType = typeMap . find ( func ) )
bytecode . setFunctionTypeInfo ( std : : move ( * funcType ) ) ;
2023-06-16 18:01:18 +01:00
2021-10-29 21:25:12 +01:00
if ( func - > vararg )
bytecode . emitABC ( LOP_PREPVARARGS , uint8_t ( self + func - > args . size ) , 0 , 0 ) ;
uint8_t args = allocReg ( func , self + unsigned ( func - > args . size ) ) ;
if ( func - > self )
pushLocal ( func - > self , args ) ;
for ( size_t i = 0 ; i < func - > args . size ; + + i )
pushLocal ( func - > args . data [ i ] , uint8_t ( args + self + i ) ) ;
AstStatBlock * stat = func - > body ;
for ( size_t i = 0 ; i < stat - > body . size ; + + i )
compileStat ( stat - > body . data [ i ] ) ;
// valid function bytecode must always end with RETURN
// we elide this if we're guaranteed to hit a RETURN statement regardless of the control flow
2023-02-24 18:24:22 +00:00
if ( ! alwaysTerminates ( stat ) )
2021-10-29 21:25:12 +01:00
{
setDebugLineEnd ( stat ) ;
closeLocals ( 0 ) ;
bytecode . emitABC ( LOP_RETURN , 0 , 1 , 0 ) ;
}
// constant folding may remove some upvalue refs from bytecode, so this puts them back
if ( options . optimizationLevel > = 1 & & options . debugLevel > = 2 )
gatherConstUpvals ( func ) ;
2022-01-06 22:10:07 +00:00
bytecode . setDebugFunctionLineDefined ( func - > location . begin . line + 1 ) ;
2021-10-29 21:25:12 +01:00
if ( options . debugLevel > = 1 & & func - > debugname . value )
bytecode . setDebugFunctionName ( sref ( func - > debugname ) ) ;
if ( options . debugLevel > = 2 & & ! upvals . empty ( ) )
{
for ( AstLocal * l : upvals )
bytecode . pushDebugUpval ( sref ( l - > name ) ) ;
}
if ( options . optimizationLevel > = 1 )
bytecode . foldJumps ( ) ;
bytecode . expandJumps ( ) ;
popLocals ( 0 ) ;
2023-05-25 21:46:51 +01:00
if ( bytecode . getInstructionCount ( ) > kMaxInstructionCount )
2023-04-28 12:55:55 +01:00
CompileError : : raise ( func - > location , " Exceeded function instruction limit; split the function into parts to compile " ) ;
2023-10-06 18:31:16 +01:00
// since top-level code only executes once, it can be marked as cold if it has no loops (top-level code with loops might be profitable to compile natively)
2023-10-27 20:33:36 +01:00
if ( func - > functionDepth = = 0 & & ! hasLoops )
2023-10-06 18:31:16 +01:00
protoflags | = LPF_NATIVE_COLD ;
2023-07-28 12:37:00 +01:00
bytecode . endFunction ( uint8_t ( stackSize ) , uint8_t ( upvals . size ( ) ) , protoflags ) ;
2021-10-29 21:25:12 +01:00
Function & f = functions [ func ] ;
f . id = fid ;
2022-04-21 22:04:22 +01:00
f . upvals = upvals ;
2022-05-06 00:52:48 +01:00
// record information for inlining
2023-10-13 20:38:31 +01:00
if ( options . optimizationLevel > = 2 & & ! func - > vararg & & ! func - > self & & ! getfenvUsed & & ! setfenvUsed )
2022-05-06 00:52:48 +01:00
{
f . canInline = true ;
f . stackSize = stackSize ;
2022-07-14 23:39:35 +01:00
f . costModel = modelCost ( func - > body , func - > args . data , func - > args . size , builtins ) ;
2022-06-17 01:54:42 +01:00
// track functions that only ever return a single value so that we can convert multret calls to fixedret calls
2023-02-24 18:24:22 +00:00
if ( alwaysTerminates ( func - > body ) )
2022-06-17 01:54:42 +01:00
{
ReturnVisitor returnVisitor ( this ) ;
stat - > visit ( & returnVisitor ) ;
f . returnsOne = returnVisitor . returnsOne ;
}
2022-05-06 00:52:48 +01:00
}
2022-04-21 22:04:22 +01:00
upvals . clear ( ) ; // note: instead of std::move above, we copy & clear to preserve capacity for future pushes
2022-05-06 00:52:48 +01:00
stackSize = 0 ;
2023-10-06 18:31:16 +01:00
hasLoops = false ;
2021-10-29 21:25:12 +01:00
return fid ;
}
2022-07-14 23:39:35 +01:00
// returns true if node can return multiple values; may conservatively return true even if expr is known to return just a single value
bool isExprMultRet ( AstExpr * node )
{
AstExprCall * expr = node - > as < AstExprCall > ( ) ;
if ( ! expr )
return node - > is < AstExprVarargs > ( ) ;
// conservative version, optimized for compilation throughput
if ( options . optimizationLevel < = 1 )
return true ;
// handles builtin calls that can be constant-folded
// without this we may omit some optimizations eg compiling fast calls without use of FASTCALL2K
if ( isConstant ( expr ) )
return false ;
2023-03-03 13:45:38 +00:00
// handles builtin calls that can't be constant-folded but are known to return one value
// note: optimizationLevel check is technically redundant but it's important that we never optimize based on builtins in O1
2023-03-31 13:21:14 +01:00
if ( options . optimizationLevel > = 2 )
2023-03-03 13:45:38 +00:00
if ( int * bfid = builtins . find ( expr ) )
return getBuiltinInfo ( * bfid ) . results ! = 1 ;
2022-07-14 23:39:35 +01:00
// handles local function calls where we know only one argument is returned
AstExprFunction * func = getFunctionExpr ( expr - > func ) ;
Function * fi = func ? functions . find ( func ) : nullptr ;
if ( fi & & fi - > returnsOne )
return false ;
// unrecognized call, so we conservatively assume multret
return true ;
}
2021-10-29 21:25:12 +01:00
// note: this doesn't just clobber target (assuming it's temp), but also clobbers *all* allocated registers >= target!
// this is important to be able to support "multret" semantics due to Lua call frame structure
bool compileExprTempMultRet ( AstExpr * node , uint8_t target )
{
if ( AstExprCall * expr = node - > as < AstExprCall > ( ) )
{
2022-07-14 23:39:35 +01:00
// Optimization: convert multret calls that always return one value to fixedret calls; this facilitates inlining/constant folding
2022-07-29 04:41:13 +01:00
if ( options . optimizationLevel > = 2 & & ! isExprMultRet ( node ) )
2022-06-17 01:54:42 +01:00
{
2022-07-29 04:41:13 +01:00
compileExprTemp ( node , target ) ;
return false ;
2022-06-17 01:54:42 +01:00
}
2021-10-29 21:25:12 +01:00
// We temporarily swap out regTop to have targetTop work correctly...
// This is a crude hack but it's necessary for correctness :(
RegScope rs ( this , target ) ;
compileExprCall ( expr , target , /* targetCount= */ 0 , /* targetTop= */ true , /* multRet= */ true ) ;
return true ;
}
else if ( AstExprVarargs * expr = node - > as < AstExprVarargs > ( ) )
{
// We temporarily swap out regTop to have targetTop work correctly...
// This is a crude hack but it's necessary for correctness :(
RegScope rs ( this , target ) ;
compileExprVarargs ( expr , target , /* targetCount= */ 0 , /* multRet= */ true ) ;
return true ;
}
else
{
compileExprTemp ( node , target ) ;
return false ;
}
}
// note: this doesn't just clobber target (assuming it's temp), but also clobbers *all* allocated registers >= target!
// this is important to be able to emit code that takes fewer registers and runs faster
void compileExprTempTop ( AstExpr * node , uint8_t target )
{
// We temporarily swap out regTop to have targetTop work correctly...
// This is a crude hack but it's necessary for performance :(
// It makes sure that nested call expressions can use targetTop optimization and don't need to have too many registers
RegScope rs ( this , target + 1 ) ;
compileExprTemp ( node , target ) ;
}
void compileExprVarargs ( AstExprVarargs * expr , uint8_t target , uint8_t targetCount , bool multRet = false )
{
LUAU_ASSERT ( ! multRet | | unsigned ( target + targetCount ) = = regTop ) ;
2023-01-03 17:33:19 +00:00
setDebugLine ( expr ) ; // normally compileExpr sets up line info, but compileExprVarargs can be called directly
2021-10-29 21:25:12 +01:00
bytecode . emitABC ( LOP_GETVARARGS , target , multRet ? 0 : uint8_t ( targetCount + 1 ) , 0 ) ;
}
2022-01-27 21:29:34 +00:00
void compileExprSelectVararg ( AstExprCall * expr , uint8_t target , uint8_t targetCount , bool targetTop , bool multRet , uint8_t regs )
{
LUAU_ASSERT ( targetCount = = 1 ) ;
LUAU_ASSERT ( ! expr - > self ) ;
LUAU_ASSERT ( expr - > args . size = = 2 & & expr - > args . data [ 1 ] - > is < AstExprVarargs > ( ) ) ;
AstExpr * arg = expr - > args . data [ 0 ] ;
uint8_t argreg ;
2022-05-20 00:46:52 +01:00
if ( int reg = getExprLocalReg ( arg ) ; reg > = 0 )
argreg = uint8_t ( reg ) ;
2022-01-27 21:29:34 +00:00
else
{
argreg = uint8_t ( regs + 1 ) ;
compileExprTempTop ( arg , argreg ) ;
}
size_t fastcallLabel = bytecode . emitLabel ( ) ;
bytecode . emitABC ( LOP_FASTCALL1 , LBF_SELECT_VARARG , argreg , 0 ) ;
// note, these instructions are normally not executed and are used as a fallback for FASTCALL
// we can't use TempTop variant here because we need to make sure the arguments we already computed aren't overwritten
compileExprTemp ( expr - > func , regs ) ;
2022-02-03 23:09:37 +00:00
if ( argreg ! = regs + 1 )
bytecode . emitABC ( LOP_MOVE , uint8_t ( regs + 1 ) , argreg , 0 ) ;
2022-01-27 21:29:34 +00:00
bytecode . emitABC ( LOP_GETVARARGS , uint8_t ( regs + 2 ) , 0 , 0 ) ;
size_t callLabel = bytecode . emitLabel ( ) ;
if ( ! bytecode . patchSkipC ( fastcallLabel , callLabel ) )
CompileError : : raise ( expr - > func - > location , " Exceeded jump distance limit; simplify the code to compile " ) ;
// note, this is always multCall (last argument is variadic)
bytecode . emitABC ( LOP_CALL , regs , 0 , multRet ? 0 : uint8_t ( targetCount + 1 ) ) ;
// if we didn't output results directly to target, we need to move them
if ( ! targetTop )
{
for ( size_t i = 0 ; i < targetCount ; + + i )
bytecode . emitABC ( LOP_MOVE , uint8_t ( target + i ) , uint8_t ( regs + i ) , 0 ) ;
}
}
2022-09-02 00:00:14 +01:00
void compileExprFastcallN (
AstExprCall * expr , uint8_t target , uint8_t targetCount , bool targetTop , bool multRet , uint8_t regs , int bfid , int bfK = - 1 )
2022-01-27 21:29:34 +00:00
{
LUAU_ASSERT ( ! expr - > self ) ;
2022-08-18 22:04:33 +01:00
LUAU_ASSERT ( expr - > args . size > = 1 ) ;
LUAU_ASSERT ( expr - > args . size < = 2 | | ( bfid = = LBF_BIT32_EXTRACTK & & expr - > args . size = = 3 ) ) ;
LUAU_ASSERT ( bfid = = LBF_BIT32_EXTRACTK ? bfK > = 0 : bfK < 0 ) ;
2022-01-27 21:29:34 +00:00
2022-09-02 00:00:14 +01:00
LuauOpcode opc = expr - > args . size = = 1 ? LOP_FASTCALL1 : ( bfK > = 0 | | isConstant ( expr - > args . data [ 1 ] ) ) ? LOP_FASTCALL2K : LOP_FASTCALL2 ;
2022-08-18 22:04:33 +01:00
uint32_t args [ 3 ] = { } ;
2022-01-27 21:29:34 +00:00
for ( size_t i = 0 ; i < expr - > args . size ; + + i )
{
2022-09-02 00:00:14 +01:00
if ( i > 0 & & opc = = LOP_FASTCALL2K )
2022-08-18 22:04:33 +01:00
{
2022-09-02 00:00:14 +01:00
int32_t cid = getConstantIndex ( expr - > args . data [ i ] ) ;
if ( cid < 0 )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
2022-08-18 22:04:33 +01:00
2022-09-02 00:00:14 +01:00
args [ i ] = cid ;
2022-01-27 21:29:34 +00:00
}
2022-09-02 00:00:14 +01:00
else if ( int reg = getExprLocalReg ( expr - > args . data [ i ] ) ; reg > = 0 )
2022-08-18 22:04:33 +01:00
{
2022-05-20 00:46:52 +01:00
args [ i ] = uint8_t ( reg ) ;
2022-08-18 22:04:33 +01:00
}
2022-01-27 21:29:34 +00:00
else
{
args [ i ] = uint8_t ( regs + 1 + i ) ;
compileExprTempTop ( expr - > args . data [ i ] , uint8_t ( args [ i ] ) ) ;
}
}
size_t fastcallLabel = bytecode . emitLabel ( ) ;
bytecode . emitABC ( opc , uint8_t ( bfid ) , uint8_t ( args [ 0 ] ) , 0 ) ;
if ( opc ! = LOP_FASTCALL1 )
2022-08-18 22:04:33 +01:00
bytecode . emitAux ( bfK > = 0 ? bfK : args [ 1 ] ) ;
2022-01-27 21:29:34 +00:00
// Set up a traditional Lua stack for the subsequent LOP_CALL.
// Note, as with other instructions that immediately follow FASTCALL, these are normally not executed and are used as a fallback for
// these FASTCALL variants.
for ( size_t i = 0 ; i < expr - > args . size ; + + i )
{
2022-09-02 00:00:14 +01:00
if ( i > 0 & & opc = = LOP_FASTCALL2K )
emitLoadK ( uint8_t ( regs + 1 + i ) , args [ i ] ) ;
else if ( args [ i ] ! = regs + 1 + i )
bytecode . emitABC ( LOP_MOVE , uint8_t ( regs + 1 + i ) , uint8_t ( args [ i ] ) , 0 ) ;
2022-01-27 21:29:34 +00:00
}
// note, these instructions are normally not executed and are used as a fallback for FASTCALL
// we can't use TempTop variant here because we need to make sure the arguments we already computed aren't overwritten
compileExprTemp ( expr - > func , regs ) ;
size_t callLabel = bytecode . emitLabel ( ) ;
// FASTCALL will skip over the instructions needed to compute function and jump over CALL which must immediately follow the instruction
// sequence after FASTCALL
if ( ! bytecode . patchSkipC ( fastcallLabel , callLabel ) )
CompileError : : raise ( expr - > func - > location , " Exceeded jump distance limit; simplify the code to compile " ) ;
bytecode . emitABC ( LOP_CALL , regs , uint8_t ( expr - > args . size + 1 ) , multRet ? 0 : uint8_t ( targetCount + 1 ) ) ;
// if we didn't output results directly to target, we need to move them
if ( ! targetTop )
{
for ( size_t i = 0 ; i < targetCount ; + + i )
bytecode . emitABC ( LOP_MOVE , uint8_t ( target + i ) , uint8_t ( regs + i ) , 0 ) ;
}
}
2022-05-06 00:52:48 +01:00
bool tryCompileInlinedCall ( AstExprCall * expr , AstExprFunction * func , uint8_t target , uint8_t targetCount , bool multRet , int thresholdBase ,
int thresholdMaxBoost , int depthLimit )
{
Function * fi = functions . find ( func ) ;
LUAU_ASSERT ( fi ) ;
// make sure we have enough register space
if ( regTop > 128 | | fi - > stackSize > 32 )
{
bytecode . addDebugRemark ( " inlining failed: high register pressure " ) ;
return false ;
}
// we should ideally aggregate the costs during recursive inlining, but for now simply limit the depth
if ( int ( inlineFrames . size ( ) ) > = depthLimit )
{
bytecode . addDebugRemark ( " inlining failed: too many inlined frames " ) ;
return false ;
}
// compiling recursive inlining is difficult because we share constant/variable state but need to bind variables to different registers
for ( InlineFrame & frame : inlineFrames )
if ( frame . func = = func )
{
bytecode . addDebugRemark ( " inlining failed: can't inline recursive calls " ) ;
return false ;
}
2022-06-17 01:54:42 +01:00
// we can't inline multret functions because the caller expects L->top to be adjusted:
// - inlined return compiles to a JUMP, and we don't have an instruction that adjusts L->top arbitrarily
// - even if we did, right now all L->top adjustments are immediately consumed by the next instruction, and for now we want to preserve that
2023-03-03 13:45:38 +00:00
// - additionally, we can't easily compile multret expressions into designated target as computed call arguments will get clobbered
2022-05-06 00:52:48 +01:00
if ( multRet )
{
bytecode . addDebugRemark ( " inlining failed: can't convert fixed returns to multret " ) ;
return false ;
}
2022-05-20 00:46:52 +01:00
// compute constant bitvector for all arguments to feed the cost model
2022-05-06 00:52:48 +01:00
bool varc [ 8 ] = { } ;
2022-05-20 00:46:52 +01:00
for ( size_t i = 0 ; i < func - > args . size & & i < expr - > args . size & & i < 8 ; + + i )
2022-05-06 00:52:48 +01:00
varc [ i ] = isConstant ( expr - > args . data [ i ] ) ;
2022-05-20 00:46:52 +01:00
// if the last argument only returns a single value, all following arguments are nil
2022-07-14 23:39:35 +01:00
if ( expr - > args . size ! = 0 & & ! isExprMultRet ( expr - > args . data [ expr - > args . size - 1 ] ) )
2022-05-20 00:46:52 +01:00
for ( size_t i = expr - > args . size ; i < func - > args . size & & i < 8 ; + + i )
varc [ i ] = true ;
// we use a dynamic cost threshold that's based on the fixed limit boosted by the cost advantage we gain due to inlining
int inlinedCost = computeCost ( fi - > costModel , varc , std : : min ( int ( func - > args . size ) , 8 ) ) ;
2022-05-06 00:52:48 +01:00
int baselineCost = computeCost ( fi - > costModel , nullptr , 0 ) + 3 ;
int inlineProfit = ( inlinedCost = = 0 ) ? thresholdMaxBoost : std : : min ( thresholdMaxBoost , 100 * baselineCost / inlinedCost ) ;
int threshold = thresholdBase * inlineProfit / 100 ;
if ( inlinedCost > threshold )
{
bytecode . addDebugRemark ( " inlining failed: too expensive (cost %d, profit %.2fx) " , inlinedCost , double ( inlineProfit ) / 100 ) ;
return false ;
}
bytecode . addDebugRemark (
" inlining succeeded (cost %d, profit %.2fx, depth %d) " , inlinedCost , double ( inlineProfit ) / 100 , int ( inlineFrames . size ( ) ) ) ;
compileInlinedCall ( expr , func , target , targetCount ) ;
return true ;
}
void compileInlinedCall ( AstExprCall * expr , AstExprFunction * func , uint8_t target , uint8_t targetCount )
{
RegScope rs ( this ) ;
size_t oldLocals = localStack . size ( ) ;
2023-05-25 21:46:51 +01:00
std : : vector < InlineArg > args ;
2023-06-16 18:01:18 +01:00
args . reserve ( func - > args . size ) ;
2022-05-06 00:52:48 +01:00
// evaluate all arguments; note that we don't emit code for constant arguments (relying on constant folding)
2023-05-25 21:46:51 +01:00
// note that compiler state (variable registers/values) does not change here - we defer that to a separate loop below to handle nested calls
2022-05-06 00:52:48 +01:00
for ( size_t i = 0 ; i < func - > args . size ; + + i )
{
AstLocal * var = func - > args . data [ i ] ;
2022-05-20 00:46:52 +01:00
AstExpr * arg = i < expr - > args . size ? expr - > args . data [ i ] : nullptr ;
2022-05-06 00:52:48 +01:00
2022-07-14 23:39:35 +01:00
if ( i + 1 = = expr - > args . size & & func - > args . size > expr - > args . size & & isExprMultRet ( arg ) )
2022-05-20 00:46:52 +01:00
{
// if the last argument can return multiple values, we need to compute all of them into the remaining arguments
unsigned int tail = unsigned ( func - > args . size - expr - > args . size ) + 1 ;
uint8_t reg = allocReg ( arg , tail ) ;
if ( AstExprCall * expr = arg - > as < AstExprCall > ( ) )
compileExprCall ( expr , reg , tail , /* targetTop= */ true ) ;
else if ( AstExprVarargs * expr = arg - > as < AstExprVarargs > ( ) )
compileExprVarargs ( expr , reg , tail ) ;
else
LUAU_ASSERT ( ! " Unexpected expression type " ) ;
2023-06-16 18:01:18 +01:00
for ( size_t j = i ; j < func - > args . size ; + + j )
args . push_back ( { func - > args . data [ j ] , uint8_t ( reg + ( j - i ) ) } ) ;
2022-05-20 00:46:52 +01:00
// all remaining function arguments have been allocated and assigned to
break ;
}
else if ( Variable * vv = variables . find ( var ) ; vv & & vv - > written )
2022-05-06 00:52:48 +01:00
{
// if the argument is mutated, we need to allocate a fresh register even if it's a constant
uint8_t reg = allocReg ( arg , 1 ) ;
2022-05-20 00:46:52 +01:00
if ( arg )
compileExprTemp ( arg , reg ) ;
else
bytecode . emitABC ( LOP_LOADNIL , reg , 0 , 0 ) ;
2023-06-16 18:01:18 +01:00
args . push_back ( { var , reg } ) ;
2022-05-06 00:52:48 +01:00
}
2022-05-20 00:46:52 +01:00
else if ( arg = = nullptr )
{
// since the argument is not mutated, we can simply fold the value into the expressions that need it
2023-06-16 18:01:18 +01:00
args . push_back ( { var , kInvalidReg , { Constant : : Type_Nil } } ) ;
2022-05-20 00:46:52 +01:00
}
2022-05-06 00:52:48 +01:00
else if ( const Constant * cv = constants . find ( arg ) ; cv & & cv - > type ! = Constant : : Type_Unknown )
{
// since the argument is not mutated, we can simply fold the value into the expressions that need it
2023-06-16 18:01:18 +01:00
args . push_back ( { var , kInvalidReg , * cv } ) ;
2022-05-06 00:52:48 +01:00
}
else
{
2022-08-18 22:04:33 +01:00
AstExprLocal * le = getExprLocal ( arg ) ;
2022-05-06 00:52:48 +01:00
Variable * lv = le ? variables . find ( le - > local ) : nullptr ;
// if the argument is a local that isn't mutated, we will simply reuse the existing register
2022-05-20 00:46:52 +01:00
if ( int reg = le ? getExprLocalReg ( le ) : - 1 ; reg > = 0 & & ( ! lv | | ! lv - > written ) )
2022-05-06 00:52:48 +01:00
{
2023-06-16 18:01:18 +01:00
args . push_back ( { var , uint8_t ( reg ) } ) ;
2022-05-06 00:52:48 +01:00
}
else
{
2022-05-20 00:46:52 +01:00
uint8_t temp = allocReg ( arg , 1 ) ;
compileExprTemp ( arg , temp ) ;
2023-05-25 21:46:51 +01:00
2023-06-16 18:01:18 +01:00
args . push_back ( { var , temp } ) ;
2022-05-06 00:52:48 +01:00
}
}
}
2022-05-20 00:46:52 +01:00
// evaluate extra expressions for side effects
for ( size_t i = func - > args . size ; i < expr - > args . size ; + + i )
{
RegScope rsi ( this ) ;
compileExprAuto ( expr - > args . data [ i ] , rsi ) ;
}
2023-06-16 18:01:18 +01:00
// apply all evaluated arguments to the compiler state
// note: locals use current startpc for debug info, although some of them have been computed earlier; this is similar to compileStatLocal
for ( InlineArg & arg : args )
2023-10-06 18:31:16 +01:00
{
2023-06-16 18:01:18 +01:00
if ( arg . value . type = = Constant : : Type_Unknown )
2023-10-06 18:31:16 +01:00
{
2023-06-16 18:01:18 +01:00
pushLocal ( arg . local , arg . reg ) ;
2023-10-06 18:31:16 +01:00
}
2023-06-16 18:01:18 +01:00
else
2023-10-06 18:31:16 +01:00
{
2023-06-16 18:01:18 +01:00
locstants [ arg . local ] = arg . value ;
2023-10-06 18:31:16 +01:00
}
}
2023-06-16 18:01:18 +01:00
// the inline frame will be used to compile return statements as well as to reject recursive inlining attempts
inlineFrames . push_back ( { func , oldLocals , target , targetCount } ) ;
2023-05-25 21:46:51 +01:00
2022-05-06 00:52:48 +01:00
// fold constant values updated above into expressions in the function body
2023-08-04 18:01:35 +01:00
foldConstants ( constants , variables , locstants , builtinsFold , builtinsFoldMathK , func - > body ) ;
2022-05-06 00:52:48 +01:00
bool usedFallthrough = false ;
for ( size_t i = 0 ; i < func - > body - > body . size ; + + i )
{
AstStat * stat = func - > body - > body . data [ i ] ;
if ( AstStatReturn * ret = stat - > as < AstStatReturn > ( ) )
{
// Optimization: use fallthrough when compiling return at the end of the function to avoid an extra JUMP
compileInlineReturn ( ret , /* fallthrough= */ true ) ;
// TODO: This doesn't work when return is part of control flow; ideally we would track the state somehow and generalize this
usedFallthrough = true ;
break ;
}
else
compileStat ( stat ) ;
}
// for the fallthrough path we need to ensure we clear out target registers
2023-02-24 18:24:22 +00:00
if ( ! usedFallthrough & & ! alwaysTerminates ( func - > body ) )
2022-05-06 00:52:48 +01:00
{
for ( size_t i = 0 ; i < targetCount ; + + i )
bytecode . emitABC ( LOP_LOADNIL , uint8_t ( target + i ) , 0 , 0 ) ;
2022-06-17 01:54:42 +01:00
closeLocals ( oldLocals ) ;
2022-05-06 00:52:48 +01:00
}
popLocals ( oldLocals ) ;
size_t returnLabel = bytecode . emitLabel ( ) ;
patchJumps ( expr , inlineFrames . back ( ) . returnJumps , returnLabel ) ;
inlineFrames . pop_back ( ) ;
// clean up constant state for future inlining attempts
for ( size_t i = 0 ; i < func - > args . size ; + + i )
2023-10-06 18:31:16 +01:00
{
AstLocal * local = func - > args . data [ i ] ;
2023-10-13 20:38:31 +01:00
if ( Constant * var = locstants . find ( local ) )
var - > type = Constant : : Type_Unknown ;
2023-10-06 18:31:16 +01:00
}
2022-05-06 00:52:48 +01:00
2023-08-04 18:01:35 +01:00
foldConstants ( constants , variables , locstants , builtinsFold , builtinsFoldMathK , func - > body ) ;
2022-05-06 00:52:48 +01:00
}
2021-10-29 21:25:12 +01:00
void compileExprCall ( AstExprCall * expr , uint8_t target , uint8_t targetCount , bool targetTop = false , bool multRet = false )
{
LUAU_ASSERT ( ! targetTop | | unsigned ( target + targetCount ) = = regTop ) ;
setDebugLine ( expr ) ; // normally compileExpr sets up line info, but compileExprCall can be called directly
2022-05-06 00:52:48 +01:00
// try inlining the function
if ( options . optimizationLevel > = 2 & & ! expr - > self )
{
AstExprFunction * func = getFunctionExpr ( expr - > func ) ;
Function * fi = func ? functions . find ( func ) : nullptr ;
if ( fi & & fi - > canInline & &
tryCompileInlinedCall ( expr , func , target , targetCount , multRet , FInt : : LuauCompileInlineThreshold ,
FInt : : LuauCompileInlineThresholdMaxBoost , FInt : : LuauCompileInlineDepth ) )
return ;
2022-05-20 00:46:52 +01:00
// add a debug remark for cases when we didn't even call tryCompileInlinedCall
if ( func & & ! ( fi & & fi - > canInline ) )
2022-05-13 20:16:50 +01:00
{
if ( func - > vararg )
bytecode . addDebugRemark ( " inlining failed: function is variadic " ) ;
2022-05-26 21:33:48 +01:00
else if ( ! fi )
2022-05-20 00:46:52 +01:00
bytecode . addDebugRemark ( " inlining failed: can't inline recursive calls " ) ;
2022-05-26 21:33:48 +01:00
else if ( getfenvUsed | | setfenvUsed )
bytecode . addDebugRemark ( " inlining failed: module uses getfenv/setfenv " ) ;
2022-05-13 20:16:50 +01:00
}
2022-05-06 00:52:48 +01:00
}
2021-10-29 21:25:12 +01:00
RegScope rs ( this ) ;
unsigned int regCount = std : : max ( unsigned ( 1 + expr - > self + expr - > args . size ) , unsigned ( targetCount ) ) ;
// Optimization: if target points to the top of the stack, we can start the call at oldTop - 1 and won't need MOVE at the end
uint8_t regs = targetTop ? allocReg ( expr , regCount - targetCount ) - targetCount : allocReg ( expr , regCount ) ;
uint8_t selfreg = 0 ;
int bfid = - 1 ;
2022-07-14 23:39:35 +01:00
if ( options . optimizationLevel > = 1 & & ! expr - > self )
if ( const int * id = builtins . find ( expr ) )
bfid = * id ;
2021-10-29 21:25:12 +01:00
2022-10-13 23:59:53 +01:00
if ( bfid > = 0 & & bytecode . needsDebugRemarks ( ) )
{
Builtin builtin = getBuiltin ( expr - > func , globals , variables ) ;
bool lastMult = expr - > args . size > 0 & & isExprMultRet ( expr - > args . data [ expr - > args . size - 1 ] ) ;
if ( builtin . object . value )
bytecode . addDebugRemark ( " builtin %s.%s/%d%s " , builtin . object . value , builtin . method . value , int ( expr - > args . size ) , lastMult ? " + " : " " ) ;
else if ( builtin . method . value )
bytecode . addDebugRemark ( " builtin %s/%d%s " , builtin . method . value , int ( expr - > args . size ) , lastMult ? " + " : " " ) ;
}
2022-01-27 21:29:34 +00:00
if ( bfid = = LBF_SELECT_VARARG )
{
// Optimization: compile select(_, ...) as FASTCALL1; the builtin will read variadic arguments directly
// note: for now we restrict this to single-return expressions since our runtime code doesn't deal with general cases
2022-07-14 23:39:35 +01:00
if ( multRet = = false & & targetCount = = 1 )
2022-01-27 21:29:34 +00:00
return compileExprSelectVararg ( expr , target , targetCount , targetTop , multRet , regs ) ;
else
bfid = - 1 ;
}
2022-08-18 22:04:33 +01:00
// Optimization: for bit32.extract with constant in-range f/w we compile using FASTCALL2K and a special builtin
2022-09-02 00:00:14 +01:00
if ( bfid = = LBF_BIT32_EXTRACT & & expr - > args . size = = 3 & & isConstant ( expr - > args . data [ 1 ] ) & & isConstant ( expr - > args . data [ 2 ] ) )
2022-08-18 22:04:33 +01:00
{
Constant fc = getConstant ( expr - > args . data [ 1 ] ) ;
Constant wc = getConstant ( expr - > args . data [ 2 ] ) ;
int fi = fc . type = = Constant : : Type_Number ? int ( fc . valueNumber ) : - 1 ;
int wi = wc . type = = Constant : : Type_Number ? int ( wc . valueNumber ) : - 1 ;
if ( fi > = 0 & & wi > 0 & & fi + wi < = 32 )
{
int fwp = fi | ( ( wi - 1 ) < < 5 ) ;
int32_t cid = bytecode . addConstantNumber ( fwp ) ;
if ( cid < 0 )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
return compileExprFastcallN ( expr , target , targetCount , targetTop , multRet , regs , LBF_BIT32_EXTRACTK , cid ) ;
}
}
2022-01-27 21:29:34 +00:00
// Optimization: for 1/2 argument fast calls use specialized opcodes
2023-03-03 13:45:38 +00:00
if ( bfid > = 0 & & expr - > args . size > = 1 & & expr - > args . size < = 2 )
{
if ( ! isExprMultRet ( expr - > args . data [ expr - > args . size - 1 ] ) )
return compileExprFastcallN ( expr , target , targetCount , targetTop , multRet , regs , bfid ) ;
2023-07-28 12:37:00 +01:00
else if ( options . optimizationLevel > = 2 )
{
2023-08-18 18:06:29 +01:00
// when a builtin is none-safe with matching arity, even if the last expression returns 0 or >1 arguments,
// we can rely on the behavior of the function being the same (none-safe means nil and none are interchangeable)
BuiltinInfo info = getBuiltinInfo ( bfid ) ;
if ( int ( expr - > args . size ) = = info . params & & ( info . flags & BuiltinInfo : : Flag_NoneSafe ) ! = 0 )
2023-07-28 12:37:00 +01:00
return compileExprFastcallN ( expr , target , targetCount , targetTop , multRet , regs , bfid ) ;
}
2023-03-03 13:45:38 +00:00
}
2022-01-27 21:29:34 +00:00
2021-10-29 21:25:12 +01:00
if ( expr - > self )
{
AstExprIndexName * fi = expr - > func - > as < AstExprIndexName > ( ) ;
LUAU_ASSERT ( fi ) ;
// Optimization: use local register directly in NAMECALL if possible
2022-05-20 00:46:52 +01:00
if ( int reg = getExprLocalReg ( fi - > expr ) ; reg > = 0 )
2021-10-29 21:25:12 +01:00
{
2022-05-20 00:46:52 +01:00
selfreg = uint8_t ( reg ) ;
2021-10-29 21:25:12 +01:00
}
else
{
// Note: to be able to compile very deeply nested self call chains (obj:method1():method2():...), we need to be able to do this in
// finite stack space NAMECALL will happily move object from regs to regs+1 but we need to compute it into regs so that
// compileExprTempTop doesn't increase stack usage for every recursive call
selfreg = regs ;
compileExprTempTop ( fi - > expr , selfreg ) ;
}
}
else if ( bfid < 0 )
{
compileExprTempTop ( expr - > func , regs ) ;
}
bool multCall = false ;
2022-01-27 21:29:34 +00:00
for ( size_t i = 0 ; i < expr - > args . size ; + + i )
if ( i + 1 = = expr - > args . size )
multCall = compileExprTempMultRet ( expr - > args . data [ i ] , uint8_t ( regs + 1 + expr - > self + i ) ) ;
else
compileExprTempTop ( expr - > args . data [ i ] , uint8_t ( regs + 1 + expr - > self + i ) ) ;
2021-10-29 21:25:12 +01:00
2021-12-02 23:20:08 +00:00
setDebugLineEnd ( expr - > func ) ;
2021-10-29 21:25:12 +01:00
if ( expr - > self )
{
AstExprIndexName * fi = expr - > func - > as < AstExprIndexName > ( ) ;
LUAU_ASSERT ( fi ) ;
2021-12-02 23:20:08 +00:00
setDebugLine ( fi - > indexLocation ) ;
2021-10-29 21:25:12 +01:00
BytecodeBuilder : : StringRef iname = sref ( fi - > index ) ;
int32_t cid = bytecode . addConstantString ( iname ) ;
if ( cid < 0 )
CompileError : : raise ( fi - > location , " Exceeded constant limit; simplify the code to compile " ) ;
bytecode . emitABC ( LOP_NAMECALL , regs , selfreg , uint8_t ( BytecodeBuilder : : getStringHash ( iname ) ) ) ;
bytecode . emitAux ( cid ) ;
}
else if ( bfid > = 0 )
{
2022-01-27 21:29:34 +00:00
size_t fastcallLabel = bytecode . emitLabel ( ) ;
bytecode . emitABC ( LOP_FASTCALL , uint8_t ( bfid ) , 0 , 0 ) ;
2021-10-29 21:25:12 +01:00
// note, these instructions are normally not executed and are used as a fallback for FASTCALL
// we can't use TempTop variant here because we need to make sure the arguments we already computed aren't overwritten
compileExprTemp ( expr - > func , regs ) ;
size_t callLabel = bytecode . emitLabel ( ) ;
// FASTCALL will skip over the instructions needed to compute function and jump over CALL which must immediately follow the instruction
// sequence after FASTCALL
if ( ! bytecode . patchSkipC ( fastcallLabel , callLabel ) )
CompileError : : raise ( expr - > func - > location , " Exceeded jump distance limit; simplify the code to compile " ) ;
}
bytecode . emitABC ( LOP_CALL , regs , multCall ? 0 : uint8_t ( expr - > self + expr - > args . size + 1 ) , multRet ? 0 : uint8_t ( targetCount + 1 ) ) ;
// if we didn't output results directly to target, we need to move them
if ( ! targetTop )
{
for ( size_t i = 0 ; i < targetCount ; + + i )
bytecode . emitABC ( LOP_MOVE , uint8_t ( target + i ) , uint8_t ( regs + i ) , 0 ) ;
}
}
bool shouldShareClosure ( AstExprFunction * func )
{
const Function * f = functions . find ( func ) ;
if ( ! f )
return false ;
for ( AstLocal * uv : f - > upvals )
{
2022-01-14 16:06:31 +00:00
Variable * ul = variables . find ( uv ) ;
if ( ! ul )
return false ;
2021-10-29 21:25:12 +01:00
if ( ul - > written )
return false ;
// it's technically safe to share closures whenever all upvalues are immutable
// this is because of a runtime equality check in DUPCLOSURE.
// however, this results in frequent deoptimization and increases the set of reachable objects, making some temporary objects permanent
// instead we apply a heuristic: we share closures if they refer to top-level upvalues, or closures that refer to top-level upvalues
// this will only deoptimize (outside of fenv changes) if top level code is executed twice with different results.
if ( uv - > functionDepth ! = 0 | | uv - > loopDepth ! = 0 )
{
2022-01-14 16:06:31 +00:00
AstExprFunction * uf = ul - > init ? ul - > init - > as < AstExprFunction > ( ) : nullptr ;
if ( ! uf )
2021-10-29 21:25:12 +01:00
return false ;
2022-01-14 16:06:31 +00:00
if ( uf ! = func & & ! shouldShareClosure ( uf ) )
2021-10-29 21:25:12 +01:00
return false ;
}
}
return true ;
}
void compileExprFunction ( AstExprFunction * expr , uint8_t target )
{
2022-05-20 00:46:52 +01:00
RegScope rs ( this ) ;
2021-10-29 21:25:12 +01:00
const Function * f = functions . find ( expr ) ;
LUAU_ASSERT ( f ) ;
// when the closure has upvalues we'll use this to create the closure at runtime
// when the closure has no upvalues, we use constant closures that technically don't rely on the child function list
// however, it's still important to add the child function because debugger relies on the function hierarchy when setting breakpoints
int16_t pid = bytecode . addChildFunction ( f - > id ) ;
if ( pid < 0 )
CompileError : : raise ( expr - > location , " Exceeded closure limit; simplify the code to compile " ) ;
2022-06-17 01:52:23 +01:00
// we use a scratch vector to reduce allocations; this is safe since compileExprFunction is not reentrant
captures . clear ( ) ;
captures . reserve ( f - > upvals . size ( ) ) ;
for ( AstLocal * uv : f - > upvals )
2022-05-20 00:46:52 +01:00
{
2022-06-17 01:52:23 +01:00
LUAU_ASSERT ( uv - > functionDepth < expr - > functionDepth ) ;
2022-05-20 00:46:52 +01:00
2022-06-17 01:52:23 +01:00
if ( int reg = getLocalReg ( uv ) ; reg > = 0 )
2022-05-20 00:46:52 +01:00
{
2022-06-17 01:52:23 +01:00
// note: we can't check if uv is an upvalue in the current frame because inlining can migrate from upvalues to locals
Variable * ul = variables . find ( uv ) ;
bool immutable = ! ul | | ! ul - > written ;
2022-05-20 00:46:52 +01:00
2022-06-17 01:52:23 +01:00
captures . push_back ( { immutable ? LCT_VAL : LCT_REF , uint8_t ( reg ) } ) ;
2022-05-20 00:46:52 +01:00
}
2022-06-17 01:52:23 +01:00
else if ( const Constant * uc = locstants . find ( uv ) ; uc & & uc - > type ! = Constant : : Type_Unknown )
2022-05-20 00:46:52 +01:00
{
2022-06-17 01:52:23 +01:00
// inlining can result in an upvalue capture of a constant, in which case we can't capture without a temporary register
uint8_t reg = allocReg ( expr , 1 ) ;
compileExprConstant ( expr , uc , reg ) ;
2022-05-20 00:46:52 +01:00
2022-06-17 01:52:23 +01:00
captures . push_back ( { LCT_VAL , reg } ) ;
2022-05-20 00:46:52 +01:00
}
else
2022-06-17 01:52:23 +01:00
{
LUAU_ASSERT ( uv - > functionDepth < expr - > functionDepth - 1 ) ;
2022-05-20 00:46:52 +01:00
2022-06-17 01:52:23 +01:00
// get upvalue from parent frame
// note: this will add uv to the current upvalue list if necessary
uint8_t uid = getUpval ( uv ) ;
2022-05-20 00:46:52 +01:00
2022-06-17 01:52:23 +01:00
captures . push_back ( { LCT_UPVAL , uid } ) ;
}
2022-05-20 00:46:52 +01:00
}
2021-12-10 21:17:10 +00:00
// Optimization: when closure has no upvalues, or upvalues are safe to share, instead of allocating it every time we can share closure
// objects (this breaks assumptions about function identity which can lead to setfenv not working as expected, so we disable this when it
// is used)
2022-06-17 01:52:23 +01:00
int16_t shared = - 1 ;
2021-12-10 21:17:10 +00:00
if ( options . optimizationLevel > = 1 & & shouldShareClosure ( expr ) & & ! setfenvUsed )
2021-10-29 21:25:12 +01:00
{
2021-12-10 21:17:10 +00:00
int32_t cid = bytecode . addConstantClosure ( f - > id ) ;
2021-10-29 21:25:12 +01:00
2021-12-10 21:17:10 +00:00
if ( cid > = 0 & & cid < 32768 )
2022-06-17 01:52:23 +01:00
shared = int16_t ( cid ) ;
2021-10-29 21:25:12 +01:00
}
2022-10-13 23:59:53 +01:00
if ( shared < 0 )
bytecode . addDebugRemark ( " allocation: closure with %d upvalues " , int ( captures . size ( ) ) ) ;
2022-06-17 01:52:23 +01:00
if ( shared > = 0 )
bytecode . emitAD ( LOP_DUPCLOSURE , target , shared ) ;
else
2021-10-29 21:25:12 +01:00
bytecode . emitAD ( LOP_NEWCLOSURE , target , pid ) ;
2022-06-17 01:52:23 +01:00
for ( const Capture & c : captures )
bytecode . emitABC ( LOP_CAPTURE , uint8_t ( c . type ) , c . data , 0 ) ;
2021-10-29 21:25:12 +01:00
}
LuauOpcode getUnaryOp ( AstExprUnary : : Op op )
{
switch ( op )
{
case AstExprUnary : : Not :
return LOP_NOT ;
case AstExprUnary : : Minus :
return LOP_MINUS ;
case AstExprUnary : : Len :
return LOP_LENGTH ;
default :
LUAU_ASSERT ( ! " Unexpected unary operation " ) ;
return LOP_NOP ;
}
}
LuauOpcode getBinaryOpArith ( AstExprBinary : : Op op , bool k = false )
{
switch ( op )
{
case AstExprBinary : : Add :
return k ? LOP_ADDK : LOP_ADD ;
case AstExprBinary : : Sub :
return k ? LOP_SUBK : LOP_SUB ;
case AstExprBinary : : Mul :
return k ? LOP_MULK : LOP_MUL ;
case AstExprBinary : : Div :
return k ? LOP_DIVK : LOP_DIV ;
2023-09-01 17:38:53 +01:00
case AstExprBinary : : FloorDiv :
LUAU_ASSERT ( FFlag : : LuauFloorDivision ) ;
return k ? LOP_IDIVK : LOP_IDIV ;
2021-10-29 21:25:12 +01:00
case AstExprBinary : : Mod :
return k ? LOP_MODK : LOP_MOD ;
case AstExprBinary : : Pow :
return k ? LOP_POWK : LOP_POW ;
default :
LUAU_ASSERT ( ! " Unexpected binary operation " ) ;
return LOP_NOP ;
}
}
LuauOpcode getJumpOpCompare ( AstExprBinary : : Op op , bool not_ = false )
{
switch ( op )
{
case AstExprBinary : : CompareNe :
return not_ ? LOP_JUMPIFEQ : LOP_JUMPIFNOTEQ ;
case AstExprBinary : : CompareEq :
return not_ ? LOP_JUMPIFNOTEQ : LOP_JUMPIFEQ ;
case AstExprBinary : : CompareLt :
case AstExprBinary : : CompareGt :
return not_ ? LOP_JUMPIFNOTLT : LOP_JUMPIFLT ;
case AstExprBinary : : CompareLe :
case AstExprBinary : : CompareGe :
return not_ ? LOP_JUMPIFNOTLE : LOP_JUMPIFLE ;
default :
LUAU_ASSERT ( ! " Unexpected binary operation " ) ;
return LOP_NOP ;
}
}
bool isConstant ( AstExpr * node )
{
const Constant * cv = constants . find ( node ) ;
return cv & & cv - > type ! = Constant : : Type_Unknown ;
}
bool isConstantTrue ( AstExpr * node )
{
const Constant * cv = constants . find ( node ) ;
return cv & & cv - > type ! = Constant : : Type_Unknown & & cv - > isTruthful ( ) ;
}
bool isConstantFalse ( AstExpr * node )
{
const Constant * cv = constants . find ( node ) ;
return cv & & cv - > type ! = Constant : : Type_Unknown & & ! cv - > isTruthful ( ) ;
}
2022-05-26 21:33:48 +01:00
Constant getConstant ( AstExpr * node )
{
const Constant * cv = constants . find ( node ) ;
return cv ? * cv : Constant { Constant : : Type_Unknown } ;
}
2021-10-29 21:25:12 +01:00
size_t compileCompareJump ( AstExprBinary * expr , bool not_ = false )
{
RegScope rs ( this ) ;
2022-08-04 22:27:28 +01:00
bool isEq = ( expr - > op = = AstExprBinary : : CompareEq | | expr - > op = = AstExprBinary : : CompareNe ) ;
2021-10-29 21:25:12 +01:00
AstExpr * left = expr - > left ;
AstExpr * right = expr - > right ;
bool operandIsConstant = isConstant ( right ) ;
if ( isEq & & ! operandIsConstant )
{
operandIsConstant = isConstant ( left ) ;
if ( operandIsConstant )
std : : swap ( left , right ) ;
}
2022-09-02 00:00:14 +01:00
uint8_t rl = compileExprAuto ( left , rs ) ;
2021-10-29 21:25:12 +01:00
2022-09-02 00:00:14 +01:00
if ( isEq & & operandIsConstant )
{
const Constant * cv = constants . find ( right ) ;
LUAU_ASSERT ( cv & & cv - > type ! = Constant : : Type_Unknown ) ;
2022-08-04 22:27:28 +01:00
2022-09-02 00:00:14 +01:00
LuauOpcode opc = LOP_NOP ;
int32_t cid = - 1 ;
uint32_t flip = ( expr - > op = = AstExprBinary : : CompareEq ) = = not_ ? 0x80000000 : 0 ;
2022-08-04 22:27:28 +01:00
2022-09-02 00:00:14 +01:00
switch ( cv - > type )
{
case Constant : : Type_Nil :
opc = LOP_JUMPXEQKNIL ;
cid = 0 ;
break ;
2022-08-04 22:27:28 +01:00
2022-09-02 00:00:14 +01:00
case Constant : : Type_Boolean :
opc = LOP_JUMPXEQKB ;
cid = cv - > valueBoolean ;
break ;
2022-08-04 22:27:28 +01:00
2022-09-02 00:00:14 +01:00
case Constant : : Type_Number :
opc = LOP_JUMPXEQKN ;
cid = getConstantIndex ( right ) ;
break ;
2022-08-04 22:27:28 +01:00
2022-09-02 00:00:14 +01:00
case Constant : : Type_String :
opc = LOP_JUMPXEQKS ;
cid = getConstantIndex ( right ) ;
break ;
2022-08-04 22:27:28 +01:00
2022-09-02 00:00:14 +01:00
default :
LUAU_ASSERT ( ! " Unexpected constant type " ) ;
2022-08-04 22:27:28 +01:00
}
2022-09-02 00:00:14 +01:00
if ( cid < 0 )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
2022-08-04 22:27:28 +01:00
2022-09-02 00:00:14 +01:00
size_t jumpLabel = bytecode . emitLabel ( ) ;
2022-08-04 22:27:28 +01:00
2022-09-02 00:00:14 +01:00
bytecode . emitAD ( opc , rl , 0 ) ;
bytecode . emitAux ( cid | flip ) ;
2022-08-04 22:27:28 +01:00
2022-09-02 00:00:14 +01:00
return jumpLabel ;
2021-10-29 21:25:12 +01:00
}
else
{
2022-08-04 22:27:28 +01:00
LuauOpcode opc = getJumpOpCompare ( expr - > op , not_ ) ;
2022-09-02 00:00:14 +01:00
uint8_t rr = compileExprAuto ( right , rs ) ;
2022-08-04 22:27:28 +01:00
size_t jumpLabel = bytecode . emitLabel ( ) ;
if ( expr - > op = = AstExprBinary : : CompareGt | | expr - > op = = AstExprBinary : : CompareGe )
{
2022-09-02 00:00:14 +01:00
bytecode . emitAD ( opc , rr , 0 ) ;
2022-08-04 22:27:28 +01:00
bytecode . emitAux ( rl ) ;
}
else
{
bytecode . emitAD ( opc , rl , 0 ) ;
bytecode . emitAux ( rr ) ;
}
return jumpLabel ;
}
2021-10-29 21:25:12 +01:00
}
int32_t getConstantNumber ( AstExpr * node )
{
const Constant * c = constants . find ( node ) ;
if ( c & & c - > type = = Constant : : Type_Number )
{
int cid = bytecode . addConstantNumber ( c - > valueNumber ) ;
if ( cid < 0 )
CompileError : : raise ( node - > location , " Exceeded constant limit; simplify the code to compile " ) ;
return cid ;
}
return - 1 ;
}
int32_t getConstantIndex ( AstExpr * node )
{
const Constant * c = constants . find ( node ) ;
2022-05-06 00:52:48 +01:00
if ( ! c | | c - > type = = Constant : : Type_Unknown )
2021-10-29 21:25:12 +01:00
return - 1 ;
int cid = - 1 ;
switch ( c - > type )
{
case Constant : : Type_Nil :
cid = bytecode . addConstantNil ( ) ;
break ;
case Constant : : Type_Boolean :
cid = bytecode . addConstantBoolean ( c - > valueBoolean ) ;
break ;
case Constant : : Type_Number :
cid = bytecode . addConstantNumber ( c - > valueNumber ) ;
break ;
case Constant : : Type_String :
2022-01-14 16:06:31 +00:00
cid = bytecode . addConstantString ( sref ( c - > getString ( ) ) ) ;
2021-10-29 21:25:12 +01:00
break ;
default :
LUAU_ASSERT ( ! " Unexpected constant type " ) ;
return - 1 ;
}
if ( cid < 0 )
CompileError : : raise ( node - > location , " Exceeded constant limit; simplify the code to compile " ) ;
return cid ;
}
// compile expr to target temp register
2021-11-05 02:42:00 +00:00
// if the expr (or not expr if onlyTruth is false) is truthy, jump via skipJump
// if the expr (or not expr if onlyTruth is false) is falsy, fall through (target isn't guaranteed to be updated in this case)
// if target is omitted, then the jump behavior is the same - skipJump or fallthrough depending on the truthiness of the expression
2021-10-29 21:25:12 +01:00
void compileConditionValue ( AstExpr * node , const uint8_t * target , std : : vector < size_t > & skipJump , bool onlyTruth )
{
// Optimization: we don't need to compute constant values
2022-05-26 21:33:48 +01:00
if ( const Constant * cv = constants . find ( node ) ; cv & & cv - > type ! = Constant : : Type_Unknown )
2021-10-29 21:25:12 +01:00
{
2021-11-05 02:42:00 +00:00
// note that we only need to compute the value if it's truthy; otherwise we cal fall through
2021-10-29 21:25:12 +01:00
if ( cv - > isTruthful ( ) = = onlyTruth )
{
if ( target )
compileExprTemp ( node , * target ) ;
skipJump . push_back ( bytecode . emitLabel ( ) ) ;
bytecode . emitAD ( LOP_JUMP , 0 , 0 ) ;
}
return ;
}
if ( AstExprBinary * expr = node - > as < AstExprBinary > ( ) )
{
switch ( expr - > op )
{
case AstExprBinary : : And :
case AstExprBinary : : Or :
{
2021-11-05 02:42:00 +00:00
// disambiguation: there's 4 cases (we only need truthy or falsy results based on onlyTruth)
2021-10-29 21:25:12 +01:00
// onlyTruth = 1: a and b transforms to a ? b : dontcare
2022-08-18 22:04:33 +01:00
// onlyTruth = 1: a or b transforms to a ? a : b
2021-10-29 21:25:12 +01:00
// onlyTruth = 0: a and b transforms to !a ? a : b
// onlyTruth = 0: a or b transforms to !a ? b : dontcare
if ( onlyTruth = = ( expr - > op = = AstExprBinary : : And ) )
{
// we need to compile the left hand side, and skip to "dontcare" (aka fallthrough of the entire statement) if it's not the same as
// onlyTruth if it's the same then the result of the expression is the right hand side because of this, we *never* care about the
// result of the left hand side
std : : vector < size_t > elseJump ;
compileConditionValue ( expr - > left , nullptr , elseJump , ! onlyTruth ) ;
// fallthrough indicates that we need to compute & return the right hand side
// we use compileConditionValue again to process any extra and/or statements directly
compileConditionValue ( expr - > right , target , skipJump , onlyTruth ) ;
size_t elseLabel = bytecode . emitLabel ( ) ;
patchJumps ( expr , elseJump , elseLabel ) ;
}
else
{
// we need to compute the left hand side first; note that we will jump to skipJump if we know the answer
compileConditionValue ( expr - > left , target , skipJump , onlyTruth ) ;
// we will fall through if computing the left hand didn't give us an "interesting" result
// we still use compileConditionValue to recursively optimize any and/or/compare statements
compileConditionValue ( expr - > right , target , skipJump , onlyTruth ) ;
}
return ;
}
break ;
case AstExprBinary : : CompareNe :
case AstExprBinary : : CompareEq :
case AstExprBinary : : CompareLt :
case AstExprBinary : : CompareLe :
case AstExprBinary : : CompareGt :
case AstExprBinary : : CompareGe :
{
if ( target )
{
// since target is a temp register, we'll initialize it to 1, and then jump if the comparison is true
2021-11-05 02:42:00 +00:00
// if the comparison is false, we'll fallthrough and target will still be 1 but target has unspecified value for falsy results
// when we only care about falsy values instead of truthy values, the process is the same but with flipped conditionals
2021-10-29 21:25:12 +01:00
bytecode . emitABC ( LOP_LOADB , * target , onlyTruth ? 1 : 0 , 0 ) ;
}
size_t jumpLabel = compileCompareJump ( expr , /* not= */ ! onlyTruth ) ;
skipJump . push_back ( jumpLabel ) ;
return ;
}
break ;
// fall-through to default path below
default : ;
}
}
if ( AstExprUnary * expr = node - > as < AstExprUnary > ( ) )
{
// if we *do* need to compute the target, we'd have to inject "not" ops on every return path
// this is possible but cumbersome; so for now we only optimize not expression when we *don't* need the value
if ( ! target & & expr - > op = = AstExprUnary : : Not )
{
compileConditionValue ( expr - > expr , target , skipJump , ! onlyTruth ) ;
return ;
}
}
if ( AstExprGroup * expr = node - > as < AstExprGroup > ( ) )
{
compileConditionValue ( expr - > expr , target , skipJump , onlyTruth ) ;
return ;
}
RegScope rs ( this ) ;
uint8_t reg ;
if ( target )
{
reg = * target ;
compileExprTemp ( node , reg ) ;
}
else
{
reg = compileExprAuto ( node , rs ) ;
}
skipJump . push_back ( bytecode . emitLabel ( ) ) ;
bytecode . emitAD ( onlyTruth ? LOP_JUMPIF : LOP_JUMPIFNOT , reg , 0 ) ;
}
// checks if compiling the expression as a condition value generates code that's faster than using compileExpr
bool isConditionFast ( AstExpr * node )
{
const Constant * cv = constants . find ( node ) ;
if ( cv & & cv - > type ! = Constant : : Type_Unknown )
return true ;
if ( AstExprBinary * expr = node - > as < AstExprBinary > ( ) )
{
switch ( expr - > op )
{
case AstExprBinary : : And :
case AstExprBinary : : Or :
return true ;
case AstExprBinary : : CompareNe :
case AstExprBinary : : CompareEq :
case AstExprBinary : : CompareLt :
case AstExprBinary : : CompareLe :
case AstExprBinary : : CompareGt :
case AstExprBinary : : CompareGe :
return true ;
default :
return false ;
}
}
if ( AstExprGroup * expr = node - > as < AstExprGroup > ( ) )
return isConditionFast ( expr - > expr ) ;
return false ;
}
void compileExprAndOr ( AstExprBinary * expr , uint8_t target , bool targetTemp )
{
bool and_ = ( expr - > op = = AstExprBinary : : And ) ;
RegScope rs ( this ) ;
// Optimization: when left hand side is a constant, we can emit left hand side or right hand side
2022-05-26 21:33:48 +01:00
if ( const Constant * cl = constants . find ( expr - > left ) ; cl & & cl - > type ! = Constant : : Type_Unknown )
2021-10-29 21:25:12 +01:00
{
compileExpr ( and_ = = cl - > isTruthful ( ) ? expr - > right : expr - > left , target , targetTemp ) ;
return ;
}
// Note: two optimizations below can lead to inefficient codegen when the left hand side is a condition
if ( ! isConditionFast ( expr - > left ) )
{
// Optimization: when right hand side is a local variable, we can use AND/OR
2022-05-20 00:46:52 +01:00
if ( int reg = getExprLocalReg ( expr - > right ) ; reg > = 0 )
2021-10-29 21:25:12 +01:00
{
uint8_t lr = compileExprAuto ( expr - > left , rs ) ;
2022-05-20 00:46:52 +01:00
uint8_t rr = uint8_t ( reg ) ;
2021-10-29 21:25:12 +01:00
bytecode . emitABC ( and_ ? LOP_AND : LOP_OR , target , lr , rr ) ;
return ;
}
// Optimization: when right hand side is a constant, we can use ANDK/ORK
int32_t cid = getConstantIndex ( expr - > right ) ;
if ( cid > = 0 & & cid < = 255 )
{
uint8_t lr = compileExprAuto ( expr - > left , rs ) ;
bytecode . emitABC ( and_ ? LOP_ANDK : LOP_ORK , target , lr , uint8_t ( cid ) ) ;
return ;
}
}
// Optimization: if target is a temp register, we can clobber it which allows us to compute the result directly into it
// If it's not a temp register, then something like `a = a > 1 or a + 2` may clobber `a` while evaluating left hand side, and `a+2` will break
uint8_t reg = targetTemp ? target : allocReg ( expr , 1 ) ;
std : : vector < size_t > skipJump ;
compileConditionValue ( expr - > left , & reg , skipJump , /* onlyTruth= */ ! and_ ) ;
compileExprTemp ( expr - > right , reg ) ;
size_t moveLabel = bytecode . emitLabel ( ) ;
patchJumps ( expr , skipJump , moveLabel ) ;
if ( target ! = reg )
bytecode . emitABC ( LOP_MOVE , target , reg , 0 ) ;
}
void compileExprUnary ( AstExprUnary * expr , uint8_t target )
{
RegScope rs ( this ) ;
uint8_t re = compileExprAuto ( expr - > expr , rs ) ;
bytecode . emitABC ( getUnaryOp ( expr - > op ) , target , re , 0 ) ;
}
static void unrollConcats ( std : : vector < AstExpr * > & args )
{
for ( ; ; )
{
AstExprBinary * be = args . back ( ) - > as < AstExprBinary > ( ) ;
if ( ! be | | be - > op ! = AstExprBinary : : Concat )
break ;
args . back ( ) = be - > left ;
args . push_back ( be - > right ) ;
}
}
void compileExprBinary ( AstExprBinary * expr , uint8_t target , bool targetTemp )
{
RegScope rs ( this ) ;
switch ( expr - > op )
{
case AstExprBinary : : Add :
case AstExprBinary : : Sub :
case AstExprBinary : : Mul :
case AstExprBinary : : Div :
2023-09-01 17:38:53 +01:00
case AstExprBinary : : FloorDiv :
2021-10-29 21:25:12 +01:00
case AstExprBinary : : Mod :
case AstExprBinary : : Pow :
{
2023-09-01 17:38:53 +01:00
LUAU_ASSERT ( FFlag : : LuauFloorDivision | | expr - > op ! = AstExprBinary : : FloorDiv ) ;
2021-10-29 21:25:12 +01:00
int32_t rc = getConstantNumber ( expr - > right ) ;
if ( rc > = 0 & & rc < = 255 )
{
uint8_t rl = compileExprAuto ( expr - > left , rs ) ;
bytecode . emitABC ( getBinaryOpArith ( expr - > op , /* k= */ true ) , target , rl , uint8_t ( rc ) ) ;
}
else
{
uint8_t rl = compileExprAuto ( expr - > left , rs ) ;
uint8_t rr = compileExprAuto ( expr - > right , rs ) ;
bytecode . emitABC ( getBinaryOpArith ( expr - > op ) , target , rl , rr ) ;
}
}
break ;
case AstExprBinary : : Concat :
{
std : : vector < AstExpr * > args = { expr - > left , expr - > right } ;
// unroll the tree of concats down the right hand side to be able to do multiple ops
unrollConcats ( args ) ;
uint8_t regs = allocReg ( expr , unsigned ( args . size ( ) ) ) ;
for ( size_t i = 0 ; i < args . size ( ) ; + + i )
compileExprTemp ( args [ i ] , uint8_t ( regs + i ) ) ;
bytecode . emitABC ( LOP_CONCAT , target , regs , uint8_t ( regs + args . size ( ) - 1 ) ) ;
}
break ;
case AstExprBinary : : CompareNe :
case AstExprBinary : : CompareEq :
case AstExprBinary : : CompareLt :
case AstExprBinary : : CompareLe :
case AstExprBinary : : CompareGt :
case AstExprBinary : : CompareGe :
{
size_t jumpLabel = compileCompareJump ( expr ) ;
// note: this skips over the next LOADB instruction because of "1" in the C slot
bytecode . emitABC ( LOP_LOADB , target , 0 , 1 ) ;
size_t thenLabel = bytecode . emitLabel ( ) ;
bytecode . emitABC ( LOP_LOADB , target , 1 , 0 ) ;
patchJump ( expr , jumpLabel , thenLabel ) ;
}
break ;
case AstExprBinary : : And :
case AstExprBinary : : Or :
{
compileExprAndOr ( expr , target , targetTemp ) ;
}
break ;
default :
LUAU_ASSERT ( ! " Unexpected binary operation " ) ;
}
}
2023-10-20 21:36:26 +01:00
void compileExprIfElseAndOr ( bool and_ , uint8_t creg , AstExpr * other , uint8_t target )
{
int32_t cid = getConstantIndex ( other ) ;
if ( cid > = 0 & & cid < = 255 )
{
bytecode . emitABC ( and_ ? LOP_ANDK : LOP_ORK , target , creg , uint8_t ( cid ) ) ;
}
else
{
RegScope rs ( this ) ;
uint8_t oreg = compileExprAuto ( other , rs ) ;
bytecode . emitABC ( and_ ? LOP_AND : LOP_OR , target , creg , oreg ) ;
}
}
2021-10-29 21:25:12 +01:00
void compileExprIfElse ( AstExprIfElse * expr , uint8_t target , bool targetTemp )
{
if ( isConstant ( expr - > condition ) )
{
if ( isConstantTrue ( expr - > condition ) )
{
compileExpr ( expr - > trueExpr , target , targetTemp ) ;
}
else
{
compileExpr ( expr - > falseExpr , target , targetTemp ) ;
}
}
else
{
2023-10-20 21:36:26 +01:00
if ( FFlag : : LuauCompileIfElseAndOr )
{
// Optimization: convert some if..then..else expressions into and/or when the other side has no side effects and is very cheap to compute
// if v then v else e => v or e
// if v then e else v => v and e
if ( int creg = getExprLocalReg ( expr - > condition ) ; creg > = 0 )
{
if ( creg = = getExprLocalReg ( expr - > trueExpr ) & & ( getExprLocalReg ( expr - > falseExpr ) > = 0 | | isConstant ( expr - > falseExpr ) ) )
return compileExprIfElseAndOr ( /* and_= */ false , uint8_t ( creg ) , expr - > falseExpr , target ) ;
else if ( creg = = getExprLocalReg ( expr - > falseExpr ) & & ( getExprLocalReg ( expr - > trueExpr ) > = 0 | | isConstant ( expr - > trueExpr ) ) )
return compileExprIfElseAndOr ( /* and_= */ true , uint8_t ( creg ) , expr - > trueExpr , target ) ;
}
}
2021-10-29 21:25:12 +01:00
std : : vector < size_t > elseJump ;
compileConditionValue ( expr - > condition , nullptr , elseJump , false ) ;
compileExpr ( expr - > trueExpr , target , targetTemp ) ;
// Jump over else expression evaluation
size_t thenLabel = bytecode . emitLabel ( ) ;
bytecode . emitAD ( LOP_JUMP , 0 , 0 ) ;
size_t elseLabel = bytecode . emitLabel ( ) ;
compileExpr ( expr - > falseExpr , target , targetTemp ) ;
size_t endLabel = bytecode . emitLabel ( ) ;
patchJumps ( expr , elseJump , elseLabel ) ;
patchJump ( expr , thenLabel , endLabel ) ;
}
}
2022-08-25 21:55:08 +01:00
void compileExprInterpString ( AstExprInterpString * expr , uint8_t target , bool targetTemp )
{
size_t formatCapacity = 0 ;
for ( AstArray < char > string : expr - > strings )
{
formatCapacity + = string . size + std : : count ( string . data , string . data + string . size , ' % ' ) ;
}
std : : string formatString ;
formatString . reserve ( formatCapacity ) ;
size_t stringsLeft = expr - > strings . size ;
for ( AstArray < char > string : expr - > strings )
{
if ( memchr ( string . data , ' % ' , string . size ) )
{
for ( size_t characterIndex = 0 ; characterIndex < string . size ; + + characterIndex )
{
char character = string . data [ characterIndex ] ;
formatString . push_back ( character ) ;
if ( character = = ' % ' )
formatString . push_back ( ' % ' ) ;
}
}
else
formatString . append ( string . data , string . size ) ;
stringsLeft - - ;
if ( stringsLeft > 0 )
formatString + = " %* " ;
}
size_t formatStringSize = formatString . size ( ) ;
// We can't use formatStringRef.data() directly, because short strings don't have their data
// pinned in memory, so when interpFormatStrings grows, these pointers will move and become invalid.
std : : unique_ptr < char [ ] > formatStringPtr ( new char [ formatStringSize ] ) ;
memcpy ( formatStringPtr . get ( ) , formatString . data ( ) , formatStringSize ) ;
AstArray < char > formatStringArray { formatStringPtr . get ( ) , formatStringSize } ;
interpStrings . emplace_back ( std : : move ( formatStringPtr ) ) ; // invalidates formatStringPtr, but keeps formatStringArray intact
int32_t formatStringIndex = bytecode . addConstantString ( sref ( formatStringArray ) ) ;
if ( formatStringIndex < 0 )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
RegScope rs ( this ) ;
2023-02-03 12:34:12 +00:00
uint8_t baseReg = allocReg ( expr , unsigned ( 2 + expr - > expressions . size ) ) ;
2022-08-25 21:55:08 +01:00
emitLoadK ( baseReg , formatStringIndex ) ;
for ( size_t index = 0 ; index < expr - > expressions . size ; + + index )
compileExprTempTop ( expr - > expressions . data [ index ] , uint8_t ( baseReg + 2 + index ) ) ;
BytecodeBuilder : : StringRef formatMethod = sref ( AstName ( " format " ) ) ;
int32_t formatMethodIndex = bytecode . addConstantString ( formatMethod ) ;
if ( formatMethodIndex < 0 )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
bytecode . emitABC ( LOP_NAMECALL , baseReg , baseReg , uint8_t ( BytecodeBuilder : : getStringHash ( formatMethod ) ) ) ;
bytecode . emitAux ( formatMethodIndex ) ;
bytecode . emitABC ( LOP_CALL , baseReg , uint8_t ( expr - > expressions . size + 2 ) , 2 ) ;
bytecode . emitABC ( LOP_MOVE , target , baseReg , 0 ) ;
}
2021-10-29 21:25:12 +01:00
static uint8_t encodeHashSize ( unsigned int hashSize )
{
size_t hashSizeLog2 = 0 ;
while ( ( 1u < < hashSizeLog2 ) < hashSize )
hashSizeLog2 + + ;
return hashSize = = 0 ? 0 : uint8_t ( hashSizeLog2 + 1 ) ;
}
void compileExprTable ( AstExprTable * expr , uint8_t target , bool targetTemp )
{
// Optimization: if the table is empty, we can compute it directly into the target
if ( expr - > items . size = = 0 )
{
2022-01-14 16:06:31 +00:00
TableShape shape = tableShapes [ expr ] ;
2021-10-29 21:25:12 +01:00
2022-10-13 23:59:53 +01:00
bytecode . addDebugRemark ( " allocation: table hash %d " , shape . hashSize ) ;
2022-01-14 16:06:31 +00:00
bytecode . emitABC ( LOP_NEWTABLE , target , encodeHashSize ( shape . hashSize ) , 0 ) ;
bytecode . emitAux ( shape . arraySize ) ;
2021-10-29 21:25:12 +01:00
return ;
}
unsigned int arraySize = 0 ;
unsigned int hashSize = 0 ;
unsigned int recordSize = 0 ;
unsigned int indexSize = 0 ;
for ( size_t i = 0 ; i < expr - > items . size ; + + i )
{
const AstExprTable : : Item & item = expr - > items . data [ i ] ;
arraySize + = ( item . kind = = AstExprTable : : Item : : List ) ;
hashSize + = ( item . kind ! = AstExprTable : : Item : : List ) ;
recordSize + = ( item . kind = = AstExprTable : : Item : : Record ) ;
}
// Optimization: allocate sequential explicitly specified numeric indices ([1]) as arrays
if ( arraySize = = 0 & & hashSize > 0 )
{
for ( size_t i = 0 ; i < expr - > items . size ; + + i )
{
const AstExprTable : : Item & item = expr - > items . data [ i ] ;
2022-01-27 21:29:34 +00:00
LUAU_ASSERT ( item . key ) ; // no list portion => all items have keys
2022-02-11 18:43:14 +00:00
const Constant * ckey = constants . find ( item . key ) ;
2021-10-29 21:25:12 +01:00
2022-02-11 18:43:14 +00:00
indexSize + = ( ckey & & ckey - > type = = Constant : : Type_Number & & ckey - > valueNumber = = double ( indexSize + 1 ) ) ;
2021-10-29 21:25:12 +01:00
}
// we only perform the optimization if we don't have any other []-keys
// technically it's "safe" to do this even if we have other keys, but doing so changes iteration order and may break existing code
if ( hashSize = = recordSize + indexSize )
hashSize = recordSize ;
else
indexSize = 0 ;
}
int encodedHashSize = encodeHashSize ( hashSize ) ;
RegScope rs ( this ) ;
// Optimization: if target is a temp register, we can clobber it which allows us to compute the result directly into it
uint8_t reg = targetTemp ? target : allocReg ( expr , 1 ) ;
// Optimization: when all items are record fields, use template tables to compile expression
if ( arraySize = = 0 & & indexSize = = 0 & & hashSize = = recordSize & & recordSize > = 1 & & recordSize < = BytecodeBuilder : : TableShape : : kMaxLength )
{
BytecodeBuilder : : TableShape shape ;
for ( size_t i = 0 ; i < expr - > items . size ; + + i )
{
const AstExprTable : : Item & item = expr - > items . data [ i ] ;
LUAU_ASSERT ( item . kind = = AstExprTable : : Item : : Record ) ;
AstExprConstantString * ckey = item . key - > as < AstExprConstantString > ( ) ;
LUAU_ASSERT ( ckey ) ;
int cid = bytecode . addConstantString ( sref ( ckey - > value ) ) ;
if ( cid < 0 )
CompileError : : raise ( ckey - > location , " Exceeded constant limit; simplify the code to compile " ) ;
LUAU_ASSERT ( shape . length < BytecodeBuilder : : TableShape : : kMaxLength ) ;
shape . keys [ shape . length + + ] = int16_t ( cid ) ;
}
int32_t tid = bytecode . addConstantTable ( shape ) ;
if ( tid < 0 )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
2022-10-13 23:59:53 +01:00
bytecode . addDebugRemark ( " allocation: table template %d " , hashSize ) ;
2021-10-29 21:25:12 +01:00
if ( tid < 32768 )
{
bytecode . emitAD ( LOP_DUPTABLE , reg , int16_t ( tid ) ) ;
}
else
{
2022-01-14 16:06:31 +00:00
bytecode . emitABC ( LOP_NEWTABLE , reg , uint8_t ( encodedHashSize ) , 0 ) ;
2021-10-29 21:25:12 +01:00
bytecode . emitAux ( 0 ) ;
}
}
else
{
// Optimization: instead of allocating one extra element when the last element of the table literal is ..., let SETLIST allocate the
// correct amount of storage
const AstExprTable : : Item * last = expr - > items . size > 0 ? & expr - > items . data [ expr - > items . size - 1 ] : nullptr ;
bool trailingVarargs = last & & last - > kind = = AstExprTable : : Item : : List & & last - > value - > is < AstExprVarargs > ( ) ;
LUAU_ASSERT ( ! trailingVarargs | | arraySize > 0 ) ;
2022-10-13 23:59:53 +01:00
unsigned int arrayAllocation = arraySize - trailingVarargs + indexSize ;
if ( hashSize = = 0 )
bytecode . addDebugRemark ( " allocation: table array %d " , arrayAllocation ) ;
else if ( arrayAllocation = = 0 )
bytecode . addDebugRemark ( " allocation: table hash %d " , hashSize ) ;
else
bytecode . addDebugRemark ( " allocation: table hash %d array %d " , hashSize , arrayAllocation ) ;
2022-01-14 16:06:31 +00:00
bytecode . emitABC ( LOP_NEWTABLE , reg , uint8_t ( encodedHashSize ) , 0 ) ;
2022-10-13 23:59:53 +01:00
bytecode . emitAux ( arrayAllocation ) ;
2021-10-29 21:25:12 +01:00
}
unsigned int arrayChunkSize = std : : min ( 16u , arraySize ) ;
uint8_t arrayChunkReg = allocReg ( expr , arrayChunkSize ) ;
unsigned int arrayChunkCurrent = 0 ;
unsigned int arrayIndex = 1 ;
bool multRet = false ;
for ( size_t i = 0 ; i < expr - > items . size ; + + i )
{
const AstExprTable : : Item & item = expr - > items . data [ i ] ;
AstExpr * key = item . key ;
AstExpr * value = item . value ;
// some key/value pairs don't require us to compile the expressions, so we need to setup the line info here
setDebugLine ( value ) ;
if ( options . coverageLevel > = 2 )
{
bytecode . emitABC ( LOP_COVERAGE , 0 , 0 , 0 ) ;
}
// flush array chunk on overflow or before hash keys to maintain insertion order
if ( arrayChunkCurrent > 0 & & ( key | | arrayChunkCurrent = = arrayChunkSize ) )
{
bytecode . emitABC ( LOP_SETLIST , reg , arrayChunkReg , uint8_t ( arrayChunkCurrent + 1 ) ) ;
bytecode . emitAux ( arrayIndex ) ;
arrayIndex + = arrayChunkCurrent ;
arrayChunkCurrent = 0 ;
}
2022-01-27 21:29:34 +00:00
// items with a key are set one by one via SETTABLE/SETTABLEKS/SETTABLEN
2021-10-29 21:25:12 +01:00
if ( key )
{
RegScope rsi ( this ) ;
2022-02-11 18:43:14 +00:00
LValue lv = compileLValueIndex ( reg , key , rsi ) ;
uint8_t rv = compileExprAuto ( value , rsi ) ;
2021-10-29 21:25:12 +01:00
2022-02-11 18:43:14 +00:00
compileAssign ( lv , rv ) ;
2021-10-29 21:25:12 +01:00
}
// items without a key are set using SETLIST so that we can initialize large arrays quickly
else
{
uint8_t temp = uint8_t ( arrayChunkReg + arrayChunkCurrent ) ;
if ( i + 1 = = expr - > items . size )
multRet = compileExprTempMultRet ( value , temp ) ;
else
compileExprTempTop ( value , temp ) ;
arrayChunkCurrent + + ;
}
}
// flush last array chunk; note that this needs multret handling if the last expression was multret
if ( arrayChunkCurrent )
{
bytecode . emitABC ( LOP_SETLIST , reg , arrayChunkReg , multRet ? 0 : uint8_t ( arrayChunkCurrent + 1 ) ) ;
bytecode . emitAux ( arrayIndex ) ;
}
if ( target ! = reg )
bytecode . emitABC ( LOP_MOVE , target , reg , 0 ) ;
}
bool canImport ( AstExprGlobal * expr )
{
2022-01-14 16:06:31 +00:00
return options . optimizationLevel > = 1 & & getGlobalState ( globals , expr - > name ) ! = Global : : Written ;
2021-10-29 21:25:12 +01:00
}
bool canImportChain ( AstExprGlobal * expr )
{
2022-01-14 16:06:31 +00:00
return options . optimizationLevel > = 1 & & getGlobalState ( globals , expr - > name ) = = Global : : Default ;
2021-10-29 21:25:12 +01:00
}
void compileExprIndexName ( AstExprIndexName * expr , uint8_t target )
{
setDebugLine ( expr ) ; // normally compileExpr sets up line info, but compileExprIndexName can be called directly
// Optimization: index chains that start from global variables can be compiled into GETIMPORT statement
AstExprGlobal * importRoot = 0 ;
AstExprIndexName * import1 = 0 ;
AstExprIndexName * import2 = 0 ;
if ( AstExprIndexName * index = expr - > expr - > as < AstExprIndexName > ( ) )
{
importRoot = index - > expr - > as < AstExprGlobal > ( ) ;
import1 = index ;
import2 = expr ;
}
else
{
importRoot = expr - > expr - > as < AstExprGlobal > ( ) ;
import1 = expr ;
}
if ( importRoot & & canImportChain ( importRoot ) )
{
int32_t id0 = bytecode . addConstantString ( sref ( importRoot - > name ) ) ;
int32_t id1 = bytecode . addConstantString ( sref ( import1 - > index ) ) ;
int32_t id2 = import2 ? bytecode . addConstantString ( sref ( import2 - > index ) ) : - 1 ;
if ( id0 < 0 | | id1 < 0 | | ( import2 & & id2 < 0 ) )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
// Note: GETIMPORT encoding is limited to 10 bits per object id component
if ( id0 < 1024 & & id1 < 1024 & & id2 < 1024 )
{
uint32_t iid = import2 ? BytecodeBuilder : : getImportId ( id0 , id1 , id2 ) : BytecodeBuilder : : getImportId ( id0 , id1 ) ;
int32_t cid = bytecode . addImport ( iid ) ;
if ( cid > = 0 & & cid < 32768 )
{
bytecode . emitAD ( LOP_GETIMPORT , target , int16_t ( cid ) ) ;
bytecode . emitAux ( iid ) ;
return ;
}
}
}
RegScope rs ( this ) ;
uint8_t reg = compileExprAuto ( expr - > expr , rs ) ;
2021-12-02 23:20:08 +00:00
setDebugLine ( expr - > indexLocation ) ;
2021-10-29 21:25:12 +01:00
BytecodeBuilder : : StringRef iname = sref ( expr - > index ) ;
int32_t cid = bytecode . addConstantString ( iname ) ;
if ( cid < 0 )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
bytecode . emitABC ( LOP_GETTABLEKS , target , reg , uint8_t ( BytecodeBuilder : : getStringHash ( iname ) ) ) ;
bytecode . emitAux ( cid ) ;
}
void compileExprIndexExpr ( AstExprIndexExpr * expr , uint8_t target )
{
RegScope rs ( this ) ;
2022-05-26 21:33:48 +01:00
Constant cv = getConstant ( expr - > index ) ;
2021-10-29 21:25:12 +01:00
2022-05-26 21:33:48 +01:00
if ( cv . type = = Constant : : Type_Number & & cv . valueNumber > = 1 & & cv . valueNumber < = 256 & & double ( int ( cv . valueNumber ) ) = = cv . valueNumber )
2021-10-29 21:25:12 +01:00
{
2022-05-26 21:33:48 +01:00
uint8_t i = uint8_t ( int ( cv . valueNumber ) - 1 ) ;
2021-10-29 21:25:12 +01:00
2022-05-06 00:52:48 +01:00
uint8_t rt = compileExprAuto ( expr - > expr , rs ) ;
2022-02-11 18:43:14 +00:00
setDebugLine ( expr - > index ) ;
2022-01-27 21:29:34 +00:00
2021-10-29 21:25:12 +01:00
bytecode . emitABC ( LOP_GETTABLEN , target , rt , i ) ;
}
2022-05-26 21:33:48 +01:00
else if ( cv . type = = Constant : : Type_String )
2021-10-29 21:25:12 +01:00
{
2022-05-26 21:33:48 +01:00
BytecodeBuilder : : StringRef iname = sref ( cv . getString ( ) ) ;
2021-10-29 21:25:12 +01:00
int32_t cid = bytecode . addConstantString ( iname ) ;
if ( cid < 0 )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
2022-05-06 00:52:48 +01:00
uint8_t rt = compileExprAuto ( expr - > expr , rs ) ;
2022-02-11 18:43:14 +00:00
setDebugLine ( expr - > index ) ;
2022-01-27 21:29:34 +00:00
2021-10-29 21:25:12 +01:00
bytecode . emitABC ( LOP_GETTABLEKS , target , rt , uint8_t ( BytecodeBuilder : : getStringHash ( iname ) ) ) ;
bytecode . emitAux ( cid ) ;
}
else
{
uint8_t rt = compileExprAuto ( expr - > expr , rs ) ;
uint8_t ri = compileExprAuto ( expr - > index , rs ) ;
bytecode . emitABC ( LOP_GETTABLE , target , rt , ri ) ;
}
}
void compileExprGlobal ( AstExprGlobal * expr , uint8_t target )
{
// Optimization: builtin globals can be retrieved using GETIMPORT
if ( canImport ( expr ) )
{
int32_t id0 = bytecode . addConstantString ( sref ( expr - > name ) ) ;
if ( id0 < 0 )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
// Note: GETIMPORT encoding is limited to 10 bits per object id component
if ( id0 < 1024 )
{
uint32_t iid = BytecodeBuilder : : getImportId ( id0 ) ;
int32_t cid = bytecode . addImport ( iid ) ;
if ( cid > = 0 & & cid < 32768 )
{
bytecode . emitAD ( LOP_GETIMPORT , target , int16_t ( cid ) ) ;
bytecode . emitAux ( iid ) ;
return ;
}
}
}
BytecodeBuilder : : StringRef gname = sref ( expr - > name ) ;
int32_t cid = bytecode . addConstantString ( gname ) ;
if ( cid < 0 )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
bytecode . emitABC ( LOP_GETGLOBAL , target , 0 , uint8_t ( BytecodeBuilder : : getStringHash ( gname ) ) ) ;
bytecode . emitAux ( cid ) ;
}
void compileExprConstant ( AstExpr * node , const Constant * cv , uint8_t target )
{
switch ( cv - > type )
{
case Constant : : Type_Nil :
bytecode . emitABC ( LOP_LOADNIL , target , 0 , 0 ) ;
break ;
case Constant : : Type_Boolean :
bytecode . emitABC ( LOP_LOADB , target , cv - > valueBoolean , 0 ) ;
break ;
case Constant : : Type_Number :
{
double d = cv - > valueNumber ;
if ( d > = std : : numeric_limits < int16_t > : : min ( ) & & d < = std : : numeric_limits < int16_t > : : max ( ) & & double ( int16_t ( d ) ) = = d & &
! ( d = = 0.0 & & signbit ( d ) ) )
{
// short number encoding: doesn't require a table entry lookup
bytecode . emitAD ( LOP_LOADN , target , int16_t ( d ) ) ;
}
else
{
// long number encoding: use generic constant path
int32_t cid = bytecode . addConstantNumber ( d ) ;
if ( cid < 0 )
CompileError : : raise ( node - > location , " Exceeded constant limit; simplify the code to compile " ) ;
emitLoadK ( target , cid ) ;
}
}
break ;
case Constant : : Type_String :
{
2022-01-14 16:06:31 +00:00
int32_t cid = bytecode . addConstantString ( sref ( cv - > getString ( ) ) ) ;
2021-10-29 21:25:12 +01:00
if ( cid < 0 )
CompileError : : raise ( node - > location , " Exceeded constant limit; simplify the code to compile " ) ;
emitLoadK ( target , cid ) ;
}
break ;
default :
LUAU_ASSERT ( ! " Unexpected constant type " ) ;
}
}
void compileExpr ( AstExpr * node , uint8_t target , bool targetTemp = false )
{
setDebugLine ( node ) ;
if ( options . coverageLevel > = 2 & & needsCoverage ( node ) )
{
bytecode . emitABC ( LOP_COVERAGE , 0 , 0 , 0 ) ;
}
// Optimization: if expression has a constant value, we can emit it directly
2022-05-26 21:33:48 +01:00
if ( const Constant * cv = constants . find ( node ) ; cv & & cv - > type ! = Constant : : Type_Unknown )
2021-10-29 21:25:12 +01:00
{
2022-05-26 21:33:48 +01:00
compileExprConstant ( node , cv , target ) ;
return ;
2021-10-29 21:25:12 +01:00
}
if ( AstExprGroup * expr = node - > as < AstExprGroup > ( ) )
{
compileExpr ( expr - > expr , target , targetTemp ) ;
}
else if ( node - > is < AstExprConstantNil > ( ) )
{
bytecode . emitABC ( LOP_LOADNIL , target , 0 , 0 ) ;
}
else if ( AstExprConstantBool * expr = node - > as < AstExprConstantBool > ( ) )
{
bytecode . emitABC ( LOP_LOADB , target , expr - > value , 0 ) ;
}
else if ( AstExprConstantNumber * expr = node - > as < AstExprConstantNumber > ( ) )
{
int32_t cid = bytecode . addConstantNumber ( expr - > value ) ;
if ( cid < 0 )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
emitLoadK ( target , cid ) ;
}
else if ( AstExprConstantString * expr = node - > as < AstExprConstantString > ( ) )
{
int32_t cid = bytecode . addConstantString ( sref ( expr - > value ) ) ;
if ( cid < 0 )
CompileError : : raise ( expr - > location , " Exceeded constant limit; simplify the code to compile " ) ;
emitLoadK ( target , cid ) ;
}
else if ( AstExprLocal * expr = node - > as < AstExprLocal > ( ) )
{
2022-05-20 00:46:52 +01:00
// note: this can't check expr->upvalue because upvalues may be upgraded to locals during inlining
if ( int reg = getExprLocalReg ( expr ) ; reg > = 0 )
2021-10-29 21:25:12 +01:00
{
2023-01-06 16:07:19 +00:00
// Optimization: we don't need to move if target happens to be in the same register
2023-02-03 12:34:12 +00:00
if ( options . optimizationLevel = = 0 | | target ! = reg )
2023-01-06 16:07:19 +00:00
bytecode . emitABC ( LOP_MOVE , target , uint8_t ( reg ) , 0 ) ;
2021-10-29 21:25:12 +01:00
}
else
{
2022-05-20 00:46:52 +01:00
LUAU_ASSERT ( expr - > upvalue ) ;
uint8_t uid = getUpval ( expr - > local ) ;
2021-10-29 21:25:12 +01:00
2022-05-20 00:46:52 +01:00
bytecode . emitABC ( LOP_GETUPVAL , target , uid , 0 ) ;
2021-10-29 21:25:12 +01:00
}
}
else if ( AstExprGlobal * expr = node - > as < AstExprGlobal > ( ) )
{
compileExprGlobal ( expr , target ) ;
}
else if ( AstExprVarargs * expr = node - > as < AstExprVarargs > ( ) )
{
compileExprVarargs ( expr , target , /* targetCount= */ 1 ) ;
}
else if ( AstExprCall * expr = node - > as < AstExprCall > ( ) )
{
// Optimization: when targeting temporary registers, we can compile call in a special mode that doesn't require extra register moves
if ( targetTemp & & target = = regTop - 1 )
compileExprCall ( expr , target , 1 , /* targetTop= */ true ) ;
else
compileExprCall ( expr , target , /* targetCount= */ 1 ) ;
}
else if ( AstExprIndexName * expr = node - > as < AstExprIndexName > ( ) )
{
compileExprIndexName ( expr , target ) ;
}
else if ( AstExprIndexExpr * expr = node - > as < AstExprIndexExpr > ( ) )
{
compileExprIndexExpr ( expr , target ) ;
}
else if ( AstExprFunction * expr = node - > as < AstExprFunction > ( ) )
{
compileExprFunction ( expr , target ) ;
}
else if ( AstExprTable * expr = node - > as < AstExprTable > ( ) )
{
compileExprTable ( expr , target , targetTemp ) ;
}
else if ( AstExprUnary * expr = node - > as < AstExprUnary > ( ) )
{
compileExprUnary ( expr , target ) ;
}
else if ( AstExprBinary * expr = node - > as < AstExprBinary > ( ) )
{
compileExprBinary ( expr , target , targetTemp ) ;
}
else if ( AstExprTypeAssertion * expr = node - > as < AstExprTypeAssertion > ( ) )
{
compileExpr ( expr - > expr , target , targetTemp ) ;
}
2022-01-14 16:06:31 +00:00
else if ( AstExprIfElse * expr = node - > as < AstExprIfElse > ( ) )
2021-10-29 21:25:12 +01:00
{
compileExprIfElse ( expr , target , targetTemp ) ;
}
2023-01-27 21:28:45 +00:00
else if ( AstExprInterpString * interpString = node - > as < AstExprInterpString > ( ) )
2022-08-25 21:55:08 +01:00
{
compileExprInterpString ( interpString , target , targetTemp ) ;
}
2021-10-29 21:25:12 +01:00
else
{
LUAU_ASSERT ( ! " Unknown expression type " ) ;
}
}
void compileExprTemp ( AstExpr * node , uint8_t target )
{
return compileExpr ( node , target , /* targetTemp= */ true ) ;
}
uint8_t compileExprAuto ( AstExpr * node , RegScope & )
{
// Optimization: directly return locals instead of copying them to a temporary
2022-05-20 00:46:52 +01:00
if ( int reg = getExprLocalReg ( node ) ; reg > = 0 )
return uint8_t ( reg ) ;
2021-10-29 21:25:12 +01:00
// note: the register is owned by the parent scope
uint8_t reg = allocReg ( node , 1 ) ;
compileExprTemp ( node , reg ) ;
return reg ;
}
2022-08-11 21:42:54 +01:00
// initializes target..target+targetCount-1 range using expression
// if expression is a call/vararg, we assume it returns all values, otherwise we fill the rest with nil
// assumes target register range can be clobbered and is at the top of the register space if targetTop = true
void compileExprTempN ( AstExpr * node , uint8_t target , uint8_t targetCount , bool targetTop )
{
// we assume that target range is at the top of the register space and can be clobbered
// this is what allows us to compile the last call expression - if it's a call - using targetTop=true
LUAU_ASSERT ( ! targetTop | | unsigned ( target + targetCount ) = = regTop ) ;
if ( AstExprCall * expr = node - > as < AstExprCall > ( ) )
{
compileExprCall ( expr , target , targetCount , targetTop ) ;
}
else if ( AstExprVarargs * expr = node - > as < AstExprVarargs > ( ) )
{
compileExprVarargs ( expr , target , targetCount ) ;
}
else
{
compileExprTemp ( node , target ) ;
for ( size_t i = 1 ; i < targetCount ; + + i )
bytecode . emitABC ( LOP_LOADNIL , uint8_t ( target + i ) , 0 , 0 ) ;
}
}
2021-10-29 21:25:12 +01:00
// initializes target..target+targetCount-1 range using expressions from the list
2022-08-11 21:42:54 +01:00
// if list has fewer expressions, and last expression is multret, we assume it returns the rest of the values
// if list has fewer expressions, and last expression isn't multret, we fill the rest with nil
2022-05-06 00:52:48 +01:00
// assumes target register range can be clobbered and is at the top of the register space if targetTop = true
void compileExprListTemp ( const AstArray < AstExpr * > & list , uint8_t target , uint8_t targetCount , bool targetTop )
2021-10-29 21:25:12 +01:00
{
// we assume that target range is at the top of the register space and can be clobbered
// this is what allows us to compile the last call expression - if it's a call - using targetTop=true
2022-05-06 00:52:48 +01:00
LUAU_ASSERT ( ! targetTop | | unsigned ( target + targetCount ) = = regTop ) ;
2021-10-29 21:25:12 +01:00
if ( list . size = = targetCount )
{
for ( size_t i = 0 ; i < list . size ; + + i )
compileExprTemp ( list . data [ i ] , uint8_t ( target + i ) ) ;
}
else if ( list . size > targetCount )
{
for ( size_t i = 0 ; i < targetCount ; + + i )
compileExprTemp ( list . data [ i ] , uint8_t ( target + i ) ) ;
2022-05-20 00:46:52 +01:00
// evaluate extra expressions for side effects
2021-10-29 21:25:12 +01:00
for ( size_t i = targetCount ; i < list . size ; + + i )
{
RegScope rsi ( this ) ;
compileExprAuto ( list . data [ i ] , rsi ) ;
}
}
else if ( list . size > 0 )
{
for ( size_t i = 0 ; i < list . size - 1 ; + + i )
compileExprTemp ( list . data [ i ] , uint8_t ( target + i ) ) ;
2022-08-11 21:42:54 +01:00
compileExprTempN ( list . data [ list . size - 1 ] , uint8_t ( target + list . size - 1 ) , uint8_t ( targetCount - ( list . size - 1 ) ) , targetTop ) ;
2021-10-29 21:25:12 +01:00
}
else
{
for ( size_t i = 0 ; i < targetCount ; + + i )
bytecode . emitABC ( LOP_LOADNIL , uint8_t ( target + i ) , 0 , 0 ) ;
}
}
struct LValue
{
enum Kind
{
Kind_Local ,
Kind_Upvalue ,
Kind_Global ,
Kind_IndexName ,
Kind_IndexNumber ,
Kind_IndexExpr ,
} ;
Kind kind ;
uint8_t reg ; // register for local (Local) or table (Index*)
uint8_t upval ;
uint8_t index ; // register for index in IndexExpr
uint8_t number ; // index-1 (0-255) in IndexNumber
BytecodeBuilder : : StringRef name ;
Location location ;
} ;
2022-01-27 21:29:34 +00:00
LValue compileLValueIndex ( uint8_t reg , AstExpr * index , RegScope & rs )
{
2022-05-26 21:33:48 +01:00
Constant cv = getConstant ( index ) ;
2022-01-27 21:29:34 +00:00
2022-05-26 21:33:48 +01:00
if ( cv . type = = Constant : : Type_Number & & cv . valueNumber > = 1 & & cv . valueNumber < = 256 & & double ( int ( cv . valueNumber ) ) = = cv . valueNumber )
2022-01-27 21:29:34 +00:00
{
LValue result = { LValue : : Kind_IndexNumber } ;
result . reg = reg ;
2022-05-26 21:33:48 +01:00
result . number = uint8_t ( int ( cv . valueNumber ) - 1 ) ;
2022-01-27 21:29:34 +00:00
result . location = index - > location ;
return result ;
}
2022-05-26 21:33:48 +01:00
else if ( cv . type = = Constant : : Type_String )
2022-01-27 21:29:34 +00:00
{
LValue result = { LValue : : Kind_IndexName } ;
result . reg = reg ;
2022-05-26 21:33:48 +01:00
result . name = sref ( cv . getString ( ) ) ;
2022-01-27 21:29:34 +00:00
result . location = index - > location ;
return result ;
}
else
{
LValue result = { LValue : : Kind_IndexExpr } ;
result . reg = reg ;
result . index = compileExprAuto ( index , rs ) ;
result . location = index - > location ;
return result ;
}
}
2021-10-29 21:25:12 +01:00
LValue compileLValue ( AstExpr * node , RegScope & rs )
{
setDebugLine ( node ) ;
if ( AstExprLocal * expr = node - > as < AstExprLocal > ( ) )
{
2022-05-20 00:46:52 +01:00
// note: this can't check expr->upvalue because upvalues may be upgraded to locals during inlining
if ( int reg = getExprLocalReg ( expr ) ; reg > = 0 )
2021-10-29 21:25:12 +01:00
{
2022-05-20 00:46:52 +01:00
LValue result = { LValue : : Kind_Local } ;
result . reg = uint8_t ( reg ) ;
2021-10-29 21:25:12 +01:00
result . location = node - > location ;
return result ;
}
else
{
2022-05-20 00:46:52 +01:00
LUAU_ASSERT ( expr - > upvalue ) ;
LValue result = { LValue : : Kind_Upvalue } ;
result . upval = getUpval ( expr - > local ) ;
2021-10-29 21:25:12 +01:00
result . location = node - > location ;
return result ;
}
}
else if ( AstExprGlobal * expr = node - > as < AstExprGlobal > ( ) )
{
LValue result = { LValue : : Kind_Global } ;
result . name = sref ( expr - > name ) ;
result . location = node - > location ;
return result ;
}
else if ( AstExprIndexName * expr = node - > as < AstExprIndexName > ( ) )
{
LValue result = { LValue : : Kind_IndexName } ;
result . reg = compileExprAuto ( expr - > expr , rs ) ;
result . name = sref ( expr - > index ) ;
result . location = node - > location ;
return result ;
}
else if ( AstExprIndexExpr * expr = node - > as < AstExprIndexExpr > ( ) )
{
2022-01-27 21:29:34 +00:00
uint8_t reg = compileExprAuto ( expr - > expr , rs ) ;
2021-10-29 21:25:12 +01:00
2022-01-27 21:29:34 +00:00
return compileLValueIndex ( reg , expr - > index , rs ) ;
2021-10-29 21:25:12 +01:00
}
else
{
LUAU_ASSERT ( ! " Unknown assignment expression " ) ;
return LValue ( ) ;
}
}
void compileLValueUse ( const LValue & lv , uint8_t reg , bool set )
{
2022-02-11 18:43:14 +00:00
setDebugLine ( lv . location ) ;
2022-01-27 21:29:34 +00:00
2021-10-29 21:25:12 +01:00
switch ( lv . kind )
{
case LValue : : Kind_Local :
if ( set )
bytecode . emitABC ( LOP_MOVE , lv . reg , reg , 0 ) ;
else
bytecode . emitABC ( LOP_MOVE , reg , lv . reg , 0 ) ;
break ;
case LValue : : Kind_Upvalue :
bytecode . emitABC ( set ? LOP_SETUPVAL : LOP_GETUPVAL , reg , lv . upval , 0 ) ;
break ;
case LValue : : Kind_Global :
{
int32_t cid = bytecode . addConstantString ( lv . name ) ;
if ( cid < 0 )
CompileError : : raise ( lv . location , " Exceeded constant limit; simplify the code to compile " ) ;
bytecode . emitABC ( set ? LOP_SETGLOBAL : LOP_GETGLOBAL , reg , 0 , uint8_t ( BytecodeBuilder : : getStringHash ( lv . name ) ) ) ;
bytecode . emitAux ( cid ) ;
}
break ;
case LValue : : Kind_IndexName :
{
int32_t cid = bytecode . addConstantString ( lv . name ) ;
if ( cid < 0 )
CompileError : : raise ( lv . location , " Exceeded constant limit; simplify the code to compile " ) ;
bytecode . emitABC ( set ? LOP_SETTABLEKS : LOP_GETTABLEKS , reg , lv . reg , uint8_t ( BytecodeBuilder : : getStringHash ( lv . name ) ) ) ;
bytecode . emitAux ( cid ) ;
}
break ;
case LValue : : Kind_IndexNumber :
bytecode . emitABC ( set ? LOP_SETTABLEN : LOP_GETTABLEN , reg , lv . reg , lv . number ) ;
break ;
case LValue : : Kind_IndexExpr :
bytecode . emitABC ( set ? LOP_SETTABLE : LOP_GETTABLE , reg , lv . reg , lv . index ) ;
break ;
default :
LUAU_ASSERT ( ! " Unknown lvalue kind " ) ;
}
}
void compileAssign ( const LValue & lv , uint8_t source )
{
compileLValueUse ( lv , source , /* set= */ true ) ;
}
2022-07-21 21:36:41 +01:00
AstExprLocal * getExprLocal ( AstExpr * node )
2021-10-29 21:25:12 +01:00
{
2022-05-20 00:46:52 +01:00
if ( AstExprLocal * expr = node - > as < AstExprLocal > ( ) )
2022-07-21 21:36:41 +01:00
return expr ;
else if ( AstExprGroup * expr = node - > as < AstExprGroup > ( ) )
return getExprLocal ( expr - > expr ) ;
else if ( AstExprTypeAssertion * expr = node - > as < AstExprTypeAssertion > ( ) )
return getExprLocal ( expr - > expr ) ;
else
return nullptr ;
}
int getExprLocalReg ( AstExpr * node )
{
if ( AstExprLocal * expr = getExprLocal ( node ) )
2022-05-20 00:46:52 +01:00
{
// note: this can't check expr->upvalue because upvalues may be upgraded to locals during inlining
Local * l = locals . find ( expr - > local ) ;
2021-10-29 21:25:12 +01:00
2022-05-20 00:46:52 +01:00
return l & & l - > allocated ? l - > reg : - 1 ;
}
else
return - 1 ;
2021-10-29 21:25:12 +01:00
}
bool isStatBreak ( AstStat * node )
{
if ( AstStatBlock * stat = node - > as < AstStatBlock > ( ) )
return stat - > body . size = = 1 & & stat - > body . data [ 0 ] - > is < AstStatBreak > ( ) ;
return node - > is < AstStatBreak > ( ) ;
}
AstStatContinue * extractStatContinue ( AstStatBlock * block )
{
if ( block - > body . size = = 1 )
return block - > body . data [ 0 ] - > as < AstStatContinue > ( ) ;
else
return nullptr ;
}
void compileStatIf ( AstStatIf * stat )
{
// Optimization: condition is always false => we only need the else body
if ( isConstantFalse ( stat - > condition ) )
{
if ( stat - > elsebody )
compileStat ( stat - > elsebody ) ;
return ;
}
// Optimization: body is a "break" statement with no "else" => we can directly break out of the loop in "then" case
if ( ! stat - > elsebody & & isStatBreak ( stat - > thenbody ) & & ! areLocalsCaptured ( loops . back ( ) . localOffset ) )
{
// fallthrough = continue with the loop as usual
std : : vector < size_t > elseJump ;
compileConditionValue ( stat - > condition , nullptr , elseJump , true ) ;
for ( size_t jump : elseJump )
loopJumps . push_back ( { LoopJump : : Break , jump } ) ;
return ;
}
2023-10-13 20:38:31 +01:00
AstStatContinue * continueStatement = extractStatContinue ( stat - > thenbody ) ;
2021-10-29 21:25:12 +01:00
// Optimization: body is a "continue" statement with no "else" => we can directly continue in "then" case
2023-10-06 18:31:16 +01:00
if ( ! stat - > elsebody & & continueStatement ! = nullptr & & ! areLocalsCaptured ( loops . back ( ) . localOffsetContinue ) )
2021-10-29 21:25:12 +01:00
{
2023-11-03 19:47:28 +00:00
// track continue statement for repeat..until validation (validateContinueUntil)
if ( ! loops . back ( ) . continueUsed )
loops . back ( ) . continueUsed = continueStatement ;
2021-10-29 21:25:12 +01:00
// fallthrough = proceed with the loop body as usual
std : : vector < size_t > elseJump ;
compileConditionValue ( stat - > condition , nullptr , elseJump , true ) ;
for ( size_t jump : elseJump )
loopJumps . push_back ( { LoopJump : : Continue , jump } ) ;
return ;
}
std : : vector < size_t > elseJump ;
compileConditionValue ( stat - > condition , nullptr , elseJump , false ) ;
compileStat ( stat - > thenbody ) ;
if ( stat - > elsebody & & elseJump . size ( ) > 0 )
{
2023-02-24 18:24:22 +00:00
// we don't need to skip past "else" body if "then" ends with return/break/continue
2021-10-29 21:25:12 +01:00
// this is important because, if "else" also ends with return, we may *not* have any statement to skip to!
2023-02-24 18:24:22 +00:00
if ( alwaysTerminates ( stat - > thenbody ) )
2021-10-29 21:25:12 +01:00
{
size_t elseLabel = bytecode . emitLabel ( ) ;
compileStat ( stat - > elsebody ) ;
patchJumps ( stat , elseJump , elseLabel ) ;
}
else
{
size_t thenLabel = bytecode . emitLabel ( ) ;
bytecode . emitAD ( LOP_JUMP , 0 , 0 ) ;
size_t elseLabel = bytecode . emitLabel ( ) ;
compileStat ( stat - > elsebody ) ;
size_t endLabel = bytecode . emitLabel ( ) ;
patchJumps ( stat , elseJump , elseLabel ) ;
patchJump ( stat , thenLabel , endLabel ) ;
}
}
else
{
size_t endLabel = bytecode . emitLabel ( ) ;
patchJumps ( stat , elseJump , endLabel ) ;
}
}
void compileStatWhile ( AstStatWhile * stat )
{
// Optimization: condition is always false => there's no loop!
if ( isConstantFalse ( stat - > condition ) )
return ;
size_t oldJumps = loopJumps . size ( ) ;
size_t oldLocals = localStack . size ( ) ;
2023-11-03 19:47:28 +00:00
loops . push_back ( { oldLocals , oldLocals , nullptr } ) ;
2023-10-06 18:31:16 +01:00
hasLoops = true ;
2021-10-29 21:25:12 +01:00
size_t loopLabel = bytecode . emitLabel ( ) ;
std : : vector < size_t > elseJump ;
compileConditionValue ( stat - > condition , nullptr , elseJump , false ) ;
compileStat ( stat - > body ) ;
size_t contLabel = bytecode . emitLabel ( ) ;
size_t backLabel = bytecode . emitLabel ( ) ;
setDebugLine ( stat - > condition ) ;
// Note: this is using JUMPBACK, not JUMP, since JUMPBACK is interruptible and we want all loops to have at least one interruptible
// instruction
bytecode . emitAD ( LOP_JUMPBACK , 0 , 0 ) ;
size_t endLabel = bytecode . emitLabel ( ) ;
patchJump ( stat , backLabel , loopLabel ) ;
patchJumps ( stat , elseJump , endLabel ) ;
patchLoopJumps ( stat , oldJumps , endLabel , contLabel ) ;
loopJumps . resize ( oldJumps ) ;
loops . pop_back ( ) ;
}
void compileStatRepeat ( AstStatRepeat * stat )
{
size_t oldJumps = loopJumps . size ( ) ;
size_t oldLocals = localStack . size ( ) ;
2023-11-03 19:47:28 +00:00
loops . push_back ( { oldLocals , oldLocals , nullptr } ) ;
2023-10-06 18:31:16 +01:00
hasLoops = true ;
2021-10-29 21:25:12 +01:00
size_t loopLabel = bytecode . emitLabel ( ) ;
// note: we "inline" compileStatBlock here so that we can close/pop locals after evaluating condition
// this is necessary because condition can access locals declared inside the repeat..until body
AstStatBlock * body = stat - > body ;
RegScope rs ( this ) ;
2023-10-13 20:38:31 +01:00
bool continueValidated = false ;
2021-10-29 21:25:12 +01:00
for ( size_t i = 0 ; i < body - > body . size ; + + i )
2023-10-06 18:31:16 +01:00
{
2021-10-29 21:25:12 +01:00
compileStat ( body - > body . data [ i ] ) ;
2023-10-06 18:31:16 +01:00
// continue statement inside the repeat..until loop should not close upvalues defined directly in the loop body
// (but it must still close upvalues defined in more nested blocks)
// this is because the upvalues defined inside the loop body may be captured by a closure defined in the until
// expression that continue will jump to.
2023-10-27 20:33:36 +01:00
loops . back ( ) . localOffsetContinue = localStack . size ( ) ;
2023-10-13 20:38:31 +01:00
// if continue was called from this statement, then any local defined after this in the loop body should not be accessed by until condition
// it is sufficient to check this condition once, as if this holds for the first continue, it must hold for all subsequent continues.
2023-11-03 19:47:28 +00:00
if ( loops . back ( ) . continueUsed & & ! continueValidated )
2023-10-13 20:38:31 +01:00
{
validateContinueUntil ( loops . back ( ) . continueUsed , stat - > condition , body , i + 1 ) ;
continueValidated = true ;
}
2023-10-06 18:31:16 +01:00
}
2021-10-29 21:25:12 +01:00
size_t contLabel = bytecode . emitLabel ( ) ;
size_t endLabel ;
setDebugLine ( stat - > condition ) ;
if ( isConstantTrue ( stat - > condition ) )
{
closeLocals ( oldLocals ) ;
endLabel = bytecode . emitLabel ( ) ;
}
else
{
std : : vector < size_t > skipJump ;
compileConditionValue ( stat - > condition , nullptr , skipJump , true ) ;
// we close locals *after* we compute loop conditionals because during computation of condition it's (in theory) possible that user code
// mutates them
closeLocals ( oldLocals ) ;
size_t backLabel = bytecode . emitLabel ( ) ;
// Note: this is using JUMPBACK, not JUMP, since JUMPBACK is interruptible and we want all loops to have at least one interruptible
// instruction
bytecode . emitAD ( LOP_JUMPBACK , 0 , 0 ) ;
size_t skipLabel = bytecode . emitLabel ( ) ;
// we need to close locals *again* after the loop ends because the first closeLocals would be jumped over on the last iteration
closeLocals ( oldLocals ) ;
endLabel = bytecode . emitLabel ( ) ;
patchJump ( stat , backLabel , loopLabel ) ;
patchJumps ( stat , skipJump , skipLabel ) ;
}
popLocals ( oldLocals ) ;
patchLoopJumps ( stat , oldJumps , endLabel , contLabel ) ;
loopJumps . resize ( oldJumps ) ;
loops . pop_back ( ) ;
}
2022-05-06 00:52:48 +01:00
void compileInlineReturn ( AstStatReturn * stat , bool fallthrough )
{
setDebugLine ( stat ) ; // normally compileStat sets up line info, but compileInlineReturn can be called directly
InlineFrame frame = inlineFrames . back ( ) ;
compileExprListTemp ( stat - > list , frame . target , frame . targetCount , /* targetTop= */ false ) ;
2022-06-17 01:54:42 +01:00
closeLocals ( frame . localOffset ) ;
2022-05-06 00:52:48 +01:00
if ( ! fallthrough )
{
size_t jumpLabel = bytecode . emitLabel ( ) ;
bytecode . emitAD ( LOP_JUMP , 0 , 0 ) ;
inlineFrames . back ( ) . returnJumps . push_back ( jumpLabel ) ;
}
}
2021-10-29 21:25:12 +01:00
void compileStatReturn ( AstStatReturn * stat )
{
RegScope rs ( this ) ;
uint8_t temp = 0 ;
2022-05-13 20:16:50 +01:00
bool consecutive = false ;
2021-10-29 21:25:12 +01:00
bool multRet = false ;
2022-05-13 20:16:50 +01:00
// Optimization: return locals directly instead of copying them into a temporary
// this is very important for a single return value and occasionally effective for multiple values
2022-05-20 00:46:52 +01:00
if ( int reg = stat - > list . size > 0 ? getExprLocalReg ( stat - > list . data [ 0 ] ) : - 1 ; reg > = 0 )
2021-10-29 21:25:12 +01:00
{
2022-05-20 00:46:52 +01:00
temp = uint8_t ( reg ) ;
2022-05-13 20:16:50 +01:00
consecutive = true ;
2021-10-29 21:25:12 +01:00
2022-05-13 20:16:50 +01:00
for ( size_t i = 1 ; i < stat - > list . size ; + + i )
2022-05-20 00:46:52 +01:00
if ( getExprLocalReg ( stat - > list . data [ i ] ) ! = int ( temp + i ) )
2022-05-13 20:16:50 +01:00
{
consecutive = false ;
break ;
}
2021-10-29 21:25:12 +01:00
}
2022-05-13 20:16:50 +01:00
if ( ! consecutive & & stat - > list . size > 0 )
2021-10-29 21:25:12 +01:00
{
temp = allocReg ( stat , unsigned ( stat - > list . size ) ) ;
// Note: if the last element is a function call or a vararg specifier, then we need to somehow return all values that that call returned
for ( size_t i = 0 ; i < stat - > list . size ; + + i )
if ( i + 1 = = stat - > list . size )
multRet = compileExprTempMultRet ( stat - > list . data [ i ] , uint8_t ( temp + i ) ) ;
else
compileExprTempTop ( stat - > list . data [ i ] , uint8_t ( temp + i ) ) ;
}
closeLocals ( 0 ) ;
bytecode . emitABC ( LOP_RETURN , uint8_t ( temp ) , multRet ? 0 : uint8_t ( stat - > list . size + 1 ) , 0 ) ;
}
bool areLocalsRedundant ( AstStatLocal * stat )
{
// Extra expressions may have side effects
if ( stat - > values . size > stat - > vars . size )
return false ;
for ( AstLocal * local : stat - > vars )
{
2022-01-14 16:06:31 +00:00
Variable * v = variables . find ( local ) ;
2021-10-29 21:25:12 +01:00
2022-01-14 16:06:31 +00:00
if ( ! v | | ! v - > constant )
2021-10-29 21:25:12 +01:00
return false ;
}
return true ;
}
void compileStatLocal ( AstStatLocal * stat )
{
// Optimization: we don't need to allocate and assign const locals, since their uses will be constant-folded
if ( options . optimizationLevel > = 1 & & options . debugLevel < = 1 & & areLocalsRedundant ( stat ) )
return ;
2022-07-21 21:36:41 +01:00
// Optimization: for 1-1 local assignments, we can reuse the register *if* neither local is mutated
2022-08-18 22:04:33 +01:00
if ( options . optimizationLevel > = 1 & & stat - > vars . size = = 1 & & stat - > values . size = = 1 )
2022-07-21 21:36:41 +01:00
{
if ( AstExprLocal * re = getExprLocal ( stat - > values . data [ 0 ] ) )
{
Variable * lv = variables . find ( stat - > vars . data [ 0 ] ) ;
Variable * rv = variables . find ( re - > local ) ;
if ( int reg = getExprLocalReg ( re ) ; reg > = 0 & & ( ! lv | | ! lv - > written ) & & ( ! rv | | ! rv - > written ) )
{
pushLocal ( stat - > vars . data [ 0 ] , uint8_t ( reg ) ) ;
return ;
}
}
}
2021-10-29 21:25:12 +01:00
// note: allocReg in this case allocates into parent block register - note that we don't have RegScope here
uint8_t vars = allocReg ( stat , unsigned ( stat - > vars . size ) ) ;
2022-05-06 00:52:48 +01:00
compileExprListTemp ( stat - > values , vars , uint8_t ( stat - > vars . size ) , /* targetTop= */ true ) ;
2021-10-29 21:25:12 +01:00
for ( size_t i = 0 ; i < stat - > vars . size ; + + i )
pushLocal ( stat - > vars . data [ i ] , uint8_t ( vars + i ) ) ;
}
2022-04-21 22:04:22 +01:00
bool tryCompileUnrolledFor ( AstStatFor * stat , int thresholdBase , int thresholdMaxBoost )
{
2022-05-26 21:33:48 +01:00
Constant one = { Constant : : Type_Number } ;
one . valueNumber = 1.0 ;
Constant fromc = getConstant ( stat - > from ) ;
Constant toc = getConstant ( stat - > to ) ;
Constant stepc = stat - > step ? getConstant ( stat - > step ) : one ;
2022-04-21 22:04:22 +01:00
2022-05-26 21:33:48 +01:00
int tripCount = ( fromc . type = = Constant : : Type_Number & & toc . type = = Constant : : Type_Number & & stepc . type = = Constant : : Type_Number )
? getTripCount ( fromc . valueNumber , toc . valueNumber , stepc . valueNumber )
: - 1 ;
if ( tripCount < 0 )
2022-04-21 22:04:22 +01:00
{
bytecode . addDebugRemark ( " loop unroll failed: invalid iteration count " ) ;
return false ;
}
2022-05-26 21:33:48 +01:00
if ( tripCount > thresholdBase )
2022-04-21 22:04:22 +01:00
{
2022-05-26 21:33:48 +01:00
bytecode . addDebugRemark ( " loop unroll failed: too many iterations (%d) " , tripCount ) ;
2022-04-21 22:04:22 +01:00
return false ;
}
2022-05-26 21:33:48 +01:00
if ( Variable * lv = variables . find ( stat - > var ) ; lv & & lv - > written )
2022-04-21 22:04:22 +01:00
{
2022-05-26 21:33:48 +01:00
bytecode . addDebugRemark ( " loop unroll failed: mutable loop variable " ) ;
2022-04-21 22:04:22 +01:00
return false ;
}
AstLocal * var = stat - > var ;
2022-07-14 23:39:35 +01:00
uint64_t costModel = modelCost ( stat - > body , & var , 1 , builtins ) ;
2022-04-21 22:04:22 +01:00
// we use a dynamic cost threshold that's based on the fixed limit boosted by the cost advantage we gain due to unrolling
bool varc = true ;
int unrolledCost = computeCost ( costModel , & varc , 1 ) * tripCount ;
int baselineCost = ( computeCost ( costModel , nullptr , 0 ) + 1 ) * tripCount ;
int unrollProfit = ( unrolledCost = = 0 ) ? thresholdMaxBoost : std : : min ( thresholdMaxBoost , 100 * baselineCost / unrolledCost ) ;
int threshold = thresholdBase * unrollProfit / 100 ;
if ( unrolledCost > threshold )
{
bytecode . addDebugRemark (
" loop unroll failed: too expensive (iterations %d, cost %d, profit %.2fx) " , tripCount , unrolledCost , double ( unrollProfit ) / 100 ) ;
return false ;
}
bytecode . addDebugRemark ( " loop unroll succeeded (iterations %d, cost %d, profit %.2fx) " , tripCount , unrolledCost , double ( unrollProfit ) / 100 ) ;
2022-05-26 21:33:48 +01:00
compileUnrolledFor ( stat , tripCount , fromc . valueNumber , stepc . valueNumber ) ;
return true ;
}
void compileUnrolledFor ( AstStatFor * stat , int tripCount , double from , double step )
{
AstLocal * var = stat - > var ;
size_t oldLocals = localStack . size ( ) ;
size_t oldJumps = loopJumps . size ( ) ;
2023-11-03 19:47:28 +00:00
loops . push_back ( { oldLocals , oldLocals , nullptr } ) ;
2022-05-26 21:33:48 +01:00
for ( int iv = 0 ; iv < tripCount ; + + iv )
2022-04-21 22:04:22 +01:00
{
// we need to re-fold constants in the loop body with the new value; this reuses computed constant values elsewhere in the tree
locstants [ var ] . type = Constant : : Type_Number ;
2022-05-26 21:33:48 +01:00
locstants [ var ] . valueNumber = from + iv * step ;
2022-04-21 22:04:22 +01:00
2023-08-04 18:01:35 +01:00
foldConstants ( constants , variables , locstants , builtinsFold , builtinsFoldMathK , stat ) ;
2022-04-21 22:04:22 +01:00
2022-05-26 21:33:48 +01:00
size_t iterJumps = loopJumps . size ( ) ;
2022-04-21 22:04:22 +01:00
compileStat ( stat - > body ) ;
2022-05-26 21:33:48 +01:00
// all continue jumps need to go to the next iteration
size_t contLabel = bytecode . emitLabel ( ) ;
for ( size_t i = iterJumps ; i < loopJumps . size ( ) ; + + i )
if ( loopJumps [ i ] . type = = LoopJump : : Continue )
patchJump ( stat , loopJumps [ i ] . label , contLabel ) ;
2022-04-21 22:04:22 +01:00
}
2022-05-26 21:33:48 +01:00
// all break jumps need to go past the loop
size_t endLabel = bytecode . emitLabel ( ) ;
for ( size_t i = oldJumps ; i < loopJumps . size ( ) ; + + i )
if ( loopJumps [ i ] . type = = LoopJump : : Break )
patchJump ( stat , loopJumps [ i ] . label , endLabel ) ;
loopJumps . resize ( oldJumps ) ;
loops . pop_back ( ) ;
2022-05-06 00:52:48 +01:00
// clean up fold state in case we need to recompile - normally we compile the loop body once, but due to inlining we may need to do it again
locstants [ var ] . type = Constant : : Type_Unknown ;
2023-08-04 18:01:35 +01:00
foldConstants ( constants , variables , locstants , builtinsFold , builtinsFoldMathK , stat ) ;
2022-04-21 22:04:22 +01:00
}
2021-10-29 21:25:12 +01:00
void compileStatFor ( AstStatFor * stat )
{
RegScope rs ( this ) ;
2022-04-21 22:04:22 +01:00
// Optimization: small loops can be unrolled when it is profitable
if ( options . optimizationLevel > = 2 & & isConstant ( stat - > to ) & & isConstant ( stat - > from ) & & ( ! stat - > step | | isConstant ( stat - > step ) ) )
if ( tryCompileUnrolledFor ( stat , FInt : : LuauCompileLoopUnrollThreshold , FInt : : LuauCompileLoopUnrollThresholdMaxBoost ) )
return ;
2021-10-29 21:25:12 +01:00
size_t oldLocals = localStack . size ( ) ;
size_t oldJumps = loopJumps . size ( ) ;
2023-11-03 19:47:28 +00:00
loops . push_back ( { oldLocals , oldLocals , nullptr } ) ;
2023-10-06 18:31:16 +01:00
hasLoops = true ;
2021-10-29 21:25:12 +01:00
// register layout: limit, step, index
uint8_t regs = allocReg ( stat , 3 ) ;
// if the iteration index is assigned from within the loop, we need to protect the internal index from the assignment
// to do that, we will copy the index into an actual local variable on each iteration
// this makes sure the code inside the loop can't interfere with the iteration process (other than modifying the table we're iterating
// through)
uint8_t varreg = regs + 2 ;
2022-01-14 16:06:31 +00:00
if ( Variable * il = variables . find ( stat - > var ) ; il & & il - > written )
2021-10-29 21:25:12 +01:00
varreg = allocReg ( stat , 1 ) ;
compileExprTemp ( stat - > from , uint8_t ( regs + 2 ) ) ;
compileExprTemp ( stat - > to , uint8_t ( regs + 0 ) ) ;
if ( stat - > step )
compileExprTemp ( stat - > step , uint8_t ( regs + 1 ) ) ;
else
bytecode . emitABC ( LOP_LOADN , uint8_t ( regs + 1 ) , 1 , 0 ) ;
size_t forLabel = bytecode . emitLabel ( ) ;
bytecode . emitAD ( LOP_FORNPREP , regs , 0 ) ;
size_t loopLabel = bytecode . emitLabel ( ) ;
if ( varreg ! = regs + 2 )
bytecode . emitABC ( LOP_MOVE , varreg , regs + 2 , 0 ) ;
pushLocal ( stat - > var , varreg ) ;
compileStat ( stat - > body ) ;
closeLocals ( oldLocals ) ;
popLocals ( oldLocals ) ;
setDebugLine ( stat ) ;
size_t contLabel = bytecode . emitLabel ( ) ;
size_t backLabel = bytecode . emitLabel ( ) ;
bytecode . emitAD ( LOP_FORNLOOP , regs , 0 ) ;
size_t endLabel = bytecode . emitLabel ( ) ;
patchJump ( stat , forLabel , endLabel ) ;
patchJump ( stat , backLabel , loopLabel ) ;
patchLoopJumps ( stat , oldJumps , endLabel , contLabel ) ;
loopJumps . resize ( oldJumps ) ;
loops . pop_back ( ) ;
}
void compileStatForIn ( AstStatForIn * stat )
{
RegScope rs ( this ) ;
size_t oldLocals = localStack . size ( ) ;
size_t oldJumps = loopJumps . size ( ) ;
2023-11-03 19:47:28 +00:00
loops . push_back ( { oldLocals , oldLocals , nullptr } ) ;
2023-10-06 18:31:16 +01:00
hasLoops = true ;
2021-10-29 21:25:12 +01:00
// register layout: generator, state, index, variables...
uint8_t regs = allocReg ( stat , 3 ) ;
// this puts initial values of (generator, state, index) into the loop registers
2022-05-06 00:52:48 +01:00
compileExprListTemp ( stat - > values , regs , 3 , /* targetTop= */ true ) ;
2021-10-29 21:25:12 +01:00
// note that we reserve at least 2 variables; this allows our fast path to assume that we need 2 variables instead of 1 or 2
uint8_t vars = allocReg ( stat , std : : max ( unsigned ( stat - > vars . size ) , 2u ) ) ;
LUAU_ASSERT ( vars = = regs + 3 ) ;
2022-06-17 01:52:23 +01:00
LuauOpcode skipOp = LOP_FORGPREP ;
2021-10-29 21:25:12 +01:00
2022-06-17 01:52:23 +01:00
// Optimization: when we iterate via pairs/ipairs, we generate special bytecode that optimizes the traversal using internal iteration index
// These instructions dynamically check if generator is equal to next/inext and bail out
// They assume that the generator produces 2 variables, which is why we allocate at least 2 above (see vars assignment)
2021-10-29 21:25:12 +01:00
if ( options . optimizationLevel > = 1 & & stat - > vars . size < = 2 )
{
if ( stat - > values . size = = 1 & & stat - > values . data [ 0 ] - > is < AstExprCall > ( ) )
{
2022-01-14 16:06:31 +00:00
Builtin builtin = getBuiltin ( stat - > values . data [ 0 ] - > as < AstExprCall > ( ) - > func , globals , variables ) ;
2021-10-29 21:25:12 +01:00
if ( builtin . isGlobal ( " ipairs " ) ) // for .. in ipairs(t)
skipOp = LOP_FORGPREP_INEXT ;
else if ( builtin . isGlobal ( " pairs " ) ) // for .. in pairs(t)
skipOp = LOP_FORGPREP_NEXT ;
}
else if ( stat - > values . size = = 2 )
{
2022-01-14 16:06:31 +00:00
Builtin builtin = getBuiltin ( stat - > values . data [ 0 ] , globals , variables ) ;
2021-10-29 21:25:12 +01:00
if ( builtin . isGlobal ( " next " ) ) // for .. in next,t
skipOp = LOP_FORGPREP_NEXT ;
}
}
// first iteration jumps into FORGLOOP instruction, but for ipairs/pairs it does extra preparation that makes the cost of an extra instruction
// worthwhile
size_t skipLabel = bytecode . emitLabel ( ) ;
bytecode . emitAD ( skipOp , regs , 0 ) ;
size_t loopLabel = bytecode . emitLabel ( ) ;
for ( size_t i = 0 ; i < stat - > vars . size ; + + i )
pushLocal ( stat - > vars . data [ i ] , uint8_t ( vars + i ) ) ;
compileStat ( stat - > body ) ;
closeLocals ( oldLocals ) ;
popLocals ( oldLocals ) ;
setDebugLine ( stat ) ;
size_t contLabel = bytecode . emitLabel ( ) ;
size_t backLabel = bytecode . emitLabel ( ) ;
2022-08-18 22:04:33 +01:00
// FORGLOOP uses aux to encode variable count and fast path flag for ipairs traversal in the high bit
bytecode . emitAD ( LOP_FORGLOOP , regs , 0 ) ;
bytecode . emitAux ( ( skipOp = = LOP_FORGPREP_INEXT ? 0x80000000 : 0 ) | uint32_t ( stat - > vars . size ) ) ;
2021-10-29 21:25:12 +01:00
size_t endLabel = bytecode . emitLabel ( ) ;
patchJump ( stat , skipLabel , backLabel ) ;
patchJump ( stat , backLabel , loopLabel ) ;
patchLoopJumps ( stat , oldJumps , endLabel , contLabel ) ;
loopJumps . resize ( oldJumps ) ;
loops . pop_back ( ) ;
}
2022-08-11 21:42:54 +01:00
struct Assignment
{
LValue lvalue ;
uint8_t conflictReg = kInvalidReg ;
uint8_t valueReg = kInvalidReg ;
} ;
2022-08-25 21:55:08 +01:00
// This function analyzes assignments and marks assignment conflicts: cases when a variable is assigned on lhs
// but subsequently used on the rhs, assuming assignments are performed in order. Note that it's also possible
// for a variable to conflict on the lhs, if it's used in an lvalue expression after it's assigned.
// When conflicts are found, Assignment::conflictReg is allocated and that's where assignment is performed instead,
// until the final fixup in compileStatAssign. Assignment::valueReg is allocated by compileStatAssign as well.
//
// Per Lua manual, section 3.3.3 (Assignments), the proper assignment order is only guaranteed to hold for syntactic access:
//
// Note that this guarantee covers only accesses syntactically inside the assignment statement. If a function or a metamethod called
// during the assignment changes the value of a variable, Lua gives no guarantees about the order of that access.
//
// As such, we currently don't check if an assigned local is captured, which may mean it gets reassigned during a function call.
2022-08-11 21:42:54 +01:00
void resolveAssignConflicts ( AstStat * stat , std : : vector < Assignment > & vars , const AstArray < AstExpr * > & values )
{
struct Visitor : AstVisitor
{
Compiler * self ;
std : : bitset < 256 > conflict ;
std : : bitset < 256 > assigned ;
Visitor ( Compiler * self )
: self ( self )
{
}
bool visit ( AstExprLocal * node ) override
{
int reg = self - > getLocalReg ( node - > local ) ;
if ( reg > = 0 & & assigned [ reg ] )
conflict [ reg ] = true ;
return true ;
}
} ;
Visitor visitor ( this ) ;
2023-02-03 12:34:12 +00:00
// mark any registers that are used *after* assignment as conflicting
2022-12-02 10:46:05 +00:00
2023-02-03 12:34:12 +00:00
// first we go through assignments to locals, since they are performed before assignments to other l-values
for ( size_t i = 0 ; i < vars . size ( ) ; + + i )
{
const LValue & li = vars [ i ] . lvalue ;
2022-12-02 10:46:05 +00:00
2023-02-03 12:34:12 +00:00
if ( li . kind = = LValue : : Kind_Local )
2022-12-02 10:46:05 +00:00
{
2023-02-03 12:34:12 +00:00
if ( i < values . size )
2022-12-02 10:46:05 +00:00
values . data [ i ] - > visit ( & visitor ) ;
2023-02-03 12:34:12 +00:00
visitor . assigned [ li . reg ] = true ;
2022-12-02 10:46:05 +00:00
}
}
2023-02-03 12:34:12 +00:00
// and now we handle all other l-values
for ( size_t i = 0 ; i < vars . size ( ) ; + + i )
{
const LValue & li = vars [ i ] . lvalue ;
2022-12-02 10:46:05 +00:00
2023-02-03 12:34:12 +00:00
if ( li . kind ! = LValue : : Kind_Local & & i < values . size )
values . data [ i ] - > visit ( & visitor ) ;
2022-08-11 21:42:54 +01:00
}
// mark any registers used in trailing expressions as conflicting as well
for ( size_t i = vars . size ( ) ; i < values . size ; + + i )
values . data [ i ] - > visit ( & visitor ) ;
// mark any registers used on left hand side that are also assigned anywhere as conflicting
// this is order-independent because we evaluate all right hand side arguments into registers before doing table assignments
for ( const Assignment & var : vars )
{
const LValue & li = var . lvalue ;
if ( ( li . kind = = LValue : : Kind_IndexName | | li . kind = = LValue : : Kind_IndexNumber | | li . kind = = LValue : : Kind_IndexExpr ) & &
visitor . assigned [ li . reg ] )
visitor . conflict [ li . reg ] = true ;
if ( li . kind = = LValue : : Kind_IndexExpr & & visitor . assigned [ li . index ] )
visitor . conflict [ li . index ] = true ;
}
// for any conflicting var, we need to allocate a temporary register where the assignment is performed, so that we can move the value later
for ( Assignment & var : vars )
{
const LValue & li = var . lvalue ;
if ( li . kind = = LValue : : Kind_Local & & visitor . conflict [ li . reg ] )
var . conflictReg = allocReg ( stat , 1 ) ;
}
}
2021-10-29 21:25:12 +01:00
void compileStatAssign ( AstStatAssign * stat )
{
RegScope rs ( this ) ;
2022-08-11 21:42:54 +01:00
// Optimization: one to one assignments don't require complex conflict resolution machinery
2021-10-29 21:25:12 +01:00
if ( stat - > vars . size = = 1 & & stat - > values . size = = 1 )
{
LValue var = compileLValue ( stat - > vars . data [ 0 ] , rs ) ;
// Optimization: assign to locals directly
if ( var . kind = = LValue : : Kind_Local )
{
compileExpr ( stat - > values . data [ 0 ] , var . reg ) ;
}
else
{
uint8_t reg = compileExprAuto ( stat - > values . data [ 0 ] , rs ) ;
setDebugLine ( stat - > vars . data [ 0 ] ) ;
compileAssign ( var , reg ) ;
}
return ;
}
2022-09-02 00:00:14 +01:00
// compute all l-values: note that this doesn't assign anything yet but it allocates registers and computes complex expressions on the
// left hand side - for example, in "a[expr] = foo" expr will get evaluated here
std : : vector < Assignment > vars ( stat - > vars . size ) ;
for ( size_t i = 0 ; i < stat - > vars . size ; + + i )
vars [ i ] . lvalue = compileLValue ( stat - > vars . data [ i ] , rs ) ;
// perform conflict resolution: if any expression refers to a local that is assigned before evaluating it, we assign to a temporary
// register after this, vars[i].conflictReg is set for locals that need to be assigned in the second pass
resolveAssignConflicts ( stat , vars , stat - > values ) ;
// compute rhs into (mostly) fresh registers
// note that when the lhs assigment is a local, we evaluate directly into that register
// this is possible because resolveAssignConflicts renamed conflicting locals into temporaries
// after this, vars[i].valueReg is set to a register with the value for *all* vars, but some have already been assigned
for ( size_t i = 0 ; i < stat - > vars . size & & i < stat - > values . size ; + + i )
2022-08-11 21:42:54 +01:00
{
2022-09-02 00:00:14 +01:00
AstExpr * value = stat - > values . data [ i ] ;
2021-10-29 21:25:12 +01:00
2022-09-02 00:00:14 +01:00
if ( i + 1 = = stat - > values . size & & stat - > vars . size > stat - > values . size )
{
// allocate a consecutive range of regs for all remaining vars and compute everything into temps
// note, this also handles trailing nils
uint8_t rest = uint8_t ( stat - > vars . size - stat - > values . size + 1 ) ;
uint8_t temp = allocReg ( stat , rest ) ;
2021-10-29 21:25:12 +01:00
2022-09-02 00:00:14 +01:00
compileExprTempN ( value , temp , rest , /* targetTop= */ true ) ;
2021-10-29 21:25:12 +01:00
2022-09-02 00:00:14 +01:00
for ( size_t j = i ; j < stat - > vars . size ; + + j )
vars [ j ] . valueReg = uint8_t ( temp + ( j - i ) ) ;
}
else
2022-08-11 21:42:54 +01:00
{
2022-09-02 00:00:14 +01:00
Assignment & var = vars [ i ] ;
2021-10-29 21:25:12 +01:00
2022-09-02 00:00:14 +01:00
// if target is a local, use compileExpr directly to target
if ( var . lvalue . kind = = LValue : : Kind_Local )
2022-08-11 21:42:54 +01:00
{
2022-09-02 00:00:14 +01:00
var . valueReg = ( var . conflictReg = = kInvalidReg ) ? var . lvalue . reg : var . conflictReg ;
2022-08-11 21:42:54 +01:00
2022-09-02 00:00:14 +01:00
compileExpr ( stat - > values . data [ i ] , var . valueReg ) ;
2022-08-11 21:42:54 +01:00
}
else
{
2022-09-02 00:00:14 +01:00
var . valueReg = compileExprAuto ( stat - > values . data [ i ] , rs ) ;
2022-08-11 21:42:54 +01:00
}
}
2022-09-02 00:00:14 +01:00
}
2022-08-11 21:42:54 +01:00
2023-07-28 12:37:00 +01:00
// compute expressions with side effects
2022-09-02 00:00:14 +01:00
for ( size_t i = stat - > vars . size ; i < stat - > values . size ; + + i )
{
RegScope rsi ( this ) ;
compileExprAuto ( stat - > values . data [ i ] , rsi ) ;
}
2022-08-11 21:42:54 +01:00
2022-09-02 00:00:14 +01:00
// almost done... let's assign everything left to right, noting that locals were either written-to directly, or will be written-to in a
// separate pass to avoid conflicts
for ( const Assignment & var : vars )
{
LUAU_ASSERT ( var . valueReg ! = kInvalidReg ) ;
2022-08-11 21:42:54 +01:00
2022-09-02 00:00:14 +01:00
if ( var . lvalue . kind ! = LValue : : Kind_Local )
2022-08-11 21:42:54 +01:00
{
2022-09-02 00:00:14 +01:00
setDebugLine ( var . lvalue . location ) ;
compileAssign ( var . lvalue , var . valueReg ) ;
2022-08-11 21:42:54 +01:00
}
}
2022-09-02 00:00:14 +01:00
// all regular local writes are done by the prior loops by computing result directly into target, so this just handles conflicts OR
// local copies from temporary registers in multret context, since in that case we have to allocate consecutive temporaries
for ( const Assignment & var : vars )
{
if ( var . lvalue . kind = = LValue : : Kind_Local & & var . valueReg ! = var . lvalue . reg )
bytecode . emitABC ( LOP_MOVE , var . lvalue . reg , var . valueReg , 0 ) ;
2021-10-29 21:25:12 +01:00
}
}
void compileStatCompoundAssign ( AstStatCompoundAssign * stat )
{
RegScope rs ( this ) ;
LValue var = compileLValue ( stat - > var , rs ) ;
// Optimization: assign to locals directly
uint8_t target = ( var . kind = = LValue : : Kind_Local ) ? var . reg : allocReg ( stat , 1 ) ;
switch ( stat - > op )
{
case AstExprBinary : : Add :
case AstExprBinary : : Sub :
case AstExprBinary : : Mul :
case AstExprBinary : : Div :
2023-09-01 17:38:53 +01:00
case AstExprBinary : : FloorDiv :
2021-10-29 21:25:12 +01:00
case AstExprBinary : : Mod :
case AstExprBinary : : Pow :
{
2023-09-01 17:38:53 +01:00
LUAU_ASSERT ( FFlag : : LuauFloorDivision | | stat - > op ! = AstExprBinary : : FloorDiv ) ;
2021-10-29 21:25:12 +01:00
if ( var . kind ! = LValue : : Kind_Local )
compileLValueUse ( var , target , /* set= */ false ) ;
int32_t rc = getConstantNumber ( stat - > value ) ;
if ( rc > = 0 & & rc < = 255 )
{
bytecode . emitABC ( getBinaryOpArith ( stat - > op , /* k= */ true ) , target , target , uint8_t ( rc ) ) ;
}
else
{
uint8_t rr = compileExprAuto ( stat - > value , rs ) ;
bytecode . emitABC ( getBinaryOpArith ( stat - > op ) , target , target , rr ) ;
}
}
break ;
case AstExprBinary : : Concat :
{
std : : vector < AstExpr * > args = { stat - > value } ;
// unroll the tree of concats down the right hand side to be able to do multiple ops
unrollConcats ( args ) ;
uint8_t regs = allocReg ( stat , unsigned ( 1 + args . size ( ) ) ) ;
compileLValueUse ( var , regs , /* set= */ false ) ;
for ( size_t i = 0 ; i < args . size ( ) ; + + i )
compileExprTemp ( args [ i ] , uint8_t ( regs + 1 + i ) ) ;
bytecode . emitABC ( LOP_CONCAT , target , regs , uint8_t ( regs + args . size ( ) ) ) ;
}
break ;
default :
LUAU_ASSERT ( ! " Unexpected compound assignment operation " ) ;
}
if ( var . kind ! = LValue : : Kind_Local )
compileAssign ( var , target ) ;
}
void compileStatFunction ( AstStatFunction * stat )
{
// Optimization: compile value expresion directly into target local register
2022-05-20 00:46:52 +01:00
if ( int reg = getExprLocalReg ( stat - > name ) ; reg > = 0 )
2021-10-29 21:25:12 +01:00
{
2022-05-20 00:46:52 +01:00
compileExpr ( stat - > func , uint8_t ( reg ) ) ;
2021-10-29 21:25:12 +01:00
return ;
}
RegScope rs ( this ) ;
uint8_t reg = allocReg ( stat , 1 ) ;
compileExprTemp ( stat - > func , reg ) ;
LValue var = compileLValue ( stat - > name , rs ) ;
compileAssign ( var , reg ) ;
}
void compileStat ( AstStat * node )
{
setDebugLine ( node ) ;
if ( options . coverageLevel > = 1 & & needsCoverage ( node ) )
{
bytecode . emitABC ( LOP_COVERAGE , 0 , 0 , 0 ) ;
}
if ( AstStatBlock * stat = node - > as < AstStatBlock > ( ) )
{
RegScope rs ( this ) ;
size_t oldLocals = localStack . size ( ) ;
for ( size_t i = 0 ; i < stat - > body . size ; + + i )
compileStat ( stat - > body . data [ i ] ) ;
closeLocals ( oldLocals ) ;
popLocals ( oldLocals ) ;
}
else if ( AstStatIf * stat = node - > as < AstStatIf > ( ) )
{
compileStatIf ( stat ) ;
}
else if ( AstStatWhile * stat = node - > as < AstStatWhile > ( ) )
{
compileStatWhile ( stat ) ;
}
else if ( AstStatRepeat * stat = node - > as < AstStatRepeat > ( ) )
{
compileStatRepeat ( stat ) ;
}
else if ( node - > is < AstStatBreak > ( ) )
{
2021-11-12 02:12:39 +00:00
LUAU_ASSERT ( ! loops . empty ( ) ) ;
2021-10-29 21:25:12 +01:00
// before exiting out of the loop, we need to close all local variables that were captured in closures since loop start
// normally they are closed by the enclosing blocks, including the loop block, but we're skipping that here
closeLocals ( loops . back ( ) . localOffset ) ;
size_t label = bytecode . emitLabel ( ) ;
bytecode . emitAD ( LOP_JUMP , 0 , 0 ) ;
loopJumps . push_back ( { LoopJump : : Break , label } ) ;
}
else if ( AstStatContinue * stat = node - > as < AstStatContinue > ( ) )
{
2021-11-12 02:12:39 +00:00
LUAU_ASSERT ( ! loops . empty ( ) ) ;
2023-11-03 19:47:28 +00:00
// track continue statement for repeat..until validation (validateContinueUntil)
if ( ! loops . back ( ) . continueUsed )
loops . back ( ) . continueUsed = stat ;
2021-10-29 21:25:12 +01:00
// before continuing, we need to close all local variables that were captured in closures since loop start
// normally they are closed by the enclosing blocks, including the loop block, but we're skipping that here
2023-10-06 18:31:16 +01:00
closeLocals ( loops . back ( ) . localOffsetContinue ) ;
2021-10-29 21:25:12 +01:00
size_t label = bytecode . emitLabel ( ) ;
bytecode . emitAD ( LOP_JUMP , 0 , 0 ) ;
loopJumps . push_back ( { LoopJump : : Continue , label } ) ;
}
else if ( AstStatReturn * stat = node - > as < AstStatReturn > ( ) )
{
2022-05-06 00:52:48 +01:00
if ( options . optimizationLevel > = 2 & & ! inlineFrames . empty ( ) )
compileInlineReturn ( stat , /* fallthrough= */ false ) ;
else
compileStatReturn ( stat ) ;
2021-10-29 21:25:12 +01:00
}
else if ( AstStatExpr * stat = node - > as < AstStatExpr > ( ) )
{
// Optimization: since we don't need to read anything from the stack, we can compile the call to not return anything which saves register
// moves
if ( AstExprCall * expr = stat - > expr - > as < AstExprCall > ( ) )
{
uint8_t target = uint8_t ( regTop ) ;
compileExprCall ( expr , target , /* targetCount= */ 0 ) ;
}
else
{
RegScope rs ( this ) ;
compileExprAuto ( stat - > expr , rs ) ;
}
}
else if ( AstStatLocal * stat = node - > as < AstStatLocal > ( ) )
{
compileStatLocal ( stat ) ;
}
else if ( AstStatFor * stat = node - > as < AstStatFor > ( ) )
{
compileStatFor ( stat ) ;
}
else if ( AstStatForIn * stat = node - > as < AstStatForIn > ( ) )
{
compileStatForIn ( stat ) ;
}
else if ( AstStatAssign * stat = node - > as < AstStatAssign > ( ) )
{
compileStatAssign ( stat ) ;
}
else if ( AstStatCompoundAssign * stat = node - > as < AstStatCompoundAssign > ( ) )
{
compileStatCompoundAssign ( stat ) ;
}
else if ( AstStatFunction * stat = node - > as < AstStatFunction > ( ) )
{
compileStatFunction ( stat ) ;
}
else if ( AstStatLocalFunction * stat = node - > as < AstStatLocalFunction > ( ) )
{
uint8_t var = allocReg ( stat , 1 ) ;
pushLocal ( stat - > name , var ) ;
compileExprFunction ( stat - > func , var ) ;
Local & l = locals [ stat - > name ] ;
// we *have* to pushLocal before we compile the function, since the function may refer to the local as an upvalue
// however, this means the debugpc for the local is at an instruction where the local value hasn't been computed yet
// to fix this we just move the debugpc after the local value is established
l . debugpc = bytecode . getDebugPC ( ) ;
}
else if ( node - > is < AstStatTypeAlias > ( ) )
{
// do nothing
}
else
{
LUAU_ASSERT ( ! " Unknown statement type " ) ;
}
}
2023-10-13 20:38:31 +01:00
void validateContinueUntil ( AstStat * cont , AstExpr * condition , AstStatBlock * body , size_t start )
{
UndefinedLocalVisitor visitor ( this ) ;
for ( size_t i = start ; i < body - > body . size ; + + i )
{
if ( AstStatLocal * stat = body - > body . data [ i ] - > as < AstStatLocal > ( ) )
{
for ( AstLocal * local : stat - > vars )
visitor . locals . insert ( local ) ;
}
else if ( AstStatLocalFunction * stat = body - > body . data [ i ] - > as < AstStatLocalFunction > ( ) )
{
visitor . locals . insert ( stat - > name ) ;
}
}
condition - > visit ( & visitor ) ;
if ( visitor . undef )
CompileError : : raise ( condition - > location ,
" Local %s used in the repeat..until condition is undefined because continue statement on line %d jumps over it " ,
visitor . undef - > name . value , cont - > location . begin . line + 1 ) ;
}
2021-10-29 21:25:12 +01:00
void gatherConstUpvals ( AstExprFunction * func )
{
ConstUpvalueVisitor visitor ( this ) ;
func - > body - > visit ( & visitor ) ;
for ( AstLocal * local : visitor . upvals )
getUpval ( local ) ;
}
void pushLocal ( AstLocal * local , uint8_t reg )
{
if ( localStack . size ( ) > = kMaxLocalCount )
CompileError : : raise (
local - > location , " Out of local registers when trying to allocate %s: exceeded limit %d " , local - > name . value , kMaxLocalCount ) ;
localStack . push_back ( local ) ;
Local & l = locals [ local ] ;
LUAU_ASSERT ( ! l . allocated ) ;
l . reg = reg ;
l . allocated = true ;
l . debugpc = bytecode . getDebugPC ( ) ;
}
bool areLocalsCaptured ( size_t start )
{
LUAU_ASSERT ( start < = localStack . size ( ) ) ;
for ( size_t i = start ; i < localStack . size ( ) ; + + i )
{
Local * l = locals . find ( localStack [ i ] ) ;
LUAU_ASSERT ( l ) ;
2022-01-14 16:06:31 +00:00
if ( l - > captured )
2021-10-29 21:25:12 +01:00
return true ;
}
return false ;
}
void closeLocals ( size_t start )
{
LUAU_ASSERT ( start < = localStack . size ( ) ) ;
bool captured = false ;
uint8_t captureReg = 255 ;
for ( size_t i = start ; i < localStack . size ( ) ; + + i )
{
Local * l = locals . find ( localStack [ i ] ) ;
LUAU_ASSERT ( l ) ;
2022-01-14 16:06:31 +00:00
if ( l - > captured )
2021-10-29 21:25:12 +01:00
{
captured = true ;
captureReg = std : : min ( captureReg , l - > reg ) ;
}
}
if ( captured )
{
bytecode . emitABC ( LOP_CLOSEUPVALS , captureReg , 0 , 0 ) ;
}
}
void popLocals ( size_t start )
{
LUAU_ASSERT ( start < = localStack . size ( ) ) ;
for ( size_t i = start ; i < localStack . size ( ) ; + + i )
{
Local * l = locals . find ( localStack [ i ] ) ;
LUAU_ASSERT ( l ) ;
LUAU_ASSERT ( l - > allocated ) ;
l - > allocated = false ;
if ( options . debugLevel > = 2 )
{
uint32_t debugpc = bytecode . getDebugPC ( ) ;
bytecode . pushDebugLocal ( sref ( localStack [ i ] - > name ) , l - > reg , l - > debugpc , debugpc ) ;
}
}
localStack . resize ( start ) ;
}
void patchJump ( AstNode * node , size_t label , size_t target )
{
if ( ! bytecode . patchJumpD ( label , target ) )
CompileError : : raise ( node - > location , " Exceeded jump distance limit; simplify the code to compile " ) ;
}
void patchJumps ( AstNode * node , std : : vector < size_t > & labels , size_t target )
{
for ( size_t l : labels )
patchJump ( node , l , target ) ;
}
void patchLoopJumps ( AstNode * node , size_t oldJumps , size_t endLabel , size_t contLabel )
{
LUAU_ASSERT ( oldJumps < = loopJumps . size ( ) ) ;
for ( size_t i = oldJumps ; i < loopJumps . size ( ) ; + + i )
{
const LoopJump & lj = loopJumps [ i ] ;
switch ( lj . type )
{
case LoopJump : : Break :
patchJump ( node , lj . label , endLabel ) ;
break ;
case LoopJump : : Continue :
patchJump ( node , lj . label , contLabel ) ;
break ;
default :
LUAU_ASSERT ( ! " Unknown loop jump type " ) ;
}
}
}
uint8_t allocReg ( AstNode * node , unsigned int count )
{
unsigned int top = regTop ;
if ( top + count > kMaxRegisterCount )
CompileError : : raise ( node - > location , " Out of registers when trying to allocate %d registers: exceeded limit %d " , count , kMaxRegisterCount ) ;
regTop + = count ;
stackSize = std : : max ( stackSize , regTop ) ;
return uint8_t ( top ) ;
}
void setDebugLine ( AstNode * node )
{
if ( options . debugLevel > = 1 )
bytecode . setDebugLine ( node - > location . begin . line + 1 ) ;
}
2021-12-02 23:20:08 +00:00
void setDebugLine ( const Location & location )
{
if ( options . debugLevel > = 1 )
bytecode . setDebugLine ( location . begin . line + 1 ) ;
}
2021-10-29 21:25:12 +01:00
void setDebugLineEnd ( AstNode * node )
{
if ( options . debugLevel > = 1 )
bytecode . setDebugLine ( node - > location . end . line + 1 ) ;
}
bool needsCoverage ( AstNode * node )
{
return ! node - > is < AstStatBlock > ( ) & & ! node - > is < AstStatTypeAlias > ( ) ;
}
struct FenvVisitor : AstVisitor
{
bool & getfenvUsed ;
bool & setfenvUsed ;
FenvVisitor ( bool & getfenvUsed , bool & setfenvUsed )
: getfenvUsed ( getfenvUsed )
, setfenvUsed ( setfenvUsed )
{
}
bool visit ( AstExprGlobal * node ) override
{
if ( node - > name = = " getfenv " )
getfenvUsed = true ;
if ( node - > name = = " setfenv " )
setfenvUsed = true ;
return false ;
}
} ;
struct FunctionVisitor : AstVisitor
{
Compiler * self ;
std : : vector < AstExprFunction * > & functions ;
2023-08-04 18:01:35 +01:00
bool hasTypes = false ;
2021-10-29 21:25:12 +01:00
FunctionVisitor ( Compiler * self , std : : vector < AstExprFunction * > & functions )
: self ( self )
, functions ( functions )
{
2022-04-21 22:04:22 +01:00
// preallocate the result; this works around std::vector's inefficient growth policy for small arrays
functions . reserve ( 16 ) ;
2021-10-29 21:25:12 +01:00
}
bool visit ( AstExprFunction * node ) override
{
node - > body - > visit ( this ) ;
2023-08-11 13:55:30 +01:00
for ( AstLocal * arg : node - > args )
hasTypes | = arg - > annotation ! = nullptr ;
2023-08-04 18:01:35 +01:00
2021-10-29 21:25:12 +01:00
// this makes sure all functions that are used when compiling this one have been already added to the vector
functions . push_back ( node ) ;
return false ;
}
} ;
struct UndefinedLocalVisitor : AstVisitor
{
UndefinedLocalVisitor ( Compiler * self )
: self ( self )
, undef ( nullptr )
2023-10-13 20:38:31 +01:00
, locals ( nullptr )
2021-10-29 21:25:12 +01:00
{
}
void check ( AstLocal * local )
{
2023-11-03 19:47:28 +00:00
if ( ! undef & & locals . contains ( local ) )
undef = local ;
2021-10-29 21:25:12 +01:00
}
bool visit ( AstExprLocal * node ) override
{
if ( ! node - > upvalue )
check ( node - > local ) ;
return false ;
}
bool visit ( AstExprFunction * node ) override
{
const Function * f = self - > functions . find ( node ) ;
LUAU_ASSERT ( f ) ;
for ( AstLocal * uv : f - > upvals )
{
LUAU_ASSERT ( uv - > functionDepth < node - > functionDepth ) ;
if ( uv - > functionDepth = = node - > functionDepth - 1 )
check ( uv ) ;
}
return false ;
}
Compiler * self ;
AstLocal * undef ;
2023-10-13 20:38:31 +01:00
DenseHashSet < AstLocal * > locals ;
2021-10-29 21:25:12 +01:00
} ;
struct ConstUpvalueVisitor : AstVisitor
{
ConstUpvalueVisitor ( Compiler * self )
: self ( self )
{
}
bool visit ( AstExprLocal * node ) override
{
if ( node - > upvalue & & self - > isConstant ( node ) )
{
upvals . push_back ( node - > local ) ;
}
return false ;
}
bool visit ( AstExprFunction * node ) override
{
// short-circuits the traversal to make it faster
return false ;
}
Compiler * self ;
std : : vector < AstLocal * > upvals ;
} ;
2022-07-01 00:29:02 +01:00
struct ReturnVisitor : AstVisitor
2022-06-17 01:54:42 +01:00
{
Compiler * self ;
bool returnsOne = true ;
ReturnVisitor ( Compiler * self )
: self ( self )
{
}
bool visit ( AstExpr * expr ) override
{
return false ;
}
bool visit ( AstStatReturn * stat ) override
{
2022-07-29 04:41:13 +01:00
returnsOne & = stat - > list . size = = 1 & & ! self - > isExprMultRet ( stat - > list . data [ 0 ] ) ;
2022-06-17 01:54:42 +01:00
return false ;
}
} ;
2021-10-29 21:25:12 +01:00
struct RegScope
{
RegScope ( Compiler * self )
: self ( self )
, oldTop ( self - > regTop )
{
}
// This ctor is useful to forcefully adjust the stack frame in case we know that registers after a certain point are scratch and can be
// discarded
RegScope ( Compiler * self , unsigned int top )
: self ( self )
, oldTop ( self - > regTop )
{
LUAU_ASSERT ( top < = self - > regTop ) ;
self - > regTop = top ;
}
~ RegScope ( )
{
self - > regTop = oldTop ;
}
Compiler * self ;
unsigned int oldTop ;
} ;
struct Function
{
uint32_t id ;
std : : vector < AstLocal * > upvals ;
2022-05-06 00:52:48 +01:00
uint64_t costModel = 0 ;
unsigned int stackSize = 0 ;
bool canInline = false ;
2022-06-17 01:54:42 +01:00
bool returnsOne = false ;
2021-10-29 21:25:12 +01:00
} ;
struct Local
{
uint8_t reg = 0 ;
bool allocated = false ;
bool captured = false ;
uint32_t debugpc = 0 ;
} ;
struct LoopJump
{
enum Type
{
Break ,
Continue
} ;
Type type ;
size_t label ;
} ;
struct Loop
{
size_t localOffset ;
2023-10-06 18:31:16 +01:00
size_t localOffsetContinue ;
2021-10-29 21:25:12 +01:00
2023-10-13 20:38:31 +01:00
AstStatContinue * continueUsed ;
2021-10-29 21:25:12 +01:00
} ;
2023-05-25 21:46:51 +01:00
struct InlineArg
{
AstLocal * local ;
uint8_t reg ;
Constant value ;
} ;
2022-05-06 00:52:48 +01:00
struct InlineFrame
{
AstExprFunction * func ;
2022-06-17 01:54:42 +01:00
size_t localOffset ;
2022-05-06 00:52:48 +01:00
uint8_t target ;
uint8_t targetCount ;
std : : vector < size_t > returnJumps ;
} ;
2022-05-20 00:46:52 +01:00
struct Capture
{
LuauCaptureType type ;
uint8_t data ;
} ;
2021-10-29 21:25:12 +01:00
BytecodeBuilder & bytecode ;
CompileOptions options ;
DenseHashMap < AstExprFunction * , Function > functions ;
DenseHashMap < AstLocal * , Local > locals ;
DenseHashMap < AstName , Global > globals ;
2022-01-14 16:06:31 +00:00
DenseHashMap < AstLocal * , Variable > variables ;
2021-10-29 21:25:12 +01:00
DenseHashMap < AstExpr * , Constant > constants ;
2022-04-21 22:04:22 +01:00
DenseHashMap < AstLocal * , Constant > locstants ;
2022-01-14 16:06:31 +00:00
DenseHashMap < AstExprTable * , TableShape > tableShapes ;
2022-07-14 23:39:35 +01:00
DenseHashMap < AstExprCall * , int > builtins ;
2023-07-07 18:14:35 +01:00
DenseHashMap < AstExprFunction * , std : : string > typeMap ;
2022-07-14 23:39:35 +01:00
const DenseHashMap < AstExprCall * , int > * builtinsFold = nullptr ;
2023-08-04 18:01:35 +01:00
bool builtinsFoldMathK = false ;
2021-10-29 21:25:12 +01:00
2023-10-06 18:31:16 +01:00
// compileFunction state, gets reset for every function
2021-10-29 21:25:12 +01:00
unsigned int regTop = 0 ;
unsigned int stackSize = 0 ;
2023-10-06 18:31:16 +01:00
bool hasLoops = false ;
2021-10-29 21:25:12 +01:00
bool getfenvUsed = false ;
bool setfenvUsed = false ;
std : : vector < AstLocal * > localStack ;
std : : vector < AstLocal * > upvals ;
std : : vector < LoopJump > loopJumps ;
std : : vector < Loop > loops ;
2022-05-06 00:52:48 +01:00
std : : vector < InlineFrame > inlineFrames ;
2022-05-20 00:46:52 +01:00
std : : vector < Capture > captures ;
2022-08-25 21:55:08 +01:00
std : : vector < std : : unique_ptr < char [ ] > > interpStrings ;
2021-10-29 21:25:12 +01:00
} ;
2022-07-14 23:39:35 +01:00
void compileOrThrow ( BytecodeBuilder & bytecode , const ParseResult & parseResult , const AstNameTable & names , const CompileOptions & inputOptions )
2021-10-29 21:25:12 +01:00
{
2021-11-05 02:07:18 +00:00
LUAU_TIMETRACE_SCOPE ( " compileOrThrow " , " Compiler " ) ;
2022-07-14 23:39:35 +01:00
LUAU_ASSERT ( parseResult . root ) ;
LUAU_ASSERT ( parseResult . errors . empty ( ) ) ;
CompileOptions options = inputOptions ;
2023-07-28 12:37:00 +01:00
uint8_t mainFlags = 0 ;
2022-07-14 23:39:35 +01:00
for ( const HotComment & hc : parseResult . hotcomments )
2023-07-28 12:37:00 +01:00
{
2022-07-14 23:39:35 +01:00
if ( hc . header & & hc . content . compare ( 0 , 9 , " optimize " ) = = 0 )
options . optimizationLevel = std : : max ( 0 , std : : min ( 2 , atoi ( hc . content . c_str ( ) + 9 ) ) ) ;
2023-08-11 13:55:30 +01:00
if ( hc . header & & hc . content = = " native " )
2023-07-28 12:37:00 +01:00
{
mainFlags | = LPF_NATIVE_MODULE ;
options . optimizationLevel = 2 ; // note: this might be removed in the future in favor of --!optimize
}
}
2022-07-14 23:39:35 +01:00
AstStatBlock * root = parseResult . root ;
2021-10-29 21:25:12 +01:00
Compiler compiler ( bytecode , options ) ;
2021-11-12 02:12:39 +00:00
// since access to some global objects may result in values that change over time, we block imports from non-readonly tables
2022-01-14 16:06:31 +00:00
assignMutable ( compiler . globals , names , options . mutableGlobals ) ;
2021-10-29 21:25:12 +01:00
2022-01-14 16:06:31 +00:00
// this pass analyzes mutability of locals/globals and associates locals with their initial values
trackValues ( compiler . globals , compiler . variables , root ) ;
2021-10-29 21:25:12 +01:00
2023-10-06 18:31:16 +01:00
// this visitor tracks calls to getfenv/setfenv and disables some optimizations when they are found
if ( options . optimizationLevel > = 1 & & ( names . get ( " getfenv " ) . value | | names . get ( " setfenv " ) . value ) )
{
Compiler : : FenvVisitor fenvVisitor ( compiler . getfenvUsed , compiler . setfenvUsed ) ;
root - > visit ( & fenvVisitor ) ;
}
2022-07-14 23:39:35 +01:00
// builtin folding is enabled on optimization level 2 since we can't deoptimize folding at runtime
2023-10-27 20:33:36 +01:00
if ( options . optimizationLevel > = 2 & & ( ! compiler . getfenvUsed & & ! compiler . setfenvUsed ) )
2023-08-04 18:01:35 +01:00
{
2022-07-14 23:39:35 +01:00
compiler . builtinsFold = & compiler . builtins ;
2023-08-25 16:25:09 +01:00
if ( AstName math = names . get ( " math " ) ; math . value & & getGlobalState ( compiler . globals , math ) = = Global : : Default )
compiler . builtinsFoldMathK = true ;
2023-08-04 18:01:35 +01:00
}
2021-10-29 21:25:12 +01:00
if ( options . optimizationLevel > = 1 )
{
2022-07-14 23:39:35 +01:00
// this pass tracks which calls are builtins and can be compiled more efficiently
analyzeBuiltins ( compiler . builtins , compiler . globals , compiler . variables , options , root ) ;
2022-01-14 16:06:31 +00:00
// this pass analyzes constantness of expressions
2023-08-04 18:01:35 +01:00
foldConstants ( compiler . constants , compiler . variables , compiler . locstants , compiler . builtinsFold , compiler . builtinsFoldMathK , root ) ;
2022-01-14 16:06:31 +00:00
// this pass analyzes table assignments to estimate table shapes for initially empty tables
predictTableShapes ( compiler . tableShapes , root ) ;
2021-10-29 21:25:12 +01:00
}
// gathers all functions with the invariant that all function references are to functions earlier in the list
// for example, function foo() return function() end end will result in two vector entries, [0] = anonymous and [1] = foo
std : : vector < AstExprFunction * > functions ;
Compiler : : FunctionVisitor functionVisitor ( & compiler , functions ) ;
root - > visit ( & functionVisitor ) ;
2023-08-04 18:01:35 +01:00
// computes type information for all functions based on type annotations
2023-08-11 13:55:30 +01:00
if ( functionVisitor . hasTypes )
2023-08-04 18:01:35 +01:00
buildTypeMap ( compiler . typeMap , root , options . vectorType ) ;
2021-10-29 21:25:12 +01:00
for ( AstExprFunction * expr : functions )
2023-07-28 12:37:00 +01:00
compiler . compileFunction ( expr , 0 ) ;
2021-10-29 21:25:12 +01:00
2022-01-14 16:06:31 +00:00
AstExprFunction main ( root - > location , /*generics= */ AstArray < AstGenericType > ( ) , /*genericPacks= */ AstArray < AstGenericTypePack > ( ) ,
2022-08-25 21:55:08 +01:00
/* self= */ nullptr , AstArray < AstLocal * > ( ) , /* vararg= */ true , /* varargLocation= */ Luau : : Location ( ) , root , /* functionDepth= */ 0 ,
/* debugname= */ AstName ( ) ) ;
2023-07-28 12:37:00 +01:00
uint32_t mainid = compiler . compileFunction ( & main , mainFlags ) ;
2021-10-29 21:25:12 +01:00
2022-05-20 00:46:52 +01:00
const Compiler : : Function * mainf = compiler . functions . find ( & main ) ;
LUAU_ASSERT ( mainf & & mainf - > upvals . empty ( ) ) ;
2021-10-29 21:25:12 +01:00
bytecode . setMainFunction ( mainid ) ;
bytecode . finalize ( ) ;
}
void compileOrThrow ( BytecodeBuilder & bytecode , const std : : string & source , const CompileOptions & options , const ParseOptions & parseOptions )
{
Allocator allocator ;
AstNameTable names ( allocator ) ;
ParseResult result = Parser : : parse ( source . c_str ( ) , source . size ( ) , names , allocator , parseOptions ) ;
if ( ! result . errors . empty ( ) )
throw ParseErrors ( result . errors ) ;
2022-07-14 23:39:35 +01:00
compileOrThrow ( bytecode , result , names , options ) ;
2021-10-29 21:25:12 +01:00
}
std : : string compile ( const std : : string & source , const CompileOptions & options , const ParseOptions & parseOptions , BytecodeEncoder * encoder )
{
2021-11-05 02:07:18 +00:00
LUAU_TIMETRACE_SCOPE ( " compile " , " Compiler " ) ;
2021-10-29 21:25:12 +01:00
Allocator allocator ;
AstNameTable names ( allocator ) ;
ParseResult result = Parser : : parse ( source . c_str ( ) , source . size ( ) , names , allocator , parseOptions ) ;
if ( ! result . errors . empty ( ) )
{
// Users of this function expect only a single error message
const Luau : : ParseError & parseError = result . errors . front ( ) ;
std : : string error = format ( " :%d: %s " , parseError . getLocation ( ) . begin . line + 1 , parseError . what ( ) ) ;
return BytecodeBuilder : : getError ( error ) ;
}
try
{
BytecodeBuilder bcb ( encoder ) ;
2022-07-14 23:39:35 +01:00
compileOrThrow ( bcb , result , names , options ) ;
2021-10-29 21:25:12 +01:00
return bcb . getBytecode ( ) ;
}
catch ( CompileError & e )
{
std : : string error = format ( " :%d: %s " , e . getLocation ( ) . begin . line + 1 , e . what ( ) ) ;
return BytecodeBuilder : : getError ( error ) ;
}
}
} // namespace Luau