mirror of
https://github.com/luau-lang/luau.git
synced 2025-04-03 18:30:54 +01:00
CodeGen: Implement DOT_VEC IR opcode
This exposes vdpps on X64 and allows to compute a 3-wide dot product for two vectors, returning the result as a number.
This commit is contained in:
parent
d2c008c3a8
commit
74a91289e9
7 changed files with 31 additions and 1 deletions
|
@ -194,6 +194,10 @@ enum class IrCmd : uint8_t
|
|||
// A: TValue
|
||||
UNM_VEC,
|
||||
|
||||
// Compute dot product between two vectors
|
||||
// A, B: TValue
|
||||
DOT_VEC,
|
||||
|
||||
// Compute Luau 'not' operation on destructured TValue
|
||||
// A: tag
|
||||
// B: int (value)
|
||||
|
|
|
@ -176,6 +176,7 @@ inline bool hasResult(IrCmd cmd)
|
|||
case IrCmd::SUB_VEC:
|
||||
case IrCmd::MUL_VEC:
|
||||
case IrCmd::DIV_VEC:
|
||||
case IrCmd::DOT_VEC:
|
||||
case IrCmd::UNM_VEC:
|
||||
case IrCmd::NOT_ANY:
|
||||
case IrCmd::CMP_ANY:
|
||||
|
|
|
@ -163,6 +163,8 @@ const char* getCmdName(IrCmd cmd)
|
|||
return "DIV_VEC";
|
||||
case IrCmd::UNM_VEC:
|
||||
return "UNM_VEC";
|
||||
case IrCmd::DOT_VEC:
|
||||
return "DOT_VEC";
|
||||
case IrCmd::NOT_ANY:
|
||||
return "NOT_ANY";
|
||||
case IrCmd::CMP_ANY:
|
||||
|
|
|
@ -728,6 +728,11 @@ void IrLoweringA64::lowerInst(IrInst& inst, uint32_t index, const IrBlock& next)
|
|||
build.fneg(inst.regA64, regOp(inst.a));
|
||||
break;
|
||||
}
|
||||
case IrCmd::DOT_VEC:
|
||||
{
|
||||
CODEGEN_ASSERT(!"DOT_VEC is not implemented for A64");
|
||||
break;
|
||||
}
|
||||
case IrCmd::NOT_ANY:
|
||||
{
|
||||
inst.regA64 = regs.allocReuse(KindA64::w, index, {inst.a, inst.b});
|
||||
|
|
|
@ -675,6 +675,20 @@ void IrLoweringX64::lowerInst(IrInst& inst, uint32_t index, const IrBlock& next)
|
|||
build.vxorpd(inst.regX64, regOp(inst.a), build.f32x4(-0.0, -0.0, -0.0, -0.0));
|
||||
break;
|
||||
}
|
||||
case IrCmd::DOT_VEC:
|
||||
{
|
||||
inst.regX64 = regs.allocRegOrReuse(SizeX64::xmmword, index, {inst.a, inst.b});
|
||||
|
||||
ScopedRegX64 tmp1{regs};
|
||||
ScopedRegX64 tmp2{regs};
|
||||
|
||||
RegisterX64 tmpa = vecOp(inst.a, tmp1);
|
||||
RegisterX64 tmpb = (inst.a == inst.b) ? tmpa : vecOp(inst.b, tmp2);
|
||||
|
||||
build.vdpps(inst.regX64, tmpa, tmpb, 0x71); // 7 = 0b0111, sum first 3 products into first float
|
||||
build.vcvtss2sd(inst.regX64, inst.regX64, inst.regX64);
|
||||
break;
|
||||
}
|
||||
case IrCmd::NOT_ANY:
|
||||
{
|
||||
// TODO: if we have a single user which is a STORE_INT, we are missing the opportunity to write directly to target
|
||||
|
|
|
@ -75,6 +75,8 @@ IrValueKind getCmdValueKind(IrCmd cmd)
|
|||
case IrCmd::DIV_VEC:
|
||||
case IrCmd::UNM_VEC:
|
||||
return IrValueKind::Tvalue;
|
||||
case IrCmd::DOT_VEC:
|
||||
return IrValueKind::Double;
|
||||
case IrCmd::NOT_ANY:
|
||||
case IrCmd::CMP_ANY:
|
||||
return IrValueKind::Int;
|
||||
|
|
|
@ -768,7 +768,8 @@ static void constPropInInst(ConstPropState& state, IrBuilder& build, IrFunction&
|
|||
if (tag == LUA_TBOOLEAN &&
|
||||
(value.kind == IrOpKind::Inst || (value.kind == IrOpKind::Constant && function.constOp(value).kind == IrConstKind::Int)))
|
||||
canSplitTvalueStore = true;
|
||||
else if (tag == LUA_TNUMBER && (value.kind == IrOpKind::Inst || (value.kind == IrOpKind::Constant && function.constOp(value).kind == IrConstKind::Double)))
|
||||
else if (tag == LUA_TNUMBER &&
|
||||
(value.kind == IrOpKind::Inst || (value.kind == IrOpKind::Constant && function.constOp(value).kind == IrConstKind::Double)))
|
||||
canSplitTvalueStore = true;
|
||||
else if (tag != 0xff && isGCO(tag) && value.kind == IrOpKind::Inst)
|
||||
canSplitTvalueStore = true;
|
||||
|
@ -1342,6 +1343,7 @@ static void constPropInInst(ConstPropState& state, IrBuilder& build, IrFunction&
|
|||
case IrCmd::SUB_VEC:
|
||||
case IrCmd::MUL_VEC:
|
||||
case IrCmd::DIV_VEC:
|
||||
case IrCmd::DOT_VEC:
|
||||
if (IrInst* a = function.asInstOp(inst.a); a && a->cmd == IrCmd::TAG_VECTOR)
|
||||
replace(function, inst.a, a->a);
|
||||
|
||||
|
|
Loading…
Add table
Reference in a new issue