luau/Analysis/include/Luau/Normalize.h

466 lines
15 KiB
C
Raw Permalink Normal View History

2022-04-14 22:57:15 +01:00
// This file is part of the Luau programming language and is licensed under MIT License; see LICENSE.txt for details
2022-09-08 22:44:50 +01:00
#pragma once
2022-04-14 22:57:15 +01:00
Sync to upstream/release/655 * General - Fix the benchmark require wrapper function to work in Lua - Fix memory leak in the new Luau C API test * New Solver - Luau: type functions should be able to signal whether or not irreducibility is due to an error - Do not generate extra expansion constraint for uninvoked user-defined type functions - Print in a user-defined type function should be reported as an error instead of logging to stdout - Many e-graphs bugfixes and performance improvements - Many general bugfixes and improvements to the new solver as a whole - Fixed issue with Luau used-defined type functions not having all environments initialized - Infer types of globals under new type solver * Fragment Autocomplete - Miscellaneous fixes to make interop with the old solver better * Runtime - Support disabling specific Luau built-in functions from being fast-called or constant-evaluated - Added constant folding for vector arithmetic - Added constant propagation and type inference for Vector3 globals ---------------------------------------------------------- 9 contributors: Co-authored-by: Aaron Weiss <aaronweiss@roblox.com> Co-authored-by: Andy Friesen <afriesen@roblox.com> Co-authored-by: Aviral Goel <agoel@roblox.com> Co-authored-by: Daniel Angel <danielangel@roblox.com> Co-authored-by: Jonathan Kelaty <jkelaty@roblox.com> Co-authored-by: Hunter Goldstein <hgoldstein@roblox.com> Co-authored-by: Varun Saini <vsaini@roblox.com> Co-authored-by: Vighnesh Vijay <vvijay@roblox.com> Co-authored-by: Vyacheslav Egorov <vegorov@roblox.com>
2024-12-13 18:57:30 +00:00
#include "Luau/EqSatSimplification.h"
2022-08-18 22:04:33 +01:00
#include "Luau/NotNull.h"
2023-11-10 18:05:48 +00:00
#include "Luau/Set.h"
2023-10-20 21:36:26 +01:00
#include "Luau/TypeFwd.h"
2022-10-07 00:55:58 +01:00
#include "Luau/UnifierSharedState.h"
2022-08-18 22:04:33 +01:00
2023-10-20 21:36:26 +01:00
#include <initializer_list>
#include <map>
2022-08-18 22:04:33 +01:00
#include <memory>
2023-10-20 21:36:26 +01:00
#include <unordered_map>
#include <vector>
2022-04-14 22:57:15 +01:00
namespace Luau
{
struct InternalErrorReporter;
2022-08-18 22:04:33 +01:00
struct Module;
struct Scope;
using ModulePtr = std::shared_ptr<Module>;
2022-04-14 22:57:15 +01:00
Sync to upstream/release/655 * General - Fix the benchmark require wrapper function to work in Lua - Fix memory leak in the new Luau C API test * New Solver - Luau: type functions should be able to signal whether or not irreducibility is due to an error - Do not generate extra expansion constraint for uninvoked user-defined type functions - Print in a user-defined type function should be reported as an error instead of logging to stdout - Many e-graphs bugfixes and performance improvements - Many general bugfixes and improvements to the new solver as a whole - Fixed issue with Luau used-defined type functions not having all environments initialized - Infer types of globals under new type solver * Fragment Autocomplete - Miscellaneous fixes to make interop with the old solver better * Runtime - Support disabling specific Luau built-in functions from being fast-called or constant-evaluated - Added constant folding for vector arithmetic - Added constant propagation and type inference for Vector3 globals ---------------------------------------------------------- 9 contributors: Co-authored-by: Aaron Weiss <aaronweiss@roblox.com> Co-authored-by: Andy Friesen <afriesen@roblox.com> Co-authored-by: Aviral Goel <agoel@roblox.com> Co-authored-by: Daniel Angel <danielangel@roblox.com> Co-authored-by: Jonathan Kelaty <jkelaty@roblox.com> Co-authored-by: Hunter Goldstein <hgoldstein@roblox.com> Co-authored-by: Varun Saini <vsaini@roblox.com> Co-authored-by: Vighnesh Vijay <vvijay@roblox.com> Co-authored-by: Vyacheslav Egorov <vegorov@roblox.com>
2024-12-13 18:57:30 +00:00
bool isSubtype(
TypeId subTy,
TypeId superTy,
NotNull<Scope> scope,
NotNull<BuiltinTypes> builtinTypes,
NotNull<Simplifier> simplifier,
InternalErrorReporter& ice
);
bool isSubtype(
TypePackId subPack,
TypePackId superPack,
NotNull<Scope> scope,
NotNull<BuiltinTypes> builtinTypes,
NotNull<Simplifier> simplifier,
InternalErrorReporter& ice
);
2022-09-08 22:44:50 +01:00
2022-10-07 00:55:58 +01:00
class TypeIds
{
private:
2023-11-03 19:47:28 +00:00
DenseHashMap<TypeId, bool> types{nullptr};
2022-10-07 00:55:58 +01:00
std::vector<TypeId> order;
std::size_t hash = 0;
public:
using iterator = std::vector<TypeId>::iterator;
using const_iterator = std::vector<TypeId>::const_iterator;
TypeIds() = default;
~TypeIds() = default;
2023-10-20 21:36:26 +01:00
TypeIds(std::initializer_list<TypeId> tys);
TypeIds(const TypeIds&) = default;
TypeIds& operator=(const TypeIds&) = default;
TypeIds(TypeIds&&) = default;
2022-10-07 00:55:58 +01:00
TypeIds& operator=(TypeIds&&) = default;
void insert(TypeId ty);
/// Erase every element that does not also occur in tys
void retain(const TypeIds& tys);
void clear();
2022-12-09 18:07:25 +00:00
TypeId front() const;
2022-10-07 00:55:58 +01:00
iterator begin();
iterator end();
const_iterator begin() const;
const_iterator end() const;
iterator erase(const_iterator it);
2024-07-26 01:10:42 +01:00
void erase(TypeId ty);
2022-10-07 00:55:58 +01:00
size_t size() const;
bool empty() const;
size_t count(TypeId ty) const;
template<class Iterator>
void insert(Iterator begin, Iterator end)
{
for (Iterator it = begin; it != end; ++it)
insert(*it);
}
2022-10-13 23:59:53 +01:00
bool operator==(const TypeIds& there) const;
2022-10-07 00:55:58 +01:00
size_t getHash() const;
2023-06-09 13:20:36 +01:00
bool isNever() const;
2022-10-07 00:55:58 +01:00
};
} // namespace Luau
2022-10-13 23:59:53 +01:00
template<>
struct std::hash<Luau::TypeIds>
2022-10-07 00:55:58 +01:00
{
std::size_t operator()(const Luau::TypeIds& tys) const
{
return tys.getHash();
}
};
2022-10-13 23:59:53 +01:00
template<>
struct std::hash<const Luau::TypeIds*>
2022-10-07 00:55:58 +01:00
{
std::size_t operator()(const Luau::TypeIds* tys) const
{
return tys->getHash();
}
};
2022-10-13 23:59:53 +01:00
template<>
struct std::equal_to<Luau::TypeIds>
2022-10-07 00:55:58 +01:00
{
bool operator()(const Luau::TypeIds& here, const Luau::TypeIds& there) const
{
return here == there;
}
};
2022-10-13 23:59:53 +01:00
template<>
struct std::equal_to<const Luau::TypeIds*>
2022-10-07 00:55:58 +01:00
{
bool operator()(const Luau::TypeIds* here, const Luau::TypeIds* there) const
{
return *here == *there;
}
};
namespace Luau
{
2022-10-27 23:22:49 +01:00
/** A normalized string type is either `string` (represented by `nullopt`) or a
* union of string singletons.
*
2022-12-09 18:07:25 +00:00
* The representation is as follows:
2022-10-27 23:22:49 +01:00
*
* * A union of string singletons is finite and includes the singletons named by
* the `singletons` field.
* * An intersection of negated string singletons is cofinite and includes the
* singletons excluded by the `singletons` field. It is implied that cofinite
* values are exclusions from `string` itself.
* * The `string` data type is a cofinite set minus zero elements.
* * The `never` data type is a finite set plus zero elements.
*/
struct NormalizedStringType
{
// When false, this type represents a union of singleton string types.
// eg "a" | "b" | "c"
//
// When true, this type represents string intersected with negated string
// singleton types.
// eg string & ~"a" & ~"b" & ...
bool isCofinite = false;
2022-12-09 18:07:25 +00:00
std::map<std::string, TypeId> singletons;
2022-10-27 23:22:49 +01:00
void resetToString();
void resetToNever();
bool isNever() const;
bool isString() const;
/// Returns true if the string has finite domain.
///
/// Important subtlety: This method returns true for `never`. The empty set
/// is indeed an empty set.
bool isUnion() const;
/// Returns true if the string has infinite domain.
bool isIntersection() const;
bool includes(const std::string& str) const;
static const NormalizedStringType never;
2022-12-09 18:07:25 +00:00
NormalizedStringType();
NormalizedStringType(bool isCofinite, std::map<std::string, TypeId> singletons);
2022-10-27 23:22:49 +01:00
};
bool isSubtype(const NormalizedStringType& subStr, const NormalizedStringType& superStr);
2022-10-07 00:55:58 +01:00
2023-01-03 17:33:19 +00:00
struct NormalizedClassType
{
/** Has the following structure:
*
* (C1 & ~N11 & ... & ~Nn) | (C2 & ~N21 & ... & ~N2n) | ...
*
* C2 is either not a subtype of any other Cm, or it is and is also a
* subtype of one of Nmn types within the same cluster.
*
* Each TypeId is a class type.
*/
std::unordered_map<TypeId, TypeIds> classes;
/**
* In order to maintain a consistent insertion order, we use this vector to
* keep track of it. An ordered std::map will sort by pointer identity,
* which is undesirable.
*/
std::vector<TypeId> ordering;
void pushPair(TypeId ty, TypeIds negations);
void resetToNever();
bool isNever() const;
};
2022-11-04 17:02:37 +00:00
// A normalized function type can be `never`, the top function type `function`,
2022-10-07 00:55:58 +01:00
// or an intersection of function types.
2022-11-04 17:02:37 +00:00
//
// NOTE: type normalization can fail on function types with generics (e.g.
// because we do not support unions and intersections of generic type packs), so
// this type may contain `error`.
struct NormalizedFunctionType
{
bool isTop = false;
2023-03-31 13:21:14 +01:00
TypeIds parts;
2022-11-04 17:02:37 +00:00
void resetToNever();
void resetToTop();
bool isNever() const;
};
2022-10-07 00:55:58 +01:00
// A normalized generic/free type is a union, where each option is of the form (X & T) where
2023-03-17 14:59:30 +00:00
// * X is either a free type, a generic or a blocked type.
2022-10-07 00:55:58 +01:00
// * T is a normalized type.
struct NormalizedType;
using NormalizedTyvars = std::unordered_map<TypeId, std::unique_ptr<NormalizedType>>;
2024-04-05 18:41:05 +01:00
// Operations provided by `Normalizer` can have ternary results:
// 1. The operation returned true.
// 2. The operation returned false.
// 3. They can hit resource limitations, which invalidates _all normalized types_.
enum class NormalizationResult
{
// The operation returned true or succeeded.
True,
// The operation returned false or failed.
False,
// Resource limits were hit, invalidating all normalized types.
HitLimits,
};
2022-10-07 00:55:58 +01:00
// A normalized type is either any, unknown, or one of the form P | T | F | G where
// * P is a union of primitive types (including singletons, classes and the error type)
// * T is a union of table types
// * F is a union of an intersection of function types
2023-03-17 14:59:30 +00:00
// * G is a union of generic/free/blocked types, intersected with a normalized type
2022-10-07 00:55:58 +01:00
struct NormalizedType
{
// The top part of the type.
// This type is either never, unknown, or any.
// If this type is not never, all the other fields are null.
TypeId tops;
// The boolean part of the type.
// This type is either never, boolean type, or a boolean singleton.
TypeId booleans;
2023-01-03 17:33:19 +00:00
NormalizedClassType classes;
2022-10-07 00:55:58 +01:00
// The error part of the type.
// This type is either never or the error type.
TypeId errors;
// The nil part of the type.
// This type is either never or nil.
TypeId nils;
// The number part of the type.
// This type is either never or number.
TypeId numbers;
// The string part of the type.
// This may be the `string` type, or a union of singletons.
2022-10-27 23:22:49 +01:00
NormalizedStringType strings;
2022-10-07 00:55:58 +01:00
// The thread part of the type.
// This type is either never or thread.
TypeId threads;
2023-11-10 18:05:48 +00:00
// The buffer part of the type.
// This type is either never or buffer.
TypeId buffers;
2022-10-07 00:55:58 +01:00
// The (meta)table part of the type.
2023-01-27 21:28:45 +00:00
// Each element of this set is a (meta)table type, or the top `table` type.
// An empty set denotes never.
2022-10-07 00:55:58 +01:00
TypeIds tables;
// The function part of the type.
NormalizedFunctionType functions;
// The generic/free part of the type.
NormalizedTyvars tyvars;
2024-04-12 11:44:40 +01:00
// Free types, blocked types, and certain other types change shape as type
// inference is done. If we were to cache the normalization of these types,
// we'd be reusing bad, stale data.
bool isCacheable = true;
2023-01-03 17:33:19 +00:00
NormalizedType(NotNull<BuiltinTypes> builtinTypes);
2022-10-07 00:55:58 +01:00
NormalizedType() = delete;
~NormalizedType() = default;
2022-11-04 17:02:37 +00:00
NormalizedType(const NormalizedType&) = delete;
NormalizedType& operator=(const NormalizedType&) = delete;
NormalizedType(NormalizedType&&) = default;
2022-10-07 00:55:58 +01:00
NormalizedType& operator=(NormalizedType&&) = default;
2023-05-19 19:59:59 +01:00
// IsType functions
2023-11-03 19:47:28 +00:00
bool isUnknown() const;
2023-06-09 13:20:36 +01:00
/// Returns true if the type is exactly a number. Behaves like Type::isNumber()
bool isExactlyNumber() const;
/// Returns true if the type is a subtype of string(it could be a singleton). Behaves like Type::isString()
bool isSubtypeOfString() const;
2024-05-10 17:17:09 +01:00
/// Returns true if the type is a subtype of boolean(it could be a singleton). Behaves like Type::isBoolean()
bool isSubtypeOfBooleans() const;
2023-07-07 18:14:35 +01:00
/// Returns true if this type should result in error suppressing behavior.
bool shouldSuppressErrors() const;
2023-07-28 12:37:00 +01:00
/// Returns true if this type contains the primitve top table type, `table`.
bool hasTopTable() const;
2023-06-09 13:20:36 +01:00
// Helpers that improve readability of the above (they just say if the component is present)
bool hasTops() const;
bool hasBooleans() const;
bool hasClasses() const;
bool hasErrors() const;
bool hasNils() const;
bool hasNumbers() const;
bool hasStrings() const;
bool hasThreads() const;
2023-11-10 18:05:48 +00:00
bool hasBuffers() const;
2023-06-09 13:20:36 +01:00
bool hasTables() const;
bool hasFunctions() const;
bool hasTyvars() const;
2024-03-08 23:57:12 +00:00
bool isFalsy() const;
bool isTruthy() const;
2022-10-07 00:55:58 +01:00
};
2023-05-19 19:59:59 +01:00
2024-10-25 17:46:08 +01:00
using SeenTablePropPairs = Set<std::pair<TypeId, TypeId>, TypeIdPairHash>;
2023-05-19 19:59:59 +01:00
2022-10-07 00:55:58 +01:00
class Normalizer
{
2024-04-12 11:44:40 +01:00
std::unordered_map<TypeId, std::shared_ptr<NormalizedType>> cachedNormals;
2022-10-07 00:55:58 +01:00
std::unordered_map<const TypeIds*, TypeId> cachedIntersections;
std::unordered_map<const TypeIds*, TypeId> cachedUnions;
std::unordered_map<const TypeIds*, std::unique_ptr<TypeIds>> cachedTypeIds;
2023-05-25 21:46:51 +01:00
DenseHashMap<TypeId, bool> cachedIsInhabited{nullptr};
DenseHashMap<std::pair<TypeId, TypeId>, bool, TypeIdPairHash> cachedIsInhabitedIntersection{{nullptr, nullptr}};
2022-10-07 00:55:58 +01:00
bool withinResourceLimits();
public:
TypeArena* arena;
2023-01-03 17:33:19 +00:00
NotNull<BuiltinTypes> builtinTypes;
2022-10-07 00:55:58 +01:00
NotNull<UnifierSharedState> sharedState;
2023-05-25 21:46:51 +01:00
bool cacheInhabitance = false;
2022-10-07 00:55:58 +01:00
2023-05-25 21:46:51 +01:00
Normalizer(TypeArena* arena, NotNull<BuiltinTypes> builtinTypes, NotNull<UnifierSharedState> sharedState, bool cacheInhabitance = false);
2022-10-07 00:55:58 +01:00
Normalizer(const Normalizer&) = delete;
Normalizer(Normalizer&&) = delete;
Normalizer() = delete;
~Normalizer() = default;
Normalizer& operator=(Normalizer&&) = delete;
Normalizer& operator=(Normalizer&) = delete;
// If this returns null, the typechecker should emit a "too complex" error
2024-04-12 11:44:40 +01:00
std::shared_ptr<const NormalizedType> normalize(TypeId ty);
2022-10-07 00:55:58 +01:00
void clearNormal(NormalizedType& norm);
// ------- Cached TypeIds
TypeId unionType(TypeId here, TypeId there);
TypeId intersectionType(TypeId here, TypeId there);
const TypeIds* cacheTypeIds(TypeIds tys);
void clearCaches();
// ------- Normalizing unions
void unionTysWithTy(TypeIds& here, TypeId there);
TypeId unionOfTops(TypeId here, TypeId there);
TypeId unionOfBools(TypeId here, TypeId there);
void unionClassesWithClass(TypeIds& heres, TypeId there);
void unionClasses(TypeIds& heres, const TypeIds& theres);
2023-01-03 17:33:19 +00:00
void unionClassesWithClass(NormalizedClassType& heres, TypeId there);
void unionClasses(NormalizedClassType& heres, const NormalizedClassType& theres);
2022-10-07 00:55:58 +01:00
void unionStrings(NormalizedStringType& here, const NormalizedStringType& there);
std::optional<TypePackId> unionOfTypePacks(TypePackId here, TypePackId there);
std::optional<TypeId> unionOfFunctions(TypeId here, TypeId there);
std::optional<TypeId> unionSaturatedFunctions(TypeId here, TypeId there);
void unionFunctionsWithFunction(NormalizedFunctionType& heress, TypeId there);
void unionFunctions(NormalizedFunctionType& heress, const NormalizedFunctionType& theress);
void unionTablesWithTable(TypeIds& heres, TypeId there);
void unionTables(TypeIds& heres, const TypeIds& theres);
2024-04-05 18:41:05 +01:00
NormalizationResult unionNormals(NormalizedType& here, const NormalizedType& there, int ignoreSmallerTyvars = -1);
2024-10-25 17:46:08 +01:00
NormalizationResult unionNormalWithTy(
NormalizedType& here,
TypeId there,
SeenTablePropPairs& seenTablePropPairs,
Set<TypeId>& seenSetTypes,
int ignoreSmallerTyvars = -1
);
2022-10-07 00:55:58 +01:00
2022-10-27 23:22:49 +01:00
// ------- Negations
2022-11-04 17:02:37 +00:00
std::optional<NormalizedType> negateNormal(const NormalizedType& here);
2022-10-27 23:22:49 +01:00
TypeIds negateAll(const TypeIds& theres);
TypeId negate(TypeId there);
void subtractPrimitive(NormalizedType& here, TypeId ty);
void subtractSingleton(NormalizedType& here, TypeId ty);
2024-05-10 17:17:09 +01:00
NormalizationResult intersectNormalWithNegationTy(TypeId toNegate, NormalizedType& intersect);
2022-10-27 23:22:49 +01:00
2022-10-07 00:55:58 +01:00
// ------- Normalizing intersections
TypeId intersectionOfTops(TypeId here, TypeId there);
TypeId intersectionOfBools(TypeId here, TypeId there);
2023-01-03 17:33:19 +00:00
void intersectClasses(NormalizedClassType& heres, const NormalizedClassType& theres);
void intersectClassesWithClass(NormalizedClassType& heres, TypeId there);
2022-10-07 00:55:58 +01:00
void intersectStrings(NormalizedStringType& here, const NormalizedStringType& there);
std::optional<TypePackId> intersectionOfTypePacks(TypePackId here, TypePackId there);
2024-10-25 17:46:08 +01:00
std::optional<TypeId> intersectionOfTables(TypeId here, TypeId there, SeenTablePropPairs& seenTablePropPairs, Set<TypeId>& seenSet);
void intersectTablesWithTable(TypeIds& heres, TypeId there, SeenTablePropPairs& seenTablePropPairs, Set<TypeId>& seenSetTypes);
2022-10-07 00:55:58 +01:00
void intersectTables(TypeIds& heres, const TypeIds& theres);
std::optional<TypeId> intersectionOfFunctions(TypeId here, TypeId there);
void intersectFunctionsWithFunction(NormalizedFunctionType& heress, TypeId there);
void intersectFunctions(NormalizedFunctionType& heress, const NormalizedFunctionType& theress);
2024-10-25 17:46:08 +01:00
NormalizationResult intersectTyvarsWithTy(
NormalizedTyvars& here,
TypeId there,
SeenTablePropPairs& seenTablePropPairs,
Set<TypeId>& seenSetTypes
);
2024-04-05 18:41:05 +01:00
NormalizationResult intersectNormals(NormalizedType& here, const NormalizedType& there, int ignoreSmallerTyvars = -1);
2024-10-25 17:46:08 +01:00
NormalizationResult intersectNormalWithTy(NormalizedType& here, TypeId there, SeenTablePropPairs& seenTablePropPairs, Set<TypeId>& seenSetTypes);
NormalizationResult normalizeIntersections(
const std::vector<TypeId>& intersections,
NormalizedType& outType,
SeenTablePropPairs& seenTablePropPairs,
Set<TypeId>& seenSet
);
2022-10-07 00:55:58 +01:00
2022-12-02 10:46:05 +00:00
// Check for inhabitance
2024-04-05 18:41:05 +01:00
NormalizationResult isInhabited(TypeId ty);
NormalizationResult isInhabited(TypeId ty, Set<TypeId>& seen);
NormalizationResult isInhabited(const NormalizedType* norm);
NormalizationResult isInhabited(const NormalizedType* norm, Set<TypeId>& seen);
2023-05-25 21:46:51 +01:00
2023-04-28 12:55:55 +01:00
// Check for intersections being inhabited
2024-04-05 18:41:05 +01:00
NormalizationResult isIntersectionInhabited(TypeId left, TypeId right);
2024-10-25 17:46:08 +01:00
NormalizationResult isIntersectionInhabited(TypeId left, TypeId right, SeenTablePropPairs& seenTablePropPairs, Set<TypeId>& seenSet);
2022-12-02 10:46:05 +00:00
2022-10-07 00:55:58 +01:00
// -------- Convert back from a normalized type to a type
TypeId typeFromNormal(const NormalizedType& norm);
};
2022-04-14 22:57:15 +01:00
} // namespace Luau