2021-10-30 04:25:12 +08:00
|
|
|
// This file is part of the Luau programming language and is licensed under MIT License; see LICENSE.txt for details
|
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#include "Luau/Bytecode.h"
|
|
|
|
#include "Luau/DenseHash.h"
|
2022-04-22 05:04:22 +08:00
|
|
|
#include "Luau/StringUtils.h"
|
2021-10-30 04:25:12 +08:00
|
|
|
|
|
|
|
#include <string>
|
|
|
|
|
|
|
|
namespace Luau
|
|
|
|
{
|
|
|
|
|
|
|
|
class BytecodeEncoder
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
virtual ~BytecodeEncoder() {}
|
|
|
|
|
2023-08-19 01:06:29 +08:00
|
|
|
virtual void encode(uint32_t* data, size_t count) = 0;
|
2021-10-30 04:25:12 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
class BytecodeBuilder
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
// BytecodeBuilder does *not* copy the data passed via StringRef; instead, it keeps the ref around until finalize()
|
|
|
|
// Please be careful with the lifetime of the data that's being passed because of this.
|
|
|
|
// The safe and correct pattern is to only build StringRefs out of pieces of AST (AstName or AstArray<>) that are backed by AstAllocator.
|
|
|
|
// Note that you must finalize() the builder before the Allocator backing the Ast is destroyed.
|
|
|
|
struct StringRef
|
|
|
|
{
|
|
|
|
// To construct a StringRef, use sref() from Compiler.cpp.
|
|
|
|
const char* data = nullptr;
|
|
|
|
size_t length = 0;
|
|
|
|
|
|
|
|
bool operator==(const StringRef& other) const;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct TableShape
|
|
|
|
{
|
|
|
|
static const unsigned int kMaxLength = 32;
|
|
|
|
|
|
|
|
int32_t keys[kMaxLength];
|
|
|
|
unsigned int length = 0;
|
|
|
|
|
|
|
|
bool operator==(const TableShape& other) const;
|
|
|
|
};
|
|
|
|
|
|
|
|
BytecodeBuilder(BytecodeEncoder* encoder = 0);
|
|
|
|
|
|
|
|
uint32_t beginFunction(uint8_t numparams, bool isvararg = false);
|
2023-07-14 23:57:16 +08:00
|
|
|
void endFunction(uint8_t maxstacksize, uint8_t numupvalues, uint8_t flags = 0);
|
2021-10-30 04:25:12 +08:00
|
|
|
|
|
|
|
void setMainFunction(uint32_t fid);
|
|
|
|
|
|
|
|
int32_t addConstantNil();
|
|
|
|
int32_t addConstantBoolean(bool value);
|
|
|
|
int32_t addConstantNumber(double value);
|
2023-12-02 10:04:44 +08:00
|
|
|
int32_t addConstantVector(float x, float y, float z, float w);
|
2021-10-30 04:25:12 +08:00
|
|
|
int32_t addConstantString(StringRef value);
|
|
|
|
int32_t addImport(uint32_t iid);
|
|
|
|
int32_t addConstantTable(const TableShape& shape);
|
|
|
|
int32_t addConstantClosure(uint32_t fid);
|
|
|
|
|
|
|
|
int16_t addChildFunction(uint32_t fid);
|
|
|
|
|
|
|
|
void emitABC(LuauOpcode op, uint8_t a, uint8_t b, uint8_t c);
|
|
|
|
void emitAD(LuauOpcode op, uint8_t a, int16_t d);
|
|
|
|
void emitE(LuauOpcode op, int32_t e);
|
|
|
|
void emitAux(uint32_t aux);
|
|
|
|
|
|
|
|
size_t emitLabel();
|
|
|
|
|
|
|
|
[[nodiscard]] bool patchJumpD(size_t jumpLabel, size_t targetLabel);
|
|
|
|
[[nodiscard]] bool patchSkipC(size_t jumpLabel, size_t targetLabel);
|
|
|
|
|
|
|
|
void foldJumps();
|
|
|
|
void expandJumps();
|
|
|
|
|
2023-06-17 01:01:18 +08:00
|
|
|
void setFunctionTypeInfo(std::string value);
|
2024-04-26 04:57:23 +08:00
|
|
|
void pushLocalTypeInfo(LuauBytecodeType type, uint8_t reg, uint32_t startpc, uint32_t endpc);
|
|
|
|
void pushUpvalTypeInfo(LuauBytecodeType type);
|
2023-06-17 01:01:18 +08:00
|
|
|
|
2024-06-01 01:46:33 +08:00
|
|
|
uint32_t addUserdataType(const char* name);
|
|
|
|
void useUserdataType(uint32_t index);
|
|
|
|
|
2021-10-30 04:25:12 +08:00
|
|
|
void setDebugFunctionName(StringRef name);
|
2022-01-07 06:10:07 +08:00
|
|
|
void setDebugFunctionLineDefined(int line);
|
2021-10-30 04:25:12 +08:00
|
|
|
void setDebugLine(int line);
|
|
|
|
void pushDebugLocal(StringRef name, uint8_t reg, uint32_t startpc, uint32_t endpc);
|
|
|
|
void pushDebugUpval(StringRef name);
|
2023-04-28 19:55:55 +08:00
|
|
|
|
|
|
|
size_t getInstructionCount() const;
|
2023-11-04 03:47:28 +08:00
|
|
|
size_t getTotalInstructionCount() const;
|
2021-10-30 04:25:12 +08:00
|
|
|
uint32_t getDebugPC() const;
|
|
|
|
|
2022-04-22 05:04:22 +08:00
|
|
|
void addDebugRemark(const char* format, ...) LUAU_PRINTF_ATTR(2, 3);
|
|
|
|
|
2021-10-30 04:25:12 +08:00
|
|
|
void finalize();
|
|
|
|
|
|
|
|
enum DumpFlags
|
|
|
|
{
|
|
|
|
Dump_Code = 1 << 0,
|
|
|
|
Dump_Lines = 1 << 1,
|
|
|
|
Dump_Source = 1 << 2,
|
|
|
|
Dump_Locals = 1 << 3,
|
2022-04-22 05:04:22 +08:00
|
|
|
Dump_Remarks = 1 << 4,
|
2024-04-26 04:57:23 +08:00
|
|
|
Dump_Types = 1 << 5,
|
2021-10-30 04:25:12 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
void setDumpFlags(uint32_t flags)
|
|
|
|
{
|
|
|
|
dumpFlags = flags;
|
|
|
|
dumpFunctionPtr = &BytecodeBuilder::dumpCurrentFunction;
|
|
|
|
}
|
|
|
|
|
|
|
|
void setDumpSource(const std::string& source);
|
|
|
|
|
2022-10-14 06:59:53 +08:00
|
|
|
bool needsDebugRemarks() const
|
|
|
|
{
|
|
|
|
return (dumpFlags & Dump_Remarks) != 0;
|
|
|
|
}
|
|
|
|
|
2021-10-30 04:25:12 +08:00
|
|
|
const std::string& getBytecode() const
|
|
|
|
{
|
|
|
|
LUAU_ASSERT(!bytecode.empty()); // did you forget to call finalize?
|
|
|
|
return bytecode;
|
|
|
|
}
|
|
|
|
|
|
|
|
std::string dumpFunction(uint32_t id) const;
|
|
|
|
std::string dumpEverything() const;
|
2022-10-14 06:59:53 +08:00
|
|
|
std::string dumpSourceRemarks() const;
|
2023-06-17 01:01:18 +08:00
|
|
|
std::string dumpTypeInfo() const;
|
2021-10-30 04:25:12 +08:00
|
|
|
|
2022-10-28 06:22:49 +08:00
|
|
|
void annotateInstruction(std::string& result, uint32_t fid, uint32_t instpos) const;
|
2022-10-22 01:33:43 +08:00
|
|
|
|
2021-10-30 04:25:12 +08:00
|
|
|
static uint32_t getImportId(int32_t id0);
|
|
|
|
static uint32_t getImportId(int32_t id0, int32_t id1);
|
|
|
|
static uint32_t getImportId(int32_t id0, int32_t id1, int32_t id2);
|
|
|
|
|
2023-01-14 04:36:28 +08:00
|
|
|
static int decomposeImportId(uint32_t ids, int32_t& id0, int32_t& id1, int32_t& id2);
|
|
|
|
|
2021-10-30 04:25:12 +08:00
|
|
|
static uint32_t getStringHash(StringRef key);
|
|
|
|
|
|
|
|
static std::string getError(const std::string& message);
|
|
|
|
|
2022-06-24 09:44:07 +08:00
|
|
|
static uint8_t getVersion();
|
2023-06-17 01:01:18 +08:00
|
|
|
static uint8_t getTypeEncodingVersion();
|
2022-06-24 09:44:07 +08:00
|
|
|
|
2021-10-30 04:25:12 +08:00
|
|
|
private:
|
|
|
|
struct Constant
|
|
|
|
{
|
|
|
|
enum Type
|
|
|
|
{
|
|
|
|
Type_Nil,
|
|
|
|
Type_Boolean,
|
|
|
|
Type_Number,
|
2023-12-02 10:04:44 +08:00
|
|
|
Type_Vector,
|
2021-10-30 04:25:12 +08:00
|
|
|
Type_String,
|
|
|
|
Type_Import,
|
|
|
|
Type_Table,
|
|
|
|
Type_Closure,
|
|
|
|
};
|
|
|
|
|
|
|
|
Type type;
|
|
|
|
union
|
|
|
|
{
|
|
|
|
bool valueBoolean;
|
|
|
|
double valueNumber;
|
2023-12-02 10:04:44 +08:00
|
|
|
float valueVector[4];
|
2021-10-30 04:25:12 +08:00
|
|
|
unsigned int valueString; // index into string table
|
|
|
|
uint32_t valueImport; // 10-10-10-2 encoded import id
|
|
|
|
uint32_t valueTable; // index into tableShapes[]
|
|
|
|
uint32_t valueClosure; // index of function in global list
|
|
|
|
};
|
|
|
|
};
|
|
|
|
|
|
|
|
struct ConstantKey
|
|
|
|
{
|
|
|
|
Constant::Type type;
|
2023-12-02 10:04:44 +08:00
|
|
|
// Note: this stores value* from Constant; when type is Type_Number, this stores the same bits as double does but in uint64_t.
|
|
|
|
// For Type_Vector, x and y are stored in 'value' and z and w are stored in 'extra'.
|
2021-10-30 04:25:12 +08:00
|
|
|
uint64_t value;
|
2023-12-02 10:04:44 +08:00
|
|
|
uint64_t extra = 0;
|
2021-10-30 04:25:12 +08:00
|
|
|
|
|
|
|
bool operator==(const ConstantKey& key) const
|
|
|
|
{
|
2023-12-02 10:04:44 +08:00
|
|
|
return type == key.type && value == key.value && extra == key.extra;
|
2021-10-30 04:25:12 +08:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
struct Function
|
|
|
|
{
|
|
|
|
std::string data;
|
|
|
|
|
|
|
|
uint8_t maxstacksize = 0;
|
|
|
|
uint8_t numparams = 0;
|
|
|
|
uint8_t numupvalues = 0;
|
|
|
|
bool isvararg = false;
|
|
|
|
|
|
|
|
unsigned int debugname = 0;
|
2022-01-07 06:10:07 +08:00
|
|
|
int debuglinedefined = 0;
|
2021-10-30 04:25:12 +08:00
|
|
|
|
|
|
|
std::string dump;
|
|
|
|
std::string dumpname;
|
2022-10-22 01:33:43 +08:00
|
|
|
std::vector<int> dumpinstoffs;
|
2023-06-17 01:01:18 +08:00
|
|
|
std::string typeinfo;
|
2021-10-30 04:25:12 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct DebugLocal
|
|
|
|
{
|
|
|
|
unsigned int name;
|
|
|
|
|
|
|
|
uint8_t reg;
|
|
|
|
uint32_t startpc;
|
|
|
|
uint32_t endpc;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct DebugUpval
|
|
|
|
{
|
|
|
|
unsigned int name;
|
|
|
|
};
|
|
|
|
|
2024-04-26 04:57:23 +08:00
|
|
|
struct TypedLocal
|
|
|
|
{
|
|
|
|
LuauBytecodeType type;
|
|
|
|
uint8_t reg;
|
|
|
|
uint32_t startpc;
|
|
|
|
uint32_t endpc;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct TypedUpval
|
|
|
|
{
|
|
|
|
LuauBytecodeType type;
|
|
|
|
};
|
|
|
|
|
2024-06-01 01:46:33 +08:00
|
|
|
struct UserdataType
|
|
|
|
{
|
|
|
|
std::string name;
|
|
|
|
uint32_t nameRef = 0;
|
|
|
|
bool used = false;
|
|
|
|
};
|
|
|
|
|
2021-10-30 04:25:12 +08:00
|
|
|
struct Jump
|
|
|
|
{
|
|
|
|
uint32_t source;
|
|
|
|
uint32_t target;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct StringRefHash
|
|
|
|
{
|
|
|
|
size_t operator()(const StringRef& v) const;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct ConstantKeyHash
|
|
|
|
{
|
|
|
|
size_t operator()(const ConstantKey& key) const;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct TableShapeHash
|
|
|
|
{
|
|
|
|
size_t operator()(const TableShape& v) const;
|
|
|
|
};
|
|
|
|
|
|
|
|
std::vector<Function> functions;
|
|
|
|
uint32_t currentFunction = ~0u;
|
|
|
|
uint32_t mainFunction = ~0u;
|
|
|
|
|
2023-11-04 03:47:28 +08:00
|
|
|
size_t totalInstructionCount = 0;
|
2021-10-30 04:25:12 +08:00
|
|
|
std::vector<uint32_t> insns;
|
|
|
|
std::vector<int> lines;
|
|
|
|
std::vector<Constant> constants;
|
|
|
|
std::vector<uint32_t> protos;
|
|
|
|
std::vector<Jump> jumps;
|
|
|
|
|
|
|
|
std::vector<TableShape> tableShapes;
|
|
|
|
|
|
|
|
bool hasLongJumps = false;
|
|
|
|
|
|
|
|
DenseHashMap<ConstantKey, int32_t, ConstantKeyHash> constantMap;
|
|
|
|
DenseHashMap<TableShape, int32_t, TableShapeHash> tableShapeMap;
|
2022-05-20 07:46:52 +08:00
|
|
|
DenseHashMap<uint32_t, int16_t> protoMap;
|
2021-10-30 04:25:12 +08:00
|
|
|
|
|
|
|
int debugLine = 0;
|
|
|
|
|
|
|
|
std::vector<DebugLocal> debugLocals;
|
|
|
|
std::vector<DebugUpval> debugUpvals;
|
|
|
|
|
2024-04-26 04:57:23 +08:00
|
|
|
std::vector<TypedLocal> typedLocals;
|
|
|
|
std::vector<TypedUpval> typedUpvals;
|
|
|
|
|
2024-06-01 01:46:33 +08:00
|
|
|
std::vector<UserdataType> userdataTypes;
|
|
|
|
|
2021-10-30 04:25:12 +08:00
|
|
|
DenseHashMap<StringRef, unsigned int, StringRefHash> stringTable;
|
2023-01-14 04:36:28 +08:00
|
|
|
std::vector<StringRef> debugStrings;
|
2021-10-30 04:25:12 +08:00
|
|
|
|
2022-04-29 09:04:52 +08:00
|
|
|
std::vector<std::pair<uint32_t, uint32_t>> debugRemarks;
|
2022-04-22 05:04:22 +08:00
|
|
|
std::string debugRemarkBuffer;
|
|
|
|
|
2021-10-30 04:25:12 +08:00
|
|
|
BytecodeEncoder* encoder = nullptr;
|
|
|
|
std::string bytecode;
|
|
|
|
|
|
|
|
uint32_t dumpFlags = 0;
|
|
|
|
std::vector<std::string> dumpSource;
|
2022-10-14 06:59:53 +08:00
|
|
|
std::vector<std::pair<int, std::string>> dumpRemarks;
|
2021-10-30 04:25:12 +08:00
|
|
|
|
2024-04-26 04:57:23 +08:00
|
|
|
std::string tempTypeInfo;
|
|
|
|
|
2022-10-22 01:33:43 +08:00
|
|
|
std::string (BytecodeBuilder::*dumpFunctionPtr)(std::vector<int>&) const = nullptr;
|
2021-10-30 04:25:12 +08:00
|
|
|
|
|
|
|
void validate() const;
|
2022-10-22 01:33:43 +08:00
|
|
|
void validateInstructions() const;
|
|
|
|
void validateVariadic() const;
|
2021-10-30 04:25:12 +08:00
|
|
|
|
2022-10-22 01:33:43 +08:00
|
|
|
std::string dumpCurrentFunction(std::vector<int>& dumpinstoffs) const;
|
2023-01-14 04:36:28 +08:00
|
|
|
void dumpConstant(std::string& result, int k) const;
|
2022-05-27 04:33:48 +08:00
|
|
|
void dumpInstruction(const uint32_t* opcode, std::string& output, int targetLabel) const;
|
2021-10-30 04:25:12 +08:00
|
|
|
|
2024-04-26 04:57:23 +08:00
|
|
|
void writeFunction(std::string& ss, uint32_t id, uint8_t flags);
|
2021-10-30 04:25:12 +08:00
|
|
|
void writeLineInfo(std::string& ss) const;
|
|
|
|
void writeStringTable(std::string& ss) const;
|
|
|
|
|
|
|
|
int32_t addConstant(const ConstantKey& key, const Constant& value);
|
|
|
|
unsigned int addStringTableEntry(StringRef value);
|
2024-06-01 01:46:33 +08:00
|
|
|
|
|
|
|
const char* tryGetUserdataTypeName(LuauBytecodeType type) const;
|
2021-10-30 04:25:12 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
} // namespace Luau
|