#pragma once #include "jit.h" #include "types.h" #include "stats.h" // To do: get cmake to define these.. #define ASMJIT_BUILD_EMBED #define ASMJIT_STATIC #include #include #include #include extern cycle_t VMCycles[10]; extern int VMCalls[10]; #define A (pc[0].a) #define B (pc[0].b) #define C (pc[0].c) #define Cs (pc[0].cs) #define BC (pc[0].i16u) #define BCs (pc[0].i16) #define ABCs (pc[0].i24) #define JMPOFS(x) ((x)->i24) struct JitLineInfo { ptrdiff_t InstructionIndex = 0; int32_t LineNumber = -1; asmjit::Label Label; }; class JitCompiler { public: JitCompiler(asmjit::CodeHolder *code, VMScriptFunction *sfunc) : cc(code), sfunc(sfunc) { } asmjit::CCFunc *Codegen(); VMScriptFunction *GetScriptFunction() { return sfunc; } TArray LineInfo; private: // Declare EmitXX functions for the opcodes: #define xx(op, name, mode, alt, kreg, ktype) void Emit##op(); #include "vmops.h" #undef xx asmjit::FuncSignature CreateFuncSignature(); void Setup(); void CreateRegisters(); void IncrementVMCalls(); void SetupFrame(); void SetupSimpleFrame(); void SetupFullVMFrame(); void BindLabels(); void EmitOpcode(); void EmitPopFrame(); void EmitNativeCall(VMNativeFunction *target); void EmitVMCall(asmjit::X86Gp ptr, VMFunction *target); void EmitVtbl(const VMOP *op); int StoreCallParams(); void LoadInOuts(); void LoadReturns(const VMOP *retval, int numret); void FillReturns(const VMOP *retval, int numret); void LoadCallResult(int type, int regnum, bool addrof); template void EmitComparisonOpcode(Func jmpFunc) { using namespace asmjit; int i = (int)(ptrdiff_t)(pc - sfunc->Code); auto successLabel = cc.newLabel(); auto failLabel = GetLabel(i + 2 + JMPOFS(pc + 1)); jmpFunc(static_cast(A & CMP_CHECK), failLabel, successLabel); cc.bind(successLabel); pc++; // This instruction uses two instruction slots - skip the next one } template void EmitVectorComparison(bool check, asmjit::Label& fail, asmjit::Label& success) { bool approx = static_cast(A & CMP_APPROX); if (!approx) { for (int i = 0; i < N; i++) { cc.ucomisd(regF[B + i], regF[C + i]); if (check) { cc.jp(success); if (i == (N - 1)) { cc.je(fail); } else { cc.jne(success); } } else { cc.jp(fail); cc.jne(fail); } } } else { auto tmp = newTempXmmSd(); const int64_t absMaskInt = 0x7FFFFFFFFFFFFFFF; auto absMask = cc.newDoubleConst(asmjit::kConstScopeLocal, reinterpret_cast(absMaskInt)); auto absMaskXmm = newTempXmmPd(); auto epsilon = cc.newDoubleConst(asmjit::kConstScopeLocal, VM_EPSILON); auto epsilonXmm = newTempXmmSd(); for (int i = 0; i < N; i++) { cc.movsd(tmp, regF[B + i]); cc.subsd(tmp, regF[C + i]); cc.movsd(absMaskXmm, absMask); cc.andpd(tmp, absMaskXmm); cc.movsd(epsilonXmm, epsilon); cc.ucomisd(epsilonXmm, tmp); if (check) { cc.jp(success); if (i == (N - 1)) { cc.ja(fail); } else { cc.jna(success); } } else { cc.jp(fail); cc.jna(fail); } } } } static uint64_t ToMemAddress(const void *d) { return (uint64_t)(ptrdiff_t)d; } void CallSqrt(const asmjit::X86Xmm &a, const asmjit::X86Xmm &b); static void CallAssignString(FString* to, FString* from) { *to = *from; } template asmjit::CCFuncCall *CreateCall(RetType(*func)(P1 p1)) { return cc.call(asmjit::imm_ptr(reinterpret_cast(static_cast(func))), asmjit::FuncSignature1()); } template asmjit::CCFuncCall *CreateCall(RetType(*func)(P1 p1, P2 p2)) { return cc.call(asmjit::imm_ptr(reinterpret_cast(static_cast(func))), asmjit::FuncSignature2()); } template asmjit::CCFuncCall *CreateCall(RetType(*func)(P1 p1, P2 p2, P3 p3)) { return cc.call(asmjit::imm_ptr(reinterpret_cast(static_cast(func))), asmjit::FuncSignature3()); } template asmjit::CCFuncCall *CreateCall(RetType(*func)(P1 p1, P2 p2, P3 p3, P4 p4)) { return cc.call(asmjit::imm_ptr(reinterpret_cast(static_cast(func))), asmjit::FuncSignature4()); } template asmjit::CCFuncCall *CreateCall(RetType(*func)(P1 p1, P2 p2, P3 p3, P4 p4, P5 p5)) { return cc.call(asmjit::imm_ptr(reinterpret_cast(static_cast(func))), asmjit::FuncSignature5()); } template asmjit::CCFuncCall *CreateCall(RetType(*func)(P1 p1, P2 p2, P3 p3, P4 p4, P5 p5, P6 p6)) { return cc.call(asmjit::imm_ptr(reinterpret_cast(static_cast(func))), asmjit::FuncSignature6()); } template asmjit::CCFuncCall* CreateCall(RetType(*func)(P1 p1, P2 p2, P3 p3, P4 p4, P5 p5, P6 p6, P7 p7)) { return cc.call(asmjit::imm_ptr(reinterpret_cast(static_cast(func))), asmjit::FuncSignature7()); } template asmjit::CCFuncCall* CreateCall(RetType(*func)(P1 p1, P2 p2, P3 p3, P4 p4, P5 p5, P6 p6, P7 p7, P8 p8)) { return cc.call(asmjit::imm_ptr(reinterpret_cast(static_cast(func))), asmjit::FuncSignature8()); } template asmjit::CCFuncCall* CreateCall(RetType(*func)(P1 p1, P2 p2, P3 p3, P4 p4, P5 p5, P6 p6, P7 p7, P8 p8, P9 p9)) { return cc.call(asmjit::imm_ptr(reinterpret_cast(static_cast(func))), asmjit::FuncSignature9()); } FString regname; size_t tmpPosInt32, tmpPosInt64, tmpPosIntPtr, tmpPosXmmSd, tmpPosXmmSs, tmpPosXmmPd, resultPosInt32, resultPosIntPtr, resultPosXmmSd; std::vector regTmpInt32, regTmpInt64, regTmpIntPtr, regResultInt32, regResultIntPtr; std::vector regTmpXmmSd, regTmpXmmSs, regTmpXmmPd, regResultXmmSd; void ResetTemp() { tmpPosInt32 = 0; tmpPosInt64 = 0; tmpPosIntPtr = 0; tmpPosXmmSd = 0; tmpPosXmmSs = 0; tmpPosXmmPd = 0; resultPosInt32 = 0; resultPosIntPtr = 0; resultPosXmmSd = 0; } template T newTempRegister(std::vector &tmpVector, size_t &tmpPos, const char *name, NewFunc newCallback) { if (tmpPos == tmpVector.size()) { regname.Format("%s%d", name, (int)tmpVector.size()); tmpVector.push_back(newCallback(regname.GetChars())); } return tmpVector[tmpPos++]; } asmjit::X86Gp newTempInt32() { return newTempRegister(regTmpInt32, tmpPosInt32, "tmpDword", [&](const char *name) { return cc.newInt32(name); }); } asmjit::X86Gp newTempInt64() { return newTempRegister(regTmpInt64, tmpPosInt64, "tmpQword", [&](const char *name) { return cc.newInt64(name); }); } asmjit::X86Gp newTempIntPtr() { return newTempRegister(regTmpIntPtr, tmpPosIntPtr, "tmpPtr", [&](const char *name) { return cc.newIntPtr(name); }); } asmjit::X86Xmm newTempXmmSd() { return newTempRegister(regTmpXmmSd, tmpPosXmmSd, "tmpXmmSd", [&](const char *name) { return cc.newXmmSd(name); }); } asmjit::X86Xmm newTempXmmSs() { return newTempRegister(regTmpXmmSs, tmpPosXmmSs, "tmpXmmSs", [&](const char *name) { return cc.newXmmSs(name); }); } asmjit::X86Xmm newTempXmmPd() { return newTempRegister(regTmpXmmPd, tmpPosXmmPd, "tmpXmmPd", [&](const char *name) { return cc.newXmmPd(name); }); } asmjit::X86Gp newResultInt32() { return newTempRegister(regResultInt32, resultPosInt32, "resultDword", [&](const char *name) { return cc.newInt32(name); }); } asmjit::X86Gp newResultIntPtr() { return newTempRegister(regResultIntPtr, resultPosIntPtr, "resultPtr", [&](const char *name) { return cc.newIntPtr(name); }); } asmjit::X86Xmm newResultXmmSd() { return newTempRegister(regResultXmmSd, resultPosXmmSd, "resultXmmSd", [&](const char *name) { return cc.newXmmSd(name); }); } void EmitReadBarrier(); void EmitNullPointerThrow(int index, EVMAbortException reason); void EmitThrowException(EVMAbortException reason); asmjit::Label EmitThrowExceptionLabel(EVMAbortException reason); static void ThrowArrayOutOfBounds(int index, int size); static void ThrowException(int reason); asmjit::X86Gp CheckRegD(int r0, int r1); asmjit::X86Xmm CheckRegF(int r0, int r1); asmjit::X86Xmm CheckRegF(int r0, int r1, int r2); asmjit::X86Xmm CheckRegF(int r0, int r1, int r2, int r3); asmjit::X86Xmm CheckRegF(int r0, int r1, int r2, int r3, int r4); asmjit::X86Gp CheckRegS(int r0, int r1); asmjit::X86Gp CheckRegA(int r0, int r1); asmjit::X86Compiler cc; VMScriptFunction *sfunc; asmjit::CCFunc *func = nullptr; asmjit::X86Gp args; asmjit::X86Gp numargs; asmjit::X86Gp ret; asmjit::X86Gp numret; asmjit::X86Gp stack; int offsetParams; int offsetF; int offsetS; int offsetA; int offsetD; int offsetExtra; TArray ParamOpcodes; void CheckVMFrame(); asmjit::X86Gp GetCallReturns(); bool vmframeAllocated = false; asmjit::CBNode *vmframeCursor = nullptr; asmjit::X86Gp vmframe; bool callReturnsAllocated = false; asmjit::CBNode *callReturnsCursor = nullptr; asmjit::X86Gp callReturns; const int *konstd; const double *konstf; const FString *konsts; const FVoidObj *konsta; TArray regD; TArray regF; TArray regA; TArray regS; struct OpcodeLabel { asmjit::CBNode *cursor = nullptr; asmjit::Label label; bool inUse = false; }; asmjit::Label GetLabel(size_t pos) { auto &label = labels[pos]; if (!label.inUse) { label.label = cc.newLabel(); label.inUse = true; } return label.label; } TArray labels; // Get temporary storage enough for DVector4 which is required by operation such as MULQQ and MULQV3 bool vectorStackAllocated = false; asmjit::X86Mem vectorStack; asmjit::X86Mem GetTemporaryVectorStackStorage() { if (!vectorStackAllocated) { vectorStack = cc.newStack(sizeof(DVector4), alignof(DVector4), "tmpDVector4"); vectorStackAllocated = true; } return vectorStack; } const VMOP *pc; VM_UBYTE op; }; class AsmJitException : public std::exception { public: AsmJitException(asmjit::Error error, const char *message) noexcept : error(error), message(message) { } const char* what() const noexcept override { return message.GetChars(); } asmjit::Error error; FString message; }; class ThrowingErrorHandler : public asmjit::ErrorHandler { public: bool handleError(asmjit::Error err, const char *message, asmjit::CodeEmitter *origin) override { throw AsmJitException(err, message); } }; void *AddJitFunction(asmjit::CodeHolder* code, JitCompiler *compiler); asmjit::CodeInfo GetHostCodeInfo();