mirror of
https://github.com/ZDoom/Raze.git
synced 2025-01-11 19:40:46 +00:00
6e49f0bf8f
Bone model support in GLES and ZScript quaternions.
609 lines
14 KiB
C++
609 lines
14 KiB
C++
|
|
#include "jit.h"
|
|
#include "jitintern.h"
|
|
#include "printf.h"
|
|
|
|
extern PString *TypeString;
|
|
extern PStruct *TypeVector2;
|
|
extern PStruct *TypeVector3;
|
|
extern PStruct* TypeVector4;
|
|
extern PStruct* TypeQuaternion;
|
|
extern PStruct* TypeFQuaternion;
|
|
|
|
static void OutputJitLog(const asmjit::StringLogger &logger);
|
|
|
|
JitFuncPtr JitCompile(VMScriptFunction *sfunc)
|
|
{
|
|
#if 0
|
|
if (strcmp(sfunc->PrintableName.GetChars(), "StatusScreen.drawNum") != 0)
|
|
return nullptr;
|
|
#endif
|
|
|
|
using namespace asmjit;
|
|
StringLogger logger;
|
|
try
|
|
{
|
|
ThrowingErrorHandler errorHandler;
|
|
CodeHolder code;
|
|
code.init(GetHostCodeInfo());
|
|
code.setErrorHandler(&errorHandler);
|
|
code.setLogger(&logger);
|
|
|
|
JitCompiler compiler(&code, sfunc);
|
|
return reinterpret_cast<JitFuncPtr>(AddJitFunction(&code, &compiler));
|
|
}
|
|
catch (const CRecoverableError &e)
|
|
{
|
|
OutputJitLog(logger);
|
|
Printf("%s: Unexpected JIT error: %s\n",sfunc->PrintableName.GetChars(), e.what());
|
|
return nullptr;
|
|
}
|
|
}
|
|
|
|
void JitDumpLog(FILE *file, VMScriptFunction *sfunc)
|
|
{
|
|
using namespace asmjit;
|
|
StringLogger logger;
|
|
try
|
|
{
|
|
ThrowingErrorHandler errorHandler;
|
|
CodeHolder code;
|
|
code.init(GetHostCodeInfo());
|
|
code.setErrorHandler(&errorHandler);
|
|
code.setLogger(&logger);
|
|
|
|
JitCompiler compiler(&code, sfunc);
|
|
compiler.Codegen();
|
|
|
|
fwrite(logger.getString(), logger.getLength(), 1, file);
|
|
}
|
|
catch (const std::exception &e)
|
|
{
|
|
fwrite(logger.getString(), logger.getLength(), 1, file);
|
|
|
|
FString err;
|
|
err.Format("Unexpected JIT error: %s\n", e.what());
|
|
fwrite(err.GetChars(), err.Len(), 1, file);
|
|
fclose(file);
|
|
|
|
I_FatalError("Unexpected JIT error: %s\n", e.what());
|
|
}
|
|
}
|
|
|
|
static void OutputJitLog(const asmjit::StringLogger &logger)
|
|
{
|
|
// Write line by line since I_FatalError seems to cut off long strings
|
|
const char *pos = logger.getString();
|
|
const char *end = pos;
|
|
while (*end)
|
|
{
|
|
if (*end == '\n')
|
|
{
|
|
FString substr(pos, (int)(ptrdiff_t)(end - pos));
|
|
Printf("%s\n", substr.GetChars());
|
|
pos = end + 1;
|
|
}
|
|
end++;
|
|
}
|
|
if (pos != end)
|
|
Printf("%s\n", pos);
|
|
}
|
|
|
|
/////////////////////////////////////////////////////////////////////////////
|
|
|
|
static const char *OpNames[NUM_OPS] =
|
|
{
|
|
#define xx(op, name, mode, alt, kreg, ktype) #op,
|
|
#include "vmops.h"
|
|
#undef xx
|
|
};
|
|
|
|
asmjit::CCFunc *JitCompiler::Codegen()
|
|
{
|
|
Setup();
|
|
|
|
int lastLine = -1;
|
|
|
|
pc = sfunc->Code;
|
|
auto end = pc + sfunc->CodeSize;
|
|
while (pc != end)
|
|
{
|
|
int i = (int)(ptrdiff_t)(pc - sfunc->Code);
|
|
op = pc->op;
|
|
|
|
int curLine = sfunc->PCToLine(pc);
|
|
if (curLine != lastLine)
|
|
{
|
|
lastLine = curLine;
|
|
|
|
auto label = cc.newLabel();
|
|
cc.bind(label);
|
|
|
|
JitLineInfo info;
|
|
info.Label = label;
|
|
info.LineNumber = curLine;
|
|
LineInfo.Push(info);
|
|
}
|
|
|
|
if (op != OP_PARAM && op != OP_PARAMI && op != OP_VTBL)
|
|
{
|
|
FString lineinfo;
|
|
lineinfo.Format("; line %d: %02x%02x%02x%02x %s", curLine, pc->op, pc->a, pc->b, pc->c, OpNames[op]);
|
|
cc.comment("", 0);
|
|
cc.comment(lineinfo.GetChars(), lineinfo.Len());
|
|
}
|
|
|
|
labels[i].cursor = cc.getCursor();
|
|
ResetTemp();
|
|
EmitOpcode();
|
|
|
|
pc++;
|
|
}
|
|
|
|
BindLabels();
|
|
|
|
cc.endFunc();
|
|
cc.finalize();
|
|
|
|
auto code = cc.getCode ();
|
|
for (unsigned int j = 0; j < LineInfo.Size (); j++)
|
|
{
|
|
auto info = LineInfo[j];
|
|
|
|
if (!code->isLabelValid (info.Label))
|
|
{
|
|
continue;
|
|
}
|
|
|
|
info.InstructionIndex = code->getLabelOffset (info.Label);
|
|
|
|
LineInfo[j] = info;
|
|
}
|
|
|
|
std::stable_sort(LineInfo.begin(), LineInfo.end(), [](const JitLineInfo &a, const JitLineInfo &b) { return a.InstructionIndex < b.InstructionIndex; });
|
|
|
|
return func;
|
|
}
|
|
|
|
void JitCompiler::EmitOpcode()
|
|
{
|
|
switch (op)
|
|
{
|
|
#define xx(op, name, mode, alt, kreg, ktype) case OP_##op: Emit##op(); break;
|
|
#include "vmops.h"
|
|
#undef xx
|
|
|
|
default:
|
|
I_FatalError("JIT error: Unknown VM opcode %d\n", op);
|
|
break;
|
|
}
|
|
}
|
|
|
|
void JitCompiler::BindLabels()
|
|
{
|
|
asmjit::CBNode *cursor = cc.getCursor();
|
|
unsigned int size = labels.Size();
|
|
for (unsigned int i = 0; i < size; i++)
|
|
{
|
|
const OpcodeLabel &label = labels[i];
|
|
if (label.inUse)
|
|
{
|
|
cc.setCursor(label.cursor);
|
|
cc.bind(label.label);
|
|
}
|
|
}
|
|
cc.setCursor(cursor);
|
|
}
|
|
|
|
void JitCompiler::CheckVMFrame()
|
|
{
|
|
if (!vmframeAllocated)
|
|
{
|
|
auto cursor = cc.getCursor();
|
|
cc.setCursor(vmframeCursor);
|
|
|
|
auto vmstack = cc.newStack(sfunc->StackSize, 16, "vmstack");
|
|
vmframe = cc.newIntPtr("vmframe");
|
|
cc.lea(vmframe, vmstack);
|
|
|
|
cc.setCursor(cursor);
|
|
vmframeAllocated = true;
|
|
}
|
|
}
|
|
|
|
asmjit::X86Gp JitCompiler::GetCallReturns()
|
|
{
|
|
if (!callReturnsAllocated)
|
|
{
|
|
auto cursor = cc.getCursor();
|
|
cc.setCursor(callReturnsCursor);
|
|
auto stackalloc = cc.newStack(sizeof(VMReturn) * MAX_RETURNS, alignof(VMReturn), "stackalloc");
|
|
callReturns = cc.newIntPtr("callReturns");
|
|
cc.lea(callReturns, stackalloc);
|
|
cc.setCursor(cursor);
|
|
callReturnsAllocated = true;
|
|
}
|
|
return callReturns;
|
|
}
|
|
|
|
void JitCompiler::Setup()
|
|
{
|
|
using namespace asmjit;
|
|
|
|
ResetTemp();
|
|
|
|
static const char *marks = "=======================================================";
|
|
cc.comment("", 0);
|
|
cc.comment(marks, 56);
|
|
|
|
FString funcname;
|
|
funcname.Format("Function: %s", sfunc->PrintableName.GetChars());
|
|
cc.comment(funcname.GetChars(), funcname.Len());
|
|
|
|
cc.comment(marks, 56);
|
|
cc.comment("", 0);
|
|
|
|
auto unusedFunc = cc.newIntPtr("func"); // VMFunction*
|
|
args = cc.newIntPtr("args"); // VMValue *params
|
|
numargs = cc.newInt32("numargs"); // int numargs
|
|
ret = cc.newIntPtr("ret"); // VMReturn *ret
|
|
numret = cc.newInt32("numret"); // int numret
|
|
|
|
func = cc.addFunc(FuncSignature5<int, VMFunction *, void *, int, void *, int>());
|
|
cc.setArg(0, unusedFunc);
|
|
cc.setArg(1, args);
|
|
cc.setArg(2, numargs);
|
|
cc.setArg(3, ret);
|
|
cc.setArg(4, numret);
|
|
|
|
callReturnsCursor = cc.getCursor();
|
|
|
|
konstd = sfunc->KonstD;
|
|
konstf = sfunc->KonstF;
|
|
konsts = sfunc->KonstS;
|
|
konsta = sfunc->KonstA;
|
|
|
|
labels.Resize(sfunc->CodeSize);
|
|
|
|
CreateRegisters();
|
|
IncrementVMCalls();
|
|
SetupFrame();
|
|
}
|
|
|
|
void JitCompiler::SetupFrame()
|
|
{
|
|
// the VM version reads this from the stack, but it is constant data
|
|
offsetParams = ((int)sizeof(VMFrame) + 15) & ~15;
|
|
offsetF = offsetParams + (int)(sfunc->MaxParam * sizeof(VMValue));
|
|
offsetS = offsetF + (int)(sfunc->NumRegF * sizeof(double));
|
|
offsetA = offsetS + (int)(sfunc->NumRegS * sizeof(FString));
|
|
offsetD = offsetA + (int)(sfunc->NumRegA * sizeof(void*));
|
|
offsetExtra = (offsetD + (int)(sfunc->NumRegD * sizeof(int32_t)) + 15) & ~15;
|
|
|
|
if (sfunc->SpecialInits.Size() == 0 && sfunc->NumRegS == 0 && sfunc->ExtraSpace == 0)
|
|
{
|
|
SetupSimpleFrame();
|
|
}
|
|
else
|
|
{
|
|
SetupFullVMFrame();
|
|
}
|
|
}
|
|
|
|
void JitCompiler::SetupSimpleFrame()
|
|
{
|
|
using namespace asmjit;
|
|
|
|
// This is a simple frame with no constructors or destructors. Allocate it on the stack ourselves.
|
|
|
|
vmframeCursor = cc.getCursor();
|
|
|
|
int argsPos = 0;
|
|
int regd = 0, regf = 0, rega = 0;
|
|
for (unsigned int i = 0; i < sfunc->Proto->ArgumentTypes.Size(); i++)
|
|
{
|
|
const PType *type = sfunc->Proto->ArgumentTypes[i];
|
|
if (sfunc->ArgFlags.Size() && sfunc->ArgFlags[i] & (VARF_Out | VARF_Ref))
|
|
{
|
|
cc.mov(regA[rega++], x86::ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, a)));
|
|
}
|
|
else if (type == TypeVector2 || type == TypeFVector2)
|
|
{
|
|
cc.movsd(regF[regf++], x86::qword_ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, f)));
|
|
cc.movsd(regF[regf++], x86::qword_ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, f)));
|
|
}
|
|
else if (type == TypeVector3 || type == TypeFVector3)
|
|
{
|
|
cc.movsd(regF[regf++], x86::qword_ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, f)));
|
|
cc.movsd(regF[regf++], x86::qword_ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, f)));
|
|
cc.movsd(regF[regf++], x86::qword_ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, f)));
|
|
}
|
|
else if (type == TypeVector4 || type == TypeFVector4 || type == TypeQuaternion || type == TypeFQuaternion)
|
|
{
|
|
cc.movsd(regF[regf++], x86::qword_ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, f)));
|
|
cc.movsd(regF[regf++], x86::qword_ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, f)));
|
|
cc.movsd(regF[regf++], x86::qword_ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, f)));
|
|
cc.movsd(regF[regf++], x86::qword_ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, f)));
|
|
}
|
|
else if (type == TypeFloat64)
|
|
{
|
|
cc.movsd(regF[regf++], x86::qword_ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, f)));
|
|
}
|
|
else if (type == TypeString)
|
|
{
|
|
I_FatalError("JIT: Strings are not supported yet for simple frames");
|
|
}
|
|
else if (type->isIntCompatible())
|
|
{
|
|
cc.mov(regD[regd++], x86::dword_ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, i)));
|
|
}
|
|
else
|
|
{
|
|
cc.mov(regA[rega++], x86::ptr(args, argsPos++ * sizeof(VMValue) + offsetof(VMValue, a)));
|
|
}
|
|
}
|
|
|
|
const char *errorDetails = nullptr;
|
|
|
|
if (sfunc->NumArgs != argsPos)
|
|
{
|
|
errorDetails = "arguments";
|
|
}
|
|
else if (regd > sfunc->NumRegD)
|
|
{
|
|
errorDetails = "integer registers";
|
|
}
|
|
else if (regf > sfunc->NumRegF)
|
|
{
|
|
errorDetails = "floating point registers";
|
|
}
|
|
else if (rega > sfunc->NumRegA)
|
|
{
|
|
errorDetails = "address registers";
|
|
}
|
|
|
|
if (errorDetails)
|
|
{
|
|
I_FatalError("JIT: inconsistent number of %s for function %s", errorDetails, sfunc->PrintableName.GetChars());
|
|
}
|
|
|
|
for (int i = regd; i < sfunc->NumRegD; i++)
|
|
cc.xor_(regD[i], regD[i]);
|
|
|
|
for (int i = regf; i < sfunc->NumRegF; i++)
|
|
cc.xorpd(regF[i], regF[i]);
|
|
|
|
for (int i = rega; i < sfunc->NumRegA; i++)
|
|
cc.xor_(regA[i], regA[i]);
|
|
}
|
|
|
|
static VMFrameStack *CreateFullVMFrame(VMScriptFunction *func, VMValue *args, int numargs)
|
|
{
|
|
VMFrameStack *stack = &GlobalVMStack;
|
|
VMFrame *newf = stack->AllocFrame(func);
|
|
VMFillParams(args, newf, numargs);
|
|
return stack;
|
|
}
|
|
|
|
void JitCompiler::SetupFullVMFrame()
|
|
{
|
|
using namespace asmjit;
|
|
|
|
stack = cc.newIntPtr("stack");
|
|
auto allocFrame = CreateCall<VMFrameStack *, VMScriptFunction *, VMValue *, int>(CreateFullVMFrame);
|
|
allocFrame->setRet(0, stack);
|
|
allocFrame->setArg(0, imm_ptr(sfunc));
|
|
allocFrame->setArg(1, args);
|
|
allocFrame->setArg(2, numargs);
|
|
|
|
vmframe = cc.newIntPtr("vmframe");
|
|
cc.mov(vmframe, x86::ptr(stack)); // stack->Blocks
|
|
cc.mov(vmframe, x86::ptr(vmframe, VMFrameStack::OffsetLastFrame())); // Blocks->LastFrame
|
|
vmframeAllocated = true;
|
|
|
|
for (int i = 0; i < sfunc->NumRegD; i++)
|
|
cc.mov(regD[i], x86::dword_ptr(vmframe, offsetD + i * sizeof(int32_t)));
|
|
|
|
for (int i = 0; i < sfunc->NumRegF; i++)
|
|
cc.movsd(regF[i], x86::qword_ptr(vmframe, offsetF + i * sizeof(double)));
|
|
|
|
for (int i = 0; i < sfunc->NumRegS; i++)
|
|
cc.lea(regS[i], x86::ptr(vmframe, offsetS + i * sizeof(FString)));
|
|
|
|
for (int i = 0; i < sfunc->NumRegA; i++)
|
|
cc.mov(regA[i], x86::ptr(vmframe, offsetA + i * sizeof(void*)));
|
|
}
|
|
|
|
static void PopFullVMFrame(VMFrameStack *stack)
|
|
{
|
|
stack->PopFrame();
|
|
}
|
|
|
|
void JitCompiler::EmitPopFrame()
|
|
{
|
|
if (sfunc->SpecialInits.Size() != 0 || sfunc->NumRegS != 0 || sfunc->ExtraSpace != 0)
|
|
{
|
|
auto popFrame = CreateCall<void, VMFrameStack *>(PopFullVMFrame);
|
|
popFrame->setArg(0, stack);
|
|
}
|
|
}
|
|
|
|
void JitCompiler::IncrementVMCalls()
|
|
{
|
|
// VMCalls[0]++
|
|
auto vmcallsptr = newTempIntPtr();
|
|
auto vmcalls = newTempInt32();
|
|
cc.mov(vmcallsptr, asmjit::imm_ptr(VMCalls));
|
|
cc.mov(vmcalls, asmjit::x86::dword_ptr(vmcallsptr));
|
|
cc.add(vmcalls, (int)1);
|
|
cc.mov(asmjit::x86::dword_ptr(vmcallsptr), vmcalls);
|
|
}
|
|
|
|
void JitCompiler::CreateRegisters()
|
|
{
|
|
regD.Resize(sfunc->NumRegD);
|
|
regF.Resize(sfunc->NumRegF);
|
|
regA.Resize(sfunc->NumRegA);
|
|
regS.Resize(sfunc->NumRegS);
|
|
|
|
for (int i = 0; i < sfunc->NumRegD; i++)
|
|
{
|
|
regname.Format("regD%d", i);
|
|
regD[i] = cc.newInt32(regname.GetChars());
|
|
}
|
|
|
|
for (int i = 0; i < sfunc->NumRegF; i++)
|
|
{
|
|
regname.Format("regF%d", i);
|
|
regF[i] = cc.newXmmSd(regname.GetChars());
|
|
}
|
|
|
|
for (int i = 0; i < sfunc->NumRegS; i++)
|
|
{
|
|
regname.Format("regS%d", i);
|
|
regS[i] = cc.newIntPtr(regname.GetChars());
|
|
}
|
|
|
|
for (int i = 0; i < sfunc->NumRegA; i++)
|
|
{
|
|
regname.Format("regA%d", i);
|
|
regA[i] = cc.newIntPtr(regname.GetChars());
|
|
}
|
|
}
|
|
|
|
void JitCompiler::EmitNullPointerThrow(int index, EVMAbortException reason)
|
|
{
|
|
auto label = EmitThrowExceptionLabel(reason);
|
|
cc.test(regA[index], regA[index]);
|
|
cc.je(label);
|
|
}
|
|
|
|
void JitCompiler::ThrowException(int reason)
|
|
{
|
|
ThrowAbortException((EVMAbortException)reason, nullptr);
|
|
}
|
|
|
|
void JitCompiler::EmitThrowException(EVMAbortException reason)
|
|
{
|
|
auto call = CreateCall<void, int>(&JitCompiler::ThrowException);
|
|
call->setArg(0, asmjit::imm(reason));
|
|
}
|
|
|
|
asmjit::Label JitCompiler::EmitThrowExceptionLabel(EVMAbortException reason)
|
|
{
|
|
auto label = cc.newLabel();
|
|
auto cursor = cc.getCursor();
|
|
cc.bind(label);
|
|
EmitThrowException(reason);
|
|
cc.setCursor(cursor);
|
|
|
|
JitLineInfo info;
|
|
info.Label = label;
|
|
info.LineNumber = sfunc->PCToLine(pc);
|
|
LineInfo.Push(info);
|
|
|
|
return label;
|
|
}
|
|
|
|
asmjit::X86Gp JitCompiler::CheckRegD(int r0, int r1)
|
|
{
|
|
if (r0 != r1)
|
|
{
|
|
return regD[r0];
|
|
}
|
|
else
|
|
{
|
|
auto copy = newTempInt32();
|
|
cc.mov(copy, regD[r0]);
|
|
return copy;
|
|
}
|
|
}
|
|
|
|
asmjit::X86Xmm JitCompiler::CheckRegF(int r0, int r1)
|
|
{
|
|
if (r0 != r1)
|
|
{
|
|
return regF[r0];
|
|
}
|
|
else
|
|
{
|
|
auto copy = newTempXmmSd();
|
|
cc.movsd(copy, regF[r0]);
|
|
return copy;
|
|
}
|
|
}
|
|
|
|
asmjit::X86Xmm JitCompiler::CheckRegF(int r0, int r1, int r2)
|
|
{
|
|
if (r0 != r1 && r0 != r2)
|
|
{
|
|
return regF[r0];
|
|
}
|
|
else
|
|
{
|
|
auto copy = newTempXmmSd();
|
|
cc.movsd(copy, regF[r0]);
|
|
return copy;
|
|
}
|
|
}
|
|
|
|
asmjit::X86Xmm JitCompiler::CheckRegF(int r0, int r1, int r2, int r3)
|
|
{
|
|
if (r0 != r1 && r0 != r2 && r0 != r3)
|
|
{
|
|
return regF[r0];
|
|
}
|
|
else
|
|
{
|
|
auto copy = newTempXmmSd();
|
|
cc.movsd(copy, regF[r0]);
|
|
return copy;
|
|
}
|
|
}
|
|
|
|
asmjit::X86Xmm JitCompiler::CheckRegF(int r0, int r1, int r2, int r3, int r4)
|
|
{
|
|
if (r0 != r1 && r0 != r2 && r0 != r3 && r0 != r4)
|
|
{
|
|
return regF[r0];
|
|
}
|
|
else
|
|
{
|
|
auto copy = newTempXmmSd();
|
|
cc.movsd(copy, regF[r0]);
|
|
return copy;
|
|
}
|
|
}
|
|
|
|
asmjit::X86Gp JitCompiler::CheckRegS(int r0, int r1)
|
|
{
|
|
if (r0 != r1)
|
|
{
|
|
return regS[r0];
|
|
}
|
|
else
|
|
{
|
|
auto copy = newTempIntPtr();
|
|
cc.mov(copy, regS[r0]);
|
|
return copy;
|
|
}
|
|
}
|
|
|
|
asmjit::X86Gp JitCompiler::CheckRegA(int r0, int r1)
|
|
{
|
|
if (r0 != r1)
|
|
{
|
|
return regA[r0];
|
|
}
|
|
else
|
|
{
|
|
auto copy = newTempIntPtr();
|
|
cc.mov(copy, regA[r0]);
|
|
return copy;
|
|
}
|
|
}
|
|
|
|
void JitCompiler::EmitNOP()
|
|
{
|
|
cc.nop();
|
|
}
|