mirror of
https://github.com/ZDoom/gzdoom.git
synced 2024-11-10 14:51:40 +00:00
- implement xor swap for vec registers
This commit is contained in:
parent
0dfb0d8427
commit
f17a90ef69
2 changed files with 67 additions and 6 deletions
|
@ -271,6 +271,22 @@ Error X86RAPass::emitSwapGp(VirtReg* dstReg, VirtReg* srcReg, uint32_t dstPhysId
|
|||
return kErrorOk;
|
||||
}
|
||||
|
||||
//! Emit code that exchanges the contents of two physical vector registers.
//!
//! The exchange is encoded as a three-instruction xor swap built from `xorps`
//! (`a ^= b`, `b ^= a`, `a ^= b`), so neither a scratch register nor a memory
//! slot is used.
//!
//! \param dstReg    Virtual register whose signature and name describe the first operand.
//! \param srcReg    Virtual register whose signature and name describe the second operand.
//! \param dstPhysId Physical id of the first operand; must be valid.
//! \param srcPhysId Physical id of the second operand; must be valid and differ from `dstPhysId`.
//! \param reason    Short tag placed in the inline comment when comments are enabled.
//!
//! \return `kErrorOk` on success, otherwise the first error reported by `emit()`.
//!
//! NOTE(review): the operands are built from each VirtReg's own signature and
//! fed to `xorps`; presumably both are XMM-sized here - confirm before using
//! this with wider vector registers.
Error X86RAPass::emitSwapVec(VirtReg* dstReg, VirtReg* srcReg, uint32_t dstPhysId, uint32_t srcPhysId, const char* reason) noexcept {
  ASMJIT_ASSERT(dstPhysId != Globals::kInvalidRegId);
  ASMJIT_ASSERT(srcPhysId != Globals::kInvalidRegId);
  // An xor swap of a register with itself would clear it instead of swapping.
  ASMJIT_ASSERT(dstPhysId != srcPhysId);

  const X86Reg first = X86Reg::fromSignature(dstReg->getSignature(), dstPhysId);
  const X86Reg second = X86Reg::fromSignature(srcReg->getSignature(), srcPhysId);

  // Step 1: first ^= second.
  ASMJIT_PROPAGATE(cc()->emit(X86Inst::kIdXorps, first, second));

  // Annotate the node at the compiler's cursor, queried right after the first
  // emit, so the comment lands on the opening instruction of the sequence.
  if (_emitComments) {
    const char* note = cc()->_cbDataZone.sformat("[%s] %s, %s", reason, dstReg->getName(), srcReg->getName());
    cc()->getCursor()->setInlineComment(note);
  }

  // Step 2: second ^= first.
  ASMJIT_PROPAGATE(cc()->emit(X86Inst::kIdXorps, second, first));

  // Step 3: first ^= second.
  ASMJIT_PROPAGATE(cc()->emit(X86Inst::kIdXorps, first, second));

  return kErrorOk;
}
|
||||
|
||||
Error X86RAPass::emitImmToReg(uint32_t dstTypeId, uint32_t dstPhysId, const Imm* src) noexcept {
|
||||
ASMJIT_ASSERT(dstPhysId != Globals::kInvalidRegId);
|
||||
|
||||
|
@ -778,6 +794,9 @@ _MoveOrLoad:
|
|||
if (C == X86Reg::kKindGp) {
|
||||
self->swapGp(dVReg, sVd);
|
||||
}
|
||||
else if (C == X86Reg::kKindVec) {
|
||||
self->swapVec(dVReg, sVd);
|
||||
}
|
||||
else {
|
||||
self->spill<C>(dVReg);
|
||||
self->move<C>(sVd, physId);
|
||||
|
@ -932,10 +951,13 @@ static ASMJIT_INLINE void X86RAPass_intersectStateVars(X86RAPass* self, X86RASta
|
|||
didWork = true;
|
||||
continue;
|
||||
}
|
||||
else if (C == X86Reg::kKindGp) {
|
||||
else if (C == X86Reg::kKindGp || C == X86Reg::kKindVec) {
|
||||
if (aCell.getState() == VirtReg::kStateReg) {
|
||||
if (dVReg->getPhysId() != Globals::kInvalidRegId && aVReg->getPhysId() != Globals::kInvalidRegId) {
|
||||
self->swapGp(dVReg, aVReg);
|
||||
if (C == X86Reg::kKindGp)
|
||||
self->swapGp(dVReg, aVReg);
|
||||
else
|
||||
self->swapVec(dVReg, aVReg);
|
||||
|
||||
didWork = true;
|
||||
continue;
|
||||
|
@ -2787,9 +2809,13 @@ ASMJIT_INLINE void X86VarAlloc::alloc() {
|
|||
// allocation tasks by a single 'xchg' instruction, swapping
|
||||
// two registers required by the instruction/node or one register
|
||||
// required with another non-required.
|
||||
if (C == X86Reg::kKindGp && aPhysId != Globals::kInvalidRegId) {
|
||||
// Gp registers are swapped through swapGp(); Vec registers go through
// swapVec(), which performs an xor swap instead.
|
||||
if ((C == X86Reg::kKindGp || C == X86Reg::kKindVec) && aPhysId != Globals::kInvalidRegId) {
|
||||
TiedReg* bTied = bVReg->_tied;
|
||||
_context->swapGp(aVReg, bVReg);
|
||||
if (C == X86Reg::kKindGp)
|
||||
_context->swapGp(aVReg, bVReg);
|
||||
else
|
||||
_context->swapVec(aVReg, bVReg);
|
||||
|
||||
aTied->flags |= TiedReg::kRDone;
|
||||
addTiedDone(C);
|
||||
|
@ -3341,8 +3367,11 @@ ASMJIT_INLINE void X86CallAlloc::alloc() {
|
|||
// allocation tasks by a single 'xchg' instruction, swapping
|
||||
// two registers required by the instruction/node or one register
|
||||
// required with another non-required.
|
||||
if (C == X86Reg::kKindGp && sPhysId != Globals::kInvalidRegId) {
|
||||
_context->swapGp(aVReg, bVReg);
|
||||
if ((C == X86Reg::kKindGp || C == X86Reg::kKindVec) && sPhysId != Globals::kInvalidRegId) {
|
||||
if (C == X86Reg::kKindGp)
|
||||
_context->swapGp(aVReg, bVReg);
|
||||
else
|
||||
_context->swapVec(aVReg, bVReg);
|
||||
|
||||
aTied->flags |= TiedReg::kRDone;
|
||||
addTiedDone(C);
|
||||
|
|
|
@ -327,6 +327,7 @@ public:
|
|||
Error emitLoad(VirtReg* vreg, uint32_t id, const char* reason);
|
||||
Error emitSave(VirtReg* vreg, uint32_t id, const char* reason);
|
||||
Error emitSwapGp(VirtReg* aVReg, VirtReg* bVReg, uint32_t aId, uint32_t bId, const char* reason) noexcept;
|
||||
Error emitSwapVec(VirtReg* aVReg, VirtReg* bVReg, uint32_t aId, uint32_t bId, const char* reason) noexcept;
|
||||
|
||||
Error emitImmToReg(uint32_t dstTypeId, uint32_t dstPhysId, const Imm* src) noexcept;
|
||||
Error emitImmToStack(uint32_t dstTypeId, const X86Mem* dst, const Imm* src) noexcept;
|
||||
|
@ -515,6 +516,37 @@ public:
|
|||
ASMJIT_X86_CHECK_STATE
|
||||
}
|
||||
|
||||
//! Swap two registers
|
||||
//!
|
||||
//! Xor swap on Vec registers.
|
||||
ASMJIT_INLINE void swapVec(VirtReg* aVReg, VirtReg* bVReg) {
|
||||
ASMJIT_ASSERT(aVReg != bVReg);
|
||||
|
||||
ASMJIT_ASSERT(aVReg->getKind() == X86Reg::kKindVec);
|
||||
ASMJIT_ASSERT(aVReg->getState() == VirtReg::kStateReg);
|
||||
ASMJIT_ASSERT(aVReg->getPhysId() != Globals::kInvalidRegId);
|
||||
|
||||
ASMJIT_ASSERT(bVReg->getKind() == X86Reg::kKindVec);
|
||||
ASMJIT_ASSERT(bVReg->getState() == VirtReg::kStateReg);
|
||||
ASMJIT_ASSERT(bVReg->getPhysId() != Globals::kInvalidRegId);
|
||||
|
||||
uint32_t aIndex = aVReg->getPhysId();
|
||||
uint32_t bIndex = bVReg->getPhysId();
|
||||
|
||||
emitSwapVec(aVReg, bVReg, aIndex, bIndex, "Swap");
|
||||
|
||||
aVReg->setPhysId(bIndex);
|
||||
bVReg->setPhysId(aIndex);
|
||||
|
||||
_x86State.getListByKind(X86Reg::kKindVec)[aIndex] = bVReg;
|
||||
_x86State.getListByKind(X86Reg::kKindVec)[bIndex] = aVReg;
|
||||
|
||||
uint32_t m = aVReg->isModified() ^ bVReg->isModified();
|
||||
_x86State._modified.xor_(X86Reg::kKindVec, (m << aIndex) | (m << bIndex));
|
||||
|
||||
ASMJIT_X86_CHECK_STATE
|
||||
}
|
||||
|
||||
// --------------------------------------------------------------------------
|
||||
// [Alloc / Spill]
|
||||
// --------------------------------------------------------------------------
|
||||
|
|
Loading…
Reference in a new issue