// Play-/Source/VUShared.cpp (695 lines, 18 KiB, C++)

#include "VUShared.h"
#include "MIPS.h"
#include "CodeGen_FPU.h"
#include "CodeGen_VUF128.h"
#include "offsetof_def.h"
using namespace VUShared;
using namespace CodeGen;
using namespace std;
//Tells whether element nElement is selected by the destination mask nDest.
//The element index is mirrored (XOR 3) before testing, so element 0 is
//checked against bit 3 of the mask and element 3 against bit 0.
bool VUShared::DestinationHasElement(uint8 nDest, unsigned int nElement)
{
    const unsigned int nBit = nElement ^ 0x03;
    const int nMask = 1 << nBit;
    return (nDest & nMask) != 0;
}
//Returns the address of element nElement (0 to 3) of nCOP2[nReg] inside the
//given context, or NULL when nElement is outside that range.
uint32* VUShared::GetVectorElement(CMIPS* pCtx, unsigned int nReg, unsigned int nElement)
{
    if(nElement == 0) return &pCtx->m_State.nCOP2[nReg].nV0;
    if(nElement == 1) return &pCtx->m_State.nCOP2[nReg].nV1;
    if(nElement == 2) return &pCtx->m_State.nCOP2[nReg].nV2;
    if(nElement == 3) return &pCtx->m_State.nCOP2[nReg].nV3;

    //Unknown element index
    return NULL;
}
//Returns the offset, relative to the start of CMIPS, of element nElement of
//nCOP2[nRegister]. No range checking is done on either index.
size_t VUShared::GetVectorElement(unsigned int nRegister, unsigned int nElement)
{
    const size_t nOffset = offsetof(CMIPS, m_State.nCOP2[nRegister].nV[nElement]);
    return nOffset;
}
//Returns the address of element nElement (0 to 3) of nCOP2A inside the given
//context, or NULL when nElement is outside that range.
uint32* VUShared::GetAccumulatorElement(CMIPS* pCtx, unsigned int nElement)
{
    if(nElement == 0) return &pCtx->m_State.nCOP2A.nV0;
    if(nElement == 1) return &pCtx->m_State.nCOP2A.nV1;
    if(nElement == 2) return &pCtx->m_State.nCOP2A.nV2;
    if(nElement == 3) return &pCtx->m_State.nCOP2A.nV3;

    //Unknown element index
    return NULL;
}
//Returns the offset, relative to the start of CMIPS, of element nElement of
//nCOP2A. No range checking is done on the index.
size_t VUShared::GetAccumulatorElement(unsigned int nElement)
{
    const size_t nOffset = offsetof(CMIPS, m_State.nCOP2A.nV[nElement]);
    return nOffset;
}
//Calls CVUF128::Pull with one pointer per element of pVector. Elements that
//are not selected by nDest are passed as NULL instead of their address.
void VUShared::PullVector(uint8 nDest, uint128* pVector)
{
    uint32* pElement0 = DestinationHasElement(nDest, 0) ? &pVector->nV0 : NULL;
    uint32* pElement1 = DestinationHasElement(nDest, 1) ? &pVector->nV1 : NULL;
    uint32* pElement2 = DestinationHasElement(nDest, 2) ? &pVector->nV2 : NULL;
    uint32* pElement3 = DestinationHasElement(nDest, 3) ? &pVector->nV3 : NULL;

    CVUF128::Pull(pElement0, pElement1, pElement2, pElement3);
}
//Calls MD_PullRel with one offset per element of the vector located at
//'vector' (elements are 4 bytes apart). Elements that are not selected by
//'dest' are passed as SIZE_MAX instead of their offset.
void VUShared::PullVectorEx(CCodeGen* codeGen, uint8 dest, size_t vector)
{
    size_t elementOffset[4];
    for(unsigned int element = 0; element < 4; element++)
    {
        if(DestinationHasElement(dest, element))
        {
            elementOffset[element] = vector + (element * 4);
        }
        else
        {
            elementOffset[element] = SIZE_MAX;
        }
    }

    codeGen->MD_PullRel(elementOffset[0], elementOffset[1], elementOffset[2], elementOffset[3]);
}
//For every element selected by nDest, pushes the matching element of
//nCOP2[nFs], applies CFPU::Abs and stores the result in the same element
//of nCOP2[nFt].
void VUShared::ABS(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFt, uint8 nFs)
{
    CCodeGen::Begin(pB);

    for(unsigned int nElement = 0; nElement < 4; nElement++)
    {
        if(DestinationHasElement(nDest, nElement))
        {
            CFPU::PushSingle(GetVectorElement(pCtx, nFs, nElement));
            CFPU::Abs();
            CFPU::PullSingle(GetVectorElement(pCtx, nFt, nElement));
        }
    }

    CCodeGen::End();
}
//Pushes nCOP2[nFs] and nCOP2[nFt] and adds them. Two PushTop calls follow so
//that (presumably by duplicating the sum) the negative test and the zero test
//each have a value to consume; their results go to nCOP2SF and nCOP2ZF and the
//remaining value goes to nCOP2[nFd]. All three stores are masked by nDest.
void VUShared::ADD(CCodeGen* codeGen, uint8 nDest, uint8 nFd, uint8 nFs, uint8 nFt)
{
    const size_t nLeft      = offsetof(CMIPS, m_State.nCOP2[nFs]);
    const size_t nRight     = offsetof(CMIPS, m_State.nCOP2[nFt]);
    const size_t nSignFlags = offsetof(CMIPS, m_State.nCOP2SF);
    const size_t nZeroFlags = offsetof(CMIPS, m_State.nCOP2ZF);
    const size_t nResult    = offsetof(CMIPS, m_State.nCOP2[nFd]);

    codeGen->MD_PushRel(nLeft);
    codeGen->MD_PushRel(nRight);
    codeGen->MD_AddS();

    //One extra stack entry for each of the two flag tests
    codeGen->PushTop();
    codeGen->PushTop();

    //Sign flags
    codeGen->MD_IsNegative();
    PullVectorEx(codeGen, nDest, nSignFlags);

    //Zero flags
    codeGen->MD_IsZero();
    PullVectorEx(codeGen, nDest, nZeroFlags);

    //The sum itself
    PullVectorEx(codeGen, nDest, nResult);
}
//Pushes nCOP2[nFs] and element nBc of nCOP2[nFt] (through MD_PushRelExpand,
//presumably replicating it across the vector), adds them and stores the
//elements selected by nDest into nCOP2[nFd].
void VUShared::ADDbc(CCodeGen* codeGen, uint8 nDest, uint8 nFd, uint8 nFs, uint8 nFt, uint8 nBc)
{
    const size_t nSource    = offsetof(CMIPS, m_State.nCOP2[nFs]);
    const size_t nBroadcast = offsetof(CMIPS, m_State.nCOP2[nFt].nV[nBc]);
    const size_t nTarget    = offsetof(CMIPS, m_State.nCOP2[nFd]);

    codeGen->MD_PushRel(nSource);
    codeGen->MD_PushRelExpand(nBroadcast);
    codeGen->MD_AddS();

    PullVectorEx(codeGen, nDest, nTarget);
}
//Pushes nCOP2[nFs] and nCOP2I, adds them and stores the elements selected by
//nDest into nCOP2[nFd].
void VUShared::ADDi(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFd, uint8 nFs)
{
    uint128* pSource = &pCtx->m_State.nCOP2[nFs];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFd];

    CCodeGen::Begin(pB);

    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2I);
    CVUF128::Add();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Pushes nCOP2[nFs] and nCOP2Q (through MD_PushRelExpand), adds them and
//stores the elements selected by nDest into nCOP2[nFd].
void VUShared::ADDq(CCodeGen* codeGen, uint8 nDest, uint8 nFd, uint8 nFs)
{
    const size_t nSource = offsetof(CMIPS, m_State.nCOP2[nFs]);
    const size_t nQ      = offsetof(CMIPS, m_State.nCOP2Q);
    const size_t nTarget = offsetof(CMIPS, m_State.nCOP2[nFd]);

    codeGen->MD_PushRel(nSource);
    codeGen->MD_PushRelExpand(nQ);
    codeGen->MD_AddS();

    PullVectorEx(codeGen, nDest, nTarget);
}
//Pushes nCOP2[nFs] and element nBc of nCOP2[nFt], adds them and stores the
//elements selected by nDest into nCOP2A.
void VUShared::ADDAbc(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFs, uint8 nFt, uint8 nBc)
{
    uint128* pSource      = &pCtx->m_State.nCOP2[nFs];
    uint128* pAccumulator = &pCtx->m_State.nCOP2A;

    CCodeGen::Begin(pB);

    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2[nFt].nV[nBc]);
    CVUF128::Add();
    PullVector(nDest, pAccumulator);

    CCodeGen::End();
}
//Emits the comparisons of the first three elements of nCOP2[nFs] against the
//absolute value (and negated absolute value) of element 3 of nCOP2[nFt],
//touching nCOP2CF inside each conditional block.
//NOTE(review): the Shl(6) and Or() steps are commented out ("Decomment"), so
//as written nCOP2CF is reloaded and stored without being shifted, and inside
//each conditional block two values are pushed but only one is pulled.
//Presumably this is a work in progress - confirm before relying on nCOP2CF.
void VUShared::CLIP(CCacheBlock* pB, CMIPS* pCtx, uint8 nFs, uint8 nFt)
{
CCodeGen::Begin(pB);
{
//Create some space for the new test results
CCodeGen::PushVar(&pCtx->m_State.nCOP2CF);
//Decomment -> CCodeGen::Shl(6);
CCodeGen::PullVar(&pCtx->m_State.nCOP2CF);
//Elements 0 to 2 of nFs are each tested twice; element 3 is not tested
for(unsigned int i = 0; i < 3; i++)
{
//c > +|w|
CFPU::PushSingle(&pCtx->m_State.nCOP2[nFt].nV[3]);
CFPU::Abs();
CFPU::PushSingle(&pCtx->m_State.nCOP2[nFs].nV[i]);
CFPU::Cmp(CCodeGen::CONDITION_AB);
CCodeGen::BeginIf(true);
{
//Even bit (i * 2) is the constant pushed for this test
CCodeGen::PushVar(&pCtx->m_State.nCOP2CF);
CCodeGen::PushCst(1 << ((i * 2) + 0));
//Decomment -> CCodeGen::Or();
CCodeGen::PullVar(&pCtx->m_State.nCOP2CF);
}
CCodeGen::EndIf();
//c < -|w|
CFPU::PushSingle(&pCtx->m_State.nCOP2[nFt].nV[3]);
CFPU::Abs();
CFPU::Neg();
CFPU::PushSingle(&pCtx->m_State.nCOP2[nFs].nV[i]);
CFPU::Cmp(CCodeGen::CONDITION_BL);
CCodeGen::BeginIf(true);
{
//Odd bit (i * 2 + 1) is the constant pushed for this test
CCodeGen::PushVar(&pCtx->m_State.nCOP2CF);
CCodeGen::PushCst(1 << ((i * 2) + 1));
//Decomment -> CCodeGen::Or();
CCodeGen::PullVar(&pCtx->m_State.nCOP2CF);
}
CCodeGen::EndIf();
}
}
CCodeGen::End();
}
//Stores into nCOP2Q the result of dividing element nFsf of nCOP2[nFs] by
//element nFtf of nCOP2[nFt].
//When the divisor has all bits below the sign bit clear, no division is
//emitted: nCOP2Q receives 0x7F7FFFFF combined with the XOR of both operands'
//sign bits.
void VUShared::DIV(CCodeGen* codeGen, uint8 nFs, uint8 nFsf, uint8 nFt, uint8 nFtf)
{
    const size_t nDividend = GetVectorElement(nFs, nFsf);
    const size_t nDivisor  = GetVectorElement(nFt, nFtf);
    const size_t nQuotient = offsetof(CMIPS, m_State.nCOP2Q);

    //Compare the divisor, sign bit removed, against zero
    codeGen->PushRel(nDivisor);
    codeGen->PushCst(0x7FFFFFFF);
    codeGen->And();
    codeGen->PushCst(0);
    codeGen->Cmp(CCodeGen::CONDITION_EQ);

    codeGen->BeginIfElse(true);
    {
        //Divisor is zero: 0x7F7FFFFF | ((dividend ^ divisor) & 0x80000000)
        codeGen->PushCst(0x7F7FFFFF);

        codeGen->PushRel(nDividend);
        codeGen->PushRel(nDivisor);
        codeGen->Xor();
        codeGen->PushCst(0x80000000);
        codeGen->And();

        codeGen->Or();
        codeGen->PullRel(nQuotient);
    }
    codeGen->BeginIfElseAlt();
    {
        //Regular division
        codeGen->FP_PushSingle(nDividend);
        codeGen->FP_PushSingle(nDivisor);
        codeGen->FP_Div();
        codeGen->FP_PullSingle(nQuotient);
    }
    codeGen->EndIf();
}
//Pushes nCOP2[nFs], applies CVUF128::ToWordTruncate and stores the elements
//selected by nDest into nCOP2[nFt].
void VUShared::FTOI0(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFt, uint8 nFs)
{
    uint128* pSource = &pCtx->m_State.nCOP2[nFs];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFt];

    CCodeGen::Begin(pB);

    CVUF128::Push(pSource);
    CVUF128::ToWordTruncate();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Converts nCOP2[nFs] to words after scaling by 16. The scaling is done on the
//fractional part (value minus its truncation) and on the truncated part
//separately; both products are then summed and passed to ToWordTruncate.
//The elements selected by nDest are stored into nCOP2[nFt].
void VUShared::FTOI4(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFt, uint8 nFs)
{
    uint128* pSource = &pCtx->m_State.nCOP2[nFs];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFt];

    CCodeGen::Begin(pB);

    //(value - truncate(value)) * 16
    CVUF128::Push(pSource);
    CVUF128::Push(pSource);
    CVUF128::Truncate();
    CVUF128::Sub();
    CVUF128::PushImm(16.0f);
    CVUF128::Mul();

    //truncate(value) * 16
    CVUF128::Push(pSource);
    CVUF128::Truncate();
    CVUF128::PushImm(16.0f);
    CVUF128::Mul();

    //Sum of the two products, converted and stored
    CVUF128::Add();
    CVUF128::ToWordTruncate();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Pushes nCOP2[nFs], applies CVUF128::ToSingle and stores the elements
//selected by nDest into nCOP2[nFt].
void VUShared::ITOF0(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFt, uint8 nFs)
{
    uint128* pSource = &pCtx->m_State.nCOP2[nFs];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFt];

    CCodeGen::Begin(pB);

    CVUF128::Push(pSource);
    CVUF128::ToSingle();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Pushes nCOP2A, nCOP2[nFs] and nCOP2[nFt], multiplies the last two, adds the
//product to the accumulator value and stores the elements selected by nDest
//into nCOP2[nFd].
void VUShared::MADD(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFd, uint8 nFs, uint8 nFt)
{
    uint128* pAccumulator = &pCtx->m_State.nCOP2A;
    uint128* pLeft        = &pCtx->m_State.nCOP2[nFs];
    uint128* pRight       = &pCtx->m_State.nCOP2[nFt];
    uint128* pTarget      = &pCtx->m_State.nCOP2[nFd];

    CCodeGen::Begin(pB);

    CVUF128::Push(pAccumulator);
    CVUF128::Push(pLeft);
    CVUF128::Push(pRight);
    CVUF128::Mul();
    CVUF128::Add();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Pushes nCOP2A, nCOP2[nFs] and element nBc of nCOP2[nFt] (through
//MD_PushRelExpand), multiplies the last two, adds the product to the
//accumulator value and stores the elements selected by nDest into nCOP2[nFd].
void VUShared::MADDbc(CCodeGen* codeGen, uint8 nDest, uint8 nFd, uint8 nFs, uint8 nFt, uint8 nBc)
{
    const size_t nAccumulator = offsetof(CMIPS, m_State.nCOP2A);
    const size_t nSource      = offsetof(CMIPS, m_State.nCOP2[nFs]);
    const size_t nBroadcast   = offsetof(CMIPS, m_State.nCOP2[nFt].nV[nBc]);
    const size_t nTarget      = offsetof(CMIPS, m_State.nCOP2[nFd]);

    codeGen->MD_PushRel(nAccumulator);
    codeGen->MD_PushRel(nSource);
    codeGen->MD_PushRelExpand(nBroadcast);
    codeGen->MD_MulS();
    codeGen->MD_AddS();

    PullVectorEx(codeGen, nDest, nTarget);
}
//Pushes nCOP2A, nCOP2[nFs] and nCOP2[nFt], multiplies the last two, adds the
//product to the accumulator value and stores the elements selected by nDest
//back into nCOP2A.
void VUShared::MADDA(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFs, uint8 nFt)
{
    uint128* pAccumulator = &pCtx->m_State.nCOP2A;
    uint128* pLeft        = &pCtx->m_State.nCOP2[nFs];
    uint128* pRight       = &pCtx->m_State.nCOP2[nFt];

    CCodeGen::Begin(pB);

    CVUF128::Push(pAccumulator);
    CVUF128::Push(pLeft);
    CVUF128::Push(pRight);
    CVUF128::Mul();
    CVUF128::Add();
    PullVector(nDest, pAccumulator);

    CCodeGen::End();
}
//Pushes nCOP2A, nCOP2[nFs] and element nBc of nCOP2[nFt] (through
//MD_PushRelExpand), multiplies the last two, adds the product to the
//accumulator value and stores the elements selected by nDest back into nCOP2A.
void VUShared::MADDAbc(CCodeGen* codeGen, uint8 nDest, uint8 nFs, uint8 nFt, uint8 nBc)
{
    const size_t nAccumulator = offsetof(CMIPS, m_State.nCOP2A);
    const size_t nSource      = offsetof(CMIPS, m_State.nCOP2[nFs]);
    const size_t nBroadcast   = offsetof(CMIPS, m_State.nCOP2[nFt].nV[nBc]);

    codeGen->MD_PushRel(nAccumulator);
    codeGen->MD_PushRel(nSource);
    codeGen->MD_PushRelExpand(nBroadcast);
    codeGen->MD_MulS();
    codeGen->MD_AddS();

    PullVectorEx(codeGen, nDest, nAccumulator);
}
//Pushes nCOP2A, nCOP2[nFs] and nCOP2I, multiplies the last two, adds the
//product to the accumulator value and stores the elements selected by nDest
//back into nCOP2A.
void VUShared::MADDAi(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFs)
{
    uint128* pAccumulator = &pCtx->m_State.nCOP2A;
    uint128* pSource      = &pCtx->m_State.nCOP2[nFs];

    CCodeGen::Begin(pB);

    CVUF128::Push(pAccumulator);
    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2I);
    CVUF128::Mul();
    CVUF128::Add();
    PullVector(nDest, pAccumulator);

    CCodeGen::End();
}
//Pushes nCOP2[nFs] and nCOP2[nFt], applies CVUF128::Max and stores the
//elements selected by nDest into nCOP2[nFd].
void VUShared::MAX(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFd, uint8 nFs, uint8 nFt)
{
    uint128* pLeft   = &pCtx->m_State.nCOP2[nFs];
    uint128* pRight  = &pCtx->m_State.nCOP2[nFt];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFd];

    CCodeGen::Begin(pB);

    CVUF128::Push(pLeft);
    CVUF128::Push(pRight);
    CVUF128::Max();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Pushes nCOP2[nFs] and element nBc of nCOP2[nFt], applies CVUF128::Max and
//stores the elements selected by nDest into nCOP2[nFd].
void VUShared::MAXbc(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFd, uint8 nFs, uint8 nFt, uint8 nBc)
{
    uint128* pSource = &pCtx->m_State.nCOP2[nFs];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFd];

    CCodeGen::Begin(pB);

    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2[nFt].nV[nBc]);
    CVUF128::Max();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Pushes nCOP2[nFs] and nCOP2[nFt], applies CVUF128::Min and stores the
//elements selected by nDest into nCOP2[nFd].
void VUShared::MINI(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFd, uint8 nFs, uint8 nFt)
{
    uint128* pLeft   = &pCtx->m_State.nCOP2[nFs];
    uint128* pRight  = &pCtx->m_State.nCOP2[nFt];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFd];

    CCodeGen::Begin(pB);

    CVUF128::Push(pLeft);
    CVUF128::Push(pRight);
    CVUF128::Min();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Pushes nCOP2[nFs] and element nBc of nCOP2[nFt], applies CVUF128::Min and
//stores the elements selected by nDest into nCOP2[nFd].
void VUShared::MINIbc(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFd, uint8 nFs, uint8 nFt, uint8 nBc)
{
    uint128* pSource = &pCtx->m_State.nCOP2[nFs];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFd];

    CCodeGen::Begin(pB);

    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2[nFt].nV[nBc]);
    CVUF128::Min();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Pushes nCOP2[nFs] and nCOP2I, applies CVUF128::Min and stores the elements
//selected by nDest into nCOP2[nFd].
void VUShared::MINIi(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFd, uint8 nFs)
{
    uint128* pSource = &pCtx->m_State.nCOP2[nFs];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFd];

    CCodeGen::Begin(pB);

    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2I);
    CVUF128::Min();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Copies every element selected by nDest from nCOP2[nFs] to the same element
//of nCOP2[nFt], one push/pull pair per element.
void VUShared::MOVE(CCodeGen* codeGen, uint8 nDest, uint8 nFt, uint8 nFs)
{
    for(unsigned int nElement = 0; nElement < 4; nElement++)
    {
        if(DestinationHasElement(nDest, nElement))
        {
            const size_t nSource = offsetof(CMIPS, m_State.nCOP2[nFs].nV[nElement]);
            const size_t nTarget = offsetof(CMIPS, m_State.nCOP2[nFt].nV[nElement]);

            codeGen->PushRel(nSource);
            codeGen->PullRel(nTarget);
        }
    }
}
//For every element selected by nDest, copies the next element of nCOP2[nFs]
//(wrapping from 3 back to 0) into that element of nCOP2[nFt].
//NOTE(review): elements are processed in ascending order, so when nFs == nFt
//and both elements 0 and 3 are selected, element 3 is read from element 0
//after element 0 has already been stored - confirm whether that is intended.
void VUShared::MR32(CCodeGen* codeGen, uint8 nDest, uint8 nFt, uint8 nFs)
{
    for(unsigned int nElement = 0; nElement < 4; nElement++)
    {
        if(DestinationHasElement(nDest, nElement))
        {
            const unsigned int nNext = (nElement + 1) & 3;
            const size_t nSource = offsetof(CMIPS, m_State.nCOP2[nFs].nV[nNext]);
            const size_t nTarget = offsetof(CMIPS, m_State.nCOP2[nFt].nV[nElement]);

            codeGen->PushRel(nSource);
            codeGen->PullRel(nTarget);
        }
    }
}
//Pushes nCOP2A, nCOP2[nFs] and nCOP2I, multiplies the last two, applies
//CVUF128::Sub to the accumulator value and the product, and stores the
//elements selected by nDest into nCOP2[nFd].
void VUShared::MSUBi(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFd, uint8 nFs)
{
    uint128* pAccumulator = &pCtx->m_State.nCOP2A;
    uint128* pSource      = &pCtx->m_State.nCOP2[nFs];
    uint128* pTarget      = &pCtx->m_State.nCOP2[nFd];

    CCodeGen::Begin(pB);

    CVUF128::Push(pAccumulator);
    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2I);
    CVUF128::Mul();
    CVUF128::Sub();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Pushes nCOP2A, nCOP2[nFs] and nCOP2I, multiplies the last two, applies
//CVUF128::Sub to the accumulator value and the product, and stores the
//elements selected by nDest back into nCOP2A.
void VUShared::MSUBAi(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFs)
{
    uint128* pAccumulator = &pCtx->m_State.nCOP2A;
    uint128* pSource      = &pCtx->m_State.nCOP2[nFs];

    CCodeGen::Begin(pB);

    CVUF128::Push(pAccumulator);
    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2I);
    CVUF128::Mul();
    CVUF128::Sub();
    PullVector(nDest, pAccumulator);

    CCodeGen::End();
}
//Pushes nCOP2[nFs] and nCOP2[nFt], multiplies them and stores the elements
//selected by nDest into nCOP2[nFd].
void VUShared::MUL(CCodeGen* codeGen, uint8 nDest, uint8 nFd, uint8 nFs, uint8 nFt)
{
    const size_t nLeft   = offsetof(CMIPS, m_State.nCOP2[nFs]);
    const size_t nRight  = offsetof(CMIPS, m_State.nCOP2[nFt]);
    const size_t nTarget = offsetof(CMIPS, m_State.nCOP2[nFd]);

    codeGen->MD_PushRel(nLeft);
    codeGen->MD_PushRel(nRight);
    codeGen->MD_MulS();

    PullVectorEx(codeGen, nDest, nTarget);
}
//Pushes nCOP2[nFs] and element nBc of nCOP2[nFt], multiplies them and stores
//the elements selected by nDest into nCOP2[nFd].
void VUShared::MULbc(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFd, uint8 nFs, uint8 nFt, uint8 nBc)
{
    uint128* pSource = &pCtx->m_State.nCOP2[nFs];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFd];

    CCodeGen::Begin(pB);

    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2[nFt].nV[nBc]);
    CVUF128::Mul();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Pushes nCOP2[nFs] and nCOP2I, multiplies them and stores the elements
//selected by nDest into nCOP2[nFd].
void VUShared::MULi(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFd, uint8 nFs)
{
    uint128* pSource = &pCtx->m_State.nCOP2[nFs];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFd];

    CCodeGen::Begin(pB);

    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2I);
    CVUF128::Mul();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Pushes nCOP2[nFs] and nCOP2Q (through MD_PushRelExpand), multiplies them and
//stores the elements selected by nDest into nCOP2[nFd].
void VUShared::MULq(CCodeGen* codeGen, uint8 nDest, uint8 nFd, uint8 nFs)
{
    const size_t nSource = offsetof(CMIPS, m_State.nCOP2[nFs]);
    const size_t nQ      = offsetof(CMIPS, m_State.nCOP2Q);
    const size_t nTarget = offsetof(CMIPS, m_State.nCOP2[nFd]);

    codeGen->MD_PushRel(nSource);
    codeGen->MD_PushRelExpand(nQ);
    codeGen->MD_MulS();

    PullVectorEx(codeGen, nDest, nTarget);
}
//Pushes nCOP2[nFs] and nCOP2[nFt], multiplies them and stores the elements
//selected by nDest into nCOP2A.
void VUShared::MULA(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFs, uint8 nFt)
{
    uint128* pLeft        = &pCtx->m_State.nCOP2[nFs];
    uint128* pRight       = &pCtx->m_State.nCOP2[nFt];
    uint128* pAccumulator = &pCtx->m_State.nCOP2A;

    CCodeGen::Begin(pB);

    CVUF128::Push(pLeft);
    CVUF128::Push(pRight);
    CVUF128::Mul();
    PullVector(nDest, pAccumulator);

    CCodeGen::End();
}
//Pushes nCOP2[nFs] and element nBc of nCOP2[nFt] (through MD_PushRelExpand),
//multiplies them and stores the elements selected by nDest into nCOP2A.
void VUShared::MULAbc(CCodeGen* codeGen, uint8 nDest, uint8 nFs, uint8 nFt, uint8 nBc)
{
    const size_t nSource      = offsetof(CMIPS, m_State.nCOP2[nFs]);
    const size_t nBroadcast   = offsetof(CMIPS, m_State.nCOP2[nFt].nV[nBc]);
    const size_t nAccumulator = offsetof(CMIPS, m_State.nCOP2A);

    codeGen->MD_PushRel(nSource);
    codeGen->MD_PushRelExpand(nBroadcast);
    codeGen->MD_MulS();

    PullVectorEx(codeGen, nDest, nAccumulator);
}
//Pushes nCOP2[nFs] and nCOP2I, multiplies them and stores the elements
//selected by nDest into nCOP2A.
void VUShared::MULAi(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFs)
{
    uint128* pSource      = &pCtx->m_State.nCOP2[nFs];
    uint128* pAccumulator = &pCtx->m_State.nCOP2A;

    CCodeGen::Begin(pB);

    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2I);
    CVUF128::Mul();
    PullVector(nDest, pAccumulator);

    CCodeGen::End();
}
//Writes three products into the accumulator, in this order:
//  ACCx = FSy * FTz
//  ACCy = FSz * FTx
//  ACCz = FSx * FTy
//The fourth accumulator element is left untouched.
void VUShared::OPMULA(CCodeGen* codeGen, uint8 nFs, uint8 nFt)
{
    //Per output component: which FS and FT components get multiplied
    const unsigned int nTarget[3]    = { VECTOR_COMPX, VECTOR_COMPY, VECTOR_COMPZ };
    const unsigned int nFsElement[3] = { VECTOR_COMPY, VECTOR_COMPZ, VECTOR_COMPX };
    const unsigned int nFtElement[3] = { VECTOR_COMPZ, VECTOR_COMPX, VECTOR_COMPY };

    for(unsigned int i = 0; i < 3; i++)
    {
        codeGen->FP_PushSingle(GetVectorElement(nFs, nFsElement[i]));
        codeGen->FP_PushSingle(GetVectorElement(nFt, nFtElement[i]));
        codeGen->FP_Mul();
        codeGen->FP_PullSingle(GetAccumulatorElement(nTarget[i]));
    }
}
//Writes three results into nCOP2[nFd], in this order:
//  FDx = ACCx - FSy * FTz
//  FDy = ACCy - FSz * FTx
//  FDz = ACCz - FSx * FTy
//The fourth element of nCOP2[nFd] is left untouched.
//Throws std::runtime_error when nFd is 0, a case that is not handled yet.
//NOTE(review): each result is stored before the next one is computed, so if
//nFd is the same register as nFs or nFt the later components read the
//already updated FDx/FDy - confirm whether that matters for callers.
void VUShared::OPMSUB(CCodeGen* codeGen, uint8 nFd, uint8 nFs, uint8 nFt)
{
    if(nFd == 0)
    {
        //Atelier Iris uses OPMSUB with VF0 as FD, probably to set a flag (Sz)
        //which is tested a bit further.
        throw runtime_error("Remimplement.");

        //Previous implementation, kept as a reference for the rewrite:
        /*
        CCodeGen::Begin(pB);
        {
            CFPU::PushSingleImm(0.0);
            CFPU::PushSingle(GetAccumulatorElement(pCtx, VECTOR_COMPZ));
            CFPU::PushSingle(GetVectorElement(pCtx, nFs, VECTOR_COMPX));
            CFPU::PushSingle(GetVectorElement(pCtx, nFt, VECTOR_COMPY));
            CFPU::Mul();
            CFPU::Sub();
            CFPU::Cmp(CCodeGen::CONDITION_BL);
            CCodeGen::BeginIfElse(true);
            {
                CCodeGen::PushCst(0xFFFFFFFF);
                CCodeGen::PullVar(&pCtx->m_State.nCOP2SF.nV[2]);
            }
            CCodeGen::BeginIfElseAlt();
            {
                CCodeGen::PushCst(0);
                CCodeGen::PullVar(&pCtx->m_State.nCOP2SF.nV[2]);
            }
            CCodeGen::EndIf();
        }
        CCodeGen::End();
        return;
        */
    }

    //Per output component: which FS and FT components get multiplied
    const unsigned int nTarget[3]    = { VECTOR_COMPX, VECTOR_COMPY, VECTOR_COMPZ };
    const unsigned int nFsElement[3] = { VECTOR_COMPY, VECTOR_COMPZ, VECTOR_COMPX };
    const unsigned int nFtElement[3] = { VECTOR_COMPZ, VECTOR_COMPX, VECTOR_COMPY };

    for(unsigned int i = 0; i < 3; i++)
    {
        codeGen->FP_PushSingle(GetAccumulatorElement(nTarget[i]));
        codeGen->FP_PushSingle(GetVectorElement(nFs, nFsElement[i]));
        codeGen->FP_PushSingle(GetVectorElement(nFt, nFtElement[i]));
        codeGen->FP_Mul();
        codeGen->FP_Sub();
        codeGen->FP_PullSingle(GetVectorElement(nFd, nTarget[i]));
    }
}
//Stores into nCOP2R the low 23 bits (mask 0x007FFFFF) of element nFsf of
//nCOP2[nFs].
void VUShared::RINIT(CCacheBlock* pB, CMIPS* pCtx, uint8 nFs, uint8 nFsf)
{
    CCodeGen::Begin(pB);

    //Source element masked to its low 23 bits
    CCodeGen::PushVar(&pCtx->m_State.nCOP2[nFs].nV[nFsf]);
    CCodeGen::PushCst(0x007FFFFF);
    CCodeGen::And();

    CCodeGen::PullVar(&pCtx->m_State.nCOP2R);

    CCodeGen::End();
}
//Pushes element nFsf of nCOP2[nFs] and element nFtf of nCOP2[nFt], takes the
//square root of the latter, divides and stores the result into nCOP2Q.
void VUShared::RSQRT(CCacheBlock* pB, CMIPS* pCtx, uint8 nFs, uint8 nFsf, uint8 nFt, uint8 nFtf)
{
    uint32* pNumerator = GetVectorElement(pCtx, nFs, nFsf);
    uint32* pRadicand  = GetVectorElement(pCtx, nFt, nFtf);

    CCodeGen::Begin(pB);

    CFPU::PushSingle(pNumerator);
    CFPU::PushSingle(pRadicand);
    CFPU::Sqrt();
    CFPU::Div();
    CFPU::PullSingle(&pCtx->m_State.nCOP2Q);

    CCodeGen::End();
}
//XORs element nFsf of nCOP2[nFs] with nCOP2R, keeps the low 23 bits (mask
//0x007FFFFF) of the result and stores it back into nCOP2R.
void VUShared::RXOR(CCacheBlock* pB, CMIPS* pCtx, uint8 nFs, uint8 nFsf)
{
    CCodeGen::Begin(pB);

    //element ^ R
    CCodeGen::PushRel(offsetof(CMIPS, m_State.nCOP2[nFs].nV[nFsf]));
    CCodeGen::PushRel(offsetof(CMIPS, m_State.nCOP2R));
    CCodeGen::Xor();

    //Keep the low 23 bits only
    CCodeGen::PushCst(0x007FFFFF);
    CCodeGen::And();

    CCodeGen::PullRel(offsetof(CMIPS, m_State.nCOP2R));

    CCodeGen::End();
}
//Pushes element nFtf of nCOP2[nFt], takes its square root and stores the
//result into nCOP2Q.
void VUShared::SQRT(CCodeGen* codeGen, uint8 nFt, uint8 nFtf)
{
    const size_t nOperand = GetVectorElement(nFt, nFtf);
    const size_t nResult  = offsetof(CMIPS, m_State.nCOP2Q);

    codeGen->FP_PushSingle(nOperand);
    codeGen->FP_Sqrt();
    codeGen->FP_PullSingle(nResult);
}
//Pushes nCOP2[nFs] and nCOP2[nFt], applies MD_SubS and stores the elements
//selected by nDest into nCOP2[nFd].
void VUShared::SUB(CCodeGen* codeGen, uint8 nDest, uint8 nFd, uint8 nFs, uint8 nFt)
{
    const size_t nLeft   = offsetof(CMIPS, m_State.nCOP2[nFs]);
    const size_t nRight  = offsetof(CMIPS, m_State.nCOP2[nFt]);
    const size_t nTarget = offsetof(CMIPS, m_State.nCOP2[nFd]);

    codeGen->MD_PushRel(nLeft);
    codeGen->MD_PushRel(nRight);
    codeGen->MD_SubS();

    PullVectorEx(codeGen, nDest, nTarget);
}
//Pushes nCOP2[nFs] and element nBc of nCOP2[nFt], applies CVUF128::Sub and
//stores the elements selected by nDest into nCOP2[nFd].
void VUShared::SUBbc(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFd, uint8 nFs, uint8 nFt, uint8 nBc)
{
    uint128* pSource = &pCtx->m_State.nCOP2[nFs];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFd];

    CCodeGen::Begin(pB);

    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2[nFt].nV[nBc]);
    CVUF128::Sub();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}
//Pushes nCOP2[nFs] and nCOP2I, applies CVUF128::Sub and stores the elements
//selected by nDest into nCOP2[nFd].
void VUShared::SUBi(CCacheBlock* pB, CMIPS* pCtx, uint8 nDest, uint8 nFd, uint8 nFs)
{
    uint128* pSource = &pCtx->m_State.nCOP2[nFs];
    uint128* pTarget = &pCtx->m_State.nCOP2[nFd];

    CCodeGen::Begin(pB);

    CVUF128::Push(pSource);
    CVUF128::Push(&pCtx->m_State.nCOP2I);
    CVUF128::Sub();
    PullVector(nDest, pTarget);

    CCodeGen::End();
}