Optimize sprite multiplexer

This commit is contained in:
drmortalwombat 2024-08-08 22:07:44 +02:00
parent 6f069946ba
commit d98c4b760f
4 changed files with 93 additions and 12 deletions

View File

@ -270,7 +270,7 @@ void vspr_update(void)
{
char xymask = 0;
volatile char * vsprs = vspriteScreen;
char sypos[VSPRITES_MAX];
// char sypos[VSPRITES_MAX];
#pragma unroll(full)
@ -291,9 +291,9 @@ void vspr_update(void)
xymask = ((unsigned)xymask | (vspriteXHigh[ri] << 8)) >> 1;
#endif
vic.spr_pos[uj].x = vspriteXLow[ri];
vic.spr_pos[uj].y = vspriteYLow[ri];
vic.spr_pos[uj].y = spriteYPos[ui + 1];
sypos[ui] = vspriteYLow[ri];
// sypos[ui] = vspriteYLow[ri];
}
vic.spr_msbx = xymask;
@ -303,9 +303,9 @@ void vspr_update(void)
for(char ti=0; ti<VSPRITES_MAX - 8; ti++)
{
byte ri = spriteOrder[ti + 8];
if (!done && vspriteYLow[ri] < 250)
if (!done && spriteYPos[ti + 9] < 250)
{
byte ri = spriteOrder[ti + 8];
#ifdef VSPRITE_REVERSE
char m = 0x80 >> (ti & 7);
#else
@ -316,14 +316,14 @@ void vspr_update(void)
if (!(vspriteXHigh[ri] & 1))
xymask ^= m;
rirq_data(spirq + ti, 2, vspriteYLow[ri]);
rirq_data(spirq + ti, 2, spriteYPos[ti + 9]);
rirq_data(spirq + ti, 0, vspriteColor[ri]);
rirq_data(spirq + ti, 1, vspriteXLow[ri]);
rirq_data(spirq + ti, 3, vspriteImage[ri]);
rirq_data(spirq + ti, 4, xymask);
rirq_move(ti, sypos[ti] + 23);
sypos[ti + 8] = vspriteYLow[ri];
rirq_move(ti, spriteYPos[ti + 1] + 23);
// spriteYPos[ti + 9] = vspriteYLow[ri];
}
else
{

View File

@ -518,6 +518,9 @@ Declaration* ConstexprInterpreter::Value::GetConst(int offset, Declaration* type
for (int i=0; i<type->mSize; i += type->mBase->mSize)
{
Declaration* cdec = GetConst(offset + i, type->mBase, dataSection);
if (type->mStride)
cdec->mOffset = i / type->mBase->mSize;
else
cdec->mOffset = i;
if (ldec)

View File

@ -6407,6 +6407,34 @@ void NativeCodeBasicBlock::StoreByteOffsetIndexedValue(InterCodeProcedure* proc,
}
}
void NativeCodeBasicBlock::LoadStoreIndirectPair(InterCodeProcedure* proc, const InterInstruction* wins0, const InterInstruction* wins1)
{
int sreg = BC_REG_TMP + proc->mTempOffset[wins0->mSrc[0].mTemp];
int ireg0 = BC_REG_TMP + proc->mTempOffset[wins0->mSrc[1].mTemp];
int index0 = int(wins0->mSrc[1].mIntConst);
uint32 wflags0 = NCIF_LOWER | NCIF_UPPER;
if (wins0->mVolatile)
wflags0 |= NCIF_VOLATILE;
int ireg1 = BC_REG_TMP + proc->mTempOffset[wins1->mSrc[1].mTemp];
int index1 = int(wins1->mSrc[1].mIntConst);
uint32 wflags1 = NCIF_LOWER | NCIF_UPPER;
if (wins1->mVolatile)
wflags1 |= NCIF_VOLATILE;
CheckFrameIndex(wins0, ireg0, index0, 1, BC_REG_ADDR);
CheckFrameIndex(wins1, ireg1, index1, 1, BC_REG_ACCU);
mIns.Push(NativeCodeInstruction(wins0, ASMIT_LDA, ASMIM_ZERO_PAGE, sreg));
mIns.Push(NativeCodeInstruction(wins0, ASMIT_LDY, ASMIM_IMMEDIATE, index0));
mIns.Push(NativeCodeInstruction(wins0, ASMIT_STA, ASMIM_INDIRECT_Y, ireg0, nullptr, wflags0));
mIns.Push(NativeCodeInstruction(wins1, ASMIT_LDY, ASMIM_IMMEDIATE, index1));
mIns.Push(NativeCodeInstruction(wins1, ASMIT_STA, ASMIM_INDIRECT_Y, ireg1, nullptr, wflags1));
}
void NativeCodeBasicBlock::LoadStoreIndirectValue(InterCodeProcedure* proc, const InterInstruction* rins, const InterInstruction* wins)
{
int size = InterTypeSize[wins->mSrc[0].mType];
@ -33560,7 +33588,7 @@ bool NativeCodeBasicBlock::MoveLDSTXOutOfRange(int at)
else if (mIns[j].ReferencesXReg())
return false;
if (mIns[j].mType == ASMIT_JSR)
if (mIns[j].mType == ASMIT_JSR || mIns[j].mType == ASMIT_RTS)
return false;
if (!(mIns[j].mLive & (LIVE_CPU_REG_A | LIVE_CPU_REG_Z)))
@ -47969,6 +47997,39 @@ bool NativeCodeBasicBlock::PeepHoleOptimizerIterateN(int i, int pass)
#endif
}
#if 1
if (i + 7 < mIns.Size() &&
mIns[i + 0].mType == ASMIT_STA && mIns[i + 0].mMode == ASMIM_ZERO_PAGE &&
mIns[i + 1].mType == ASMIT_CLC &&
mIns[i + 2].mType == ASMIT_ADC && mIns[i + 2].mMode == ASMIM_ZERO_PAGE &&
mIns[i + 3].mType == ASMIT_STA && mIns[i + 3].mMode == ASMIM_ZERO_PAGE && mIns[i + 2].mAddress == mIns[i + 3].mAddress &&
mIns[i + 4].mType == ASMIT_LDA &&
mIns[i + 5].mType == ASMIT_STA && mIns[i + 5].mMode == ASMIM_ZERO_PAGE && mIns[i + 5].mAddress != mIns[i + 0].mAddress &&
mIns[i + 6].mType == ASMIT_ADC && mIns[i + 6].mMode == ASMIM_ZERO_PAGE && mIns[i + 6].mAddress == mIns[i + 2].mAddress + 1 &&
mIns[i + 7].mType == ASMIT_STA && mIns[i + 7].mMode == ASMIM_ZERO_PAGE && mIns[i + 6].mAddress == mIns[i + 7].mAddress &&
!(mIns[i + 7].mLive & LIVE_CPU_REG_A))
{
int yval = RetrieveYValue(i);
mProc->ResetPatched();
if (CheckForwardSumYPointer(this, mIns[i + 2].mAddress, mIns[i + 2].mAddress, mIns[i + 0], i + 8, yval, 0))
{
mProc->ResetPatched();
if (PatchForwardSumYPointer(this, mIns[i + 2].mAddress, mIns[i + 2].mAddress, mIns[i + 0], i + 8, yval))
{
mIns[i + 2].mType = ASMIT_NOP; mIns[i + 2].mMode = ASMIM_IMPLIED;
mIns[i + 3].mType = ASMIT_NOP; mIns[i + 3].mMode = ASMIM_IMPLIED;
if (mTrueJump)
mTrueJump->CheckLive();
if (mFalseJump)
mFalseJump->CheckLive();
return true;
}
}
}
#endif
#if 1
if (pass == 0 &&
i + 7 < mIns.Size() &&
@ -50379,7 +50440,7 @@ void NativeCodeProcedure::Compile(InterCodeProcedure* proc)
mInterProc = proc;
mInterProc->mLinkerObject->mNativeProc = this;
CheckFunc = !strcmp(mInterProc->mIdent->mString, "screen_flip");
CheckFunc = !strcmp(mInterProc->mIdent->mString, "shot_add");
int nblocks = proc->mBlocks.Size();
tblocks = new NativeCodeBasicBlock * [nblocks];
@ -51238,6 +51299,7 @@ void NativeCodeProcedure::Optimize(void)
} while (changed && t < 20);
#endif
BuildDataFlowSets();
ResetVisited();
mEntryBlock->RemoveUnusedResultInstructions();
@ -51283,6 +51345,7 @@ void NativeCodeProcedure::Optimize(void)
#endif
if (step == 2)
{
ResetVisited();
@ -52334,6 +52397,20 @@ void NativeCodeProcedure::CompileInterBlock(InterCodeProcedure* iproc, InterCode
switch (ins->mCode)
{
case IC_STORE:
if (i + 1 < iblock->mInstructions.Size() &&
ins->mSrc[0].mType == IT_INT8 &&
ins->mSrc[0].mTemp >= 0 &&
ins->mSrc[1].mTemp >= 0 &&
iblock->mInstructions[i + 1]->mCode == IC_STORE &&
iblock->mInstructions[i + 1]->mSrc[0].mType == IT_INT8 &&
iblock->mInstructions[i + 1]->mSrc[0].mTemp == ins->mSrc[0].mTemp &&
iblock->mInstructions[i + 1]->mSrc[0].mFinal &&
iblock->mInstructions[i + 1]->mSrc[1].mTemp >= 0)
{
block->LoadStoreIndirectPair(iproc, ins, iblock->mInstructions[i + 1]);
i++;
}
else
block->StoreValue(iproc, ins);
break;
case IC_LOAD:

View File

@ -358,6 +358,7 @@ public:
void StoreValue(InterCodeProcedure* proc, const InterInstruction * ins);
void LoadValue(InterCodeProcedure* proc, const InterInstruction * ins);
void LoadStoreValue(InterCodeProcedure* proc, const InterInstruction * rins, const InterInstruction * wins);
void LoadStoreIndirectPair(InterCodeProcedure* proc, const InterInstruction* wins0, const InterInstruction* wins1);
bool LoadOpStoreIndirectValue(InterCodeProcedure* proc, const InterInstruction* rins, const InterInstruction* oins, int oindex, const InterInstruction* wins);
bool LoadUnopStoreIndirectValue(InterCodeProcedure* proc, const InterInstruction* rins, const InterInstruction* oins, const InterInstruction* wins);
bool LoadLoadOpStoreIndirectValue(InterCodeProcedure* proc, const InterInstruction* rins1, const InterInstruction* rins0, const InterInstruction* oins, const InterInstruction* wins);