git-svn-id: https://pcsxr.svn.codeplex.com/svn/pcsxr@45285 e17a0e51-4ae3-4d35-97c3-1a29b211df97

This commit is contained in:
SND\weimingzhi_cp 2010-04-14 10:01:50 +00:00
parent 9729610b99
commit 5810556c32
3 changed files with 215 additions and 204 deletions

View File

@ -2,7 +2,7 @@
Version 2, June 1991
Copyright (C) 1989, 1991 Free Software Foundation, Inc.
51 Franklin Steet, Fifth Floor, Boston, MA 02111-1307 USA
51 Franklin Street, Fifth Floor, Boston, MA 02111-1307 USA
Everyone is permitted to copy and distribute verbatim copies
of this license document, but changing it is not allowed.

View File

@ -1,6 +1,7 @@
April 14, 2010 Wei Mingzhi <whistler_wmz@users.sf.net>
* libpcsxcore/gte.c: Use u32 instead of unsigned long.
* COPYING: Fixed a typo in FSF's address.
April 13, 2010 Wei Mingzhi <whistler_wmz@users.sf.net>

View File

@ -1,18 +1,18 @@
/* PCSX-Revolution - PS Emulator for Nintendo Wii
* Copyright (C) 2009-2010 PCSX-Revolution Dev Team
/* PCSX-Revolution - PS Emulator for Nintendo Wii
* Copyright (C) 2009-2010 PCSX-Revolution Dev Team
*
* PCSX-Revolution is free software: you can redistribute it and/or
* modify it under the terms of the GNU General Public License as
* published by the Free Software Foundation, either version 2 of the
* License, or (at your option) any later version.
* PCSX-Revolution is free software: you can redistribute it and/or
* modify it under the terms of the GNU General Public License as
* published by the Free Software Foundation, either version 2 of the
* License, or (at your option) any later version.
*
* PCSX-Revolution is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
* See the GNU General Public License for more details.
* PCSX-Revolution is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
* See the GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with PCSX-Revolution. If not, see <http://www.gnu.org/licenses/>.
* You should have received a copy of the GNU General Public License
* along with PCSX-Revolution. If not, see <http://www.gnu.org/licenses/>.
*/
/*
@ -189,15 +189,15 @@ static inline s32 LIM(s32 value, s32 max, s32 min, u32 flag) {
#define A1(a) BOUNDS((a), 0x7fffffff, (1 << 30), -(s64)0x80000000, (1 << 31) | (1 << 27))
#define A2(a) BOUNDS((a), 0x7fffffff, (1 << 29), -(s64)0x80000000, (1 << 31) | (1 << 26))
#define A3(a) BOUNDS((a), 0x7fffffff, (1 << 28), -(s64)0x80000000, (1 << 31) | (1 << 25))
#define Lm_B1(a, l) LIM((a), 0x7fff, -0x8000 * !l, (1 << 31) | (1 << 24))
#define Lm_B2(a, l) LIM((a), 0x7fff, -0x8000 * !l, (1 << 31) | (1 << 23))
#define Lm_B3(a, l) LIM((a), 0x7fff, -0x8000 * !l, (1 << 22) )
#define Lm_C1(a) LIM((a), 0x00ff, 0x0000, (1 << 21) )
#define Lm_C2(a) LIM((a), 0x00ff, 0x0000, (1 << 20) )
#define Lm_C3(a) LIM((a), 0x00ff, 0x0000, (1 << 19) )
#define Lm_D(a) LIM((a), 0xffff, 0x0000, (1 << 31) | (1 << 18))
#define limB1(a, l) LIM((a), 0x7fff, -0x8000 * !l, (1 << 31) | (1 << 24))
#define limB2(a, l) LIM((a), 0x7fff, -0x8000 * !l, (1 << 31) | (1 << 23))
#define limB3(a, l) LIM((a), 0x7fff, -0x8000 * !l, (1 << 22) )
#define limC1(a) LIM((a), 0x00ff, 0x0000, (1 << 21) )
#define limC2(a) LIM((a), 0x00ff, 0x0000, (1 << 20) )
#define limC3(a) LIM((a), 0x00ff, 0x0000, (1 << 19) )
#define limD(a) LIM((a), 0xffff, 0x0000, (1 << 31) | (1 << 18))
static inline u32 Lm_E(u32 result) {
static inline u32 limE(u32 result) {
if (result > 0x1ffff) {
gteFLAG |= (1 << 31) | (1 << 17);
return 0x1ffff;
@ -206,20 +206,27 @@ static inline u32 Lm_E(u32 result) {
}
#define F(a) BOUNDS((a), 0x7fffffff, (1 << 31) | (1 << 16), -(s64)0x80000000, (1 << 31) | (1 << 15))
#define Lm_G1(a) LIM((a), 0x3ff, -0x400, (1 << 31) | (1 << 14))
#define Lm_G2(a) LIM((a), 0x3ff, -0x400, (1 << 31) | (1 << 13))
#define Lm_H(a) LIM((a), 0xfff, 0x000, (1 << 12))
#define limG1(a) LIM((a), 0x3ff, -0x400, (1 << 31) | (1 << 14))
#define limG2(a) LIM((a), 0x3ff, -0x400, (1 << 31) | (1 << 13))
#define limH(a) LIM((a), 0xfff, 0x000, (1 << 12))
static inline u32 MFC2(int reg) {
switch(reg) {
case 1: case 3: case 5:
case 8: case 9: case 10:
switch (reg) {
case 1:
case 3:
case 5:
case 8:
case 9:
case 10:
case 11:
psxRegs.CP2D.r[reg] = (s32)psxRegs.CP2D.p[reg].sw.l;
break;
case 7: case 16: case 17:
case 18: case 19:
case 7:
case 16:
case 17:
case 18:
case 19:
psxRegs.CP2D.r[reg] = (u32)psxRegs.CP2D.p[reg].w.l;
break;
@ -227,7 +234,8 @@ static inline u32 MFC2(int reg) {
psxRegs.CP2D.r[reg] = gteSXY2;
break;
case 28: case 30:
case 28:
case 30:
return 0;
case 29:
@ -256,7 +264,7 @@ static inline void MTC2(u32 value, int reg) {
break;
case 30:
{
{
int a;
gteLZCS = value;
@ -268,7 +276,7 @@ static inline void MTC2(u32 value, int reg) {
} else if (a < 0) {
int i;
a ^= 0xffffffff;
for (i=31; (a & (1 << i)) == 0 && i >= 0; i--);
for (i = 31; (a & (1 << i)) == 0 && i >= 0; i--);
gteLZCR = 31 - i;
} else {
gteLZCR = 32;
@ -276,7 +284,9 @@ static inline void MTC2(u32 value, int reg) {
}
break;
case 7: case 29: case 31:
case 7:
case 29:
case 31:
return;
default:
@ -346,21 +356,21 @@ void gteRTPS() {
gteMAC1 = A1((((s64)gteTRX << 12) + (gteR11 * gteVX0) + (gteR12 * gteVY0) + (gteR13 * gteVZ0)) >> 12);
gteMAC2 = A2((((s64)gteTRY << 12) + (gteR21 * gteVX0) + (gteR22 * gteVY0) + (gteR23 * gteVZ0)) >> 12);
gteMAC3 = A3((((s64)gteTRZ << 12) + (gteR31 * gteVX0) + (gteR32 * gteVY0) + (gteR33 * gteVZ0)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 0);
gteIR2 = Lm_B2(gteMAC2, 0);
gteIR3 = Lm_B3(gteMAC3, 0);
gteIR1 = limB1(gteMAC1, 0);
gteIR2 = limB2(gteMAC2, 0);
gteIR3 = limB3(gteMAC3, 0);
gteSZ0 = gteSZ1;
gteSZ1 = gteSZ2;
gteSZ2 = gteSZ3;
gteSZ3 = Lm_D(gteMAC3);
h_over_sz3 = Lm_E((gteH * 65536) / (gteSZ3 + 0.5));
gteSZ3 = limD(gteMAC3);
h_over_sz3 = limE((gteH * 65536) / (gteSZ3 + 0.5));
gteSXY0 = gteSXY1;
gteSXY1 = gteSXY2;
gteSX2 = Lm_G1(F((s64)gteOFX + ((s64)gteIR1 * h_over_sz3)) >> 16);
gteSY2 = Lm_G2(F((s64)gteOFY + ((s64)gteIR2 * h_over_sz3)) >> 16);
gteSX2 = limG1(F((s64)gteOFX + ((s64)gteIR1 * h_over_sz3)) >> 16);
gteSY2 = limG2(F((s64)gteOFY + ((s64)gteIR2 * h_over_sz3)) >> 16);
gteMAC0 = F((s64)(gteDQB + ((s64)gteDQA * h_over_sz3)) >> 12);
gteIR0 = Lm_H(gteMAC0);
gteIR0 = limH(gteMAC0);
}
void gteRTPT() {
@ -381,16 +391,16 @@ void gteRTPT() {
gteMAC1 = A1((((s64)gteTRX << 12) + (gteR11 * vx) + (gteR12 * vy) + (gteR13 * vz)) >> 12);
gteMAC2 = A2((((s64)gteTRY << 12) + (gteR21 * vx) + (gteR22 * vy) + (gteR23 * vz)) >> 12);
gteMAC3 = A3((((s64)gteTRZ << 12) + (gteR31 * vx) + (gteR32 * vy) + (gteR33 * vz)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 0);
gteIR2 = Lm_B2(gteMAC2, 0);
gteIR3 = Lm_B3(gteMAC3, 0);
fSZ(v) = Lm_D(gteMAC3);
h_over_sz3 = Lm_E((gteH * 65536) / (fSZ(v) + 0.5));
fSX(v) = Lm_G1(F((s64)gteOFX + ((s64)gteIR1 * h_over_sz3)) >> 16);
fSY(v) = Lm_G2(F((s64)gteOFY + ((s64)gteIR2 * h_over_sz3)) >> 16);
gteIR1 = limB1(gteMAC1, 0);
gteIR2 = limB2(gteMAC2, 0);
gteIR3 = limB3(gteMAC3, 0);
fSZ(v) = limD(gteMAC3);
h_over_sz3 = limE((gteH * 65536) / (fSZ(v) + 0.5));
fSX(v) = limG1(F((s64)gteOFX + ((s64)gteIR1 * h_over_sz3)) >> 16);
fSY(v) = limG2(F((s64)gteOFY + ((s64)gteIR2 * h_over_sz3)) >> 16);
}
gteMAC0 = F((s64)(gteDQB + ((s64)gteDQA * h_over_sz3)) >> 12);
gteIR0 = Lm_H(gteMAC0);
gteIR0 = limH(gteMAC0);
}
void gteMVMVA() {
@ -412,9 +422,9 @@ void gteMVMVA() {
gteMAC2 = A2((((s64)CV2(cv) << 12) + (MX21(mx) * vx) + (MX22(mx) * vy) + (MX23(mx) * vz)) >> shift);
gteMAC3 = A3((((s64)CV3(cv) << 12) + (MX31(mx) * vx) + (MX32(mx) * vy) + (MX33(mx) * vz)) >> shift);
gteIR1 = Lm_B1(gteMAC1, lm);
gteIR2 = Lm_B2(gteMAC2, lm);
gteIR3 = Lm_B3(gteMAC3, lm);
gteIR1 = limB1(gteMAC1, lm);
gteIR2 = limB2(gteMAC2, lm);
gteIR3 = limB3(gteMAC3, lm);
}
void gteNCLIP() {
@ -435,7 +445,7 @@ void gteAVSZ3() {
gteFLAG = 0;
gteMAC0 = F((s64)(gteZSF3 * gteSZ1) + (gteZSF3 * gteSZ2) + (gteZSF3 * gteSZ3));
gteOTZ = Lm_D(gteMAC0 >> 12);
gteOTZ = limD(gteMAC0 >> 12);
}
void gteAVSZ4() {
@ -445,7 +455,7 @@ void gteAVSZ4() {
gteFLAG = 0;
gteMAC0 = F((s64)(gteZSF4 * (gteSZ0 + gteSZ1 + gteSZ2 + gteSZ3)));
gteOTZ = Lm_D(gteMAC0 >> 12);
gteOTZ = limD(gteMAC0 >> 12);
}
void gteSQR() {
@ -460,9 +470,9 @@ void gteSQR() {
gteMAC1 = A1((gteIR1 * gteIR1) >> shift);
gteMAC2 = A2((gteIR2 * gteIR2) >> shift);
gteMAC3 = A3((gteIR3 * gteIR3) >> shift);
gteIR1 = Lm_B1(gteMAC1 >> shift, lm);
gteIR2 = Lm_B2(gteMAC2 >> shift, lm);
gteIR3 = Lm_B3(gteMAC3 >> shift, lm);
gteIR1 = limB1(gteMAC1 >> shift, lm);
gteIR2 = limB2(gteMAC2 >> shift, lm);
gteIR3 = limB3(gteMAC3 >> shift, lm);
}
void gteNCCS() {
@ -474,28 +484,28 @@ void gteNCCS() {
gteMAC1 = A1((((s64)gteL11 * gteVX0) + (gteL12 * gteVY0) + (gteL13 * gteVZ0)) >> 12);
gteMAC2 = A2((((s64)gteL21 * gteVX0) + (gteL22 * gteVY0) + (gteL23 * gteVZ0)) >> 12);
gteMAC3 = A3((((s64)gteL31 * gteVX0) + (gteL32 * gteVY0) + (gteL33 * gteVZ0)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteMAC1 = A1((((s64)gteRBK << 12) + (gteLR1 * gteIR1) + (gteLR2 * gteIR2) + (gteLR3 * gteIR3)) >> 12);
gteMAC2 = A2((((s64)gteGBK << 12) + (gteLG1 * gteIR1) + (gteLG2 * gteIR2) + (gteLG3 * gteIR3)) >> 12);
gteMAC3 = A3((((s64)gteBBK << 12) + (gteLB1 * gteIR1) + (gteLB2 * gteIR2) + (gteLB3 * gteIR3)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteMAC1 = A1(((s64)gteR * gteIR1) >> 8);
gteMAC2 = A2(((s64)gteG * gteIR2) >> 8);
gteMAC3 = A3(((s64)gteB * gteIR3) >> 8);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
void gteNCCT() {
@ -514,15 +524,15 @@ void gteNCCT() {
gteMAC1 = A1((((s64)gteL11 * vx) + (gteL12 * vy) + (gteL13 * vz)) >> 12);
gteMAC2 = A2((((s64)gteL21 * vx) + (gteL22 * vy) + (gteL23 * vz)) >> 12);
gteMAC3 = A3((((s64)gteL31 * vx) + (gteL32 * vy) + (gteL33 * vz)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteMAC1 = A1((((s64)gteRBK << 12) + (gteLR1 * gteIR1) + (gteLR2 * gteIR2) + (gteLR3 * gteIR3)) >> 12);
gteMAC2 = A2((((s64)gteGBK << 12) + (gteLG1 * gteIR1) + (gteLG2 * gteIR2) + (gteLG3 * gteIR3)) >> 12);
gteMAC3 = A3((((s64)gteBBK << 12) + (gteLB1 * gteIR1) + (gteLB2 * gteIR2) + (gteLB3 * gteIR3)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteMAC1 = A1(((s64)gteR * gteIR1) >> 8);
gteMAC2 = A2(((s64)gteG * gteIR2) >> 8);
gteMAC3 = A3(((s64)gteB * gteIR3) >> 8);
@ -530,13 +540,13 @@ void gteNCCT() {
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
}
void gteNCDS() {
@ -548,28 +558,28 @@ void gteNCDS() {
gteMAC1 = A1((((s64)gteL11 * gteVX0) + (gteL12 * gteVY0) + (gteL13 * gteVZ0)) >> 12);
gteMAC2 = A2((((s64)gteL21 * gteVX0) + (gteL22 * gteVY0) + (gteL23 * gteVZ0)) >> 12);
gteMAC3 = A3((((s64)gteL31 * gteVX0) + (gteL32 * gteVY0) + (gteL33 * gteVZ0)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteMAC1 = A1((((s64)gteRBK << 12) + (gteLR1 * gteIR1) + (gteLR2 * gteIR2) + (gteLR3 * gteIR3)) >> 12);
gteMAC2 = A2((((s64)gteGBK << 12) + (gteLG1 * gteIR1) + (gteLG2 * gteIR2) + (gteLG3 * gteIR3)) >> 12);
gteMAC3 = A3((((s64)gteBBK << 12) + (gteLB1 * gteIR1) + (gteLB2 * gteIR2) + (gteLB3 * gteIR3)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteMAC1 = A1(((((s64)gteR << 4) * gteIR1) + (gteIR0 * Lm_B1(gteRFC - ((gteR * gteIR1) >> 8), 0))) >> 12);
gteMAC2 = A2(((((s64)gteG << 4) * gteIR2) + (gteIR0 * Lm_B2(gteGFC - ((gteG * gteIR2) >> 8), 0))) >> 12);
gteMAC3 = A3(((((s64)gteB << 4) * gteIR3) + (gteIR0 * Lm_B3(gteBFC - ((gteB * gteIR3) >> 8), 0))) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteMAC1 = A1(((((s64)gteR << 4) * gteIR1) + (gteIR0 * limB1(gteRFC - ((gteR * gteIR1) >> 8), 0))) >> 12);
gteMAC2 = A2(((((s64)gteG << 4) * gteIR2) + (gteIR0 * limB2(gteGFC - ((gteG * gteIR2) >> 8), 0))) >> 12);
gteMAC3 = A3(((((s64)gteB << 4) * gteIR3) + (gteIR0 * limB3(gteBFC - ((gteB * gteIR3) >> 8), 0))) >> 12);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
void gteNCDT() {
@ -588,29 +598,29 @@ void gteNCDT() {
gteMAC1 = A1((((s64)gteL11 * vx) + (gteL12 * vy) + (gteL13 * vz)) >> 12);
gteMAC2 = A2((((s64)gteL21 * vx) + (gteL22 * vy) + (gteL23 * vz)) >> 12);
gteMAC3 = A3((((s64)gteL31 * vx) + (gteL32 * vy) + (gteL33 * vz)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteMAC1 = A1((((s64)gteRBK << 12) + (gteLR1 * gteIR1) + (gteLR2 * gteIR2) + (gteLR3 * gteIR3)) >> 12);
gteMAC2 = A2((((s64)gteGBK << 12) + (gteLG1 * gteIR1) + (gteLG2 * gteIR2) + (gteLG3 * gteIR3)) >> 12);
gteMAC3 = A3((((s64)gteBBK << 12) + (gteLB1 * gteIR1) + (gteLB2 * gteIR2) + (gteLB3 * gteIR3)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteMAC1 = A1(((((s64)gteR << 4) * gteIR1) + (gteIR0 * Lm_B1(gteRFC - ((gteR * gteIR1) >> 8), 0))) >> 12);
gteMAC2 = A2(((((s64)gteG << 4) * gteIR2) + (gteIR0 * Lm_B2(gteGFC - ((gteG * gteIR2) >> 8), 0))) >> 12);
gteMAC3 = A3(((((s64)gteB << 4) * gteIR3) + (gteIR0 * Lm_B3(gteBFC - ((gteB * gteIR3) >> 8), 0))) >> 12);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteMAC1 = A1(((((s64)gteR << 4) * gteIR1) + (gteIR0 * limB1(gteRFC - ((gteR * gteIR1) >> 8), 0))) >> 12);
gteMAC2 = A2(((((s64)gteG << 4) * gteIR2) + (gteIR0 * limB2(gteGFC - ((gteG * gteIR2) >> 8), 0))) >> 12);
gteMAC3 = A3(((((s64)gteB << 4) * gteIR3) + (gteIR0 * limB3(gteBFC - ((gteB * gteIR3) >> 8), 0))) >> 12);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
}
void gteOP() {
@ -625,36 +635,36 @@ void gteOP() {
gteMAC1 = A1(((s64)(gteR22 * gteIR3) - (gteR33 * gteIR2)) >> shift);
gteMAC2 = A2(((s64)(gteR33 * gteIR1) - (gteR11 * gteIR3)) >> shift);
gteMAC3 = A3(((s64)(gteR11 * gteIR2) - (gteR22 * gteIR1)) >> shift);
gteIR1 = Lm_B1(gteMAC1, lm);
gteIR2 = Lm_B2(gteMAC2, lm);
gteIR3 = Lm_B3(gteMAC3, lm);
gteIR1 = limB1(gteMAC1, lm);
gteIR2 = limB2(gteMAC2, lm);
gteIR3 = limB3(gteMAC3, lm);
}
void gteDCPL() {
int shift = 12 * GTE_SF(gteop);
int lm = GTE_LM(gteop);
s64 iR = (gteR << 4) * gteIR1;
s64 iG = (gteG << 4) * gteIR2;
s64 iB = (gteB << 4) * gteIR3;
s64 iR = (gteR << 4) * gteIR1;
s64 iG = (gteG << 4) * gteIR2;
s64 iB = (gteB << 4) * gteIR3;
#ifdef GTE_LOG
GTE_LOG("DCPL\n");
#endif
gteFLAG = 0;
gteMAC1 = A1(iR + gteIR0 * Lm_B1(gteRFC - iR, 0)) >> shift;
gteMAC2 = A2(iG + gteIR0 * Lm_B1(gteGFC - iG, 0)) >> shift;
gteMAC3 = A3(iB + gteIR0 * Lm_B1(gteBFC - iB, 0)) >> shift;
gteMAC1 = A1(iR + gteIR0 * limB1(gteRFC - iR, 0)) >> shift;
gteMAC2 = A2(iG + gteIR0 * limB1(gteGFC - iG, 0)) >> shift;
gteMAC3 = A3(iB + gteIR0 * limB1(gteBFC - iB, 0)) >> shift;
gteIR1 = Lm_B1(gteMAC1 >> 4, lm);
gteIR2 = Lm_B2(gteMAC2 >> 4, lm);
gteIR3 = Lm_B3(gteMAC3 >> 4, lm);
gteIR1 = limB1(gteMAC1 >> 4, lm);
gteIR2 = limB2(gteMAC2 >> 4, lm);
gteIR3 = limB3(gteMAC3 >> 4, lm);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
void gteGPF() {
@ -668,16 +678,16 @@ void gteGPF() {
gteMAC1 = A1(((s64)gteIR0 * gteIR1) >> shift);
gteMAC2 = A2(((s64)gteIR0 * gteIR2) >> shift);
gteMAC3 = A3(((s64)gteIR0 * gteIR3) >> shift);
gteIR1 = Lm_B1(gteMAC1, 0);
gteIR2 = Lm_B2(gteMAC2, 0);
gteIR3 = Lm_B3(gteMAC3, 0);
gteIR1 = limB1(gteMAC1, 0);
gteIR2 = limB2(gteMAC2, 0);
gteIR3 = limB3(gteMAC3, 0);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
void gteGPL() {
@ -691,16 +701,16 @@ void gteGPL() {
gteMAC1 = A1((((s64)gteMAC1 << shift) + (gteIR0 * gteIR1)) >> shift);
gteMAC2 = A2((((s64)gteMAC2 << shift) + (gteIR0 * gteIR2)) >> shift);
gteMAC3 = A3((((s64)gteMAC3 << shift) + (gteIR0 * gteIR3)) >> shift);
gteIR1 = Lm_B1(gteMAC1, 0);
gteIR2 = Lm_B2(gteMAC2, 0);
gteIR3 = Lm_B3(gteMAC3, 0);
gteIR1 = limB1(gteMAC1, 0);
gteIR2 = limB2(gteMAC2, 0);
gteIR3 = limB3(gteMAC3, 0);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
void gteDPCS() {
@ -711,19 +721,19 @@ void gteDPCS() {
#endif
gteFLAG = 0;
gteMAC1 = A1(((gteR << 16) + (gteIR0 * Lm_B1(A1((s64)gteRFC - (gteR << 4)) << (12 - shift), 0))) >> 12);
gteMAC2 = A2(((gteG << 16) + (gteIR0 * Lm_B2(A2((s64)gteGFC - (gteG << 4)) << (12 - shift), 0))) >> 12);
gteMAC3 = A3(((gteB << 16) + (gteIR0 * Lm_B3(A3((s64)gteBFC - (gteB << 4)) << (12 - shift), 0))) >> 12);
gteMAC1 = A1(((gteR << 16) + (gteIR0 * limB1(A1((s64)gteRFC - (gteR << 4)) << (12 - shift), 0))) >> 12);
gteMAC2 = A2(((gteG << 16) + (gteIR0 * limB2(A2((s64)gteGFC - (gteG << 4)) << (12 - shift), 0))) >> 12);
gteMAC3 = A3(((gteB << 16) + (gteIR0 * limB3(A3((s64)gteBFC - (gteB << 4)) << (12 - shift), 0))) >> 12);
gteIR1 = Lm_B1(gteMAC1, 0);
gteIR2 = Lm_B2(gteMAC2, 0);
gteIR3 = Lm_B3(gteMAC3, 0);
gteIR1 = limB1(gteMAC1, 0);
gteIR2 = limB2(gteMAC2, 0);
gteIR3 = limB3(gteMAC3, 0);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
void gteDPCT() {
@ -735,20 +745,20 @@ void gteDPCT() {
gteFLAG = 0;
for (v = 0; v < 3; v++) {
gteMAC1 = A1((((s64)gteR0 << 16) + ((s64)gteIR0 * (Lm_B1(gteRFC - (gteR0 << 4), 0)))) >> 12);
gteMAC2 = A2((((s64)gteG0 << 16) + ((s64)gteIR0 * (Lm_B1(gteGFC - (gteG0 << 4), 0)))) >> 12);
gteMAC3 = A3((((s64)gteB0 << 16) + ((s64)gteIR0 * (Lm_B1(gteBFC - (gteB0 << 4), 0)))) >> 12);
gteMAC1 = A1((((s64)gteR0 << 16) + ((s64)gteIR0 * (limB1(gteRFC - (gteR0 << 4), 0)))) >> 12);
gteMAC2 = A2((((s64)gteG0 << 16) + ((s64)gteIR0 * (limB1(gteGFC - (gteG0 << 4), 0)))) >> 12);
gteMAC3 = A3((((s64)gteB0 << 16) + ((s64)gteIR0 * (limB1(gteBFC - (gteB0 << 4), 0)))) >> 12);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
gteIR1 = Lm_B1(gteMAC1, 0);
gteIR2 = Lm_B2(gteMAC2, 0);
gteIR3 = Lm_B3(gteMAC3, 0);
gteIR1 = limB1(gteMAC1, 0);
gteIR2 = limB2(gteMAC2, 0);
gteIR3 = limB3(gteMAC3, 0);
}
void gteNCS() {
@ -760,22 +770,22 @@ void gteNCS() {
gteMAC1 = A1((((s64)gteL11 * gteVX0) + (gteL12 * gteVY0) + (gteL13 * gteVZ0)) >> 12);
gteMAC2 = A2((((s64)gteL21 * gteVX0) + (gteL22 * gteVY0) + (gteL23 * gteVZ0)) >> 12);
gteMAC3 = A3((((s64)gteL31 * gteVX0) + (gteL32 * gteVY0) + (gteL33 * gteVZ0)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteMAC1 = A1((((s64)gteRBK << 12) + (gteLR1 * gteIR1) + (gteLR2 * gteIR2) + (gteLR3 * gteIR3)) >> 12);
gteMAC2 = A2((((s64)gteGBK << 12) + (gteLG1 * gteIR1) + (gteLG2 * gteIR2) + (gteLG3 * gteIR3)) >> 12);
gteMAC3 = A3((((s64)gteBBK << 12) + (gteLB1 * gteIR1) + (gteLB2 * gteIR2) + (gteLB3 * gteIR3)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
void gteNCT() {
@ -794,22 +804,22 @@ void gteNCT() {
gteMAC1 = A1((((s64)gteL11 * vx) + (gteL12 * vy) + (gteL13 * vz)) >> 12);
gteMAC2 = A2((((s64)gteL21 * vx) + (gteL22 * vy) + (gteL23 * vz)) >> 12);
gteMAC3 = A3((((s64)gteL31 * vx) + (gteL32 * vy) + (gteL33 * vz)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteMAC1 = A1((((s64)gteRBK << 12) + (gteLR1 * gteIR1) + (gteLR2 * gteIR2) + (gteLR3 * gteIR3)) >> 12);
gteMAC2 = A2((((s64)gteGBK << 12) + (gteLG1 * gteIR1) + (gteLG2 * gteIR2) + (gteLG3 * gteIR3)) >> 12);
gteMAC3 = A3((((s64)gteBBK << 12) + (gteLB1 * gteIR1) + (gteLB2 * gteIR2) + (gteLB3 * gteIR3)) >> 12);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
}
void gteCC() {
@ -821,22 +831,22 @@ void gteCC() {
gteMAC1 = A1((((s64)gteRBK << 12) + (gteLR1 * gteIR1) + (gteLR2 * gteIR2) + (gteLR3 * gteIR3)) >> 12);
gteMAC2 = A2((((s64)gteGBK << 12) + (gteLG1 * gteIR1) + (gteLG2 * gteIR2) + (gteLG3 * gteIR3)) >> 12);
gteMAC3 = A3((((s64)gteBBK << 12) + (gteLB1 * gteIR1) + (gteLB2 * gteIR2) + (gteLB3 * gteIR3)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteMAC1 = A1(((s64)gteR * gteIR1) >> 8);
gteMAC2 = A2(((s64)gteG * gteIR2) >> 8);
gteMAC3 = A3(((s64)gteB * gteIR3) >> 8);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
void gteINTPL() {
@ -848,18 +858,18 @@ void gteINTPL() {
#endif
gteFLAG = 0;
gteMAC1 = A1(((gteIR1 << 12) + (gteIR0 * Lm_B1(((s64)gteRFC - gteIR1), 0))) >> shift);
gteMAC2 = A2(((gteIR2 << 12) + (gteIR0 * Lm_B2(((s64)gteGFC - gteIR2), 0))) >> shift);
gteMAC3 = A3(((gteIR3 << 12) + (gteIR0 * Lm_B3(((s64)gteBFC - gteIR3), 0))) >> shift);
gteIR1 = Lm_B1(gteMAC1, lm);
gteIR2 = Lm_B2(gteMAC2, lm);
gteIR3 = Lm_B3(gteMAC3, lm);
gteMAC1 = A1(((gteIR1 << 12) + (gteIR0 * limB1(((s64)gteRFC - gteIR1), 0))) >> shift);
gteMAC2 = A2(((gteIR2 << 12) + (gteIR0 * limB2(((s64)gteGFC - gteIR2), 0))) >> shift);
gteMAC3 = A3(((gteIR3 << 12) + (gteIR0 * limB3(((s64)gteBFC - gteIR3), 0))) >> shift);
gteIR1 = limB1(gteMAC1, lm);
gteIR2 = limB2(gteMAC2, lm);
gteIR3 = limB3(gteMAC3, lm);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}
void gteCDP() {
@ -871,20 +881,20 @@ void gteCDP() {
gteMAC1 = A1((((s64)gteRBK << 12) + (gteLR1 * gteIR1) + (gteLR2 * gteIR2) + (gteLR3 * gteIR3)) >> 12);
gteMAC2 = A2((((s64)gteGBK << 12) + (gteLG1 * gteIR1) + (gteLG2 * gteIR2) + (gteLG3 * gteIR3)) >> 12);
gteMAC3 = A3((((s64)gteBBK << 12) + (gteLB1 * gteIR1) + (gteLB2 * gteIR2) + (gteLB3 * gteIR3)) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteMAC1 = A1(((((s64)gteR << 4) * gteIR1) + (gteIR0 * Lm_B1(gteRFC - ((gteR * gteIR1) >> 8), 0))) >> 12);
gteMAC2 = A2(((((s64)gteG << 4) * gteIR2) + (gteIR0 * Lm_B2(gteGFC - ((gteG * gteIR2) >> 8), 0))) >> 12);
gteMAC3 = A3(((((s64)gteB << 4) * gteIR3) + (gteIR0 * Lm_B3(gteBFC - ((gteB * gteIR3) >> 8), 0))) >> 12);
gteIR1 = Lm_B1(gteMAC1, 1);
gteIR2 = Lm_B2(gteMAC2, 1);
gteIR3 = Lm_B3(gteMAC3, 1);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteMAC1 = A1(((((s64)gteR << 4) * gteIR1) + (gteIR0 * limB1(gteRFC - ((gteR * gteIR1) >> 8), 0))) >> 12);
gteMAC2 = A2(((((s64)gteG << 4) * gteIR2) + (gteIR0 * limB2(gteGFC - ((gteG * gteIR2) >> 8), 0))) >> 12);
gteMAC3 = A3(((((s64)gteB << 4) * gteIR3) + (gteIR0 * limB3(gteBFC - ((gteB * gteIR3) >> 8), 0))) >> 12);
gteIR1 = limB1(gteMAC1, 1);
gteIR2 = limB2(gteMAC2, 1);
gteIR3 = limB3(gteMAC3, 1);
gteRGB0 = gteRGB1;
gteRGB1 = gteRGB2;
gteCODE2 = gteCODE;
gteR2 = Lm_C1(gteMAC1 >> 4);
gteG2 = Lm_C2(gteMAC2 >> 4);
gteB2 = Lm_C3(gteMAC3 >> 4);
gteR2 = limC1(gteMAC1 >> 4);
gteG2 = limC2(gteMAC2 >> 4);
gteB2 = limC3(gteMAC3 >> 4);
}