diff options
| author | iCatButler <i.am.catbutler@gmail.com> | 2016-03-25 16:25:15 +0000 |
|---|---|---|
| committer | iCatButler <i.am.catbutler@gmail.com> | 2016-03-25 16:25:15 +0000 |
| commit | 7767ea4acbae995cd8e6302bdb7c97e89748dfd8 (patch) | |
| tree | b4a3025b703f8f3f383626aa5a651b2954c3a512 /libpcsxcore/pgxp_gte.c | |
| parent | 106f6594c9e2ad601deb7ad9bdf5eab8a568c01b (diff) | |
Initial upload of PGXP.
Diffstat (limited to 'libpcsxcore/pgxp_gte.c')
| -rw-r--r-- | libpcsxcore/pgxp_gte.c | 437 |
1 files changed, 437 insertions, 0 deletions
diff --git a/libpcsxcore/pgxp_gte.c b/libpcsxcore/pgxp_gte.c new file mode 100644 index 00000000..4b22c778 --- /dev/null +++ b/libpcsxcore/pgxp_gte.c @@ -0,0 +1,437 @@ +/***************************************************************************
+* Copyright (C) 2016 by iCatButler *
+* *
+* This program is free software; you can redistribute it and/or modify *
+* it under the terms of the GNU General Public License as published by *
+* the Free Software Foundation; either version 2 of the License, or *
+* (at your option) any later version. *
+* *
+* This program is distributed in the hope that it will be useful, *
+* but WITHOUT ANY WARRANTY; without even the implied warranty of *
+* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
+* GNU General Public License for more details. *
+* *
+* You should have received a copy of the GNU General Public License *
+* along with this program; if not, write to the *
+* Free Software Foundation, Inc., *
+* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. *
+***************************************************************************/
+
+/**************************************************************************
+* pgxp_gte.c
+* PGXP - Parallel/Precision Geometry Xform Pipeline
+*
+* Created on: 12 Mar 2016
+* Author: iCatButler
+***************************************************************************/ + +#include "pgxp_gte.h" +#include "psxmem.h" + +typedef struct +{ + float x; + float y; + float z; + unsigned int valid; + unsigned int count; +} precise_value; + +typedef union +{ + struct + { + s16 x; + s16 y; + }; + u32 word; +} low_value; + +#define tolerance 1.0f + +precise_value GTE_reg[32]; +precise_value CPU_reg[32]; + +precise_value Mem[2048 * 1024 / 4]; // mirror 2MB in 32-bit words +precise_value Scratch[2048 * 1024 / 4]; // mirror 2MB in 32-bit words + +void PGXP_Init() +{ + memset(Mem, 0, sizeof(Mem)); +} + +char* PGXP_GetMem() +{ + return (char*)(Mem); +} + +#define VRAM 0 +#define SCRATCH 1 + +precise_value* ReadMem(u32 addr) +{ + u32 memType; + uint32_t paddr = addr; + int* ip = NULL; + + switch (paddr >> 20) + { + case 0x800: + case 0x801: + case 0xa00: + case 0xa01: + case 0x000: + case 0x001: + memType = VRAM; + break; + case 0x1f8: + memType = SCRATCH; + break; + default: + return NULL; + } + +#ifdef GTE_LOG + //GTE_LOG("PGXP_Read %x [%x] |", addr, paddr); +#endif + if (memType == VRAM) + { + paddr = (paddr & 0x1FFFFF) >> 2; + return &Mem[paddr]; + } + else if (memType == SCRATCH) + { + paddr = (paddr & 0x1FFFFF) >> 2; + return &Scratch[paddr]; + } + + return NULL; +} + +void WriteMem(precise_value value, u32 addr) +{ + u32 memType; + uint32_t paddr = addr; + int* ip = NULL; + + switch (paddr >> 20) + { + case 0x800: + case 0x801: + case 0xa00: + case 0xa01: + case 0x000: + case 0x001: + memType = VRAM; + break; + case 0x1f8: + memType = SCRATCH; + break; + default: + if (value.valid) + *ip = 5; + return; + } + +#ifdef GTE_LOG + GTE_LOG("PGXP_Write %x [%x] |", addr, paddr); +#endif + + // Store to RAM + if (memType == VRAM) + { + paddr = (paddr & 0x1FFFFF) >> 2; + Mem[paddr] = value; + } + else if (memType == SCRATCH) + { + paddr = (paddr & 0x1FFFFF) >> 2;// (paddr & 0x3FFF) >> 2; + Scratch[paddr] = value; + } +} + +#define SX0 (GTE_reg[ 12 ].x) +#define SY0 (GTE_reg[ 12 ].y) +#define SX1 (GTE_reg[ 13 ].x) +#define SY1 (GTE_reg[ 13 ].y) +#define SX2 (GTE_reg[ 14 ].x) +#define SY2 (GTE_reg[ 14 ].y) + +#define SXY0 (GTE_reg[ 12 ]) +#define SXY1 (GTE_reg[ 13 ]) +#define SXY2 (GTE_reg[ 14 ]) +#define SXYP (GTE_reg[ 15 ]) + +unsigned int PGXP_validate(float high, s16 low) +{ + if (fabs(high - (float)(low)) < tolerance) + return 1; + return 0; +} + +// Check that value is still within tolerance of low precision value and invalidate if not +precise_value PGXP_validateXY(precise_value *high, u32 low) +{ + low_value temp; + precise_value ret; + + ret.valid = 0; + temp.word = low; + + if (!high) + return ret; + + high->valid = (high->valid && PGXP_validate(high->x, temp.x) && PGXP_validate(high->y, temp.y)); + + // Cheat + //if (!high->valid) + //{ + // high->x = temp.x; + // high->y = temp.y; + // high->valid = 1; + //} + + return *high; +} + +u32 PGXP_compareXY(precise_value high, u32 low) +{ + low_value temp; + temp.word = low; + + if (PGXP_validate(high.x, temp.x) && PGXP_validate(high.y, temp.y)) + return 1; + return 0; +} + +precise_value PGXP_copyXY(u32 low) +{ + low_value temp; + precise_value ret; + + ret.valid = 0; + temp.word = low; + + ret.x = temp.x; + ret.y = temp.y; + ret.count = 0; + ret.valid = 1; + + return ret; +} + +void PGXP_pushSXYZ2f(float _x, float _y, float _z) +{ + static unsigned int uCount = 0; + // push values down FIFO + SXY0 = SXY1; + SXY1 = SXY2; + + SXY2.x = _x; + SXY2.y = _y; + SXY2.z = _z; + SXY2.valid = 1; + SXY2.count = uCount++; + +#ifdef GTE_LOG + GTE_LOG("PGPR_PUSH (%f, %f) %u %u|", SXY2.x, SXY2.y, SXY2.valid, SXY2.count); +#endif +} + +void PGXP_pushSXYZ2s(s64 _x, s64 _y, s64 _z) +{ + float fx = (float)(_x) / (float)(1 << 16); + float fy = (float)(_y) / (float)(1 << 16); + float fz = (float)(_z); + + PGXP_pushSXYZ2f(fx, fy, fz); +} + +int PGXP_NLCIP_valid() +{ + if (SXY0.valid && SXY1.valid && SXY2.valid) + return 1; + return 0; +} + +float PGXP_NCLIP() +{ + float nclip = ((SX0 * SY1) + (SX1 * SY2) + (SX2 * SY0) - (SX0 * SY2) - (SX1 * SY0) - (SX2 * SY1)); + + // ensure fractional values are not incorrectly rounded to 0 + if (fabs(nclip) < 1.0f) + nclip += (nclip < 0.f ? -2 : 2); + + return nclip; +} + +static precise_value PGXP_MFC2_int(u32 reg) +{ + switch (reg) + { + case 15: + GTE_reg[reg] = SXYP = SXY2; + break; + } + + return GTE_reg[reg]; +} + + +static void PGXP_MTC2_int(precise_value value, u32 reg) +{ + switch(reg) + { + case 15: + // push FIFO + SXY0 = SXY1; + SXY1 = SXY2; + SXY2 = value; + SXYP = SXY2; + break; + + case 31: + return; + } + + GTE_reg[reg] = value; +} + +// copy GTE data reg to GPR reg (MFC2) +void PGXP_MFC2(u32 gpr, u32 gtr, u32 value) +{ + if (!gpr) return; +#ifdef GTE_LOG + GTE_LOG("PGXP_MFC2 [%x] [%x] %x (%u %u)|", gpr, gtr, value, GTE_reg[gtr].valid, GTE_reg[gtr].count); +#endif + + CPU_reg[gpr] = PGXP_validateXY(>E_reg[gtr], value); +} + +// copy GPR reg to GTE data reg (MTC2) +void PGXP_MTC2(u32 gpr, u32 gtr, u32 value) +{ +#ifdef GTE_LOG + GTE_LOG("PGXP_MTC2 [%x] [%x] %x (%u %u)|", gpr, gtr, value, CPU_reg[gtr].valid, CPU_reg[gtr].count); +#endif + PGXP_MTC2_int(PGXP_validateXY(&CPU_reg[gpr], value), gtr); +} + +// copy memory to GTE reg +void PGXP_LWC2(u32 addr, u32 gtr, u32 value) +{ +#ifdef GTE_LOG + precise_value* pp = ReadMem(addr); + precise_value p; + low_value temp; + temp.word = value; + + p.x = p.y = p.valid = 0; + + if (pp) + p = *pp; + + GTE_LOG("PGXP_LWC2 %x [%x] %x (%d, %d) (%f, %f) %u %u|", addr, gtr, value, temp.x, temp.y, p.x, p.y, p.valid, p.count); +#endif + PGXP_MTC2_int(PGXP_validateXY(ReadMem(addr), value), gtr); +} + +//copy GTE reg to memory +void PGXP_SWC2(u32 addr, u32 gtr, u32 value) +{ +#ifdef GTE_LOG + low_value temp; + temp.word = value; + + if (PGXP_compareXY(GTE_reg[gtr], value)) + GTE_LOG("PGPR_SWC2 %x [%x] %x (%d, %d) (%f, %f) %u %u|", addr, gtr, value, temp.x, temp.y, GTE_reg[gtr].x, GTE_reg[gtr].y, GTE_reg[gtr].valid, GTE_reg[gtr].count); +#endif + WriteMem(PGXP_validateXY(>E_reg[gtr], value), addr); +} + +// ltore 32bit word +void PGPR_L32(u32 addr, u32 code, u32 value) +{ + u32 reg = ((code >> 16) & 0x1F); // The rt part of the instruction register + u32 op = ((code >> 26)); + precise_value p; + + low_value temp; + temp.word = value; + + p.x = p.y = p.valid = p.count = 0; + + switch (op) + { + case 34: //LWL + CPU_reg[reg] = PGXP_validateXY(ReadMem(addr), value); + break; + case 35: //LW + CPU_reg[reg] = PGXP_validateXY(ReadMem(addr), value); + break; + case 37: //LWR + CPU_reg[reg] = PGXP_validateXY(ReadMem(addr), value); + break; + case 50: //LWC2 (GTE vertex reads) + GTE_reg[reg] = PGXP_validateXY(ReadMem(addr), value); + break; + default: + // invalidate register + // WriteMem(p, addr); + break; + } + +#ifdef GTE_LOG + GTE_LOG("PGPR_L32 %u: %x %x[%x %x] (%d, %d) (%f, %f) %x %u|", op, addr, value, code, reg, temp.x, temp.y, CPU_reg[reg].x, CPU_reg[reg].y, CPU_reg[reg].valid, CPU_reg[reg].count); +#endif +} + +// store 32bit word +void PGPR_S32(u32 addr, u32 code, u32 value) +{ + u32 reg = ((code >> 16) & 0x1F); // The rt part of the instruction register + u32 op = ((code >> 26)); + precise_value p; + + low_value temp; + temp.word = value; + + p.x = p.y = p.valid = p.count = 0; + +#ifdef GTE_LOG + GTE_LOG("PGPR_S32 %u: %x %x[%x %x] (%d, %d) (%f, %f) %x %u|", op, addr, value, code, reg, temp.x, temp.y, CPU_reg[reg].x, CPU_reg[reg].y, CPU_reg[reg].valid, CPU_reg[reg].count); +#endif + + switch (op) + { + case 42: //SWL + WriteMem(PGXP_validateXY(&CPU_reg[reg], value), addr); + break; + case 43: //SW + WriteMem(PGXP_validateXY(&CPU_reg[reg], value), addr); + break; + case 46: //SWR + WriteMem(PGXP_validateXY(&CPU_reg[reg], value), addr); + break; + case 58: //SWC2 (GTE vertex writes) + WriteMem(PGXP_validateXY(>E_reg[reg], value), addr); + break; + default: + // invalidate memory + // WriteMem(p, addr); + break; + } +} + +u32 PGXP_psxMemRead32Trace(u32 mem, u32 code) +{ + u32 value = psxMemRead32(mem); + PGPR_L32(mem, code, value); + return value; +} + +void PGXP_psxMemWrite32Trace(u32 mem, u32 value, u32 code) +{ + PGPR_S32(mem, code, value); + psxMemWrite32(mem, value); +}
\ No newline at end of file |
