2023-09-03 04:30:26 +00:00
|
|
|
// SPDX-FileCopyrightText: 2016 iCatButler, 2019-2023 Connor McLaughlin <stenzek@gmail.com>
|
|
|
|
// SPDX-License-Identifier: GPL-2.0+
|
2020-08-01 14:25:07 +00:00
|
|
|
|
|
|
|
#include "pgxp.h"
|
2021-05-25 10:01:00 +00:00
|
|
|
#include "bus.h"
|
|
|
|
#include "cpu_core.h"
|
2020-08-01 14:25:07 +00:00
|
|
|
#include "settings.h"
|
2023-09-03 04:30:26 +00:00
|
|
|
|
|
|
|
#include "common/log.h"
|
|
|
|
|
2020-08-19 15:21:36 +00:00
|
|
|
#include <climits>
|
2020-09-02 12:44:52 +00:00
|
|
|
#include <cmath>
|
2023-09-03 04:30:26 +00:00
|
|
|
|
2021-06-12 10:44:09 +00:00
|
|
|
Log_SetChannel(PGXP);
|
2020-08-01 14:25:07 +00:00
|
|
|
|
|
|
|
namespace PGXP {
|
2021-06-12 12:02:28 +00:00
|
|
|
|
|
|
|
enum : u32
|
|
|
|
{
|
|
|
|
VERTEX_CACHE_WIDTH = 0x800 * 2,
|
|
|
|
VERTEX_CACHE_HEIGHT = 0x800 * 2,
|
|
|
|
VERTEX_CACHE_SIZE = VERTEX_CACHE_WIDTH * VERTEX_CACHE_HEIGHT,
|
2023-11-06 08:09:27 +00:00
|
|
|
PGXP_MEM_SIZE = (static_cast<u32>(Bus::RAM_8MB_SIZE) + static_cast<u32>(CPU::SCRATCHPAD_SIZE)) / 4,
|
2021-08-22 14:17:51 +00:00
|
|
|
PGXP_MEM_SCRATCH_OFFSET = Bus::RAM_8MB_SIZE / 4
|
2021-06-12 12:02:28 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
#define NONE 0
|
|
|
|
#define ALL 0xFFFFFFFF
|
|
|
|
#define VALID 1
|
|
|
|
#define VALID_0 (VALID << 0)
|
|
|
|
#define VALID_1 (VALID << 8)
|
|
|
|
#define VALID_2 (VALID << 16)
|
|
|
|
#define VALID_3 (VALID << 24)
|
|
|
|
#define VALID_01 (VALID_0 | VALID_1)
|
|
|
|
#define VALID_012 (VALID_0 | VALID_1 | VALID_2)
|
|
|
|
#define VALID_ALL (VALID_0 | VALID_1 | VALID_2 | VALID_3)
|
|
|
|
#define INV_VALID_ALL (ALL ^ VALID_ALL)
|
|
|
|
|
2023-09-03 04:30:26 +00:00
|
|
|
struct PGXP_value
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
float x;
|
|
|
|
float y;
|
|
|
|
float z;
|
|
|
|
union
|
|
|
|
{
|
2023-09-03 04:30:26 +00:00
|
|
|
u32 flags;
|
|
|
|
u8 compFlags[4];
|
|
|
|
u16 halfFlags[2];
|
2020-08-01 14:25:07 +00:00
|
|
|
};
|
2023-09-03 04:30:26 +00:00
|
|
|
u32 value;
|
|
|
|
};
|
2020-08-01 14:25:07 +00:00
|
|
|
|
|
|
|
typedef union
|
|
|
|
{
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
u8 l, h, h2, h3;
|
|
|
|
} b;
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
u16 l, h;
|
|
|
|
} w;
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
s8 l, h, h2, h3;
|
|
|
|
} sb;
|
|
|
|
struct
|
|
|
|
{
|
|
|
|
s16 l, h;
|
|
|
|
} sw;
|
|
|
|
u32 d;
|
|
|
|
s32 sd;
|
|
|
|
} psx_value;
|
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
static void PGXP_CacheVertex(s16 sx, s16 sy, const PGXP_value& vertex);
|
2020-08-01 14:25:07 +00:00
|
|
|
|
2020-08-19 13:26:57 +00:00
|
|
|
static void MakeValid(PGXP_value* pV, u32 psxV);
|
2020-08-01 14:25:07 +00:00
|
|
|
static void Validate(PGXP_value* pV, u32 psxV);
|
|
|
|
static void MaskValidate(PGXP_value* pV, u32 psxV, u32 mask, u32 validMask);
|
|
|
|
|
2020-08-19 13:26:57 +00:00
|
|
|
static double f16Sign(double in);
|
|
|
|
static double f16Unsign(double in);
|
|
|
|
static double f16Overflow(double in);
|
|
|
|
|
2020-08-01 14:25:07 +00:00
|
|
|
static PGXP_value* GetPtr(u32 addr);
|
|
|
|
static PGXP_value* ReadMem(u32 addr);
|
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
static const PGXP_value PGXP_value_invalid = {0.f, 0.f, 0.f, {0}, 0};
|
|
|
|
static const PGXP_value PGXP_value_zero = {0.f, 0.f, 0.f, {VALID_ALL}, 0};
|
2020-08-01 14:25:07 +00:00
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
static PGXP_value CPU_reg[34];
|
|
|
|
static PGXP_value CP0_reg[32];
|
|
|
|
#define CPU_Hi CPU_reg[32]
|
|
|
|
#define CPU_Lo CPU_reg[33]
|
2020-08-01 14:25:07 +00:00
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
// GTE registers
|
2023-08-15 13:12:21 +00:00
|
|
|
static PGXP_value GTE_regs[64];
|
2020-09-02 12:44:52 +00:00
|
|
|
|
|
|
|
static PGXP_value* Mem = nullptr;
|
|
|
|
static PGXP_value* vertexCache = nullptr;
|
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
ALWAYS_INLINE_RELEASE void MakeValid(PGXP_value* pV, u32 psxV)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
if (VALID_01 != (pV->flags & VALID_01))
|
|
|
|
{
|
2021-06-12 12:02:28 +00:00
|
|
|
pV->x = static_cast<float>(static_cast<s16>(Truncate16(psxV)));
|
|
|
|
pV->y = static_cast<float>(static_cast<s16>(Truncate16(psxV >> 16)));
|
2020-08-19 13:26:57 +00:00
|
|
|
pV->z = 0.f;
|
|
|
|
pV->flags |= VALID_01;
|
2021-06-12 12:02:28 +00:00
|
|
|
pV->value = psxV;
|
2020-08-19 13:26:57 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
ALWAYS_INLINE_RELEASE void Validate(PGXP_value* pV, u32 psxV)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
// assume pV is not NULL
|
|
|
|
pV->flags &= (pV->value == psxV) ? ALL : INV_VALID_ALL;
|
|
|
|
}
|
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
ALWAYS_INLINE_RELEASE void MaskValidate(PGXP_value* pV, u32 psxV, u32 mask, u32 validMask)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
// assume pV is not NULL
|
|
|
|
pV->flags &= ((pV->value & mask) == (psxV & mask)) ? ALL : (ALL ^ (validMask));
|
|
|
|
}
|
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
ALWAYS_INLINE_RELEASE double f16Sign(double in)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
2023-10-31 15:32:29 +00:00
|
|
|
const s32 s = static_cast<s32>(static_cast<u64>(in * (USHRT_MAX + 1)));
|
|
|
|
return static_cast<double>(s) / static_cast<double>(USHRT_MAX + 1);
|
2020-08-19 13:26:57 +00:00
|
|
|
}
|
2021-06-12 12:02:28 +00:00
|
|
|
ALWAYS_INLINE_RELEASE double f16Unsign(double in)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
2023-10-31 15:32:29 +00:00
|
|
|
return (in >= 0) ? in : (in + (USHRT_MAX + 1));
|
2020-08-19 13:26:57 +00:00
|
|
|
}
|
2021-06-12 12:02:28 +00:00
|
|
|
ALWAYS_INLINE_RELEASE double f16Overflow(double in)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
double out = 0;
|
|
|
|
s64 v = ((s64)in) >> 16;
|
|
|
|
out = (double)v;
|
|
|
|
return out;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:41:10 +00:00
|
|
|
ALWAYS_INLINE_RELEASE PGXP_value* GetPtr(u32 addr)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
2023-11-06 08:09:27 +00:00
|
|
|
if ((addr & CPU::SCRATCHPAD_ADDR_MASK) == CPU::SCRATCHPAD_ADDR)
|
|
|
|
return &Mem[PGXP_MEM_SCRATCH_OFFSET + ((addr & CPU::SCRATCHPAD_OFFSET_MASK) >> 2)];
|
2020-08-01 14:25:07 +00:00
|
|
|
|
2021-05-25 10:01:00 +00:00
|
|
|
const u32 paddr = (addr & CPU::PHYSICAL_MEMORY_ADDRESS_MASK);
|
|
|
|
if (paddr < Bus::RAM_MIRROR_END)
|
2021-08-22 14:17:51 +00:00
|
|
|
return &Mem[(paddr & Bus::g_ram_mask) >> 2];
|
2021-05-25 10:01:00 +00:00
|
|
|
else
|
|
|
|
return nullptr;
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2021-02-17 15:41:10 +00:00
|
|
|
ALWAYS_INLINE_RELEASE PGXP_value* ReadMem(u32 addr)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
return GetPtr(addr);
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:41:10 +00:00
|
|
|
ALWAYS_INLINE_RELEASE void ValidateAndCopyMem(PGXP_value* dest, u32 addr, u32 value)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
PGXP_value* pMem = GetPtr(addr);
|
2023-11-04 10:03:45 +00:00
|
|
|
if (pMem)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
Validate(pMem, value);
|
|
|
|
*dest = *pMem;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
*dest = PGXP_value_invalid;
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2023-09-03 04:30:26 +00:00
|
|
|
ALWAYS_INLINE_RELEASE static void ValidateAndCopyMem16(PGXP_value* dest, u32 addr, u32 value, bool sign)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
u32 validMask = 0;
|
|
|
|
psx_value val, mask;
|
|
|
|
PGXP_value* pMem = GetPtr(addr);
|
2023-11-04 10:03:45 +00:00
|
|
|
if (pMem)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
mask.d = val.d = 0;
|
|
|
|
// determine if high or low word
|
|
|
|
if ((addr % 4) == 2)
|
|
|
|
{
|
|
|
|
val.w.h = static_cast<u16>(value);
|
|
|
|
mask.w.h = 0xFFFF;
|
|
|
|
validMask = VALID_1;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
val.w.l = static_cast<u16>(value);
|
|
|
|
mask.w.l = 0xFFFF;
|
|
|
|
validMask = VALID_0;
|
|
|
|
}
|
|
|
|
|
|
|
|
// validate and copy whole value
|
|
|
|
MaskValidate(pMem, val.d, mask.d, validMask);
|
|
|
|
*dest = *pMem;
|
|
|
|
|
|
|
|
// if high word then shift
|
|
|
|
if ((addr % 4) == 2)
|
|
|
|
{
|
|
|
|
dest->x = dest->y;
|
|
|
|
dest->compFlags[0] = dest->compFlags[1];
|
|
|
|
}
|
|
|
|
|
|
|
|
// truncate value
|
|
|
|
dest->y = (dest->x < 0) ? -1.f * sign : 0.f; // 0.f;
|
|
|
|
dest->value = value;
|
|
|
|
dest->compFlags[1] = VALID; // iCB: High word is valid, just 0
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
*dest = PGXP_value_invalid;
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
ALWAYS_INLINE_RELEASE void WriteMem(const PGXP_value* value, u32 addr)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
PGXP_value* pMem = GetPtr(addr);
|
|
|
|
|
|
|
|
if (pMem)
|
|
|
|
*pMem = *value;
|
|
|
|
}
|
|
|
|
|
2021-06-24 06:52:38 +00:00
|
|
|
ALWAYS_INLINE_RELEASE static void WriteMem16(const PGXP_value* src, u32 addr)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
PGXP_value* dest = GetPtr(addr);
|
2023-11-04 10:03:45 +00:00
|
|
|
psx_value* pVal = nullptr;
|
2020-08-01 14:25:07 +00:00
|
|
|
|
|
|
|
if (dest)
|
|
|
|
{
|
|
|
|
pVal = (psx_value*)&dest->value;
|
|
|
|
// determine if high or low word
|
|
|
|
if ((addr % 4) == 2)
|
|
|
|
{
|
|
|
|
dest->y = src->x;
|
|
|
|
dest->compFlags[1] = src->compFlags[0];
|
|
|
|
pVal->w.h = (u16)src->value;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
dest->x = src->x;
|
|
|
|
dest->compFlags[0] = src->compFlags[0];
|
|
|
|
pVal->w.l = (u16)src->value;
|
|
|
|
}
|
|
|
|
|
|
|
|
// overwrite z/w if valid
|
|
|
|
if (src->compFlags[2] == VALID)
|
|
|
|
{
|
|
|
|
dest->z = src->z;
|
|
|
|
dest->compFlags[2] = src->compFlags[2];
|
|
|
|
}
|
|
|
|
|
|
|
|
// dest->valid = dest->valid && src->valid;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void Initialize()
|
|
|
|
{
|
2021-06-12 12:02:28 +00:00
|
|
|
std::memset(CPU_reg, 0, sizeof(CPU_reg));
|
|
|
|
std::memset(CP0_reg, 0, sizeof(CP0_reg));
|
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
std::memset(GTE_regs, 0, sizeof(GTE_regs));
|
2021-06-12 12:02:28 +00:00
|
|
|
|
|
|
|
if (!Mem)
|
|
|
|
{
|
|
|
|
Mem = static_cast<PGXP_value*>(std::calloc(PGXP_MEM_SIZE, sizeof(PGXP_value)));
|
|
|
|
if (!Mem)
|
|
|
|
{
|
|
|
|
std::fprintf(stderr, "Failed to allocate PGXP memory\n");
|
|
|
|
std::abort();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (g_settings.gpu_pgxp_vertex_cache && !vertexCache)
|
|
|
|
{
|
|
|
|
vertexCache = static_cast<PGXP_value*>(std::calloc(VERTEX_CACHE_SIZE, sizeof(PGXP_value)));
|
|
|
|
if (!vertexCache)
|
|
|
|
{
|
|
|
|
Log_ErrorPrint("Failed to allocate memory for vertex cache, disabling.");
|
|
|
|
g_settings.gpu_pgxp_vertex_cache = false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (vertexCache)
|
|
|
|
std::memset(vertexCache, 0, sizeof(PGXP_value) * VERTEX_CACHE_SIZE);
|
|
|
|
}
|
|
|
|
|
|
|
|
void Reset()
|
|
|
|
{
|
|
|
|
std::memset(CPU_reg, 0, sizeof(CPU_reg));
|
|
|
|
std::memset(CP0_reg, 0, sizeof(CP0_reg));
|
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
std::memset(GTE_regs, 0, sizeof(GTE_regs));
|
2021-06-12 12:02:28 +00:00
|
|
|
|
|
|
|
if (Mem)
|
|
|
|
std::memset(Mem, 0, sizeof(PGXP_value) * PGXP_MEM_SIZE);
|
2021-06-12 10:44:09 +00:00
|
|
|
|
|
|
|
if (vertexCache)
|
|
|
|
std::memset(vertexCache, 0, sizeof(PGXP_value) * VERTEX_CACHE_SIZE);
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2020-09-02 12:44:52 +00:00
|
|
|
void Shutdown()
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
2020-09-02 12:44:52 +00:00
|
|
|
if (vertexCache)
|
|
|
|
{
|
|
|
|
std::free(vertexCache);
|
|
|
|
vertexCache = nullptr;
|
|
|
|
}
|
|
|
|
if (Mem)
|
|
|
|
{
|
|
|
|
std::free(Mem);
|
|
|
|
Mem = nullptr;
|
|
|
|
}
|
2020-08-01 14:25:07 +00:00
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
std::memset(GTE_regs, 0, sizeof(GTE_regs));
|
2020-08-01 14:25:07 +00:00
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
std::memset(CPU_reg, 0, sizeof(CPU_reg));
|
|
|
|
std::memset(CP0_reg, 0, sizeof(CP0_reg));
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Instruction register decoding
|
2023-09-03 04:30:26 +00:00
|
|
|
#define op(_instr) (_instr >> 26) // The op part of the instruction register
|
|
|
|
#define func(_instr) ((_instr)&0x3F) // The funct part of the instruction register
|
|
|
|
#define sa(_instr) ((_instr >> 6) & 0x1F) // The sa part of the instruction register
|
2020-08-01 14:25:07 +00:00
|
|
|
#define rd(_instr) ((_instr >> 11) & 0x1F) // The rd part of the instruction register
|
|
|
|
#define rt(_instr) ((_instr >> 16) & 0x1F) // The rt part of the instruction register
|
|
|
|
#define rs(_instr) ((_instr >> 21) & 0x1F) // The rs part of the instruction register
|
2023-09-03 04:30:26 +00:00
|
|
|
#define imm(_instr) (_instr & 0xFFFF) // The immediate part of the instruction register
|
2023-08-15 13:12:21 +00:00
|
|
|
#define cop2idx(_instr) (((_instr >> 11) & 0x1F) | ((_instr >> 17) & 0x20))
|
2020-08-01 14:25:07 +00:00
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
#define SX0 (GTE_regs[12].x)
|
|
|
|
#define SY0 (GTE_regs[12].y)
|
|
|
|
#define SX1 (GTE_regs[13].x)
|
|
|
|
#define SY1 (GTE_regs[13].y)
|
|
|
|
#define SX2 (GTE_regs[14].x)
|
|
|
|
#define SY2 (GTE_regs[14].y)
|
2020-08-01 14:25:07 +00:00
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
#define SXY0 (GTE_regs[12])
|
|
|
|
#define SXY1 (GTE_regs[13])
|
|
|
|
#define SXY2 (GTE_regs[14])
|
|
|
|
#define SXYP (GTE_regs[15])
|
2020-08-01 14:25:07 +00:00
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
void GTE_PushSXYZ2f(float x, float y, float z, u32 v)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
// push values down FIFO
|
|
|
|
SXY0 = SXY1;
|
|
|
|
SXY1 = SXY2;
|
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
SXY2.x = x;
|
|
|
|
SXY2.y = y;
|
|
|
|
SXY2.z = z;
|
|
|
|
SXY2.value = v;
|
2020-08-01 14:25:07 +00:00
|
|
|
SXY2.flags = VALID_ALL;
|
|
|
|
|
|
|
|
if (g_settings.gpu_pgxp_vertex_cache)
|
2021-06-12 12:02:28 +00:00
|
|
|
PGXP_CacheVertex(static_cast<s16>(Truncate16(v)), static_cast<s16>(Truncate16(v >> 16)), SXY2);
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
#define VX(n) (psxRegs.CP2D.p[n << 1].sw.l)
|
|
|
|
#define VY(n) (psxRegs.CP2D.p[n << 1].sw.h)
|
|
|
|
#define VZ(n) (psxRegs.CP2D.p[(n << 1) + 1].sw.l)
|
|
|
|
|
|
|
|
int GTE_NCLIP_valid(u32 sxy0, u32 sxy1, u32 sxy2)
|
|
|
|
{
|
|
|
|
Validate(&SXY0, sxy0);
|
|
|
|
Validate(&SXY1, sxy1);
|
|
|
|
Validate(&SXY2, sxy2);
|
|
|
|
if (((SXY0.flags & SXY1.flags & SXY2.flags & VALID_01) == VALID_01)) // && Config.PGXP_GTE && (Config.PGXP_Mode > 0))
|
|
|
|
return 1;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
float GTE_NCLIP()
|
|
|
|
{
|
|
|
|
float nclip = ((SX0 * SY1) + (SX1 * SY2) + (SX2 * SY0) - (SX0 * SY2) - (SX1 * SY0) - (SX2 * SY1));
|
|
|
|
|
|
|
|
// ensure fractional values are not incorrectly rounded to 0
|
|
|
|
float nclipAbs = std::abs(nclip);
|
|
|
|
if ((0.1f < nclipAbs) && (nclipAbs < 1.f))
|
|
|
|
nclip += (nclip < 0.f ? -1 : 1);
|
|
|
|
|
|
|
|
// float AX = SX1 - SX0;
|
|
|
|
// float AY = SY1 - SY0;
|
|
|
|
|
|
|
|
// float BX = SX2 - SX0;
|
|
|
|
// float BY = SY2 - SY0;
|
|
|
|
|
|
|
|
//// normalise A and B
|
|
|
|
// float mA = sqrt((AX*AX) + (AY*AY));
|
|
|
|
// float mB = sqrt((BX*BX) + (BY*BY));
|
|
|
|
|
|
|
|
//// calculate AxB to get Z component of C
|
|
|
|
// float CZ = ((AX * BY) - (AY * BX)) * (1 << 12);
|
|
|
|
|
|
|
|
return nclip;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void PGXP_MTC2_int(PGXP_value value, u32 reg)
|
|
|
|
{
|
|
|
|
switch (reg)
|
|
|
|
{
|
|
|
|
case 15:
|
|
|
|
// push FIFO
|
|
|
|
SXY0 = SXY1;
|
|
|
|
SXY1 = SXY2;
|
|
|
|
SXY2 = value;
|
|
|
|
SXYP = SXY2;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 31:
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
GTE_regs[reg] = value;
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
////////////////////////////////////
|
|
|
|
// Data transfer tracking
|
|
|
|
////////////////////////////////////
|
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
void CPU_MFC2(u32 instr, u32 rdVal)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
// CPU[Rt] = GTE_D[Rd]
|
2023-08-15 13:12:21 +00:00
|
|
|
const u32 idx = cop2idx(instr);
|
|
|
|
Validate(>E_regs[idx], rdVal);
|
|
|
|
CPU_reg[rt(instr)] = GTE_regs[idx];
|
|
|
|
CPU_reg[rt(instr)].value = rdVal;
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
void CPU_MTC2(u32 instr, u32 rtVal)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
// GTE_D[Rd] = CPU[Rt]
|
2023-08-15 13:12:21 +00:00
|
|
|
const u32 idx = cop2idx(instr);
|
2020-08-01 14:25:07 +00:00
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
2023-08-15 13:12:21 +00:00
|
|
|
PGXP_MTC2_int(CPU_reg[rt(instr)], idx);
|
|
|
|
GTE_regs[idx].value = rtVal;
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
////////////////////////////////////
|
|
|
|
// Memory Access
|
|
|
|
////////////////////////////////////
|
2023-08-15 13:12:21 +00:00
|
|
|
void CPU_LWC2(u32 instr, u32 addr, u32 rtVal)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
// GTE_D[Rt] = Mem[addr]
|
|
|
|
PGXP_value val;
|
|
|
|
ValidateAndCopyMem(&val, addr, rtVal);
|
|
|
|
PGXP_MTC2_int(val, rt(instr));
|
|
|
|
}
|
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
void CPU_SWC2(u32 instr, u32 addr, u32 rtVal)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
// Mem[addr] = GTE_D[Rt]
|
2023-08-15 13:12:21 +00:00
|
|
|
Validate(>E_regs[rt(instr)], rtVal);
|
|
|
|
WriteMem(>E_regs[rt(instr)], addr);
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
ALWAYS_INLINE_RELEASE void PGXP_CacheVertex(s16 sx, s16 sy, const PGXP_value& vertex)
|
2020-09-02 12:44:52 +00:00
|
|
|
{
|
2021-06-12 12:02:28 +00:00
|
|
|
if (sx >= -0x800 && sx <= 0x7ff && sy >= -0x800 && sy <= 0x7ff)
|
2020-09-02 12:44:52 +00:00
|
|
|
{
|
2021-06-12 12:02:28 +00:00
|
|
|
// Write vertex into cache
|
|
|
|
vertexCache[(sy + 0x800) * VERTEX_CACHE_WIDTH + (sx + 0x800)] = vertex;
|
2020-09-02 12:44:52 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-12 12:02:28 +00:00
|
|
|
static ALWAYS_INLINE_RELEASE PGXP_value* PGXP_GetCachedVertex(short sx, short sy)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
2021-06-12 12:02:28 +00:00
|
|
|
if (sx >= -0x800 && sx <= 0x7ff && sy >= -0x800 && sy <= 0x7ff)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
2021-06-12 12:02:28 +00:00
|
|
|
// Return pointer to cache entry
|
|
|
|
return &vertexCache[(sy + 0x800) * VERTEX_CACHE_WIDTH + (sx + 0x800)];
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2021-06-12 10:44:09 +00:00
|
|
|
return nullptr;
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2020-11-26 14:02:13 +00:00
|
|
|
static ALWAYS_INLINE_RELEASE float TruncateVertexPosition(float p)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
const s32 int_part = static_cast<s32>(p);
|
|
|
|
const float int_part_f = static_cast<float>(int_part);
|
|
|
|
return static_cast<float>(static_cast<s16>(int_part << 5) >> 5) + (p - int_part_f);
|
|
|
|
}
|
|
|
|
|
2020-11-26 14:02:13 +00:00
|
|
|
static ALWAYS_INLINE_RELEASE bool IsWithinTolerance(float precise_x, float precise_y, int int_x, int int_y)
|
|
|
|
{
|
|
|
|
const float tolerance = g_settings.gpu_pgxp_tolerance;
|
|
|
|
if (tolerance < 0.0f)
|
|
|
|
return true;
|
|
|
|
|
|
|
|
return (std::abs(precise_x - static_cast<float>(int_x)) <= tolerance &&
|
|
|
|
std::abs(precise_y - static_cast<float>(int_y)) <= tolerance);
|
|
|
|
}
|
|
|
|
|
2020-08-01 14:25:07 +00:00
|
|
|
bool GetPreciseVertex(u32 addr, u32 value, int x, int y, int xOffs, int yOffs, float* out_x, float* out_y, float* out_w)
|
|
|
|
{
|
|
|
|
const PGXP_value* vert = ReadMem(addr);
|
|
|
|
if (vert && ((vert->flags & VALID_01) == VALID_01) && (vert->value == value))
|
|
|
|
{
|
|
|
|
// There is a value here with valid X and Y coordinates
|
|
|
|
*out_x = TruncateVertexPosition(vert->x) + static_cast<float>(xOffs);
|
|
|
|
*out_y = TruncateVertexPosition(vert->y) + static_cast<float>(yOffs);
|
|
|
|
*out_w = vert->z / 32768.0f;
|
2021-06-12 12:02:28 +00:00
|
|
|
|
2020-11-26 14:02:13 +00:00
|
|
|
if (IsWithinTolerance(*out_x, *out_y, x, y))
|
|
|
|
{
|
|
|
|
// check validity of z component
|
|
|
|
return ((vert->flags & VALID_2) == VALID_2);
|
|
|
|
}
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
2021-06-12 12:02:28 +00:00
|
|
|
|
|
|
|
if (g_settings.gpu_pgxp_vertex_cache)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
const short psx_x = (short)(value & 0xFFFFu);
|
|
|
|
const short psx_y = (short)(value >> 16);
|
|
|
|
|
|
|
|
// Look in cache for valid vertex
|
|
|
|
vert = PGXP_GetCachedVertex(psx_x, psx_y);
|
2021-06-12 12:02:28 +00:00
|
|
|
if (vert && (vert->flags & VALID_01) == VALID_01)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
*out_x = TruncateVertexPosition(vert->x) + static_cast<float>(xOffs);
|
|
|
|
*out_y = TruncateVertexPosition(vert->y) + static_cast<float>(yOffs);
|
|
|
|
*out_w = vert->z / 32768.0f;
|
2020-11-26 14:02:13 +00:00
|
|
|
|
|
|
|
if (IsWithinTolerance(*out_x, *out_y, x, y))
|
2021-06-12 12:02:28 +00:00
|
|
|
return false;
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
}
|
2020-11-26 14:02:13 +00:00
|
|
|
|
|
|
|
// no valid value can be found anywhere, use the native PSX data
|
|
|
|
*out_x = static_cast<float>(x);
|
|
|
|
*out_y = static_cast<float>(y);
|
|
|
|
*out_w = 1.0f;
|
|
|
|
return false;
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Instruction register decoding
|
2023-09-03 04:30:26 +00:00
|
|
|
#define op(_instr) (_instr >> 26) // The op part of the instruction register
|
|
|
|
#define func(_instr) ((_instr)&0x3F) // The funct part of the instruction register
|
|
|
|
#define sa(_instr) ((_instr >> 6) & 0x1F) // The sa part of the instruction register
|
2020-08-01 14:25:07 +00:00
|
|
|
#define rd(_instr) ((_instr >> 11) & 0x1F) // The rd part of the instruction register
|
|
|
|
#define rt(_instr) ((_instr >> 16) & 0x1F) // The rt part of the instruction register
|
|
|
|
#define rs(_instr) ((_instr >> 21) & 0x1F) // The rs part of the instruction register
|
2023-09-03 04:30:26 +00:00
|
|
|
#define imm(_instr) (_instr & 0xFFFF) // The immediate part of the instruction register
|
2021-02-17 15:45:32 +00:00
|
|
|
#define imm_sext(_instr) \
|
|
|
|
static_cast<s32>(static_cast<s16>(_instr & 0xFFFF)) // The immediate part of the instruction register
|
2020-08-01 14:25:07 +00:00
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
void CPU_LW(u32 instr, u32 addr, u32 rtVal)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
// Rt = Mem[Rs + Im]
|
|
|
|
ValidateAndCopyMem(&CPU_reg[rt(instr)], addr, rtVal);
|
|
|
|
}
|
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
void CPU_LBx(u32 instr, u32 addr, u32 rtVal)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
2021-06-12 12:02:28 +00:00
|
|
|
CPU_reg[rt(instr)] = PGXP_value_invalid;
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2023-09-03 04:30:26 +00:00
|
|
|
void CPU_LH(u32 instr, u32 addr, u32 rtVal)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
2023-09-03 04:30:26 +00:00
|
|
|
// Rt = Mem[Rs + Im] (sign extended)
|
|
|
|
ValidateAndCopyMem16(&CPU_reg[rt(instr)], addr, rtVal, true);
|
|
|
|
}
|
|
|
|
|
|
|
|
void CPU_LHU(u32 instr, u32 addr, u32 rtVal)
|
|
|
|
{
|
|
|
|
// Rt = Mem[Rs + Im] (zero extended)
|
|
|
|
ValidateAndCopyMem16(&CPU_reg[rt(instr)], addr, rtVal, false);
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
void CPU_SB(u32 instr, u32 addr, u32 rtVal)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
2021-06-12 12:02:28 +00:00
|
|
|
WriteMem(&PGXP_value_invalid, addr);
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
void CPU_SH(u32 instr, u32 addr, u32 rtVal)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
2021-06-24 06:52:38 +00:00
|
|
|
PGXP_value* val = &CPU_reg[rt(instr)];
|
|
|
|
|
2020-08-01 14:25:07 +00:00
|
|
|
// validate and copy half value
|
2021-06-24 06:52:38 +00:00
|
|
|
MaskValidate(val, rtVal, 0xFFFF, VALID_0);
|
|
|
|
WriteMem16(val, addr);
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
void CPU_SW(u32 instr, u32 addr, u32 rtVal)
|
2020-08-01 14:25:07 +00:00
|
|
|
{
|
|
|
|
// Mem[Rs + Im] = Rt
|
2021-06-24 06:52:38 +00:00
|
|
|
PGXP_value* val = &CPU_reg[rt(instr)];
|
|
|
|
Validate(val, rtVal);
|
|
|
|
WriteMem(val, addr);
|
2020-08-01 14:25:07 +00:00
|
|
|
}
|
|
|
|
|
2020-10-04 12:13:33 +00:00
|
|
|
void CPU_MOVE(u32 rd_and_rs, u32 rsVal)
|
|
|
|
{
|
|
|
|
const u32 Rs = (rd_and_rs & 0xFFu);
|
|
|
|
Validate(&CPU_reg[Rs], rsVal);
|
|
|
|
CPU_reg[(rd_and_rs >> 8)] = CPU_reg[Rs];
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_ADDI(u32 instr, u32 rsVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rt = Rs + Imm (signed)
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
2023-10-31 15:32:29 +00:00
|
|
|
PGXP_value ret = CPU_reg[rs(instr)];
|
|
|
|
|
|
|
|
psx_value tempImm;
|
|
|
|
tempImm.d = SignExtend32(static_cast<u16>(imm(instr)));
|
2020-08-19 13:26:57 +00:00
|
|
|
|
2020-12-03 15:07:34 +00:00
|
|
|
if (tempImm.d != 0)
|
|
|
|
{
|
|
|
|
ret.x = (float)f16Unsign(ret.x);
|
|
|
|
ret.x += (float)tempImm.w.l;
|
2020-08-19 13:26:57 +00:00
|
|
|
|
2020-12-03 15:07:34 +00:00
|
|
|
// carry on over/underflow
|
|
|
|
float of = (ret.x > USHRT_MAX) ? 1.f : (ret.x < 0) ? -1.f : 0.f;
|
|
|
|
ret.x = (float)f16Sign(ret.x);
|
|
|
|
// ret.x -= of * (USHRT_MAX + 1);
|
|
|
|
ret.y += tempImm.sw.h + of;
|
2020-08-19 13:26:57 +00:00
|
|
|
|
2020-12-03 15:07:34 +00:00
|
|
|
// truncate on overflow/underflow
|
|
|
|
ret.y += (ret.y > SHRT_MAX) ? -(USHRT_MAX + 1) : (ret.y < SHRT_MIN) ? USHRT_MAX + 1 : 0.f;
|
|
|
|
}
|
2020-08-19 13:26:57 +00:00
|
|
|
|
|
|
|
CPU_reg[rt(instr)] = ret;
|
2021-02-17 15:45:32 +00:00
|
|
|
CPU_reg[rt(instr)].value = rsVal + imm_sext(instr);
|
2020-08-19 13:26:57 +00:00
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_ANDI(u32 instr, u32 rsVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rt = Rs & Imm
|
2021-02-17 15:45:32 +00:00
|
|
|
const u32 rtVal = rsVal & imm(instr);
|
2020-08-19 13:26:57 +00:00
|
|
|
psx_value vRt;
|
|
|
|
PGXP_value ret;
|
|
|
|
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
ret = CPU_reg[rs(instr)];
|
|
|
|
|
|
|
|
vRt.d = rtVal;
|
|
|
|
|
|
|
|
ret.y = 0.f; // remove upper 16-bits
|
|
|
|
|
|
|
|
switch (imm(instr))
|
|
|
|
{
|
|
|
|
case 0:
|
|
|
|
// if 0 then x == 0
|
|
|
|
ret.x = 0.f;
|
|
|
|
break;
|
|
|
|
case 0xFFFF:
|
|
|
|
// if saturated then x == x
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// otherwise x is low precision value
|
|
|
|
ret.x = vRt.sw.l;
|
|
|
|
ret.flags |= VALID_0;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret.flags |= VALID_1;
|
|
|
|
|
|
|
|
CPU_reg[rt(instr)] = ret;
|
|
|
|
CPU_reg[rt(instr)].value = rtVal;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_ORI(u32 instr, u32 rsVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rt = Rs | Imm
|
2021-02-17 15:45:32 +00:00
|
|
|
const u32 rtVal = rsVal | imm(instr);
|
2020-08-19 13:26:57 +00:00
|
|
|
psx_value vRt;
|
|
|
|
PGXP_value ret;
|
|
|
|
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
ret = CPU_reg[rs(instr)];
|
|
|
|
|
|
|
|
vRt.d = rtVal;
|
|
|
|
|
|
|
|
switch (imm(instr))
|
|
|
|
{
|
|
|
|
case 0:
|
|
|
|
// if 0 then x == x
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// otherwise x is low precision value
|
|
|
|
ret.x = vRt.sw.l;
|
|
|
|
ret.flags |= VALID_0;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret.value = rtVal;
|
|
|
|
CPU_reg[rt(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_XORI(u32 instr, u32 rsVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rt = Rs ^ Imm
|
2021-02-17 15:45:32 +00:00
|
|
|
const u32 rtVal = rsVal ^ imm(instr);
|
2020-08-19 13:26:57 +00:00
|
|
|
psx_value vRt;
|
|
|
|
PGXP_value ret;
|
|
|
|
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
ret = CPU_reg[rs(instr)];
|
|
|
|
|
|
|
|
vRt.d = rtVal;
|
|
|
|
|
|
|
|
switch (imm(instr))
|
|
|
|
{
|
|
|
|
case 0:
|
|
|
|
// if 0 then x == x
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
// otherwise x is low precision value
|
|
|
|
ret.x = vRt.sw.l;
|
|
|
|
ret.flags |= VALID_0;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret.value = rtVal;
|
|
|
|
CPU_reg[rt(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_SLTI(u32 instr, u32 rsVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rt = Rs < Imm (signed)
|
|
|
|
psx_value tempImm;
|
|
|
|
PGXP_value ret;
|
|
|
|
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
ret = CPU_reg[rs(instr)];
|
|
|
|
|
|
|
|
tempImm.w.h = imm(instr);
|
|
|
|
ret.y = 0.f;
|
|
|
|
ret.x = (CPU_reg[rs(instr)].x < tempImm.sw.h) ? 1.f : 0.f;
|
|
|
|
ret.flags |= VALID_1;
|
2021-02-17 15:45:32 +00:00
|
|
|
ret.value = BoolToUInt32(static_cast<s32>(rsVal) < imm_sext(instr));
|
2020-08-19 13:26:57 +00:00
|
|
|
|
|
|
|
CPU_reg[rt(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_SLTIU(u32 instr, u32 rsVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rt = Rs < Imm (Unsigned)
|
|
|
|
psx_value tempImm;
|
|
|
|
PGXP_value ret;
|
|
|
|
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
ret = CPU_reg[rs(instr)];
|
|
|
|
|
|
|
|
tempImm.w.h = imm(instr);
|
|
|
|
ret.y = 0.f;
|
|
|
|
ret.x = (f16Unsign(CPU_reg[rs(instr)].x) < tempImm.w.h) ? 1.f : 0.f;
|
|
|
|
ret.flags |= VALID_1;
|
2021-02-17 15:45:32 +00:00
|
|
|
ret.value = BoolToUInt32(rsVal < imm(instr));
|
2020-08-19 13:26:57 +00:00
|
|
|
|
|
|
|
CPU_reg[rt(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
////////////////////////////////////
|
|
|
|
// Load Upper
|
|
|
|
////////////////////////////////////
|
2021-02-17 14:47:38 +00:00
|
|
|
void CPU_LUI(u32 instr)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rt = Imm << 16
|
|
|
|
CPU_reg[rt(instr)] = PGXP_value_zero;
|
|
|
|
CPU_reg[rt(instr)].y = (float)(s16)imm(instr);
|
2021-02-17 14:47:38 +00:00
|
|
|
CPU_reg[rt(instr)].value = static_cast<u32>(imm(instr)) << 16;
|
2020-08-19 13:26:57 +00:00
|
|
|
CPU_reg[rt(instr)].flags = VALID_01;
|
|
|
|
}
|
|
|
|
|
|
|
|
////////////////////////////////////
|
|
|
|
// Register Arithmetic
|
|
|
|
////////////////////////////////////
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_ADD(u32 instr, u32 rsVal, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rs + Rt (signed)
|
|
|
|
PGXP_value ret;
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
|
2023-09-03 04:30:26 +00:00
|
|
|
if (rtVal == 0)
|
|
|
|
{
|
|
|
|
ret = CPU_reg[rs(instr)];
|
|
|
|
}
|
|
|
|
else if (rsVal == 0)
|
|
|
|
{
|
|
|
|
ret = CPU_reg[rt(instr)];
|
|
|
|
}
|
|
|
|
else
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
2020-12-03 15:07:34 +00:00
|
|
|
// iCB: Only require one valid input
|
|
|
|
if (((CPU_reg[rt(instr)].flags & VALID_01) != VALID_01) != ((CPU_reg[rs(instr)].flags & VALID_01) != VALID_01))
|
|
|
|
{
|
|
|
|
MakeValid(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
MakeValid(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
}
|
2020-08-19 13:26:57 +00:00
|
|
|
|
2020-12-03 15:07:34 +00:00
|
|
|
ret = CPU_reg[rs(instr)];
|
2020-08-19 13:26:57 +00:00
|
|
|
|
2020-12-03 15:07:34 +00:00
|
|
|
ret.x = (float)f16Unsign(ret.x);
|
|
|
|
ret.x += (float)f16Unsign(CPU_reg[rt(instr)].x);
|
2020-08-19 13:26:57 +00:00
|
|
|
|
2020-12-03 15:07:34 +00:00
|
|
|
// carry on over/underflow
|
|
|
|
float of = (ret.x > USHRT_MAX) ? 1.f : (ret.x < 0) ? -1.f : 0.f;
|
|
|
|
ret.x = (float)f16Sign(ret.x);
|
|
|
|
// ret.x -= of * (USHRT_MAX + 1);
|
|
|
|
ret.y += CPU_reg[rt(instr)].y + of;
|
2020-08-19 13:26:57 +00:00
|
|
|
|
2020-12-03 15:07:34 +00:00
|
|
|
// truncate on overflow/underflow
|
|
|
|
ret.y += (ret.y > SHRT_MAX) ? -(USHRT_MAX + 1) : (ret.y < SHRT_MIN) ? USHRT_MAX + 1 : 0.f;
|
2020-08-19 13:26:57 +00:00
|
|
|
|
2020-12-03 15:07:34 +00:00
|
|
|
// TODO: decide which "z/w" component to use
|
2020-08-19 13:26:57 +00:00
|
|
|
|
2020-12-03 15:07:34 +00:00
|
|
|
ret.halfFlags[0] &= CPU_reg[rt(instr)].halfFlags[0];
|
|
|
|
}
|
2020-08-19 13:26:57 +00:00
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
ret.value = rsVal + rtVal;
|
2020-08-19 13:26:57 +00:00
|
|
|
|
|
|
|
CPU_reg[rd(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_SUB(u32 instr, u32 rsVal, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rs - Rt (signed)
|
|
|
|
PGXP_value ret;
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
|
|
|
|
// iCB: Only require one valid input
|
|
|
|
if (((CPU_reg[rt(instr)].flags & VALID_01) != VALID_01) != ((CPU_reg[rs(instr)].flags & VALID_01) != VALID_01))
|
|
|
|
{
|
|
|
|
MakeValid(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
MakeValid(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = CPU_reg[rs(instr)];
|
|
|
|
|
|
|
|
ret.x = (float)f16Unsign(ret.x);
|
|
|
|
ret.x -= (float)f16Unsign(CPU_reg[rt(instr)].x);
|
|
|
|
|
|
|
|
// carry on over/underflow
|
|
|
|
float of = (ret.x > USHRT_MAX) ? 1.f : (ret.x < 0) ? -1.f : 0.f;
|
|
|
|
ret.x = (float)f16Sign(ret.x);
|
|
|
|
// ret.x -= of * (USHRT_MAX + 1);
|
|
|
|
ret.y -= CPU_reg[rt(instr)].y - of;
|
|
|
|
|
|
|
|
// truncate on overflow/underflow
|
|
|
|
ret.y += (ret.y > SHRT_MAX) ? -(USHRT_MAX + 1) : (ret.y < SHRT_MIN) ? USHRT_MAX + 1 : 0.f;
|
|
|
|
|
|
|
|
ret.halfFlags[0] &= CPU_reg[rt(instr)].halfFlags[0];
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
ret.value = rsVal - rtVal;
|
2020-08-19 13:26:57 +00:00
|
|
|
|
|
|
|
CPU_reg[rd(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
static void CPU_BITWISE(u32 instr, u32 rdVal, u32 rsVal, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rs & Rt
|
|
|
|
psx_value vald, vals, valt;
|
|
|
|
PGXP_value ret;
|
|
|
|
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
|
|
|
|
// iCB: Only require one valid input
|
|
|
|
if (((CPU_reg[rt(instr)].flags & VALID_01) != VALID_01) != ((CPU_reg[rs(instr)].flags & VALID_01) != VALID_01))
|
|
|
|
{
|
|
|
|
MakeValid(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
MakeValid(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
}
|
|
|
|
|
|
|
|
vald.d = rdVal;
|
|
|
|
vals.d = rsVal;
|
|
|
|
valt.d = rtVal;
|
|
|
|
|
|
|
|
// CPU_reg[rd(instr)].valid = CPU_reg[rs(instr)].valid && CPU_reg[rt(instr)].valid;
|
|
|
|
ret.flags = VALID_01;
|
|
|
|
|
|
|
|
if (vald.w.l == 0)
|
|
|
|
{
|
|
|
|
ret.x = 0.f;
|
|
|
|
}
|
|
|
|
else if (vald.w.l == vals.w.l)
|
|
|
|
{
|
|
|
|
ret.x = CPU_reg[rs(instr)].x;
|
|
|
|
ret.compFlags[0] = CPU_reg[rs(instr)].compFlags[0];
|
|
|
|
}
|
|
|
|
else if (vald.w.l == valt.w.l)
|
|
|
|
{
|
|
|
|
ret.x = CPU_reg[rt(instr)].x;
|
|
|
|
ret.compFlags[0] = CPU_reg[rt(instr)].compFlags[0];
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
ret.x = (float)vald.sw.l;
|
|
|
|
ret.compFlags[0] = VALID;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (vald.w.h == 0)
|
|
|
|
{
|
|
|
|
ret.y = 0.f;
|
|
|
|
}
|
|
|
|
else if (vald.w.h == vals.w.h)
|
|
|
|
{
|
|
|
|
ret.y = CPU_reg[rs(instr)].y;
|
|
|
|
ret.compFlags[1] &= CPU_reg[rs(instr)].compFlags[1];
|
|
|
|
}
|
|
|
|
else if (vald.w.h == valt.w.h)
|
|
|
|
{
|
|
|
|
ret.y = CPU_reg[rt(instr)].y;
|
|
|
|
ret.compFlags[1] &= CPU_reg[rt(instr)].compFlags[1];
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
ret.y = (float)vald.sw.h;
|
|
|
|
ret.compFlags[1] = VALID;
|
|
|
|
}
|
|
|
|
|
|
|
|
// iCB Hack: Force validity if even one half is valid
|
|
|
|
// if ((ret.hFlags & VALID_HALF) || (ret.lFlags & VALID_HALF))
|
|
|
|
// ret.valid = 1;
|
|
|
|
// /iCB Hack
|
|
|
|
|
|
|
|
// Get a valid W
|
|
|
|
if ((CPU_reg[rs(instr)].flags & VALID_2) == VALID_2)
|
|
|
|
{
|
|
|
|
ret.z = CPU_reg[rs(instr)].z;
|
|
|
|
ret.compFlags[2] = CPU_reg[rs(instr)].compFlags[2];
|
|
|
|
}
|
|
|
|
else if ((CPU_reg[rt(instr)].flags & VALID_2) == VALID_2)
|
|
|
|
{
|
|
|
|
ret.z = CPU_reg[rt(instr)].z;
|
|
|
|
ret.compFlags[2] = CPU_reg[rt(instr)].compFlags[2];
|
|
|
|
}
|
2023-10-31 15:32:29 +00:00
|
|
|
else
|
|
|
|
{
|
|
|
|
ret.z = 0.0f;
|
|
|
|
ret.compFlags[2] = 0;
|
|
|
|
}
|
2020-08-19 13:26:57 +00:00
|
|
|
|
|
|
|
ret.value = rdVal;
|
|
|
|
CPU_reg[rd(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_AND_(u32 instr, u32 rsVal, u32 rtVal)
|
|
|
|
{
|
|
|
|
// Rd = Rs & Rt
|
|
|
|
const u32 rdVal = rsVal & rtVal;
|
|
|
|
CPU_BITWISE(instr, rdVal, rsVal, rtVal);
|
|
|
|
}
|
|
|
|
|
|
|
|
void CPU_OR_(u32 instr, u32 rsVal, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rs | Rt
|
2021-02-17 15:45:32 +00:00
|
|
|
const u32 rdVal = rsVal | rtVal;
|
|
|
|
CPU_BITWISE(instr, rdVal, rsVal, rtVal);
|
2020-08-19 13:26:57 +00:00
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_XOR_(u32 instr, u32 rsVal, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rs ^ Rt
|
2021-02-17 15:45:32 +00:00
|
|
|
const u32 rdVal = rsVal ^ rtVal;
|
|
|
|
CPU_BITWISE(instr, rdVal, rsVal, rtVal);
|
2020-08-19 13:26:57 +00:00
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_NOR(u32 instr, u32 rsVal, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rs NOR Rt
|
2021-02-17 15:45:32 +00:00
|
|
|
const u32 rdVal = ~(rsVal | rtVal);
|
|
|
|
CPU_BITWISE(instr, rdVal, rsVal, rtVal);
|
2020-08-19 13:26:57 +00:00
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_SLT(u32 instr, u32 rsVal, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rs < Rt (signed)
|
|
|
|
PGXP_value ret;
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
|
|
|
|
// iCB: Only require one valid input
|
|
|
|
if (((CPU_reg[rt(instr)].flags & VALID_01) != VALID_01) != ((CPU_reg[rs(instr)].flags & VALID_01) != VALID_01))
|
|
|
|
{
|
|
|
|
MakeValid(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
MakeValid(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = CPU_reg[rs(instr)];
|
|
|
|
ret.y = 0.f;
|
|
|
|
ret.compFlags[1] = VALID;
|
|
|
|
|
2021-05-25 10:01:00 +00:00
|
|
|
ret.x = (CPU_reg[rs(instr)].y < CPU_reg[rt(instr)].y) ? 1.f :
|
|
|
|
(f16Unsign(CPU_reg[rs(instr)].x) < f16Unsign(CPU_reg[rt(instr)].x)) ? 1.f :
|
|
|
|
0.f;
|
2020-08-19 13:26:57 +00:00
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
ret.value = BoolToUInt32(static_cast<s32>(rsVal) < static_cast<s32>(rtVal));
|
2020-08-19 13:26:57 +00:00
|
|
|
CPU_reg[rd(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_SLTU(u32 instr, u32 rsVal, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rs < Rt (unsigned)
|
|
|
|
PGXP_value ret;
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
|
|
|
|
// iCB: Only require one valid input
|
|
|
|
if (((CPU_reg[rt(instr)].flags & VALID_01) != VALID_01) != ((CPU_reg[rs(instr)].flags & VALID_01) != VALID_01))
|
|
|
|
{
|
|
|
|
MakeValid(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
MakeValid(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = CPU_reg[rs(instr)];
|
|
|
|
ret.y = 0.f;
|
|
|
|
ret.compFlags[1] = VALID;
|
|
|
|
|
2021-05-25 10:01:00 +00:00
|
|
|
ret.x = (f16Unsign(CPU_reg[rs(instr)].y) < f16Unsign(CPU_reg[rt(instr)].y)) ? 1.f :
|
|
|
|
(f16Unsign(CPU_reg[rs(instr)].x) < f16Unsign(CPU_reg[rt(instr)].x)) ? 1.f :
|
|
|
|
0.f;
|
2020-08-19 13:26:57 +00:00
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
ret.value = BoolToUInt32(rsVal < rtVal);
|
2020-08-19 13:26:57 +00:00
|
|
|
CPU_reg[rd(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
////////////////////////////////////
|
|
|
|
// Register mult/div
|
|
|
|
////////////////////////////////////
|
|
|
|
|
2021-02-17 14:37:17 +00:00
|
|
|
void CPU_MULT(u32 instr, u32 rsVal, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Hi/Lo = Rs * Rt (signed)
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
|
|
|
|
// iCB: Only require one valid input
|
|
|
|
if (((CPU_reg[rt(instr)].flags & VALID_01) != VALID_01) != ((CPU_reg[rs(instr)].flags & VALID_01) != VALID_01))
|
|
|
|
{
|
|
|
|
MakeValid(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
MakeValid(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
}
|
|
|
|
|
|
|
|
CPU_Lo = CPU_Hi = CPU_reg[rs(instr)];
|
|
|
|
|
|
|
|
CPU_Lo.halfFlags[0] = CPU_Hi.halfFlags[0] = (CPU_reg[rs(instr)].halfFlags[0] & CPU_reg[rt(instr)].halfFlags[0]);
|
|
|
|
|
|
|
|
double xx, xy, yx, yy;
|
|
|
|
double lx = 0, ly = 0, hx = 0, hy = 0;
|
|
|
|
|
|
|
|
// Multiply out components
|
|
|
|
xx = f16Unsign(CPU_reg[rs(instr)].x) * f16Unsign(CPU_reg[rt(instr)].x);
|
|
|
|
xy = f16Unsign(CPU_reg[rs(instr)].x) * (CPU_reg[rt(instr)].y);
|
|
|
|
yx = (CPU_reg[rs(instr)].y) * f16Unsign(CPU_reg[rt(instr)].x);
|
|
|
|
yy = (CPU_reg[rs(instr)].y) * (CPU_reg[rt(instr)].y);
|
|
|
|
|
|
|
|
// Split values into outputs
|
|
|
|
lx = xx;
|
|
|
|
|
|
|
|
ly = f16Overflow(xx);
|
|
|
|
ly += xy + yx;
|
|
|
|
|
|
|
|
hx = f16Overflow(ly);
|
|
|
|
hx += yy;
|
|
|
|
|
|
|
|
hy = f16Overflow(hx);
|
|
|
|
|
|
|
|
CPU_Lo.x = (float)f16Sign(lx);
|
|
|
|
CPU_Lo.y = (float)f16Sign(ly);
|
|
|
|
CPU_Hi.x = (float)f16Sign(hx);
|
|
|
|
CPU_Hi.y = (float)f16Sign(hy);
|
|
|
|
|
2021-02-17 14:37:17 +00:00
|
|
|
// compute PSX value
|
|
|
|
const u64 result = static_cast<u64>(static_cast<s64>(SignExtend64(rsVal)) * static_cast<s64>(SignExtend64(rtVal)));
|
|
|
|
CPU_Hi.value = Truncate32(result >> 32);
|
|
|
|
CPU_Lo.value = Truncate32(result);
|
2020-08-19 13:26:57 +00:00
|
|
|
}
|
|
|
|
|
2021-02-17 14:37:17 +00:00
|
|
|
void CPU_MULTU(u32 instr, u32 rsVal, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Hi/Lo = Rs * Rt (unsigned)
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
|
|
|
|
// iCB: Only require one valid input
|
|
|
|
if (((CPU_reg[rt(instr)].flags & VALID_01) != VALID_01) != ((CPU_reg[rs(instr)].flags & VALID_01) != VALID_01))
|
|
|
|
{
|
|
|
|
MakeValid(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
MakeValid(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
}
|
|
|
|
|
|
|
|
CPU_Lo = CPU_Hi = CPU_reg[rs(instr)];
|
|
|
|
|
|
|
|
CPU_Lo.halfFlags[0] = CPU_Hi.halfFlags[0] = (CPU_reg[rs(instr)].halfFlags[0] & CPU_reg[rt(instr)].halfFlags[0]);
|
|
|
|
|
|
|
|
double xx, xy, yx, yy;
|
|
|
|
double lx = 0, ly = 0, hx = 0, hy = 0;
|
|
|
|
|
|
|
|
// Multiply out components
|
|
|
|
xx = f16Unsign(CPU_reg[rs(instr)].x) * f16Unsign(CPU_reg[rt(instr)].x);
|
|
|
|
xy = f16Unsign(CPU_reg[rs(instr)].x) * f16Unsign(CPU_reg[rt(instr)].y);
|
|
|
|
yx = f16Unsign(CPU_reg[rs(instr)].y) * f16Unsign(CPU_reg[rt(instr)].x);
|
|
|
|
yy = f16Unsign(CPU_reg[rs(instr)].y) * f16Unsign(CPU_reg[rt(instr)].y);
|
|
|
|
|
|
|
|
// Split values into outputs
|
|
|
|
lx = xx;
|
|
|
|
|
|
|
|
ly = f16Overflow(xx);
|
|
|
|
ly += xy + yx;
|
|
|
|
|
|
|
|
hx = f16Overflow(ly);
|
|
|
|
hx += yy;
|
|
|
|
|
|
|
|
hy = f16Overflow(hx);
|
|
|
|
|
|
|
|
CPU_Lo.x = (float)f16Sign(lx);
|
|
|
|
CPU_Lo.y = (float)f16Sign(ly);
|
|
|
|
CPU_Hi.x = (float)f16Sign(hx);
|
|
|
|
CPU_Hi.y = (float)f16Sign(hy);
|
|
|
|
|
2021-02-17 14:37:17 +00:00
|
|
|
// compute PSX value
|
|
|
|
const u64 result = ZeroExtend64(rsVal) * ZeroExtend64(rtVal);
|
|
|
|
CPU_Hi.value = Truncate32(result >> 32);
|
|
|
|
CPU_Lo.value = Truncate32(result);
|
2020-08-19 13:26:57 +00:00
|
|
|
}
|
|
|
|
|
2021-02-17 14:37:17 +00:00
|
|
|
void CPU_DIV(u32 instr, u32 rsVal, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Lo = Rs / Rt (signed)
|
|
|
|
// Hi = Rs % Rt (signed)
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
|
|
|
|
//// iCB: Only require one valid input
|
|
|
|
if (((CPU_reg[rt(instr)].flags & VALID_01) != VALID_01) != ((CPU_reg[rs(instr)].flags & VALID_01) != VALID_01))
|
|
|
|
{
|
|
|
|
MakeValid(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
MakeValid(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
}
|
|
|
|
|
|
|
|
CPU_Lo = CPU_Hi = CPU_reg[rs(instr)];
|
|
|
|
|
|
|
|
CPU_Lo.halfFlags[0] = CPU_Hi.halfFlags[0] = (CPU_reg[rs(instr)].halfFlags[0] & CPU_reg[rt(instr)].halfFlags[0]);
|
|
|
|
|
|
|
|
double vs = f16Unsign(CPU_reg[rs(instr)].x) + (CPU_reg[rs(instr)].y) * (double)(1 << 16);
|
|
|
|
double vt = f16Unsign(CPU_reg[rt(instr)].x) + (CPU_reg[rt(instr)].y) * (double)(1 << 16);
|
|
|
|
|
|
|
|
double lo = vs / vt;
|
|
|
|
CPU_Lo.y = (float)f16Sign(f16Overflow(lo));
|
|
|
|
CPU_Lo.x = (float)f16Sign(lo);
|
|
|
|
|
|
|
|
double hi = fmod(vs, vt);
|
|
|
|
CPU_Hi.y = (float)f16Sign(f16Overflow(hi));
|
|
|
|
CPU_Hi.x = (float)f16Sign(hi);
|
|
|
|
|
2021-02-17 14:37:17 +00:00
|
|
|
// compute PSX value
|
|
|
|
if (static_cast<s32>(rtVal) == 0)
|
|
|
|
{
|
|
|
|
// divide by zero
|
|
|
|
CPU_Lo.value = (static_cast<s32>(rsVal) >= 0) ? UINT32_C(0xFFFFFFFF) : UINT32_C(1);
|
|
|
|
CPU_Hi.value = static_cast<u32>(static_cast<s32>(rsVal));
|
|
|
|
}
|
|
|
|
else if (rsVal == UINT32_C(0x80000000) && static_cast<s32>(rtVal) == -1)
|
|
|
|
{
|
|
|
|
// unrepresentable
|
|
|
|
CPU_Lo.value = UINT32_C(0x80000000);
|
|
|
|
CPU_Hi.value = 0;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
CPU_Lo.value = static_cast<u32>(static_cast<s32>(rsVal) / static_cast<s32>(rtVal));
|
|
|
|
CPU_Hi.value = static_cast<u32>(static_cast<s32>(rsVal) % static_cast<s32>(rtVal));
|
|
|
|
}
|
2020-08-19 13:26:57 +00:00
|
|
|
}
|
|
|
|
|
2021-02-17 14:37:17 +00:00
|
|
|
void CPU_DIVU(u32 instr, u32 rsVal, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Lo = Rs / Rt (unsigned)
|
|
|
|
// Hi = Rs % Rt (unsigned)
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
|
|
|
|
//// iCB: Only require one valid input
|
|
|
|
if (((CPU_reg[rt(instr)].flags & VALID_01) != VALID_01) != ((CPU_reg[rs(instr)].flags & VALID_01) != VALID_01))
|
|
|
|
{
|
|
|
|
MakeValid(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
MakeValid(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
}
|
|
|
|
|
|
|
|
CPU_Lo = CPU_Hi = CPU_reg[rs(instr)];
|
|
|
|
|
|
|
|
CPU_Lo.halfFlags[0] = CPU_Hi.halfFlags[0] = (CPU_reg[rs(instr)].halfFlags[0] & CPU_reg[rt(instr)].halfFlags[0]);
|
|
|
|
|
|
|
|
double vs = f16Unsign(CPU_reg[rs(instr)].x) + f16Unsign(CPU_reg[rs(instr)].y) * (double)(1 << 16);
|
|
|
|
double vt = f16Unsign(CPU_reg[rt(instr)].x) + f16Unsign(CPU_reg[rt(instr)].y) * (double)(1 << 16);
|
|
|
|
|
|
|
|
double lo = vs / vt;
|
|
|
|
CPU_Lo.y = (float)f16Sign(f16Overflow(lo));
|
|
|
|
CPU_Lo.x = (float)f16Sign(lo);
|
|
|
|
|
|
|
|
double hi = fmod(vs, vt);
|
|
|
|
CPU_Hi.y = (float)f16Sign(f16Overflow(hi));
|
|
|
|
CPU_Hi.x = (float)f16Sign(hi);
|
|
|
|
|
2021-02-17 14:37:17 +00:00
|
|
|
if (rtVal == 0)
|
|
|
|
{
|
|
|
|
// divide by zero
|
|
|
|
CPU_Lo.value = UINT32_C(0xFFFFFFFF);
|
|
|
|
CPU_Hi.value = rsVal;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
CPU_Lo.value = rsVal / rtVal;
|
|
|
|
CPU_Hi.value = rsVal % rtVal;
|
|
|
|
}
|
2020-08-19 13:26:57 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
////////////////////////////////////
|
|
|
|
// Shift operations (sa)
|
|
|
|
////////////////////////////////////
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_SLL(u32 instr, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rt << Sa
|
2021-02-17 15:45:32 +00:00
|
|
|
const u32 rdVal = rtVal << sa(instr);
|
2020-08-19 13:26:57 +00:00
|
|
|
PGXP_value ret;
|
|
|
|
u32 sh = sa(instr);
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
|
|
|
|
ret = CPU_reg[rt(instr)];
|
|
|
|
|
|
|
|
// TODO: Shift flags
|
|
|
|
double x = f16Unsign(CPU_reg[rt(instr)].x);
|
|
|
|
double y = f16Unsign(CPU_reg[rt(instr)].y);
|
|
|
|
if (sh >= 32)
|
|
|
|
{
|
|
|
|
x = 0.f;
|
|
|
|
y = 0.f;
|
|
|
|
}
|
|
|
|
else if (sh == 16)
|
|
|
|
{
|
|
|
|
y = f16Sign(x);
|
|
|
|
x = 0.f;
|
|
|
|
}
|
|
|
|
else if (sh >= 16)
|
|
|
|
{
|
|
|
|
y = x * (1 << (sh - 16));
|
|
|
|
y = f16Sign(y);
|
|
|
|
x = 0.f;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
x = x * (1 << sh);
|
|
|
|
y = y * (1 << sh);
|
|
|
|
y += f16Overflow(x);
|
|
|
|
x = f16Sign(x);
|
|
|
|
y = f16Sign(y);
|
|
|
|
}
|
|
|
|
|
|
|
|
ret.x = (float)x;
|
|
|
|
ret.y = (float)y;
|
|
|
|
|
|
|
|
ret.value = rdVal;
|
|
|
|
CPU_reg[rd(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_SRL(u32 instr, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rt >> Sa
|
2021-02-17 15:45:32 +00:00
|
|
|
const u32 rdVal = rtVal >> sa(instr);
|
2020-08-19 13:26:57 +00:00
|
|
|
PGXP_value ret;
|
|
|
|
u32 sh = sa(instr);
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
|
|
|
|
ret = CPU_reg[rt(instr)];
|
|
|
|
|
|
|
|
double x = CPU_reg[rt(instr)].x, y = f16Unsign(CPU_reg[rt(instr)].y);
|
|
|
|
|
|
|
|
psx_value iX;
|
|
|
|
iX.d = rtVal;
|
|
|
|
psx_value iY;
|
|
|
|
iY.d = rtVal;
|
|
|
|
|
|
|
|
iX.sd = (iX.sd << 16) >> 16; // remove Y
|
|
|
|
iY.sw.l = iX.sw.h; // overwrite x with sign(x)
|
|
|
|
|
|
|
|
// Shift test values
|
|
|
|
psx_value dX;
|
|
|
|
dX.sd = iX.sd >> sh;
|
|
|
|
psx_value dY;
|
|
|
|
dY.d = iY.d >> sh;
|
|
|
|
|
|
|
|
if (dX.sw.l != iX.sw.h)
|
|
|
|
x = x / (1 << sh);
|
|
|
|
else
|
|
|
|
x = dX.sw.l; // only sign bits left
|
|
|
|
|
|
|
|
if (dY.sw.l != iX.sw.h)
|
|
|
|
{
|
|
|
|
if (sh == 16)
|
|
|
|
{
|
|
|
|
x = y;
|
|
|
|
}
|
|
|
|
else if (sh < 16)
|
|
|
|
{
|
|
|
|
x += y * (1 << (16 - sh));
|
|
|
|
if (CPU_reg[rt(instr)].x < 0)
|
|
|
|
x += 1 << (16 - sh);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
x += y / (1 << (sh - 16));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((dY.sw.h == 0) || (dY.sw.h == -1))
|
|
|
|
y = dY.sw.h;
|
|
|
|
else
|
|
|
|
y = y / (1 << sh);
|
|
|
|
|
|
|
|
x = f16Sign(x);
|
|
|
|
y = f16Sign(y);
|
|
|
|
|
|
|
|
ret.x = (float)x;
|
|
|
|
ret.y = (float)y;
|
|
|
|
|
|
|
|
ret.value = rdVal;
|
|
|
|
CPU_reg[rd(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_SRA(u32 instr, u32 rtVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rt >> Sa
|
2021-02-17 15:45:32 +00:00
|
|
|
const u32 rdVal = static_cast<u32>(static_cast<s32>(rtVal) >> sa(instr));
|
2020-08-19 13:26:57 +00:00
|
|
|
PGXP_value ret;
|
|
|
|
u32 sh = sa(instr);
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
ret = CPU_reg[rt(instr)];
|
|
|
|
|
|
|
|
double x = CPU_reg[rt(instr)].x, y = CPU_reg[rt(instr)].y;
|
|
|
|
|
|
|
|
psx_value iX;
|
|
|
|
iX.d = rtVal;
|
|
|
|
psx_value iY;
|
|
|
|
iY.d = rtVal;
|
|
|
|
|
|
|
|
iX.sd = (iX.sd << 16) >> 16; // remove Y
|
|
|
|
iY.sw.l = iX.sw.h; // overwrite x with sign(x)
|
|
|
|
|
|
|
|
// Shift test values
|
|
|
|
psx_value dX;
|
|
|
|
dX.sd = iX.sd >> sh;
|
|
|
|
psx_value dY;
|
|
|
|
dY.sd = iY.sd >> sh;
|
|
|
|
|
|
|
|
if (dX.sw.l != iX.sw.h)
|
|
|
|
x = x / (1 << sh);
|
|
|
|
else
|
|
|
|
x = dX.sw.l; // only sign bits left
|
|
|
|
|
|
|
|
if (dY.sw.l != iX.sw.h)
|
|
|
|
{
|
|
|
|
if (sh == 16)
|
|
|
|
{
|
|
|
|
x = y;
|
|
|
|
}
|
|
|
|
else if (sh < 16)
|
|
|
|
{
|
|
|
|
x += y * (1 << (16 - sh));
|
|
|
|
if (CPU_reg[rt(instr)].x < 0)
|
|
|
|
x += 1 << (16 - sh);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
x += y / (1 << (sh - 16));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((dY.sw.h == 0) || (dY.sw.h == -1))
|
|
|
|
y = dY.sw.h;
|
|
|
|
else
|
|
|
|
y = y / (1 << sh);
|
|
|
|
|
|
|
|
x = f16Sign(x);
|
|
|
|
y = f16Sign(y);
|
|
|
|
|
|
|
|
ret.x = (float)x;
|
|
|
|
ret.y = (float)y;
|
|
|
|
|
|
|
|
ret.value = rdVal;
|
|
|
|
CPU_reg[rd(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
////////////////////////////////////
|
|
|
|
// Shift operations variable
|
|
|
|
////////////////////////////////////
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_SLLV(u32 instr, u32 rtVal, u32 rsVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rt << Rs
|
2021-02-17 15:45:32 +00:00
|
|
|
const u32 rdVal = rtVal << rsVal;
|
2020-08-19 13:26:57 +00:00
|
|
|
PGXP_value ret;
|
|
|
|
u32 sh = rsVal & 0x1F;
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
|
|
|
|
ret = CPU_reg[rt(instr)];
|
|
|
|
|
|
|
|
double x = f16Unsign(CPU_reg[rt(instr)].x);
|
|
|
|
double y = f16Unsign(CPU_reg[rt(instr)].y);
|
|
|
|
if (sh >= 32)
|
|
|
|
{
|
|
|
|
x = 0.f;
|
|
|
|
y = 0.f;
|
|
|
|
}
|
|
|
|
else if (sh == 16)
|
|
|
|
{
|
|
|
|
y = f16Sign(x);
|
|
|
|
x = 0.f;
|
|
|
|
}
|
|
|
|
else if (sh >= 16)
|
|
|
|
{
|
|
|
|
y = x * (1 << (sh - 16));
|
|
|
|
y = f16Sign(y);
|
|
|
|
x = 0.f;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
x = x * (1 << sh);
|
|
|
|
y = y * (1 << sh);
|
|
|
|
y += f16Overflow(x);
|
|
|
|
x = f16Sign(x);
|
|
|
|
y = f16Sign(y);
|
|
|
|
}
|
|
|
|
|
|
|
|
ret.x = (float)x;
|
|
|
|
ret.y = (float)y;
|
|
|
|
|
|
|
|
ret.value = rdVal;
|
|
|
|
CPU_reg[rd(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_SRLV(u32 instr, u32 rtVal, u32 rsVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rt >> Sa
|
2021-02-17 15:45:32 +00:00
|
|
|
const u32 rdVal = rtVal >> rsVal;
|
2020-08-19 13:26:57 +00:00
|
|
|
PGXP_value ret;
|
|
|
|
u32 sh = rsVal & 0x1F;
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
|
|
|
|
ret = CPU_reg[rt(instr)];
|
|
|
|
|
|
|
|
double x = CPU_reg[rt(instr)].x, y = f16Unsign(CPU_reg[rt(instr)].y);
|
|
|
|
|
|
|
|
psx_value iX;
|
|
|
|
iX.d = rtVal;
|
|
|
|
psx_value iY;
|
|
|
|
iY.d = rtVal;
|
|
|
|
|
|
|
|
iX.sd = (iX.sd << 16) >> 16; // remove Y
|
|
|
|
iY.sw.l = iX.sw.h; // overwrite x with sign(x)
|
|
|
|
|
|
|
|
// Shift test values
|
|
|
|
psx_value dX;
|
|
|
|
dX.sd = iX.sd >> sh;
|
|
|
|
psx_value dY;
|
|
|
|
dY.d = iY.d >> sh;
|
|
|
|
|
|
|
|
if (dX.sw.l != iX.sw.h)
|
|
|
|
x = x / (1 << sh);
|
|
|
|
else
|
|
|
|
x = dX.sw.l; // only sign bits left
|
|
|
|
|
|
|
|
if (dY.sw.l != iX.sw.h)
|
|
|
|
{
|
|
|
|
if (sh == 16)
|
|
|
|
{
|
|
|
|
x = y;
|
|
|
|
}
|
|
|
|
else if (sh < 16)
|
|
|
|
{
|
|
|
|
x += y * (1 << (16 - sh));
|
|
|
|
if (CPU_reg[rt(instr)].x < 0)
|
|
|
|
x += 1 << (16 - sh);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
x += y / (1 << (sh - 16));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((dY.sw.h == 0) || (dY.sw.h == -1))
|
|
|
|
y = dY.sw.h;
|
|
|
|
else
|
|
|
|
y = y / (1 << sh);
|
|
|
|
|
|
|
|
x = f16Sign(x);
|
|
|
|
y = f16Sign(y);
|
|
|
|
|
|
|
|
ret.x = (float)x;
|
|
|
|
ret.y = (float)y;
|
|
|
|
|
|
|
|
ret.value = rdVal;
|
|
|
|
CPU_reg[rd(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:45:32 +00:00
|
|
|
void CPU_SRAV(u32 instr, u32 rtVal, u32 rsVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Rt >> Sa
|
2021-02-17 15:45:32 +00:00
|
|
|
const u32 rdVal = static_cast<u32>(static_cast<s32>(rtVal) >> rsVal);
|
2020-08-19 13:26:57 +00:00
|
|
|
PGXP_value ret;
|
|
|
|
u32 sh = rsVal & 0x1F;
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
|
|
|
|
|
|
|
ret = CPU_reg[rt(instr)];
|
|
|
|
|
|
|
|
double x = CPU_reg[rt(instr)].x, y = CPU_reg[rt(instr)].y;
|
|
|
|
|
|
|
|
psx_value iX;
|
|
|
|
iX.d = rtVal;
|
|
|
|
psx_value iY;
|
|
|
|
iY.d = rtVal;
|
|
|
|
|
|
|
|
iX.sd = (iX.sd << 16) >> 16; // remove Y
|
|
|
|
iY.sw.l = iX.sw.h; // overwrite x with sign(x)
|
|
|
|
|
|
|
|
// Shift test values
|
|
|
|
psx_value dX;
|
|
|
|
dX.sd = iX.sd >> sh;
|
|
|
|
psx_value dY;
|
|
|
|
dY.sd = iY.sd >> sh;
|
|
|
|
|
|
|
|
if (dX.sw.l != iX.sw.h)
|
|
|
|
x = x / (1 << sh);
|
|
|
|
else
|
|
|
|
x = dX.sw.l; // only sign bits left
|
|
|
|
|
|
|
|
if (dY.sw.l != iX.sw.h)
|
|
|
|
{
|
|
|
|
if (sh == 16)
|
|
|
|
{
|
|
|
|
x = y;
|
|
|
|
}
|
|
|
|
else if (sh < 16)
|
|
|
|
{
|
|
|
|
x += y * (1 << (16 - sh));
|
|
|
|
if (CPU_reg[rt(instr)].x < 0)
|
|
|
|
x += 1 << (16 - sh);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
x += y / (1 << (sh - 16));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((dY.sw.h == 0) || (dY.sw.h == -1))
|
|
|
|
y = dY.sw.h;
|
|
|
|
else
|
|
|
|
y = y / (1 << sh);
|
|
|
|
|
|
|
|
x = f16Sign(x);
|
|
|
|
y = f16Sign(y);
|
|
|
|
|
|
|
|
ret.x = (float)x;
|
|
|
|
ret.y = (float)y;
|
|
|
|
|
|
|
|
ret.value = rdVal;
|
|
|
|
CPU_reg[rd(instr)] = ret;
|
|
|
|
}
|
|
|
|
|
2021-02-17 14:27:31 +00:00
|
|
|
void CPU_MFHI(u32 instr, u32 hiVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Hi
|
|
|
|
Validate(&CPU_Hi, hiVal);
|
|
|
|
|
|
|
|
CPU_reg[rd(instr)] = CPU_Hi;
|
|
|
|
}
|
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
void CPU_MTHI(u32 instr, u32 rsVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Hi = Rd
|
2023-08-15 13:12:21 +00:00
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
2020-08-19 13:26:57 +00:00
|
|
|
|
|
|
|
CPU_Hi = CPU_reg[rd(instr)];
|
|
|
|
}
|
|
|
|
|
2021-02-17 14:27:31 +00:00
|
|
|
void CPU_MFLO(u32 instr, u32 loVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Rd = Lo
|
|
|
|
Validate(&CPU_Lo, loVal);
|
|
|
|
|
|
|
|
CPU_reg[rd(instr)] = CPU_Lo;
|
|
|
|
}
|
|
|
|
|
2023-08-15 13:12:21 +00:00
|
|
|
void CPU_MTLO(u32 instr, u32 rsVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// Lo = Rd
|
2023-08-15 13:12:21 +00:00
|
|
|
Validate(&CPU_reg[rs(instr)], rsVal);
|
2020-08-19 13:26:57 +00:00
|
|
|
|
|
|
|
CPU_Lo = CPU_reg[rd(instr)];
|
|
|
|
}
|
|
|
|
|
2021-02-17 15:15:18 +00:00
|
|
|
void CPU_MFC0(u32 instr, u32 rdVal)
|
2020-08-19 13:26:57 +00:00
|
|
|
{
|
|
|
|
// CPU[Rt] = CP0[Rd]
|
|
|
|
Validate(&CP0_reg[rd(instr)], rdVal);
|
|
|
|
CPU_reg[rt(instr)] = CP0_reg[rd(instr)];
|
2021-02-17 15:15:18 +00:00
|
|
|
CPU_reg[rt(instr)].value = rdVal;
|
2020-08-19 13:26:57 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void CPU_MTC0(u32 instr, u32 rdVal, u32 rtVal)
|
|
|
|
{
|
|
|
|
// CP0[Rd] = CPU[Rt]
|
|
|
|
Validate(&CPU_reg[rt(instr)], rtVal);
|
|
|
|
CP0_reg[rd(instr)] = CPU_reg[rt(instr)];
|
|
|
|
CP0_reg[rd(instr)].value = rdVal;
|
|
|
|
}
|
|
|
|
|
2020-08-19 15:21:36 +00:00
|
|
|
} // namespace PGXP
|