+#if 1
+
//
// GPU Core
//
-// by cal2
+// Originally by David Raingeard (Cal2)
// GCC/SDL port by Niels Wagenaar (Linux/WIN32) and Caz (BeOS)
-// Cleanups, endian wrongness, and bad ASM amelioration by James L. Hammons
+// Cleanups, endian wrongness, and bad ASM amelioration by James Hammons
+// (C) 2010 Underground Software
+//
+// JLH = James Hammons <jlhamm@acm.org>
+//
+// Who When What
+// --- ---------- -------------------------------------------------------------
+// JLH 01/16/2010 Created this log ;-)
+// JLH 11/26/2011 Added fixes for LOAD/STORE alignment issues
+
+//
// Note: Endian wrongness probably stems from the MAME origins of this emu and
// the braindead way in which MAME handles memory. :-)
//
+// Problem with not booting the BIOS was the incorrect way that the
+// SUBC instruction set the carry when the carry was set going in...
+// Same problem with ADDC...
+//
#include "gpu.h"
-#define CINT0FLAG 0x00200
-#define CINT1FLAG 0x00400
-#define CINT2FLAG 0x00800
-#define CINT3FLAG 0x01000
-#define CINT4FLAG 0x02000
+#include <stdlib.h>
+#include <string.h> // For memset
+#include "dsp.h"
+#include "jagdasm.h"
+#include "jaguar.h"
+#include "log.h"
+#include "m68000/m68kinterface.h"
+//#include "memory.h"
+#include "tom.h"
+
+
+// Seems alignment in loads & stores was off...
+#define GPU_CORRECT_ALIGNMENT
+//#define GPU_DEBUG
+
+// For GPU dissasembly...
+
+#if 0
+#define GPU_DIS_ABS
+#define GPU_DIS_ADD
+#define GPU_DIS_ADDC
+#define GPU_DIS_ADDQ
+#define GPU_DIS_ADDQT
+#define GPU_DIS_AND
+#define GPU_DIS_BCLR
+#define GPU_DIS_BSET
+#define GPU_DIS_BTST
+#define GPU_DIS_CMP
+#define GPU_DIS_CMPQ
+#define GPU_DIS_DIV
+#define GPU_DIS_IMULT
+#define GPU_DIS_JUMP
+#define GPU_DIS_JR
+#define GPU_DIS_LOAD
+#define GPU_DIS_LOADB
+#define GPU_DIS_LOADW
+#define GPU_DIS_LOAD14I
+#define GPU_DIS_LOAD14R
+#define GPU_DIS_LOAD15I
+#define GPU_DIS_LOAD15R
+#define GPU_DIS_MOVE
+#define GPU_DIS_MOVEFA
+#define GPU_DIS_MOVEI
+#define GPU_DIS_MOVEPC
+#define GPU_DIS_MOVETA
+#define GPU_DIS_MOVEQ
+#define GPU_DIS_MULT
+#define GPU_DIS_NEG
+#define GPU_DIS_NOP
+#define GPU_DIS_NOT
+#define GPU_DIS_OR
+#define GPU_DIS_PACK
+#define GPU_DIS_ROR
+#define GPU_DIS_RORQ
+#define GPU_DIS_SAT8
+#define GPU_DIS_SH
+#define GPU_DIS_SHA
+#define GPU_DIS_SHARQ
+#define GPU_DIS_SHLQ
+#define GPU_DIS_SHRQ
+#define GPU_DIS_STORE
+#define GPU_DIS_STOREB
+#define GPU_DIS_STOREW
+#define GPU_DIS_STORE14I
+#define GPU_DIS_STORE14R
+#define GPU_DIS_STORE15I
+#define GPU_DIS_STORE15R
+#define GPU_DIS_SUB
+#define GPU_DIS_SUBC
+#define GPU_DIS_SUBQ
+#define GPU_DIS_SUBQT
+#define GPU_DIS_XOR
+
+bool doGPUDis = false;
+//bool doGPUDis = true;
+#endif
+
+/*
+GPU opcodes use (BIOS flying ATARI logo):
++ add 357416
++ addq 538030
++ addqt 6999
++ sub 116663
++ subq 188059
++ subqt 15086
++ neg 36097
++ and 233993
++ or 109332
++ xor 1384
++ btst 111924
++ bset 25029
++ bclr 10551
++ mult 28147
++ imult 69148
++ div 64102
++ abs 159394
++ shlq 194690
++ shrq 292587
++ sharq 192649
++ rorq 58672
++ cmp 244963
++ cmpq 114834
++ move 833472
++ moveq 56427
++ moveta 220814
++ movefa 170678
++ movei 152025
++ loadw 108220
++ load 430936
++ storew 3036
++ store 372490
++ move_pc 2330
++ jump 349134
++ jr 529171
+ mmult 64904
++ nop 432179
+*/
+
+// Various bits
+
+#define CINT0FLAG 0x0200
+#define CINT1FLAG 0x0400
+#define CINT2FLAG 0x0800
+#define CINT3FLAG 0x1000
+#define CINT4FLAG 0x2000
#define CINT04FLAGS (CINT0FLAG | CINT1FLAG | CINT2FLAG | CINT3FLAG | CINT4FLAG)
+// GPU_FLAGS bits
+
+#define ZERO_FLAG 0x0001
+#define CARRY_FLAG 0x0002
+#define NEGA_FLAG 0x0004
+#define IMASK 0x0008
+#define INT_ENA0 0x0010
+#define INT_ENA1 0x0020
+#define INT_ENA2 0x0040
+#define INT_ENA3 0x0080
+#define INT_ENA4 0x0100
+#define INT_CLR0 0x0200
+#define INT_CLR1 0x0400
+#define INT_CLR2 0x0800
+#define INT_CLR3 0x1000
+#define INT_CLR4 0x2000
+#define REGPAGE 0x4000
+#define DMAEN 0x8000
+
+// External global variables
+
extern int start_logging;
+extern int gpu_start_log;
+
+// Private function prototypes
+
+void GPUUpdateRegisterBanks(void);
+void GPUDumpDisassembly(void);
+void GPUDumpRegisters(void);
+void GPUDumpMemory(void);
static void gpu_opcode_add(void);
static void gpu_opcode_addc(void);
static void gpu_opcode_sat24(void);
static void gpu_opcode_pack(void);
-uint8 gpu_opcode_cycles[64] =
-{
- 3, 3, 3, 3,
- 3, 3, 3, 3,
- 3, 3, 3, 3,
- 3, 3, 3, 3,
- 3, 3, 1, 3,
- 1, 18, 3, 3,
- 3, 3, 3, 3,
- 3, 3, 3, 3,
- 3, 3, 2, 2,
- 2, 2, 3, 4,
- 5, 4, 5, 6,
- 6, 1, 1, 1,
- 1, 2, 2, 2,
- 1, 1, 9, 3,
- 3, 1, 6, 6,
- 2, 2, 3, 3
-};
-
-void (*gpu_opcode[64])()=
-{
+// This is wrong, since it doesn't take pipeline effects into account. !!! FIX !!!
+/*uint8_t gpu_opcode_cycles[64] =
+{
+ 3, 3, 3, 3, 3, 3, 3, 3,
+ 3, 3, 3, 3, 3, 3, 3, 3,
+ 3, 3, 1, 3, 1, 18, 3, 3,
+ 3, 3, 3, 3, 3, 3, 3, 3,
+ 3, 3, 2, 2, 2, 2, 3, 4,
+ 5, 4, 5, 6, 6, 1, 1, 1,
+ 1, 2, 2, 2, 1, 1, 9, 3,
+ 3, 1, 6, 6, 2, 2, 3, 3
+};//*/
+//Here's a QnD kludge...
+//This is wrong, wrong, WRONG, but it seems to work for the time being...
+//(That is, it fixes Flip Out which relies on GPU timing rather than semaphores. Bad developers! Bad!)
+//What's needed here is a way to take pipeline effects into account (including pipeline stalls!)...
+/*uint8_t gpu_opcode_cycles[64] =
+{
+ 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 9, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 2,
+ 2, 2, 2, 3, 3, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 4, 1,
+ 1, 1, 3, 3, 1, 1, 1, 1
+};//*/
+uint8_t gpu_opcode_cycles[64] =
+{
+ 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 1
+};//*/
+
+void (*gpu_opcode[64])()=
+{
gpu_opcode_add, gpu_opcode_addc, gpu_opcode_addq, gpu_opcode_addqt,
gpu_opcode_sub, gpu_opcode_subc, gpu_opcode_subq, gpu_opcode_subqt,
gpu_opcode_neg, gpu_opcode_and, gpu_opcode_or, gpu_opcode_xor,
gpu_opcode_store_r14_ri, gpu_opcode_store_r15_ri, gpu_opcode_sat24, gpu_opcode_pack,
};
-static uint8 * gpu_ram_8;
-//static uint16 *gpu_ram_16;
-//static uint32 *gpu_ram_32;
-
-
-static uint32 gpu_pc;
-static uint32 gpu_acc;
-static uint32 gpu_remain;
-static uint32 gpu_hidata;
-static uint32 gpu_flags;
-static uint32 gpu_matrix_control;
-static uint32 gpu_pointer_to_matrix;
-static uint32 gpu_data_organization;
-static uint32 gpu_control;
-static uint32 gpu_div_control;
-static uint8 gpu_flag_z;
-static uint8 gpu_flag_n;
-static uint8 gpu_flag_c;
-static uint8 gpu_alternate_flag_z;
-static uint8 gpu_alternate_flag_n;
-static uint8 gpu_alternate_flag_c;
-static uint32 * gpu_reg;
-static uint32 * gpu_alternate_reg;
-static uint32 * gpu_reg_bank_0;
-static uint32 * gpu_reg_bank_1;
-
-static uint32 gpu_opcode_first_parameter;
-static uint32 gpu_opcode_second_parameter;
+static uint8_t gpu_ram_8[0x1000];
+uint32_t gpu_pc;
+static uint32_t gpu_acc;
+static uint32_t gpu_remain;
+static uint32_t gpu_hidata;
+static uint32_t gpu_flags;
+static uint32_t gpu_matrix_control;
+static uint32_t gpu_pointer_to_matrix;
+static uint32_t gpu_data_organization;
+static uint32_t gpu_control;
+static uint32_t gpu_div_control;
+// There is a distinct advantage to having these separated out--there's no need to clear
+// a bit before writing a result. I.e., if the result of an operation leaves a zero in
+// the carry flag, you don't have to zero gpu_flag_c before you can write that zero!
+static uint8_t gpu_flag_z, gpu_flag_n, gpu_flag_c;
+uint32_t gpu_reg_bank_0[32];
+uint32_t gpu_reg_bank_1[32];
+static uint32_t * gpu_reg;
+static uint32_t * gpu_alternate_reg;
+
+static uint32_t gpu_instruction;
+static uint32_t gpu_opcode_first_parameter;
+static uint32_t gpu_opcode_second_parameter;
#define GPU_RUNNING (gpu_control & 0x01)
-#define Rm gpu_reg[gpu_opcode_first_parameter]
-#define Rn gpu_reg[gpu_opcode_second_parameter]
-#define alternate_Rm gpu_alternate_reg[gpu_opcode_first_parameter]
-#define alternate_Rn gpu_alternate_reg[gpu_opcode_second_parameter]
-#define imm_1 gpu_opcode_first_parameter
-#define imm_2 gpu_opcode_second_parameter
+#define RM gpu_reg[gpu_opcode_first_parameter]
+#define RN gpu_reg[gpu_opcode_second_parameter]
+#define ALTERNATE_RM gpu_alternate_reg[gpu_opcode_first_parameter]
+#define ALTERNATE_RN gpu_alternate_reg[gpu_opcode_second_parameter]
+#define IMM_1 gpu_opcode_first_parameter
+#define IMM_2 gpu_opcode_second_parameter
-#define set_flag_z(r) gpu_flag_z = (r==0);
-#define set_flag_n(r) gpu_flag_n = ((r&0x80000000)>>31);
+#define SET_FLAG_Z(r) (gpu_flag_z = ((r) == 0));
+#define SET_FLAG_N(r) (gpu_flag_n = (((uint32_t)(r) >> 31) & 0x01));
-#define reset_flag_z() gpu_flag_z = 0;
-#define reset_flag_n() gpu_flag_n = 0;
-#define reset_flag_c() gpu_flag_c = 0;
+#define RESET_FLAG_Z() gpu_flag_z = 0;
+#define RESET_FLAG_N() gpu_flag_n = 0;
+#define RESET_FLAG_C() gpu_flag_c = 0;
#define CLR_Z (gpu_flag_z = 0)
#define CLR_ZN (gpu_flag_z = gpu_flag_n = 0)
#define CLR_ZNC (gpu_flag_z = gpu_flag_n = gpu_flag_c = 0)
#define SET_Z(r) (gpu_flag_z = ((r) == 0))
-#define SET_N(r) (gpu_flag_n = (((UINT32)(r) >> 31) & 0x01))
-#define SET_C_ADD(a,b) (gpu_flag_c = ((UINT32)(b) > (UINT32)(~(a))))
-#define SET_C_SUB(a,b) (gpu_flag_c = ((UINT32)(b) > (UINT32)(a)))
+#define SET_N(r) (gpu_flag_n = (((uint32_t)(r) >> 31) & 0x01))
+#define SET_C_ADD(a,b) (gpu_flag_c = ((uint32_t)(b) > (uint32_t)(~(a))))
+#define SET_C_SUB(a,b) (gpu_flag_c = ((uint32_t)(b) > (uint32_t)(a)))
#define SET_ZN(r) SET_N(r); SET_Z(r)
#define SET_ZNC_ADD(a,b,r) SET_N(r); SET_Z(r); SET_C_ADD(a,b)
#define SET_ZNC_SUB(a,b,r) SET_N(r); SET_Z(r); SET_C_SUB(a,b)
-uint32 gpu_convert_zero[32] = { 32,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31 };
+uint32_t gpu_convert_zero[32] =
+ { 32,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31 };
-uint8 * branch_condition_table = 0;
-#define branch_condition(x) branch_condition_table[(x) + ((jaguar_flags & 7) << 5)]
+uint8_t * branch_condition_table = 0;
+#define BRANCH_CONDITION(x) branch_condition_table[(x) + ((jaguar_flags & 7) << 5)]
-uint32 gpu_opcode_use[64];
+uint32_t gpu_opcode_use[64];
-void gpu_update_register_banks(void);
-
-char *gpu_opcode_str[64]=
-{
+const char * gpu_opcode_str[64]=
+{
"add", "addc", "addq", "addqt",
"sub", "subc", "subq", "subqt",
"neg", "and", "or", "xor",
"store_r14_ri", "store_r15_ri", "sat24", "pack",
};
-static uint32 gpu_in_exec = 0;
-static uint32 gpu_releaseTimeSlice_flag = 0;
+static uint32_t gpu_in_exec = 0;
+static uint32_t gpu_releaseTimeSlice_flag = 0;
-
-void gpu_releaseTimeslice(void)
+void GPUReleaseTimeslice(void)
{
gpu_releaseTimeSlice_flag = 1;
}
-uint32 gpu_get_pc(void)
+uint32_t GPUGetPC(void)
{
return gpu_pc;
}
void build_branch_condition_table(void)
{
-#define ZFLAG 0x00001
-#define CFLAG 0x00002
-#define NFLAG 0x00004
-
if (!branch_condition_table)
{
- branch_condition_table = (uint8*)malloc(32 * 8 * sizeof(branch_condition_table[0]));
+ branch_condition_table = (uint8_t *)malloc(32 * 8 * sizeof(branch_condition_table[0]));
if (branch_condition_table)
{
{
int result = 1;
if (j & 1)
- if (i & ZFLAG)
+ if (i & ZERO_FLAG)
result = 0;
if (j & 2)
- if (!(i & ZFLAG))
+ if (!(i & ZERO_FLAG))
result = 0;
if (j & 4)
- if (i & (CFLAG << (j >> 4)))
+ if (i & (CARRY_FLAG << (j >> 4)))
result = 0;
if (j & 8)
- if (!(i & (CFLAG << (j >> 4))))
+ if (!(i & (CARRY_FLAG << (j >> 4))))
result = 0;
branch_condition_table[i * 32 + j] = result;
}
//
// GPU byte access (read)
//
+uint8_t GPUReadByte(uint32_t offset, uint32_t who/*=UNKNOWN*/)
+{
+ if (offset >= 0xF02000 && offset <= 0xF020FF)
+ WriteLog("GPU: ReadByte--Attempt to read from GPU register file by %s!\n", whoName[who]);
-unsigned gpu_byte_read(unsigned int offset)
-{
- if ((offset >= gpu_work_ram_base) && (offset < gpu_work_ram_base+0x1000))
+ if ((offset >= GPU_WORK_RAM_BASE) && (offset < GPU_WORK_RAM_BASE+0x1000))
return gpu_ram_8[offset & 0xFFF];
- else if ((offset >= gpu_control_ram_base) && (offset < gpu_control_ram_base+0x20))
+ else if ((offset >= GPU_CONTROL_RAM_BASE) && (offset < GPU_CONTROL_RAM_BASE+0x20))
{
- uint32 data = gpu_long_read(offset & 0xFFFFFFFC);
+ uint32_t data = GPUReadLong(offset & 0xFFFFFFFC, who);
if ((offset & 0x03) == 0)
return data >> 24;
return data & 0xFF;
}
- return jaguar_byte_read(offset);
+ return JaguarReadByte(offset, who);
}
//
// GPU word access (read)
//
-
-unsigned gpu_word_read(unsigned int offset)
+uint16_t GPUReadWord(uint32_t offset, uint32_t who/*=UNKNOWN*/)
{
- if ((offset >= gpu_work_ram_base) && (offset < gpu_work_ram_base+0x1000))
+ if (offset >= 0xF02000 && offset <= 0xF020FF)
+ WriteLog("GPU: ReadWord--Attempt to read from GPU register file by %s!\n", whoName[who]);
+
+ if ((offset >= GPU_WORK_RAM_BASE) && (offset < GPU_WORK_RAM_BASE+0x1000))
{
offset &= 0xFFF;
- uint16 data = ((uint16)gpu_ram_8[offset] << 8) | (uint16)gpu_ram_8[offset+1];
+ uint16_t data = ((uint16_t)gpu_ram_8[offset] << 8) | (uint16_t)gpu_ram_8[offset+1];
return data;
}
- else if ((offset >= gpu_control_ram_base) && (offset < gpu_control_ram_base+0x20))
+ else if ((offset >= GPU_CONTROL_RAM_BASE) && (offset < GPU_CONTROL_RAM_BASE+0x20))
{
// This looks and smells wrong...
// But it *might* be OK...
if (offset & 0x01) // Catch cases 1 & 3... (unaligned read)
- return (gpu_byte_read(offset) << 8) | gpu_byte_read(offset+1);
+ return (GPUReadByte(offset, who) << 8) | GPUReadByte(offset+1, who);
- uint32 data = gpu_long_read(offset & 0xFFFFFFFC);
+ uint32_t data = GPUReadLong(offset & 0xFFFFFFFC, who);
if (offset & 0x02) // Cases 0 & 2...
return data & 0xFFFF;
return data >> 16;
}
- return jaguar_word_read(offset);
+//TEMP--Mirror of F03000? No. Writes only...
+//if (offset >= 0xF0B000 && offset <= 0xF0BFFF)
+//WriteLog("[GPUR16] --> Possible GPU RAM mirror access by %s!", whoName[who]);
+
+ return JaguarReadWord(offset, who);
}
//
// GPU dword access (read)
//
-
-unsigned gpu_long_read(unsigned int offset)
+uint32_t GPUReadLong(uint32_t offset, uint32_t who/*=UNKNOWN*/)
{
+ if (offset >= 0xF02000 && offset <= 0xF020FF)
+ {
+ WriteLog("GPU: ReadLong--Attempt to read from GPU register file (%X) by %s!\n", offset, whoName[who]);
+ uint32_t reg = (offset & 0xFC) >> 2;
+ return (reg < 32 ? gpu_reg_bank_0[reg] : gpu_reg_bank_1[reg - 32]);
+ }
- if ((offset >= gpu_work_ram_base) && (offset < gpu_work_ram_base+0x1000))
+// if ((offset >= GPU_WORK_RAM_BASE) && (offset < GPU_WORK_RAM_BASE + 0x1000))
+ if ((offset >= GPU_WORK_RAM_BASE) && (offset <= GPU_WORK_RAM_BASE + 0x0FFC))
{
offset &= 0xFFF;
- return ((uint32)gpu_ram_8[offset] << 24) | ((uint32)gpu_ram_8[offset+1] << 16)
- | ((uint32)gpu_ram_8[offset+2] << 8) | (uint32)gpu_ram_8[offset+3];
+ return ((uint32_t)gpu_ram_8[offset] << 24) | ((uint32_t)gpu_ram_8[offset+1] << 16)
+ | ((uint32_t)gpu_ram_8[offset+2] << 8) | (uint32_t)gpu_ram_8[offset+3];//*/
+// return GET32(gpu_ram_8, offset);
}
- else if ((offset >= gpu_control_ram_base) && (offset < gpu_control_ram_base+0x20))
+// else if ((offset >= GPU_CONTROL_RAM_BASE) && (offset < GPU_CONTROL_RAM_BASE+0x20))
+ else if ((offset >= GPU_CONTROL_RAM_BASE) && (offset <= GPU_CONTROL_RAM_BASE + 0x1C))
{
offset &= 0x1F;
switch (offset)
gpu_flag_n = (gpu_flag_n ? 1 : 0);
gpu_flags = (gpu_flags & 0xFFFFFFF8) | (gpu_flag_n << 2) | (gpu_flag_c << 1) | gpu_flag_z;
-
+
return gpu_flags & 0xFFFFC1FF;
case 0x04:
return gpu_matrix_control;
case 0x1C:
return gpu_remain;
default: // unaligned long read
+#ifdef GPU_DEBUG
+ WriteLog("GPU: Read32--unaligned 32 bit read at %08X by %s.\n", GPU_CONTROL_RAM_BASE + offset, whoName[who]);
+#endif // GPU_DEBUG
return 0;
- //exit(0);
- // __asm int 3
- // }
}
- // to prevent any lock-ups
}
+//TEMP--Mirror of F03000? No. Writes only...
+//if (offset >= 0xF0B000 && offset <= 0xF0BFFF)
+// WriteLog("[GPUR32] --> Possible GPU RAM mirror access by %s!\n", whoName[who]);
+/*if (offset >= 0xF1D000 && offset <= 0xF1DFFF)
+ WriteLog("[GPUR32] --> Reading from Wavetable ROM!\n");//*/
- return (jaguar_word_read(offset) << 16) | jaguar_word_read(offset+2);
+ return (JaguarReadWord(offset, who) << 16) | JaguarReadWord(offset + 2, who);
}
//
// GPU byte access (write)
//
-
-void gpu_byte_write(unsigned offset, unsigned data)
+void GPUWriteByte(uint32_t offset, uint8_t data, uint32_t who/*=UNKNOWN*/)
{
- if ((offset >= gpu_work_ram_base) && (offset < gpu_work_ram_base+0x1000))
+ if (offset >= 0xF02000 && offset <= 0xF020FF)
+ WriteLog("GPU: WriteByte--Attempt to write to GPU register file by %s!\n", whoName[who]);
+
+ if ((offset >= GPU_WORK_RAM_BASE) && (offset <= GPU_WORK_RAM_BASE + 0x0FFF))
{
gpu_ram_8[offset & 0xFFF] = data;
- if (gpu_in_exec == 0)
+
+//This is the same stupid worthless code that was in the DSP!!! AARRRGGGGHHHHH!!!!!!
+/* if (!gpu_in_exec)
{
-// s68000releaseTimeslice();
m68k_end_timeslice();
dsp_releaseTimeslice();
- }
+ }*/
return;
}
- else if ((offset >= gpu_control_ram_base) && (offset < gpu_control_ram_base+0x20))
+ else if ((offset >= GPU_CONTROL_RAM_BASE) && (offset <= GPU_CONTROL_RAM_BASE + 0x1F))
{
- uint32 reg = offset & 0x1C;
+ uint32_t reg = offset & 0x1C;
int bytenum = offset & 0x03;
//This is definitely wrong!
if ((reg >= 0x1C) && (reg <= 0x1F))
- gpu_div_control = (gpu_div_control & (~(0xFF << (bytenum << 3)))) | (data << (bytenum << 3));
+ gpu_div_control = (gpu_div_control & (~(0xFF << (bytenum << 3)))) | (data << (bytenum << 3));
else
{
- uint32 old_data = gpu_long_read(offset & 0xFFFFFFC);
+ uint32_t old_data = GPUReadLong(offset & 0xFFFFFFC, who);
bytenum = 3 - bytenum; // convention motorola !!!
- old_data = (old_data & (~(0xFF << (bytenum << 3)))) | (data << (bytenum << 3));
- gpu_long_write(offset & 0xFFFFFFC, old_data);
+ old_data = (old_data & (~(0xFF << (bytenum << 3)))) | (data << (bytenum << 3));
+ GPUWriteLong(offset & 0xFFFFFFC, old_data, who);
}
return;
}
-// fprintf(log_get(),"gpu: writing %.2x at 0x%.8x\n",data,offset);
- jaguar_byte_write(offset, data);
+// WriteLog("gpu: writing %.2x at 0x%.8x\n",data,offset);
+ JaguarWriteByte(offset, data, who);
}
//
// GPU word access (write)
//
-
-void gpu_word_write(unsigned offset, unsigned data)
+void GPUWriteWord(uint32_t offset, uint16_t data, uint32_t who/*=UNKNOWN*/)
{
+ if (offset >= 0xF02000 && offset <= 0xF020FF)
+ WriteLog("GPU: WriteWord--Attempt to write to GPU register file by %s!\n", whoName[who]);
- if ((offset >= gpu_work_ram_base) && (offset < gpu_work_ram_base+0x1000))
+ if ((offset >= GPU_WORK_RAM_BASE) && (offset <= GPU_WORK_RAM_BASE + 0x0FFE))
{
-
gpu_ram_8[offset & 0xFFF] = (data>>8) & 0xFF;
- gpu_ram_8[(offset+1) & 0xFFF] = data & 0xFF;
- if (gpu_in_exec == 0)
+ gpu_ram_8[(offset+1) & 0xFFF] = data & 0xFF;//*/
+/* offset &= 0xFFF;
+ SET16(gpu_ram_8, offset, data);//*/
+
+/*if (offset >= 0xF03214 && offset < 0xF0321F)
+ WriteLog("GPU: Writing WORD (%04X) to GPU RAM (%08X)...\n", data, offset);//*/
+
+
+//This is the same stupid worthless code that was in the DSP!!! AARRRGGGGHHHHH!!!!!!
+/* if (!gpu_in_exec)
{
-// s68000releaseTimeslice();
m68k_end_timeslice();
dsp_releaseTimeslice();
- }
+ }*/
return;
}
- if ((offset >= gpu_control_ram_base) && (offset < gpu_control_ram_base+0x20))
+ else if ((offset >= GPU_CONTROL_RAM_BASE) && (offset <= GPU_CONTROL_RAM_BASE + 0x1E))
{
if (offset & 0x01) // This is supposed to weed out unaligned writes, but does nothing...
{
- //exit(0);
- //__asm int 3
+#ifdef GPU_DEBUG
+ WriteLog("GPU: Write16--unaligned write @ %08X [%04X]\n", offset, data);
+ GPUDumpRegisters();
+#endif // GPU_DEBUG
+ return;
}
+//Dual locations in this range: $1C Divide unit remainder/Divide unit control (R/W)
+//This just literally sucks.
if ((offset & 0x1C) == 0x1C)
{
//This doesn't look right either--handles cases 1, 2, & 3 all the same!
- if (offset & 0x03)
- gpu_div_control = (gpu_div_control&0xFFFF0000) | (data&0xFFFF);
+ if (offset & 0x02)
+ gpu_div_control = (gpu_div_control & 0xFFFF0000) | (data & 0xFFFF);
else
- gpu_div_control = (gpu_div_control&0xFFFF) | ((data&0xFFFF)<<16);
+ gpu_div_control = (gpu_div_control & 0x0000FFFF) | ((data & 0xFFFF) << 16);
}
- else
+ else
{
- uint32 old_data = gpu_long_read(offset & 0xFFFFFFC);
- if (offset & 0x03)
+//WriteLog("[GPU W16:%08X,%04X]", offset, data);
+ uint32_t old_data = GPUReadLong(offset & 0xFFFFFFC, who);
+
+ if (offset & 0x02)
old_data = (old_data & 0xFFFF0000) | (data & 0xFFFF);
else
- old_data = (old_data & 0xFFFF) | ((data & 0xFFFF) << 16);
- gpu_long_write(offset & 0xFFFFFFC, old_data);
+ old_data = (old_data & 0x0000FFFF) | ((data & 0xFFFF) << 16);
+
+ GPUWriteLong(offset & 0xFFFFFFC, old_data, who);
}
+
+ return;
+ }
+ else if ((offset == GPU_WORK_RAM_BASE + 0x0FFF) || (GPU_CONTROL_RAM_BASE + 0x1F))
+ {
+#ifdef GPU_DEBUG
+ WriteLog("GPU: Write16--unaligned write @ %08X by %s [%04X]!\n", offset, whoName[who], data);
+ GPUDumpRegisters();
+#endif // GPU_DEBUG
return;
}
-// fprintf(log_get(),"gpu: writing %.4x at 0x%.8x\n",data,offset);
- jaguar_word_write(offset, data);
+
+ // Have to be careful here--this can cause an infinite loop!
+ JaguarWriteWord(offset, data, who);
}
//
// GPU dword access (write)
//
-
-void gpu_long_write(unsigned offset, unsigned data)
+void GPUWriteLong(uint32_t offset, uint32_t data, uint32_t who/*=UNKNOWN*/)
{
+ if (offset >= 0xF02000 && offset <= 0xF020FF)
+ WriteLog("GPU: WriteLong--Attempt to write to GPU register file by %s!\n", whoName[who]);
- if ((offset >= gpu_work_ram_base) && (offset < gpu_work_ram_base+0x1000))
+// if ((offset >= GPU_WORK_RAM_BASE) && (offset < GPU_WORK_RAM_BASE + 0x1000))
+ if ((offset >= GPU_WORK_RAM_BASE) && (offset <= GPU_WORK_RAM_BASE + 0x0FFC))
{
- gpu_ram_8[offset & 0xFFF] = (data >> 24) & 0xFF;
- gpu_ram_8[(offset+1) & 0xFFF] = (data >> 16) & 0xFF;
- gpu_ram_8[(offset+2) & 0xFFF] = (data >> 8) & 0xFF;
- gpu_ram_8[(offset+3) & 0xFFF] = data & 0xFF;
+#ifdef GPU_DEBUG
+ if (offset & 0x03)
+ {
+ WriteLog("GPU: Write32--unaligned write @ %08X [%08X] by %s\n", offset, data, whoName[who]);
+ GPUDumpRegisters();
+ }
+#endif // GPU_DEBUG
+
+ offset &= 0xFFF;
+ SET32(gpu_ram_8, offset, data);
return;
}
- else if ((offset >= gpu_control_ram_base) && (offset < gpu_control_ram_base+0x20))
+// else if ((offset >= GPU_CONTROL_RAM_BASE) && (offset < GPU_CONTROL_RAM_BASE+0x20))
+ else if ((offset >= GPU_CONTROL_RAM_BASE) && (offset <= GPU_CONTROL_RAM_BASE + 0x1C))
{
offset &= 0x1F;
switch (offset)
{
case 0x00:
- /*if (data&0x8)
- gpu_flags=(data&(~0x08))|(gpu_flags&0x08); // update dsp_flags, but keep imask unchanged
- else*/
- gpu_flags = data;
- gpu_flag_z = gpu_flags & 0x01;
- gpu_flag_c = (gpu_flags>>1) & 0x01;
- gpu_flag_n = (gpu_flags>>2) & 0x01;
- gpu_update_register_banks();
- gpu_control &= ~((gpu_flags & CINT04FLAGS) >> 3);
- gpu_check_irqs();
+ {
+ bool IMASKCleared = (gpu_flags & IMASK) && !(data & IMASK);
+ // NOTE: According to the JTRM, writing a 1 to IMASK has no effect; only the
+ // IRQ logic can set it. So we mask it out here to prevent problems...
+ gpu_flags = data & (~IMASK);
+ gpu_flag_z = gpu_flags & ZERO_FLAG;
+ gpu_flag_c = (gpu_flags & CARRY_FLAG) >> 1;
+ gpu_flag_n = (gpu_flags & NEGA_FLAG) >> 2;
+ GPUUpdateRegisterBanks();
+ gpu_control &= ~((gpu_flags & CINT04FLAGS) >> 3); // Interrupt latch clear bits
+//Writing here is only an interrupt enable--this approach is just plain wrong!
+// GPUHandleIRQs();
+//This, however, is A-OK! ;-)
+ if (IMASKCleared) // If IMASK was cleared,
+ GPUHandleIRQs(); // see if any other interrupts need servicing!
+#ifdef GPU_DEBUG
+ if (gpu_flags & (INT_ENA0 | INT_ENA1 | INT_ENA2 | INT_ENA3 | INT_ENA4))
+ WriteLog("GPU: Interrupt enable set by %s! Bits: %02X\n", whoName[who], (gpu_flags >> 4) & 0x1F);
+ WriteLog("GPU: REGPAGE %s...\n", (gpu_flags & REGPAGE ? "set" : "cleared"));
+#endif // GPU_DEBUG
break;
+ }
case 0x04:
gpu_matrix_control = data;
break;
case 0x08:
- gpu_pointer_to_matrix=data;
+ // This can only point to long aligned addresses
+ gpu_pointer_to_matrix = data & 0xFFFFFFFC;
break;
case 0x0C:
- gpu_data_organization=data;
+ gpu_data_organization = data;
break;
case 0x10:
- gpu_pc = data; /*fprintf(log_get(),"setting gpu pc to 0x%.8x\n",gpu_pc);*/
+ gpu_pc = data;
+#ifdef GPU_DEBUG
+WriteLog("GPU: %s setting GPU PC to %08X %s\n", whoName[who], gpu_pc, (GPU_RUNNING ? "(GPU is RUNNING!)" : ""));//*/
+#endif // GPU_DEBUG
break;
case 0x14:
- {
- uint32 gpu_was_running = GPU_RUNNING;
-
- data &= (~0x7C0); // disable writes to irq pending
- /*if (GPU_RUNNING)
- {
- fprintf(log_get(),"gpu pc is 0x%.8x\n",gpu_pc);
- fclose(log_get());
- exit(0);
- }*/
- // check for GPU->CPU interrupt
+ {
+// uint32_t gpu_was_running = GPU_RUNNING;
+ data &= ~0xF7C0; // Disable writes to INT_LAT0-4 & TOM version number
+
+ // check for GPU -> CPU interrupt
if (data & 0x02)
{
-// fprintf(log_get(),"GPU->CPU interrupt\n");
- if (tom_irq_enabled(IRQ_GPU))
+//WriteLog("GPU->CPU interrupt\n");
+ if (TOMIRQEnabled(IRQ_GPU))
{
- if ((tom_irq_enabled(IRQ_GPU)) && (jaguar_interrupt_handler_is_valid(64)))
- {
- tom_set_pending_gpu_int();
-// s68000interrupt(7,64);
-// s68000flushInterrupts();
- m68k_set_irq(7); // Set 68000 NMI
- gpu_releaseTimeslice();
- }
-/*
- uint32 addr=jaguar_word_read(((IRQ_GPU+64)<<2)+0);
- addr<<=16;
- addr|=jaguar_word_read(((IRQ_GPU+64)<<2)+2);
- if ((addr)&&(jaguar_interrupt_handler_is_valid(IRQ_GPU+64)))
+//This is the programmer's responsibility, to make sure the handler is valid, not ours!
+// if ((TOMIRQEnabled(IRQ_GPU))// && (JaguarInterruptHandlerIsValid(64)))
{
- s68000interrupt(7,IRQ_GPU+64);
- s68000flushInterrupts();
+ TOMSetPendingGPUInt();
+ m68k_set_irq(2); // Set 68000 IPL 2
+ GPUReleaseTimeslice();
}
-*/
}
- data &= ~(0x02);
+ data &= ~0x02;
}
- // check for CPU->GPU interrupt
+
+ // check for CPU -> GPU interrupt #0
if (data & 0x04)
{
- //fprintf(log_get(),"CPU->GPU interrupt\n");
- gpu_set_irq_line(0, 1);
-// s68000releaseTimeslice();
+//WriteLog("CPU->GPU interrupt\n");
+ GPUSetIRQLine(0, ASSERT_LINE);
m68k_end_timeslice();
- dsp_releaseTimeslice();
- data &= ~(0x04);
+ DSPReleaseTimeslice();
+ data &= ~0x04;
}
+
// single stepping
if (data & 0x10)
{
- //fprintf(log_get(),"asked to perform a single step (single step is %senabled)\n",(data&0x8)?"":"not ");
+ //WriteLog("asked to perform a single step (single step is %senabled)\n",(data&0x8)?"":"not ");
}
- gpu_control = (gpu_control & 0x107C0) | (data & (~0x107C0));
+
+ gpu_control = (gpu_control & 0xF7C0) | (data & (~0xF7C0));
// if gpu wasn't running but is now running, execute a few cycles
#ifndef GPU_SINGLE_STEPPING
- if ((!gpu_was_running) && (GPU_RUNNING))
- gpu_exec(200);
+/* if (!gpu_was_running && GPU_RUNNING)
+#ifdef GPU_DEBUG
+ {
+ WriteLog("GPU: Write32--About to do stupid braindead GPU execution for 200 cycles.\n");
+#endif // GPU_DEBUG
+ GPUExec(200);
+#ifdef GPU_DEBUG
+ }
+#endif // GPU_DEBUG//*/
#else
if (gpu_control & 0x18)
- gpu_exec(1);
+ GPUExec(1);
#endif // #ifndef GPU_SINGLE_STEPPING
#ifdef GPU_DEBUG
-fprintf(log_get(), "Write to GPU CTRL: %08X ", data);
+WriteLog("Write to GPU CTRL by %s: %08X ", whoName[who], data);
if (GPU_RUNNING)
- fprintf(log_get(), "-- Starting to run at %08X...", gpu_pc);
-fprintf(log_get(), "\n");
-#endif // #ifdef GPU_DEBUG
+ WriteLog(" --> Starting to run at %08X by %s...", gpu_pc, whoName[who]);
+else
+ WriteLog(" --> Stopped by %s! (GPU_PC: %08X)", whoName[who], gpu_pc);
+WriteLog("\n");
+#endif // GPU_DEBUG
+//if (GPU_RUNNING)
+// GPUDumpDisassembly();
+/*if (GPU_RUNNING)
+{
+ if (gpu_pc == 0xF035D8)
+ {
+// GPUDumpDisassembly();
+// log_done();
+// exit(1);
+ gpu_control &= 0xFFFFFFFE; // Don't run it and let's see what happens!
+//Hmm. Seems to lock up when going into the demo...
+//Try to disable the collision altogether!
+ }
+}//*/
+extern int effect_start5;
+static bool finished = false;
+//if (GPU_RUNNING && effect_start5 && !finished)
+if (GPU_RUNNING && effect_start5 && gpu_pc == 0xF035D8)
+{
+ // Let's do a dump of $6528!
+/* uint32_t numItems = JaguarReadWord(0x6BD6);
+ WriteLog("\nDump of $6528: %u items.\n\n", numItems);
+ for(int i=0; i<numItems*3*4; i+=3*4)
+ {
+ WriteLog("\t%04X: %08X %08X %08X -> ", 0x6528+i, JaguarReadLong(0x6528+i),
+ JaguarReadLong(0x6528+i+4), JaguarReadLong(0x6528+i+8));
+ uint16_t link = JaguarReadWord(0x6528+i+8+2);
+ for(int j=0; j<40; j+=4)
+ WriteLog("%08X ", JaguarReadLong(link + j));
+ WriteLog("\n");
+ }
+ WriteLog("\n");//*/
+ // Let's try a manual blit here...
+//This isn't working the way it should! !!! FIX !!!
+//Err, actually, it is.
+// NOW, it works right! Problem solved!!! It's a blitter bug!
+/* uint32_t src = 0x4D54, dst = 0xF03000, width = 10 * 4;
+ for(int y=0; y<127; y++)
+ {
+ for(int x=0; x<2; x++)
+ {
+ JaguarWriteLong(dst, JaguarReadLong(src));
+
+ src += 4;
+ dst += 4;
+ }
+ src += width - (2 * 4);
+ }//*/
+/* finished = true;
+ doGPUDis = true;
+ WriteLog("\nGPU: About to execute collision detection code.\n\n");//*/
+
+/* WriteLog("\nGPU: About to execute collision detection code. Data @ 4D54:\n\n");
+ int count = 0;
+ for(int i=0x004D54; i<0x004D54+2048; i++)
+ {
+ WriteLog("%02X ", JaguarReadByte(i));
+ count++;
+ if (count == 32)
+ {
+ count = 0;
+ WriteLog("\n");
+ }
+ }
+ WriteLog("\n\nData @ F03000:\n\n");
+ count = 0;
+ for(int i=0xF03000; i<0xF03200; i++)
+ {
+ WriteLog("%02X ", JaguarReadByte(i));
+ count++;
+ if (count == 32)
+ {
+ count = 0;
+ WriteLog("\n");
+ }
+ }
+ WriteLog("\n\n");
+ log_done();
+ exit(0);//*/
+}
+//if (!GPU_RUNNING)
+// doGPUDis = false;
+/*if (!GPU_RUNNING && finished)
+{
+ WriteLog("\nGPU: Finished collision detection code. Exiting!\n\n");
+ GPUDumpRegisters();
+ log_done();
+ exit(0);
+}//*/
+ // (?) If we're set running by the M68K (or DSP?) then end its timeslice to
+ // allow the GPU a chance to run...
+ // Yes! This partially fixed Trevor McFur...
+ if (GPU_RUNNING)
+ m68k_end_timeslice();
break;
}
case 0x18:
}
return;
}
-// fprintf(log_get(),"gpu: writing %.8x at 0x%.8x\n",data,offset);
- jaguar_word_write(offset, (data >> 16) & 0xFFFF);
- jaguar_word_write(offset+2, data & 0xFFFF);
+
+// JaguarWriteWord(offset, (data >> 16) & 0xFFFF, who);
+// JaguarWriteWord(offset+2, data & 0xFFFF, who);
+// We're a 32-bit processor, we can do a long write...!
+ JaguarWriteLong(offset, data, who);
}
-void gpu_update_register_banks(void)
+//
+// Change register banks if necessary
+//
+void GPUUpdateRegisterBanks(void)
{
- uint32 temp;
- int bank = (gpu_flags & 0x4000);
-
-// fprintf(log_get(),"gpu_update_register_banks at gpu pc 0x%.8x bank=%i iflag=%i\n",gpu_pc,bank?1:0,(gpu_flags&0x8)?1:0);
-
- if (gpu_flags & 0x8)
- bank = 0;
-
- if ((!bank && (gpu_reg_bank_0 != gpu_reg)) || (bank && (gpu_reg_bank_1 != gpu_reg)))
- {
-// fprintf(log_get(),"\tswitching to bank %i\n",bank?1:0);
- for(int i=0; i<32; i++)
- {
- temp = gpu_reg[i];
- gpu_reg[i] = gpu_alternate_reg[i];
- gpu_alternate_reg[i] = temp;
- }
+ int bank = (gpu_flags & REGPAGE); // REGPAGE bit
- // switch flags
- temp = gpu_flag_z;
- gpu_flag_z = gpu_alternate_flag_z;
- gpu_alternate_flag_z = temp;
+ if (gpu_flags & IMASK) // IMASK bit
+ bank = 0; // IMASK forces main bank to be bank 0
- temp = gpu_flag_n;
- gpu_flag_n = gpu_alternate_flag_n;
- gpu_alternate_flag_n = temp;
-
- temp = gpu_flag_c;
- gpu_flag_c = gpu_alternate_flag_c;
- gpu_alternate_flag_c = temp;
-
- if (!bank)
- {
- gpu_reg_bank_0 = gpu_reg;
- gpu_reg_bank_1 = gpu_alternate_reg;
- }
- else
- {
- gpu_reg_bank_0 = gpu_alternate_reg;
- gpu_reg_bank_1 = gpu_reg;
- }
- }
-// else
-// {
-// fprintf(log_get(),"\tnot switching banks\n");
-// }
+ if (bank)
+ gpu_reg = gpu_reg_bank_1, gpu_alternate_reg = gpu_reg_bank_0;
+ else
+ gpu_reg = gpu_reg_bank_0, gpu_alternate_reg = gpu_reg_bank_1;
}
-void gpu_check_irqs(void)
+void GPUHandleIRQs(void)
{
- int bits, mask, which = 0;
+ // Bail out if we're already in an interrupt!
+ if (gpu_flags & IMASK)
+ return;
- // get the active interrupt bits
- bits = (gpu_control >> 6) & 0x1F;
- bits |= (gpu_control >> 10) & 0x20;
+ // Get the interrupt latch & enable bits
+ uint32_t bits = (gpu_control >> 6) & 0x1F, mask = (gpu_flags >> 4) & 0x1F;
- // get the interrupt mask
- mask = (gpu_flags >> 4) & 0x1F;
- mask |= (gpu_flags >> 11) & 0x20;
-
- // bail if nothing is available
+ // Bail out if latched interrupts aren't enabled
bits &= mask;
if (!bits)
return;
-
- // determine which interrupt
- if (bits & 0x01) which = 0;
- if (bits & 0x02) which = 1;
- if (bits & 0x04) which = 2;
- if (bits & 0x08) which = 3;
- if (bits & 0x10) which = 4;
- if (bits & 0x20) which = 5;
-
- if (gpu_flags & 0x8)
- return;
+
+ // Determine which interrupt to service
+ uint32_t which = 0; //Isn't there a #pragma to disable this warning???
+ if (bits & 0x01)
+ which = 0;
+ if (bits & 0x02)
+ which = 1;
+ if (bits & 0x04)
+ which = 2;
+ if (bits & 0x08)
+ which = 3;
+ if (bits & 0x10)
+ which = 4;
if (start_logging)
- fprintf(log_get(),"gpu: generating irg %i\n",which);
+ WriteLog("GPU: Generating IRQ #%i\n", which);
- // set the interrupt flag
- gpu_flags |= 0x08;
- gpu_update_register_banks();
+ // set the interrupt flag
+ gpu_flags |= IMASK;
+ GPUUpdateRegisterBanks();
- // subqt #4,r31 ; pre-decrement stack pointer
- // move pc,r30 ; address of interrupted code
+ // subqt #4,r31 ; pre-decrement stack pointer
+ // move pc,r30 ; address of interrupted code
// store r30,(r31) ; store return address
gpu_reg[31] -= 4;
- gpu_reg[30] = gpu_pc - 2;
- gpu_long_write(gpu_reg[31], gpu_pc - 2);
-
- // movei #service_address,r30 ; pointer to ISR entry
- // jump (r30) ; jump to ISR
+ GPUWriteLong(gpu_reg[31], gpu_pc - 2, GPU);
+
+ // movei #service_address,r30 ; pointer to ISR entry
+ // jump (r30) ; jump to ISR
// nop
- gpu_pc = gpu_work_ram_base;
- gpu_pc += which * 0x10;
- gpu_reg[30] = gpu_pc;
+ gpu_pc = gpu_reg[30] = GPU_WORK_RAM_BASE + (which * 0x10);
}
-void gpu_set_irq_line(int irqline, int state)
+void GPUSetIRQLine(int irqline, int state)
{
if (start_logging)
- fprintf(log_get(),"gpu: setting irg line %i\n",irqline);
- int mask = 0x40 << irqline;
- gpu_control &= ~mask;
+ WriteLog("GPU: Setting GPU IRQ line #%i\n", irqline);
+
+ uint32_t mask = 0x0040 << irqline;
+ gpu_control &= ~mask; // Clear the interrupt latch
if (state)
{
- gpu_control |= mask;
- gpu_check_irqs();
+ gpu_control |= mask; // Assert the interrupt latch
+ GPUHandleIRQs(); // And handle the interrupt...
}
}
-void gpu_init(void)
+//TEMPORARY: Testing only!
+//#include "gpu2.h"
+//#include "gpu3.h"
+
+void GPUInit(void)
{
- memory_malloc_secure((void **)&gpu_ram_8, 0x1000, "GPU work ram");
-// gpu_ram_16=(uint16*)gpu_ram_8;
-// gpu_ram_32=(uint32*)gpu_ram_8;
+// memory_malloc_secure((void **)&gpu_ram_8, 0x1000, "GPU work RAM");
+// memory_malloc_secure((void **)&gpu_reg_bank_0, 32 * sizeof(int32_t), "GPU bank 0 regs");
+// memory_malloc_secure((void **)&gpu_reg_bank_1, 32 * sizeof(int32_t), "GPU bank 1 regs");
- memory_malloc_secure((void **)&gpu_reg, 32*sizeof(int32), "GPU bank 0 regs");
- memory_malloc_secure((void **)&gpu_alternate_reg, 32*sizeof(int32), "GPU bank 1 regs");
-
build_branch_condition_table();
- gpu_reset();
+ GPUReset();
+
+//TEMPORARY: Testing only!
+// gpu2_init();
+// gpu3_init();
}
-void gpu_reset(void)
+void GPUReset(void)
{
- gpu_pc = 0x00F03000;
- gpu_acc = 0x00000000;
- gpu_remain = 0x00000000;
- gpu_hidata = 0x00000000;
- gpu_flags = 0x00040000;
+ // GPU registers (directly visible)
+ gpu_flags = 0x00000000;
gpu_matrix_control = 0x00000000;
gpu_pointer_to_matrix = 0x00000000;
gpu_data_organization = 0xFFFFFFFF;
- gpu_control = 0x00012800;
+ gpu_pc = 0x00F03000;
+ gpu_control = 0x00002800; // Correctly sets this as TOM Rev. 2
+ gpu_hidata = 0x00000000;
+ gpu_remain = 0x00000000; // These two registers are RO/WO
gpu_div_control = 0x00000000;
- gpu_in_exec = 0;
- for(int i=0; i<32; i++)
- {
- gpu_reg[i] = 0x00000000;
- gpu_alternate_reg[i] = 0x00000000;
- }
-
- gpu_reg_bank_0 = gpu_reg;
- gpu_reg_bank_1 = gpu_alternate_reg;
-// gpu_reg_bank_1 = gpu_reg;
-// gpu_reg_bank_0 = gpu_alternate_reg;
+ // GPU internal register
+ gpu_acc = 0x00000000;
- reset_flag_z();
- reset_flag_n();
- reset_flag_c();
+ gpu_reg = gpu_reg_bank_0;
+ gpu_alternate_reg = gpu_reg_bank_1;
- gpu_alternate_flag_z = 0;
- gpu_alternate_flag_n = 0;
- gpu_alternate_flag_c = 0;
+ for(int i=0; i<32; i++)
+ gpu_reg[i] = gpu_alternate_reg[i] = 0x00000000;
+ CLR_ZNC;
memset(gpu_ram_8, 0xFF, 0x1000);
+ gpu_in_exec = 0;
+//not needed GPUInterruptPending = false;
+ GPUResetStats();
- gpu_reset_stats();
+ // Contents of local RAM are quasi-stable; we simulate this by randomizing RAM contents
+ for(uint32_t i=0; i<4096; i+=4)
+ *((uint32_t *)(&gpu_ram_8[i])) = rand();
}
-uint32 gpu_read_pc(void)
+uint32_t GPUReadPC(void)
{
return gpu_pc;
}
-void gpu_reset_stats(void)
+void GPUResetStats(void)
{
- for(uint32 i=0; i<64; i++)
+ for(uint32_t i=0; i<64; i++)
gpu_opcode_use[i] = 0;
+ WriteLog("--> GPU stats were reset!\n");
}
-void gpu_done(void)
-{
- fprintf(log_get(), "GPU: stopped at PC=%08X (GPU %s running)\n", gpu_pc, GPU_RUNNING ? "was" : "wasn't");
-
- // get the active interrupt bits
- int bits = (gpu_control >> 6) & 0x1F;
- bits |= (gpu_control >> 10) & 0x20;
-
- // get the interrupt mask
- int mask = (gpu_flags >> 4) & 0x1F;
- mask |= (gpu_flags >> 11) & 0x20;
-
+void GPUDumpDisassembly(void)
+{
+ char buffer[512];
- fprintf(log_get(), "GPU: ibits=0x%.8x imask=0x%.8x\n", bits, mask);
-// fprintf(log_get(),"\nregisters bank 0\n");
-// for (int j=0;j<8;j++)
-// {
-// fprintf(log_get(),"\tr%2i=0x%.8x r%2i=0x%.8x r%2i=0x%.8x r%2i=0x%.8x\n",
-// (j<<2)+0,gpu_reg[(j<<2)+0],
-// (j<<2)+1,gpu_reg[(j<<2)+1],
-// (j<<2)+2,gpu_reg[(j<<2)+2],
-// (j<<2)+3,gpu_reg[(j<<2)+3]);
-//
-// }
-// fprintf(log_get(),"registers bank 1\n");
-// for (j=0;j<8;j++)
-// {
-// fprintf(log_get(),"\tr%2i=0x%.8x r%2i=0x%.8x r%2i=0x%.8x r%2i=0x%.8x\n",
-// (j<<2)+0,gpu_alternate_reg[(j<<2)+0],
-// (j<<2)+1,gpu_alternate_reg[(j<<2)+1],
-// (j<<2)+2,gpu_alternate_reg[(j<<2)+2],
-// (j<<2)+3,gpu_alternate_reg[(j<<2)+3]);
-//
-// }
- fprintf(log_get(),"---[GPU code at 00F03000]---------------------------\n");
- static char buffer[512];
- int j = 0xF03000;
- for(int i=0; i<4096; i++)
+ WriteLog("\n---[GPU code at 00F03000]---------------------------\n");
+ uint32_t j = 0xF03000;
+ while (j <= 0xF03FFF)
{
- uint32 oldj = j;
+ uint32_t oldj = j;
j += dasmjag(JAGUAR_GPU, buffer, j);
- fprintf(log_get(),"\t%08X: %s\n", oldj, buffer);
+ WriteLog("\t%08X: %s\n", oldj, buffer);
}
+}
- fprintf(log_get(), "---[GPU code at %08X]---------------------------\n", gpu_pc);
- j = gpu_pc - 64;
- for(int i=0; i<4096; i++)
+void GPUDumpRegisters(void)
+{
+ WriteLog("\n---[GPU flags: NCZ %d%d%d]-----------------------\n", gpu_flag_n, gpu_flag_c, gpu_flag_z);
+ WriteLog("\nRegisters bank 0\n");
+ for(int j=0; j<8; j++)
{
- uint32 oldj = j;
- j += dasmjag(JAGUAR_GPU, buffer, j);
- fprintf(log_get(), "\t%08X: %s\n", oldj, buffer);
+ WriteLog("\tR%02i = %08X R%02i = %08X R%02i = %08X R%02i = %08X\n",
+ (j << 2) + 0, gpu_reg_bank_0[(j << 2) + 0],
+ (j << 2) + 1, gpu_reg_bank_0[(j << 2) + 1],
+ (j << 2) + 2, gpu_reg_bank_0[(j << 2) + 2],
+ (j << 2) + 3, gpu_reg_bank_0[(j << 2) + 3]);
+ }
+ WriteLog("Registers bank 1\n");
+ for(int j=0; j<8; j++)
+ {
+ WriteLog("\tR%02i = %08X R%02i = %08X R%02i = %08X R%02i = %08X\n",
+ (j << 2) + 0, gpu_reg_bank_1[(j << 2) + 0],
+ (j << 2) + 1, gpu_reg_bank_1[(j << 2) + 1],
+ (j << 2) + 2, gpu_reg_bank_1[(j << 2) + 2],
+ (j << 2) + 3, gpu_reg_bank_1[(j << 2) + 3]);
}
+}
+
+void GPUDumpMemory(void)
+{
+ WriteLog("\n---[GPU data at 00F03000]---------------------------\n");
+ for(int i=0; i<0xFFF; i+=4)
+ WriteLog("\t%08X: %02X %02X %02X %02X\n", 0xF03000+i, gpu_ram_8[i],
+ gpu_ram_8[i+1], gpu_ram_8[i+2], gpu_ram_8[i+3]);
+}
+
+void GPUDone(void)
+{
+ WriteLog("GPU: Stopped at PC=%08X (GPU %s running)\n", (unsigned int)gpu_pc, GPU_RUNNING ? "was" : "wasn't");
+
+ // Get the interrupt latch & enable bits
+ uint8_t bits = (gpu_control >> 6) & 0x1F, mask = (gpu_flags >> 4) & 0x1F;
+ WriteLog("GPU: Latch bits = %02X, enable bits = %02X\n", bits, mask);
- fprintf(log_get(), "gpu opcodes use:\n");
+ GPUDumpRegisters();
+ GPUDumpDisassembly();
+
+ WriteLog("\nGPU opcodes use:\n");
for(int i=0; i<64; i++)
{
if (gpu_opcode_use[i])
- fprintf(log_get(), "\t%s %lu\n", gpu_opcode_str[i], gpu_opcode_use[i]);
+ WriteLog("\t%17s %lu\n", gpu_opcode_str[i], gpu_opcode_use[i]);
}
- memory_free(gpu_ram_8);
+ WriteLog("\n");
+
+// memory_free(gpu_ram_8);
+// memory_free(gpu_reg_bank_0);
+// memory_free(gpu_reg_bank_1);
}
//
// Main GPU execution core
//
-
-void gpu_exec(int32 cycles)
+static int testCount = 1;
+static int len = 0;
+static bool tripwire = false;
+void GPUExec(int32_t cycles)
{
if (!GPU_RUNNING)
return;
gpu_control &= ~0x10;
}
#endif
- gpu_check_irqs();
+ GPUHandleIRQs();
gpu_releaseTimeSlice_flag = 0;
gpu_in_exec++;
- while ((cycles > 0) && GPU_RUNNING)
+ while (cycles > 0 && GPU_RUNNING)
+ {
+if (gpu_ram_8[0x054] == 0x98 && gpu_ram_8[0x055] == 0x0A && gpu_ram_8[0x056] == 0x03
+ && gpu_ram_8[0x057] == 0x00 && gpu_ram_8[0x058] == 0x00 && gpu_ram_8[0x059] == 0x00)
+{
+ if (gpu_pc == 0xF03000)
+ {
+ extern uint32_t starCount;
+ starCount = 0;
+/* WriteLog("GPU: Starting starfield generator... Dump of [R03=%08X]:\n", gpu_reg_bank_0[03]);
+ uint32_t base = gpu_reg_bank_0[3];
+ for(uint32_t i=0; i<0x100; i+=16)
+ {
+ WriteLog("%02X: ", i);
+ for(uint32_t j=0; j<16; j++)
+ {
+ WriteLog("%02X ", JaguarReadByte(base + i + j));
+ }
+ WriteLog("\n");
+ }*/
+ }
+// if (gpu_pc == 0xF03)
{
- gpu_flag_c = (gpu_flag_c ? 1 : 0);
+ }
+}//*/
+/*if (gpu_pc == 0xF03B9E && gpu_reg_bank_0[01] == 0)
+{
+ GPUDumpRegisters();
+ WriteLog("GPU: Starting disassembly log...\n");
+ doGPUDis = true;
+}//*/
+/*if (gpu_pc == 0xF0359A)
+{
+ doGPUDis = true;
+ GPUDumpRegisters();
+}*/
+/* gpu_flag_c = (gpu_flag_c ? 1 : 0);
gpu_flag_z = (gpu_flag_z ? 1 : 0);
- gpu_flag_n = (gpu_flag_n ? 1 : 0);
-
- uint16 opcode = gpu_word_read(gpu_pc);
-/*static char buffer[512];
-dasmjag(JAGUAR_GPU, buffer, gpu_pc);
-fprintf(log_get(), "GPU: [%08X] %s\n", gpu_pc, buffer);*/
+ gpu_flag_n = (gpu_flag_n ? 1 : 0);*/
+#if 0
+if (gpu_pc == 0xF03200)
+ doGPUDis = true;
+#endif
- uint32 index = opcode >> 10;
+ uint16_t opcode = GPUReadWord(gpu_pc, GPU);
+ uint32_t index = opcode >> 10;
+ gpu_instruction = opcode; // Added for GPU #3...
gpu_opcode_first_parameter = (opcode >> 5) & 0x1F;
gpu_opcode_second_parameter = opcode & 0x1F;
+/*if (gpu_pc == 0xF03BE8)
+WriteLog("Start of OP frame write...\n");
+if (gpu_pc == 0xF03EEE)
+WriteLog("--> Writing BRANCH object ---\n");
+if (gpu_pc == 0xF03F62)
+WriteLog("--> Writing BITMAP object ***\n");//*/
+/*if (gpu_pc == 0xF03546)
+{
+ WriteLog("\n--> GPU PC: F03546\n");
+ GPUDumpRegisters();
+ GPUDumpDisassembly();
+}//*/
+/*if (gpu_pc == 0xF033F6)
+{
+ WriteLog("\n--> GPU PC: F033F6\n");
+ GPUDumpRegisters();
+ GPUDumpDisassembly();
+}//*/
+/*if (gpu_pc == 0xF033CC)
+{
+ WriteLog("\n--> GPU PC: F033CC\n");
+ GPUDumpRegisters();
+ GPUDumpDisassembly();
+}//*/
+/*if (gpu_pc == 0xF033D6)
+{
+ WriteLog("\n--> GPU PC: F033D6 (#%d)\n", testCount++);
+ GPUDumpRegisters();
+ GPUDumpMemory();
+}//*/
+/*if (gpu_pc == 0xF033D8)
+{
+ WriteLog("\n--> GPU PC: F033D8 (#%d)\n", testCount++);
+ GPUDumpRegisters();
+ GPUDumpMemory();
+}//*/
+/*if (gpu_pc == 0xF0358E)
+{
+ WriteLog("\n--> GPU PC: F0358E (#%d)\n", testCount++);
+ GPUDumpRegisters();
+ GPUDumpMemory();
+}//*/
+/*if (gpu_pc == 0xF034CA)
+{
+ WriteLog("\n--> GPU PC: F034CA (#%d)\n", testCount++);
+ GPUDumpRegisters();
+}//*/
+/*if (gpu_pc == 0xF034CA)
+{
+ len = gpu_reg[1] + 4;//, r9save = gpu_reg[9];
+ WriteLog("\nAbout to subtract [#%d] (R14=%08X, R15=%08X, R9=%08X):\n ", testCount++, gpu_reg[14], gpu_reg[15], gpu_reg[9]);
+ for(int i=0; i<len; i+=4)
+ WriteLog(" %08X", GPUReadLong(gpu_reg[15]+i));
+ WriteLog("\n ");
+ for(int i=0; i<len; i+=4)
+ WriteLog(" %08X", GPUReadLong(gpu_reg[14]+i));
+ WriteLog("\n\n");
+}
+if (gpu_pc == 0xF034DE)
+{
+ WriteLog("\nSubtracted! (R14=%08X, R15=%08X):\n ", gpu_reg[14], gpu_reg[15]);
+ for(int i=0; i<len; i+=4)
+ WriteLog(" %08X", GPUReadLong(gpu_reg[15]+i));
+ WriteLog("\n ");
+ for(int i=0; i<len; i+=4)
+ WriteLog(" %08X", GPUReadLong(gpu_reg[14]+i));
+ WriteLog("\n ");
+ for(int i=0; i<len; i+=4)
+ WriteLog(" --------");
+ WriteLog("\n ");
+ for(int i=0; i<len; i+=4)
+ WriteLog(" %08X", GPUReadLong(gpu_reg[9]+4+i));
+ WriteLog("\n\n");
+}//*/
+/*if (gpu_pc == 0xF035C8)
+{
+ WriteLog("\n--> GPU PC: F035C8 (#%d)\n", testCount++);
+ GPUDumpRegisters();
+ GPUDumpDisassembly();
+}//*/
+
+if (gpu_start_log)
+{
+// gpu_reset_stats();
+static char buffer[512];
+dasmjag(JAGUAR_GPU, buffer, gpu_pc);
+WriteLog("GPU: [%08X] %s (RM=%08X, RN=%08X) -> ", gpu_pc, buffer, RM, RN);
+}//*/
+//$E400 -> 1110 01 -> $39 -> 57
+//GPU #1
gpu_pc += 2;
gpu_opcode[index]();
+//GPU #2
+// gpu2_opcode[index]();
+// gpu_pc += 2;
+//GPU #3 (Doesn't show ATARI logo! #1 & #2 do...)
+// gpu_pc += 2;
+// gpu3_opcode[index]();
+
+// BIOS hacking
+//GPU: [00F03548] jr nz,00F03560 (0xd561) (RM=00F03114, RN=00000004) -> --> JR: Branch taken.
+/*static bool firstTime = true;
+if (gpu_pc == 0xF03548 && firstTime)
+{
+ gpu_flag_z = 1;
+// firstTime = false;
+
+//static char buffer[512];
+//int k=0xF03548;
+//while (k<0xF0356C)
+//{
+//int oldk = k;
+//k += dasmjag(JAGUAR_GPU, buffer, k);
+//WriteLog("GPU: [%08X] %s\n", oldk, buffer);
+//}
+// gpu_start_log = 1;
+}//*/
+//GPU: [00F0354C] jump nz,(r29) (0xd3a1) (RM=00F03314, RN=00000004) -> (RM=00F03314, RN=00000004)
+/*if (gpu_pc == 0xF0354C)
+ gpu_flag_z = 0;//, gpu_start_log = 1;//*/
+
cycles -= gpu_opcode_cycles[index];
gpu_opcode_use[index]++;
+if (gpu_start_log)
+ WriteLog("(RM=%08X, RN=%08X)\n", RM, RN);//*/
+if ((gpu_pc < 0xF03000 || gpu_pc > 0xF03FFF) && !tripwire)
+{
+ WriteLog("GPU: Executing outside local RAM! GPU_PC: %08X\n", gpu_pc);
+ tripwire = true;
+}
}
gpu_in_exec--;
// GPU opcodes
//
+/*
+GPU opcodes use (offset punch--vertically below bad guy):
+ add 18686
+ addq 32621
+ sub 7483
+ subq 10252
+ and 21229
+ or 15003
+ btst 1822
+ bset 2072
+ mult 141
+ div 2392
+ shlq 13449
+ shrq 10297
+ sharq 11104
+ cmp 6775
+ cmpq 5944
+ move 31259
+ moveq 4473
+ movei 23277
+ loadb 46
+ loadw 4201
+ load 28580
+ load_r14_indexed 1183
+ load_r15_indexed 1125
+ storew 178
+ store 10144
+ store_r14_indexed 320
+ store_r15_indexed 1
+ move_pc 1742
+ jump 24467
+ jr 18090
+ nop 41362
+*/
+
+
static void gpu_opcode_jump(void)
{
- uint32 delayed_pc = Rm;
- uint32 jaguar_flags;
-
+#ifdef GPU_DIS_JUMP
+const char * condition[32] =
+{ "T", "nz", "z", "???", "nc", "nc nz", "nc z", "???", "c", "c nz",
+ "c z", "???", "???", "???", "???", "???", "???", "???", "???",
+ "???", "nn", "nn nz", "nn z", "???", "n", "n nz", "n z", "???",
+ "???", "???", "???", "F" };
+ if (doGPUDis)
+ WriteLog("%06X: JUMP %s, (R%02u) [NCZ:%u%u%u, R%02u=%08X] ", gpu_pc-2, condition[IMM_2], IMM_1, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM);
+#endif
// normalize flags
- gpu_flag_c = (gpu_flag_c ? 1 : 0);
+/* gpu_flag_c = (gpu_flag_c ? 1 : 0);
gpu_flag_z = (gpu_flag_z ? 1 : 0);
- gpu_flag_n = (gpu_flag_n ? 1 : 0);
-
- jaguar_flags = (gpu_flag_n << 2) | (gpu_flag_c << 1) | gpu_flag_z;
+ gpu_flag_n = (gpu_flag_n ? 1 : 0);*/
+ // KLUDGE: Used by BRANCH_CONDITION
+ uint32_t jaguar_flags = (gpu_flag_n << 2) | (gpu_flag_c << 1) | gpu_flag_z;
- if (branch_condition(imm_2))
+ if (BRANCH_CONDITION(IMM_2))
{
- gpu_exec(1);
+#ifdef GPU_DIS_JUMP
+ if (doGPUDis)
+ WriteLog("Branched!\n");
+#endif
+if (gpu_start_log)
+ WriteLog(" --> JUMP: Branch taken.\n");
+ uint32_t delayed_pc = RM;
+ GPUExec(1);
+ gpu_pc = delayed_pc;
+/* uint16_t opcode = GPUReadWord(gpu_pc, GPU);
+ gpu_opcode_first_parameter = (opcode >> 5) & 0x1F;
+ gpu_opcode_second_parameter = opcode & 0x1F;
+
gpu_pc = delayed_pc;
+ gpu_opcode[opcode>>10]();//*/
}
+#ifdef GPU_DIS_JUMP
+ else
+ if (doGPUDis)
+ WriteLog("Branch NOT taken.\n");
+#endif
}
+
static void gpu_opcode_jr(void)
{
- int32 offset=(imm_1&0x10) ? (0xFFFFFFF0|imm_1) : imm_1;
-
- int32 delayed_pc = gpu_pc + (offset * 2);
- uint32 jaguar_flags;
-
+#ifdef GPU_DIS_JR
+const char * condition[32] =
+{ "T", "nz", "z", "???", "nc", "nc nz", "nc z", "???", "c", "c nz",
+ "c z", "???", "???", "???", "???", "???", "???", "???", "???",
+ "???", "nn", "nn nz", "nn z", "???", "n", "n nz", "n z", "???",
+ "???", "???", "???", "F" };
+ if (doGPUDis)
+ WriteLog("%06X: JR %s, %06X [NCZ:%u%u%u] ", gpu_pc-2, condition[IMM_2], gpu_pc+((IMM_1 & 0x10 ? 0xFFFFFFF0 | IMM_1 : IMM_1) * 2), gpu_flag_n, gpu_flag_c, gpu_flag_z);
+#endif
+/* if (CONDITION(jaguar.op & 31))
+ {
+ int32_t r1 = (INT8)((jaguar.op >> 2) & 0xF8) >> 2;
+ uint32_t newpc = jaguar.PC + r1;
+ CALL_MAME_DEBUG;
+ jaguar.op = ROPCODE(jaguar.PC);
+ jaguar.PC = newpc;
+ (*jaguar.table[jaguar.op >> 10])();
+
+ jaguar_icount -= 3; // 3 wait states guaranteed
+ }*/
// normalize flags
- gpu_flag_c=gpu_flag_c?1:0;
- gpu_flag_z=gpu_flag_z?1:0;
- gpu_flag_n=gpu_flag_n?1:0;
-
- jaguar_flags=(gpu_flag_n<<2)|(gpu_flag_c<<1)|gpu_flag_z;
+/* gpu_flag_n = (gpu_flag_n ? 1 : 0);
+ gpu_flag_c = (gpu_flag_c ? 1 : 0);
+ gpu_flag_z = (gpu_flag_z ? 1 : 0);*/
+ // KLUDGE: Used by BRANCH_CONDITION
+ uint32_t jaguar_flags = (gpu_flag_n << 2) | (gpu_flag_c << 1) | gpu_flag_z;
- if (branch_condition(imm_2))
+ if (BRANCH_CONDITION(IMM_2))
{
- gpu_exec(1);
- gpu_pc=delayed_pc;
+#ifdef GPU_DIS_JR
+ if (doGPUDis)
+ WriteLog("Branched!\n");
+#endif
+if (gpu_start_log)
+ WriteLog(" --> JR: Branch taken.\n");
+ int32_t offset = (IMM_1 & 0x10 ? 0xFFFFFFF0 | IMM_1 : IMM_1); // Sign extend IMM_1
+ int32_t delayed_pc = gpu_pc + (offset * 2);
+ GPUExec(1);
+ gpu_pc = delayed_pc;
+/* uint16_t opcode = GPUReadWord(gpu_pc, GPU);
+ gpu_opcode_first_parameter = (opcode >> 5) & 0x1F;
+ gpu_opcode_second_parameter = opcode & 0x1F;
+
+ gpu_pc = delayed_pc;
+ gpu_opcode[opcode>>10]();//*/
}
+#ifdef GPU_DIS_JR
+ else
+ if (doGPUDis)
+ WriteLog("Branch NOT taken.\n");
+#endif
}
+
static void gpu_opcode_add(void)
{
- uint32 _Rm=Rm;
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* uint32 index = opcode >> 10;
- gpu_opcode_first_parameter = (opcode & 0x3E0) >> 5;
- gpu_opcode_second_parameter = (opcode & 0x1F);
- gpu_pc += 2;
- gpu_opcode[index]();
- cycles -= gpu_opcode_cycles[index];
- gpu_opcode_use[index]++;*/
-/* int dreg = jaguar.op & 31;
- UINT32 r1 = jaguar.r[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r2 + r1;
- jaguar.r[dreg] = res;
- CLR_ZNC; SET_ZNC_ADD(r2,r1,res);*/
-
- UINT32 res = Rn + Rm;
- CLR_ZNC; SET_ZNC_ADD(Rn, Rm, res);
- Rn = res;
- return;
+#ifdef GPU_DIS_ADD
+ if (doGPUDis)
+ WriteLog("%06X: ADD R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ uint32_t res = RN + RM;
+ CLR_ZNC; SET_ZNC_ADD(RN, RM, res);
+ RN = res;
+#ifdef GPU_DIS_ADD
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "addl %1, %2 \n\
- setc _gpu_flag_c \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#else
- asm(
- "addl %1, %2 \n\
- setc gpu_flag_c \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov edx,_Rm
- mov eax,_Rn
- add eax,edx
- setc [gpu_flag_c]
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
-#endif // #ifdef __PORT__
- Rn=res;
-}
static void gpu_opcode_addc(void)
{
- uint32 _Rm=Rm;
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
+#ifdef GPU_DIS_ADDC
+ if (doGPUDis)
+ WriteLog("%06X: ADDC R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
/* int dreg = jaguar.op & 31;
- UINT32 r1 = jaguar.r[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r2 + r1 + ((jaguar.FLAGS >> 1) & 1);
+ uint32_t r1 = jaguar.r[(jaguar.op >> 5) & 31];
+ uint32_t r2 = jaguar.r[dreg];
+ uint32_t res = r2 + r1 + ((jaguar.FLAGS >> 1) & 1);
jaguar.r[dreg] = res;
CLR_ZNC; SET_ZNC_ADD(r2,r1,res);*/
- UINT32 res = Rn + Rm + gpu_flag_c;
- CLR_ZNC; SET_ZNC_ADD(Rn, Rm, res);
- Rn = res;
- return;
+ uint32_t res = RN + RM + gpu_flag_c;
+ uint32_t carry = gpu_flag_c;
+// SET_ZNC_ADD(RN, RM, res); //???BUG??? Yes!
+ SET_ZNC_ADD(RN + carry, RM, res);
+// SET_ZNC_ADD(RN, RM + carry, res);
+ RN = res;
+#ifdef GPU_DIS_ADDC
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "addl %1, %2 \n\
- cmp $0, _gpu_flag_c \n\
- clc \n\
- jz 1f \n\
- stc \n\
- 1: \n\
- adc %1, %2 \n\
- setc _gpu_flag_c \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-#else
-
- asm(
- "addl %1, %2 \n\
- cmp $0, gpu_flag_c \n\
- clc \n\
- jz 1f \n\
- stc \n\
- 1: \n\
- adc %1, %2 \n\
- setc gpu_flag_c \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov edx,_Rm
- mov eax,_Rn
- cmp [gpu_flag_c],0
- clc
- jz gpu_opcode_addc_no_carry
- stc
-gpu_opcode_addc_no_carry:
- adc eax,edx
- setc [gpu_flag_c]
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
-#endif
- Rn=res;
-}
static void gpu_opcode_addq(void)
{
- uint32 _Rn=Rn;
- uint32 _Rm=gpu_convert_zero[imm_1];
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* int dreg = jaguar.op & 31;
- UINT32 r1 = convert_zero[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r2 + r1;
- jaguar.r[dreg] = res;
- CLR_ZNC; SET_ZNC_ADD(r2,r1,res);*/
- UINT32 r1 = gpu_convert_zero[imm_1];
- UINT32 res = Rn + r1;
- CLR_ZNC; SET_ZNC_ADD(Rn, r1, res);
- Rn = res;
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "addl %1, %2 \n\
- setc _gpu_flag_c \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#else
-
- asm(
- "addl %1, %2 \n\
- setc gpu_flag_c \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov edx,_Rm
- mov eax,_Rn
- add eax,edx
- setc [gpu_flag_c]
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
+#ifdef GPU_DIS_ADDQ
+ if (doGPUDis)
+ WriteLog("%06X: ADDQ #%u, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, gpu_convert_zero[IMM_1], IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ uint32_t r1 = gpu_convert_zero[IMM_1];
+ uint32_t res = RN + r1;
+ CLR_ZNC; SET_ZNC_ADD(RN, r1, res);
+ RN = res;
+#ifdef GPU_DIS_ADDQ
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
#endif
- Rn=res;
}
+
static void gpu_opcode_addqt(void)
{
- Rn += gpu_convert_zero[imm_1];
+#ifdef GPU_DIS_ADDQT
+ if (doGPUDis)
+ WriteLog("%06X: ADDQT #%u, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, gpu_convert_zero[IMM_1], IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ RN += gpu_convert_zero[IMM_1];
+#ifdef GPU_DIS_ADDQT
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_sub(void)
{
- uint32 _Rm=Rm;
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* int dreg = jaguar.op & 31;
- UINT32 r1 = jaguar.r[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r2 - r1;
- jaguar.r[dreg] = res;
- CLR_ZNC; SET_ZNC_SUB(r2,r1,res);*/
- UINT32 res = Rn - Rm;
- CLR_ZNC; SET_ZNC_SUB(Rn, Rm, res);
- Rn = res;
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "subl %1, %2 \n\
- setc _gpu_flag_c \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#else
-
- asm(
- "subl %1, %2 \n\
- setc gpu_flag_c \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov eax,_Rn
- mov edx,_Rm
- sub eax,edx
- setc [gpu_flag_c]
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
-#endif
- Rn=res;
+#ifdef GPU_DIS_SUB
+ if (doGPUDis)
+ WriteLog("%06X: SUB R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ uint32_t res = RN - RM;
+ SET_ZNC_SUB(RN, RM, res);
+ RN = res;
+#ifdef GPU_DIS_SUB
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_subc(void)
{
- uint32 _Rm=Rm;
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* int dreg = jaguar.op & 31;
- UINT32 r1 = jaguar.r[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r2 - r1 - ((jaguar.FLAGS >> 1) & 1);
- jaguar.r[dreg] = res;
- CLR_ZNC; SET_ZNC_SUB(r2,r1,res);*/
- UINT32 res = Rn - Rm - gpu_flag_c;
- CLR_ZNC; SET_ZNC_SUB(Rn, Rm, res);
- Rn = res;
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "addl %1, %2 \n\
- cmp $0, _gpu_flag_c \n\
- clc \n\
- jz 1f \n\
- stc \n\
- 1: \n\
- sbb %1, %2 \n\
- setc _gpu_flag_c \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#else
-
- asm(
- "addl %1, %2 \n\
- cmp $0, gpu_flag_c \n\
- clc \n\
- jz 1f \n\
- stc \n\
- 1: \n\
- sbb %1, %2 \n\
- setc gpu_flag_c \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- cmp [gpu_flag_c],0
- clc
- jz gpu_opcode_subc_no_carry
- stc
-gpu_opcode_subc_no_carry:
- mov edx,_Rm
- mov eax,_Rn
- sbb eax,edx
- setc [gpu_flag_c]
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
-#endif
- Rn=res;
+#ifdef GPU_DIS_SUBC
+ if (doGPUDis)
+ WriteLog("%06X: SUBC R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ // This is how the GPU ALU does it--Two's complement with inverted carry
+ uint64_t res = (uint64_t)RN + (uint64_t)(RM ^ 0xFFFFFFFF) + (gpu_flag_c ^ 1);
+ // Carry out of the result is inverted too
+ gpu_flag_c = ((res >> 32) & 0x01) ^ 1;
+ RN = (res & 0xFFFFFFFF);
+ SET_ZN(RN);
+#ifdef GPU_DIS_SUBC
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_subq(void)
{
- uint32 _Rm=gpu_convert_zero[imm_1];
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* int dreg = jaguar.op & 31;
- UINT32 r1 = convert_zero[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r2 - r1;
- jaguar.r[dreg] = res;
- CLR_ZNC; SET_ZNC_SUB(r2,r1,res);*/
- UINT32 r1 = gpu_convert_zero[imm_1];
- UINT32 res = Rn - r1;
- CLR_ZNC; SET_ZNC_SUB(Rn, r1, res);
- Rn = res;
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "subl %1, %2 \n\
- setc _gpu_flag_c \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#else
-
- asm(
- "subl %1, %2 \n\
- setc gpu_flag_c \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov eax,_Rn
- mov edx,_Rm
- sub eax,edx
- setc [gpu_flag_c]
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
+#ifdef GPU_DIS_SUBQ
+ if (doGPUDis)
+ WriteLog("%06X: SUBQ #%u, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, gpu_convert_zero[IMM_1], IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ uint32_t r1 = gpu_convert_zero[IMM_1];
+ uint32_t res = RN - r1;
+ SET_ZNC_SUB(RN, r1, res);
+ RN = res;
+#ifdef GPU_DIS_SUBQ
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
#endif
- Rn=res;
}
+
static void gpu_opcode_subqt(void)
{
- Rn -= gpu_convert_zero[imm_1];
+#ifdef GPU_DIS_SUBQT
+ if (doGPUDis)
+ WriteLog("%06X: SUBQT #%u, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, gpu_convert_zero[IMM_1], IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ RN -= gpu_convert_zero[IMM_1];
+#ifdef GPU_DIS_SUBQT
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_cmp(void)
{
- uint32 _Rm=Rm;
- uint32 _Rn=Rn;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* UINT32 r1 = jaguar.r[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[jaguar.op & 31];
- UINT32 res = r2 - r1;
- CLR_ZNC; SET_ZNC_SUB(r2,r1,res);*/
- UINT32 res = Rn - Rm;
- CLR_ZNC; SET_ZNC_SUB(Rn, Rm, res);
- return;
-}
-#else
-
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "cmpl %0, %1 \n\
- setc _gpu_flag_c \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- "
- :
- : "d"(_Rm), "a"(_Rn));
-
-#else
-
- asm(
- "cmpl %0, %1 \n\
- setc gpu_flag_c \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- "
- :
- : "d"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov eax,_Rn
- mov edx,_Rm
- cmp eax,edx
- setc [gpu_flag_c]
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- };
+#ifdef GPU_DIS_CMP
+ if (doGPUDis)
+ WriteLog("%06X: CMP R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ uint32_t res = RN - RM;
+ SET_ZNC_SUB(RN, RM, res);
+#ifdef GPU_DIS_CMP
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z);
#endif
}
+
static void gpu_opcode_cmpq(void)
{
- static int32 sqtable[32] =
+ static int32_t sqtable[32] =
{ 0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,-16,-15,-14,-13,-12,-11,-10,-9,-8,-7,-6,-5,-4,-3,-2,-1 };
- int32 _Rm=sqtable[imm_1&0x1f];
- uint32 _Rn=Rn;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* UINT32 r1 = (INT8)(jaguar.op >> 2) >> 3;
- UINT32 r2 = jaguar.r[jaguar.op & 31];
- UINT32 res = r2 - r1;
- CLR_ZNC; SET_ZNC_SUB(r2,r1,res);*/
- UINT32 r1 = sqtable[imm_1 & 0x1F]; // I like this better -> (INT8)(jaguar.op >> 2) >> 3;
- UINT32 res = Rn - r1;
- CLR_ZNC; SET_ZNC_SUB(Rn, r1, res);
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "cmpl %0, %1 \n\
- setc _gpu_flag_c \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- "
- :
- : "d"(_Rm), "a"(_Rn));
-
-#else
-
- asm(
- "cmpl %0, %1 \n\
- setc gpu_flag_c \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- "
- :
- : "d"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov eax,_Rn
- mov edx,_Rm
- cmp eax,edx
- setc [gpu_flag_c]
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- };
+#ifdef GPU_DIS_CMPQ
+ if (doGPUDis)
+ WriteLog("%06X: CMPQ #%d, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, sqtable[IMM_1], IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ uint32_t r1 = sqtable[IMM_1 & 0x1F]; // I like this better -> (INT8)(jaguar.op >> 2) >> 3;
+ uint32_t res = RN - r1;
+ SET_ZNC_SUB(RN, r1, res);
+#ifdef GPU_DIS_CMPQ
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z);
#endif
}
+
static void gpu_opcode_and(void)
{
- uint32 _Rm=Rm;
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* int dreg = jaguar.op & 31;
- UINT32 r1 = jaguar.r[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r2 & r1;
- jaguar.r[dreg] = res;
- CLR_ZN; SET_ZN(res);*/
- UINT32 res = Rn & Rm;
- Rn = res;
- CLR_ZN; SET_ZN(res);
- return;
-}
-#else
-
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "andl %1, %2 \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#else
-
- asm(
- "andl %1, %2 \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov eax,_Rn
- mov edx,_Rm
- and eax,edx
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
+#ifdef GPU_DIS_AND
+ if (doGPUDis)
+ WriteLog("%06X: AND R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ RN = RN & RM;
+ SET_ZN(RN);
+#ifdef GPU_DIS_AND
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
#endif
- Rn=res;
}
+
static void gpu_opcode_or(void)
{
- uint32 _Rm=Rm;
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* int dreg = jaguar.op & 31;
- UINT32 r1 = jaguar.r[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r1 | r2;
- jaguar.r[dreg] = res;
- CLR_ZN; SET_ZN(res);*/
- UINT32 res = Rn | Rm;
- Rn = res;
- CLR_ZN; SET_ZN(res);
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "orl %1, %2 \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#else
-
- asm(
- "orl %1, %2 \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov eax,_Rn
- mov edx,_Rm
- or eax,edx
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
+#ifdef GPU_DIS_OR
+ if (doGPUDis)
+ WriteLog("%06X: OR R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ RN = RN | RM;
+ SET_ZN(RN);
+#ifdef GPU_DIS_OR
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
#endif
- Rn=res;
}
+
static void gpu_opcode_xor(void)
{
- uint32 _Rm=Rm;
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* int dreg = jaguar.op & 31;
- UINT32 r1 = jaguar.r[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r1 ^ r2;
- jaguar.r[dreg] = res;
- CLR_ZN; SET_ZN(res);*/
- UINT32 res = Rn ^ Rm;
- Rn = res;
- CLR_ZN; SET_ZN(res);
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "xorl %1, %2 \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#else
-
- asm(
- "xorl %1, %2 \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov eax,_Rn
- mov edx,_Rm
- xor eax,edx
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
+#ifdef GPU_DIS_XOR
+ if (doGPUDis)
+ WriteLog("%06X: XOR R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ RN = RN ^ RM;
+ SET_ZN(RN);
+#ifdef GPU_DIS_XOR
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
#endif
- Rn=res;
}
+
static void gpu_opcode_not(void)
{
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* int dreg = jaguar.op & 31;
- UINT32 res = ~jaguar.r[dreg];
- jaguar.r[dreg] = res;
- CLR_ZN; SET_ZN(res);*/
- UINT32 res = ~Rn;
- Rn = res;
- CLR_ZN; SET_ZN(res);
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "notl %1 \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "a"(_Rn));
-
-#else
-
- asm(
- "notl %1 \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov eax,_Rn
- not eax
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
+#ifdef GPU_DIS_NOT
+ if (doGPUDis)
+ WriteLog("%06X: NOT R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ RN = ~RN;
+ SET_ZN(RN);
+#ifdef GPU_DIS_NOT
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
#endif
- Rn=res;
}
+
static void gpu_opcode_move_pc(void)
{
- Rn = gpu_pc-2;
+#ifdef GPU_DIS_MOVEPC
+ if (doGPUDis)
+ WriteLog("%06X: MOVE PC, R%02u [NCZ:%u%u%u, PC=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, gpu_pc-2, IMM_2, RN);
+#endif
+ // Should be previous PC--this might not always be previous instruction!
+ // Then again, this will point right at the *current* instruction, i.e., MOVE PC,R!
+ RN = gpu_pc - 2;
+#ifdef GPU_DIS_MOVEPC
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_sat8(void)
{
- int32 _Rn=(int32)Rn;
-
- uint32 res= Rn = (_Rn<0) ? 0 : (_Rn > 0xff ? 0xff : _Rn);
- set_flag_z(res);
- reset_flag_n();
+#ifdef GPU_DIS_SAT8
+ if (doGPUDis)
+ WriteLog("%06X: SAT8 R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ RN = ((int32_t)RN < 0 ? 0 : (RN > 0xFF ? 0xFF : RN));
+ SET_ZN(RN);
+#ifdef GPU_DIS_SAT8
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_sat16(void)
{
- int32 _Rn=(int32)Rn;
- uint32 res= Rn = (_Rn<0) ? 0 : (_Rn > 0xFFFF ? 0xFFFF : _Rn);
- set_flag_z(res);
- reset_flag_n();
+ RN = ((int32_t)RN < 0 ? 0 : (RN > 0xFFFF ? 0xFFFF : RN));
+ SET_ZN(RN);
}
static void gpu_opcode_sat24(void)
{
- int32 _Rn=(int32)Rn;
-
- uint32 res= Rn = (_Rn<0) ? 0 : (_Rn > 0xFFFFFF ? 0xFFFFFF : _Rn);
- set_flag_z(res);
- reset_flag_n();
+ RN = ((int32_t)RN < 0 ? 0 : (RN > 0xFFFFFF ? 0xFFFFFF : RN));
+ SET_ZN(RN);
}
+
static void gpu_opcode_store_r14_indexed(void)
{
- gpu_long_write( gpu_reg[14] + (gpu_convert_zero[imm_1] << 2),Rn);
+#ifdef GPU_DIS_STORE14I
+ if (doGPUDis)
+ WriteLog("%06X: STORE R%02u, (R14+$%02X) [NCZ:%u%u%u, R%02u=%08X, R14+$%02X=%08X]\n", gpu_pc-2, IMM_2, gpu_convert_zero[IMM_1] << 2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN, gpu_convert_zero[IMM_1] << 2, gpu_reg[14]+(gpu_convert_zero[IMM_1] << 2));
+#endif
+#ifdef GPU_CORRECT_ALIGNMENT
+ uint32_t address = gpu_reg[14] + (gpu_convert_zero[IMM_1] << 2);
+
+ if (address >= 0xF03000 && address <= 0xF03FFF)
+ GPUWriteLong(address & 0xFFFFFFFC, RN, GPU);
+ else
+ GPUWriteLong(address, RN, GPU);
+#else
+ GPUWriteLong(gpu_reg[14] + (gpu_convert_zero[IMM_1] << 2), RN, GPU);
+#endif
}
+
static void gpu_opcode_store_r15_indexed(void)
{
- gpu_long_write( gpu_reg[15] + (gpu_convert_zero[imm_1] << 2),Rn);
+#ifdef GPU_DIS_STORE15I
+ if (doGPUDis)
+ WriteLog("%06X: STORE R%02u, (R15+$%02X) [NCZ:%u%u%u, R%02u=%08X, R15+$%02X=%08X]\n", gpu_pc-2, IMM_2, gpu_convert_zero[IMM_1] << 2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN, gpu_convert_zero[IMM_1] << 2, gpu_reg[15]+(gpu_convert_zero[IMM_1] << 2));
+#endif
+#ifdef GPU_CORRECT_ALIGNMENT
+ uint32_t address = gpu_reg[15] + (gpu_convert_zero[IMM_1] << 2);
+
+ if (address >= 0xF03000 && address <= 0xF03FFF)
+ GPUWriteLong(address & 0xFFFFFFFC, RN, GPU);
+ else
+ GPUWriteLong(address, RN, GPU);
+#else
+ GPUWriteLong(gpu_reg[15] + (gpu_convert_zero[IMM_1] << 2), RN, GPU);
+#endif
}
+
static void gpu_opcode_load_r14_ri(void)
{
- Rn=gpu_long_read(gpu_reg[14] + Rm);
+#ifdef GPU_DIS_LOAD14R
+ if (doGPUDis)
+ WriteLog("%06X: LOAD (R14+R%02u), R%02u [NCZ:%u%u%u, R14+R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM+gpu_reg[14], IMM_2, RN);
+#endif
+#ifdef GPU_CORRECT_ALIGNMENT
+ uint32_t address = gpu_reg[14] + RM;
+
+ if (address >= 0xF03000 && address <= 0xF03FFF)
+ RN = GPUReadLong(address & 0xFFFFFFFC, GPU);
+ else
+ RN = GPUReadLong(address, GPU);
+#else
+ RN = GPUReadLong(gpu_reg[14] + RM, GPU);
+#endif
+#ifdef GPU_DIS_LOAD14R
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_load_r15_ri(void)
{
- Rn=gpu_long_read(gpu_reg[15] + Rm);
+#ifdef GPU_DIS_LOAD15R
+ if (doGPUDis)
+ WriteLog("%06X: LOAD (R15+R%02u), R%02u [NCZ:%u%u%u, R15+R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM+gpu_reg[15], IMM_2, RN);
+#endif
+#ifdef GPU_CORRECT_ALIGNMENT
+ uint32_t address = gpu_reg[15] + RM;
+
+ if (address >= 0xF03000 && address <= 0xF03FFF)
+ RN = GPUReadLong(address & 0xFFFFFFFC, GPU);
+ else
+ RN = GPUReadLong(address, GPU);
+#else
+ RN = GPUReadLong(gpu_reg[15] + RM, GPU);
+#endif
+#ifdef GPU_DIS_LOAD15R
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_store_r14_ri(void)
{
- gpu_long_write(gpu_reg[14] + Rm,Rn);
+#ifdef GPU_DIS_STORE14R
+ if (doGPUDis)
+ WriteLog("%06X: STORE R%02u, (R14+R%02u) [NCZ:%u%u%u, R%02u=%08X, R14+R%02u=%08X]\n", gpu_pc-2, IMM_2, IMM_1, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN, IMM_1, RM+gpu_reg[14]);
+#endif
+#ifdef GPU_CORRECT_ALIGNMENT
+ uint32_t address = gpu_reg[14] + RM;
+
+ if (address >= 0xF03000 && address <= 0xF03FFF)
+ GPUWriteLong(address & 0xFFFFFFFC, RN, GPU);
+ else
+ GPUWriteLong(address, RN, GPU);
+#else
+ GPUWriteLong(gpu_reg[14] + RM, RN, GPU);
+#endif
}
+
static void gpu_opcode_store_r15_ri(void)
{
- gpu_long_write(gpu_reg[15] + Rm,Rn);
+#ifdef GPU_DIS_STORE15R
+ if (doGPUDis)
+ WriteLog("%06X: STORE R%02u, (R15+R%02u) [NCZ:%u%u%u, R%02u=%08X, R15+R%02u=%08X]\n", gpu_pc-2, IMM_2, IMM_1, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN, IMM_1, RM+gpu_reg[15]);
+#endif
+#ifdef GPU_CORRECT_ALIGNMENT_STORE
+ uint32_t address = gpu_reg[15] + RM;
+
+ if (address >= 0xF03000 && address <= 0xF03FFF)
+ GPUWriteLong(address & 0xFFFFFFFC, RN, GPU);
+ else
+ GPUWriteLong(address, RN, GPU);
+#else
+ GPUWriteLong(gpu_reg[15] + RM, RN, GPU);
+#endif
}
+
static void gpu_opcode_nop(void)
{
+#ifdef GPU_DIS_NOP
+ if (doGPUDis)
+ WriteLog("%06X: NOP [NCZ:%u%u%u]\n", gpu_pc-2, gpu_flag_n, gpu_flag_c, gpu_flag_z);
+#endif
}
+
static void gpu_opcode_pack(void)
{
- uint32 _Rn=Rn;
-
- if (Rm==0)
- {
- Rn =((_Rn & 0x03C00000) >> 10) |
- ((_Rn & 0x0001E000) >> 5) |
- ((_Rn & 0x000000FF));
- }
- else
- {
- Rn =((_Rn & 0x0000F000) << 10) |
- ((_Rn & 0x00000F00) << 5) |
- ((_Rn & 0x000000FF));
- }
- reset_flag_z();
- reset_flag_n();
- set_flag_z(Rn);
- set_flag_n(Rn);
+#ifdef GPU_DIS_PACK
+ if (doGPUDis)
+ WriteLog("%06X: %s R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, (!IMM_1 ? "PACK " : "UNPACK"), IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ uint32_t val = RN;
+
+//BUG! if (RM == 0) // Pack
+ if (IMM_1 == 0) // Pack
+ RN = ((val >> 10) & 0x0000F000) | ((val >> 5) & 0x00000F00) | (val & 0x000000FF);
+ else // Unpack
+ RN = ((val & 0x0000F000) << 10) | ((val & 0x00000F00) << 5) | (val & 0x000000FF);
+#ifdef GPU_DIS_PACK
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_storeb(void)
{
- if ((Rm >= 0xF03000) && (Rm < 0xF04000))
- gpu_long_write(Rm,Rn&0xff);
+#ifdef GPU_DIS_STOREB
+ if (doGPUDis)
+ WriteLog("%06X: STOREB R%02u, (R%02u) [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_pc-2, IMM_2, IMM_1, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN, IMM_1, RM);
+#endif
+//Is this right???
+// Would appear to be so...!
+ if ((RM >= 0xF03000) && (RM <= 0xF03FFF))
+ GPUWriteLong(RM, RN & 0xFF, GPU);
else
- jaguar_byte_write(Rm,Rn);
+ JaguarWriteByte(RM, RN, GPU);
}
+
static void gpu_opcode_storew(void)
{
- if ((Rm >= 0xF03000) && (Rm < 0xF04000))
- gpu_long_write(Rm,Rn&0xffff);
+#ifdef GPU_DIS_STOREW
+ if (doGPUDis)
+ WriteLog("%06X: STOREW R%02u, (R%02u) [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_pc-2, IMM_2, IMM_1, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN, IMM_1, RM);
+#endif
+#ifdef GPU_CORRECT_ALIGNMENT
+ if ((RM >= 0xF03000) && (RM <= 0xF03FFF))
+ GPUWriteLong(RM & 0xFFFFFFFE, RN & 0xFFFF, GPU);
else
- jaguar_word_write(Rm,Rn);
+ JaguarWriteWord(RM, RN, GPU);
+#else
+ if ((RM >= 0xF03000) && (RM <= 0xF03FFF))
+ GPUWriteLong(RM, RN & 0xFFFF, GPU);
+ else
+ JaguarWriteWord(RM, RN, GPU);
+#endif
}
+
static void gpu_opcode_store(void)
{
- gpu_long_write(Rm,Rn);
+#ifdef GPU_DIS_STORE
+ if (doGPUDis)
+ WriteLog("%06X: STORE R%02u, (R%02u) [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_pc-2, IMM_2, IMM_1, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN, IMM_1, RM);
+#endif
+#ifdef GPU_CORRECT_ALIGNMENT
+ if ((RM >= 0xF03000) && (RM <= 0xF03FFF))
+ GPUWriteLong(RM & 0xFFFFFFFC, RN, GPU);
+ else
+ GPUWriteLong(RM, RN, GPU);
+#else
+ GPUWriteLong(RM, RN, GPU);
+#endif
}
+
static void gpu_opcode_storep(void)
{
- uint32 _Rm=Rm;
- gpu_long_write(_Rm, gpu_hidata);
- gpu_long_write(_Rm+4, Rn);
+#ifdef GPU_CORRECT_ALIGNMENT
+ if ((RM >= 0xF03000) && (RM <= 0xF03FFF))
+ {
+ GPUWriteLong((RM & 0xFFFFFFF8) + 0, gpu_hidata, GPU);
+ GPUWriteLong((RM & 0xFFFFFFF8) + 4, RN, GPU);
+ }
+ else
+ {
+ GPUWriteLong(RM + 0, gpu_hidata, GPU);
+ GPUWriteLong(RM + 4, RN, GPU);
+ }
+#else
+ GPUWriteLong(RM + 0, gpu_hidata, GPU);
+ GPUWriteLong(RM + 4, RN, GPU);
+#endif
}
static void gpu_opcode_loadb(void)
{
- if ((Rm >= 0xF03000) && (Rm < 0xF04000))
- Rn=gpu_long_read(Rm)&0xff;
+#ifdef GPU_DIS_LOADB
+ if (doGPUDis)
+ WriteLog("%06X: LOADB (R%02u), R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ if ((RM >= 0xF03000) && (RM <= 0xF03FFF))
+ RN = GPUReadLong(RM, GPU) & 0xFF;
else
- Rn=jaguar_byte_read(Rm);
+ RN = JaguarReadByte(RM, GPU);
+#ifdef GPU_DIS_LOADB
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_loadw(void)
{
- if ((Rm >= 0xF03000) && (Rm < 0xF04000))
- Rn=gpu_long_read(Rm)&0xffff;
+#ifdef GPU_DIS_LOADW
+ if (doGPUDis)
+ WriteLog("%06X: LOADW (R%02u), R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+#ifdef GPU_CORRECT_ALIGNMENT
+ if ((RM >= 0xF03000) && (RM <= 0xF03FFF))
+ RN = GPUReadLong(RM & 0xFFFFFFFE, GPU) & 0xFFFF;
+ else
+ RN = JaguarReadWord(RM, GPU);
+#else
+ if ((RM >= 0xF03000) && (RM <= 0xF03FFF))
+ RN = GPUReadLong(RM, GPU) & 0xFFFF;
else
- Rn=jaguar_word_read(Rm);
+ RN = JaguarReadWord(RM, GPU);
+#endif
+#ifdef GPU_DIS_LOADW
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
+// According to the docs, & "Do The Same", this address is long aligned...
+// So let's try it:
+// And it works!!! Need to fix all instances...
+// Also, Power Drive Rally seems to contradict the idea that only LOADs in
+// the $F03000-$F03FFF range are aligned...
+#warning "!!! Alignment issues, need to find definitive final word on this !!!"
+/*
+Preliminary testing on real hardware seems to confirm that something strange goes on
+with unaligned reads in main memory. When the address is off by 1, the result is the
+same as the long address with the top byte replaced by something. So if the read is
+from $401, and $400 has 12 34 56 78, the value read will be $nn345678, where nn is a currently unknown vlaue.
+When the address is off by 2, the result would be $nnnn5678, where nnnn is unknown.
+When the address is off by 3, the result would be $nnnnnn78, where nnnnnn is unknown.
+It may be that the "unknown" values come from the prefetch queue, but not sure how
+to test that. They seem to be stable, though, which would indicate such a mechanism.
+Sometimes, however, the off by 2 case returns $12345678!
+*/
static void gpu_opcode_load(void)
{
- Rn = gpu_long_read(Rm);
+#ifdef GPU_DIS_LOAD
+ if (doGPUDis)
+ WriteLog("%06X: LOAD (R%02u), R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+#ifdef GPU_CORRECT_ALIGNMENT
+ uint32_t mask[4] = { 0x00000000, 0xFF000000, 0xFFFF0000, 0xFFFFFF00 };
+// if ((RM >= 0xF03000) && (RM <= 0xF03FFF))
+ RN = GPUReadLong(RM & 0xFFFFFFFC, GPU);
+// RN = GPUReadLong(RM & 0x00FFFFFC, GPU);
+// else
+// RN = GPUReadLong(RM, GPU);
+ // Simulate garbage in unaligned reads...
+//seems that this behavior is different in GPU mem vs. main mem...
+// if ((RM < 0xF03000) || (RM > 0xF0BFFF))
+// RN |= mask[RM & 0x03];
+#else
+ RN = GPUReadLong(RM, GPU);
+#endif
+#ifdef GPU_DIS_LOAD
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_loadp(void)
{
- uint32 _Rm=Rm;
-
- gpu_hidata = gpu_long_read(_Rm);
- Rn = gpu_long_read(_Rm+4);
+#ifdef GPU_CORRECT_ALIGNMENT
+ if ((RM >= 0xF03000) && (RM <= 0xF03FFF))
+ {
+ gpu_hidata = GPUReadLong((RM & 0xFFFFFFF8) + 0, GPU);
+ RN = GPUReadLong((RM & 0xFFFFFFF8) + 4, GPU);
+ }
+ else
+ {
+ gpu_hidata = GPUReadLong(RM + 0, GPU);
+ RN = GPUReadLong(RM + 4, GPU);
+ }
+#else
+ gpu_hidata = GPUReadLong(RM + 0, GPU);
+ RN = GPUReadLong(RM + 4, GPU);
+#endif
}
+
static void gpu_opcode_load_r14_indexed(void)
{
- Rn = gpu_long_read( gpu_reg[14] + (gpu_convert_zero[imm_1] << 2));
+#ifdef GPU_DIS_LOAD14I
+ if (doGPUDis)
+ WriteLog("%06X: LOAD (R14+$%02X), R%02u [NCZ:%u%u%u, R14+$%02X=%08X, R%02u=%08X] -> ", gpu_pc-2, gpu_convert_zero[IMM_1] << 2, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, gpu_convert_zero[IMM_1] << 2, gpu_reg[14]+(gpu_convert_zero[IMM_1] << 2), IMM_2, RN);
+#endif
+#ifdef GPU_CORRECT_ALIGNMENT
+ uint32_t address = gpu_reg[14] + (gpu_convert_zero[IMM_1] << 2);
+
+ if ((RM >= 0xF03000) && (RM <= 0xF03FFF))
+ RN = GPUReadLong(address & 0xFFFFFFFC, GPU);
+ else
+ RN = GPUReadLong(address, GPU);
+#else
+ RN = GPUReadLong(gpu_reg[14] + (gpu_convert_zero[IMM_1] << 2), GPU);
+#endif
+#ifdef GPU_DIS_LOAD14I
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_load_r15_indexed(void)
{
- Rn = gpu_long_read( gpu_reg[15] + (gpu_convert_zero[imm_1] << 2));
+#ifdef GPU_DIS_LOAD15I
+ if (doGPUDis)
+ WriteLog("%06X: LOAD (R15+$%02X), R%02u [NCZ:%u%u%u, R15+$%02X=%08X, R%02u=%08X] -> ", gpu_pc-2, gpu_convert_zero[IMM_1] << 2, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, gpu_convert_zero[IMM_1] << 2, gpu_reg[15]+(gpu_convert_zero[IMM_1] << 2), IMM_2, RN);
+#endif
+#ifdef GPU_CORRECT_ALIGNMENT
+ uint32_t address = gpu_reg[15] + (gpu_convert_zero[IMM_1] << 2);
+
+ if ((RM >= 0xF03000) && (RM <= 0xF03FFF))
+ RN = GPUReadLong(address & 0xFFFFFFFC, GPU);
+ else
+ RN = GPUReadLong(address, GPU);
+#else
+ RN = GPUReadLong(gpu_reg[15] + (gpu_convert_zero[IMM_1] << 2), GPU);
+#endif
+#ifdef GPU_DIS_LOAD15I
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_movei(void)
{
- Rn = (uint32)gpu_word_read(gpu_pc) | ((uint32)gpu_word_read(gpu_pc + 2) << 16);
+#ifdef GPU_DIS_MOVEI
+ if (doGPUDis)
+ WriteLog("%06X: MOVEI #$%08X, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, (uint32_t)GPUReadWord(gpu_pc) | ((uint32_t)GPUReadWord(gpu_pc + 2) << 16), IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ // This instruction is followed by 32-bit value in LSW / MSW format...
+ RN = (uint32_t)GPUReadWord(gpu_pc, GPU) | ((uint32_t)GPUReadWord(gpu_pc + 2, GPU) << 16);
gpu_pc += 4;
+#ifdef GPU_DIS_MOVEI
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_moveta(void)
{
- alternate_Rn = Rm;
+#ifdef GPU_DIS_MOVETA
+ if (doGPUDis)
+ WriteLog("%06X: MOVETA R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u(alt)=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, ALTERNATE_RN);
+#endif
+ ALTERNATE_RN = RM;
+#ifdef GPU_DIS_MOVETA
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u(alt)=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, ALTERNATE_RN);
+#endif
}
+
static void gpu_opcode_movefa(void)
{
- Rn = alternate_Rm;
+#ifdef GPU_DIS_MOVEFA
+ if (doGPUDis)
+ WriteLog("%06X: MOVEFA R%02u, R%02u [NCZ:%u%u%u, R%02u(alt)=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, ALTERNATE_RM, IMM_2, RN);
+#endif
+ RN = ALTERNATE_RM;
+#ifdef GPU_DIS_MOVEFA
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u(alt)=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, ALTERNATE_RM, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_move(void)
{
- Rn = Rm;
+#ifdef GPU_DIS_MOVE
+ if (doGPUDis)
+ WriteLog("%06X: MOVE R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ RN = RM;
+#ifdef GPU_DIS_MOVE
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_moveq(void)
{
- Rn = imm_1;
+#ifdef GPU_DIS_MOVEQ
+ if (doGPUDis)
+ WriteLog("%06X: MOVEQ #%u, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ RN = IMM_1;
+#ifdef GPU_DIS_MOVEQ
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_resmac(void)
{
- Rn = gpu_acc;
+ RN = gpu_acc;
}
+
static void gpu_opcode_imult(void)
{
- uint32 res=Rn=((int16)Rn)*((int16)Rm);
- set_flag_z(res);
- set_flag_n(res);
+#ifdef GPU_DIS_IMULT
+ if (doGPUDis)
+ WriteLog("%06X: IMULT R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ RN = (int16_t)RN * (int16_t)RM;
+ SET_ZN(RN);
+#ifdef GPU_DIS_IMULT
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_mult(void)
{
- uint32 res=Rn = ((uint16)Rm) * ((uint16)Rn);
- set_flag_z(res);
- set_flag_n(res);
+#ifdef GPU_DIS_MULT
+ if (doGPUDis)
+ WriteLog("%06X: MULT R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ RN = (uint16_t)RM * (uint16_t)RN;
+// RN = (RM & 0xFFFF) * (RN & 0xFFFF);
+ SET_ZN(RN);
+#ifdef GPU_DIS_MULT
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_bclr(void)
{
- uint32 _Rm=imm_1;
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* int dreg = jaguar.op & 31;
- UINT32 r1 = (jaguar.op >> 5) & 31;
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r2 & ~(1 << r1);
- jaguar.r[dreg] = res;
- CLR_ZN; SET_ZN(res);*/
- UINT32 res = Rn & ~(1 << imm_1);
- Rn = res;
- CLR_ZN; SET_ZN(res);
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "btrl %1, %2 \n\
- cmpl $0, %2 \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "c"(_Rm), "a"(_Rn));
-
-#else
-
- asm(
- "btrl %1, %2 \n\
- cmpl $0, %2 \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "c"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov eax,_Rn
- mov ecx,_Rm
- btr eax,ecx
- cmp eax,0
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
+#ifdef GPU_DIS_BCLR
+ if (doGPUDis)
+ WriteLog("%06X: BCLR #%u, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ uint32_t res = RN & ~(1 << IMM_1);
+ RN = res;
+ SET_ZN(res);
+#ifdef GPU_DIS_BCLR
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
#endif
- Rn=res;
}
+
static void gpu_opcode_btst(void)
{
- uint32 _Rm=imm_1;
- uint32 _Rn=Rn;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* UINT32 r1 = (jaguar.op >> 5) & 31;
- UINT32 r2 = jaguar.r[jaguar.op & 31];
- CLR_Z; jaguar.FLAGS |= (~r2 >> r1) & 1;*/
- CLR_Z; gpu_flag_z = (~Rn >> imm_1) & 1;
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "bt %0, %1 \n\
- setnc _gpu_flag_z \n\
- "
- :
- : "c"(_Rm), "a"(_Rn));
-
-#else
-
- asm(
- "bt %0, %1 \n\
- setnc gpu_flag_z \n\
- "
- :
- : "c"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov eax,_Rn
- mov ecx,_Rm
- bt eax,ecx
- setnc [gpu_flag_z]
- };
+#ifdef GPU_DIS_BTST
+ if (doGPUDis)
+ WriteLog("%06X: BTST #%u, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ gpu_flag_z = (~RN >> IMM_1) & 1;
+#ifdef GPU_DIS_BTST
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
#endif
}
+
static void gpu_opcode_bset(void)
{
- uint32 _Rm=imm_1;
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* int dreg = jaguar.op & 31;
- UINT32 r1 = (jaguar.op >> 5) & 31;
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r2 | (1 << r1);
- jaguar.r[dreg] = res;
- CLR_ZN; SET_ZN(res);*/
- UINT32 res = Rn | (1 << imm_1);
- Rn = res;
- CLR_ZN; SET_ZN(res);
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "btsl %1, %2 \n\
- cmpl $0, %2 \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "c"(_Rm), "a"(_Rn));
-
-#else
-
- asm(
- "btsl %1, %2 \n\
- cmpl $0, %2 \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "c"(_Rm), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov eax,_Rn
- mov ecx,_Rm
- bts eax,ecx
- cmp eax,0
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
+#ifdef GPU_DIS_BSET
+ if (doGPUDis)
+ WriteLog("%06X: BSET #%u, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ uint32_t res = RN | (1 << IMM_1);
+ RN = res;
+ SET_ZN(res);
+#ifdef GPU_DIS_BSET
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
#endif
- Rn=res;
}
+
static void gpu_opcode_imacn(void)
{
- uint32 res = ((int16)Rm) * ((int16)(Rn));
+ uint32_t res = (int16_t)RM * (int16_t)(RN);
gpu_acc += res;
}
+
static void gpu_opcode_mtoi(void)
{
- uint32 _Rm=Rm;
- uint32 res=Rn=(((INT32)_Rm >> 8) & 0xff800000) | (_Rm & 0x007fffff);
- set_flag_z(res);
- set_flag_n(res);
+ uint32_t _RM = RM;
+ uint32_t res = RN = (((int32_t)_RM >> 8) & 0xFF800000) | (_RM & 0x007FFFFF);
+ SET_ZN(res);
}
+
static void gpu_opcode_normi(void)
{
- uint32 _Rm = Rm;
- uint32 res = 0;
+ uint32_t _RM = RM;
+ uint32_t res = 0;
- if (_Rm)
+ if (_RM)
{
- while ((_Rm & 0xFFC00000) == 0)
+ while ((_RM & 0xFFC00000) == 0)
{
- _Rm <<= 1;
+ _RM <<= 1;
res--;
}
- while ((_Rm & 0xFF800000) != 0)
+ while ((_RM & 0xFF800000) != 0)
{
- _Rm >>= 1;
+ _RM >>= 1;
res++;
}
}
- Rn = res;
- set_flag_z(res);
- set_flag_n(res);
+ RN = res;
+ SET_ZN(res);
}
static void gpu_opcode_mmult(void)
{
- int count = gpu_matrix_control & 0x0F;
- uint32 addr = gpu_pointer_to_matrix; // in the gpu ram
- int64 accum = 0;
- uint32 res;
+ int count = gpu_matrix_control & 0x0F; // Matrix width
+ uint32_t addr = gpu_pointer_to_matrix; // In the GPU's RAM
+ int64_t accum = 0;
+ uint32_t res;
- if (!(gpu_matrix_control & 0x10))
+ if (gpu_matrix_control & 0x10) // Column stepping
{
- for (int i = 0; i < count; i++)
- {
- int16 a;
- if (i&0x01)
- a=(int16)((gpu_alternate_reg[gpu_opcode_first_parameter + (i>>1)]>>16)&0xffff);
+ for(int i=0; i<count; i++)
+ {
+ int16_t a;
+ if (i & 0x01)
+ a = (int16_t)((gpu_alternate_reg[IMM_1 + (i >> 1)] >> 16) & 0xFFFF);
else
- a=(int16)(gpu_alternate_reg[gpu_opcode_first_parameter + (i>>1)]&0xffff);
+ a = (int16_t)(gpu_alternate_reg[IMM_1 + (i >> 1)] & 0xFFFF);
- int16 b=((int16)gpu_word_read(addr+2));
- accum += a*b;
- addr += 4;
+ int16_t b = ((int16_t)GPUReadWord(addr + 2, GPU));
+ accum += a * b;
+ addr += 4 * count;
}
}
- else
+ else // Row stepping
{
- for (int i = 0; i < count; i++)
+ for(int i=0; i<count; i++)
{
- int16 a;
- if (i&0x01)
- a=(int16)((gpu_alternate_reg[gpu_opcode_first_parameter + (i>>1)]>>16)&0xffff);
+ int16_t a;
+ if (i & 0x01)
+ a = (int16_t)((gpu_alternate_reg[IMM_1 + (i >> 1)] >> 16) & 0xFFFF);
else
- a=(int16)(gpu_alternate_reg[gpu_opcode_first_parameter + (i>>1)]&0xffff);
+ a = (int16_t)(gpu_alternate_reg[IMM_1 + (i >> 1)] & 0xFFFF);
- int16 b=((int16)gpu_word_read(addr+2));
- accum += a*b;
- addr += 4 * count;
+ int16_t b = ((int16_t)GPUReadWord(addr + 2, GPU));
+ accum += a * b;
+ addr += 4;
}
}
- Rn = res = (int32)accum;
- // carry flag to do
- set_flag_z(res);
- set_flag_n(res);
+ RN = res = (int32_t)accum;
+ // carry flag to do (out of the last add)
+ SET_ZN(res);
}
+
static void gpu_opcode_abs(void)
{
- uint32 _Rn=Rn;
- uint32 res;
-
- if (_Rn==0x80000000)
- {
- set_flag_n(1);
- }
+#ifdef GPU_DIS_ABS
+ if (doGPUDis)
+ WriteLog("%06X: ABS R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ gpu_flag_c = RN >> 31;
+ if (RN == 0x80000000)
+ //Is 0x80000000 a positive number? If so, then we need to set C to 0 as well!
+ gpu_flag_n = 1, gpu_flag_z = 0;
else
{
- gpu_flag_c = ((_Rn&0x80000000)>>31);
- res= Rn = (((int32)_Rn)<0) ? -_Rn : _Rn;
- reset_flag_n();
- set_flag_z(res);
+ if (gpu_flag_c)
+ RN = -RN;
+ gpu_flag_n = 0; SET_FLAG_Z(RN);
}
+#ifdef GPU_DIS_ABS
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
-static void gpu_opcode_div(void)
-{
- uint32 _Rm=Rm;
- uint32 _Rn=Rn;
- if (_Rm)
+static void gpu_opcode_div(void) // RN / RM
+{
+#ifdef GPU_DIS_DIV
+ if (doGPUDis)
+ WriteLog("%06X: DIV R%02u, R%02u (%s) [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, (gpu_div_control & 0x01 ? "16.16" : "32"), gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+// NOTE: remainder is NOT calculated correctly here!
+// The original tried to get it right by checking to see if the
+// remainder was negative, but that's too late...
+// The code there should do it now, but I'm not 100% sure...
+// [Now it should be correct, but not displaying correct behavior of the actual
+// hardware. A step in the right direction.]
+
+ if (RM)
{
- if (gpu_div_control & 1)
+ if (gpu_div_control & 0x01) // 16.16 division
{
- gpu_remain = (((uint64)_Rn) << 16) % _Rm;
- if (gpu_remain&0x80000000)
- gpu_remain-=_Rm;
- Rn = (((uint64)_Rn) << 16) / _Rm;
+ gpu_remain = ((uint64_t)RN << 16) % RM;
+ RN = ((uint64_t)RN << 16) / RM;
}
else
{
- gpu_remain = _Rn % _Rm;
- if (gpu_remain&0x80000000)
- gpu_remain-=_Rm;
- Rn/=_Rm;
+ // We calculate the remainder first because we destroy RN after
+ // this by assigning it to itself.
+ gpu_remain = RN % RM;
+ RN = RN / RM;
}
+
+// What we really should do here is figure out why this condition
+// happens in the real divide unit and emulate *that* behavior.
+#if 0
+ if ((gpu_remain - RM) & 0x80000000) // If the result would have been negative...
+ gpu_remain -= RM; // Then make it negative!
+#endif
}
else
- Rn=0xffffffff;
+ RN = 0xFFFFFFFF;
+
+#ifdef GPU_DIS_DIV
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] Remainder: %08X\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN, gpu_remain);
+#endif
}
+
static void gpu_opcode_imultn(void)
{
- uint32 res = (int32)((int16)Rn * (int16)Rm);
- gpu_acc = (int32)res;
- set_flag_z(res);
- set_flag_n(res);
+ uint32_t res = (int32_t)((int16_t)RN * (int16_t)RM);
+ gpu_acc = (int32_t)res;
+ SET_FLAG_Z(res);
+ SET_FLAG_N(res);
}
+
static void gpu_opcode_neg(void)
{
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-{
-/* int dreg = jaguar.op & 31;
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = -r2;
- jaguar.r[dreg] = res;
- CLR_ZNC; SET_ZNC_SUB(0,r2,res);*/
- UINT32 res = -Rn;
- CLR_ZNC; SET_ZNC_SUB(0, Rn, res);
- Rn = res;
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "subl %1, %2 \n\
- setc _gpu_flag_c \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rn), "a"(0));
-
-#else
-
- asm(
- "subl %1, %2 \n\
- setc gpu_flag_c \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "d"(_Rn), "a"(0));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- xor eax,eax
- mov edx,_Rn
- sub eax,edx
- setc [gpu_flag_c]
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- };
+#ifdef GPU_DIS_NEG
+ if (doGPUDis)
+ WriteLog("%06X: NEG R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ uint32_t res = -RN;
+ SET_ZNC_SUB(0, RN, res);
+ RN = res;
+#ifdef GPU_DIS_NEG
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
#endif
- Rn=res;
}
+
static void gpu_opcode_shlq(void)
{
- uint32 shift=(32-gpu_convert_zero[imm_1]);
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-/* int dreg = jaguar.op & 31;
- INT32 r1 = convert_zero[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r2 << (32 - r1);
- jaguar.r[dreg] = res;
- CLR_ZNC; SET_ZN(res); jaguar.FLAGS |= (r2 >> 30) & 2;*/
-{
- INT32 r1 = gpu_convert_zero[imm_1];
- UINT32 res = Rn << (32 - r1);
- CLR_ZNC; SET_ZN(res); gpu_flag_c = (Rn >> 31) & 1;
- Rn = res;
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "testl $0x80000000, %2 \n\
- setnz _gpu_flag_c \n\
- shl %%cl, %2 \n\
- cmpl $0, %2 \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "c"(shift), "a"(_Rn));
-
-#else
-
- asm(
- "testl $0x80000000, %2 \n\
- setnz gpu_flag_c \n\
- shl %%cl, %2 \n\
- cmpl $0, %2 \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "c"(shift), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov ecx,shift
- mov eax,_Rn
- test eax,0x80000000
- setnz [gpu_flag_c]
- shl eax,cl
- cmp eax,0
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- }
+#ifdef GPU_DIS_SHLQ
+ if (doGPUDis)
+ WriteLog("%06X: SHLQ #%u, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, 32 - IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+// Was a bug here...
+// (Look at Aaron's code: If r1 = 32, then 32 - 32 = 0 which is wrong!)
+ int32_t r1 = 32 - IMM_1;
+ uint32_t res = RN << r1;
+ SET_ZN(res); gpu_flag_c = (RN >> 31) & 1;
+ RN = res;
+#ifdef GPU_DIS_SHLQ
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
#endif
- Rn=res;
}
+
static void gpu_opcode_shrq(void)
{
- uint32 shift=gpu_convert_zero[imm_1];
- uint32 _Rn=Rn;
-
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-/* int dreg = jaguar.op & 31;
- INT32 r1 = convert_zero[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = r2 >> r1;
- jaguar.r[dreg] = res;
- CLR_ZNC; SET_ZN(res); jaguar.FLAGS |= (r2 << 1) & 2;*/
-{
- INT32 r1 = gpu_convert_zero[imm_1];
- UINT32 res = Rn >> r1;
- CLR_ZNC; SET_ZN(res); gpu_flag_c = Rn & 1;
- Rn = res;
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "testl $0x00000001, %2 \n\
- setnz _gpu_flag_c \n\
- shr %%cl, %2 \n\
- cmpl $0, %2 \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "c"(shift), "a"(_Rn));
-
-#else
-
- asm(
- "testl $0x00000001, %2 \n\
- setnz gpu_flag_c \n\
- shr %%cl, %2 \n\
- cmpl $0, %2 \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "c"(shift), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov ecx,shift
- mov eax,_Rn
- test eax,0x00000001
- setnz [gpu_flag_c]
- shr eax,cl
- cmp eax,0
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- }
+#ifdef GPU_DIS_SHRQ
+ if (doGPUDis)
+ WriteLog("%06X: SHRQ #%u, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, gpu_convert_zero[IMM_1], IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ int32_t r1 = gpu_convert_zero[IMM_1];
+ uint32_t res = RN >> r1;
+ SET_ZN(res); gpu_flag_c = RN & 1;
+ RN = res;
+#ifdef GPU_DIS_SHRQ
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
#endif
- Rn=res;
}
+
static void gpu_opcode_ror(void)
{
- uint32 shift=Rm;
- uint32 _Rn=Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-//#ifndef __PORT__ // For testing...
-/* int dreg = jaguar.op & 31;
- UINT32 r1 = jaguar.r[(jaguar.op >> 5) & 31] & 31;
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = (r2 >> r1) | (r2 << (32 - r1));
- jaguar.r[dreg] = res;
- CLR_ZNC; SET_ZN(res); jaguar.FLAGS |= (r2 >> 30) & 2;*/
-{
- UINT32 r1 = Rm & 0x1F;
- UINT32 res = (Rn >> r1) | (Rn << (32 - r1));
- CLR_ZNC; SET_ZN(res); gpu_flag_c = (Rn >> 31) & 1;
- Rn = res;
- return;
-}
-#else
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "testl $0x80000000, %2 \n\
- setnz _gpu_flag_c \n\
- ror %%cl, %2 \n\
- cmpl $0, %2 \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "c"(shift), "a"(_Rn));
-
-#else
-
- asm(
- "testl $0x80000000, %2 \n\
- setnz gpu_flag_c \n\
- ror %%cl, %2 \n\
- cmpl $0, %2 \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "c"(shift), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
-
-#else
- __asm
- {
- mov ecx,shift
- mov eax,_Rn
- test eax,0x80000000
- setnz [gpu_flag_c]
- ror eax,cl
- cmp eax,0
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
- }
+#ifdef GPU_DIS_ROR
+ if (doGPUDis)
+ WriteLog("%06X: ROR R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ uint32_t r1 = RM & 0x1F;
+ uint32_t res = (RN >> r1) | (RN << (32 - r1));
+ SET_ZN(res); gpu_flag_c = (RN >> 31) & 1;
+ RN = res;
+#ifdef GPU_DIS_ROR
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
#endif
- Rn=res;
}
+
static void gpu_opcode_rorq(void)
{
- uint32 shift = gpu_convert_zero[imm_1 & 0x1F];
- uint32 _Rn = Rn;
- uint32 res;
-#ifdef __PORT__
-#ifndef USE_ASSEMBLY
-/* uint32 index = opcode >> 10;
- gpu_opcode_first_parameter = (opcode & 0x3E0) >> 5;
- gpu_opcode_second_parameter = (opcode & 0x1F);
- gpu_pc += 2;
- gpu_opcode[index]();
- cycles -= gpu_opcode_cycles[index];
- gpu_opcode_use[index]++;*/
+#ifdef GPU_DIS_RORQ
+ if (doGPUDis)
+ WriteLog("%06X: RORQ #%u, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, gpu_convert_zero[IMM_1], IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ uint32_t r1 = gpu_convert_zero[IMM_1 & 0x1F];
+ uint32_t r2 = RN;
+ uint32_t res = (r2 >> r1) | (r2 << (32 - r1));
+ RN = res;
+ SET_ZN(res); gpu_flag_c = (r2 >> 31) & 0x01;
+#ifdef GPU_DIS_RORQ
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+}
+
+static void gpu_opcode_sha(void)
+{
/* int dreg = jaguar.op & 31;
- UINT32 r1 = convert_zero[(jaguar.op >> 5) & 31];
- UINT32 r2 = jaguar.r[dreg];
- UINT32 res = (r2 >> r1) | (r2 << (32 - r1));
+ int32_t r1 = (int32_t)jaguar.r[(jaguar.op >> 5) & 31];
+ uint32_t r2 = jaguar.r[dreg];
+ uint32_t res;
+
+ CLR_ZNC;
+ if (r1 < 0)
+ {
+ res = (r1 <= -32) ? 0 : (r2 << -r1);
+ jaguar.FLAGS |= (r2 >> 30) & 2;
+ }
+ else
+ {
+ res = (r1 >= 32) ? ((int32_t)r2 >> 31) : ((int32_t)r2 >> r1);
+ jaguar.FLAGS |= (r2 << 1) & 2;
+ }
jaguar.r[dreg] = res;
- CLR_ZNC; SET_ZN(res); jaguar.FLAGS |= (r2 >> 30) & 2;*/
-{
- UINT32 r1 = gpu_convert_zero[imm_1 & 0x1F];
- UINT32 r2 = Rn;
- UINT32 res = (r2 >> r1) | (r2 << (32 - r1));
- Rn = res;
- CLR_ZNC; SET_ZN(res); gpu_flag_c = (r2 >> 31) & 0x01;
- return;
-}
-#else
+ SET_ZN(res);*/
- /*
- GCC on WIN32 (more importantly mingw) doesn't know the declared
- variables in asm until we put a _ before it.
-
- So the declaration dsp_flag_c needs to be _dsp_flag_c on mingw.
- */
-
-#ifdef __GCCWIN32__
-
- asm(
- "testl $0x80000000, %2 \n\
- setnz _gpu_flag_c \n\
- ror %%cl, %2 \n\
- cmpl $0, %2 \n\
- setz _gpu_flag_z \n\
- sets _gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "c"(shift), "a"(_Rn));
-
-#else
-
- asm(
- "testl $0x80000000, %2 \n\
- setnz gpu_flag_c \n\
- ror %%cl, %2 \n\
- cmpl $0, %2 \n\
- setz gpu_flag_z \n\
- sets gpu_flag_n \n\
- movl %%eax, %0 \n\
- "
- : "=m"(res)
- : "c"(shift), "a"(_Rn));
-
-#endif // #ifdef __GCCWIN32__
-#endif // #ifndef USE_ASSEMBLY
+#ifdef GPU_DIS_SHA
+ if (doGPUDis)
+ WriteLog("%06X: SHA R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ uint32_t res;
-#else
- __asm
+ if ((int32_t)RM < 0)
{
- mov ecx,shift
- mov eax,_Rn
- test eax,0x80000000
- setnz [gpu_flag_c]
- ror eax,cl
- cmp eax,0
- setz [gpu_flag_z]
- sets [gpu_flag_n]
- mov res,eax
+ res = ((int32_t)RM <= -32) ? 0 : (RN << -(int32_t)RM);
+ gpu_flag_c = RN >> 31;
}
-#endif // #ifdef __PORT__
- Rn = res;
-}
+ else
+ {
+ res = ((int32_t)RM >= 32) ? ((int32_t)RN >> 31) : ((int32_t)RN >> (int32_t)RM);
+ gpu_flag_c = RN & 0x01;
+ }
+ RN = res;
+ SET_ZN(res);
+#ifdef GPU_DIS_SHA
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
-static void gpu_opcode_sha(void)
-{
- int32 sRm=(int32)Rm;
- uint32 _Rn=Rn;
+/* int32_t sRM=(int32_t)RM;
+ uint32_t _RN=RN;
- if (sRm<0)
+ if (sRM<0)
{
- uint32 shift=-sRm;
+ uint32_t shift=-sRM;
if (shift>=32) shift=32;
- gpu_flag_c=(_Rn&0x80000000)>>31;
+ gpu_flag_c=(_RN&0x80000000)>>31;
while (shift)
{
- _Rn<<=1;
+ _RN<<=1;
shift--;
}
}
else
{
- uint32 shift=sRm;
+ uint32_t shift=sRM;
if (shift>=32) shift=32;
- gpu_flag_c=_Rn&0x1;
+ gpu_flag_c=_RN&0x1;
while (shift)
{
- _Rn=((int32)_Rn)>>1;
+ _RN=((int32_t)_RN)>>1;
shift--;
}
}
- Rn=_Rn;
- set_flag_z(_Rn);
- set_flag_n(_Rn);
+ RN=_RN;
+ SET_FLAG_Z(_RN);
+ SET_FLAG_N(_RN);*/
}
+
static void gpu_opcode_sharq(void)
{
- uint32 shift=gpu_convert_zero[imm_1];
- uint32 _Rn=Rn;
-
- gpu_flag_c = (_Rn & 0x1);
- while (shift)
- {
- _Rn=((int32)_Rn)>>1;
- shift--;
- }
- Rn=_Rn;
- set_flag_z(_Rn);
- set_flag_n(_Rn);
+#ifdef GPU_DIS_SHARQ
+ if (doGPUDis)
+ WriteLog("%06X: SHARQ #%u, R%02u [NCZ:%u%u%u, R%02u=%08X] -> ", gpu_pc-2, gpu_convert_zero[IMM_1], IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
+ uint32_t res = (int32_t)RN >> gpu_convert_zero[IMM_1];
+ SET_ZN(res); gpu_flag_c = RN & 0x01;
+ RN = res;
+#ifdef GPU_DIS_SHARQ
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_2, RN);
+#endif
}
+
static void gpu_opcode_sh(void)
{
- int32 sRm=(int32)Rm;
- uint32 _Rn=Rn;
-
- if (sRm<0)
+#ifdef GPU_DIS_SH
+ if (doGPUDis)
+ WriteLog("%06X: SH R%02u, R%02u [NCZ:%u%u%u, R%02u=%08X, R%02u=%08X] -> ", gpu_pc-2, IMM_1, IMM_2, gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
+ if (RM & 0x80000000) // Shift left
{
- uint32 shift=(-sRm);
- if (shift>=32) shift=32;
- gpu_flag_c=(_Rn&0x80000000)>>31;
- while (shift)
- {
- _Rn<<=1;
- shift--;
- }
+ gpu_flag_c = RN >> 31;
+ RN = ((int32_t)RM <= -32 ? 0 : RN << -(int32_t)RM);
}
- else
+ else // Shift right
{
- uint32 shift=sRm;
- if (shift>=32) shift=32;
- gpu_flag_c=_Rn&0x1;
- while (shift)
- {
- _Rn>>=1;
- shift--;
- }
+ gpu_flag_c = RN & 0x01;
+ RN = (RM >= 32 ? 0 : RN >> RM);
}
- Rn=_Rn;
- set_flag_z(_Rn);
- set_flag_n(_Rn);
+ SET_ZN(RN);
+#ifdef GPU_DIS_SH
+ if (doGPUDis)
+ WriteLog("[NCZ:%u%u%u, R%02u=%08X, R%02u=%08X]\n", gpu_flag_n, gpu_flag_c, gpu_flag_z, IMM_1, RM, IMM_2, RN);
+#endif
}
+
+
+//Temporary: Testing only!
+//#include "gpu2.cpp"
+//#include "gpu3.cpp"
+
+#else
+
+
+// New thread-safe GPU core
+
+int GPUCore(void * data)
+{
+}
+
+#endif
+