Search
lxdream.org :: lxdream/src/sh4/sh4core.in
lxdream 0.9.1
released Jun 29
Download Now
filename src/sh4/sh4core.in
changeset 374:8f80a795513e
prev369:4b4223e7d720
next378:f10fbdd4e24b
author nkeynes
date Tue Sep 11 02:14:46 2007 +0000 (16 years ago)
permissions -rw-r--r--
last change Cache the pointer to the last FR bank (speeds fp ops up by about 10%)
Implement experimental fix for FLOAT/FTRC
Make read/write sr functions non-static (share with translator)
Much more translator WIP
file annotate diff log raw
nkeynes@359
     1
/**
nkeynes@374
     2
 * $Id: sh4core.in,v 1.4 2007-09-11 02:14:46 nkeynes Exp $
nkeynes@359
     3
 * 
nkeynes@359
     4
 * SH4 emulation core, and parent module for all the SH4 peripheral
nkeynes@359
     5
 * modules.
nkeynes@359
     6
 *
nkeynes@359
     7
 * Copyright (c) 2005 Nathan Keynes.
nkeynes@359
     8
 *
nkeynes@359
     9
 * This program is free software; you can redistribute it and/or modify
nkeynes@359
    10
 * it under the terms of the GNU General Public License as published by
nkeynes@359
    11
 * the Free Software Foundation; either version 2 of the License, or
nkeynes@359
    12
 * (at your option) any later version.
nkeynes@359
    13
 *
nkeynes@359
    14
 * This program is distributed in the hope that it will be useful,
nkeynes@359
    15
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
nkeynes@359
    16
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
nkeynes@359
    17
 * GNU General Public License for more details.
nkeynes@359
    18
 */
nkeynes@359
    19
nkeynes@359
    20
#define MODULE sh4_module
nkeynes@359
    21
#include <math.h>
nkeynes@359
    22
#include "dream.h"
nkeynes@359
    23
#include "sh4/sh4core.h"
nkeynes@359
    24
#include "sh4/sh4mmio.h"
nkeynes@359
    25
#include "sh4/intc.h"
nkeynes@359
    26
#include "mem.h"
nkeynes@359
    27
#include "clock.h"
nkeynes@359
    28
#include "syscall.h"
nkeynes@359
    29
nkeynes@359
    30
#define SH4_CALLTRACE 1
nkeynes@359
    31
nkeynes@359
    32
#define MAX_INT 0x7FFFFFFF
nkeynes@359
    33
#define MIN_INT 0x80000000
nkeynes@359
    34
#define MAX_INTF 2147483647.0
nkeynes@359
    35
#define MIN_INTF -2147483648.0
nkeynes@359
    36
nkeynes@359
    37
#define EXV_EXCEPTION    0x100  /* General exception vector */
nkeynes@359
    38
#define EXV_TLBMISS      0x400  /* TLB-miss exception vector */
nkeynes@359
    39
#define EXV_INTERRUPT    0x600  /* External interrupt vector */
nkeynes@359
    40
nkeynes@359
    41
/********************** SH4 Module Definition ****************************/
nkeynes@359
    42
nkeynes@359
    43
void sh4_init( void );
nkeynes@359
    44
void sh4_reset( void );
nkeynes@359
    45
uint32_t sh4_run_slice( uint32_t );
nkeynes@359
    46
void sh4_start( void );
nkeynes@359
    47
void sh4_stop( void );
nkeynes@359
    48
void sh4_save_state( FILE *f );
nkeynes@359
    49
int sh4_load_state( FILE *f );
nkeynes@359
    50
void sh4_accept_interrupt( void );
nkeynes@359
    51
nkeynes@359
    52
struct dreamcast_module sh4_module = { "SH4", sh4_init, sh4_reset, 
nkeynes@359
    53
				       NULL, sh4_run_slice, sh4_stop,
nkeynes@359
    54
				       sh4_save_state, sh4_load_state };
nkeynes@359
    55
nkeynes@359
    56
struct sh4_registers sh4r;
nkeynes@359
    57
nkeynes@359
    58
void sh4_init(void)
nkeynes@359
    59
{
nkeynes@359
    60
    register_io_regions( mmio_list_sh4mmio );
nkeynes@359
    61
    MMU_init();
nkeynes@359
    62
    sh4_reset();
nkeynes@359
    63
}
nkeynes@359
    64
nkeynes@359
    65
void sh4_reset(void)
nkeynes@359
    66
{
nkeynes@359
    67
    /* zero everything out, for the sake of having a consistent state. */
nkeynes@359
    68
    memset( &sh4r, 0, sizeof(sh4r) );
nkeynes@359
    69
nkeynes@359
    70
    /* Resume running if we were halted */
nkeynes@359
    71
    sh4r.sh4_state = SH4_STATE_RUNNING;
nkeynes@359
    72
nkeynes@359
    73
    sh4r.pc    = 0xA0000000;
nkeynes@359
    74
    sh4r.new_pc= 0xA0000002;
nkeynes@359
    75
    sh4r.vbr   = 0x00000000;
nkeynes@359
    76
    sh4r.fpscr = 0x00040001;
nkeynes@359
    77
    sh4r.sr    = 0x700000F0;
nkeynes@374
    78
    sh4r.fr_bank = &sh4r.fr[0][0];
nkeynes@359
    79
nkeynes@359
    80
    /* Mem reset will do this, but if we want to reset _just_ the SH4... */
nkeynes@359
    81
    MMIO_WRITE( MMU, EXPEVT, EXC_POWER_RESET );
nkeynes@359
    82
nkeynes@359
    83
    /* Peripheral modules */
nkeynes@359
    84
    CPG_reset();
nkeynes@359
    85
    INTC_reset();
nkeynes@359
    86
    MMU_reset();
nkeynes@359
    87
    TMU_reset();
nkeynes@359
    88
    SCIF_reset();
nkeynes@359
    89
}
nkeynes@359
    90
nkeynes@359
    91
static struct breakpoint_struct sh4_breakpoints[MAX_BREAKPOINTS];
nkeynes@359
    92
static int sh4_breakpoint_count = 0;
nkeynes@359
    93
static uint16_t *sh4_icache = NULL;
nkeynes@359
    94
static uint32_t sh4_icache_addr = 0;
nkeynes@359
    95
nkeynes@359
    96
void sh4_set_breakpoint( uint32_t pc, int type )
nkeynes@359
    97
{
nkeynes@359
    98
    sh4_breakpoints[sh4_breakpoint_count].address = pc;
nkeynes@359
    99
    sh4_breakpoints[sh4_breakpoint_count].type = type;
nkeynes@359
   100
    sh4_breakpoint_count++;
nkeynes@359
   101
}
nkeynes@359
   102
nkeynes@359
   103
gboolean sh4_clear_breakpoint( uint32_t pc, int type )
nkeynes@359
   104
{
nkeynes@359
   105
    int i;
nkeynes@359
   106
nkeynes@359
   107
    for( i=0; i<sh4_breakpoint_count; i++ ) {
nkeynes@359
   108
	if( sh4_breakpoints[i].address == pc && 
nkeynes@359
   109
	    sh4_breakpoints[i].type == type ) {
nkeynes@359
   110
	    while( ++i < sh4_breakpoint_count ) {
nkeynes@359
   111
		sh4_breakpoints[i-1].address = sh4_breakpoints[i].address;
nkeynes@359
   112
		sh4_breakpoints[i-1].type = sh4_breakpoints[i].type;
nkeynes@359
   113
	    }
nkeynes@359
   114
	    sh4_breakpoint_count--;
nkeynes@359
   115
	    return TRUE;
nkeynes@359
   116
	}
nkeynes@359
   117
    }
nkeynes@359
   118
    return FALSE;
nkeynes@359
   119
}
nkeynes@359
   120
nkeynes@359
   121
int sh4_get_breakpoint( uint32_t pc )
nkeynes@359
   122
{
nkeynes@359
   123
    int i;
nkeynes@359
   124
    for( i=0; i<sh4_breakpoint_count; i++ ) {
nkeynes@359
   125
	if( sh4_breakpoints[i].address == pc )
nkeynes@359
   126
	    return sh4_breakpoints[i].type;
nkeynes@359
   127
    }
nkeynes@359
   128
    return 0;
nkeynes@359
   129
}
nkeynes@359
   130
nkeynes@359
   131
uint32_t sh4_run_slice( uint32_t nanosecs ) 
nkeynes@359
   132
{
nkeynes@359
   133
    int i;
nkeynes@359
   134
    sh4r.slice_cycle = 0;
nkeynes@359
   135
nkeynes@359
   136
    if( sh4r.sh4_state != SH4_STATE_RUNNING ) {
nkeynes@359
   137
	if( sh4r.event_pending < nanosecs ) {
nkeynes@359
   138
	    sh4r.sh4_state = SH4_STATE_RUNNING;
nkeynes@359
   139
	    sh4r.slice_cycle = sh4r.event_pending;
nkeynes@359
   140
	}
nkeynes@359
   141
    }
nkeynes@359
   142
nkeynes@359
   143
    if( sh4_breakpoint_count == 0 ) {
nkeynes@359
   144
	for( ; sh4r.slice_cycle < nanosecs; sh4r.slice_cycle += sh4_cpu_period ) {
nkeynes@359
   145
	    if( SH4_EVENT_PENDING() ) {
nkeynes@359
   146
		if( sh4r.event_types & PENDING_EVENT ) {
nkeynes@359
   147
		    event_execute();
nkeynes@359
   148
		}
nkeynes@359
   149
		/* Eventq execute may (quite likely) deliver an immediate IRQ */
nkeynes@359
   150
		if( sh4r.event_types & PENDING_IRQ ) {
nkeynes@359
   151
		    sh4_accept_interrupt();
nkeynes@359
   152
		}
nkeynes@359
   153
	    }
nkeynes@359
   154
	    if( !sh4_execute_instruction() ) {
nkeynes@359
   155
		break;
nkeynes@359
   156
	    }
nkeynes@359
   157
	}
nkeynes@359
   158
    } else {
nkeynes@359
   159
	for( ;sh4r.slice_cycle < nanosecs; sh4r.slice_cycle += sh4_cpu_period ) {
nkeynes@359
   160
	    if( SH4_EVENT_PENDING() ) {
nkeynes@359
   161
		if( sh4r.event_types & PENDING_EVENT ) {
nkeynes@359
   162
		    event_execute();
nkeynes@359
   163
		}
nkeynes@359
   164
		/* Eventq execute may (quite likely) deliver an immediate IRQ */
nkeynes@359
   165
		if( sh4r.event_types & PENDING_IRQ ) {
nkeynes@359
   166
		    sh4_accept_interrupt();
nkeynes@359
   167
		}
nkeynes@359
   168
	    }
nkeynes@359
   169
                 
nkeynes@359
   170
	    if( !sh4_execute_instruction() )
nkeynes@359
   171
		break;
nkeynes@359
   172
#ifdef ENABLE_DEBUG_MODE
nkeynes@359
   173
	    for( i=0; i<sh4_breakpoint_count; i++ ) {
nkeynes@359
   174
		if( sh4_breakpoints[i].address == sh4r.pc ) {
nkeynes@359
   175
		    break;
nkeynes@359
   176
		}
nkeynes@359
   177
	    }
nkeynes@359
   178
	    if( i != sh4_breakpoint_count ) {
nkeynes@359
   179
		dreamcast_stop();
nkeynes@359
   180
		if( sh4_breakpoints[i].type == BREAK_ONESHOT )
nkeynes@359
   181
		    sh4_clear_breakpoint( sh4r.pc, BREAK_ONESHOT );
nkeynes@359
   182
		break;
nkeynes@359
   183
	    }
nkeynes@359
   184
#endif	
nkeynes@359
   185
	}
nkeynes@359
   186
    }
nkeynes@359
   187
nkeynes@359
   188
    /* If we aborted early, but the cpu is still technically running,
nkeynes@359
   189
     * we're doing a hard abort - cut the timeslice back to what we
nkeynes@359
   190
     * actually executed
nkeynes@359
   191
     */
nkeynes@359
   192
    if( sh4r.slice_cycle != nanosecs && sh4r.sh4_state == SH4_STATE_RUNNING ) {
nkeynes@359
   193
	nanosecs = sh4r.slice_cycle;
nkeynes@359
   194
    }
nkeynes@359
   195
    if( sh4r.sh4_state != SH4_STATE_STANDBY ) {
nkeynes@359
   196
	TMU_run_slice( nanosecs );
nkeynes@359
   197
	SCIF_run_slice( nanosecs );
nkeynes@359
   198
    }
nkeynes@359
   199
    return nanosecs;
nkeynes@359
   200
}
nkeynes@359
   201
nkeynes@359
   202
/**
 * Module stop hook (installed in sh4_module). The SH4 core has nothing
 * to do when the machine is stopped, so this is intentionally empty.
 */
void sh4_stop( void )
{
    /* nothing to do */
}
nkeynes@359
   206
nkeynes@359
   207
void sh4_save_state( FILE *f )
nkeynes@359
   208
{
nkeynes@359
   209
    fwrite( &sh4r, sizeof(sh4r), 1, f );
nkeynes@359
   210
    MMU_save_state( f );
nkeynes@359
   211
    INTC_save_state( f );
nkeynes@359
   212
    TMU_save_state( f );
nkeynes@359
   213
    SCIF_save_state( f );
nkeynes@359
   214
}
nkeynes@359
   215
nkeynes@359
   216
int sh4_load_state( FILE * f )
nkeynes@359
   217
{
nkeynes@359
   218
    fread( &sh4r, sizeof(sh4r), 1, f );
nkeynes@359
   219
    MMU_load_state( f );
nkeynes@359
   220
    INTC_load_state( f );
nkeynes@359
   221
    TMU_load_state( f );
nkeynes@359
   222
    return SCIF_load_state( f );
nkeynes@359
   223
}
nkeynes@359
   224
nkeynes@359
   225
/********************** SH4 emulation core  ****************************/
nkeynes@359
   226
nkeynes@359
   227
void sh4_set_pc( int pc )
nkeynes@359
   228
{
nkeynes@359
   229
    sh4r.pc = pc;
nkeynes@359
   230
    sh4r.new_pc = pc+2;
nkeynes@359
   231
}
nkeynes@359
   232
nkeynes@359
   233
#define UNDEF(ir) return sh4_raise_slot_exception(EXC_ILLEGAL, EXC_SLOT_ILLEGAL)
nkeynes@359
   234
#define UNIMP(ir) do{ ERROR( "Halted on unimplemented instruction at %08x, opcode = %04x", sh4r.pc, ir ); dreamcast_stop(); return FALSE; }while(0)
nkeynes@359
   235
nkeynes@359
   236
#if(SH4_CALLTRACE == 1)
nkeynes@359
   237
#define MAX_CALLSTACK 32
nkeynes@359
   238
static struct call_stack {
nkeynes@359
   239
    sh4addr_t call_addr;
nkeynes@359
   240
    sh4addr_t target_addr;
nkeynes@359
   241
    sh4addr_t stack_pointer;
nkeynes@359
   242
} call_stack[MAX_CALLSTACK];
nkeynes@359
   243
nkeynes@359
   244
static int call_stack_depth = 0;
nkeynes@359
   245
int sh4_call_trace_on = 0;
nkeynes@359
   246
nkeynes@359
   247
/**
 * Record a subroutine call on the call-trace stack.
 *
 * Only the first MAX_CALLSTACK levels are stored. Deeper calls still
 * increase call_stack_depth, so matching returns unwind correctly, but
 * their details are not kept.
 *
 * @param source address the call was made from
 * @param dest   address being called
 */
static inline void trace_call( sh4addr_t source, sh4addr_t dest ) 
{
    if( call_stack_depth < MAX_CALLSTACK ) {
	call_stack[call_stack_depth].call_addr = source;
	call_stack[call_stack_depth].target_addr = dest;
	call_stack[call_stack_depth].stack_pointer = sh4r.r[15];
    }
    call_stack_depth++;
}
nkeynes@359
   256
nkeynes@359
   257
/**
 * Record a subroutine return by popping one level off the call-trace
 * stack. A return with nothing on the stack is ignored, so the depth
 * never goes negative.
 *
 * @param source address the return was made from (currently unused)
 * @param dest   address being returned to (currently unused)
 */
static inline void trace_return( sh4addr_t source, sh4addr_t dest )
{
    if( call_stack_depth > 0 ) {
	call_stack_depth--;
    }
}
nkeynes@359
   263
nkeynes@359
   264
void fprint_stack_trace( FILE *f )
nkeynes@359
   265
{
nkeynes@359
   266
    int i = call_stack_depth -1;
nkeynes@359
   267
    if( i >= MAX_CALLSTACK )
nkeynes@359
   268
	i = MAX_CALLSTACK - 1;
nkeynes@359
   269
    for( ; i >= 0; i-- ) {
nkeynes@359
   270
	fprintf( f, "%d. Call from %08X => %08X, SP=%08X\n", 
nkeynes@359
   271
		 (call_stack_depth - i), call_stack[i].call_addr,
nkeynes@359
   272
		 call_stack[i].target_addr, call_stack[i].stack_pointer );
nkeynes@359
   273
    }
nkeynes@359
   274
}
nkeynes@359
   275
nkeynes@359
   276
#define TRACE_CALL( source, dest ) trace_call(source, dest)
nkeynes@359
   277
#define TRACE_RETURN( source, dest ) trace_return(source, dest)
nkeynes@359
   278
#else
nkeynes@359
   279
#define TRACE_CALL( dest, rts ) 
nkeynes@359
   280
#define TRACE_RETURN( source, dest )
nkeynes@359
   281
#endif
nkeynes@359
   282
nkeynes@359
   283
#define RAISE( x, v ) do{			\
nkeynes@359
   284
    if( sh4r.vbr == 0 ) { \
nkeynes@359
   285
        ERROR( "%08X: VBR not initialized while raising exception %03X, halting", sh4r.pc, x ); \
nkeynes@359
   286
        dreamcast_stop(); return FALSE;	\
nkeynes@359
   287
    } else { \
nkeynes@359
   288
        sh4r.spc = sh4r.pc;	\
nkeynes@359
   289
        sh4r.ssr = sh4_read_sr(); \
nkeynes@359
   290
        sh4r.sgr = sh4r.r[15]; \
nkeynes@359
   291
        MMIO_WRITE(MMU,EXPEVT,x); \
nkeynes@359
   292
        sh4r.pc = sh4r.vbr + v; \
nkeynes@359
   293
        sh4r.new_pc = sh4r.pc + 2; \
nkeynes@374
   294
        sh4_write_sr( sh4r.ssr |SR_MD|SR_BL|SR_RB ); \
nkeynes@359
   295
	if( sh4r.in_delay_slot ) { \
nkeynes@359
   296
	    sh4r.in_delay_slot = 0; \
nkeynes@359
   297
	    sh4r.spc -= 2; \
nkeynes@359
   298
	} \
nkeynes@359
   299
    } \
nkeynes@359
   300
    return TRUE; } while(0)
nkeynes@359
   301
nkeynes@359
   302
#define MEM_READ_BYTE( addr ) sh4_read_byte(addr)
nkeynes@359
   303
#define MEM_READ_WORD( addr ) sh4_read_word(addr)
nkeynes@359
   304
#define MEM_READ_LONG( addr ) sh4_read_long(addr)
nkeynes@359
   305
#define MEM_WRITE_BYTE( addr, val ) sh4_write_byte(addr, val)
nkeynes@359
   306
#define MEM_WRITE_WORD( addr, val ) sh4_write_word(addr, val)
nkeynes@359
   307
#define MEM_WRITE_LONG( addr, val ) sh4_write_long(addr, val)
nkeynes@359
   308
nkeynes@359
   309
#define FP_WIDTH (IS_FPU_DOUBLESIZE() ? 8 : 4)
nkeynes@359
   310
nkeynes@359
   311
#define MEM_FP_READ( addr, reg ) sh4_read_float( addr, reg );
nkeynes@359
   312
#define MEM_FP_WRITE( addr, reg ) sh4_write_float( addr, reg );
nkeynes@359
   313
nkeynes@359
   314
#define CHECKPRIV() if( !IS_SH4_PRIVMODE() ) return sh4_raise_slot_exception( EXC_ILLEGAL, EXC_SLOT_ILLEGAL )
nkeynes@367
   315
#define CHECKRALIGN16(addr) if( (addr)&0x01 ) return sh4_raise_exception( EXC_DATA_ADDR_READ )
nkeynes@367
   316
#define CHECKRALIGN32(addr) if( (addr)&0x03 ) return sh4_raise_exception( EXC_DATA_ADDR_READ )
nkeynes@367
   317
#define CHECKWALIGN16(addr) if( (addr)&0x01 ) return sh4_raise_exception( EXC_DATA_ADDR_WRITE )
nkeynes@367
   318
#define CHECKWALIGN32(addr) if( (addr)&0x03 ) return sh4_raise_exception( EXC_DATA_ADDR_WRITE )
nkeynes@359
   319
nkeynes@367
   320
#define CHECKFPUEN() if( !IS_FPU_ENABLED() ) { if( ir == 0xFFFD ) { UNDEF(ir); } else { return sh4_raise_slot_exception( EXC_FPU_DISABLED, EXC_SLOT_FPU_DISABLED ); } }
nkeynes@359
   321
#define CHECKDEST(p) if( (p) == 0 ) { ERROR( "%08X: Branch/jump to NULL, CPU halted", sh4r.pc ); dreamcast_stop(); return FALSE; }
nkeynes@359
   322
#define CHECKSLOTILLEGAL() if(sh4r.in_delay_slot) return sh4_raise_exception(EXC_SLOT_ILLEGAL)
nkeynes@359
   323
nkeynes@359
   324
static void sh4_switch_banks( )
nkeynes@359
   325
{
nkeynes@359
   326
    uint32_t tmp[8];
nkeynes@359
   327
nkeynes@359
   328
    memcpy( tmp, sh4r.r, sizeof(uint32_t)*8 );
nkeynes@359
   329
    memcpy( sh4r.r, sh4r.r_bank, sizeof(uint32_t)*8 );
nkeynes@359
   330
    memcpy( sh4r.r_bank, tmp, sizeof(uint32_t)*8 );
nkeynes@359
   331
}
nkeynes@359
   332
nkeynes@374
   333
void sh4_write_sr( uint32_t newval )
nkeynes@359
   334
{
nkeynes@359
   335
    if( (newval ^ sh4r.sr) & SR_RB )
nkeynes@359
   336
        sh4_switch_banks();
nkeynes@359
   337
    sh4r.sr = newval;
nkeynes@359
   338
    sh4r.t = (newval&SR_T) ? 1 : 0;
nkeynes@359
   339
    sh4r.s = (newval&SR_S) ? 1 : 0;
nkeynes@359
   340
    sh4r.m = (newval&SR_M) ? 1 : 0;
nkeynes@359
   341
    sh4r.q = (newval&SR_Q) ? 1 : 0;
nkeynes@359
   342
    intc_mask_changed();
nkeynes@359
   343
}
nkeynes@359
   344
nkeynes@359
   345
static void sh4_write_float( uint32_t addr, int reg )
nkeynes@359
   346
{
nkeynes@359
   347
    if( IS_FPU_DOUBLESIZE() ) {
nkeynes@359
   348
	if( reg & 1 ) {
nkeynes@359
   349
	    sh4_write_long( addr, *((uint32_t *)&XF((reg)&0x0E)) );
nkeynes@359
   350
	    sh4_write_long( addr+4, *((uint32_t *)&XF(reg)) );
nkeynes@359
   351
	} else {
nkeynes@359
   352
	    sh4_write_long( addr, *((uint32_t *)&FR(reg)) ); 
nkeynes@359
   353
	    sh4_write_long( addr+4, *((uint32_t *)&FR((reg)|0x01)) );
nkeynes@359
   354
	}
nkeynes@359
   355
    } else {
nkeynes@359
   356
	sh4_write_long( addr, *((uint32_t *)&FR((reg))) );
nkeynes@359
   357
    }
nkeynes@359
   358
}
nkeynes@359
   359
nkeynes@359
   360
static void sh4_read_float( uint32_t addr, int reg )
nkeynes@359
   361
{
nkeynes@359
   362
    if( IS_FPU_DOUBLESIZE() ) {
nkeynes@359
   363
	if( reg & 1 ) {
nkeynes@359
   364
	    *((uint32_t *)&XF((reg) & 0x0E)) = sh4_read_long(addr);
nkeynes@359
   365
	    *((uint32_t *)&XF(reg)) = sh4_read_long(addr+4);
nkeynes@359
   366
	} else {
nkeynes@359
   367
	    *((uint32_t *)&FR(reg)) = sh4_read_long(addr);
nkeynes@359
   368
	    *((uint32_t *)&FR((reg) | 0x01)) = sh4_read_long(addr+4);
nkeynes@359
   369
	}
nkeynes@359
   370
    } else {
nkeynes@359
   371
	*((uint32_t *)&FR(reg)) = sh4_read_long(addr);
nkeynes@359
   372
    }
nkeynes@359
   373
}
nkeynes@359
   374
nkeynes@374
   375
uint32_t sh4_read_sr( void )
nkeynes@359
   376
{
nkeynes@359
   377
    /* synchronize sh4r.sr with the various bitflags */
nkeynes@359
   378
    sh4r.sr &= SR_MQSTMASK;
nkeynes@359
   379
    if( sh4r.t ) sh4r.sr |= SR_T;
nkeynes@359
   380
    if( sh4r.s ) sh4r.sr |= SR_S;
nkeynes@359
   381
    if( sh4r.m ) sh4r.sr |= SR_M;
nkeynes@359
   382
    if( sh4r.q ) sh4r.sr |= SR_Q;
nkeynes@359
   383
    return sh4r.sr;
nkeynes@359
   384
}
nkeynes@359
   385
nkeynes@359
   386
/**
nkeynes@359
   387
 * Raise a general CPU exception for the specified exception code.
nkeynes@359
   388
 * (NOT for TRAPA or TLB exceptions)
nkeynes@359
   389
 */
nkeynes@359
   390
gboolean sh4_raise_exception( int code )
nkeynes@359
   391
{
nkeynes@359
   392
    RAISE( code, EXV_EXCEPTION );
nkeynes@359
   393
}
nkeynes@359
   394
nkeynes@359
   395
gboolean sh4_raise_slot_exception( int normal_code, int slot_code ) {
nkeynes@359
   396
    if( sh4r.in_delay_slot ) {
nkeynes@359
   397
	return sh4_raise_exception(slot_code);
nkeynes@359
   398
    } else {
nkeynes@359
   399
	return sh4_raise_exception(normal_code);
nkeynes@359
   400
    }
nkeynes@359
   401
}
nkeynes@359
   402
nkeynes@359
   403
gboolean sh4_raise_tlb_exception( int code )
nkeynes@359
   404
{
nkeynes@359
   405
    RAISE( code, EXV_TLBMISS );
nkeynes@359
   406
}
nkeynes@359
   407
nkeynes@359
   408
void sh4_accept_interrupt( void )
nkeynes@359
   409
{
nkeynes@359
   410
    uint32_t code = intc_accept_interrupt();
nkeynes@359
   411
    sh4r.ssr = sh4_read_sr();
nkeynes@359
   412
    sh4r.spc = sh4r.pc;
nkeynes@359
   413
    sh4r.sgr = sh4r.r[15];
nkeynes@374
   414
    sh4_write_sr( sh4r.ssr|SR_BL|SR_MD|SR_RB );
nkeynes@359
   415
    MMIO_WRITE( MMU, INTEVT, code );
nkeynes@359
   416
    sh4r.pc = sh4r.vbr + 0x600;
nkeynes@359
   417
    sh4r.new_pc = sh4r.pc + 2;
nkeynes@359
   418
    //    WARN( "Accepting interrupt %03X, from %08X => %08X", code, sh4r.spc, sh4r.pc );
nkeynes@359
   419
}
nkeynes@359
   420
nkeynes@359
   421
gboolean sh4_execute_instruction( void )
nkeynes@359
   422
{
nkeynes@359
   423
    uint32_t pc;
nkeynes@359
   424
    unsigned short ir;
nkeynes@359
   425
    uint32_t tmp;
nkeynes@359
   426
    float ftmp;
nkeynes@359
   427
    double dtmp;
nkeynes@359
   428
    
nkeynes@359
   429
#define R0 sh4r.r[0]
nkeynes@359
   430
    pc = sh4r.pc;
nkeynes@359
   431
    if( pc > 0xFFFFFF00 ) {
nkeynes@359
   432
	/* SYSCALL Magic */
nkeynes@359
   433
	syscall_invoke( pc );
nkeynes@359
   434
	sh4r.in_delay_slot = 0;
nkeynes@359
   435
	pc = sh4r.pc = sh4r.pr;
nkeynes@359
   436
	sh4r.new_pc = sh4r.pc + 2;
nkeynes@359
   437
    }
nkeynes@359
   438
    CHECKRALIGN16(pc);
nkeynes@359
   439
nkeynes@359
   440
    /* Read instruction */
nkeynes@359
   441
    uint32_t pageaddr = pc >> 12;
nkeynes@359
   442
    if( sh4_icache != NULL && pageaddr == sh4_icache_addr ) {
nkeynes@359
   443
	ir = sh4_icache[(pc&0xFFF)>>1];
nkeynes@359
   444
    } else {
nkeynes@359
   445
	sh4_icache = (uint16_t *)mem_get_page(pc);
nkeynes@359
   446
	if( ((uint32_t)sh4_icache) < MAX_IO_REGIONS ) {
nkeynes@359
   447
	    /* If someone's actually been so daft as to try to execute out of an IO
nkeynes@359
   448
	     * region, fallback on the full-blown memory read
nkeynes@359
   449
	     */
nkeynes@359
   450
	    sh4_icache = NULL;
nkeynes@359
   451
	    ir = MEM_READ_WORD(pc);
nkeynes@359
   452
	} else {
nkeynes@359
   453
	    sh4_icache_addr = pageaddr;
nkeynes@359
   454
	    ir = sh4_icache[(pc&0xFFF)>>1];
nkeynes@359
   455
	}
nkeynes@359
   456
    }
nkeynes@359
   457
%%
nkeynes@359
   458
AND Rm, Rn {: sh4r.r[Rn] &= sh4r.r[Rm]; :}
nkeynes@359
   459
AND #imm, R0 {: R0 &= imm; :}
nkeynes@359
   460
AND.B #imm, @(R0, GBR) {: MEM_WRITE_BYTE( R0 + sh4r.gbr, imm & MEM_READ_BYTE(R0 + sh4r.gbr) ); :}
nkeynes@359
   461
NOT Rm, Rn {: sh4r.r[Rn] = ~sh4r.r[Rm]; :}
nkeynes@359
   462
OR Rm, Rn {: sh4r.r[Rn] |= sh4r.r[Rm]; :}
nkeynes@359
   463
OR #imm, R0  {: R0 |= imm; :}
nkeynes@359
   464
OR.B #imm, @(R0, GBR) {: MEM_WRITE_BYTE( R0 + sh4r.gbr, imm | MEM_READ_BYTE(R0 + sh4r.gbr) ); :}
nkeynes@359
   465
TAS.B @Rn {:
nkeynes@359
   466
    tmp = MEM_READ_BYTE( sh4r.r[Rn] );
nkeynes@359
   467
    sh4r.t = ( tmp == 0 ? 1 : 0 );
nkeynes@359
   468
    MEM_WRITE_BYTE( sh4r.r[Rn], tmp | 0x80 );
nkeynes@359
   469
:}
nkeynes@359
   470
TST Rm, Rn {: sh4r.t = (sh4r.r[Rn]&sh4r.r[Rm] ? 0 : 1); :}
nkeynes@359
   471
TST #imm, R0 {: sh4r.t = (R0 & imm ? 0 : 1); :}
nkeynes@359
   472
TST.B #imm, @(R0, GBR) {: sh4r.t = ( MEM_READ_BYTE(R0 + sh4r.gbr) & imm ? 0 : 1 ); :}
nkeynes@359
   473
XOR Rm, Rn {: sh4r.r[Rn] ^= sh4r.r[Rm]; :}
nkeynes@359
   474
XOR #imm, R0 {: R0 ^= imm; :}
nkeynes@359
   475
XOR.B #imm, @(R0, GBR) {: MEM_WRITE_BYTE( R0 + sh4r.gbr, imm ^ MEM_READ_BYTE(R0 + sh4r.gbr) ); :}
nkeynes@359
   476
XTRCT Rm, Rn {: sh4r.r[Rn] = (sh4r.r[Rn]>>16) | (sh4r.r[Rm]<<16); :}
nkeynes@359
   477
nkeynes@359
   478
ROTL Rn {:
nkeynes@359
   479
    sh4r.t = sh4r.r[Rn] >> 31;
nkeynes@359
   480
    sh4r.r[Rn] <<= 1;
nkeynes@359
   481
    sh4r.r[Rn] |= sh4r.t;
nkeynes@359
   482
:}
nkeynes@359
   483
ROTR Rn {:
nkeynes@359
   484
    sh4r.t = sh4r.r[Rn] & 0x00000001;
nkeynes@359
   485
    sh4r.r[Rn] >>= 1;
nkeynes@359
   486
    sh4r.r[Rn] |= (sh4r.t << 31);
nkeynes@359
   487
:}
nkeynes@359
   488
ROTCL Rn {:
nkeynes@359
   489
    tmp = sh4r.r[Rn] >> 31;
nkeynes@359
   490
    sh4r.r[Rn] <<= 1;
nkeynes@359
   491
    sh4r.r[Rn] |= sh4r.t;
nkeynes@359
   492
    sh4r.t = tmp;
nkeynes@359
   493
:}
nkeynes@359
   494
ROTCR Rn {:
nkeynes@359
   495
    tmp = sh4r.r[Rn] & 0x00000001;
nkeynes@359
   496
    sh4r.r[Rn] >>= 1;
nkeynes@359
   497
    sh4r.r[Rn] |= (sh4r.t << 31 );
nkeynes@359
   498
    sh4r.t = tmp;
nkeynes@359
   499
:}
nkeynes@359
   500
SHAD Rm, Rn {:
nkeynes@359
   501
    tmp = sh4r.r[Rm];
nkeynes@359
   502
    if( (tmp & 0x80000000) == 0 ) sh4r.r[Rn] <<= (tmp&0x1f);
nkeynes@359
   503
    else if( (tmp & 0x1F) == 0 )  
nkeynes@359
   504
        sh4r.r[Rn] = ((int32_t)sh4r.r[Rn]) >> 31;
nkeynes@359
   505
    else 
nkeynes@359
   506
	sh4r.r[Rn] = ((int32_t)sh4r.r[Rn]) >> (((~sh4r.r[Rm]) & 0x1F)+1);
nkeynes@359
   507
:}
nkeynes@359
   508
SHLD Rm, Rn {:
nkeynes@359
   509
    tmp = sh4r.r[Rm];
nkeynes@359
   510
    if( (tmp & 0x80000000) == 0 ) sh4r.r[Rn] <<= (tmp&0x1f);
nkeynes@359
   511
    else if( (tmp & 0x1F) == 0 ) sh4r.r[Rn] = 0;
nkeynes@359
   512
    else sh4r.r[Rn] >>= (((~tmp) & 0x1F)+1);
nkeynes@359
   513
:}
nkeynes@359
   514
SHAL Rn {:
nkeynes@359
   515
    sh4r.t = sh4r.r[Rn] >> 31;
nkeynes@359
   516
    sh4r.r[Rn] <<= 1;
nkeynes@359
   517
:}
nkeynes@359
   518
SHAR Rn {:
nkeynes@359
   519
    sh4r.t = sh4r.r[Rn] & 0x00000001;
nkeynes@359
   520
    sh4r.r[Rn] = ((int32_t)sh4r.r[Rn]) >> 1;
nkeynes@359
   521
:}
nkeynes@359
   522
SHLL Rn {: sh4r.t = sh4r.r[Rn] >> 31; sh4r.r[Rn] <<= 1; :}
nkeynes@359
   523
SHLR Rn {: sh4r.t = sh4r.r[Rn] & 0x00000001; sh4r.r[Rn] >>= 1; :}
nkeynes@359
   524
SHLL2 Rn {: sh4r.r[Rn] <<= 2; :}
nkeynes@359
   525
SHLR2 Rn {: sh4r.r[Rn] >>= 2; :}
nkeynes@359
   526
SHLL8 Rn {: sh4r.r[Rn] <<= 8; :}
nkeynes@359
   527
SHLR8 Rn {: sh4r.r[Rn] >>= 8; :}
nkeynes@359
   528
SHLL16 Rn {: sh4r.r[Rn] <<= 16; :}
nkeynes@359
   529
SHLR16 Rn {: sh4r.r[Rn] >>= 16; :}
nkeynes@359
   530
nkeynes@359
   531
EXTU.B Rm, Rn {: sh4r.r[Rn] = sh4r.r[Rm]&0x000000FF; :}
nkeynes@359
   532
EXTU.W Rm, Rn {: sh4r.r[Rn] = sh4r.r[Rm]&0x0000FFFF; :}
nkeynes@359
   533
EXTS.B Rm, Rn {: sh4r.r[Rn] = SIGNEXT8( sh4r.r[Rm]&0x000000FF ); :}
nkeynes@359
   534
EXTS.W Rm, Rn {: sh4r.r[Rn] = SIGNEXT16( sh4r.r[Rm]&0x0000FFFF ); :}
nkeynes@359
   535
SWAP.B Rm, Rn {: sh4r.r[Rn] = (sh4r.r[Rm]&0xFFFF0000) | ((sh4r.r[Rm]&0x0000FF00)>>8) | ((sh4r.r[Rm]&0x000000FF)<<8); :}
nkeynes@359
   536
SWAP.W Rm, Rn {: sh4r.r[Rn] = (sh4r.r[Rm]>>16) | (sh4r.r[Rm]<<16); :}
nkeynes@359
   537
nkeynes@359
   538
CLRT {: sh4r.t = 0; :}
nkeynes@359
   539
SETT {: sh4r.t = 1; :}
nkeynes@359
   540
CLRMAC {: sh4r.mac = 0; :}
nkeynes@359
   541
LDTLB {: /* TODO */ :}
nkeynes@359
   542
CLRS {: sh4r.s = 0; :}
nkeynes@359
   543
SETS {: sh4r.s = 1; :}
nkeynes@359
   544
MOVT Rn {: sh4r.r[Rn] = sh4r.t; :}
nkeynes@359
   545
NOP {: /* NOP */ :}
nkeynes@359
   546
nkeynes@359
   547
PREF @Rn {:
nkeynes@359
   548
     tmp = sh4r.r[Rn];
nkeynes@359
   549
     if( (tmp & 0xFC000000) == 0xE0000000 ) {
nkeynes@369
   550
	 sh4_flush_store_queue(tmp);
nkeynes@359
   551
     }
nkeynes@359
   552
:}
nkeynes@359
   553
OCBI @Rn {: :}
nkeynes@359
   554
OCBP @Rn {: :}
nkeynes@359
   555
OCBWB @Rn {: :}
nkeynes@359
   556
MOVCA.L R0, @Rn {:
nkeynes@359
   557
    tmp = sh4r.r[Rn];
nkeynes@359
   558
    CHECKWALIGN32(tmp);
nkeynes@359
   559
    MEM_WRITE_LONG( tmp, R0 );
nkeynes@359
   560
:}
nkeynes@359
   561
MOV.B Rm, @(R0, Rn) {: MEM_WRITE_BYTE( R0 + sh4r.r[Rn], sh4r.r[Rm] ); :}
nkeynes@359
   562
MOV.W Rm, @(R0, Rn) {: 
nkeynes@359
   563
    CHECKWALIGN16( R0 + sh4r.r[Rn] );
nkeynes@359
   564
    MEM_WRITE_WORD( R0 + sh4r.r[Rn], sh4r.r[Rm] );
nkeynes@359
   565
:}
nkeynes@359
   566
MOV.L Rm, @(R0, Rn) {:
nkeynes@359
   567
    CHECKWALIGN32( R0 + sh4r.r[Rn] );
nkeynes@359
   568
    MEM_WRITE_LONG( R0 + sh4r.r[Rn], sh4r.r[Rm] );
nkeynes@359
   569
:}
nkeynes@359
   570
MOV.B @(R0, Rm), Rn {: sh4r.r[Rn] = MEM_READ_BYTE( R0 + sh4r.r[Rm] ); :}
nkeynes@359
   571
MOV.W @(R0, Rm), Rn {: CHECKRALIGN16( R0 + sh4r.r[Rm] );
nkeynes@359
   572
                    sh4r.r[Rn] = MEM_READ_WORD( R0 + sh4r.r[Rm] );
nkeynes@359
   573
:}
nkeynes@359
   574
MOV.L @(R0, Rm), Rn {: CHECKRALIGN32( R0 + sh4r.r[Rm] );
nkeynes@359
   575
                    sh4r.r[Rn] = MEM_READ_LONG( R0 + sh4r.r[Rm] );
nkeynes@359
   576
:}
nkeynes@359
   577
MOV.L Rm, @(disp, Rn) {:
nkeynes@359
   578
    tmp = sh4r.r[Rn] + disp;
nkeynes@359
   579
    CHECKWALIGN32( tmp );
nkeynes@359
   580
    MEM_WRITE_LONG( tmp, sh4r.r[Rm] );
nkeynes@359
   581
:}
nkeynes@359
   582
MOV.B Rm, @Rn {: MEM_WRITE_BYTE( sh4r.r[Rn], sh4r.r[Rm] ); :}
nkeynes@359
   583
MOV.W Rm, @Rn {: CHECKWALIGN16( sh4r.r[Rn] ); MEM_WRITE_WORD( sh4r.r[Rn], sh4r.r[Rm] ); :}
nkeynes@359
   584
MOV.L Rm, @Rn {: CHECKWALIGN32( sh4r.r[Rn] ); MEM_WRITE_LONG( sh4r.r[Rn], sh4r.r[Rm] ); :}
nkeynes@359
   585
MOV.B Rm, @-Rn {: sh4r.r[Rn] --; MEM_WRITE_BYTE( sh4r.r[Rn], sh4r.r[Rm] ); :}
nkeynes@359
   586
MOV.W Rm, @-Rn {: sh4r.r[Rn] -= 2; CHECKWALIGN16( sh4r.r[Rn] ); MEM_WRITE_WORD( sh4r.r[Rn], sh4r.r[Rm] ); :}
nkeynes@359
   587
MOV.L Rm, @-Rn {: sh4r.r[Rn] -= 4; CHECKWALIGN32( sh4r.r[Rn] ); MEM_WRITE_LONG( sh4r.r[Rn], sh4r.r[Rm] ); :}
nkeynes@359
   588
MOV.L @(disp, Rm), Rn {:
nkeynes@359
   589
    tmp = sh4r.r[Rm] + disp;
nkeynes@359
   590
    CHECKRALIGN32( tmp );
nkeynes@359
   591
    sh4r.r[Rn] = MEM_READ_LONG( tmp );
nkeynes@359
   592
:}
nkeynes@359
   593
MOV.B @Rm, Rn {: sh4r.r[Rn] = MEM_READ_BYTE( sh4r.r[Rm] ); :}
nkeynes@359
   594
MOV.W @Rm, Rn {: CHECKRALIGN16( sh4r.r[Rm] ); sh4r.r[Rn] = MEM_READ_WORD( sh4r.r[Rm] ); :}
nkeynes@359
   595
MOV.L @Rm, Rn {: CHECKRALIGN32( sh4r.r[Rm] ); sh4r.r[Rn] = MEM_READ_LONG( sh4r.r[Rm] ); :}
nkeynes@359
   596
MOV Rm, Rn {: sh4r.r[Rn] = sh4r.r[Rm]; :}
nkeynes@359
   597
MOV.B @Rm+, Rn {: sh4r.r[Rn] = MEM_READ_BYTE( sh4r.r[Rm] ); sh4r.r[Rm] ++; :}
nkeynes@359
   598
MOV.W @Rm+, Rn {: CHECKRALIGN16( sh4r.r[Rm] ); sh4r.r[Rn] = MEM_READ_WORD( sh4r.r[Rm] ); sh4r.r[Rm] += 2; :}
nkeynes@359
   599
MOV.L @Rm+, Rn {: CHECKRALIGN32( sh4r.r[Rm] ); sh4r.r[Rn] = MEM_READ_LONG( sh4r.r[Rm] ); sh4r.r[Rm] += 4; :}
nkeynes@359
   600
MOV.L @(disp, PC), Rn {:
nkeynes@359
   601
    CHECKSLOTILLEGAL();
nkeynes@359
   602
    tmp = (pc&0xFFFFFFFC) + disp + 4;
nkeynes@359
   603
    sh4r.r[Rn] = MEM_READ_LONG( tmp );
nkeynes@359
   604
:}
nkeynes@359
   605
MOV.B R0, @(disp, GBR) {: MEM_WRITE_BYTE( sh4r.gbr + disp, R0 ); :}
nkeynes@359
   606
MOV.W R0, @(disp, GBR) {:
nkeynes@359
   607
    tmp = sh4r.gbr + disp;
nkeynes@359
   608
    CHECKWALIGN16( tmp );
nkeynes@359
   609
    MEM_WRITE_WORD( tmp, R0 );
nkeynes@359
   610
:}
nkeynes@359
   611
MOV.L R0, @(disp, GBR) {:
nkeynes@359
   612
    tmp = sh4r.gbr + disp;
nkeynes@359
   613
    CHECKWALIGN32( tmp );
nkeynes@359
   614
    MEM_WRITE_LONG( tmp, R0 );
nkeynes@359
   615
:}
nkeynes@359
   616
MOV.B @(disp, GBR), R0 {: R0 = MEM_READ_BYTE( sh4r.gbr + disp ); :}
nkeynes@359
   617
MOV.W @(disp, GBR), R0 {: 
nkeynes@359
   618
    tmp = sh4r.gbr + disp;
nkeynes@359
   619
    CHECKRALIGN16( tmp );
nkeynes@359
   620
    R0 = MEM_READ_WORD( tmp );
nkeynes@359
   621
:}
nkeynes@359
   622
MOV.L @(disp, GBR), R0 {:
nkeynes@359
   623
    tmp = sh4r.gbr + disp;
nkeynes@359
   624
    CHECKRALIGN32( tmp );
nkeynes@359
   625
    R0 = MEM_READ_LONG( tmp );
nkeynes@359
   626
:}
nkeynes@359
   627
MOV.B R0, @(disp, Rn) {: MEM_WRITE_BYTE( sh4r.r[Rn] + disp, R0 ); :}
nkeynes@359
   628
MOV.W R0, @(disp, Rn) {: 
nkeynes@359
   629
    tmp = sh4r.r[Rn] + disp;
nkeynes@359
   630
    CHECKWALIGN16( tmp );
nkeynes@359
   631
    MEM_WRITE_WORD( tmp, R0 );
nkeynes@359
   632
:}
nkeynes@359
   633
MOV.B @(disp, Rm), R0 {: R0 = MEM_READ_BYTE( sh4r.r[Rm] + disp ); :}
nkeynes@359
   634
MOV.W @(disp, Rm), R0 {: 
nkeynes@359
   635
    tmp = sh4r.r[Rm] + disp;
nkeynes@359
   636
    CHECKRALIGN16( tmp );
nkeynes@359
   637
    R0 = MEM_READ_WORD( tmp );
nkeynes@359
   638
:}
nkeynes@359
   639
MOV.W @(disp, PC), Rn {:
nkeynes@359
   640
    CHECKSLOTILLEGAL();
nkeynes@359
   641
    tmp = pc + 4 + disp;
nkeynes@359
   642
    sh4r.r[Rn] = MEM_READ_WORD( tmp );
nkeynes@359
   643
:}
nkeynes@359
   644
MOVA @(disp, PC), R0 {:
nkeynes@359
   645
    CHECKSLOTILLEGAL();
nkeynes@359
   646
    R0 = (pc&0xFFFFFFFC) + disp + 4;
nkeynes@359
   647
:}
nkeynes@359
   648
MOV #imm, Rn {:  sh4r.r[Rn] = imm; :}
nkeynes@359
   649
nkeynes@359
   650
CMP/EQ #imm, R0 {: sh4r.t = ( R0 == imm ? 1 : 0 ); :}
nkeynes@359
   651
CMP/EQ Rm, Rn {: sh4r.t = ( sh4r.r[Rm] == sh4r.r[Rn] ? 1 : 0 ); :}
nkeynes@359
   652
CMP/GE Rm, Rn {: sh4r.t = ( ((int32_t)sh4r.r[Rn]) >= ((int32_t)sh4r.r[Rm]) ? 1 : 0 ); :}
nkeynes@359
   653
CMP/GT Rm, Rn {: sh4r.t = ( ((int32_t)sh4r.r[Rn]) > ((int32_t)sh4r.r[Rm]) ? 1 : 0 ); :}
nkeynes@359
   654
CMP/HI Rm, Rn {: sh4r.t = ( sh4r.r[Rn] > sh4r.r[Rm] ? 1 : 0 ); :}
nkeynes@359
   655
CMP/HS Rm, Rn {: sh4r.t = ( sh4r.r[Rn] >= sh4r.r[Rm] ? 1 : 0 ); :}
nkeynes@359
   656
CMP/PL Rn {: sh4r.t = ( ((int32_t)sh4r.r[Rn]) > 0 ? 1 : 0 ); :}
nkeynes@359
   657
CMP/PZ Rn {: sh4r.t = ( ((int32_t)sh4r.r[Rn]) >= 0 ? 1 : 0 ); :}
nkeynes@359
   658
CMP/STR Rm, Rn {:
    /* Byte-wise string compare: XOR the two operands so that a byte lane
     * which is identical in Rm and Rn comes out as zero. T is set to 1
     * when at least one of the four lanes matches, otherwise cleared.
     */
    tmp = sh4r.r[Rn] ^ sh4r.r[Rm];
    if( (tmp&0xFF000000)!=0 && (tmp&0x00FF0000)!=0 &&
        (tmp&0x0000FF00)!=0 && (tmp&0x000000FF)!=0 ) {
        /* Every lane differs somewhere - no matching byte */
        sh4r.t = 0;
    } else {
        sh4r.t = 1;
    }
:}
nkeynes@359
   664
nkeynes@359
   665
ADD Rm, Rn {: sh4r.r[Rn] += sh4r.r[Rm]; :}
nkeynes@359
   666
ADD #imm, Rn {: sh4r.r[Rn] += imm; :}
nkeynes@359
   667
ADDC Rm, Rn {:
nkeynes@359
   668
    tmp = sh4r.r[Rn];
nkeynes@359
   669
    sh4r.r[Rn] += sh4r.r[Rm] + sh4r.t;
nkeynes@359
   670
    sh4r.t = ( sh4r.r[Rn] < tmp || (sh4r.r[Rn] == tmp && sh4r.t != 0) ? 1 : 0 );
nkeynes@359
   671
:}
nkeynes@359
   672
ADDV Rm, Rn {:
    /* Add with signed-overflow detection: Rn = Rn + Rm, and T is set to 1
     * only when both operands carry the same sign bit (bit 31) and the
     * sum's sign bit differs from it.
     */
    tmp = sh4r.r[Rm] + sh4r.r[Rn];
    if( (sh4r.r[Rn]>>31) != (sh4r.r[Rm]>>31) ) {
        /* Operands of opposite sign can never overflow */
        sh4r.t = 0;
    } else {
        sh4r.t = ( (tmp>>31) != (sh4r.r[Rn]>>31) ? 1 : 0 );
    }
    sh4r.r[Rn] = tmp;
:}
nkeynes@359
   677
DIV0U {: sh4r.m = sh4r.q = sh4r.t = 0; :}
nkeynes@359
   678
DIV0S Rm, Rn {: 
nkeynes@359
   679
    sh4r.q = sh4r.r[Rn]>>31;
nkeynes@359
   680
    sh4r.m = sh4r.r[Rm]>>31;
nkeynes@359
   681
    sh4r.t = sh4r.q ^ sh4r.m;
nkeynes@359
   682
:}
nkeynes@359
   683
DIV1 Rm, Rn {:
nkeynes@359
   684
    /* This is just from the sh4p manual with some
nkeynes@359
   685
     * simplifications (someone want to check it's correct? :)
nkeynes@359
   686
     * Why they couldn't just provide a real DIV instruction...
nkeynes@359
   687
     */
nkeynes@359
   688
    uint32_t tmp0, tmp1, tmp2, dir;
nkeynes@359
   689
nkeynes@359
   690
    dir = sh4r.q ^ sh4r.m;
nkeynes@359
   691
    sh4r.q = (sh4r.r[Rn] >> 31);
nkeynes@359
   692
    tmp2 = sh4r.r[Rm];
nkeynes@359
   693
    sh4r.r[Rn] = (sh4r.r[Rn] << 1) | sh4r.t;
nkeynes@359
   694
    tmp0 = sh4r.r[Rn];
nkeynes@359
   695
    if( dir ) {
nkeynes@359
   696
         sh4r.r[Rn] += tmp2;
nkeynes@359
   697
         tmp1 = (sh4r.r[Rn]<tmp0 ? 1 : 0 );
nkeynes@359
   698
    } else {
nkeynes@359
   699
         sh4r.r[Rn] -= tmp2;
nkeynes@359
   700
         tmp1 = (sh4r.r[Rn]>tmp0 ? 1 : 0 );
nkeynes@359
   701
    }
nkeynes@359
   702
    sh4r.q ^= sh4r.m ^ tmp1;
nkeynes@359
   703
    sh4r.t = ( sh4r.q == sh4r.m ? 1 : 0 );
nkeynes@359
   704
:}
nkeynes@359
   705
DMULS.L Rm, Rn {: sh4r.mac = SIGNEXT32(sh4r.r[Rm]) * SIGNEXT32(sh4r.r[Rn]); :}
nkeynes@359
   706
DMULU.L Rm, Rn {: sh4r.mac = ((uint64_t)sh4r.r[Rm]) * ((uint64_t)sh4r.r[Rn]); :}
nkeynes@359
   707
DT Rn {:
    /* Decrement-and-test: subtract one from Rn, then set T to 1 if the
     * register has reached zero and to 0 otherwise.
     */
    sh4r.r[Rn] -= 1;
    sh4r.t = ( sh4r.r[Rn] != 0 ? 0 : 1 );
:}
nkeynes@359
   711
MAC.W @Rm+, @Rn+ {:
nkeynes@359
   712
    CHECKRALIGN16( sh4r.r[Rn] );
nkeynes@359
   713
    CHECKRALIGN16( sh4r.r[Rm] );
nkeynes@359
   714
    int32_t stmp = SIGNEXT16(MEM_READ_WORD(sh4r.r[Rn]));
nkeynes@359
   715
    sh4r.r[Rn] += 2;
nkeynes@359
   716
    stmp = stmp * SIGNEXT16(MEM_READ_WORD(sh4r.r[Rm]));
nkeynes@359
   717
    sh4r.r[Rm] += 2;
nkeynes@359
   718
    if( sh4r.s ) {
nkeynes@359
   719
	int64_t tmpl = (int64_t)((int32_t)sh4r.mac) + (int64_t)stmp;
nkeynes@359
   720
	if( tmpl > (int64_t)0x000000007FFFFFFFLL ) {
nkeynes@359
   721
	    sh4r.mac = 0x000000017FFFFFFFLL;
nkeynes@359
   722
	} else if( tmpl < (int64_t)0xFFFFFFFF80000000LL ) {
nkeynes@359
   723
	    sh4r.mac = 0x0000000180000000LL;
nkeynes@359
   724
	} else {
nkeynes@359
   725
	    sh4r.mac = (sh4r.mac & 0xFFFFFFFF00000000LL) |
nkeynes@359
   726
		((uint32_t)(sh4r.mac + stmp));
nkeynes@359
   727
	}
nkeynes@359
   728
    } else {
nkeynes@359
   729
	sh4r.mac += SIGNEXT32(stmp);
nkeynes@359
   730
    }
nkeynes@359
   731
:}
nkeynes@359
   732
MAC.L @Rm+, @Rn+ {:
nkeynes@359
   733
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
   734
    CHECKRALIGN32( sh4r.r[Rn] );
nkeynes@359
   735
    int64_t tmpl = SIGNEXT32(MEM_READ_LONG(sh4r.r[Rn]));
nkeynes@359
   736
    sh4r.r[Rn] += 4;
nkeynes@359
   737
    tmpl = tmpl * SIGNEXT32(MEM_READ_LONG(sh4r.r[Rm])) + sh4r.mac;
nkeynes@359
   738
    sh4r.r[Rm] += 4;
nkeynes@359
   739
    if( sh4r.s ) {
nkeynes@359
   740
        /* 48-bit Saturation. Yuch */
nkeynes@359
   741
        if( tmpl < (int64_t)0xFFFF800000000000LL )
nkeynes@359
   742
            tmpl = 0xFFFF800000000000LL;
nkeynes@359
   743
        else if( tmpl > (int64_t)0x00007FFFFFFFFFFFLL )
nkeynes@359
   744
            tmpl = 0x00007FFFFFFFFFFFLL;
nkeynes@359
   745
    }
nkeynes@359
   746
    sh4r.mac = tmpl;
nkeynes@359
   747
:}
nkeynes@359
   748
MUL.L Rm, Rn {: sh4r.mac = (sh4r.mac&0xFFFFFFFF00000000LL) |
nkeynes@359
   749
                        (sh4r.r[Rm] * sh4r.r[Rn]); :}
nkeynes@359
   750
MULU.W Rm, Rn {:
nkeynes@359
   751
    sh4r.mac = (sh4r.mac&0xFFFFFFFF00000000LL) |
nkeynes@359
   752
               (uint32_t)((sh4r.r[Rm]&0xFFFF) * (sh4r.r[Rn]&0xFFFF));
nkeynes@359
   753
:}
nkeynes@359
   754
MULS.W Rm, Rn {:
    /* Signed 16x16 -> 32 bit multiply of the low words of Rm and Rn.
     * The product replaces the low 32 bits of MAC; the high 32 bits are
     * left untouched.
     *
     * Each operand must be sign-extended from bit 15. Masking with 0xFFFF
     * and then widening (as was done previously) always yields a
     * non-negative value, which made this rule compute the same result as
     * MULU.W (e.g. 0xFFFF * 1 gave 0x0000FFFF rather than 0xFFFFFFFF).
     * The product of two 16-bit signed values always fits in an int32_t.
     */
    sh4r.mac = (sh4r.mac&0xFFFFFFFF00000000LL) |
               (uint32_t)(((int32_t)(int16_t)(sh4r.r[Rm]&0xFFFF)) *
                          ((int32_t)(int16_t)(sh4r.r[Rn]&0xFFFF)));
:}
nkeynes@359
   758
NEGC Rm, Rn {:
nkeynes@359
   759
    tmp = 0 - sh4r.r[Rm];
nkeynes@359
   760
    sh4r.r[Rn] = tmp - sh4r.t;
nkeynes@359
   761
    sh4r.t = ( 0<tmp || tmp<sh4r.r[Rn] ? 1 : 0 );
nkeynes@359
   762
:}
nkeynes@359
   763
NEG Rm, Rn {: sh4r.r[Rn] = 0 - sh4r.r[Rm]; :}
nkeynes@359
   764
SUB Rm, Rn {: sh4r.r[Rn] -= sh4r.r[Rm]; :}
nkeynes@359
   765
SUBC Rm, Rn {: 
nkeynes@359
   766
    tmp = sh4r.r[Rn];
nkeynes@359
   767
    sh4r.r[Rn] = sh4r.r[Rn] - sh4r.r[Rm] - sh4r.t;
nkeynes@359
   768
    sh4r.t = (sh4r.r[Rn] > tmp || (sh4r.r[Rn] == tmp && sh4r.t == 1));
nkeynes@359
   769
:}
nkeynes@359
   770
nkeynes@359
   771
BRAF Rn {:
nkeynes@359
   772
     CHECKSLOTILLEGAL();
nkeynes@359
   773
     CHECKDEST( pc + 4 + sh4r.r[Rn] );
nkeynes@359
   774
     sh4r.in_delay_slot = 1;
nkeynes@359
   775
     sh4r.pc = sh4r.new_pc;
nkeynes@359
   776
     sh4r.new_pc = pc + 4 + sh4r.r[Rn];
nkeynes@359
   777
     return TRUE;
nkeynes@359
   778
:}
nkeynes@359
   779
BSRF Rn {:
nkeynes@359
   780
     CHECKSLOTILLEGAL();
nkeynes@359
   781
     CHECKDEST( pc + 4 + sh4r.r[Rn] );
nkeynes@359
   782
     sh4r.in_delay_slot = 1;
nkeynes@359
   783
     sh4r.pr = sh4r.pc + 4;
nkeynes@359
   784
     sh4r.pc = sh4r.new_pc;
nkeynes@359
   785
     sh4r.new_pc = pc + 4 + sh4r.r[Rn];
nkeynes@359
   786
     TRACE_CALL( pc, sh4r.new_pc );
nkeynes@359
   787
     return TRUE;
nkeynes@359
   788
:}
nkeynes@359
   789
BT disp {:
nkeynes@359
   790
    CHECKSLOTILLEGAL();
nkeynes@359
   791
    if( sh4r.t ) {
nkeynes@359
   792
        CHECKDEST( sh4r.pc + disp + 4 )
nkeynes@359
   793
        sh4r.pc += disp + 4;
nkeynes@359
   794
        sh4r.new_pc = sh4r.pc + 2;
nkeynes@359
   795
        return TRUE;
nkeynes@359
   796
    }
nkeynes@359
   797
:}
nkeynes@359
   798
BF disp {:
nkeynes@359
   799
    CHECKSLOTILLEGAL();
nkeynes@359
   800
    if( !sh4r.t ) {
nkeynes@359
   801
        CHECKDEST( sh4r.pc + disp + 4 )
nkeynes@359
   802
        sh4r.pc += disp + 4;
nkeynes@359
   803
        sh4r.new_pc = sh4r.pc + 2;
nkeynes@359
   804
        return TRUE;
nkeynes@359
   805
    }
nkeynes@359
   806
:}
nkeynes@359
   807
BT/S disp {:
    /* Delayed conditional branch, taken when T is set. When taken, the
     * instruction at the current new_pc is executed next as the delay slot
     * (pc = new_pc, in_delay_slot = 1) and the branch target pc + disp + 4
     * is queued in new_pc. When not taken, control falls out of this
     * action without modifying any state.
     *
     * in_delay_slot is set exactly once here, matching BF/S (it used to be
     * assigned twice with no effect).
     */
    CHECKSLOTILLEGAL();
    if( sh4r.t ) {
        CHECKDEST( sh4r.pc + disp + 4 )
        sh4r.in_delay_slot = 1;
        sh4r.pc = sh4r.new_pc;
        sh4r.new_pc = pc + disp + 4;
        return TRUE;
    }
:}
nkeynes@359
   818
BF/S disp {:
nkeynes@359
   819
    CHECKSLOTILLEGAL();
nkeynes@359
   820
    if( !sh4r.t ) {
nkeynes@359
   821
        CHECKDEST( sh4r.pc + disp + 4 )
nkeynes@359
   822
        sh4r.in_delay_slot = 1;
nkeynes@359
   823
        sh4r.pc = sh4r.new_pc;
nkeynes@359
   824
        sh4r.new_pc = pc + disp + 4;
nkeynes@359
   825
        return TRUE;
nkeynes@359
   826
    }
nkeynes@359
   827
:}
nkeynes@359
   828
BRA disp {:
nkeynes@359
   829
    CHECKSLOTILLEGAL();
nkeynes@359
   830
    CHECKDEST( sh4r.pc + disp + 4 );
nkeynes@359
   831
    sh4r.in_delay_slot = 1;
nkeynes@359
   832
    sh4r.pc = sh4r.new_pc;
nkeynes@359
   833
    sh4r.new_pc = pc + 4 + disp;
nkeynes@359
   834
    return TRUE;
nkeynes@359
   835
:}
nkeynes@359
   836
BSR disp {:
nkeynes@359
   837
    CHECKDEST( sh4r.pc + disp + 4 );
nkeynes@359
   838
    CHECKSLOTILLEGAL();
nkeynes@359
   839
    sh4r.in_delay_slot = 1;
nkeynes@359
   840
    sh4r.pr = pc + 4;
nkeynes@359
   841
    sh4r.pc = sh4r.new_pc;
nkeynes@359
   842
    sh4r.new_pc = pc + 4 + disp;
nkeynes@359
   843
    TRACE_CALL( pc, sh4r.new_pc );
nkeynes@359
   844
    return TRUE;
nkeynes@359
   845
:}
nkeynes@359
   846
TRAPA #imm {:
nkeynes@359
   847
    CHECKSLOTILLEGAL();
nkeynes@359
   848
    MMIO_WRITE( MMU, TRA, imm<<2 );
nkeynes@359
   849
    sh4r.pc += 2;
nkeynes@359
   850
    sh4_raise_exception( EXC_TRAP );
nkeynes@359
   851
:}
nkeynes@359
   852
RTS {: 
nkeynes@359
   853
    CHECKSLOTILLEGAL();
nkeynes@359
   854
    CHECKDEST( sh4r.pr );
nkeynes@359
   855
    sh4r.in_delay_slot = 1;
nkeynes@359
   856
    sh4r.pc = sh4r.new_pc;
nkeynes@359
   857
    sh4r.new_pc = sh4r.pr;
nkeynes@359
   858
    TRACE_RETURN( pc, sh4r.new_pc );
nkeynes@359
   859
    return TRUE;
nkeynes@359
   860
:}
nkeynes@359
   861
SLEEP {:
    /* Suspend the CPU. Bit 0x80 of the CPG STBCR register selects which
     * low-power state is entered: STANDBY when the bit is set, SLEEP when
     * it is clear. Returning FALSE stops instruction execution.
     */
    sh4r.sh4_state = ( (MMIO_READ( CPG, STBCR ) & 0x80) != 0 ?
                       SH4_STATE_STANDBY : SH4_STATE_SLEEP );
    return FALSE; /* Halt CPU */
:}
nkeynes@359
   869
RTE {:
nkeynes@359
   870
    CHECKPRIV();
nkeynes@359
   871
    CHECKDEST( sh4r.spc );
nkeynes@359
   872
    CHECKSLOTILLEGAL();
nkeynes@359
   873
    sh4r.in_delay_slot = 1;
nkeynes@359
   874
    sh4r.pc = sh4r.new_pc;
nkeynes@359
   875
    sh4r.new_pc = sh4r.spc;
nkeynes@374
   876
    sh4_write_sr( sh4r.ssr );
nkeynes@359
   877
    return TRUE;
nkeynes@359
   878
:}
nkeynes@359
   879
JMP @Rn {:
nkeynes@359
   880
    CHECKDEST( sh4r.r[Rn] );
nkeynes@359
   881
    CHECKSLOTILLEGAL();
nkeynes@359
   882
    sh4r.in_delay_slot = 1;
nkeynes@359
   883
    sh4r.pc = sh4r.new_pc;
nkeynes@359
   884
    sh4r.new_pc = sh4r.r[Rn];
nkeynes@359
   885
    return TRUE;
nkeynes@359
   886
:}
nkeynes@359
   887
JSR @Rn {:
nkeynes@359
   888
    CHECKDEST( sh4r.r[Rn] );
nkeynes@359
   889
    CHECKSLOTILLEGAL();
nkeynes@359
   890
    sh4r.in_delay_slot = 1;
nkeynes@359
   891
    sh4r.pc = sh4r.new_pc;
nkeynes@359
   892
    sh4r.new_pc = sh4r.r[Rn];
nkeynes@359
   893
    sh4r.pr = pc + 4;
nkeynes@359
   894
    TRACE_CALL( pc, sh4r.new_pc );
nkeynes@359
   895
    return TRUE;
nkeynes@359
   896
:}
nkeynes@359
   897
STS MACH, Rn {: sh4r.r[Rn] = (sh4r.mac>>32); :}
nkeynes@359
   898
STS.L MACH, @-Rn {:
nkeynes@359
   899
    sh4r.r[Rn] -= 4;
nkeynes@359
   900
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
   901
    MEM_WRITE_LONG( sh4r.r[Rn], (sh4r.mac>>32) );
nkeynes@359
   902
:}
nkeynes@359
   903
STC.L SR, @-Rn {:
nkeynes@359
   904
    CHECKPRIV();
nkeynes@359
   905
    sh4r.r[Rn] -= 4;
nkeynes@359
   906
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
   907
    MEM_WRITE_LONG( sh4r.r[Rn], sh4_read_sr() );
nkeynes@359
   908
:}
nkeynes@359
   909
LDS.L @Rm+, MACH {:
nkeynes@359
   910
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
   911
    sh4r.mac = (sh4r.mac & 0x00000000FFFFFFFF) |
nkeynes@359
   912
               (((uint64_t)MEM_READ_LONG(sh4r.r[Rm]))<<32);
nkeynes@359
   913
    sh4r.r[Rm] += 4;
nkeynes@359
   914
:}
nkeynes@359
   915
LDC.L @Rm+, SR {:
    /* Load SR from the longword at @Rm, then post-increment Rm by 4.
     * Not permitted in a delay slot and requires privileged mode.
     *
     * This is a memory *read*, so the read-alignment check is used, as in
     * every other "@Rm+" load rule in this file (it previously used the
     * write-alignment check).
     */
    CHECKSLOTILLEGAL();
    CHECKPRIV();
    CHECKRALIGN32( sh4r.r[Rm] );
    sh4_write_sr( MEM_READ_LONG(sh4r.r[Rm]) );
    sh4r.r[Rm] +=4;
:}
nkeynes@359
   922
LDS Rm, MACH {:
nkeynes@359
   923
    sh4r.mac = (sh4r.mac & 0x00000000FFFFFFFF) |
nkeynes@359
   924
               (((uint64_t)sh4r.r[Rm])<<32);
nkeynes@359
   925
:}
nkeynes@359
   926
LDC Rm, SR {:
nkeynes@359
   927
    CHECKSLOTILLEGAL();
nkeynes@359
   928
    CHECKPRIV();
nkeynes@374
   929
    sh4_write_sr( sh4r.r[Rm] );
nkeynes@359
   930
:}
nkeynes@359
   931
LDC Rm, SGR {:
nkeynes@359
   932
    CHECKPRIV();
nkeynes@359
   933
    sh4r.sgr = sh4r.r[Rm];
nkeynes@359
   934
:}
nkeynes@359
   935
LDC.L @Rm+, SGR {:
nkeynes@359
   936
    CHECKPRIV();
nkeynes@359
   937
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
   938
    sh4r.sgr = MEM_READ_LONG(sh4r.r[Rm]);
nkeynes@359
   939
    sh4r.r[Rm] +=4;
nkeynes@359
   940
:}
nkeynes@359
   941
STS MACL, Rn {: sh4r.r[Rn] = (uint32_t)sh4r.mac; :}
nkeynes@359
   942
STS.L MACL, @-Rn {:
nkeynes@359
   943
    sh4r.r[Rn] -= 4;
nkeynes@359
   944
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
   945
    MEM_WRITE_LONG( sh4r.r[Rn], (uint32_t)sh4r.mac );
nkeynes@359
   946
:}
nkeynes@359
   947
STC.L GBR, @-Rn {:
nkeynes@359
   948
    sh4r.r[Rn] -= 4;
nkeynes@359
   949
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
   950
    MEM_WRITE_LONG( sh4r.r[Rn], sh4r.gbr );
nkeynes@359
   951
:}
nkeynes@359
   952
LDS.L @Rm+, MACL {:
nkeynes@359
   953
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
   954
    sh4r.mac = (sh4r.mac & 0xFFFFFFFF00000000LL) |
nkeynes@359
   955
               (uint64_t)((uint32_t)MEM_READ_LONG(sh4r.r[Rm]));
nkeynes@359
   956
    sh4r.r[Rm] += 4;
nkeynes@359
   957
:}
nkeynes@359
   958
LDC.L @Rm+, GBR {:
nkeynes@359
   959
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
   960
    sh4r.gbr = MEM_READ_LONG(sh4r.r[Rm]);
nkeynes@359
   961
    sh4r.r[Rm] +=4;
nkeynes@359
   962
:}
nkeynes@359
   963
LDS Rm, MACL {:
nkeynes@359
   964
    sh4r.mac = (sh4r.mac & 0xFFFFFFFF00000000LL) |
nkeynes@359
   965
               (uint64_t)((uint32_t)(sh4r.r[Rm]));
nkeynes@359
   966
:}
nkeynes@359
   967
LDC Rm, GBR {: sh4r.gbr = sh4r.r[Rm]; :}
nkeynes@359
   968
STS PR, Rn {: sh4r.r[Rn] = sh4r.pr; :}
nkeynes@359
   969
STS.L PR, @-Rn {:
nkeynes@359
   970
    sh4r.r[Rn] -= 4;
nkeynes@359
   971
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
   972
    MEM_WRITE_LONG( sh4r.r[Rn], sh4r.pr );
nkeynes@359
   973
:}
nkeynes@359
   974
STC.L VBR, @-Rn {:
nkeynes@359
   975
    CHECKPRIV();
nkeynes@359
   976
    sh4r.r[Rn] -= 4;
nkeynes@359
   977
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
   978
    MEM_WRITE_LONG( sh4r.r[Rn], sh4r.vbr );
nkeynes@359
   979
:}
nkeynes@359
   980
LDS.L @Rm+, PR {:
nkeynes@359
   981
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
   982
    sh4r.pr = MEM_READ_LONG( sh4r.r[Rm] );
nkeynes@359
   983
    sh4r.r[Rm] += 4;
nkeynes@359
   984
:}
nkeynes@359
   985
LDC.L @Rm+, VBR {:
nkeynes@359
   986
    CHECKPRIV();
nkeynes@359
   987
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
   988
    sh4r.vbr = MEM_READ_LONG(sh4r.r[Rm]);
nkeynes@359
   989
    sh4r.r[Rm] +=4;
nkeynes@359
   990
:}
nkeynes@359
   991
LDS Rm, PR {: sh4r.pr = sh4r.r[Rm]; :}
nkeynes@359
   992
LDC Rm, VBR {:
nkeynes@359
   993
    CHECKPRIV();
nkeynes@359
   994
    sh4r.vbr = sh4r.r[Rm];
nkeynes@359
   995
:}
nkeynes@359
   996
STC SGR, Rn {:
nkeynes@359
   997
    CHECKPRIV();
nkeynes@359
   998
    sh4r.r[Rn] = sh4r.sgr;
nkeynes@359
   999
:}
nkeynes@359
  1000
STC.L SGR, @-Rn {:
nkeynes@359
  1001
    CHECKPRIV();
nkeynes@359
  1002
    sh4r.r[Rn] -= 4;
nkeynes@359
  1003
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
  1004
    MEM_WRITE_LONG( sh4r.r[Rn], sh4r.sgr );
nkeynes@359
  1005
:}
nkeynes@359
  1006
STC.L SSR, @-Rn {:
nkeynes@359
  1007
    CHECKPRIV();
nkeynes@359
  1008
    sh4r.r[Rn] -= 4;
nkeynes@359
  1009
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
  1010
    MEM_WRITE_LONG( sh4r.r[Rn], sh4r.ssr );
nkeynes@359
  1011
:}
nkeynes@359
  1012
LDC.L @Rm+, SSR {:
nkeynes@359
  1013
    CHECKPRIV();
nkeynes@359
  1014
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
  1015
    sh4r.ssr = MEM_READ_LONG(sh4r.r[Rm]);
nkeynes@359
  1016
    sh4r.r[Rm] +=4;
nkeynes@359
  1017
:}
nkeynes@359
  1018
LDC Rm, SSR {:
nkeynes@359
  1019
    CHECKPRIV();
nkeynes@359
  1020
    sh4r.ssr = sh4r.r[Rm];
nkeynes@359
  1021
:}
nkeynes@359
  1022
STC.L SPC, @-Rn {:
nkeynes@359
  1023
    CHECKPRIV();
nkeynes@359
  1024
    sh4r.r[Rn] -= 4;
nkeynes@359
  1025
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
  1026
    MEM_WRITE_LONG( sh4r.r[Rn], sh4r.spc );
nkeynes@359
  1027
:}
nkeynes@359
  1028
LDC.L @Rm+, SPC {:
nkeynes@359
  1029
    CHECKPRIV();
nkeynes@359
  1030
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
  1031
    sh4r.spc = MEM_READ_LONG(sh4r.r[Rm]);
nkeynes@359
  1032
    sh4r.r[Rm] +=4;
nkeynes@359
  1033
:}
nkeynes@359
  1034
LDC Rm, SPC {:
nkeynes@359
  1035
    CHECKPRIV();
nkeynes@359
  1036
    sh4r.spc = sh4r.r[Rm];
nkeynes@359
  1037
:}
nkeynes@359
  1038
STS FPUL, Rn {: sh4r.r[Rn] = sh4r.fpul; :}
nkeynes@359
  1039
STS.L FPUL, @-Rn {:
nkeynes@359
  1040
    sh4r.r[Rn] -= 4;
nkeynes@359
  1041
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
  1042
    MEM_WRITE_LONG( sh4r.r[Rn], sh4r.fpul );
nkeynes@359
  1043
:}
nkeynes@359
  1044
LDS.L @Rm+, FPUL {:
nkeynes@359
  1045
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
  1046
    sh4r.fpul = MEM_READ_LONG(sh4r.r[Rm]);
nkeynes@359
  1047
    sh4r.r[Rm] +=4;
nkeynes@359
  1048
:}
nkeynes@359
  1049
LDS Rm, FPUL {: sh4r.fpul = sh4r.r[Rm]; :}
nkeynes@359
  1050
STS FPSCR, Rn {: sh4r.r[Rn] = sh4r.fpscr; :}
nkeynes@359
  1051
STS.L FPSCR, @-Rn {:
nkeynes@359
  1052
    sh4r.r[Rn] -= 4;
nkeynes@359
  1053
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
  1054
    MEM_WRITE_LONG( sh4r.r[Rn], sh4r.fpscr );
nkeynes@359
  1055
:}
nkeynes@359
  1056
LDS.L @Rm+, FPSCR {:
nkeynes@359
  1057
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
  1058
    sh4r.fpscr = MEM_READ_LONG(sh4r.r[Rm]);
nkeynes@359
  1059
    sh4r.r[Rm] +=4;
nkeynes@374
  1060
    sh4r.fr_bank = &sh4r.fr[(sh4r.fpscr&FPSCR_FR)>>21][0];
nkeynes@359
  1061
:}
nkeynes@374
  1062
LDS Rm, FPSCR {: 
nkeynes@374
  1063
    sh4r.fpscr = sh4r.r[Rm]; 
nkeynes@374
  1064
    sh4r.fr_bank = &sh4r.fr[(sh4r.fpscr&FPSCR_FR)>>21][0];
nkeynes@374
  1065
:}
nkeynes@359
  1066
STC DBR, Rn {: CHECKPRIV(); sh4r.r[Rn] = sh4r.dbr; :}
nkeynes@359
  1067
STC.L DBR, @-Rn {:
nkeynes@359
  1068
    CHECKPRIV();
nkeynes@359
  1069
    sh4r.r[Rn] -= 4;
nkeynes@359
  1070
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
  1071
    MEM_WRITE_LONG( sh4r.r[Rn], sh4r.dbr );
nkeynes@359
  1072
:}
nkeynes@359
  1073
LDC.L @Rm+, DBR {:
nkeynes@359
  1074
    CHECKPRIV();
nkeynes@359
  1075
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
  1076
    sh4r.dbr = MEM_READ_LONG(sh4r.r[Rm]);
nkeynes@359
  1077
    sh4r.r[Rm] +=4;
nkeynes@359
  1078
:}
nkeynes@359
  1079
LDC Rm, DBR {:
nkeynes@359
  1080
    CHECKPRIV();
nkeynes@359
  1081
    sh4r.dbr = sh4r.r[Rm];
nkeynes@359
  1082
:}
nkeynes@359
  1083
STC.L Rm_BANK, @-Rn {:
nkeynes@359
  1084
    CHECKPRIV();
nkeynes@359
  1085
    sh4r.r[Rn] -= 4;
nkeynes@359
  1086
    CHECKWALIGN32( sh4r.r[Rn] );
nkeynes@359
  1087
    MEM_WRITE_LONG( sh4r.r[Rn], sh4r.r_bank[Rm_BANK] );
nkeynes@359
  1088
:}
nkeynes@359
  1089
LDC.L @Rm+, Rn_BANK {:
nkeynes@359
  1090
    CHECKPRIV();
nkeynes@359
  1091
    CHECKRALIGN32( sh4r.r[Rm] );
nkeynes@359
  1092
    sh4r.r_bank[Rn_BANK] = MEM_READ_LONG( sh4r.r[Rm] );
nkeynes@359
  1093
    sh4r.r[Rm] += 4;
nkeynes@359
  1094
:}
nkeynes@359
  1095
LDC Rm, Rn_BANK {:
nkeynes@359
  1096
    CHECKPRIV();
nkeynes@359
  1097
    sh4r.r_bank[Rn_BANK] = sh4r.r[Rm];
nkeynes@359
  1098
:}
nkeynes@359
  1099
STC SR, Rn {: 
nkeynes@359
  1100
    CHECKPRIV();
nkeynes@359
  1101
    sh4r.r[Rn] = sh4_read_sr();
nkeynes@359
  1102
:}
nkeynes@359
  1103
STC GBR, Rn {:
    /* Copy GBR into Rn. GBR is not a privileged register, so no privilege
     * check is made here - consistent with STC.L GBR, @-Rn, LDC Rm, GBR
     * and LDC.L @Rm+, GBR, none of which check for privileged mode.
     */
    sh4r.r[Rn] = sh4r.gbr;
:}
nkeynes@359
  1107
STC VBR, Rn {:
nkeynes@359
  1108
    CHECKPRIV();
nkeynes@359
  1109
    sh4r.r[Rn] = sh4r.vbr;
nkeynes@359
  1110
:}
nkeynes@359
  1111
STC SSR, Rn {:
nkeynes@359
  1112
    CHECKPRIV();
nkeynes@359
  1113
    sh4r.r[Rn] = sh4r.ssr;
nkeynes@359
  1114
:}
nkeynes@359
  1115
STC SPC, Rn {:
nkeynes@359
  1116
    CHECKPRIV();
nkeynes@359
  1117
    sh4r.r[Rn] = sh4r.spc;
nkeynes@359
  1118
:}
nkeynes@359
  1119
STC Rm_BANK, Rn {:
nkeynes@359
  1120
    CHECKPRIV();
nkeynes@359
  1121
    sh4r.r[Rn] = sh4r.r_bank[Rm_BANK];
nkeynes@359
  1122
:}
nkeynes@359
  1123
nkeynes@359
  1124
FADD FRm, FRn {:
nkeynes@359
  1125
    CHECKFPUEN();
nkeynes@359
  1126
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1127
	DR(FRn) += DR(FRm);
nkeynes@359
  1128
    } else {
nkeynes@359
  1129
	FR(FRn) += FR(FRm);
nkeynes@359
  1130
    }
nkeynes@359
  1131
:}
nkeynes@359
  1132
FSUB FRm, FRn {:
nkeynes@359
  1133
    CHECKFPUEN();
nkeynes@359
  1134
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1135
	DR(FRn) -= DR(FRm);
nkeynes@359
  1136
    } else {
nkeynes@359
  1137
	FR(FRn) -= FR(FRm);
nkeynes@359
  1138
    }
nkeynes@359
  1139
:}
nkeynes@359
  1140
nkeynes@359
  1141
FMUL FRm, FRn {:
nkeynes@359
  1142
    CHECKFPUEN();
nkeynes@359
  1143
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1144
	DR(FRn) *= DR(FRm);
nkeynes@359
  1145
    } else {
nkeynes@359
  1146
	FR(FRn) *= FR(FRm);
nkeynes@359
  1147
    }
nkeynes@359
  1148
:}
nkeynes@359
  1149
nkeynes@359
  1150
FDIV FRm, FRn {:
nkeynes@359
  1151
    CHECKFPUEN();
nkeynes@359
  1152
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1153
	DR(FRn) /= DR(FRm);
nkeynes@359
  1154
    } else {
nkeynes@359
  1155
	FR(FRn) /= FR(FRm);
nkeynes@359
  1156
    }
nkeynes@359
  1157
:}
nkeynes@359
  1158
nkeynes@359
  1159
FCMP/EQ FRm, FRn {:
nkeynes@359
  1160
    CHECKFPUEN();
nkeynes@359
  1161
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1162
	sh4r.t = ( DR(FRn) == DR(FRm) ? 1 : 0 );
nkeynes@359
  1163
    } else {
nkeynes@359
  1164
	sh4r.t = ( FR(FRn) == FR(FRm) ? 1 : 0 );
nkeynes@359
  1165
    }
nkeynes@359
  1166
:}
nkeynes@359
  1167
nkeynes@359
  1168
FCMP/GT FRm, FRn {:
nkeynes@359
  1169
    CHECKFPUEN();
nkeynes@359
  1170
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1171
	sh4r.t = ( DR(FRn) > DR(FRm) ? 1 : 0 );
nkeynes@359
  1172
    } else {
nkeynes@359
  1173
	sh4r.t = ( FR(FRn) > FR(FRm) ? 1 : 0 );
nkeynes@359
  1174
    }
nkeynes@359
  1175
:}
nkeynes@359
  1176
nkeynes@359
  1177
FMOV @(R0, Rm), FRn {: MEM_FP_READ( sh4r.r[Rm] + R0, FRn ); :}
nkeynes@359
  1178
FMOV FRm, @(R0, Rn) {: MEM_FP_WRITE( sh4r.r[Rn] + R0, FRm ); :}
nkeynes@359
  1179
FMOV @Rm, FRn {: MEM_FP_READ( sh4r.r[Rm], FRn ); :}
nkeynes@359
  1180
FMOV @Rm+, FRn {: MEM_FP_READ( sh4r.r[Rm], FRn ); sh4r.r[Rm] += FP_WIDTH; :}
nkeynes@359
  1181
FMOV FRm, @Rn {: MEM_FP_WRITE( sh4r.r[Rn], FRm ); :}
nkeynes@359
  1182
FMOV FRm, @-Rn {: sh4r.r[Rn] -= FP_WIDTH; MEM_FP_WRITE( sh4r.r[Rn], FRm ); :}
nkeynes@359
  1183
FMOV FRm, FRn {: 
nkeynes@359
  1184
    if( IS_FPU_DOUBLESIZE() )
nkeynes@359
  1185
	DR(FRn) = DR(FRm);
nkeynes@359
  1186
    else
nkeynes@359
  1187
	FR(FRn) = FR(FRm);
nkeynes@359
  1188
:}
nkeynes@359
  1189
FSTS FPUL, FRn {: CHECKFPUEN(); FR(FRn) = FPULf; :}
nkeynes@359
  1190
FLDS FRm, FPUL {: CHECKFPUEN(); FPULf = FR(FRm); :}
nkeynes@359
  1191
FLOAT FPUL, FRn {: 
nkeynes@359
  1192
    CHECKFPUEN();
nkeynes@374
  1193
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@374
  1194
	if( FRn&1 ) { // No, really...
nkeynes@374
  1195
	    dtmp = (double)FPULi;
nkeynes@374
  1196
	    FR(FRn) = *(((float *)&dtmp)+1);
nkeynes@374
  1197
	} else {
nkeynes@374
  1198
	    DRF(FRn>>1) = (double)FPULi;
nkeynes@374
  1199
	}
nkeynes@374
  1200
    } else {
nkeynes@359
  1201
	FR(FRn) = (float)FPULi;
nkeynes@374
  1202
    }
nkeynes@359
  1203
:}
nkeynes@359
  1204
FTRC FRm, FPUL {:
nkeynes@359
  1205
    CHECKFPUEN();
nkeynes@359
  1206
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@374
  1207
	if( FRm&1 ) {
nkeynes@374
  1208
	    dtmp = 0;
nkeynes@374
  1209
	    *(((float *)&dtmp)+1) = FR(FRm);
nkeynes@374
  1210
	} else {
nkeynes@374
  1211
	    dtmp = DRF(FRm>>1);
nkeynes@374
  1212
	}
nkeynes@359
  1213
        if( dtmp >= MAX_INTF )
nkeynes@359
  1214
            FPULi = MAX_INT;
nkeynes@359
  1215
        else if( dtmp <= MIN_INTF )
nkeynes@359
  1216
            FPULi = MIN_INT;
nkeynes@359
  1217
        else 
nkeynes@359
  1218
            FPULi = (int32_t)dtmp;
nkeynes@359
  1219
    } else {
nkeynes@359
  1220
	ftmp = FR(FRm);
nkeynes@359
  1221
	if( ftmp >= MAX_INTF )
nkeynes@359
  1222
	    FPULi = MAX_INT;
nkeynes@359
  1223
	else if( ftmp <= MIN_INTF )
nkeynes@359
  1224
	    FPULi = MIN_INT;
nkeynes@359
  1225
	else
nkeynes@359
  1226
	    FPULi = (int32_t)ftmp;
nkeynes@359
  1227
    }
nkeynes@359
  1228
:}
nkeynes@359
  1229
FNEG FRn {:
nkeynes@359
  1230
    CHECKFPUEN();
nkeynes@359
  1231
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1232
	DR(FRn) = -DR(FRn);
nkeynes@359
  1233
    } else {
nkeynes@359
  1234
        FR(FRn) = -FR(FRn);
nkeynes@359
  1235
    }
nkeynes@359
  1236
:}
nkeynes@359
  1237
FABS FRn {:
nkeynes@359
  1238
    CHECKFPUEN();
nkeynes@359
  1239
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1240
	DR(FRn) = fabs(DR(FRn));
nkeynes@359
  1241
    } else {
nkeynes@359
  1242
        FR(FRn) = fabsf(FR(FRn));
nkeynes@359
  1243
    }
nkeynes@359
  1244
:}
nkeynes@359
  1245
FSQRT FRn {:
nkeynes@359
  1246
    CHECKFPUEN();
nkeynes@359
  1247
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1248
	DR(FRn) = sqrt(DR(FRn));
nkeynes@359
  1249
    } else {
nkeynes@359
  1250
        FR(FRn) = sqrtf(FR(FRn));
nkeynes@359
  1251
    }
nkeynes@359
  1252
:}
nkeynes@359
  1253
FLDI0 FRn {:
nkeynes@359
  1254
    CHECKFPUEN();
nkeynes@359
  1255
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1256
	DR(FRn) = 0.0;
nkeynes@359
  1257
    } else {
nkeynes@359
  1258
        FR(FRn) = 0.0;
nkeynes@359
  1259
    }
nkeynes@359
  1260
:}
nkeynes@359
  1261
FLDI1 FRn {:
nkeynes@359
  1262
    CHECKFPUEN();
nkeynes@359
  1263
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1264
	DR(FRn) = 1.0;
nkeynes@359
  1265
    } else {
nkeynes@359
  1266
        FR(FRn) = 1.0;
nkeynes@359
  1267
    }
nkeynes@359
  1268
:}
nkeynes@359
  1269
FMAC FR0, FRm, FRn {:
nkeynes@359
  1270
    CHECKFPUEN();
nkeynes@359
  1271
    if( IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1272
        DR(FRn) += DR(FRm)*DR(0);
nkeynes@359
  1273
    } else {
nkeynes@359
  1274
	FR(FRn) += FR(FRm)*FR(0);
nkeynes@359
  1275
    }
nkeynes@359
  1276
:}
nkeynes@374
  1277
FRCHG {: 
nkeynes@374
  1278
    CHECKFPUEN(); 
nkeynes@374
  1279
    sh4r.fpscr ^= FPSCR_FR; 
nkeynes@374
  1280
    sh4r.fr_bank = &sh4r.fr[(sh4r.fpscr&FPSCR_FR)>>21][0];
nkeynes@374
  1281
:}
nkeynes@359
  1282
FSCHG {: CHECKFPUEN(); sh4r.fpscr ^= FPSCR_SZ; :}
nkeynes@359
  1283
FCNVSD FPUL, FRn {:
nkeynes@359
  1284
    CHECKFPUEN();
nkeynes@359
  1285
    if( IS_FPU_DOUBLEPREC() && !IS_FPU_DOUBLESIZE() ) {
nkeynes@359
  1286
	DR(FRn) = (double)FPULf;
nkeynes@359
  1287
    }
nkeynes@359
  1288
:}
nkeynes@359
  1289
FCNVDS FRm, FPUL {:
nkeynes@359
  1290
    CHECKFPUEN();
nkeynes@359
  1291
    if( IS_FPU_DOUBLEPREC() && !IS_FPU_DOUBLESIZE() ) {
nkeynes@359
  1292
	FPULf = (float)DR(FRm);
nkeynes@359
  1293
    }
nkeynes@359
  1294
:}
nkeynes@359
  1295
nkeynes@359
  1296
FSRRA FRn {:
nkeynes@359
  1297
    CHECKFPUEN();
nkeynes@359
  1298
    if( !IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1299
	FR(FRn) = 1.0/sqrtf(FR(FRn));
nkeynes@359
  1300
    }
nkeynes@359
  1301
:}
nkeynes@359
  1302
FIPR FVm, FVn {:
nkeynes@359
  1303
    CHECKFPUEN();
nkeynes@359
  1304
    if( !IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1305
        int tmp2 = FVn<<2;
nkeynes@359
  1306
        tmp = FVm<<2;
nkeynes@359
  1307
        FR(tmp2+3) = FR(tmp)*FR(tmp2) +
nkeynes@359
  1308
            FR(tmp+1)*FR(tmp2+1) +
nkeynes@359
  1309
            FR(tmp+2)*FR(tmp2+2) +
nkeynes@359
  1310
            FR(tmp+3)*FR(tmp2+3);
nkeynes@359
  1311
    }
nkeynes@359
  1312
:}
nkeynes@359
  1313
FSCA FPUL, FRn {:
nkeynes@359
  1314
    CHECKFPUEN();
nkeynes@359
  1315
    if( !IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1316
        float angle = (((float)(FPULi&0xFFFF))/65536.0) * 2 * M_PI;
nkeynes@359
  1317
        FR(FRn) = sinf(angle);
nkeynes@359
  1318
        FR((FRn)+1) = cosf(angle);
nkeynes@359
  1319
    }
nkeynes@359
  1320
:}
nkeynes@359
  1321
FTRV XMTRX, FVn {:
nkeynes@359
  1322
    CHECKFPUEN();
nkeynes@359
  1323
    if( !IS_FPU_DOUBLEPREC() ) {
nkeynes@359
  1324
        tmp = FVn<<2;
nkeynes@374
  1325
	float *xf = &sh4r.fr[((~sh4r.fpscr)&FPSCR_FR)>>21][0];
nkeynes@359
  1326
        float fv[4] = { FR(tmp), FR(tmp+1), FR(tmp+2), FR(tmp+3) };
nkeynes@374
  1327
        FR(tmp) = xf[1] * fv[0] + xf[5]*fv[1] +
nkeynes@374
  1328
	    xf[9]*fv[2] + xf[13]*fv[3];
nkeynes@374
  1329
        FR(tmp+1) = xf[0] * fv[0] + xf[4]*fv[1] +
nkeynes@374
  1330
	    xf[8]*fv[2] + xf[12]*fv[3];
nkeynes@374
  1331
        FR(tmp+2) = xf[3] * fv[0] + xf[7]*fv[1] +
nkeynes@374
  1332
	    xf[11]*fv[2] + xf[15]*fv[3];
nkeynes@374
  1333
        FR(tmp+3) = xf[2] * fv[0] + xf[6]*fv[1] +
nkeynes@374
  1334
	    xf[10]*fv[2] + xf[14]*fv[3];
nkeynes@359
  1335
    }
nkeynes@359
  1336
:}
nkeynes@359
  1337
UNDEF {:
nkeynes@359
  1338
    UNDEF(ir);
nkeynes@359
  1339
:}
nkeynes@359
  1340
%%
nkeynes@359
  1341
    sh4r.pc = sh4r.new_pc;
nkeynes@359
  1342
    sh4r.new_pc += 2;
nkeynes@359
  1343
    sh4r.in_delay_slot = 0;
nkeynes@359
  1344
    return TRUE;
nkeynes@359
  1345
}
.