Search
lxdream.org :: lxdream/src/sh4/sh4x86.in
lxdream 0.9.1
released Jun 29
Download Now
filename src/sh4/sh4x86.in
changeset 1263:b3de98d19faf
prev1218:be02e87f9f87
next1292:799fdd4f704a
author nkeynes
date Tue Mar 06 12:19:08 2012 +1000 (12 years ago)
permissions -rw-r--r--
last change Move x86dasm/* files under xlat/disasm
file annotate diff log raw
nkeynes@359
     1
/**
nkeynes@586
     2
 * $Id$
nkeynes@359
     3
 * 
nkeynes@359
     4
 * SH4 => x86 translation. This version does no real optimization, it just
nkeynes@359
     5
 * outputs straight-line x86 code - it mainly exists to provide a baseline
nkeynes@359
     6
 * to test the optimizing versions against.
nkeynes@359
     7
 *
nkeynes@359
     8
 * Copyright (c) 2007 Nathan Keynes.
nkeynes@359
     9
 *
nkeynes@359
    10
 * This program is free software; you can redistribute it and/or modify
nkeynes@359
    11
 * it under the terms of the GNU General Public License as published by
nkeynes@359
    12
 * the Free Software Foundation; either version 2 of the License, or
nkeynes@359
    13
 * (at your option) any later version.
nkeynes@359
    14
 *
nkeynes@359
    15
 * This program is distributed in the hope that it will be useful,
nkeynes@359
    16
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
nkeynes@359
    17
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
nkeynes@359
    18
 * GNU General Public License for more details.
nkeynes@359
    19
 */
nkeynes@359
    20
nkeynes@368
    21
#include <assert.h>
nkeynes@388
    22
#include <math.h>
nkeynes@368
    23
nkeynes@380
    24
#ifndef NDEBUG
nkeynes@380
    25
#define DEBUG_JUMPS 1
nkeynes@380
    26
#endif
nkeynes@380
    27
nkeynes@905
    28
#include "lxdream.h"
nkeynes@368
    29
#include "sh4/sh4core.h"
nkeynes@1091
    30
#include "sh4/sh4dasm.h"
nkeynes@368
    31
#include "sh4/sh4trans.h"
nkeynes@671
    32
#include "sh4/sh4stat.h"
nkeynes@388
    33
#include "sh4/sh4mmio.h"
nkeynes@939
    34
#include "sh4/mmu.h"
nkeynes@991
    35
#include "xlat/xltcache.h"
nkeynes@991
    36
#include "xlat/x86/x86op.h"
nkeynes@1263
    37
#include "xlat/xlatdasm.h"
nkeynes@368
    38
#include "clock.h"
nkeynes@368
    39
nkeynes@368
    40
#define DEFAULT_BACKPATCH_SIZE 4096
nkeynes@368
    41
nkeynes@991
    42
/* Offset of a reg relative to the sh4r structure */
nkeynes@991
    43
#define REG_OFFSET(reg)  (((char *)&sh4r.reg) - ((char *)&sh4r) - 128)
nkeynes@991
    44
nkeynes@995
    45
#define R_T      REG_OFFSET(t)
nkeynes@995
    46
#define R_Q      REG_OFFSET(q)
nkeynes@995
    47
#define R_S      REG_OFFSET(s)
nkeynes@995
    48
#define R_M      REG_OFFSET(m)
nkeynes@995
    49
#define R_SR     REG_OFFSET(sr)
nkeynes@995
    50
#define R_GBR    REG_OFFSET(gbr)
nkeynes@995
    51
#define R_SSR    REG_OFFSET(ssr)
nkeynes@995
    52
#define R_SPC    REG_OFFSET(spc)
nkeynes@995
    53
#define R_VBR    REG_OFFSET(vbr)
nkeynes@995
    54
#define R_MACH   REG_OFFSET(mac)+4
nkeynes@995
    55
#define R_MACL   REG_OFFSET(mac)
nkeynes@995
    56
#define R_PC     REG_OFFSET(pc)
nkeynes@991
    57
#define R_NEW_PC REG_OFFSET(new_pc)
nkeynes@995
    58
#define R_PR     REG_OFFSET(pr)
nkeynes@995
    59
#define R_SGR    REG_OFFSET(sgr)
nkeynes@995
    60
#define R_FPUL   REG_OFFSET(fpul)
nkeynes@995
    61
#define R_FPSCR  REG_OFFSET(fpscr)
nkeynes@995
    62
#define R_DBR    REG_OFFSET(dbr)
nkeynes@995
    63
#define R_R(rn)  REG_OFFSET(r[rn])
nkeynes@995
    64
#define R_FR(f)  REG_OFFSET(fr[0][(f)^1])
nkeynes@995
    65
#define R_XF(f)  REG_OFFSET(fr[1][(f)^1])
nkeynes@995
    66
#define R_DR(f)  REG_OFFSET(fr[(f)&1][(f)&0x0E])
nkeynes@995
    67
#define R_DRL(f) REG_OFFSET(fr[(f)&1][(f)|0x01])
nkeynes@995
    68
#define R_DRH(f) REG_OFFSET(fr[(f)&1][(f)&0x0E])
nkeynes@995
    69
nkeynes@995
    70
#define DELAY_NONE 0
nkeynes@995
    71
#define DELAY_PC 1
nkeynes@995
    72
#define DELAY_PC_PR 2
nkeynes@991
    73
nkeynes@1112
    74
#define SH4_MODE_UNKNOWN -1
nkeynes@1112
    75
nkeynes@586
    76
struct backpatch_record {
nkeynes@604
    77
    uint32_t fixup_offset;
nkeynes@586
    78
    uint32_t fixup_icount;
nkeynes@596
    79
    int32_t exc_code;
nkeynes@586
    80
};
nkeynes@586
    81
nkeynes@368
    82
/** 
nkeynes@368
    83
 * Struct to manage internal translation state. This state is not saved -
nkeynes@368
    84
 * it is only valid between calls to sh4_translate_begin_block() and
nkeynes@368
    85
 * sh4_translate_end_block()
nkeynes@368
    86
 */
nkeynes@368
    87
struct sh4_x86_state {
nkeynes@590
    88
    int in_delay_slot;
nkeynes@1112
    89
    uint8_t *code;
nkeynes@368
    90
    gboolean fpuen_checked; /* true if we've already checked fpu enabled. */
nkeynes@409
    91
    gboolean branch_taken; /* true if we branched unconditionally */
nkeynes@901
    92
    gboolean double_prec; /* true if FPU is in double-precision mode */
nkeynes@903
    93
    gboolean double_size; /* true if FPU is in double-size mode */
nkeynes@903
    94
    gboolean sse3_enabled; /* true if host supports SSE3 instructions */
nkeynes@408
    95
    uint32_t block_start_pc;
nkeynes@547
    96
    uint32_t stack_posn;   /* Trace stack height for alignment purposes */
nkeynes@1112
    97
    uint32_t sh4_mode;     /* Mirror of sh4r.xlat_sh4_mode */
nkeynes@417
    98
    int tstate;
nkeynes@368
    99
nkeynes@1125
   100
    /* mode settings */
nkeynes@586
   101
    gboolean tlb_on; /* True if tlb translation is active */
nkeynes@1125
   102
    struct mem_region_fn **priv_address_space;
nkeynes@1125
   103
    struct mem_region_fn **user_address_space;
nkeynes@586
   104
nkeynes@1125
   105
    /* Instrumentation */
nkeynes@1125
   106
    xlat_block_begin_callback_t begin_callback;
nkeynes@1125
   107
    xlat_block_end_callback_t end_callback;
nkeynes@1125
   108
    gboolean fastmem;
nkeynes@1125
   109
    
nkeynes@368
   110
    /* Allocated memory for the (block-wide) back-patch list */
nkeynes@586
   111
    struct backpatch_record *backpatch_list;
nkeynes@368
   112
    uint32_t backpatch_posn;
nkeynes@368
   113
    uint32_t backpatch_size;
nkeynes@368
   114
};
nkeynes@368
   115
nkeynes@368
   116
static struct sh4_x86_state sh4_x86;
nkeynes@368
   117
nkeynes@388
   118
static uint32_t max_int = 0x7FFFFFFF;
nkeynes@388
   119
static uint32_t min_int = 0x80000000;
nkeynes@394
   120
static uint32_t save_fcw; /* save value for fpu control word */
nkeynes@394
   121
static uint32_t trunc_fcw = 0x0F7F; /* fcw value for truncation mode */
nkeynes@386
   122
nkeynes@1214
   123
static void sh4_x86_translate_unlink_block( void *use_list );
nkeynes@1196
   124
nkeynes@1214
   125
static struct xlat_target_fns x86_target_fns = {
nkeynes@1214
   126
	sh4_x86_translate_unlink_block
nkeynes@1214
   127
};	
nkeynes@1214
   128
nkeynes@1091
   129
nkeynes@903
   130
gboolean is_sse3_supported()
nkeynes@903
   131
{
nkeynes@903
   132
    uint32_t features;
nkeynes@903
   133
    
nkeynes@903
   134
    __asm__ __volatile__(
nkeynes@903
   135
        "mov $0x01, %%eax\n\t"
nkeynes@908
   136
        "cpuid\n\t" : "=c" (features) : : "eax", "edx", "ebx");
nkeynes@903
   137
    return (features & 1) ? TRUE : FALSE;
nkeynes@903
   138
}
nkeynes@903
   139
nkeynes@1125
   140
void sh4_translate_set_address_space( struct mem_region_fn **priv, struct mem_region_fn **user )
nkeynes@1125
   141
{
nkeynes@1125
   142
    sh4_x86.priv_address_space = priv;
nkeynes@1125
   143
    sh4_x86.user_address_space = user;
nkeynes@1125
   144
}
nkeynes@1125
   145
nkeynes@669
   146
void sh4_translate_init(void)
nkeynes@368
   147
{
nkeynes@368
   148
    sh4_x86.backpatch_list = malloc(DEFAULT_BACKPATCH_SIZE);
nkeynes@586
   149
    sh4_x86.backpatch_size = DEFAULT_BACKPATCH_SIZE / sizeof(struct backpatch_record);
nkeynes@1125
   150
    sh4_x86.begin_callback = NULL;
nkeynes@1125
   151
    sh4_x86.end_callback = NULL;
nkeynes@1125
   152
    sh4_translate_set_address_space( sh4_address_space, sh4_user_address_space );
nkeynes@1125
   153
    sh4_x86.fastmem = TRUE;
nkeynes@903
   154
    sh4_x86.sse3_enabled = is_sse3_supported();
nkeynes@1216
   155
    xlat_set_target_fns(&x86_target_fns);
nkeynes@368
   156
}
nkeynes@368
   157
nkeynes@1125
   158
void sh4_translate_set_callbacks( xlat_block_begin_callback_t begin, xlat_block_end_callback_t end )
nkeynes@1125
   159
{
nkeynes@1125
   160
    sh4_x86.begin_callback = begin;
nkeynes@1125
   161
    sh4_x86.end_callback = end;
nkeynes@1125
   162
}
nkeynes@1125
   163
nkeynes@1125
   164
void sh4_translate_set_fastmem( gboolean flag )
nkeynes@1125
   165
{
nkeynes@1125
   166
    sh4_x86.fastmem = flag;
nkeynes@1125
   167
}
nkeynes@1125
   168
nkeynes@586
   169
static void sh4_x86_add_backpatch( uint8_t *fixup_addr, uint32_t fixup_pc, uint32_t exc_code )
nkeynes@368
   170
{
nkeynes@991
   171
    int reloc_size = 4;
nkeynes@991
   172
    
nkeynes@991
   173
    if( exc_code == -2 ) {
nkeynes@991
   174
        reloc_size = sizeof(void *);
nkeynes@991
   175
    }
nkeynes@991
   176
    
nkeynes@368
   177
    if( sh4_x86.backpatch_posn == sh4_x86.backpatch_size ) {
nkeynes@368
   178
	sh4_x86.backpatch_size <<= 1;
nkeynes@586
   179
	sh4_x86.backpatch_list = realloc( sh4_x86.backpatch_list, 
nkeynes@586
   180
					  sh4_x86.backpatch_size * sizeof(struct backpatch_record));
nkeynes@368
   181
	assert( sh4_x86.backpatch_list != NULL );
nkeynes@368
   182
    }
nkeynes@586
   183
    if( sh4_x86.in_delay_slot ) {
nkeynes@586
   184
	fixup_pc -= 2;
nkeynes@586
   185
    }
nkeynes@991
   186
nkeynes@604
   187
    sh4_x86.backpatch_list[sh4_x86.backpatch_posn].fixup_offset = 
nkeynes@991
   188
	(((uint8_t *)fixup_addr) - ((uint8_t *)xlat_current_block->code)) - reloc_size;
nkeynes@586
   189
    sh4_x86.backpatch_list[sh4_x86.backpatch_posn].fixup_icount = (fixup_pc - sh4_x86.block_start_pc)>>1;
nkeynes@586
   190
    sh4_x86.backpatch_list[sh4_x86.backpatch_posn].exc_code = exc_code;
nkeynes@586
   191
    sh4_x86.backpatch_posn++;
nkeynes@368
   192
}
nkeynes@368
   193
nkeynes@991
   194
#define TSTATE_NONE -1
nkeynes@995
   195
#define TSTATE_O    X86_COND_O
nkeynes@995
   196
#define TSTATE_C    X86_COND_C
nkeynes@995
   197
#define TSTATE_E    X86_COND_E
nkeynes@995
   198
#define TSTATE_NE   X86_COND_NE
nkeynes@995
   199
#define TSTATE_G    X86_COND_G
nkeynes@995
   200
#define TSTATE_GE   X86_COND_GE
nkeynes@995
   201
#define TSTATE_A    X86_COND_A
nkeynes@995
   202
#define TSTATE_AE   X86_COND_AE
nkeynes@359
   203
nkeynes@991
   204
#define MARK_JMP8(x) uint8_t *_mark_jmp_##x = (xlat_output-1)
nkeynes@991
   205
#define JMP_TARGET(x) *_mark_jmp_##x += (xlat_output - _mark_jmp_##x)
nkeynes@368
   206
nkeynes@991
   207
/* Convenience instructions */
nkeynes@991
   208
#define LDC_t()          CMPB_imms_rbpdisp(1,R_T); CMC()
nkeynes@991
   209
#define SETE_t()         SETCCB_cc_rbpdisp(X86_COND_E,R_T)
nkeynes@991
   210
#define SETA_t()         SETCCB_cc_rbpdisp(X86_COND_A,R_T)
nkeynes@991
   211
#define SETAE_t()        SETCCB_cc_rbpdisp(X86_COND_AE,R_T)
nkeynes@991
   212
#define SETG_t()         SETCCB_cc_rbpdisp(X86_COND_G,R_T)
nkeynes@991
   213
#define SETGE_t()        SETCCB_cc_rbpdisp(X86_COND_GE,R_T)
nkeynes@991
   214
#define SETC_t()         SETCCB_cc_rbpdisp(X86_COND_C,R_T)
nkeynes@991
   215
#define SETO_t()         SETCCB_cc_rbpdisp(X86_COND_O,R_T)
nkeynes@991
   216
#define SETNE_t()        SETCCB_cc_rbpdisp(X86_COND_NE,R_T)
nkeynes@991
   217
#define SETC_r8(r1)      SETCCB_cc_r8(X86_COND_C, r1)
nkeynes@991
   218
#define JAE_label(label) JCC_cc_rel8(X86_COND_AE,-1); MARK_JMP8(label)
nkeynes@1112
   219
#define JBE_label(label) JCC_cc_rel8(X86_COND_BE,-1); MARK_JMP8(label)
nkeynes@991
   220
#define JE_label(label)  JCC_cc_rel8(X86_COND_E,-1); MARK_JMP8(label)
nkeynes@991
   221
#define JGE_label(label) JCC_cc_rel8(X86_COND_GE,-1); MARK_JMP8(label)
nkeynes@991
   222
#define JNA_label(label) JCC_cc_rel8(X86_COND_NA,-1); MARK_JMP8(label)
nkeynes@991
   223
#define JNE_label(label) JCC_cc_rel8(X86_COND_NE,-1); MARK_JMP8(label)
nkeynes@991
   224
#define JNO_label(label) JCC_cc_rel8(X86_COND_NO,-1); MARK_JMP8(label)
nkeynes@1197
   225
#define JP_label(label)  JCC_cc_rel8(X86_COND_P,-1); MARK_JMP8(label)
nkeynes@991
   226
#define JS_label(label)  JCC_cc_rel8(X86_COND_S,-1); MARK_JMP8(label)
nkeynes@991
   227
#define JMP_label(label) JMP_rel8(-1); MARK_JMP8(label)
nkeynes@991
   228
#define JNE_exc(exc)     JCC_cc_rel32(X86_COND_NE,0); sh4_x86_add_backpatch(xlat_output, pc, exc)
nkeynes@374
   229
nkeynes@1197
   230
#define LOAD_t() if( sh4_x86.tstate == TSTATE_NONE ) { \
nkeynes@1197
   231
	CMPL_imms_rbpdisp( 1, R_T ); sh4_x86.tstate = TSTATE_E; }     
nkeynes@1197
   232
nkeynes@991
   233
/** Branch if T is set (either in the current cflags, or in sh4r.t) */
nkeynes@1197
   234
#define JT_label(label) LOAD_t() \
nkeynes@991
   235
    JCC_cc_rel8(sh4_x86.tstate,-1); MARK_JMP8(label)
nkeynes@368
   236
nkeynes@991
   237
/** Branch if T is clear (either in the current cflags or in sh4r.t) */
nkeynes@1197
   238
#define JF_label(label) LOAD_t() \
nkeynes@991
   239
    JCC_cc_rel8(sh4_x86.tstate^1, -1); MARK_JMP8(label)
nkeynes@359
   240
nkeynes@939
   241
nkeynes@991
   242
#define load_reg(x86reg,sh4reg)     MOVL_rbpdisp_r32( REG_OFFSET(r[sh4reg]), x86reg )
nkeynes@991
   243
#define store_reg(x86reg,sh4reg)    MOVL_r32_rbpdisp( x86reg, REG_OFFSET(r[sh4reg]) )
nkeynes@374
   244
nkeynes@375
   245
/**
nkeynes@375
   246
 * Load an FR register (single-precision floating point) into an integer x86
nkeynes@375
   247
 * register (eg for register-to-register moves)
nkeynes@375
   248
 */
nkeynes@991
   249
#define load_fr(reg,frm)  MOVL_rbpdisp_r32( REG_OFFSET(fr[0][(frm)^1]), reg )
nkeynes@991
   250
#define load_xf(reg,frm)  MOVL_rbpdisp_r32( REG_OFFSET(fr[1][(frm)^1]), reg )
nkeynes@375
   251
nkeynes@375
   252
/**
nkeynes@669
   253
 * Load the low half of a DR register (DR or XD) into an integer x86 register 
nkeynes@669
   254
 */
nkeynes@991
   255
#define load_dr0(reg,frm) MOVL_rbpdisp_r32( REG_OFFSET(fr[frm&1][frm|0x01]), reg )
nkeynes@991
   256
#define load_dr1(reg,frm) MOVL_rbpdisp_r32( REG_OFFSET(fr[frm&1][frm&0x0E]), reg )
nkeynes@669
   257
nkeynes@669
   258
/**
nkeynes@669
   259
 * Store an FR register (single-precision floating point) from an integer x86+
nkeynes@375
   260
 * register (eg for register-to-register moves)
nkeynes@375
   261
 */
nkeynes@991
   262
#define store_fr(reg,frm) MOVL_r32_rbpdisp( reg, REG_OFFSET(fr[0][(frm)^1]) )
nkeynes@991
   263
#define store_xf(reg,frm) MOVL_r32_rbpdisp( reg, REG_OFFSET(fr[1][(frm)^1]) )
nkeynes@375
   264
nkeynes@991
   265
#define store_dr0(reg,frm) MOVL_r32_rbpdisp( reg, REG_OFFSET(fr[frm&1][frm|0x01]) )
nkeynes@991
   266
#define store_dr1(reg,frm) MOVL_r32_rbpdisp( reg, REG_OFFSET(fr[frm&1][frm&0x0E]) )
nkeynes@375
   267
nkeynes@374
   268
nkeynes@991
   269
#define push_fpul()  FLDF_rbpdisp(R_FPUL)
nkeynes@991
   270
#define pop_fpul()   FSTPF_rbpdisp(R_FPUL)
nkeynes@991
   271
#define push_fr(frm) FLDF_rbpdisp( REG_OFFSET(fr[0][(frm)^1]) )
nkeynes@991
   272
#define pop_fr(frm)  FSTPF_rbpdisp( REG_OFFSET(fr[0][(frm)^1]) )
nkeynes@991
   273
#define push_xf(frm) FLDF_rbpdisp( REG_OFFSET(fr[1][(frm)^1]) )
nkeynes@991
   274
#define pop_xf(frm)  FSTPF_rbpdisp( REG_OFFSET(fr[1][(frm)^1]) )
nkeynes@991
   275
#define push_dr(frm) FLDD_rbpdisp( REG_OFFSET(fr[0][(frm)&0x0E]) )
nkeynes@991
   276
#define pop_dr(frm)  FSTPD_rbpdisp( REG_OFFSET(fr[0][(frm)&0x0E]) )
nkeynes@991
   277
#define push_xdr(frm) FLDD_rbpdisp( REG_OFFSET(fr[1][(frm)&0x0E]) )
nkeynes@991
   278
#define pop_xdr(frm)  FSTPD_rbpdisp( REG_OFFSET(fr[1][(frm)&0x0E]) )
nkeynes@377
   279
nkeynes@991
   280
#ifdef ENABLE_SH4STATS
nkeynes@995
   281
#define COUNT_INST(id) MOVL_imm32_r32( id, REG_EAX ); CALL1_ptr_r32(sh4_stats_add, REG_EAX); sh4_x86.tstate = TSTATE_NONE
nkeynes@991
   282
#else
nkeynes@991
   283
#define COUNT_INST(id)
nkeynes@991
   284
#endif
nkeynes@377
   285
nkeynes@374
   286
nkeynes@368
   287
/* Exception checks - Note that all exception checks will clobber EAX */
nkeynes@416
   288
nkeynes@416
   289
#define check_priv( ) \
nkeynes@1112
   290
    if( (sh4_x86.sh4_mode & SR_MD) == 0 ) { \
nkeynes@937
   291
        if( sh4_x86.in_delay_slot ) { \
nkeynes@1191
   292
            exit_block_exc(EXC_SLOT_ILLEGAL, (pc-2), 4 ); \
nkeynes@937
   293
        } else { \
nkeynes@1191
   294
            exit_block_exc(EXC_ILLEGAL, pc, 2); \
nkeynes@937
   295
        } \
nkeynes@956
   296
        sh4_x86.branch_taken = TRUE; \
nkeynes@937
   297
        sh4_x86.in_delay_slot = DELAY_NONE; \
nkeynes@937
   298
        return 2; \
nkeynes@937
   299
    }
nkeynes@416
   300
nkeynes@416
   301
#define check_fpuen( ) \
nkeynes@416
   302
    if( !sh4_x86.fpuen_checked ) {\
nkeynes@416
   303
	sh4_x86.fpuen_checked = TRUE;\
nkeynes@995
   304
	MOVL_rbpdisp_r32( R_SR, REG_EAX );\
nkeynes@991
   305
	ANDL_imms_r32( SR_FD, REG_EAX );\
nkeynes@416
   306
	if( sh4_x86.in_delay_slot ) {\
nkeynes@586
   307
	    JNE_exc(EXC_SLOT_FPU_DISABLED);\
nkeynes@416
   308
	} else {\
nkeynes@586
   309
	    JNE_exc(EXC_FPU_DISABLED);\
nkeynes@416
   310
	}\
nkeynes@875
   311
	sh4_x86.tstate = TSTATE_NONE; \
nkeynes@416
   312
    }
nkeynes@416
   313
nkeynes@586
   314
#define check_ralign16( x86reg ) \
nkeynes@991
   315
    TESTL_imms_r32( 0x00000001, x86reg ); \
nkeynes@586
   316
    JNE_exc(EXC_DATA_ADDR_READ)
nkeynes@416
   317
nkeynes@586
   318
#define check_walign16( x86reg ) \
nkeynes@991
   319
    TESTL_imms_r32( 0x00000001, x86reg ); \
nkeynes@586
   320
    JNE_exc(EXC_DATA_ADDR_WRITE);
nkeynes@368
   321
nkeynes@586
   322
#define check_ralign32( x86reg ) \
nkeynes@991
   323
    TESTL_imms_r32( 0x00000003, x86reg ); \
nkeynes@586
   324
    JNE_exc(EXC_DATA_ADDR_READ)
nkeynes@368
   325
nkeynes@586
   326
#define check_walign32( x86reg ) \
nkeynes@991
   327
    TESTL_imms_r32( 0x00000003, x86reg ); \
nkeynes@586
   328
    JNE_exc(EXC_DATA_ADDR_WRITE);
nkeynes@368
   329
nkeynes@732
   330
#define check_ralign64( x86reg ) \
nkeynes@991
   331
    TESTL_imms_r32( 0x00000007, x86reg ); \
nkeynes@732
   332
    JNE_exc(EXC_DATA_ADDR_READ)
nkeynes@732
   333
nkeynes@732
   334
#define check_walign64( x86reg ) \
nkeynes@991
   335
    TESTL_imms_r32( 0x00000007, x86reg ); \
nkeynes@732
   336
    JNE_exc(EXC_DATA_ADDR_WRITE);
nkeynes@732
   337
nkeynes@1125
   338
#define address_space() ((sh4_x86.sh4_mode&SR_MD) ? (uintptr_t)sh4_x86.priv_address_space : (uintptr_t)sh4_x86.user_address_space)
nkeynes@1004
   339
nkeynes@824
   340
#define UNDEF(ir)
nkeynes@939
   341
/* Note: For SR.MD == 1 && MMUCR.AT == 0, there are no memory exceptions, so 
nkeynes@939
   342
 * don't waste the cycles expecting them. Otherwise we need to save the exception pointer.
nkeynes@586
   343
 */
nkeynes@941
   344
#ifdef HAVE_FRAME_ADDRESS
nkeynes@995
   345
static void call_read_func(int addr_reg, int value_reg, int offset, int pc)
nkeynes@995
   346
{
nkeynes@1004
   347
    decode_address(address_space(), addr_reg);
nkeynes@1112
   348
    if( !sh4_x86.tlb_on && (sh4_x86.sh4_mode & SR_MD) ) { 
nkeynes@995
   349
        CALL1_r32disp_r32(REG_ECX, offset, addr_reg);
nkeynes@995
   350
    } else {
nkeynes@995
   351
        if( addr_reg != REG_ARG1 ) {
nkeynes@995
   352
            MOVL_r32_r32( addr_reg, REG_ARG1 );
nkeynes@995
   353
        }
nkeynes@995
   354
        MOVP_immptr_rptr( 0, REG_ARG2 );
nkeynes@995
   355
        sh4_x86_add_backpatch( xlat_output, pc, -2 );
nkeynes@995
   356
        CALL2_r32disp_r32_r32(REG_ECX, offset, REG_ARG1, REG_ARG2);
nkeynes@995
   357
    }
nkeynes@995
   358
    if( value_reg != REG_RESULT1 ) { 
nkeynes@995
   359
        MOVL_r32_r32( REG_RESULT1, value_reg );
nkeynes@995
   360
    }
nkeynes@995
   361
}
nkeynes@995
   362
nkeynes@995
   363
static void call_write_func(int addr_reg, int value_reg, int offset, int pc)
nkeynes@995
   364
{
nkeynes@1004
   365
    decode_address(address_space(), addr_reg);
nkeynes@1112
   366
    if( !sh4_x86.tlb_on && (sh4_x86.sh4_mode & SR_MD) ) { 
nkeynes@995
   367
        CALL2_r32disp_r32_r32(REG_ECX, offset, addr_reg, value_reg);
nkeynes@995
   368
    } else {
nkeynes@995
   369
        if( value_reg != REG_ARG2 ) {
nkeynes@995
   370
            MOVL_r32_r32( value_reg, REG_ARG2 );
nkeynes@995
   371
	}        
nkeynes@995
   372
        if( addr_reg != REG_ARG1 ) {
nkeynes@995
   373
            MOVL_r32_r32( addr_reg, REG_ARG1 );
nkeynes@995
   374
        }
nkeynes@995
   375
#if MAX_REG_ARG > 2        
nkeynes@995
   376
        MOVP_immptr_rptr( 0, REG_ARG3 );
nkeynes@995
   377
        sh4_x86_add_backpatch( xlat_output, pc, -2 );
nkeynes@995
   378
        CALL3_r32disp_r32_r32_r32(REG_ECX, offset, REG_ARG1, REG_ARG2, REG_ARG3);
nkeynes@995
   379
#else
nkeynes@995
   380
        MOVL_imm32_rspdisp( 0, 0 );
nkeynes@995
   381
        sh4_x86_add_backpatch( xlat_output, pc, -2 );
nkeynes@995
   382
        CALL3_r32disp_r32_r32_r32(REG_ECX, offset, REG_ARG1, REG_ARG2, 0);
nkeynes@995
   383
#endif
nkeynes@995
   384
    }
nkeynes@995
   385
}
nkeynes@995
   386
#else
nkeynes@995
   387
static void call_read_func(int addr_reg, int value_reg, int offset, int pc)
nkeynes@995
   388
{
nkeynes@1004
   389
    decode_address(address_space(), addr_reg);
nkeynes@995
   390
    CALL1_r32disp_r32(REG_ECX, offset, addr_reg);
nkeynes@995
   391
    if( value_reg != REG_RESULT1 ) {
nkeynes@995
   392
        MOVL_r32_r32( REG_RESULT1, value_reg );
nkeynes@995
   393
    }
nkeynes@995
   394
}     
nkeynes@995
   395
nkeynes@996
   396
static void call_write_func(int addr_reg, int value_reg, int offset, int pc)
nkeynes@995
   397
{
nkeynes@1004
   398
    decode_address(address_space(), addr_reg);
nkeynes@995
   399
    CALL2_r32disp_r32_r32(REG_ECX, offset, addr_reg, value_reg);
nkeynes@995
   400
}
nkeynes@941
   401
#endif
nkeynes@939
   402
                
nkeynes@995
   403
#define MEM_REGION_PTR(name) offsetof( struct mem_region_fn, name )
nkeynes@995
   404
#define MEM_READ_BYTE( addr_reg, value_reg ) call_read_func(addr_reg, value_reg, MEM_REGION_PTR(read_byte), pc)
nkeynes@995
   405
#define MEM_READ_BYTE_FOR_WRITE( addr_reg, value_reg ) call_read_func( addr_reg, value_reg, MEM_REGION_PTR(read_byte_for_write), pc) 
nkeynes@995
   406
#define MEM_READ_WORD( addr_reg, value_reg ) call_read_func(addr_reg, value_reg, MEM_REGION_PTR(read_word), pc)
nkeynes@995
   407
#define MEM_READ_LONG( addr_reg, value_reg ) call_read_func(addr_reg, value_reg, MEM_REGION_PTR(read_long), pc)
nkeynes@995
   408
#define MEM_WRITE_BYTE( addr_reg, value_reg ) call_write_func(addr_reg, value_reg, MEM_REGION_PTR(write_byte), pc)
nkeynes@995
   409
#define MEM_WRITE_WORD( addr_reg, value_reg ) call_write_func(addr_reg, value_reg, MEM_REGION_PTR(write_word), pc)
nkeynes@995
   410
#define MEM_WRITE_LONG( addr_reg, value_reg ) call_write_func(addr_reg, value_reg, MEM_REGION_PTR(write_long), pc)
nkeynes@995
   411
#define MEM_PREFETCH( addr_reg ) call_read_func(addr_reg, REG_RESULT1, MEM_REGION_PTR(prefetch), pc)
nkeynes@368
   412
nkeynes@1191
   413
#define SLOTILLEGAL() exit_block_exc(EXC_SLOT_ILLEGAL, pc-2, 4); sh4_x86.in_delay_slot = DELAY_NONE; return 2;
nkeynes@539
   414
nkeynes@1182
   415
/** Offset of xlat_sh4_mode field relative to the code pointer */ 
nkeynes@1186
   416
#define XLAT_SH4_MODE_CODE_OFFSET  (int32_t)(offsetof(struct xlat_cache_block, xlat_sh4_mode) - offsetof(struct xlat_cache_block,code) )
nkeynes@1186
   417
#define XLAT_CHAIN_CODE_OFFSET (int32_t)(offsetof(struct xlat_cache_block, chain) - offsetof(struct xlat_cache_block,code) )
nkeynes@1186
   418
#define XLAT_ACTIVE_CODE_OFFSET (int32_t)(offsetof(struct xlat_cache_block, active) - offsetof(struct xlat_cache_block,code) )
nkeynes@1182
   419
nkeynes@901
   420
void sh4_translate_begin_block( sh4addr_t pc ) 
nkeynes@901
   421
{
nkeynes@1112
   422
	sh4_x86.code = xlat_output;
nkeynes@901
   423
    sh4_x86.in_delay_slot = FALSE;
nkeynes@901
   424
    sh4_x86.fpuen_checked = FALSE;
nkeynes@901
   425
    sh4_x86.branch_taken = FALSE;
nkeynes@901
   426
    sh4_x86.backpatch_posn = 0;
nkeynes@901
   427
    sh4_x86.block_start_pc = pc;
nkeynes@939
   428
    sh4_x86.tlb_on = IS_TLB_ENABLED();
nkeynes@901
   429
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@901
   430
    sh4_x86.double_prec = sh4r.fpscr & FPSCR_PR;
nkeynes@903
   431
    sh4_x86.double_size = sh4r.fpscr & FPSCR_SZ;
nkeynes@1112
   432
    sh4_x86.sh4_mode = sh4r.xlat_sh4_mode;
nkeynes@1125
   433
    emit_prologue();
nkeynes@1125
   434
    if( sh4_x86.begin_callback ) {
nkeynes@1125
   435
        CALL_ptr( sh4_x86.begin_callback );
nkeynes@1125
   436
    }
nkeynes@1218
   437
    if( sh4_profile_blocks ) {
nkeynes@1186
   438
    	MOVP_immptr_rptr( sh4_x86.code + XLAT_ACTIVE_CODE_OFFSET, REG_EAX );
nkeynes@1182
   439
    	ADDL_imms_r32disp( 1, REG_EAX, 0 );
nkeynes@1182
   440
    }  
nkeynes@901
   441
}
nkeynes@901
   442
nkeynes@901
   443
nkeynes@593
   444
uint32_t sh4_translate_end_block_size()
nkeynes@593
   445
{
nkeynes@1196
   446
	uint32_t epilogue_size = EPILOGUE_SIZE;
nkeynes@1196
   447
	if( sh4_x86.end_callback ) {
nkeynes@1196
   448
	    epilogue_size += (CALL1_PTR_MIN_SIZE - 1);
nkeynes@1196
   449
	}
nkeynes@596
   450
    if( sh4_x86.backpatch_posn <= 3 ) {
nkeynes@1196
   451
        epilogue_size += (sh4_x86.backpatch_posn*(12+CALL1_PTR_MIN_SIZE));
nkeynes@596
   452
    } else {
nkeynes@1196
   453
        epilogue_size += (3*(12+CALL1_PTR_MIN_SIZE)) + (sh4_x86.backpatch_posn-3)*(15+CALL1_PTR_MIN_SIZE);
nkeynes@596
   454
    }
nkeynes@1196
   455
    return epilogue_size;
nkeynes@593
   456
}
nkeynes@593
   457
nkeynes@593
   458
nkeynes@590
   459
/**
nkeynes@590
   460
 * Embed a breakpoint into the generated code
nkeynes@590
   461
 */
nkeynes@586
   462
void sh4_translate_emit_breakpoint( sh4vma_t pc )
nkeynes@586
   463
{
nkeynes@995
   464
    MOVL_imm32_r32( pc, REG_EAX );
nkeynes@995
   465
    CALL1_ptr_r32( sh4_translate_breakpoint_hit, REG_EAX );
nkeynes@875
   466
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@586
   467
}
nkeynes@590
   468
nkeynes@601
   469
nkeynes@601
   470
#define UNTRANSLATABLE(pc) !IS_IN_ICACHE(pc)
nkeynes@601
   471
nkeynes@1112
   472
/**
nkeynes@1112
   473
 * Test if the loaded target code pointer in %eax is valid, and if so jump
nkeynes@1112
   474
 * directly into it, bypassing the normal exit.
nkeynes@1112
   475
 */
nkeynes@1112
   476
static void jump_next_block()
nkeynes@1112
   477
{
nkeynes@1149
   478
	uint8_t *ptr = xlat_output;
nkeynes@1112
   479
	TESTP_rptr_rptr(REG_EAX, REG_EAX);
nkeynes@1112
   480
	JE_label(nocode);
nkeynes@1112
   481
	if( sh4_x86.sh4_mode == SH4_MODE_UNKNOWN ) {
nkeynes@1112
   482
	    /* sr/fpscr was changed, possibly updated xlat_sh4_mode, so reload it */
nkeynes@1112
   483
	    MOVL_rbpdisp_r32( REG_OFFSET(xlat_sh4_mode), REG_ECX );
nkeynes@1112
   484
	    CMPL_r32_r32disp( REG_ECX, REG_EAX, XLAT_SH4_MODE_CODE_OFFSET );
nkeynes@1112
   485
	} else {
nkeynes@1112
   486
	    CMPL_imms_r32disp( sh4_x86.sh4_mode, REG_EAX, XLAT_SH4_MODE_CODE_OFFSET );
nkeynes@1112
   487
	}
nkeynes@1112
   488
	JNE_label(wrongmode);
nkeynes@1112
   489
	LEAP_rptrdisp_rptr(REG_EAX, PROLOGUE_SIZE,REG_EAX);
nkeynes@1125
   490
	if( sh4_x86.end_callback ) {
nkeynes@1125
   491
	    /* Note this does leave the stack out of alignment, but doesn't matter
nkeynes@1125
   492
	     * for what we're currently using it for.
nkeynes@1125
   493
	     */
nkeynes@1125
   494
	    PUSH_r32(REG_EAX);
nkeynes@1125
   495
	    MOVP_immptr_rptr(sh4_x86.end_callback, REG_ECX);
nkeynes@1125
   496
	    JMP_rptr(REG_ECX);
nkeynes@1125
   497
	} else {
nkeynes@1125
   498
	    JMP_rptr(REG_EAX);
nkeynes@1125
   499
	}
nkeynes@1149
   500
	JMP_TARGET(wrongmode);
nkeynes@1176
   501
	MOVP_rptrdisp_rptr( REG_EAX, XLAT_CHAIN_CODE_OFFSET, REG_EAX );
nkeynes@1149
   502
	int rel = ptr - xlat_output;
nkeynes@1149
   503
    JMP_prerel(rel);
nkeynes@1149
   504
	JMP_TARGET(nocode); 
nkeynes@1112
   505
}
nkeynes@1112
   506
nkeynes@1186
   507
/**
nkeynes@1186
   508
 * 
nkeynes@1186
   509
 */
nkeynes@1263
   510
void FASTCALL sh4_translate_link_block( uint32_t pc )
nkeynes@1186
   511
{
nkeynes@1186
   512
    uint8_t *target = (uint8_t *)xlat_get_code_by_vma(pc);
nkeynes@1186
   513
    while( target != NULL && sh4r.xlat_sh4_mode != XLAT_BLOCK_MODE(target) ) {
nkeynes@1186
   514
        target = XLAT_BLOCK_CHAIN(target);
nkeynes@1186
   515
	}
nkeynes@1186
   516
    if( target == NULL ) {
nkeynes@1186
   517
        target = sh4_translate_basic_block( pc );
nkeynes@1186
   518
    }
nkeynes@1186
   519
    uint8_t *backpatch = ((uint8_t *)__builtin_return_address(0)) - (CALL1_PTR_MIN_SIZE);
nkeynes@1186
   520
    *backpatch = 0xE9;
nkeynes@1186
   521
    *(uint32_t *)(backpatch+1) = (uint32_t)(target-backpatch)+PROLOGUE_SIZE-5;
nkeynes@1186
   522
    *(void **)(backpatch+5) = XLAT_BLOCK_FOR_CODE(target)->use_list;
nkeynes@1186
   523
    XLAT_BLOCK_FOR_CODE(target)->use_list = backpatch; 
nkeynes@1186
   524
nkeynes@1198
   525
    uint8_t * volatile *retptr = ((uint8_t * volatile *)__builtin_frame_address(0))+1;
nkeynes@1186
   526
    assert( *retptr == ((uint8_t *)__builtin_return_address(0)) );
nkeynes@1186
   527
	*retptr = backpatch;
nkeynes@1186
   528
}
nkeynes@1186
   529
nkeynes@1186
   530
static void emit_translate_and_backpatch()
nkeynes@1186
   531
{
nkeynes@1186
   532
    /* NB: this is either 7 bytes (i386) or 12 bytes (x86-64) */
nkeynes@1263
   533
    CALL1_ptr_r32(sh4_translate_link_block, REG_ARG1);
nkeynes@1186
   534
nkeynes@1186
   535
    /* When patched, the jmp instruction will be 5 bytes (either platform) -
nkeynes@1186
   536
     * we need to reserve sizeof(void*) bytes for the use-list
nkeynes@1186
   537
	 * pointer
nkeynes@1186
   538
	 */ 
nkeynes@1186
   539
    if( sizeof(void*) == 8 ) {
nkeynes@1186
   540
        NOP();
nkeynes@1186
   541
    } else {
nkeynes@1186
   542
        NOP2();
nkeynes@1186
   543
    }
nkeynes@1186
   544
}
nkeynes@1186
   545
nkeynes@1186
   546
/**
nkeynes@1186
   547
 * If we're jumping to a fixed address (or at least fixed relative to the
nkeynes@1186
   548
 * current PC, then we can do a direct branch. REG_ARG1 should contain
nkeynes@1186
   549
 * the PC at this point.
nkeynes@1186
   550
 */
nkeynes@1186
   551
static void jump_next_block_fixed_pc( sh4addr_t pc )
nkeynes@1186
   552
{
nkeynes@1186
   553
	if( IS_IN_ICACHE(pc) ) {
nkeynes@1194
   554
	    if( sh4_x86.sh4_mode != SH4_MODE_UNKNOWN && sh4_x86.end_callback == NULL ) {
nkeynes@1186
   555
	        /* Fixed address, in cache, and fixed SH4 mode - generate a call to the
nkeynes@1186
   556
	         * fetch-and-backpatch routine, which will replace the call with a branch */
nkeynes@1186
   557
           emit_translate_and_backpatch();	         
nkeynes@1186
   558
           return;
nkeynes@1186
   559
		} else {
nkeynes@1186
   560
            MOVP_moffptr_rax( xlat_get_lut_entry(GET_ICACHE_PHYS(pc)) );
nkeynes@1186
   561
            ANDP_imms_rptr( -4, REG_EAX );
nkeynes@1186
   562
        }
nkeynes@1186
   563
	} else if( sh4_x86.tlb_on ) {
nkeynes@1186
   564
        CALL1_ptr_r32(xlat_get_code_by_vma, REG_ARG1);
nkeynes@1186
   565
    } else {
nkeynes@1186
   566
        CALL1_ptr_r32(xlat_get_code, REG_ARG1);
nkeynes@1186
   567
    }
nkeynes@1186
   568
    jump_next_block();
nkeynes@1186
   569
nkeynes@1186
   570
nkeynes@1186
   571
}
nkeynes@1186
   572
nkeynes@1214
   573
static void sh4_x86_translate_unlink_block( void *use_list )
nkeynes@1186
   574
{
nkeynes@1186
   575
	uint8_t *tmp = xlat_output; /* In case something is active, which should never happen */
nkeynes@1186
   576
	void *next = use_list;
nkeynes@1186
   577
	while( next != NULL ) {
nkeynes@1186
   578
    	xlat_output = (uint8_t *)next;
nkeynes@1186
   579
 	    next = *(void **)(xlat_output+5);
nkeynes@1186
   580
 		emit_translate_and_backpatch();
nkeynes@1186
   581
 	}
nkeynes@1186
   582
 	xlat_output = tmp;
nkeynes@1186
   583
}
nkeynes@1186
   584
nkeynes@1186
   585
nkeynes@1186
   586
nkeynes@1125
   587
static void exit_block()
nkeynes@1125
   588
{
nkeynes@1125
   589
	emit_epilogue();
nkeynes@1125
   590
	if( sh4_x86.end_callback ) {
nkeynes@1125
   591
	    MOVP_immptr_rptr(sh4_x86.end_callback, REG_ECX);
nkeynes@1125
   592
	    JMP_rptr(REG_ECX);
nkeynes@1125
   593
	} else {
nkeynes@1125
   594
	    RET();
nkeynes@1125
   595
	}
nkeynes@1125
   596
}
nkeynes@1125
   597
nkeynes@590
   598
/**
nkeynes@995
   599
 * Exit the block with sh4r.pc already written
nkeynes@995
   600
 */
nkeynes@995
   601
void exit_block_pcset( sh4addr_t pc )
nkeynes@995
   602
{
nkeynes@995
   603
    MOVL_imm32_r32( ((pc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period, REG_ECX );
nkeynes@1112
   604
    ADDL_rbpdisp_r32( REG_OFFSET(slice_cycle), REG_ECX );
nkeynes@1112
   605
    MOVL_r32_rbpdisp( REG_ECX, REG_OFFSET(slice_cycle) );
nkeynes@1112
   606
    CMPL_r32_rbpdisp( REG_ECX, REG_OFFSET(event_pending) );
nkeynes@1112
   607
    JBE_label(exitloop);
nkeynes@995
   608
    MOVL_rbpdisp_r32( R_PC, REG_ARG1 );
nkeynes@995
   609
    if( sh4_x86.tlb_on ) {
nkeynes@995
   610
        CALL1_ptr_r32(xlat_get_code_by_vma,REG_ARG1);
nkeynes@995
   611
    } else {
nkeynes@995
   612
        CALL1_ptr_r32(xlat_get_code,REG_ARG1);
nkeynes@995
   613
    }
nkeynes@1112
   614
    
nkeynes@1112
   615
    jump_next_block();
nkeynes@1112
   616
    JMP_TARGET(exitloop);
nkeynes@995
   617
    exit_block();
nkeynes@995
   618
}
nkeynes@995
   619
nkeynes@995
   620
/**
nkeynes@995
   621
 * Exit the block with sh4r.new_pc written with the target pc
nkeynes@995
   622
 */
nkeynes@995
   623
void exit_block_newpcset( sh4addr_t pc )
nkeynes@995
   624
{
nkeynes@995
   625
    MOVL_imm32_r32( ((pc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period, REG_ECX );
nkeynes@1112
   626
    ADDL_rbpdisp_r32( REG_OFFSET(slice_cycle), REG_ECX );
nkeynes@1112
   627
    MOVL_r32_rbpdisp( REG_ECX, REG_OFFSET(slice_cycle) );
nkeynes@995
   628
    MOVL_rbpdisp_r32( R_NEW_PC, REG_ARG1 );
nkeynes@995
   629
    MOVL_r32_rbpdisp( REG_ARG1, R_PC );
nkeynes@1112
   630
    CMPL_r32_rbpdisp( REG_ECX, REG_OFFSET(event_pending) );
nkeynes@1112
   631
    JBE_label(exitloop);
nkeynes@995
   632
    if( sh4_x86.tlb_on ) {
nkeynes@995
   633
        CALL1_ptr_r32(xlat_get_code_by_vma,REG_ARG1);
nkeynes@995
   634
    } else {
nkeynes@995
   635
        CALL1_ptr_r32(xlat_get_code,REG_ARG1);
nkeynes@995
   636
    }
nkeynes@1112
   637
	
nkeynes@1112
   638
	jump_next_block();
nkeynes@1112
   639
    JMP_TARGET(exitloop);
nkeynes@995
   640
    exit_block();
nkeynes@995
   641
}
nkeynes@995
   642
nkeynes@995
   643
nkeynes@995
   644
/**
nkeynes@995
   645
 * Exit the block to an absolute PC
nkeynes@995
   646
 */
nkeynes@995
   647
void exit_block_abs( sh4addr_t pc, sh4addr_t endpc )
nkeynes@995
   648
{
nkeynes@1112
   649
    MOVL_imm32_r32( ((endpc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period, REG_ECX );
nkeynes@1112
   650
    ADDL_rbpdisp_r32( REG_OFFSET(slice_cycle), REG_ECX );
nkeynes@1112
   651
    MOVL_r32_rbpdisp( REG_ECX, REG_OFFSET(slice_cycle) );
nkeynes@1112
   652
nkeynes@1112
   653
    MOVL_imm32_r32( pc, REG_ARG1 );
nkeynes@1112
   654
    MOVL_r32_rbpdisp( REG_ARG1, R_PC );
nkeynes@1112
   655
    CMPL_r32_rbpdisp( REG_ECX, REG_OFFSET(event_pending) );
nkeynes@1112
   656
    JBE_label(exitloop);
nkeynes@1186
   657
    jump_next_block_fixed_pc(pc);    
nkeynes@1112
   658
    JMP_TARGET(exitloop);
nkeynes@995
   659
    exit_block();
nkeynes@995
   660
}
nkeynes@995
   661
nkeynes@995
   662
/**
nkeynes@995
   663
 * Exit the block to a relative PC
nkeynes@995
   664
 */
nkeynes@995
   665
void exit_block_rel( sh4addr_t pc, sh4addr_t endpc )
nkeynes@995
   666
{
nkeynes@1112
   667
    MOVL_imm32_r32( ((endpc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period, REG_ECX );
nkeynes@1112
   668
    ADDL_rbpdisp_r32( REG_OFFSET(slice_cycle), REG_ECX );
nkeynes@1112
   669
    MOVL_r32_rbpdisp( REG_ECX, REG_OFFSET(slice_cycle) );
nkeynes@1112
   670
nkeynes@1112
   671
	if( pc == sh4_x86.block_start_pc && sh4_x86.sh4_mode == sh4r.xlat_sh4_mode ) {
nkeynes@1112
   672
	    /* Special case for tight loops - the PC doesn't change, and
nkeynes@1112
   673
	     * we already know the target address. Just check events pending before
nkeynes@1112
   674
	     * looping.
nkeynes@1112
   675
	     */
nkeynes@1112
   676
        CMPL_r32_rbpdisp( REG_ECX, REG_OFFSET(event_pending) );
nkeynes@1112
   677
        uint32_t backdisp = ((uintptr_t)(sh4_x86.code - xlat_output)) + PROLOGUE_SIZE;
nkeynes@1112
   678
        JCC_cc_prerel(X86_COND_A, backdisp);
nkeynes@1112
   679
	} else {
nkeynes@1112
   680
        MOVL_imm32_r32( pc - sh4_x86.block_start_pc, REG_ARG1 );
nkeynes@1112
   681
        ADDL_rbpdisp_r32( R_PC, REG_ARG1 );
nkeynes@1112
   682
        MOVL_r32_rbpdisp( REG_ARG1, R_PC );
nkeynes@1112
   683
        CMPL_r32_rbpdisp( REG_ECX, REG_OFFSET(event_pending) );
nkeynes@1112
   684
        JBE_label(exitloop2);
nkeynes@1186
   685
        
nkeynes@1186
   686
        jump_next_block_fixed_pc(pc);
nkeynes@1112
   687
        JMP_TARGET(exitloop2);
nkeynes@995
   688
    }
nkeynes@995
   689
    exit_block();
nkeynes@995
   690
}
nkeynes@995
   691
nkeynes@995
   692
/**
nkeynes@995
   693
 * Exit unconditionally with a general exception
nkeynes@995
   694
 */
nkeynes@1191
   695
void exit_block_exc( int code, sh4addr_t pc, int inst_adjust )
nkeynes@995
   696
{
nkeynes@995
   697
    MOVL_imm32_r32( pc - sh4_x86.block_start_pc, REG_ECX );
nkeynes@995
   698
    ADDL_r32_rbpdisp( REG_ECX, R_PC );
nkeynes@1191
   699
    MOVL_imm32_r32( ((pc - sh4_x86.block_start_pc + inst_adjust)>>1)*sh4_cpu_period, REG_ECX );
nkeynes@995
   700
    ADDL_r32_rbpdisp( REG_ECX, REG_OFFSET(slice_cycle) );
nkeynes@995
   701
    MOVL_imm32_r32( code, REG_ARG1 );
nkeynes@995
   702
    CALL1_ptr_r32( sh4_raise_exception, REG_ARG1 );
nkeynes@995
   703
    exit_block();
nkeynes@995
   704
}    
nkeynes@995
   705
nkeynes@995
   706
/**
nkeynes@590
   707
 * Embed a call to sh4_execute_instruction for situations that we
nkeynes@601
   708
 * can't translate (just page-crossing delay slots at the moment).
nkeynes@601
   709
 * Caller is responsible for setting new_pc before calling this function.
nkeynes@601
   710
 *
nkeynes@601
   711
 * Performs:
nkeynes@601
   712
 *   Set PC = endpc
nkeynes@601
   713
 *   Set sh4r.in_delay_slot = sh4_x86.in_delay_slot
nkeynes@601
   714
 *   Update slice_cycle for endpc+2 (single step doesn't update slice_cycle)
nkeynes@601
   715
 *   Call sh4_execute_instruction
nkeynes@601
   716
 *   Call xlat_get_code_by_vma / xlat_get_code as for normal exit
nkeynes@590
   717
 */
nkeynes@601
   718
void exit_block_emu( sh4vma_t endpc )
nkeynes@590
   719
{
nkeynes@995
   720
    MOVL_imm32_r32( endpc - sh4_x86.block_start_pc, REG_ECX );   // 5
nkeynes@991
   721
    ADDL_r32_rbpdisp( REG_ECX, R_PC );
nkeynes@586
   722
    
nkeynes@995
   723
    MOVL_imm32_r32( (((endpc - sh4_x86.block_start_pc)>>1)+1)*sh4_cpu_period, REG_ECX ); // 5
nkeynes@991
   724
    ADDL_r32_rbpdisp( REG_ECX, REG_OFFSET(slice_cycle) );     // 6
nkeynes@995
   725
    MOVL_imm32_r32( sh4_x86.in_delay_slot ? 1 : 0, REG_ECX );
nkeynes@995
   726
    MOVL_r32_rbpdisp( REG_ECX, REG_OFFSET(in_delay_slot) );
nkeynes@590
   727
nkeynes@1112
   728
    CALL_ptr( sh4_execute_instruction );
nkeynes@926
   729
    exit_block();
nkeynes@590
   730
} 
nkeynes@539
   731
nkeynes@359
   732
/**
nkeynes@995
   733
 * Write the block trailer (exception handling block)
nkeynes@995
   734
 */
nkeynes@995
   735
void sh4_translate_end_block( sh4addr_t pc ) {
nkeynes@995
   736
    if( sh4_x86.branch_taken == FALSE ) {
nkeynes@995
   737
        // Didn't exit unconditionally already, so write the termination here
nkeynes@995
   738
        exit_block_rel( pc, pc );
nkeynes@995
   739
    }
nkeynes@995
   740
    if( sh4_x86.backpatch_posn != 0 ) {
nkeynes@995
   741
        unsigned int i;
nkeynes@995
   742
        // Exception raised - cleanup and exit
nkeynes@995
   743
        uint8_t *end_ptr = xlat_output;
nkeynes@995
   744
        MOVL_r32_r32( REG_EDX, REG_ECX );
nkeynes@995
   745
        ADDL_r32_r32( REG_EDX, REG_ECX );
nkeynes@995
   746
        ADDL_r32_rbpdisp( REG_ECX, R_SPC );
nkeynes@995
   747
        MOVL_moffptr_eax( &sh4_cpu_period );
nkeynes@1191
   748
        INC_r32( REG_EDX );  /* Add 1 for the aborting instruction itself */ 
nkeynes@995
   749
        MULL_r32( REG_EDX );
nkeynes@995
   750
        ADDL_r32_rbpdisp( REG_EAX, REG_OFFSET(slice_cycle) );
nkeynes@995
   751
        exit_block();
nkeynes@995
   752
nkeynes@995
   753
        for( i=0; i< sh4_x86.backpatch_posn; i++ ) {
nkeynes@995
   754
            uint32_t *fixup_addr = (uint32_t *)&xlat_current_block->code[sh4_x86.backpatch_list[i].fixup_offset];
nkeynes@995
   755
            if( sh4_x86.backpatch_list[i].exc_code < 0 ) {
nkeynes@995
   756
                if( sh4_x86.backpatch_list[i].exc_code == -2 ) {
nkeynes@995
   757
                    *((uintptr_t *)fixup_addr) = (uintptr_t)xlat_output; 
nkeynes@995
   758
                } else {
nkeynes@995
   759
                    *fixup_addr += xlat_output - (uint8_t *)&xlat_current_block->code[sh4_x86.backpatch_list[i].fixup_offset] - 4;
nkeynes@995
   760
                }
nkeynes@995
   761
                MOVL_imm32_r32( sh4_x86.backpatch_list[i].fixup_icount, REG_EDX );
nkeynes@995
   762
                int rel = end_ptr - xlat_output;
nkeynes@995
   763
                JMP_prerel(rel);
nkeynes@995
   764
            } else {
nkeynes@995
   765
                *fixup_addr += xlat_output - (uint8_t *)&xlat_current_block->code[sh4_x86.backpatch_list[i].fixup_offset] - 4;
nkeynes@995
   766
                MOVL_imm32_r32( sh4_x86.backpatch_list[i].exc_code, REG_ARG1 );
nkeynes@995
   767
                CALL1_ptr_r32( sh4_raise_exception, REG_ARG1 );
nkeynes@995
   768
                MOVL_imm32_r32( sh4_x86.backpatch_list[i].fixup_icount, REG_EDX );
nkeynes@995
   769
                int rel = end_ptr - xlat_output;
nkeynes@995
   770
                JMP_prerel(rel);
nkeynes@995
   771
            }
nkeynes@995
   772
        }
nkeynes@995
   773
    }
nkeynes@995
   774
}
nkeynes@539
   775
nkeynes@359
   776
/**
nkeynes@359
   777
 * Translate a single instruction. Delayed branches are handled specially
nkeynes@359
   778
 * by translating both branch and delayed instruction as a single unit (as
nkeynes@359
   779
 * 
nkeynes@586
   780
 * The instruction MUST be in the icache (assert check)
nkeynes@359
   781
 *
nkeynes@359
   782
 * @return true if the instruction marks the end of a basic block
nkeynes@359
   783
 * (eg a branch or 
nkeynes@359
   784
 */
nkeynes@590
   785
uint32_t sh4_translate_instruction( sh4vma_t pc )
nkeynes@359
   786
{
nkeynes@388
   787
    uint32_t ir;
nkeynes@586
   788
    /* Read instruction from icache */
nkeynes@586
   789
    assert( IS_IN_ICACHE(pc) );
nkeynes@586
   790
    ir = *(uint16_t *)GET_ICACHE_PTR(pc);
nkeynes@586
   791
    
nkeynes@586
   792
    if( !sh4_x86.in_delay_slot ) {
nkeynes@596
   793
	sh4_translate_add_recovery( (pc - sh4_x86.block_start_pc)>>1 );
nkeynes@388
   794
    }
nkeynes@1003
   795
    
nkeynes@1003
   796
    /* check for breakpoints at this pc */
nkeynes@1003
   797
    for( int i=0; i<sh4_breakpoint_count; i++ ) {
nkeynes@1003
   798
        if( sh4_breakpoints[i].address == pc ) {
nkeynes@1003
   799
            sh4_translate_emit_breakpoint(pc);
nkeynes@1003
   800
            break;
nkeynes@1003
   801
        }
nkeynes@571
   802
    }
nkeynes@359
   803
%%
nkeynes@359
   804
/* ALU operations */
nkeynes@359
   805
ADD Rm, Rn {:
nkeynes@671
   806
    COUNT_INST(I_ADD);
nkeynes@991
   807
    load_reg( REG_EAX, Rm );
nkeynes@991
   808
    load_reg( REG_ECX, Rn );
nkeynes@991
   809
    ADDL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
   810
    store_reg( REG_ECX, Rn );
nkeynes@417
   811
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
   812
:}
nkeynes@359
   813
ADD #imm, Rn {:  
nkeynes@671
   814
    COUNT_INST(I_ADDI);
nkeynes@991
   815
    ADDL_imms_rbpdisp( imm, REG_OFFSET(r[Rn]) );
nkeynes@417
   816
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
   817
:}
nkeynes@359
   818
ADDC Rm, Rn {:
nkeynes@671
   819
    COUNT_INST(I_ADDC);
nkeynes@417
   820
    if( sh4_x86.tstate != TSTATE_C ) {
nkeynes@911
   821
        LDC_t();
nkeynes@417
   822
    }
nkeynes@991
   823
    load_reg( REG_EAX, Rm );
nkeynes@991
   824
    load_reg( REG_ECX, Rn );
nkeynes@991
   825
    ADCL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
   826
    store_reg( REG_ECX, Rn );
nkeynes@359
   827
    SETC_t();
nkeynes@417
   828
    sh4_x86.tstate = TSTATE_C;
nkeynes@359
   829
:}
nkeynes@359
   830
ADDV Rm, Rn {:
nkeynes@671
   831
    COUNT_INST(I_ADDV);
nkeynes@991
   832
    load_reg( REG_EAX, Rm );
nkeynes@991
   833
    load_reg( REG_ECX, Rn );
nkeynes@991
   834
    ADDL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
   835
    store_reg( REG_ECX, Rn );
nkeynes@359
   836
    SETO_t();
nkeynes@417
   837
    sh4_x86.tstate = TSTATE_O;
nkeynes@359
   838
:}
nkeynes@359
   839
AND Rm, Rn {:
nkeynes@671
   840
    COUNT_INST(I_AND);
nkeynes@991
   841
    load_reg( REG_EAX, Rm );
nkeynes@991
   842
    load_reg( REG_ECX, Rn );
nkeynes@991
   843
    ANDL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
   844
    store_reg( REG_ECX, Rn );
nkeynes@417
   845
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
   846
:}
nkeynes@359
   847
AND #imm, R0 {:  
nkeynes@671
   848
    COUNT_INST(I_ANDI);
nkeynes@991
   849
    load_reg( REG_EAX, 0 );
nkeynes@991
   850
    ANDL_imms_r32(imm, REG_EAX); 
nkeynes@991
   851
    store_reg( REG_EAX, 0 );
nkeynes@417
   852
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
   853
:}
nkeynes@359
   854
AND.B #imm, @(R0, GBR) {: 
nkeynes@671
   855
    COUNT_INST(I_ANDB);
nkeynes@991
   856
    load_reg( REG_EAX, 0 );
nkeynes@991
   857
    ADDL_rbpdisp_r32( R_GBR, REG_EAX );
nkeynes@991
   858
    MOVL_r32_rspdisp(REG_EAX, 0);
nkeynes@991
   859
    MEM_READ_BYTE_FOR_WRITE( REG_EAX, REG_EDX );
nkeynes@991
   860
    MOVL_rspdisp_r32(0, REG_EAX);
nkeynes@991
   861
    ANDL_imms_r32(imm, REG_EDX );
nkeynes@991
   862
    MEM_WRITE_BYTE( REG_EAX, REG_EDX );
nkeynes@417
   863
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
   864
:}
nkeynes@359
   865
CMP/EQ Rm, Rn {:  
nkeynes@671
   866
    COUNT_INST(I_CMPEQ);
nkeynes@991
   867
    load_reg( REG_EAX, Rm );
nkeynes@991
   868
    load_reg( REG_ECX, Rn );
nkeynes@991
   869
    CMPL_r32_r32( REG_EAX, REG_ECX );
nkeynes@359
   870
    SETE_t();
nkeynes@417
   871
    sh4_x86.tstate = TSTATE_E;
nkeynes@359
   872
:}
nkeynes@359
   873
CMP/EQ #imm, R0 {:  
nkeynes@671
   874
    COUNT_INST(I_CMPEQI);
nkeynes@991
   875
    load_reg( REG_EAX, 0 );
nkeynes@991
   876
    CMPL_imms_r32(imm, REG_EAX);
nkeynes@359
   877
    SETE_t();
nkeynes@417
   878
    sh4_x86.tstate = TSTATE_E;
nkeynes@359
   879
:}
nkeynes@359
   880
CMP/GE Rm, Rn {:  
nkeynes@671
   881
    COUNT_INST(I_CMPGE);
nkeynes@991
   882
    load_reg( REG_EAX, Rm );
nkeynes@991
   883
    load_reg( REG_ECX, Rn );
nkeynes@991
   884
    CMPL_r32_r32( REG_EAX, REG_ECX );
nkeynes@359
   885
    SETGE_t();
nkeynes@417
   886
    sh4_x86.tstate = TSTATE_GE;
nkeynes@359
   887
:}
nkeynes@359
   888
CMP/GT Rm, Rn {: 
nkeynes@671
   889
    COUNT_INST(I_CMPGT);
nkeynes@991
   890
    load_reg( REG_EAX, Rm );
nkeynes@991
   891
    load_reg( REG_ECX, Rn );
nkeynes@991
   892
    CMPL_r32_r32( REG_EAX, REG_ECX );
nkeynes@359
   893
    SETG_t();
nkeynes@417
   894
    sh4_x86.tstate = TSTATE_G;
nkeynes@359
   895
:}
nkeynes@359
   896
CMP/HI Rm, Rn {:  
nkeynes@671
   897
    COUNT_INST(I_CMPHI);
nkeynes@991
   898
    load_reg( REG_EAX, Rm );
nkeynes@991
   899
    load_reg( REG_ECX, Rn );
nkeynes@991
   900
    CMPL_r32_r32( REG_EAX, REG_ECX );
nkeynes@359
   901
    SETA_t();
nkeynes@417
   902
    sh4_x86.tstate = TSTATE_A;
nkeynes@359
   903
:}
nkeynes@359
   904
CMP/HS Rm, Rn {: 
nkeynes@671
   905
    COUNT_INST(I_CMPHS);
nkeynes@991
   906
    load_reg( REG_EAX, Rm );
nkeynes@991
   907
    load_reg( REG_ECX, Rn );
nkeynes@991
   908
    CMPL_r32_r32( REG_EAX, REG_ECX );
nkeynes@359
   909
    SETAE_t();
nkeynes@417
   910
    sh4_x86.tstate = TSTATE_AE;
nkeynes@359
   911
 :}
nkeynes@359
   912
CMP/PL Rn {: 
nkeynes@671
   913
    COUNT_INST(I_CMPPL);
nkeynes@991
   914
    load_reg( REG_EAX, Rn );
nkeynes@991
   915
    CMPL_imms_r32( 0, REG_EAX );
nkeynes@359
   916
    SETG_t();
nkeynes@417
   917
    sh4_x86.tstate = TSTATE_G;
nkeynes@359
   918
:}
nkeynes@359
   919
CMP/PZ Rn {:  
nkeynes@671
   920
    COUNT_INST(I_CMPPZ);
nkeynes@991
   921
    load_reg( REG_EAX, Rn );
nkeynes@991
   922
    CMPL_imms_r32( 0, REG_EAX );
nkeynes@359
   923
    SETGE_t();
nkeynes@417
   924
    sh4_x86.tstate = TSTATE_GE;
nkeynes@359
   925
:}
nkeynes@361
   926
CMP/STR Rm, Rn {:  
nkeynes@671
   927
    COUNT_INST(I_CMPSTR);
nkeynes@991
   928
    load_reg( REG_EAX, Rm );
nkeynes@991
   929
    load_reg( REG_ECX, Rn );
nkeynes@991
   930
    XORL_r32_r32( REG_ECX, REG_EAX );
nkeynes@991
   931
    TESTB_r8_r8( REG_AL, REG_AL );
nkeynes@991
   932
    JE_label(target1);
nkeynes@991
   933
    TESTB_r8_r8( REG_AH, REG_AH );
nkeynes@991
   934
    JE_label(target2);
nkeynes@991
   935
    SHRL_imm_r32( 16, REG_EAX );
nkeynes@991
   936
    TESTB_r8_r8( REG_AL, REG_AL );
nkeynes@991
   937
    JE_label(target3);
nkeynes@991
   938
    TESTB_r8_r8( REG_AH, REG_AH );
nkeynes@380
   939
    JMP_TARGET(target1);
nkeynes@380
   940
    JMP_TARGET(target2);
nkeynes@380
   941
    JMP_TARGET(target3);
nkeynes@368
   942
    SETE_t();
nkeynes@417
   943
    sh4_x86.tstate = TSTATE_E;
nkeynes@361
   944
:}
nkeynes@361
   945
DIV0S Rm, Rn {:
nkeynes@671
   946
    COUNT_INST(I_DIV0S);
nkeynes@991
   947
    load_reg( REG_EAX, Rm );
nkeynes@991
   948
    load_reg( REG_ECX, Rn );
nkeynes@991
   949
    SHRL_imm_r32( 31, REG_EAX );
nkeynes@991
   950
    SHRL_imm_r32( 31, REG_ECX );
nkeynes@995
   951
    MOVL_r32_rbpdisp( REG_EAX, R_M );
nkeynes@995
   952
    MOVL_r32_rbpdisp( REG_ECX, R_Q );
nkeynes@991
   953
    CMPL_r32_r32( REG_EAX, REG_ECX );
nkeynes@386
   954
    SETNE_t();
nkeynes@417
   955
    sh4_x86.tstate = TSTATE_NE;
nkeynes@361
   956
:}
nkeynes@361
   957
DIV0U {:  
nkeynes@671
   958
    COUNT_INST(I_DIV0U);
nkeynes@991
   959
    XORL_r32_r32( REG_EAX, REG_EAX );
nkeynes@995
   960
    MOVL_r32_rbpdisp( REG_EAX, R_Q );
nkeynes@995
   961
    MOVL_r32_rbpdisp( REG_EAX, R_M );
nkeynes@995
   962
    MOVL_r32_rbpdisp( REG_EAX, R_T );
nkeynes@417
   963
    sh4_x86.tstate = TSTATE_C; // works for DIV1
nkeynes@361
   964
:}
nkeynes@386
   965
DIV1 Rm, Rn {:
nkeynes@671
   966
    COUNT_INST(I_DIV1);
nkeynes@995
   967
    MOVL_rbpdisp_r32( R_M, REG_ECX );
nkeynes@991
   968
    load_reg( REG_EAX, Rn );
nkeynes@417
   969
    if( sh4_x86.tstate != TSTATE_C ) {
nkeynes@417
   970
	LDC_t();
nkeynes@417
   971
    }
nkeynes@991
   972
    RCLL_imm_r32( 1, REG_EAX );
nkeynes@991
   973
    SETC_r8( REG_DL ); // Q'
nkeynes@991
   974
    CMPL_rbpdisp_r32( R_Q, REG_ECX );
nkeynes@991
   975
    JE_label(mqequal);
nkeynes@991
   976
    ADDL_rbpdisp_r32( REG_OFFSET(r[Rm]), REG_EAX );
nkeynes@991
   977
    JMP_label(end);
nkeynes@380
   978
    JMP_TARGET(mqequal);
nkeynes@991
   979
    SUBL_rbpdisp_r32( REG_OFFSET(r[Rm]), REG_EAX );
nkeynes@386
   980
    JMP_TARGET(end);
nkeynes@991
   981
    store_reg( REG_EAX, Rn ); // Done with Rn now
nkeynes@991
   982
    SETC_r8(REG_AL); // tmp1
nkeynes@991
   983
    XORB_r8_r8( REG_DL, REG_AL ); // Q' = Q ^ tmp1
nkeynes@991
   984
    XORB_r8_r8( REG_AL, REG_CL ); // Q'' = Q' ^ M
nkeynes@995
   985
    MOVL_r32_rbpdisp( REG_ECX, R_Q );
nkeynes@991
   986
    XORL_imms_r32( 1, REG_AL );   // T = !Q'
nkeynes@991
   987
    MOVZXL_r8_r32( REG_AL, REG_EAX );
nkeynes@995
   988
    MOVL_r32_rbpdisp( REG_EAX, R_T );
nkeynes@417
   989
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@374
   990
:}
nkeynes@361
   991
DMULS.L Rm, Rn {:  
nkeynes@671
   992
    COUNT_INST(I_DMULS);
nkeynes@991
   993
    load_reg( REG_EAX, Rm );
nkeynes@991
   994
    load_reg( REG_ECX, Rn );
nkeynes@991
   995
    IMULL_r32(REG_ECX);
nkeynes@995
   996
    MOVL_r32_rbpdisp( REG_EDX, R_MACH );
nkeynes@995
   997
    MOVL_r32_rbpdisp( REG_EAX, R_MACL );
nkeynes@417
   998
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
   999
:}
nkeynes@361
  1000
DMULU.L Rm, Rn {:  
nkeynes@671
  1001
    COUNT_INST(I_DMULU);
nkeynes@991
  1002
    load_reg( REG_EAX, Rm );
nkeynes@991
  1003
    load_reg( REG_ECX, Rn );
nkeynes@991
  1004
    MULL_r32(REG_ECX);
nkeynes@995
  1005
    MOVL_r32_rbpdisp( REG_EDX, R_MACH );
nkeynes@995
  1006
    MOVL_r32_rbpdisp( REG_EAX, R_MACL );    
nkeynes@417
  1007
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1008
:}
nkeynes@359
  1009
DT Rn {:  
nkeynes@671
  1010
    COUNT_INST(I_DT);
nkeynes@991
  1011
    load_reg( REG_EAX, Rn );
nkeynes@991
  1012
    ADDL_imms_r32( -1, REG_EAX );
nkeynes@991
  1013
    store_reg( REG_EAX, Rn );
nkeynes@359
  1014
    SETE_t();
nkeynes@417
  1015
    sh4_x86.tstate = TSTATE_E;
nkeynes@359
  1016
:}
nkeynes@359
  1017
EXTS.B Rm, Rn {:  
nkeynes@671
  1018
    COUNT_INST(I_EXTSB);
nkeynes@991
  1019
    load_reg( REG_EAX, Rm );
nkeynes@991
  1020
    MOVSXL_r8_r32( REG_EAX, REG_EAX );
nkeynes@991
  1021
    store_reg( REG_EAX, Rn );
nkeynes@359
  1022
:}
nkeynes@361
  1023
EXTS.W Rm, Rn {:  
nkeynes@671
  1024
    COUNT_INST(I_EXTSW);
nkeynes@991
  1025
    load_reg( REG_EAX, Rm );
nkeynes@991
  1026
    MOVSXL_r16_r32( REG_EAX, REG_EAX );
nkeynes@991
  1027
    store_reg( REG_EAX, Rn );
nkeynes@361
  1028
:}
nkeynes@361
  1029
EXTU.B Rm, Rn {:  
nkeynes@671
  1030
    COUNT_INST(I_EXTUB);
nkeynes@991
  1031
    load_reg( REG_EAX, Rm );
nkeynes@991
  1032
    MOVZXL_r8_r32( REG_EAX, REG_EAX );
nkeynes@991
  1033
    store_reg( REG_EAX, Rn );
nkeynes@361
  1034
:}
nkeynes@361
  1035
EXTU.W Rm, Rn {:  
nkeynes@671
  1036
    COUNT_INST(I_EXTUW);
nkeynes@991
  1037
    load_reg( REG_EAX, Rm );
nkeynes@991
  1038
    MOVZXL_r16_r32( REG_EAX, REG_EAX );
nkeynes@991
  1039
    store_reg( REG_EAX, Rn );
nkeynes@361
  1040
:}
nkeynes@586
  1041
MAC.L @Rm+, @Rn+ {:
nkeynes@671
  1042
    COUNT_INST(I_MACL);
nkeynes@586
  1043
    if( Rm == Rn ) {
nkeynes@991
  1044
	load_reg( REG_EAX, Rm );
nkeynes@991
  1045
	check_ralign32( REG_EAX );
nkeynes@991
  1046
	MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  1047
	MOVL_r32_rspdisp(REG_EAX, 0);
nkeynes@991
  1048
	load_reg( REG_EAX, Rm );
nkeynes@991
  1049
	LEAL_r32disp_r32( REG_EAX, 4, REG_EAX );
nkeynes@991
  1050
	MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  1051
        ADDL_imms_rbpdisp( 8, REG_OFFSET(r[Rn]) );
nkeynes@586
  1052
    } else {
nkeynes@991
  1053
	load_reg( REG_EAX, Rm );
nkeynes@991
  1054
	check_ralign32( REG_EAX );
nkeynes@991
  1055
	MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  1056
	MOVL_r32_rspdisp( REG_EAX, 0 );
nkeynes@991
  1057
	load_reg( REG_EAX, Rn );
nkeynes@991
  1058
	check_ralign32( REG_EAX );
nkeynes@991
  1059
	MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  1060
	ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rn]) );
nkeynes@991
  1061
	ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@586
  1062
    }
nkeynes@939
  1063
    
nkeynes@991
  1064
    IMULL_rspdisp( 0 );
nkeynes@991
  1065
    ADDL_r32_rbpdisp( REG_EAX, R_MACL );
nkeynes@991
  1066
    ADCL_r32_rbpdisp( REG_EDX, R_MACH );
nkeynes@386
  1067
nkeynes@995
  1068
    MOVL_rbpdisp_r32( R_S, REG_ECX );
nkeynes@991
  1069
    TESTL_r32_r32(REG_ECX, REG_ECX);
nkeynes@991
  1070
    JE_label( nosat );
nkeynes@995
  1071
    CALL_ptr( signsat48 );
nkeynes@386
  1072
    JMP_TARGET( nosat );
nkeynes@417
  1073
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@386
  1074
:}
nkeynes@386
  1075
MAC.W @Rm+, @Rn+ {:  
nkeynes@671
  1076
    COUNT_INST(I_MACW);
nkeynes@586
  1077
    if( Rm == Rn ) {
nkeynes@991
  1078
	load_reg( REG_EAX, Rm );
nkeynes@991
  1079
	check_ralign16( REG_EAX );
nkeynes@991
  1080
	MEM_READ_WORD( REG_EAX, REG_EAX );
nkeynes@991
  1081
        MOVL_r32_rspdisp( REG_EAX, 0 );
nkeynes@991
  1082
	load_reg( REG_EAX, Rm );
nkeynes@991
  1083
	LEAL_r32disp_r32( REG_EAX, 2, REG_EAX );
nkeynes@991
  1084
	MEM_READ_WORD( REG_EAX, REG_EAX );
nkeynes@991
  1085
	ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rn]) );
nkeynes@586
  1086
	// Note translate twice in case of page boundaries. Maybe worth
nkeynes@586
  1087
	// adding a page-boundary check to skip the second translation
nkeynes@586
  1088
    } else {
nkeynes@1193
  1089
	load_reg( REG_EAX, Rn );
nkeynes@991
  1090
	check_ralign16( REG_EAX );
nkeynes@991
  1091
	MEM_READ_WORD( REG_EAX, REG_EAX );
nkeynes@991
  1092
        MOVL_r32_rspdisp( REG_EAX, 0 );
nkeynes@1193
  1093
	load_reg( REG_EAX, Rm );
nkeynes@991
  1094
	check_ralign16( REG_EAX );
nkeynes@991
  1095
	MEM_READ_WORD( REG_EAX, REG_EAX );
nkeynes@991
  1096
	ADDL_imms_rbpdisp( 2, REG_OFFSET(r[Rn]) );
nkeynes@991
  1097
	ADDL_imms_rbpdisp( 2, REG_OFFSET(r[Rm]) );
nkeynes@586
  1098
    }
nkeynes@991
  1099
    IMULL_rspdisp( 0 );
nkeynes@995
  1100
    MOVL_rbpdisp_r32( R_S, REG_ECX );
nkeynes@991
  1101
    TESTL_r32_r32( REG_ECX, REG_ECX );
nkeynes@991
  1102
    JE_label( nosat );
nkeynes@386
  1103
nkeynes@991
  1104
    ADDL_r32_rbpdisp( REG_EAX, R_MACL );  // 6
nkeynes@991
  1105
    JNO_label( end );            // 2
nkeynes@995
  1106
    MOVL_imm32_r32( 1, REG_EDX );         // 5
nkeynes@995
  1107
    MOVL_r32_rbpdisp( REG_EDX, R_MACH );   // 6
nkeynes@991
  1108
    JS_label( positive );        // 2
nkeynes@995
  1109
    MOVL_imm32_r32( 0x80000000, REG_EAX );// 5
nkeynes@995
  1110
    MOVL_r32_rbpdisp( REG_EAX, R_MACL );   // 6
nkeynes@991
  1111
    JMP_label(end2);           // 2
nkeynes@386
  1112
nkeynes@386
  1113
    JMP_TARGET(positive);
nkeynes@995
  1114
    MOVL_imm32_r32( 0x7FFFFFFF, REG_EAX );// 5
nkeynes@995
  1115
    MOVL_r32_rbpdisp( REG_EAX, R_MACL );   // 6
nkeynes@991
  1116
    JMP_label(end3);            // 2
nkeynes@386
  1117
nkeynes@386
  1118
    JMP_TARGET(nosat);
nkeynes@991
  1119
    ADDL_r32_rbpdisp( REG_EAX, R_MACL );  // 6
nkeynes@991
  1120
    ADCL_r32_rbpdisp( REG_EDX, R_MACH );  // 6
nkeynes@386
  1121
    JMP_TARGET(end);
nkeynes@386
  1122
    JMP_TARGET(end2);
nkeynes@386
  1123
    JMP_TARGET(end3);
nkeynes@417
  1124
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@386
  1125
:}
nkeynes@359
  1126
MOVT Rn {:  
nkeynes@671
  1127
    COUNT_INST(I_MOVT);
nkeynes@995
  1128
    MOVL_rbpdisp_r32( R_T, REG_EAX );
nkeynes@991
  1129
    store_reg( REG_EAX, Rn );
nkeynes@359
  1130
:}
nkeynes@361
  1131
MUL.L Rm, Rn {:  
nkeynes@671
  1132
    COUNT_INST(I_MULL);
nkeynes@991
  1133
    load_reg( REG_EAX, Rm );
nkeynes@991
  1134
    load_reg( REG_ECX, Rn );
nkeynes@991
  1135
    MULL_r32( REG_ECX );
nkeynes@995
  1136
    MOVL_r32_rbpdisp( REG_EAX, R_MACL );
nkeynes@417
  1137
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1138
:}
nkeynes@374
  1139
MULS.W Rm, Rn {:
nkeynes@671
  1140
    COUNT_INST(I_MULSW);
nkeynes@995
  1141
    MOVSXL_rbpdisp16_r32( R_R(Rm), REG_EAX );
nkeynes@995
  1142
    MOVSXL_rbpdisp16_r32( R_R(Rn), REG_ECX );
nkeynes@991
  1143
    MULL_r32( REG_ECX );
nkeynes@995
  1144
    MOVL_r32_rbpdisp( REG_EAX, R_MACL );
nkeynes@417
  1145
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1146
:}
nkeynes@374
  1147
MULU.W Rm, Rn {:  
nkeynes@671
  1148
    COUNT_INST(I_MULUW);
nkeynes@995
  1149
    MOVZXL_rbpdisp16_r32( R_R(Rm), REG_EAX );
nkeynes@995
  1150
    MOVZXL_rbpdisp16_r32( R_R(Rn), REG_ECX );
nkeynes@991
  1151
    MULL_r32( REG_ECX );
nkeynes@995
  1152
    MOVL_r32_rbpdisp( REG_EAX, R_MACL );
nkeynes@417
  1153
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@374
  1154
:}
nkeynes@359
  1155
NEG Rm, Rn {:
nkeynes@671
  1156
    COUNT_INST(I_NEG);
nkeynes@991
  1157
    load_reg( REG_EAX, Rm );
nkeynes@991
  1158
    NEGL_r32( REG_EAX );
nkeynes@991
  1159
    store_reg( REG_EAX, Rn );
nkeynes@417
  1160
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1161
:}
nkeynes@359
  1162
NEGC Rm, Rn {:  
nkeynes@671
  1163
    COUNT_INST(I_NEGC);
nkeynes@991
  1164
    load_reg( REG_EAX, Rm );
nkeynes@991
  1165
    XORL_r32_r32( REG_ECX, REG_ECX );
nkeynes@359
  1166
    LDC_t();
nkeynes@991
  1167
    SBBL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
  1168
    store_reg( REG_ECX, Rn );
nkeynes@359
  1169
    SETC_t();
nkeynes@417
  1170
    sh4_x86.tstate = TSTATE_C;
nkeynes@359
  1171
:}
nkeynes@359
  1172
NOT Rm, Rn {:  
nkeynes@671
  1173
    COUNT_INST(I_NOT);
nkeynes@991
  1174
    load_reg( REG_EAX, Rm );
nkeynes@991
  1175
    NOTL_r32( REG_EAX );
nkeynes@991
  1176
    store_reg( REG_EAX, Rn );
nkeynes@417
  1177
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1178
:}
nkeynes@359
  1179
OR Rm, Rn {:  
nkeynes@671
  1180
    COUNT_INST(I_OR);
nkeynes@991
  1181
    load_reg( REG_EAX, Rm );
nkeynes@991
  1182
    load_reg( REG_ECX, Rn );
nkeynes@991
  1183
    ORL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
  1184
    store_reg( REG_ECX, Rn );
nkeynes@417
  1185
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1186
:}
nkeynes@359
  1187
OR #imm, R0 {:
nkeynes@671
  1188
    COUNT_INST(I_ORI);
nkeynes@991
  1189
    load_reg( REG_EAX, 0 );
nkeynes@991
  1190
    ORL_imms_r32(imm, REG_EAX);
nkeynes@991
  1191
    store_reg( REG_EAX, 0 );
nkeynes@417
  1192
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1193
:}
nkeynes@374
  1194
OR.B #imm, @(R0, GBR) {:  
nkeynes@671
  1195
    COUNT_INST(I_ORB);
nkeynes@991
  1196
    load_reg( REG_EAX, 0 );
nkeynes@991
  1197
    ADDL_rbpdisp_r32( R_GBR, REG_EAX );
nkeynes@991
  1198
    MOVL_r32_rspdisp( REG_EAX, 0 );
nkeynes@991
  1199
    MEM_READ_BYTE_FOR_WRITE( REG_EAX, REG_EDX );
nkeynes@991
  1200
    MOVL_rspdisp_r32( 0, REG_EAX );
nkeynes@991
  1201
    ORL_imms_r32(imm, REG_EDX );
nkeynes@991
  1202
    MEM_WRITE_BYTE( REG_EAX, REG_EDX );
nkeynes@417
  1203
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@374
  1204
:}
nkeynes@359
  1205
ROTCL Rn {:
nkeynes@671
  1206
    COUNT_INST(I_ROTCL);
nkeynes@991
  1207
    load_reg( REG_EAX, Rn );
nkeynes@417
  1208
    if( sh4_x86.tstate != TSTATE_C ) {
nkeynes@417
  1209
	LDC_t();
nkeynes@417
  1210
    }
nkeynes@991
  1211
    RCLL_imm_r32( 1, REG_EAX );
nkeynes@991
  1212
    store_reg( REG_EAX, Rn );
nkeynes@359
  1213
    SETC_t();
nkeynes@417
  1214
    sh4_x86.tstate = TSTATE_C;
nkeynes@359
  1215
:}
nkeynes@359
  1216
ROTCR Rn {:  
nkeynes@671
  1217
    COUNT_INST(I_ROTCR);
nkeynes@991
  1218
    load_reg( REG_EAX, Rn );
nkeynes@417
  1219
    if( sh4_x86.tstate != TSTATE_C ) {
nkeynes@417
  1220
	LDC_t();
nkeynes@417
  1221
    }
nkeynes@991
  1222
    RCRL_imm_r32( 1, REG_EAX );
nkeynes@991
  1223
    store_reg( REG_EAX, Rn );
nkeynes@359
  1224
    SETC_t();
nkeynes@417
  1225
    sh4_x86.tstate = TSTATE_C;
nkeynes@359
  1226
:}
nkeynes@359
  1227
ROTL Rn {:  
nkeynes@671
  1228
    COUNT_INST(I_ROTL);
nkeynes@991
  1229
    load_reg( REG_EAX, Rn );
nkeynes@991
  1230
    ROLL_imm_r32( 1, REG_EAX );
nkeynes@991
  1231
    store_reg( REG_EAX, Rn );
nkeynes@359
  1232
    SETC_t();
nkeynes@417
  1233
    sh4_x86.tstate = TSTATE_C;
nkeynes@359
  1234
:}
nkeynes@359
  1235
ROTR Rn {:  
nkeynes@671
  1236
    COUNT_INST(I_ROTR);
nkeynes@991
  1237
    load_reg( REG_EAX, Rn );
nkeynes@991
  1238
    RORL_imm_r32( 1, REG_EAX );
nkeynes@991
  1239
    store_reg( REG_EAX, Rn );
nkeynes@359
  1240
    SETC_t();
nkeynes@417
  1241
    sh4_x86.tstate = TSTATE_C;
nkeynes@359
  1242
:}
nkeynes@359
  1243
SHAD Rm, Rn {:
nkeynes@671
  1244
    COUNT_INST(I_SHAD);
nkeynes@359
  1245
    /* Annoyingly enough, not directly convertible */
nkeynes@991
  1246
    load_reg( REG_EAX, Rn );
nkeynes@991
  1247
    load_reg( REG_ECX, Rm );
nkeynes@991
  1248
    CMPL_imms_r32( 0, REG_ECX );
nkeynes@991
  1249
    JGE_label(doshl);
nkeynes@361
  1250
                    
nkeynes@991
  1251
    NEGL_r32( REG_ECX );      // 2
nkeynes@991
  1252
    ANDB_imms_r8( 0x1F, REG_CL ); // 3
nkeynes@991
  1253
    JE_label(emptysar);     // 2
nkeynes@991
  1254
    SARL_cl_r32( REG_EAX );       // 2
nkeynes@991
  1255
    JMP_label(end);          // 2
nkeynes@386
  1256
nkeynes@386
  1257
    JMP_TARGET(emptysar);
nkeynes@991
  1258
    SARL_imm_r32(31, REG_EAX );  // 3
nkeynes@991
  1259
    JMP_label(end2);
nkeynes@382
  1260
nkeynes@380
  1261
    JMP_TARGET(doshl);
nkeynes@991
  1262
    ANDB_imms_r8( 0x1F, REG_CL ); // 3
nkeynes@991
  1263
    SHLL_cl_r32( REG_EAX );       // 2
nkeynes@380
  1264
    JMP_TARGET(end);
nkeynes@386
  1265
    JMP_TARGET(end2);
nkeynes@991
  1266
    store_reg( REG_EAX, Rn );
nkeynes@417
  1267
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1268
:}
nkeynes@359
  1269
SHLD Rm, Rn {:  
nkeynes@671
  1270
    COUNT_INST(I_SHLD);
nkeynes@991
  1271
    load_reg( REG_EAX, Rn );
nkeynes@991
  1272
    load_reg( REG_ECX, Rm );
nkeynes@991
  1273
    CMPL_imms_r32( 0, REG_ECX );
nkeynes@991
  1274
    JGE_label(doshl);
nkeynes@368
  1275
nkeynes@991
  1276
    NEGL_r32( REG_ECX );      // 2
nkeynes@991
  1277
    ANDB_imms_r8( 0x1F, REG_CL ); // 3
nkeynes@991
  1278
    JE_label(emptyshr );
nkeynes@991
  1279
    SHRL_cl_r32( REG_EAX );       // 2
nkeynes@991
  1280
    JMP_label(end);          // 2
nkeynes@386
  1281
nkeynes@386
  1282
    JMP_TARGET(emptyshr);
nkeynes@991
  1283
    XORL_r32_r32( REG_EAX, REG_EAX );
nkeynes@991
  1284
    JMP_label(end2);
nkeynes@382
  1285
nkeynes@382
  1286
    JMP_TARGET(doshl);
nkeynes@991
  1287
    ANDB_imms_r8( 0x1F, REG_CL ); // 3
nkeynes@991
  1288
    SHLL_cl_r32( REG_EAX );       // 2
nkeynes@382
  1289
    JMP_TARGET(end);
nkeynes@386
  1290
    JMP_TARGET(end2);
nkeynes@991
  1291
    store_reg( REG_EAX, Rn );
nkeynes@417
  1292
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1293
:}
nkeynes@359
  1294
SHAL Rn {: 
nkeynes@671
  1295
    COUNT_INST(I_SHAL);
nkeynes@991
  1296
    load_reg( REG_EAX, Rn );
nkeynes@991
  1297
    SHLL_imm_r32( 1, REG_EAX );
nkeynes@397
  1298
    SETC_t();
nkeynes@991
  1299
    store_reg( REG_EAX, Rn );
nkeynes@417
  1300
    sh4_x86.tstate = TSTATE_C;
nkeynes@359
  1301
:}
nkeynes@359
  1302
SHAR Rn {:  
nkeynes@671
  1303
    COUNT_INST(I_SHAR);
nkeynes@991
  1304
    load_reg( REG_EAX, Rn );
nkeynes@991
  1305
    SARL_imm_r32( 1, REG_EAX );
nkeynes@397
  1306
    SETC_t();
nkeynes@991
  1307
    store_reg( REG_EAX, Rn );
nkeynes@417
  1308
    sh4_x86.tstate = TSTATE_C;
nkeynes@359
  1309
:}
nkeynes@359
  1310
SHLL Rn {:  
nkeynes@671
  1311
    COUNT_INST(I_SHLL);
nkeynes@991
  1312
    load_reg( REG_EAX, Rn );
nkeynes@991
  1313
    SHLL_imm_r32( 1, REG_EAX );
nkeynes@397
  1314
    SETC_t();
nkeynes@991
  1315
    store_reg( REG_EAX, Rn );
nkeynes@417
  1316
    sh4_x86.tstate = TSTATE_C;
nkeynes@359
  1317
:}
nkeynes@359
  1318
SHLL2 Rn {:
nkeynes@671
  1319
    COUNT_INST(I_SHLL);
nkeynes@991
  1320
    load_reg( REG_EAX, Rn );
nkeynes@991
  1321
    SHLL_imm_r32( 2, REG_EAX );
nkeynes@991
  1322
    store_reg( REG_EAX, Rn );
nkeynes@417
  1323
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1324
:}
nkeynes@359
  1325
SHLL8 Rn {:  
nkeynes@671
  1326
    COUNT_INST(I_SHLL);
nkeynes@991
  1327
    load_reg( REG_EAX, Rn );
nkeynes@991
  1328
    SHLL_imm_r32( 8, REG_EAX );
nkeynes@991
  1329
    store_reg( REG_EAX, Rn );
nkeynes@417
  1330
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1331
:}
nkeynes@359
  1332
SHLL16 Rn {:  
nkeynes@671
  1333
    COUNT_INST(I_SHLL);
nkeynes@991
  1334
    load_reg( REG_EAX, Rn );
nkeynes@991
  1335
    SHLL_imm_r32( 16, REG_EAX );
nkeynes@991
  1336
    store_reg( REG_EAX, Rn );
nkeynes@417
  1337
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1338
:}
nkeynes@359
  1339
SHLR Rn {:  
nkeynes@671
  1340
    COUNT_INST(I_SHLR);
nkeynes@991
  1341
    load_reg( REG_EAX, Rn );
nkeynes@991
  1342
    SHRL_imm_r32( 1, REG_EAX );
nkeynes@397
  1343
    SETC_t();
nkeynes@991
  1344
    store_reg( REG_EAX, Rn );
nkeynes@417
  1345
    sh4_x86.tstate = TSTATE_C;
nkeynes@359
  1346
:}
nkeynes@359
  1347
SHLR2 Rn {:  
nkeynes@671
  1348
    COUNT_INST(I_SHLR);
nkeynes@991
  1349
    load_reg( REG_EAX, Rn );
nkeynes@991
  1350
    SHRL_imm_r32( 2, REG_EAX );
nkeynes@991
  1351
    store_reg( REG_EAX, Rn );
nkeynes@417
  1352
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1353
:}
nkeynes@359
  1354
SHLR8 Rn {:  
nkeynes@671
  1355
    COUNT_INST(I_SHLR);
nkeynes@991
  1356
    load_reg( REG_EAX, Rn );
nkeynes@991
  1357
    SHRL_imm_r32( 8, REG_EAX );
nkeynes@991
  1358
    store_reg( REG_EAX, Rn );
nkeynes@417
  1359
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1360
:}
nkeynes@359
  1361
SHLR16 Rn {:  
nkeynes@671
  1362
    COUNT_INST(I_SHLR);
nkeynes@991
  1363
    load_reg( REG_EAX, Rn );
nkeynes@991
  1364
    SHRL_imm_r32( 16, REG_EAX );
nkeynes@991
  1365
    store_reg( REG_EAX, Rn );
nkeynes@417
  1366
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1367
:}
nkeynes@359
  1368
SUB Rm, Rn {:  
nkeynes@671
  1369
    COUNT_INST(I_SUB);
nkeynes@991
  1370
    load_reg( REG_EAX, Rm );
nkeynes@991
  1371
    load_reg( REG_ECX, Rn );
nkeynes@991
  1372
    SUBL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
  1373
    store_reg( REG_ECX, Rn );
nkeynes@417
  1374
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1375
:}
nkeynes@359
  1376
SUBC Rm, Rn {:  
nkeynes@671
  1377
    COUNT_INST(I_SUBC);
nkeynes@991
  1378
    load_reg( REG_EAX, Rm );
nkeynes@991
  1379
    load_reg( REG_ECX, Rn );
nkeynes@417
  1380
    if( sh4_x86.tstate != TSTATE_C ) {
nkeynes@417
  1381
	LDC_t();
nkeynes@417
  1382
    }
nkeynes@991
  1383
    SBBL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
  1384
    store_reg( REG_ECX, Rn );
nkeynes@394
  1385
    SETC_t();
nkeynes@417
  1386
    sh4_x86.tstate = TSTATE_C;
nkeynes@359
  1387
:}
nkeynes@359
  1388
SUBV Rm, Rn {:  
nkeynes@671
  1389
    COUNT_INST(I_SUBV);
nkeynes@991
  1390
    load_reg( REG_EAX, Rm );
nkeynes@991
  1391
    load_reg( REG_ECX, Rn );
nkeynes@991
  1392
    SUBL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
  1393
    store_reg( REG_ECX, Rn );
nkeynes@359
  1394
    SETO_t();
nkeynes@417
  1395
    sh4_x86.tstate = TSTATE_O;
nkeynes@359
  1396
:}
nkeynes@359
  1397
SWAP.B Rm, Rn {:  
nkeynes@671
  1398
    COUNT_INST(I_SWAPB);
nkeynes@991
  1399
    load_reg( REG_EAX, Rm );
nkeynes@991
  1400
    XCHGB_r8_r8( REG_AL, REG_AH ); // NB: does not touch EFLAGS
nkeynes@991
  1401
    store_reg( REG_EAX, Rn );
nkeynes@359
  1402
:}
nkeynes@359
  1403
SWAP.W Rm, Rn {:  
nkeynes@671
  1404
    COUNT_INST(I_SWAPB);
nkeynes@991
  1405
    load_reg( REG_EAX, Rm );
nkeynes@991
  1406
    MOVL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
  1407
    SHLL_imm_r32( 16, REG_ECX );
nkeynes@991
  1408
    SHRL_imm_r32( 16, REG_EAX );
nkeynes@991
  1409
    ORL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
  1410
    store_reg( REG_ECX, Rn );
nkeynes@417
  1411
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1412
:}
nkeynes@361
  1413
TAS.B @Rn {:  
nkeynes@671
  1414
    COUNT_INST(I_TASB);
nkeynes@991
  1415
    load_reg( REG_EAX, Rn );
nkeynes@991
  1416
    MOVL_r32_rspdisp( REG_EAX, 0 );
nkeynes@991
  1417
    MEM_READ_BYTE_FOR_WRITE( REG_EAX, REG_EDX );
nkeynes@991
  1418
    TESTB_r8_r8( REG_DL, REG_DL );
nkeynes@361
  1419
    SETE_t();
nkeynes@991
  1420
    ORB_imms_r8( 0x80, REG_DL );
nkeynes@991
  1421
    MOVL_rspdisp_r32( 0, REG_EAX );
nkeynes@991
  1422
    MEM_WRITE_BYTE( REG_EAX, REG_EDX );
nkeynes@417
  1423
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1424
:}
nkeynes@361
  1425
TST Rm, Rn {:  
nkeynes@671
  1426
    COUNT_INST(I_TST);
nkeynes@991
  1427
    load_reg( REG_EAX, Rm );
nkeynes@991
  1428
    load_reg( REG_ECX, Rn );
nkeynes@991
  1429
    TESTL_r32_r32( REG_EAX, REG_ECX );
nkeynes@361
  1430
    SETE_t();
nkeynes@417
  1431
    sh4_x86.tstate = TSTATE_E;
nkeynes@361
  1432
:}
nkeynes@368
  1433
TST #imm, R0 {:  
nkeynes@671
  1434
    COUNT_INST(I_TSTI);
nkeynes@991
  1435
    load_reg( REG_EAX, 0 );
nkeynes@991
  1436
    TESTL_imms_r32( imm, REG_EAX );
nkeynes@368
  1437
    SETE_t();
nkeynes@417
  1438
    sh4_x86.tstate = TSTATE_E;
nkeynes@368
  1439
:}
nkeynes@368
  1440
TST.B #imm, @(R0, GBR) {:  
nkeynes@671
  1441
    COUNT_INST(I_TSTB);
nkeynes@991
  1442
    load_reg( REG_EAX, 0);
nkeynes@991
  1443
    ADDL_rbpdisp_r32( R_GBR, REG_EAX );
nkeynes@991
  1444
    MEM_READ_BYTE( REG_EAX, REG_EAX );
nkeynes@991
  1445
    TESTB_imms_r8( imm, REG_AL );
nkeynes@368
  1446
    SETE_t();
nkeynes@417
  1447
    sh4_x86.tstate = TSTATE_E;
nkeynes@368
  1448
:}
nkeynes@359
  1449
XOR Rm, Rn {:  
nkeynes@671
  1450
    COUNT_INST(I_XOR);
nkeynes@991
  1451
    load_reg( REG_EAX, Rm );
nkeynes@991
  1452
    load_reg( REG_ECX, Rn );
nkeynes@991
  1453
    XORL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
  1454
    store_reg( REG_ECX, Rn );
nkeynes@417
  1455
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1456
:}
nkeynes@359
  1457
XOR #imm, R0 {:  
nkeynes@671
  1458
    COUNT_INST(I_XORI);
nkeynes@991
  1459
    load_reg( REG_EAX, 0 );
nkeynes@991
  1460
    XORL_imms_r32( imm, REG_EAX );
nkeynes@991
  1461
    store_reg( REG_EAX, 0 );
nkeynes@417
  1462
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1463
:}
nkeynes@359
  1464
XOR.B #imm, @(R0, GBR) {:  
nkeynes@671
  1465
    COUNT_INST(I_XORB);
nkeynes@991
  1466
    load_reg( REG_EAX, 0 );
nkeynes@991
  1467
    ADDL_rbpdisp_r32( R_GBR, REG_EAX ); 
nkeynes@991
  1468
    MOVL_r32_rspdisp( REG_EAX, 0 );
nkeynes@991
  1469
    MEM_READ_BYTE_FOR_WRITE(REG_EAX, REG_EDX);
nkeynes@991
  1470
    MOVL_rspdisp_r32( 0, REG_EAX );
nkeynes@991
  1471
    XORL_imms_r32( imm, REG_EDX );
nkeynes@991
  1472
    MEM_WRITE_BYTE( REG_EAX, REG_EDX );
nkeynes@417
  1473
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1474
:}
nkeynes@361
  1475
XTRCT Rm, Rn {:
nkeynes@671
  1476
    COUNT_INST(I_XTRCT);
nkeynes@991
  1477
    load_reg( REG_EAX, Rm );
nkeynes@991
  1478
    load_reg( REG_ECX, Rn );
nkeynes@991
  1479
    SHLL_imm_r32( 16, REG_EAX );
nkeynes@991
  1480
    SHRL_imm_r32( 16, REG_ECX );
nkeynes@991
  1481
    ORL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
  1482
    store_reg( REG_ECX, Rn );
nkeynes@417
  1483
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1484
:}
nkeynes@359
  1485
nkeynes@359
  1486
/* Data move instructions */
nkeynes@359
  1487
MOV Rm, Rn {:  
nkeynes@671
  1488
    COUNT_INST(I_MOV);
nkeynes@991
  1489
    load_reg( REG_EAX, Rm );
nkeynes@991
  1490
    store_reg( REG_EAX, Rn );
nkeynes@359
  1491
:}
nkeynes@359
  1492
MOV #imm, Rn {:  
nkeynes@671
  1493
    COUNT_INST(I_MOVI);
nkeynes@995
  1494
    MOVL_imm32_r32( imm, REG_EAX );
nkeynes@991
  1495
    store_reg( REG_EAX, Rn );
nkeynes@359
  1496
:}
nkeynes@359
  1497
MOV.B Rm, @Rn {:  
nkeynes@671
  1498
    COUNT_INST(I_MOVB);
nkeynes@991
  1499
    load_reg( REG_EAX, Rn );
nkeynes@991
  1500
    load_reg( REG_EDX, Rm );
nkeynes@991
  1501
    MEM_WRITE_BYTE( REG_EAX, REG_EDX );
nkeynes@417
  1502
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1503
:}
nkeynes@359
  1504
MOV.B Rm, @-Rn {:  
nkeynes@671
  1505
    COUNT_INST(I_MOVB);
nkeynes@991
  1506
    load_reg( REG_EAX, Rn );
nkeynes@991
  1507
    LEAL_r32disp_r32( REG_EAX, -1, REG_EAX );
nkeynes@991
  1508
    load_reg( REG_EDX, Rm );
nkeynes@991
  1509
    MEM_WRITE_BYTE( REG_EAX, REG_EDX );
nkeynes@991
  1510
    ADDL_imms_rbpdisp( -1, REG_OFFSET(r[Rn]) );
nkeynes@417
  1511
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1512
:}
nkeynes@359
  1513
MOV.B Rm, @(R0, Rn) {:  
nkeynes@671
  1514
    COUNT_INST(I_MOVB);
nkeynes@991
  1515
    load_reg( REG_EAX, 0 );
nkeynes@991
  1516
    ADDL_rbpdisp_r32( REG_OFFSET(r[Rn]), REG_EAX );
nkeynes@991
  1517
    load_reg( REG_EDX, Rm );
nkeynes@991
  1518
    MEM_WRITE_BYTE( REG_EAX, REG_EDX );
nkeynes@417
  1519
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1520
:}
nkeynes@359
  1521
MOV.B R0, @(disp, GBR) {:  
nkeynes@671
  1522
    COUNT_INST(I_MOVB);
nkeynes@995
  1523
    MOVL_rbpdisp_r32( R_GBR, REG_EAX );
nkeynes@991
  1524
    ADDL_imms_r32( disp, REG_EAX );
nkeynes@991
  1525
    load_reg( REG_EDX, 0 );
nkeynes@991
  1526
    MEM_WRITE_BYTE( REG_EAX, REG_EDX );
nkeynes@417
  1527
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1528
:}
nkeynes@359
  1529
MOV.B R0, @(disp, Rn) {:  
nkeynes@671
  1530
    COUNT_INST(I_MOVB);
nkeynes@991
  1531
    load_reg( REG_EAX, Rn );
nkeynes@991
  1532
    ADDL_imms_r32( disp, REG_EAX );
nkeynes@991
  1533
    load_reg( REG_EDX, 0 );
nkeynes@991
  1534
    MEM_WRITE_BYTE( REG_EAX, REG_EDX );
nkeynes@417
  1535
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1536
:}
nkeynes@359
  1537
MOV.B @Rm, Rn {:  
nkeynes@671
  1538
    COUNT_INST(I_MOVB);
nkeynes@991
  1539
    load_reg( REG_EAX, Rm );
nkeynes@991
  1540
    MEM_READ_BYTE( REG_EAX, REG_EAX );
nkeynes@991
  1541
    store_reg( REG_EAX, Rn );
nkeynes@417
  1542
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1543
:}
nkeynes@359
  1544
MOV.B @Rm+, Rn {:  
nkeynes@671
  1545
    COUNT_INST(I_MOVB);
nkeynes@991
  1546
    load_reg( REG_EAX, Rm );
nkeynes@991
  1547
    MEM_READ_BYTE( REG_EAX, REG_EAX );
nkeynes@939
  1548
    if( Rm != Rn ) {
nkeynes@991
  1549
    	ADDL_imms_rbpdisp( 1, REG_OFFSET(r[Rm]) );
nkeynes@939
  1550
    }
nkeynes@991
  1551
    store_reg( REG_EAX, Rn );
nkeynes@417
  1552
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1553
:}
nkeynes@359
  1554
MOV.B @(R0, Rm), Rn {:  
nkeynes@671
  1555
    COUNT_INST(I_MOVB);
nkeynes@991
  1556
    load_reg( REG_EAX, 0 );
nkeynes@991
  1557
    ADDL_rbpdisp_r32( REG_OFFSET(r[Rm]), REG_EAX );
nkeynes@991
  1558
    MEM_READ_BYTE( REG_EAX, REG_EAX );
nkeynes@991
  1559
    store_reg( REG_EAX, Rn );
nkeynes@417
  1560
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1561
:}
nkeynes@359
  1562
MOV.B @(disp, GBR), R0 {:  
nkeynes@671
  1563
    COUNT_INST(I_MOVB);
nkeynes@995
  1564
    MOVL_rbpdisp_r32( R_GBR, REG_EAX );
nkeynes@991
  1565
    ADDL_imms_r32( disp, REG_EAX );
nkeynes@991
  1566
    MEM_READ_BYTE( REG_EAX, REG_EAX );
nkeynes@991
  1567
    store_reg( REG_EAX, 0 );
nkeynes@417
  1568
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1569
:}
nkeynes@359
  1570
MOV.B @(disp, Rm), R0 {:  
nkeynes@671
  1571
    COUNT_INST(I_MOVB);
nkeynes@991
  1572
    load_reg( REG_EAX, Rm );
nkeynes@991
  1573
    ADDL_imms_r32( disp, REG_EAX );
nkeynes@991
  1574
    MEM_READ_BYTE( REG_EAX, REG_EAX );
nkeynes@991
  1575
    store_reg( REG_EAX, 0 );
nkeynes@417
  1576
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  1577
:}
nkeynes@374
  1578
MOV.L Rm, @Rn {:
nkeynes@671
  1579
    COUNT_INST(I_MOVL);
nkeynes@991
  1580
    load_reg( REG_EAX, Rn );
nkeynes@991
  1581
    check_walign32(REG_EAX);
nkeynes@991
  1582
    MOVL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
  1583
    ANDL_imms_r32( 0xFC000000, REG_ECX );
nkeynes@991
  1584
    CMPL_imms_r32( 0xE0000000, REG_ECX );
nkeynes@991
  1585
    JNE_label( notsq );
nkeynes@991
  1586
    ANDL_imms_r32( 0x3C, REG_EAX );
nkeynes@991
  1587
    load_reg( REG_EDX, Rm );
nkeynes@991
  1588
    MOVL_r32_sib( REG_EDX, 0, REG_EBP, REG_EAX, REG_OFFSET(store_queue) );
nkeynes@991
  1589
    JMP_label(end);
nkeynes@930
  1590
    JMP_TARGET(notsq);
nkeynes@991
  1591
    load_reg( REG_EDX, Rm );
nkeynes@991
  1592
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@930
  1593
    JMP_TARGET(end);
nkeynes@417
  1594
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1595
:}
nkeynes@361
  1596
MOV.L Rm, @-Rn {:  
nkeynes@671
  1597
    COUNT_INST(I_MOVL);
nkeynes@991
  1598
    load_reg( REG_EAX, Rn );
nkeynes@991
  1599
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@991
  1600
    check_walign32( REG_EAX );
nkeynes@991
  1601
    load_reg( REG_EDX, Rm );
nkeynes@991
  1602
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  1603
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  1604
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1605
:}
nkeynes@361
  1606
MOV.L Rm, @(R0, Rn) {:  
nkeynes@671
  1607
    COUNT_INST(I_MOVL);
nkeynes@991
  1608
    load_reg( REG_EAX, 0 );
nkeynes@991
  1609
    ADDL_rbpdisp_r32( REG_OFFSET(r[Rn]), REG_EAX );
nkeynes@991
  1610
    check_walign32( REG_EAX );
nkeynes@991
  1611
    load_reg( REG_EDX, Rm );
nkeynes@991
  1612
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@417
  1613
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1614
:}
nkeynes@361
  1615
MOV.L R0, @(disp, GBR) {:  
nkeynes@671
  1616
    COUNT_INST(I_MOVL);
nkeynes@995
  1617
    MOVL_rbpdisp_r32( R_GBR, REG_EAX );
nkeynes@991
  1618
    ADDL_imms_r32( disp, REG_EAX );
nkeynes@991
  1619
    check_walign32( REG_EAX );
nkeynes@991
  1620
    load_reg( REG_EDX, 0 );
nkeynes@991
  1621
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@417
  1622
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1623
:}
nkeynes@361
  1624
MOV.L Rm, @(disp, Rn) {:  
nkeynes@671
  1625
    COUNT_INST(I_MOVL);
nkeynes@991
  1626
    load_reg( REG_EAX, Rn );
nkeynes@991
  1627
    ADDL_imms_r32( disp, REG_EAX );
nkeynes@991
  1628
    check_walign32( REG_EAX );
nkeynes@991
  1629
    MOVL_r32_r32( REG_EAX, REG_ECX );
nkeynes@991
  1630
    ANDL_imms_r32( 0xFC000000, REG_ECX );
nkeynes@991
  1631
    CMPL_imms_r32( 0xE0000000, REG_ECX );
nkeynes@991
  1632
    JNE_label( notsq );
nkeynes@991
  1633
    ANDL_imms_r32( 0x3C, REG_EAX );
nkeynes@991
  1634
    load_reg( REG_EDX, Rm );
nkeynes@991
  1635
    MOVL_r32_sib( REG_EDX, 0, REG_EBP, REG_EAX, REG_OFFSET(store_queue) );
nkeynes@991
  1636
    JMP_label(end);
nkeynes@930
  1637
    JMP_TARGET(notsq);
nkeynes@991
  1638
    load_reg( REG_EDX, Rm );
nkeynes@991
  1639
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@930
  1640
    JMP_TARGET(end);
nkeynes@417
  1641
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1642
:}
nkeynes@361
  1643
MOV.L @Rm, Rn {:  
nkeynes@671
  1644
    COUNT_INST(I_MOVL);
nkeynes@991
  1645
    load_reg( REG_EAX, Rm );
nkeynes@991
  1646
    check_ralign32( REG_EAX );
nkeynes@991
  1647
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  1648
    store_reg( REG_EAX, Rn );
nkeynes@417
  1649
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1650
:}
nkeynes@361
  1651
MOV.L @Rm+, Rn {:  
nkeynes@671
  1652
    COUNT_INST(I_MOVL);
nkeynes@991
  1653
    load_reg( REG_EAX, Rm );
nkeynes@991
  1654
    check_ralign32( REG_EAX );
nkeynes@991
  1655
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@939
  1656
    if( Rm != Rn ) {
nkeynes@991
  1657
    	ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@939
  1658
    }
nkeynes@991
  1659
    store_reg( REG_EAX, Rn );
nkeynes@417
  1660
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1661
:}
nkeynes@361
  1662
MOV.L @(R0, Rm), Rn {:  
nkeynes@671
  1663
    COUNT_INST(I_MOVL);
nkeynes@991
  1664
    load_reg( REG_EAX, 0 );
nkeynes@991
  1665
    ADDL_rbpdisp_r32( REG_OFFSET(r[Rm]), REG_EAX );
nkeynes@991
  1666
    check_ralign32( REG_EAX );
nkeynes@991
  1667
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  1668
    store_reg( REG_EAX, Rn );
nkeynes@417
  1669
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1670
:}
nkeynes@361
  1671
MOV.L @(disp, GBR), R0 {:
nkeynes@671
  1672
    COUNT_INST(I_MOVL);
nkeynes@995
  1673
    MOVL_rbpdisp_r32( R_GBR, REG_EAX );
nkeynes@991
  1674
    ADDL_imms_r32( disp, REG_EAX );
nkeynes@991
  1675
    check_ralign32( REG_EAX );
nkeynes@991
  1676
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  1677
    store_reg( REG_EAX, 0 );
nkeynes@417
  1678
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1679
:}
nkeynes@361
  1680
MOV.L @(disp, PC), Rn {:  
nkeynes@671
  1681
    COUNT_INST(I_MOVLPC);
nkeynes@374
  1682
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  1683
	SLOTILLEGAL();
nkeynes@374
  1684
    } else {
nkeynes@388
  1685
	uint32_t target = (pc & 0xFFFFFFFC) + disp + 4;
nkeynes@1125
  1686
	if( sh4_x86.fastmem && IS_IN_ICACHE(target) ) {
nkeynes@586
  1687
	    // If the target address is in the same page as the code, it's
nkeynes@586
  1688
	    // pretty safe to just ref it directly and circumvent the whole
nkeynes@586
  1689
	    // memory subsystem. (this is a big performance win)
nkeynes@586
  1690
nkeynes@586
  1691
	    // FIXME: There's a corner-case that's not handled here when
nkeynes@586
  1692
	    // the current code-page is in the ITLB but not in the UTLB.
nkeynes@586
  1693
	    // (should generate a TLB miss although need to test SH4 
nkeynes@586
  1694
	    // behaviour to confirm) Unlikely to be anyone depending on this
nkeynes@586
  1695
	    // behaviour though.
nkeynes@586
  1696
	    sh4ptr_t ptr = GET_ICACHE_PTR(target);
nkeynes@991
  1697
	    MOVL_moffptr_eax( ptr );
nkeynes@388
  1698
	} else {
nkeynes@586
  1699
	    // Note: we use sh4r.pc for the calc as we could be running at a
nkeynes@586
  1700
	    // different virtual address than the translation was done with,
nkeynes@586
  1701
	    // but we can safely assume that the low bits are the same.
nkeynes@995
  1702
	    MOVL_imm32_r32( (pc-sh4_x86.block_start_pc) + disp + 4 - (pc&0x03), REG_EAX );
nkeynes@991
  1703
	    ADDL_rbpdisp_r32( R_PC, REG_EAX );
nkeynes@991
  1704
	    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@586
  1705
	    sh4_x86.tstate = TSTATE_NONE;
nkeynes@388
  1706
	}
nkeynes@991
  1707
	store_reg( REG_EAX, Rn );
nkeynes@374
  1708
    }
nkeynes@361
  1709
:}
nkeynes@361
  1710
MOV.L @(disp, Rm), Rn {:  
nkeynes@671
  1711
    COUNT_INST(I_MOVL);
nkeynes@991
  1712
    load_reg( REG_EAX, Rm );
nkeynes@991
  1713
    ADDL_imms_r32( disp, REG_EAX );
nkeynes@991
  1714
    check_ralign32( REG_EAX );
nkeynes@991
  1715
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  1716
    store_reg( REG_EAX, Rn );
nkeynes@417
  1717
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1718
:}
nkeynes@361
  1719
MOV.W Rm, @Rn {:  
nkeynes@671
  1720
    COUNT_INST(I_MOVW);
nkeynes@991
  1721
    load_reg( REG_EAX, Rn );
nkeynes@991
  1722
    check_walign16( REG_EAX );
nkeynes@991
  1723
    load_reg( REG_EDX, Rm );
nkeynes@991
  1724
    MEM_WRITE_WORD( REG_EAX, REG_EDX );
nkeynes@417
  1725
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1726
:}
nkeynes@361
  1727
MOV.W Rm, @-Rn {:  
nkeynes@671
  1728
    COUNT_INST(I_MOVW);
nkeynes@991
  1729
    load_reg( REG_EAX, Rn );
nkeynes@991
  1730
    check_walign16( REG_EAX );
nkeynes@991
  1731
    LEAL_r32disp_r32( REG_EAX, -2, REG_EAX );
nkeynes@991
  1732
    load_reg( REG_EDX, Rm );
nkeynes@991
  1733
    MEM_WRITE_WORD( REG_EAX, REG_EDX );
nkeynes@991
  1734
    ADDL_imms_rbpdisp( -2, REG_OFFSET(r[Rn]) );
nkeynes@417
  1735
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1736
:}
nkeynes@361
  1737
MOV.W Rm, @(R0, Rn) {:  
nkeynes@671
  1738
    COUNT_INST(I_MOVW);
nkeynes@991
  1739
    load_reg( REG_EAX, 0 );
nkeynes@991
  1740
    ADDL_rbpdisp_r32( REG_OFFSET(r[Rn]), REG_EAX );
nkeynes@991
  1741
    check_walign16( REG_EAX );
nkeynes@991
  1742
    load_reg( REG_EDX, Rm );
nkeynes@991
  1743
    MEM_WRITE_WORD( REG_EAX, REG_EDX );
nkeynes@417
  1744
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1745
:}
nkeynes@361
  1746
MOV.W R0, @(disp, GBR) {:  
nkeynes@671
  1747
    COUNT_INST(I_MOVW);
nkeynes@995
  1748
    MOVL_rbpdisp_r32( R_GBR, REG_EAX );
nkeynes@991
  1749
    ADDL_imms_r32( disp, REG_EAX );
nkeynes@991
  1750
    check_walign16( REG_EAX );
nkeynes@991
  1751
    load_reg( REG_EDX, 0 );
nkeynes@991
  1752
    MEM_WRITE_WORD( REG_EAX, REG_EDX );
nkeynes@417
  1753
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1754
:}
nkeynes@361
  1755
MOV.W R0, @(disp, Rn) {:  
nkeynes@671
  1756
    COUNT_INST(I_MOVW);
nkeynes@991
  1757
    load_reg( REG_EAX, Rn );
nkeynes@991
  1758
    ADDL_imms_r32( disp, REG_EAX );
nkeynes@991
  1759
    check_walign16( REG_EAX );
nkeynes@991
  1760
    load_reg( REG_EDX, 0 );
nkeynes@991
  1761
    MEM_WRITE_WORD( REG_EAX, REG_EDX );
nkeynes@417
  1762
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1763
:}
nkeynes@361
  1764
MOV.W @Rm, Rn {:  
nkeynes@671
  1765
    COUNT_INST(I_MOVW);
nkeynes@991
  1766
    load_reg( REG_EAX, Rm );
nkeynes@991
  1767
    check_ralign16( REG_EAX );
nkeynes@991
  1768
    MEM_READ_WORD( REG_EAX, REG_EAX );
nkeynes@991
  1769
    store_reg( REG_EAX, Rn );
nkeynes@417
  1770
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1771
:}
nkeynes@361
  1772
MOV.W @Rm+, Rn {:  
nkeynes@671
  1773
    COUNT_INST(I_MOVW);
nkeynes@991
  1774
    load_reg( REG_EAX, Rm );
nkeynes@991
  1775
    check_ralign16( REG_EAX );
nkeynes@991
  1776
    MEM_READ_WORD( REG_EAX, REG_EAX );
nkeynes@939
  1777
    if( Rm != Rn ) {
nkeynes@991
  1778
        ADDL_imms_rbpdisp( 2, REG_OFFSET(r[Rm]) );
nkeynes@939
  1779
    }
nkeynes@991
  1780
    store_reg( REG_EAX, Rn );
nkeynes@417
  1781
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1782
:}
nkeynes@361
  1783
MOV.W @(R0, Rm), Rn {:  
nkeynes@671
  1784
    COUNT_INST(I_MOVW);
nkeynes@991
  1785
    load_reg( REG_EAX, 0 );
nkeynes@991
  1786
    ADDL_rbpdisp_r32( REG_OFFSET(r[Rm]), REG_EAX );
nkeynes@991
  1787
    check_ralign16( REG_EAX );
nkeynes@991
  1788
    MEM_READ_WORD( REG_EAX, REG_EAX );
nkeynes@991
  1789
    store_reg( REG_EAX, Rn );
nkeynes@417
  1790
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1791
:}
nkeynes@361
  1792
MOV.W @(disp, GBR), R0 {:  
nkeynes@671
  1793
    COUNT_INST(I_MOVW);
nkeynes@995
  1794
    MOVL_rbpdisp_r32( R_GBR, REG_EAX );
nkeynes@991
  1795
    ADDL_imms_r32( disp, REG_EAX );
nkeynes@991
  1796
    check_ralign16( REG_EAX );
nkeynes@991
  1797
    MEM_READ_WORD( REG_EAX, REG_EAX );
nkeynes@991
  1798
    store_reg( REG_EAX, 0 );
nkeynes@417
  1799
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1800
:}
nkeynes@361
  1801
MOV.W @(disp, PC), Rn {:  
nkeynes@671
  1802
    COUNT_INST(I_MOVW);
nkeynes@374
  1803
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  1804
	SLOTILLEGAL();
nkeynes@374
  1805
    } else {
nkeynes@586
  1806
	// See comments for MOV.L @(disp, PC), Rn
nkeynes@586
  1807
	uint32_t target = pc + disp + 4;
nkeynes@1125
  1808
	if( sh4_x86.fastmem && IS_IN_ICACHE(target) ) {
nkeynes@586
  1809
	    sh4ptr_t ptr = GET_ICACHE_PTR(target);
nkeynes@991
  1810
	    MOVL_moffptr_eax( ptr );
nkeynes@991
  1811
	    MOVSXL_r16_r32( REG_EAX, REG_EAX );
nkeynes@586
  1812
	} else {
nkeynes@995
  1813
	    MOVL_imm32_r32( (pc - sh4_x86.block_start_pc) + disp + 4, REG_EAX );
nkeynes@991
  1814
	    ADDL_rbpdisp_r32( R_PC, REG_EAX );
nkeynes@991
  1815
	    MEM_READ_WORD( REG_EAX, REG_EAX );
nkeynes@586
  1816
	    sh4_x86.tstate = TSTATE_NONE;
nkeynes@586
  1817
	}
nkeynes@991
  1818
	store_reg( REG_EAX, Rn );
nkeynes@374
  1819
    }
nkeynes@361
  1820
:}
nkeynes@361
  1821
MOV.W @(disp, Rm), R0 {:  
nkeynes@671
  1822
    COUNT_INST(I_MOVW);
nkeynes@991
  1823
    load_reg( REG_EAX, Rm );
nkeynes@991
  1824
    ADDL_imms_r32( disp, REG_EAX );
nkeynes@991
  1825
    check_ralign16( REG_EAX );
nkeynes@991
  1826
    MEM_READ_WORD( REG_EAX, REG_EAX );
nkeynes@991
  1827
    store_reg( REG_EAX, 0 );
nkeynes@417
  1828
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1829
:}
nkeynes@361
  1830
MOVA @(disp, PC), R0 {:  
nkeynes@671
  1831
    COUNT_INST(I_MOVA);
nkeynes@374
  1832
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  1833
	SLOTILLEGAL();
nkeynes@374
  1834
    } else {
nkeynes@995
  1835
	MOVL_imm32_r32( (pc - sh4_x86.block_start_pc) + disp + 4 - (pc&0x03), REG_ECX );
nkeynes@991
  1836
	ADDL_rbpdisp_r32( R_PC, REG_ECX );
nkeynes@991
  1837
	store_reg( REG_ECX, 0 );
nkeynes@586
  1838
	sh4_x86.tstate = TSTATE_NONE;
nkeynes@374
  1839
    }
nkeynes@361
  1840
:}
nkeynes@361
  1841
MOVCA.L R0, @Rn {:  
nkeynes@671
  1842
    COUNT_INST(I_MOVCA);
nkeynes@991
  1843
    load_reg( REG_EAX, Rn );
nkeynes@991
  1844
    check_walign32( REG_EAX );
nkeynes@991
  1845
    load_reg( REG_EDX, 0 );
nkeynes@991
  1846
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@417
  1847
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@361
  1848
:}
nkeynes@359
  1849
nkeynes@359
  1850
/* Control transfer instructions */
nkeynes@374
  1851
BF disp {:
nkeynes@671
  1852
    COUNT_INST(I_BF);
nkeynes@374
  1853
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  1854
	SLOTILLEGAL();
nkeynes@374
  1855
    } else {
nkeynes@586
  1856
	sh4vma_t target = disp + pc + 4;
nkeynes@991
  1857
	JT_label( nottaken );
nkeynes@586
  1858
	exit_block_rel(target, pc+2 );
nkeynes@380
  1859
	JMP_TARGET(nottaken);
nkeynes@408
  1860
	return 2;
nkeynes@374
  1861
    }
nkeynes@374
  1862
:}
nkeynes@374
  1863
BF/S disp {:
nkeynes@671
  1864
    COUNT_INST(I_BFS);
nkeynes@374
  1865
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  1866
	SLOTILLEGAL();
nkeynes@374
  1867
    } else {
nkeynes@590
  1868
	sh4_x86.in_delay_slot = DELAY_PC;
nkeynes@601
  1869
	if( UNTRANSLATABLE(pc+2) ) {
nkeynes@995
  1870
	    MOVL_imm32_r32( pc + 4 - sh4_x86.block_start_pc, REG_EAX );
nkeynes@991
  1871
	    JT_label(nottaken);
nkeynes@991
  1872
	    ADDL_imms_r32( disp, REG_EAX );
nkeynes@601
  1873
	    JMP_TARGET(nottaken);
nkeynes@991
  1874
	    ADDL_rbpdisp_r32( R_PC, REG_EAX );
nkeynes@995
  1875
	    MOVL_r32_rbpdisp( REG_EAX, R_NEW_PC );
nkeynes@601
  1876
	    exit_block_emu(pc+2);
nkeynes@601
  1877
	    sh4_x86.branch_taken = TRUE;
nkeynes@601
  1878
	    return 2;
nkeynes@601
  1879
	} else {
nkeynes@1197
  1880
	    LOAD_t();
nkeynes@601
  1881
	    sh4vma_t target = disp + pc + 4;
nkeynes@991
  1882
	    JCC_cc_rel32(sh4_x86.tstate,0);
nkeynes@991
  1883
	    uint32_t *patch = ((uint32_t *)xlat_output)-1;
nkeynes@879
  1884
	    int save_tstate = sh4_x86.tstate;
nkeynes@601
  1885
	    sh4_translate_instruction(pc+2);
nkeynes@1091
  1886
            sh4_x86.in_delay_slot = DELAY_PC; /* Cleared by sh4_translate_instruction */
nkeynes@601
  1887
	    exit_block_rel( target, pc+4 );
nkeynes@601
  1888
	    
nkeynes@601
  1889
	    // not taken
nkeynes@601
  1890
	    *patch = (xlat_output - ((uint8_t *)patch)) - 4;
nkeynes@879
  1891
	    sh4_x86.tstate = save_tstate;
nkeynes@601
  1892
	    sh4_translate_instruction(pc+2);
nkeynes@601
  1893
	    return 4;
nkeynes@417
  1894
	}
nkeynes@374
  1895
    }
nkeynes@374
  1896
:}
nkeynes@374
  1897
BRA disp {:  
nkeynes@671
  1898
    COUNT_INST(I_BRA);
nkeynes@374
  1899
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  1900
	SLOTILLEGAL();
nkeynes@374
  1901
    } else {
nkeynes@590
  1902
	sh4_x86.in_delay_slot = DELAY_PC;
nkeynes@409
  1903
	sh4_x86.branch_taken = TRUE;
nkeynes@601
  1904
	if( UNTRANSLATABLE(pc+2) ) {
nkeynes@995
  1905
	    MOVL_rbpdisp_r32( R_PC, REG_EAX );
nkeynes@991
  1906
	    ADDL_imms_r32( pc + disp + 4 - sh4_x86.block_start_pc, REG_EAX );
nkeynes@995
  1907
	    MOVL_r32_rbpdisp( REG_EAX, R_NEW_PC );
nkeynes@601
  1908
	    exit_block_emu(pc+2);
nkeynes@601
  1909
	    return 2;
nkeynes@601
  1910
	} else {
nkeynes@601
  1911
	    sh4_translate_instruction( pc + 2 );
nkeynes@601
  1912
	    exit_block_rel( disp + pc + 4, pc+4 );
nkeynes@601
  1913
	    return 4;
nkeynes@601
  1914
	}
nkeynes@374
  1915
    }
nkeynes@374
  1916
:}
nkeynes@374
  1917
BRAF Rn {:  
nkeynes@671
  1918
    COUNT_INST(I_BRAF);
nkeynes@374
  1919
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  1920
	SLOTILLEGAL();
nkeynes@374
  1921
    } else {
nkeynes@995
  1922
	MOVL_rbpdisp_r32( R_PC, REG_EAX );
nkeynes@991
  1923
	ADDL_imms_r32( pc + 4 - sh4_x86.block_start_pc, REG_EAX );
nkeynes@991
  1924
	ADDL_rbpdisp_r32( REG_OFFSET(r[Rn]), REG_EAX );
nkeynes@995
  1925
	MOVL_r32_rbpdisp( REG_EAX, R_NEW_PC );
nkeynes@590
  1926
	sh4_x86.in_delay_slot = DELAY_PC;
nkeynes@417
  1927
	sh4_x86.tstate = TSTATE_NONE;
nkeynes@409
  1928
	sh4_x86.branch_taken = TRUE;
nkeynes@601
  1929
	if( UNTRANSLATABLE(pc+2) ) {
nkeynes@601
  1930
	    exit_block_emu(pc+2);
nkeynes@601
  1931
	    return 2;
nkeynes@601
  1932
	} else {
nkeynes@601
  1933
	    sh4_translate_instruction( pc + 2 );
nkeynes@974
  1934
	    exit_block_newpcset(pc+4);
nkeynes@601
  1935
	    return 4;
nkeynes@601
  1936
	}
nkeynes@374
  1937
    }
nkeynes@374
  1938
:}
nkeynes@374
  1939
BSR disp {:  
nkeynes@671
  1940
    COUNT_INST(I_BSR);
nkeynes@374
  1941
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  1942
	SLOTILLEGAL();
nkeynes@374
  1943
    } else {
nkeynes@995
  1944
	MOVL_rbpdisp_r32( R_PC, REG_EAX );
nkeynes@991
  1945
	ADDL_imms_r32( pc + 4 - sh4_x86.block_start_pc, REG_EAX );
nkeynes@995
  1946
	MOVL_r32_rbpdisp( REG_EAX, R_PR );
nkeynes@590
  1947
	sh4_x86.in_delay_slot = DELAY_PC;
nkeynes@409
  1948
	sh4_x86.branch_taken = TRUE;
nkeynes@601
  1949
	sh4_x86.tstate = TSTATE_NONE;
nkeynes@601
  1950
	if( UNTRANSLATABLE(pc+2) ) {
nkeynes@991
  1951
	    ADDL_imms_r32( disp, REG_EAX );
nkeynes@995
  1952
	    MOVL_r32_rbpdisp( REG_EAX, R_NEW_PC );
nkeynes@601
  1953
	    exit_block_emu(pc+2);
nkeynes@601
  1954
	    return 2;
nkeynes@601
  1955
	} else {
nkeynes@601
  1956
	    sh4_translate_instruction( pc + 2 );
nkeynes@601
  1957
	    exit_block_rel( disp + pc + 4, pc+4 );
nkeynes@601
  1958
	    return 4;
nkeynes@601
  1959
	}
nkeynes@374
  1960
    }
nkeynes@374
  1961
:}
nkeynes@374
  1962
BSRF Rn {:  
nkeynes@671
  1963
    COUNT_INST(I_BSRF);
nkeynes@374
  1964
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  1965
	SLOTILLEGAL();
nkeynes@374
  1966
    } else {
nkeynes@995
  1967
	MOVL_rbpdisp_r32( R_PC, REG_EAX );
nkeynes@991
  1968
	ADDL_imms_r32( pc + 4 - sh4_x86.block_start_pc, REG_EAX );
nkeynes@995
  1969
	MOVL_r32_rbpdisp( REG_EAX, R_PR );
nkeynes@991
  1970
	ADDL_rbpdisp_r32( REG_OFFSET(r[Rn]), REG_EAX );
nkeynes@995
  1971
	MOVL_r32_rbpdisp( REG_EAX, R_NEW_PC );
nkeynes@590
  1972
nkeynes@601
  1973
	sh4_x86.in_delay_slot = DELAY_PC;
nkeynes@417
  1974
	sh4_x86.tstate = TSTATE_NONE;
nkeynes@409
  1975
	sh4_x86.branch_taken = TRUE;
nkeynes@601
  1976
	if( UNTRANSLATABLE(pc+2) ) {
nkeynes@601
  1977
	    exit_block_emu(pc+2);
nkeynes@601
  1978
	    return 2;
nkeynes@601
  1979
	} else {
nkeynes@601
  1980
	    sh4_translate_instruction( pc + 2 );
nkeynes@974
  1981
	    exit_block_newpcset(pc+4);
nkeynes@601
  1982
	    return 4;
nkeynes@601
  1983
	}
nkeynes@374
  1984
    }
nkeynes@374
  1985
:}
nkeynes@374
  1986
BT disp {:
nkeynes@671
  1987
    COUNT_INST(I_BT);
nkeynes@374
  1988
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  1989
	SLOTILLEGAL();
nkeynes@374
  1990
    } else {
nkeynes@586
  1991
	sh4vma_t target = disp + pc + 4;
nkeynes@991
  1992
	JF_label( nottaken );
nkeynes@586
  1993
	exit_block_rel(target, pc+2 );
nkeynes@380
  1994
	JMP_TARGET(nottaken);
nkeynes@408
  1995
	return 2;
nkeynes@374
  1996
    }
nkeynes@374
  1997
:}
nkeynes@374
  1998
BT/S disp {:
nkeynes@671
  1999
    COUNT_INST(I_BTS);
nkeynes@374
  2000
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  2001
	SLOTILLEGAL();
nkeynes@374
  2002
    } else {
nkeynes@590
  2003
	sh4_x86.in_delay_slot = DELAY_PC;
nkeynes@601
  2004
	if( UNTRANSLATABLE(pc+2) ) {
nkeynes@995
  2005
	    MOVL_imm32_r32( pc + 4 - sh4_x86.block_start_pc, REG_EAX );
nkeynes@991
  2006
	    JF_label(nottaken);
nkeynes@991
  2007
	    ADDL_imms_r32( disp, REG_EAX );
nkeynes@601
  2008
	    JMP_TARGET(nottaken);
nkeynes@991
  2009
	    ADDL_rbpdisp_r32( R_PC, REG_EAX );
nkeynes@995
  2010
	    MOVL_r32_rbpdisp( REG_EAX, R_NEW_PC );
nkeynes@601
  2011
	    exit_block_emu(pc+2);
nkeynes@601
  2012
	    sh4_x86.branch_taken = TRUE;
nkeynes@601
  2013
	    return 2;
nkeynes@601
  2014
	} else {
nkeynes@1197
  2015
		LOAD_t();
nkeynes@991
  2016
	    JCC_cc_rel32(sh4_x86.tstate^1,0);
nkeynes@991
  2017
	    uint32_t *patch = ((uint32_t *)xlat_output)-1;
nkeynes@991
  2018
nkeynes@879
  2019
	    int save_tstate = sh4_x86.tstate;
nkeynes@601
  2020
	    sh4_translate_instruction(pc+2);
nkeynes@1091
  2021
            sh4_x86.in_delay_slot = DELAY_PC; /* Cleared by sh4_translate_instruction */
nkeynes@601
  2022
	    exit_block_rel( disp + pc + 4, pc+4 );
nkeynes@601
  2023
	    // not taken
nkeynes@601
  2024
	    *patch = (xlat_output - ((uint8_t *)patch)) - 4;
nkeynes@879
  2025
	    sh4_x86.tstate = save_tstate;
nkeynes@601
  2026
	    sh4_translate_instruction(pc+2);
nkeynes@601
  2027
	    return 4;
nkeynes@417
  2028
	}
nkeynes@374
  2029
    }
nkeynes@374
  2030
:}
nkeynes@374
  2031
JMP @Rn {:  
nkeynes@671
  2032
    COUNT_INST(I_JMP);
nkeynes@374
  2033
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  2034
	SLOTILLEGAL();
nkeynes@374
  2035
    } else {
nkeynes@991
  2036
	load_reg( REG_ECX, Rn );
nkeynes@995
  2037
	MOVL_r32_rbpdisp( REG_ECX, R_NEW_PC );
nkeynes@590
  2038
	sh4_x86.in_delay_slot = DELAY_PC;
nkeynes@409
  2039
	sh4_x86.branch_taken = TRUE;
nkeynes@601
  2040
	if( UNTRANSLATABLE(pc+2) ) {
nkeynes@601
  2041
	    exit_block_emu(pc+2);
nkeynes@601
  2042
	    return 2;
nkeynes@601
  2043
	} else {
nkeynes@601
  2044
	    sh4_translate_instruction(pc+2);
nkeynes@974
  2045
	    exit_block_newpcset(pc+4);
nkeynes@601
  2046
	    return 4;
nkeynes@601
  2047
	}
nkeynes@374
  2048
    }
nkeynes@374
  2049
:}
nkeynes@374
  2050
JSR @Rn {:  
nkeynes@671
  2051
    COUNT_INST(I_JSR);
nkeynes@374
  2052
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  2053
	SLOTILLEGAL();
nkeynes@374
  2054
    } else {
nkeynes@995
  2055
	MOVL_rbpdisp_r32( R_PC, REG_EAX );
nkeynes@991
  2056
	ADDL_imms_r32( pc + 4 - sh4_x86.block_start_pc, REG_EAX );
nkeynes@995
  2057
	MOVL_r32_rbpdisp( REG_EAX, R_PR );
nkeynes@991
  2058
	load_reg( REG_ECX, Rn );
nkeynes@995
  2059
	MOVL_r32_rbpdisp( REG_ECX, R_NEW_PC );
nkeynes@601
  2060
	sh4_x86.in_delay_slot = DELAY_PC;
nkeynes@409
  2061
	sh4_x86.branch_taken = TRUE;
nkeynes@601
  2062
	sh4_x86.tstate = TSTATE_NONE;
nkeynes@601
  2063
	if( UNTRANSLATABLE(pc+2) ) {
nkeynes@601
  2064
	    exit_block_emu(pc+2);
nkeynes@601
  2065
	    return 2;
nkeynes@601
  2066
	} else {
nkeynes@601
  2067
	    sh4_translate_instruction(pc+2);
nkeynes@974
  2068
	    exit_block_newpcset(pc+4);
nkeynes@601
  2069
	    return 4;
nkeynes@601
  2070
	}
nkeynes@374
  2071
    }
nkeynes@374
  2072
:}
nkeynes@374
  2073
RTE {:  
nkeynes@671
  2074
    COUNT_INST(I_RTE);
nkeynes@374
  2075
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  2076
	SLOTILLEGAL();
nkeynes@374
  2077
    } else {
nkeynes@408
  2078
	check_priv();
nkeynes@995
  2079
	MOVL_rbpdisp_r32( R_SPC, REG_ECX );
nkeynes@995
  2080
	MOVL_r32_rbpdisp( REG_ECX, R_NEW_PC );
nkeynes@995
  2081
	MOVL_rbpdisp_r32( R_SSR, REG_EAX );
nkeynes@995
  2082
	CALL1_ptr_r32( sh4_write_sr, REG_EAX );
nkeynes@590
  2083
	sh4_x86.in_delay_slot = DELAY_PC;
nkeynes@377
  2084
	sh4_x86.fpuen_checked = FALSE;
nkeynes@417
  2085
	sh4_x86.tstate = TSTATE_NONE;
nkeynes@409
  2086
	sh4_x86.branch_taken = TRUE;
nkeynes@1112
  2087
    sh4_x86.sh4_mode = SH4_MODE_UNKNOWN;
nkeynes@601
  2088
	if( UNTRANSLATABLE(pc+2) ) {
nkeynes@601
  2089
	    exit_block_emu(pc+2);
nkeynes@601
  2090
	    return 2;
nkeynes@601
  2091
	} else {
nkeynes@601
  2092
	    sh4_translate_instruction(pc+2);
nkeynes@974
  2093
	    exit_block_newpcset(pc+4);
nkeynes@601
  2094
	    return 4;
nkeynes@601
  2095
	}
nkeynes@374
  2096
    }
nkeynes@374
  2097
:}
nkeynes@374
  2098
RTS {:  
nkeynes@671
  2099
    COUNT_INST(I_RTS);
nkeynes@374
  2100
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  2101
	SLOTILLEGAL();
nkeynes@374
  2102
    } else {
nkeynes@995
  2103
	MOVL_rbpdisp_r32( R_PR, REG_ECX );
nkeynes@995
  2104
	MOVL_r32_rbpdisp( REG_ECX, R_NEW_PC );
nkeynes@590
  2105
	sh4_x86.in_delay_slot = DELAY_PC;
nkeynes@409
  2106
	sh4_x86.branch_taken = TRUE;
nkeynes@601
  2107
	if( UNTRANSLATABLE(pc+2) ) {
nkeynes@601
  2108
	    exit_block_emu(pc+2);
nkeynes@601
  2109
	    return 2;
nkeynes@601
  2110
	} else {
nkeynes@601
  2111
	    sh4_translate_instruction(pc+2);
nkeynes@974
  2112
	    exit_block_newpcset(pc+4);
nkeynes@601
  2113
	    return 4;
nkeynes@601
  2114
	}
nkeynes@374
  2115
    }
nkeynes@374
  2116
:}
nkeynes@374
  2117
TRAPA #imm {:  
nkeynes@671
  2118
    COUNT_INST(I_TRAPA);
nkeynes@374
  2119
    if( sh4_x86.in_delay_slot ) {
nkeynes@374
  2120
	SLOTILLEGAL();
nkeynes@374
  2121
    } else {
nkeynes@995
  2122
	MOVL_imm32_r32( pc+2 - sh4_x86.block_start_pc, REG_ECX );   // 5
nkeynes@991
  2123
	ADDL_r32_rbpdisp( REG_ECX, R_PC );
nkeynes@995
  2124
	MOVL_imm32_r32( imm, REG_EAX );
nkeynes@995
  2125
	CALL1_ptr_r32( sh4_raise_trap, REG_EAX );
nkeynes@417
  2126
	sh4_x86.tstate = TSTATE_NONE;
nkeynes@974
  2127
	exit_block_pcset(pc+2);
nkeynes@409
  2128
	sh4_x86.branch_taken = TRUE;
nkeynes@408
  2129
	return 2;
nkeynes@374
  2130
    }
nkeynes@374
  2131
:}
nkeynes@374
  2132
UNDEF {:  
nkeynes@671
  2133
    COUNT_INST(I_UNDEF);
nkeynes@374
  2134
    if( sh4_x86.in_delay_slot ) {
nkeynes@1191
  2135
	exit_block_exc(EXC_SLOT_ILLEGAL, pc-2, 4);    
nkeynes@374
  2136
    } else {
nkeynes@1191
  2137
	exit_block_exc(EXC_ILLEGAL, pc, 2);    
nkeynes@408
  2138
	return 2;
nkeynes@374
  2139
    }
nkeynes@368
  2140
:}
nkeynes@374
  2141
nkeynes@374
  2142
CLRMAC {:  
nkeynes@671
  2143
    COUNT_INST(I_CLRMAC);
nkeynes@991
  2144
    XORL_r32_r32(REG_EAX, REG_EAX);
nkeynes@995
  2145
    MOVL_r32_rbpdisp( REG_EAX, R_MACL );
nkeynes@995
  2146
    MOVL_r32_rbpdisp( REG_EAX, R_MACH );
nkeynes@417
  2147
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@368
  2148
:}
nkeynes@374
  2149
CLRS {:
nkeynes@671
  2150
    COUNT_INST(I_CLRS);
nkeynes@374
  2151
    CLC();
nkeynes@991
  2152
    SETCCB_cc_rbpdisp(X86_COND_C, R_S);
nkeynes@872
  2153
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@368
  2154
:}
nkeynes@374
  2155
CLRT {:  
nkeynes@671
  2156
    COUNT_INST(I_CLRT);
nkeynes@374
  2157
    CLC();
nkeynes@374
  2158
    SETC_t();
nkeynes@417
  2159
    sh4_x86.tstate = TSTATE_C;
nkeynes@359
  2160
:}
nkeynes@374
  2161
SETS {:  
nkeynes@671
  2162
    COUNT_INST(I_SETS);
nkeynes@374
  2163
    STC();
nkeynes@991
  2164
    SETCCB_cc_rbpdisp(X86_COND_C, R_S);
nkeynes@872
  2165
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2166
:}
nkeynes@374
  2167
SETT {:  
nkeynes@671
  2168
    COUNT_INST(I_SETT);
nkeynes@374
  2169
    STC();
nkeynes@374
  2170
    SETC_t();
nkeynes@417
  2171
    sh4_x86.tstate = TSTATE_C;
nkeynes@374
  2172
:}
nkeynes@359
  2173
nkeynes@375
  2174
/* Floating point moves */
nkeynes@375
  2175
FMOV FRm, FRn {:  
nkeynes@671
  2176
    COUNT_INST(I_FMOV1);
nkeynes@377
  2177
    check_fpuen();
nkeynes@901
  2178
    if( sh4_x86.double_size ) {
nkeynes@991
  2179
        load_dr0( REG_EAX, FRm );
nkeynes@991
  2180
        load_dr1( REG_ECX, FRm );
nkeynes@991
  2181
        store_dr0( REG_EAX, FRn );
nkeynes@991
  2182
        store_dr1( REG_ECX, FRn );
nkeynes@901
  2183
    } else {
nkeynes@991
  2184
        load_fr( REG_EAX, FRm ); // SZ=0 branch
nkeynes@991
  2185
        store_fr( REG_EAX, FRn );
nkeynes@901
  2186
    }
nkeynes@375
  2187
:}
nkeynes@416
  2188
FMOV FRm, @Rn {: 
nkeynes@671
  2189
    COUNT_INST(I_FMOV2);
nkeynes@586
  2190
    check_fpuen();
nkeynes@991
  2191
    load_reg( REG_EAX, Rn );
nkeynes@901
  2192
    if( sh4_x86.double_size ) {
nkeynes@991
  2193
        check_walign64( REG_EAX );
nkeynes@991
  2194
        load_dr0( REG_EDX, FRm );
nkeynes@991
  2195
        MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  2196
        load_reg( REG_EAX, Rn );
nkeynes@991
  2197
        LEAL_r32disp_r32( REG_EAX, 4, REG_EAX );
nkeynes@991
  2198
        load_dr1( REG_EDX, FRm );
nkeynes@991
  2199
        MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@901
  2200
    } else {
nkeynes@991
  2201
        check_walign32( REG_EAX );
nkeynes@991
  2202
        load_fr( REG_EDX, FRm );
nkeynes@991
  2203
        MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@901
  2204
    }
nkeynes@417
  2205
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@375
  2206
:}
nkeynes@375
  2207
FMOV @Rm, FRn {:  
nkeynes@671
  2208
    COUNT_INST(I_FMOV5);
nkeynes@586
  2209
    check_fpuen();
nkeynes@991
  2210
    load_reg( REG_EAX, Rm );
nkeynes@901
  2211
    if( sh4_x86.double_size ) {
nkeynes@991
  2212
        check_ralign64( REG_EAX );
nkeynes@991
  2213
        MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2214
        store_dr0( REG_EAX, FRn );
nkeynes@991
  2215
        load_reg( REG_EAX, Rm );
nkeynes@991
  2216
        LEAL_r32disp_r32( REG_EAX, 4, REG_EAX );
nkeynes@991
  2217
        MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2218
        store_dr1( REG_EAX, FRn );
nkeynes@901
  2219
    } else {
nkeynes@991
  2220
        check_ralign32( REG_EAX );
nkeynes@991
  2221
        MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2222
        store_fr( REG_EAX, FRn );
nkeynes@901
  2223
    }
nkeynes@417
  2224
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@375
  2225
:}
nkeynes@377
  2226
FMOV FRm, @-Rn {:  
nkeynes@671
  2227
    COUNT_INST(I_FMOV3);
nkeynes@586
  2228
    check_fpuen();
nkeynes@991
  2229
    load_reg( REG_EAX, Rn );
nkeynes@901
  2230
    if( sh4_x86.double_size ) {
nkeynes@991
  2231
        check_walign64( REG_EAX );
nkeynes@991
  2232
        LEAL_r32disp_r32( REG_EAX, -8, REG_EAX );
nkeynes@991
  2233
        load_dr0( REG_EDX, FRm );
nkeynes@991
  2234
        MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  2235
        load_reg( REG_EAX, Rn );
nkeynes@991
  2236
        LEAL_r32disp_r32( REG_EAX, -4, REG_EAX );
nkeynes@991
  2237
        load_dr1( REG_EDX, FRm );
nkeynes@991
  2238
        MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  2239
        ADDL_imms_rbpdisp(-8,REG_OFFSET(r[Rn]));
nkeynes@901
  2240
    } else {
nkeynes@991
  2241
        check_walign32( REG_EAX );
nkeynes@991
  2242
        LEAL_r32disp_r32( REG_EAX, -4, REG_EAX );
nkeynes@991
  2243
        load_fr( REG_EDX, FRm );
nkeynes@991
  2244
        MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  2245
        ADDL_imms_rbpdisp(-4,REG_OFFSET(r[Rn]));
nkeynes@901
  2246
    }
nkeynes@417
  2247
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@377
  2248
:}
nkeynes@416
  2249
FMOV @Rm+, FRn {:
nkeynes@671
  2250
    COUNT_INST(I_FMOV6);
nkeynes@586
  2251
    check_fpuen();
nkeynes@991
  2252
    load_reg( REG_EAX, Rm );
nkeynes@901
  2253
    if( sh4_x86.double_size ) {
nkeynes@991
  2254
        check_ralign64( REG_EAX );
nkeynes@991
  2255
        MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2256
        store_dr0( REG_EAX, FRn );
nkeynes@991
  2257
        load_reg( REG_EAX, Rm );
nkeynes@991
  2258
        LEAL_r32disp_r32( REG_EAX, 4, REG_EAX );
nkeynes@991
  2259
        MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2260
        store_dr1( REG_EAX, FRn );
nkeynes@991
  2261
        ADDL_imms_rbpdisp( 8, REG_OFFSET(r[Rm]) );
nkeynes@901
  2262
    } else {
nkeynes@991
  2263
        check_ralign32( REG_EAX );
nkeynes@991
  2264
        MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2265
        store_fr( REG_EAX, FRn );
nkeynes@991
  2266
        ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@901
  2267
    }
nkeynes@417
  2268
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@377
  2269
:}
nkeynes@377
  2270
FMOV FRm, @(R0, Rn) {:  
nkeynes@671
  2271
    COUNT_INST(I_FMOV4);
nkeynes@586
  2272
    check_fpuen();
nkeynes@991
  2273
    load_reg( REG_EAX, Rn );
nkeynes@991
  2274
    ADDL_rbpdisp_r32( REG_OFFSET(r[0]), REG_EAX );
nkeynes@901
  2275
    if( sh4_x86.double_size ) {
nkeynes@991
  2276
        check_walign64( REG_EAX );
nkeynes@991
  2277
        load_dr0( REG_EDX, FRm );
nkeynes@991
  2278
        MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  2279
        load_reg( REG_EAX, Rn );
nkeynes@991
  2280
        ADDL_rbpdisp_r32( REG_OFFSET(r[0]), REG_EAX );
nkeynes@991
  2281
        LEAL_r32disp_r32( REG_EAX, 4, REG_EAX );
nkeynes@991
  2282
        load_dr1( REG_EDX, FRm );
nkeynes@991
  2283
        MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@901
  2284
    } else {
nkeynes@991
  2285
        check_walign32( REG_EAX );
nkeynes@991
  2286
        load_fr( REG_EDX, FRm );
nkeynes@991
  2287
        MEM_WRITE_LONG( REG_EAX, REG_EDX ); // 12
nkeynes@901
  2288
    }
nkeynes@417
  2289
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@377
  2290
:}
nkeynes@377
  2291
FMOV @(R0, Rm), FRn {:  
nkeynes@671
  2292
    COUNT_INST(I_FMOV7);
nkeynes@586
  2293
    check_fpuen();
nkeynes@991
  2294
    load_reg( REG_EAX, Rm );
nkeynes@991
  2295
    ADDL_rbpdisp_r32( REG_OFFSET(r[0]), REG_EAX );
nkeynes@901
  2296
    if( sh4_x86.double_size ) {
nkeynes@991
  2297
        check_ralign64( REG_EAX );
nkeynes@991
  2298
        MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2299
        store_dr0( REG_EAX, FRn );
nkeynes@991
  2300
        load_reg( REG_EAX, Rm );
nkeynes@991
  2301
        ADDL_rbpdisp_r32( REG_OFFSET(r[0]), REG_EAX );
nkeynes@991
  2302
        LEAL_r32disp_r32( REG_EAX, 4, REG_EAX );
nkeynes@991
  2303
        MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2304
        store_dr1( REG_EAX, FRn );
nkeynes@901
  2305
    } else {
nkeynes@991
  2306
        check_ralign32( REG_EAX );
nkeynes@991
  2307
        MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2308
        store_fr( REG_EAX, FRn );
nkeynes@901
  2309
    }
nkeynes@417
  2310
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@377
  2311
:}
nkeynes@377
  2312
FLDI0 FRn {:  /* IFF PR=0 */
nkeynes@671
  2313
    COUNT_INST(I_FLDI0);
nkeynes@377
  2314
    check_fpuen();
nkeynes@901
  2315
    if( sh4_x86.double_prec == 0 ) {
nkeynes@991
  2316
        XORL_r32_r32( REG_EAX, REG_EAX );
nkeynes@991
  2317
        store_fr( REG_EAX, FRn );
nkeynes@901
  2318
    }
nkeynes@417
  2319
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@377
  2320
:}
nkeynes@377
  2321
FLDI1 FRn {:  /* IFF PR=0 */
nkeynes@671
  2322
    COUNT_INST(I_FLDI1);
nkeynes@377
  2323
    check_fpuen();
nkeynes@901
  2324
    if( sh4_x86.double_prec == 0 ) {
nkeynes@995
  2325
        MOVL_imm32_r32( 0x3F800000, REG_EAX );
nkeynes@991
  2326
        store_fr( REG_EAX, FRn );
nkeynes@901
  2327
    }
nkeynes@377
  2328
:}
nkeynes@377
  2329
nkeynes@377
  2330
FLOAT FPUL, FRn {:  
nkeynes@671
  2331
    COUNT_INST(I_FLOAT);
nkeynes@377
  2332
    check_fpuen();
nkeynes@991
  2333
    FILD_rbpdisp(R_FPUL);
nkeynes@901
  2334
    if( sh4_x86.double_prec ) {
nkeynes@901
  2335
        pop_dr( FRn );
nkeynes@901
  2336
    } else {
nkeynes@901
  2337
        pop_fr( FRn );
nkeynes@901
  2338
    }
nkeynes@377
  2339
:}
nkeynes@377
  2340
FTRC FRm, FPUL {:  
nkeynes@671
  2341
    COUNT_INST(I_FTRC);
nkeynes@377
  2342
    check_fpuen();
nkeynes@901
  2343
    if( sh4_x86.double_prec ) {
nkeynes@901
  2344
        push_dr( FRm );
nkeynes@901
  2345
    } else {
nkeynes@901
  2346
        push_fr( FRm );
nkeynes@901
  2347
    }
nkeynes@1197
  2348
    MOVP_immptr_rptr( &min_int, REG_ECX );
nkeynes@1197
  2349
    FILD_r32disp( REG_ECX, 0 );
nkeynes@1197
  2350
    FCOMIP_st(1);              
nkeynes@1197
  2351
    JAE_label( sat );     
nkeynes@1197
  2352
    JP_label( sat2 );       
nkeynes@995
  2353
    MOVP_immptr_rptr( &max_int, REG_ECX );
nkeynes@991
  2354
    FILD_r32disp( REG_ECX, 0 );
nkeynes@388
  2355
    FCOMIP_st(1);
nkeynes@1197
  2356
    JNA_label( sat3 );
nkeynes@995
  2357
    MOVP_immptr_rptr( &save_fcw, REG_EAX );
nkeynes@991
  2358
    FNSTCW_r32disp( REG_EAX, 0 );
nkeynes@995
  2359
    MOVP_immptr_rptr( &trunc_fcw, REG_EDX );
nkeynes@991
  2360
    FLDCW_r32disp( REG_EDX, 0 );
nkeynes@995
  2361
    FISTP_rbpdisp(R_FPUL);             
nkeynes@991
  2362
    FLDCW_r32disp( REG_EAX, 0 );
nkeynes@995
  2363
    JMP_label(end);             
nkeynes@388
  2364
nkeynes@388
  2365
    JMP_TARGET(sat);
nkeynes@388
  2366
    JMP_TARGET(sat2);
nkeynes@1197
  2367
    JMP_TARGET(sat3);
nkeynes@991
  2368
    MOVL_r32disp_r32( REG_ECX, 0, REG_ECX ); // 2
nkeynes@995
  2369
    MOVL_r32_rbpdisp( REG_ECX, R_FPUL );
nkeynes@388
  2370
    FPOP_st();
nkeynes@388
  2371
    JMP_TARGET(end);
nkeynes@417
  2372
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@377
  2373
:}
nkeynes@377
  2374
FLDS FRm, FPUL {:  
nkeynes@671
  2375
    COUNT_INST(I_FLDS);
nkeynes@377
  2376
    check_fpuen();
nkeynes@991
  2377
    load_fr( REG_EAX, FRm );
nkeynes@995
  2378
    MOVL_r32_rbpdisp( REG_EAX, R_FPUL );
nkeynes@377
  2379
:}
nkeynes@377
  2380
FSTS FPUL, FRn {:  
nkeynes@671
  2381
    COUNT_INST(I_FSTS);
nkeynes@377
  2382
    check_fpuen();
nkeynes@995
  2383
    MOVL_rbpdisp_r32( R_FPUL, REG_EAX );
nkeynes@991
  2384
    store_fr( REG_EAX, FRn );
nkeynes@377
  2385
:}
nkeynes@377
  2386
FCNVDS FRm, FPUL {:  
nkeynes@671
  2387
    COUNT_INST(I_FCNVDS);
nkeynes@377
  2388
    check_fpuen();
nkeynes@901
  2389
    if( sh4_x86.double_prec ) {
nkeynes@901
  2390
        push_dr( FRm );
nkeynes@901
  2391
        pop_fpul();
nkeynes@901
  2392
    }
nkeynes@377
  2393
:}
nkeynes@377
  2394
FCNVSD FPUL, FRn {:  
nkeynes@671
  2395
    COUNT_INST(I_FCNVSD);
nkeynes@377
  2396
    check_fpuen();
nkeynes@901
  2397
    if( sh4_x86.double_prec ) {
nkeynes@901
  2398
        push_fpul();
nkeynes@901
  2399
        pop_dr( FRn );
nkeynes@901
  2400
    }
nkeynes@377
  2401
:}
nkeynes@375
  2402
nkeynes@359
  2403
/* Floating point instructions */
nkeynes@374
  2404
FABS FRn {:  
nkeynes@671
  2405
    COUNT_INST(I_FABS);
nkeynes@377
  2406
    check_fpuen();
nkeynes@901
  2407
    if( sh4_x86.double_prec ) {
nkeynes@901
  2408
        push_dr(FRn);
nkeynes@901
  2409
        FABS_st0();
nkeynes@901
  2410
        pop_dr(FRn);
nkeynes@901
  2411
    } else {
nkeynes@901
  2412
        push_fr(FRn);
nkeynes@901
  2413
        FABS_st0();
nkeynes@901
  2414
        pop_fr(FRn);
nkeynes@901
  2415
    }
nkeynes@374
  2416
:}
nkeynes@377
  2417
FADD FRm, FRn {:  
nkeynes@671
  2418
    COUNT_INST(I_FADD);
nkeynes@377
  2419
    check_fpuen();
nkeynes@901
  2420
    if( sh4_x86.double_prec ) {
nkeynes@901
  2421
        push_dr(FRm);
nkeynes@901
  2422
        push_dr(FRn);
nkeynes@901
  2423
        FADDP_st(1);
nkeynes@901
  2424
        pop_dr(FRn);
nkeynes@901
  2425
    } else {
nkeynes@901
  2426
        push_fr(FRm);
nkeynes@901
  2427
        push_fr(FRn);
nkeynes@901
  2428
        FADDP_st(1);
nkeynes@901
  2429
        pop_fr(FRn);
nkeynes@901
  2430
    }
nkeynes@375
  2431
:}
nkeynes@377
  2432
FDIV FRm, FRn {:  
nkeynes@671
  2433
    COUNT_INST(I_FDIV);
nkeynes@377
  2434
    check_fpuen();
nkeynes@901
  2435
    if( sh4_x86.double_prec ) {
nkeynes@901
  2436
        push_dr(FRn);
nkeynes@901
  2437
        push_dr(FRm);
nkeynes@901
  2438
        FDIVP_st(1);
nkeynes@901
  2439
        pop_dr(FRn);
nkeynes@901
  2440
    } else {
nkeynes@901
  2441
        push_fr(FRn);
nkeynes@901
  2442
        push_fr(FRm);
nkeynes@901
  2443
        FDIVP_st(1);
nkeynes@901
  2444
        pop_fr(FRn);
nkeynes@901
  2445
    }
nkeynes@375
  2446
:}
nkeynes@375
  2447
FMAC FR0, FRm, FRn {:  
nkeynes@671
  2448
    COUNT_INST(I_FMAC);
nkeynes@377
  2449
    check_fpuen();
nkeynes@901
  2450
    if( sh4_x86.double_prec ) {
nkeynes@901
  2451
        push_dr( 0 );
nkeynes@901
  2452
        push_dr( FRm );
nkeynes@901
  2453
        FMULP_st(1);
nkeynes@901
  2454
        push_dr( FRn );
nkeynes@901
  2455
        FADDP_st(1);
nkeynes@901
  2456
        pop_dr( FRn );
nkeynes@901
  2457
    } else {
nkeynes@901
  2458
        push_fr( 0 );
nkeynes@901
  2459
        push_fr( FRm );
nkeynes@901
  2460
        FMULP_st(1);
nkeynes@901
  2461
        push_fr( FRn );
nkeynes@901
  2462
        FADDP_st(1);
nkeynes@901
  2463
        pop_fr( FRn );
nkeynes@901
  2464
    }
nkeynes@375
  2465
:}
nkeynes@375
  2466
nkeynes@377
  2467
FMUL FRm, FRn {:  
nkeynes@671
  2468
    COUNT_INST(I_FMUL);
nkeynes@377
  2469
    check_fpuen();
nkeynes@901
  2470
    if( sh4_x86.double_prec ) {
nkeynes@901
  2471
        push_dr(FRm);
nkeynes@901
  2472
        push_dr(FRn);
nkeynes@901
  2473
        FMULP_st(1);
nkeynes@901
  2474
        pop_dr(FRn);
nkeynes@901
  2475
    } else {
nkeynes@901
  2476
        push_fr(FRm);
nkeynes@901
  2477
        push_fr(FRn);
nkeynes@901
  2478
        FMULP_st(1);
nkeynes@901
  2479
        pop_fr(FRn);
nkeynes@901
  2480
    }
nkeynes@377
  2481
:}
nkeynes@377
  2482
FNEG FRn {:  
nkeynes@671
  2483
    COUNT_INST(I_FNEG);
nkeynes@377
  2484
    check_fpuen();
nkeynes@901
  2485
    if( sh4_x86.double_prec ) {
nkeynes@901
  2486
        push_dr(FRn);
nkeynes@901
  2487
        FCHS_st0();
nkeynes@901
  2488
        pop_dr(FRn);
nkeynes@901
  2489
    } else {
nkeynes@901
  2490
        push_fr(FRn);
nkeynes@901
  2491
        FCHS_st0();
nkeynes@901
  2492
        pop_fr(FRn);
nkeynes@901
  2493
    }
nkeynes@377
  2494
:}
nkeynes@377
  2495
FSRRA FRn {:  
nkeynes@671
  2496
    COUNT_INST(I_FSRRA);
nkeynes@377
  2497
    check_fpuen();
nkeynes@901
  2498
    if( sh4_x86.double_prec == 0 ) {
nkeynes@901
  2499
        FLD1_st0();
nkeynes@901
  2500
        push_fr(FRn);
nkeynes@901
  2501
        FSQRT_st0();
nkeynes@901
  2502
        FDIVP_st(1);
nkeynes@901
  2503
        pop_fr(FRn);
nkeynes@901
  2504
    }
nkeynes@377
  2505
:}
nkeynes@377
  2506
FSQRT FRn {:  
nkeynes@671
  2507
    COUNT_INST(I_FSQRT);
nkeynes@377
  2508
    check_fpuen();
nkeynes@901
  2509
    if( sh4_x86.double_prec ) {
nkeynes@901
  2510
        push_dr(FRn);
nkeynes@901
  2511
        FSQRT_st0();
nkeynes@901
  2512
        pop_dr(FRn);
nkeynes@901
  2513
    } else {
nkeynes@901
  2514
        push_fr(FRn);
nkeynes@901
  2515
        FSQRT_st0();
nkeynes@901
  2516
        pop_fr(FRn);
nkeynes@901
  2517
    }
nkeynes@377
  2518
:}
nkeynes@377
  2519
FSUB FRm, FRn {:  
nkeynes@671
  2520
    COUNT_INST(I_FSUB);
nkeynes@377
  2521
    check_fpuen();
nkeynes@901
  2522
    if( sh4_x86.double_prec ) {
nkeynes@901
  2523
        push_dr(FRn);
nkeynes@901
  2524
        push_dr(FRm);
nkeynes@901
  2525
        FSUBP_st(1);
nkeynes@901
  2526
        pop_dr(FRn);
nkeynes@901
  2527
    } else {
nkeynes@901
  2528
        push_fr(FRn);
nkeynes@901
  2529
        push_fr(FRm);
nkeynes@901
  2530
        FSUBP_st(1);
nkeynes@901
  2531
        pop_fr(FRn);
nkeynes@901
  2532
    }
nkeynes@377
  2533
:}
nkeynes@377
  2534
nkeynes@377
  2535
FCMP/EQ FRm, FRn {:  
nkeynes@671
  2536
    COUNT_INST(I_FCMPEQ);
nkeynes@377
  2537
    check_fpuen();
nkeynes@901
  2538
    if( sh4_x86.double_prec ) {
nkeynes@901
  2539
        push_dr(FRm);
nkeynes@901
  2540
        push_dr(FRn);
nkeynes@901
  2541
    } else {
nkeynes@901
  2542
        push_fr(FRm);
nkeynes@901
  2543
        push_fr(FRn);
nkeynes@901
  2544
    }
nkeynes@1197
  2545
    XORL_r32_r32(REG_EAX, REG_EAX);
nkeynes@1197
  2546
    XORL_r32_r32(REG_EDX, REG_EDX);
nkeynes@377
  2547
    FCOMIP_st(1);
nkeynes@1197
  2548
    SETCCB_cc_r8(X86_COND_NP, REG_DL);
nkeynes@1197
  2549
    CMOVCCL_cc_r32_r32(X86_COND_E, REG_EDX, REG_EAX);
nkeynes@1197
  2550
    MOVL_r32_rbpdisp(REG_EAX, R_T);
nkeynes@377
  2551
    FPOP_st();
nkeynes@1197
  2552
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@377
  2553
:}
nkeynes@377
  2554
FCMP/GT FRm, FRn {:  
nkeynes@671
  2555
    COUNT_INST(I_FCMPGT);
nkeynes@377
  2556
    check_fpuen();
nkeynes@901
  2557
    if( sh4_x86.double_prec ) {
nkeynes@901
  2558
        push_dr(FRm);
nkeynes@901
  2559
        push_dr(FRn);
nkeynes@901
  2560
    } else {
nkeynes@901
  2561
        push_fr(FRm);
nkeynes@901
  2562
        push_fr(FRn);
nkeynes@901
  2563
    }
nkeynes@377
  2564
    FCOMIP_st(1);
nkeynes@377
  2565
    SETA_t();
nkeynes@377
  2566
    FPOP_st();
nkeynes@901
  2567
    sh4_x86.tstate = TSTATE_A;
nkeynes@377
  2568
:}
nkeynes@377
  2569
nkeynes@377
  2570
FSCA FPUL, FRn {:  
nkeynes@671
  2571
    COUNT_INST(I_FSCA);
nkeynes@377
  2572
    check_fpuen();
nkeynes@901
  2573
    if( sh4_x86.double_prec == 0 ) {
nkeynes@991
  2574
        LEAP_rbpdisp_rptr( REG_OFFSET(fr[0][FRn&0x0E]), REG_EDX );
nkeynes@995
  2575
        MOVL_rbpdisp_r32( R_FPUL, REG_EAX );
nkeynes@995
  2576
        CALL2_ptr_r32_r32( sh4_fsca, REG_EAX, REG_EDX );
nkeynes@901
  2577
    }
nkeynes@417
  2578
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@377
  2579
:}
nkeynes@377
  2580
FIPR FVm, FVn {:  
nkeynes@671
  2581
    COUNT_INST(I_FIPR);
nkeynes@377
  2582
    check_fpuen();
nkeynes@901
  2583
    if( sh4_x86.double_prec == 0 ) {
nkeynes@904
  2584
        if( sh4_x86.sse3_enabled ) {
nkeynes@991
  2585
            MOVAPS_rbpdisp_xmm( REG_OFFSET(fr[0][FVm<<2]), 4 );
nkeynes@991
  2586
            MULPS_rbpdisp_xmm( REG_OFFSET(fr[0][FVn<<2]), 4 );
nkeynes@903
  2587
            HADDPS_xmm_xmm( 4, 4 ); 
nkeynes@903
  2588
            HADDPS_xmm_xmm( 4, 4 );
nkeynes@991
  2589
            MOVSS_xmm_rbpdisp( 4, REG_OFFSET(fr[0][(FVn<<2)+2]) );
nkeynes@903
  2590
        } else {
nkeynes@904
  2591
            push_fr( FVm<<2 );
nkeynes@903
  2592
            push_fr( FVn<<2 );
nkeynes@903
  2593
            FMULP_st(1);
nkeynes@903
  2594
            push_fr( (FVm<<2)+1);
nkeynes@903
  2595
            push_fr( (FVn<<2)+1);
nkeynes@903
  2596
            FMULP_st(1);
nkeynes@903
  2597
            FADDP_st(1);
nkeynes@903
  2598
            push_fr( (FVm<<2)+2);
nkeynes@903
  2599
            push_fr( (FVn<<2)+2);
nkeynes@903
  2600
            FMULP_st(1);
nkeynes@903
  2601
            FADDP_st(1);
nkeynes@903
  2602
            push_fr( (FVm<<2)+3);
nkeynes@903
  2603
            push_fr( (FVn<<2)+3);
nkeynes@903
  2604
            FMULP_st(1);
nkeynes@903
  2605
            FADDP_st(1);
nkeynes@903
  2606
            pop_fr( (FVn<<2)+3);
nkeynes@904
  2607
        }
nkeynes@901
  2608
    }
nkeynes@377
  2609
:}
nkeynes@377
  2610
FTRV XMTRX, FVn {:  
nkeynes@671
  2611
    COUNT_INST(I_FTRV);
nkeynes@377
  2612
    check_fpuen();
nkeynes@901
  2613
    if( sh4_x86.double_prec == 0 ) {
nkeynes@1194
  2614
        if( sh4_x86.sse3_enabled && sh4_x86.begin_callback == NULL ) {
nkeynes@1194
  2615
        	/* FIXME: For now, disable this inlining when we're running in shadow mode -
nkeynes@1194
  2616
        	 * it gives slightly different results from the emu core. Need to
nkeynes@1194
  2617
        	 * fix the precision so both give the right results.
nkeynes@1194
  2618
        	 */
nkeynes@991
  2619
            MOVAPS_rbpdisp_xmm( REG_OFFSET(fr[1][0]), 1 ); // M1  M0  M3  M2
nkeynes@991
  2620
            MOVAPS_rbpdisp_xmm( REG_OFFSET(fr[1][4]), 0 ); // M5  M4  M7  M6
nkeynes@991
  2621
            MOVAPS_rbpdisp_xmm( REG_OFFSET(fr[1][8]), 3 ); // M9  M8  M11 M10
nkeynes@991
  2622
            MOVAPS_rbpdisp_xmm( REG_OFFSET(fr[1][12]), 2 );// M13 M12 M15 M14
nkeynes@903
  2623
nkeynes@991
  2624
            MOVSLDUP_rbpdisp_xmm( REG_OFFSET(fr[0][FVn<<2]), 4 ); // V1 V1 V3 V3
nkeynes@991
  2625
            MOVSHDUP_rbpdisp_xmm( REG_OFFSET(fr[0][FVn<<2]), 5 ); // V0 V0 V2 V2
nkeynes@991
  2626
            MOV_xmm_xmm( 4, 6 );
nkeynes@991
  2627
            MOV_xmm_xmm( 5, 7 );
nkeynes@903
  2628
            MOVLHPS_xmm_xmm( 4, 4 );  // V1 V1 V1 V1
nkeynes@903
  2629
            MOVHLPS_xmm_xmm( 6, 6 );  // V3 V3 V3 V3
nkeynes@903
  2630
            MOVLHPS_xmm_xmm( 5, 5 );  // V0 V0 V0 V0
nkeynes@903
  2631
            MOVHLPS_xmm_xmm( 7, 7 );  // V2 V2 V2 V2
nkeynes@903
  2632
            MULPS_xmm_xmm( 0, 4 );
nkeynes@903
  2633
            MULPS_xmm_xmm( 1, 5 );
nkeynes@903
  2634
            MULPS_xmm_xmm( 2, 6 );
nkeynes@903
  2635
            MULPS_xmm_xmm( 3, 7 );
nkeynes@903
  2636
            ADDPS_xmm_xmm( 5, 4 );
nkeynes@903
  2637
            ADDPS_xmm_xmm( 7, 6 );
nkeynes@903
  2638
            ADDPS_xmm_xmm( 6, 4 );
nkeynes@991
  2639
            MOVAPS_xmm_rbpdisp( 4, REG_OFFSET(fr[0][FVn<<2]) );
nkeynes@903
  2640
        } else {
nkeynes@991
  2641
            LEAP_rbpdisp_rptr( REG_OFFSET(fr[0][FVn<<2]), REG_EAX );
nkeynes@995
  2642
            CALL1_ptr_r32( sh4_ftrv, REG_EAX );
nkeynes@903
  2643
        }
nkeynes@901
  2644
    }
nkeynes@417
  2645
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@377
  2646
:}
nkeynes@377
  2647
nkeynes@377
  2648
FRCHG {:  
nkeynes@671
  2649
    COUNT_INST(I_FRCHG);
nkeynes@377
  2650
    check_fpuen();
nkeynes@991
  2651
    XORL_imms_rbpdisp( FPSCR_FR, R_FPSCR );
nkeynes@995
  2652
    CALL_ptr( sh4_switch_fr_banks );
nkeynes@417
  2653
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@377
  2654
:}
nkeynes@377
  2655
FSCHG {:  
nkeynes@671
  2656
    COUNT_INST(I_FSCHG);
nkeynes@377
  2657
    check_fpuen();
nkeynes@991
  2658
    XORL_imms_rbpdisp( FPSCR_SZ, R_FPSCR);
nkeynes@991
  2659
    XORL_imms_rbpdisp( FPSCR_SZ, REG_OFFSET(xlat_sh4_mode) );
nkeynes@417
  2660
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@901
  2661
    sh4_x86.double_size = !sh4_x86.double_size;
nkeynes@1112
  2662
    sh4_x86.sh4_mode = sh4_x86.sh4_mode ^ FPSCR_SZ;
nkeynes@377
  2663
:}
nkeynes@359
  2664
nkeynes@359
  2665
/* Processor control instructions */
nkeynes@368
  2666
LDC Rm, SR {:
nkeynes@671
  2667
    COUNT_INST(I_LDCSR);
nkeynes@386
  2668
    if( sh4_x86.in_delay_slot ) {
nkeynes@386
  2669
	SLOTILLEGAL();
nkeynes@386
  2670
    } else {
nkeynes@386
  2671
	check_priv();
nkeynes@991
  2672
	load_reg( REG_EAX, Rm );
nkeynes@995
  2673
	CALL1_ptr_r32( sh4_write_sr, REG_EAX );
nkeynes@386
  2674
	sh4_x86.fpuen_checked = FALSE;
nkeynes@417
  2675
	sh4_x86.tstate = TSTATE_NONE;
nkeynes@1112
  2676
    sh4_x86.sh4_mode = SH4_MODE_UNKNOWN;
nkeynes@937
  2677
	return 2;
nkeynes@386
  2678
    }
nkeynes@368
  2679
:}
nkeynes@359
  2680
LDC Rm, GBR {: 
nkeynes@671
  2681
    COUNT_INST(I_LDC);
nkeynes@991
  2682
    load_reg( REG_EAX, Rm );
nkeynes@995
  2683
    MOVL_r32_rbpdisp( REG_EAX, R_GBR );
nkeynes@359
  2684
:}
nkeynes@359
  2685
LDC Rm, VBR {:  
nkeynes@671
  2686
    COUNT_INST(I_LDC);
nkeynes@386
  2687
    check_priv();
nkeynes@991
  2688
    load_reg( REG_EAX, Rm );
nkeynes@995
  2689
    MOVL_r32_rbpdisp( REG_EAX, R_VBR );
nkeynes@417
  2690
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2691
:}
nkeynes@359
  2692
LDC Rm, SSR {:  
nkeynes@671
  2693
    COUNT_INST(I_LDC);
nkeynes@386
  2694
    check_priv();
nkeynes@991
  2695
    load_reg( REG_EAX, Rm );
nkeynes@995
  2696
    MOVL_r32_rbpdisp( REG_EAX, R_SSR );
nkeynes@417
  2697
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2698
:}
nkeynes@359
  2699
LDC Rm, SGR {:  
nkeynes@671
  2700
    COUNT_INST(I_LDC);
nkeynes@386
  2701
    check_priv();
nkeynes@991
  2702
    load_reg( REG_EAX, Rm );
nkeynes@995
  2703
    MOVL_r32_rbpdisp( REG_EAX, R_SGR );
nkeynes@417
  2704
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2705
:}
nkeynes@359
  2706
LDC Rm, SPC {:  
nkeynes@671
  2707
    COUNT_INST(I_LDC);
nkeynes@386
  2708
    check_priv();
nkeynes@991
  2709
    load_reg( REG_EAX, Rm );
nkeynes@995
  2710
    MOVL_r32_rbpdisp( REG_EAX, R_SPC );
nkeynes@417
  2711
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2712
:}
nkeynes@359
  2713
LDC Rm, DBR {:  
nkeynes@671
  2714
    COUNT_INST(I_LDC);
nkeynes@386
  2715
    check_priv();
nkeynes@991
  2716
    load_reg( REG_EAX, Rm );
nkeynes@995
  2717
    MOVL_r32_rbpdisp( REG_EAX, R_DBR );
nkeynes@417
  2718
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2719
:}
nkeynes@374
  2720
LDC Rm, Rn_BANK {:  
nkeynes@671
  2721
    COUNT_INST(I_LDC);
nkeynes@386
  2722
    check_priv();
nkeynes@991
  2723
    load_reg( REG_EAX, Rm );
nkeynes@995
  2724
    MOVL_r32_rbpdisp( REG_EAX, REG_OFFSET(r_bank[Rn_BANK]) );
nkeynes@417
  2725
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@374
  2726
:}
nkeynes@359
  2727
LDC.L @Rm+, GBR {:  
nkeynes@671
  2728
    COUNT_INST(I_LDCM);
nkeynes@991
  2729
    load_reg( REG_EAX, Rm );
nkeynes@991
  2730
    check_ralign32( REG_EAX );
nkeynes@991
  2731
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2732
    ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2733
    MOVL_r32_rbpdisp( REG_EAX, R_GBR );
nkeynes@417
  2734
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2735
:}
nkeynes@368
  2736
LDC.L @Rm+, SR {:
nkeynes@671
  2737
    COUNT_INST(I_LDCSRM);
nkeynes@386
  2738
    if( sh4_x86.in_delay_slot ) {
nkeynes@386
  2739
	SLOTILLEGAL();
nkeynes@386
  2740
    } else {
nkeynes@586
  2741
	check_priv();
nkeynes@991
  2742
	load_reg( REG_EAX, Rm );
nkeynes@991
  2743
	check_ralign32( REG_EAX );
nkeynes@991
  2744
	MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2745
	ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2746
	CALL1_ptr_r32( sh4_write_sr, REG_EAX );
nkeynes@386
  2747
	sh4_x86.fpuen_checked = FALSE;
nkeynes@417
  2748
	sh4_x86.tstate = TSTATE_NONE;
nkeynes@1112
  2749
    sh4_x86.sh4_mode = SH4_MODE_UNKNOWN;
nkeynes@937
  2750
	return 2;
nkeynes@386
  2751
    }
nkeynes@359
  2752
:}
nkeynes@359
  2753
LDC.L @Rm+, VBR {:  
nkeynes@671
  2754
    COUNT_INST(I_LDCM);
nkeynes@586
  2755
    check_priv();
nkeynes@991
  2756
    load_reg( REG_EAX, Rm );
nkeynes@991
  2757
    check_ralign32( REG_EAX );
nkeynes@991
  2758
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2759
    ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2760
    MOVL_r32_rbpdisp( REG_EAX, R_VBR );
nkeynes@417
  2761
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2762
:}
nkeynes@359
  2763
LDC.L @Rm+, SSR {:
nkeynes@671
  2764
    COUNT_INST(I_LDCM);
nkeynes@586
  2765
    check_priv();
nkeynes@991
  2766
    load_reg( REG_EAX, Rm );
nkeynes@991
  2767
    check_ralign32( REG_EAX );
nkeynes@991
  2768
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2769
    ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2770
    MOVL_r32_rbpdisp( REG_EAX, R_SSR );
nkeynes@417
  2771
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2772
:}
nkeynes@359
  2773
LDC.L @Rm+, SGR {:  
nkeynes@671
  2774
    COUNT_INST(I_LDCM);
nkeynes@586
  2775
    check_priv();
nkeynes@991
  2776
    load_reg( REG_EAX, Rm );
nkeynes@991
  2777
    check_ralign32( REG_EAX );
nkeynes@991
  2778
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2779
    ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2780
    MOVL_r32_rbpdisp( REG_EAX, R_SGR );
nkeynes@417
  2781
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2782
:}
nkeynes@359
  2783
LDC.L @Rm+, SPC {:  
nkeynes@671
  2784
    COUNT_INST(I_LDCM);
nkeynes@586
  2785
    check_priv();
nkeynes@991
  2786
    load_reg( REG_EAX, Rm );
nkeynes@991
  2787
    check_ralign32( REG_EAX );
nkeynes@991
  2788
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2789
    ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2790
    MOVL_r32_rbpdisp( REG_EAX, R_SPC );
nkeynes@417
  2791
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2792
:}
nkeynes@359
  2793
LDC.L @Rm+, DBR {:  
nkeynes@671
  2794
    COUNT_INST(I_LDCM);
nkeynes@586
  2795
    check_priv();
nkeynes@991
  2796
    load_reg( REG_EAX, Rm );
nkeynes@991
  2797
    check_ralign32( REG_EAX );
nkeynes@991
  2798
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2799
    ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2800
    MOVL_r32_rbpdisp( REG_EAX, R_DBR );
nkeynes@417
  2801
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2802
:}
nkeynes@359
  2803
LDC.L @Rm+, Rn_BANK {:  
nkeynes@671
  2804
    COUNT_INST(I_LDCM);
nkeynes@586
  2805
    check_priv();
nkeynes@991
  2806
    load_reg( REG_EAX, Rm );
nkeynes@991
  2807
    check_ralign32( REG_EAX );
nkeynes@991
  2808
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2809
    ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2810
    MOVL_r32_rbpdisp( REG_EAX, REG_OFFSET(r_bank[Rn_BANK]) );
nkeynes@417
  2811
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2812
:}
nkeynes@626
  2813
LDS Rm, FPSCR {:
nkeynes@673
  2814
    COUNT_INST(I_LDSFPSCR);
nkeynes@626
  2815
    check_fpuen();
nkeynes@991
  2816
    load_reg( REG_EAX, Rm );
nkeynes@995
  2817
    CALL1_ptr_r32( sh4_write_fpscr, REG_EAX );
nkeynes@417
  2818
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@1112
  2819
    sh4_x86.sh4_mode = SH4_MODE_UNKNOWN;
nkeynes@901
  2820
    return 2;
nkeynes@359
  2821
:}
nkeynes@359
  2822
LDS.L @Rm+, FPSCR {:  
nkeynes@673
  2823
    COUNT_INST(I_LDSFPSCRM);
nkeynes@626
  2824
    check_fpuen();
nkeynes@991
  2825
    load_reg( REG_EAX, Rm );
nkeynes@991
  2826
    check_ralign32( REG_EAX );
nkeynes@991
  2827
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2828
    ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2829
    CALL1_ptr_r32( sh4_write_fpscr, REG_EAX );
nkeynes@417
  2830
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@1112
  2831
    sh4_x86.sh4_mode = SH4_MODE_UNKNOWN;
nkeynes@901
  2832
    return 2;
nkeynes@359
  2833
:}
nkeynes@359
  2834
LDS Rm, FPUL {:  
nkeynes@671
  2835
    COUNT_INST(I_LDS);
nkeynes@626
  2836
    check_fpuen();
nkeynes@991
  2837
    load_reg( REG_EAX, Rm );
nkeynes@995
  2838
    MOVL_r32_rbpdisp( REG_EAX, R_FPUL );
nkeynes@359
  2839
:}
nkeynes@359
  2840
LDS.L @Rm+, FPUL {:  
nkeynes@671
  2841
    COUNT_INST(I_LDSM);
nkeynes@626
  2842
    check_fpuen();
nkeynes@991
  2843
    load_reg( REG_EAX, Rm );
nkeynes@991
  2844
    check_ralign32( REG_EAX );
nkeynes@991
  2845
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2846
    ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2847
    MOVL_r32_rbpdisp( REG_EAX, R_FPUL );
nkeynes@417
  2848
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2849
:}
nkeynes@359
  2850
LDS Rm, MACH {: 
nkeynes@671
  2851
    COUNT_INST(I_LDS);
nkeynes@991
  2852
    load_reg( REG_EAX, Rm );
nkeynes@995
  2853
    MOVL_r32_rbpdisp( REG_EAX, R_MACH );
nkeynes@359
  2854
:}
nkeynes@359
  2855
LDS.L @Rm+, MACH {:  
nkeynes@671
  2856
    COUNT_INST(I_LDSM);
nkeynes@991
  2857
    load_reg( REG_EAX, Rm );
nkeynes@991
  2858
    check_ralign32( REG_EAX );
nkeynes@991
  2859
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2860
    ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2861
    MOVL_r32_rbpdisp( REG_EAX, R_MACH );
nkeynes@417
  2862
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2863
:}
nkeynes@359
  2864
LDS Rm, MACL {:  
nkeynes@671
  2865
    COUNT_INST(I_LDS);
nkeynes@991
  2866
    load_reg( REG_EAX, Rm );
nkeynes@995
  2867
    MOVL_r32_rbpdisp( REG_EAX, R_MACL );
nkeynes@359
  2868
:}
nkeynes@359
  2869
LDS.L @Rm+, MACL {:  
nkeynes@671
  2870
    COUNT_INST(I_LDSM);
nkeynes@991
  2871
    load_reg( REG_EAX, Rm );
nkeynes@991
  2872
    check_ralign32( REG_EAX );
nkeynes@991
  2873
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2874
    ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2875
    MOVL_r32_rbpdisp( REG_EAX, R_MACL );
nkeynes@417
  2876
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2877
:}
nkeynes@359
  2878
LDS Rm, PR {:  
nkeynes@671
  2879
    COUNT_INST(I_LDS);
nkeynes@991
  2880
    load_reg( REG_EAX, Rm );
nkeynes@995
  2881
    MOVL_r32_rbpdisp( REG_EAX, R_PR );
nkeynes@359
  2882
:}
nkeynes@359
  2883
LDS.L @Rm+, PR {:  
nkeynes@671
  2884
    COUNT_INST(I_LDSM);
nkeynes@991
  2885
    load_reg( REG_EAX, Rm );
nkeynes@991
  2886
    check_ralign32( REG_EAX );
nkeynes@991
  2887
    MEM_READ_LONG( REG_EAX, REG_EAX );
nkeynes@991
  2888
    ADDL_imms_rbpdisp( 4, REG_OFFSET(r[Rm]) );
nkeynes@995
  2889
    MOVL_r32_rbpdisp( REG_EAX, R_PR );
nkeynes@417
  2890
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2891
:}
nkeynes@550
  2892
LDTLB {:  
nkeynes@671
  2893
    COUNT_INST(I_LDTLB);
nkeynes@995
  2894
    CALL_ptr( MMU_ldtlb );
nkeynes@875
  2895
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@550
  2896
:}
nkeynes@671
  2897
OCBI @Rn {:
nkeynes@671
  2898
    COUNT_INST(I_OCBI);
nkeynes@671
  2899
:}
nkeynes@671
  2900
OCBP @Rn {:
nkeynes@671
  2901
    COUNT_INST(I_OCBP);
nkeynes@671
  2902
:}
nkeynes@671
  2903
OCBWB @Rn {:
nkeynes@671
  2904
    COUNT_INST(I_OCBWB);
nkeynes@671
  2905
:}
nkeynes@374
  2906
PREF @Rn {:
nkeynes@671
  2907
    COUNT_INST(I_PREF);
nkeynes@991
  2908
    load_reg( REG_EAX, Rn );
nkeynes@991
  2909
    MEM_PREFETCH( REG_EAX );
nkeynes@417
  2910
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@374
  2911
:}
nkeynes@388
  2912
SLEEP {: 
nkeynes@671
  2913
    COUNT_INST(I_SLEEP);
nkeynes@388
  2914
    check_priv();
nkeynes@995
  2915
    CALL_ptr( sh4_sleep );
nkeynes@417
  2916
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@590
  2917
    sh4_x86.in_delay_slot = DELAY_NONE;
nkeynes@408
  2918
    return 2;
nkeynes@388
  2919
:}
nkeynes@386
  2920
STC SR, Rn {:
nkeynes@671
  2921
    COUNT_INST(I_STCSR);
nkeynes@386
  2922
    check_priv();
nkeynes@995
  2923
    CALL_ptr(sh4_read_sr);
nkeynes@991
  2924
    store_reg( REG_EAX, Rn );
nkeynes@417
  2925
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2926
:}
nkeynes@359
  2927
STC GBR, Rn {:  
nkeynes@671
  2928
    COUNT_INST(I_STC);
nkeynes@995
  2929
    MOVL_rbpdisp_r32( R_GBR, REG_EAX );
nkeynes@991
  2930
    store_reg( REG_EAX, Rn );
nkeynes@359
  2931
:}
nkeynes@359
  2932
STC VBR, Rn {:  
nkeynes@671
  2933
    COUNT_INST(I_STC);
nkeynes@386
  2934
    check_priv();
nkeynes@995
  2935
    MOVL_rbpdisp_r32( R_VBR, REG_EAX );
nkeynes@991
  2936
    store_reg( REG_EAX, Rn );
nkeynes@417
  2937
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2938
:}
nkeynes@359
  2939
STC SSR, Rn {:  
nkeynes@671
  2940
    COUNT_INST(I_STC);
nkeynes@386
  2941
    check_priv();
nkeynes@995
  2942
    MOVL_rbpdisp_r32( R_SSR, REG_EAX );
nkeynes@991
  2943
    store_reg( REG_EAX, Rn );
nkeynes@417
  2944
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2945
:}
nkeynes@359
  2946
STC SPC, Rn {:  
nkeynes@671
  2947
    COUNT_INST(I_STC);
nkeynes@386
  2948
    check_priv();
nkeynes@995
  2949
    MOVL_rbpdisp_r32( R_SPC, REG_EAX );
nkeynes@991
  2950
    store_reg( REG_EAX, Rn );
nkeynes@417
  2951
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2952
:}
nkeynes@359
  2953
STC SGR, Rn {:  
nkeynes@671
  2954
    COUNT_INST(I_STC);
nkeynes@386
  2955
    check_priv();
nkeynes@995
  2956
    MOVL_rbpdisp_r32( R_SGR, REG_EAX );
nkeynes@991
  2957
    store_reg( REG_EAX, Rn );
nkeynes@417
  2958
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2959
:}
nkeynes@359
  2960
STC DBR, Rn {:  
nkeynes@671
  2961
    COUNT_INST(I_STC);
nkeynes@386
  2962
    check_priv();
nkeynes@995
  2963
    MOVL_rbpdisp_r32( R_DBR, REG_EAX );
nkeynes@991
  2964
    store_reg( REG_EAX, Rn );
nkeynes@417
  2965
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2966
:}
nkeynes@374
  2967
STC Rm_BANK, Rn {:
nkeynes@671
  2968
    COUNT_INST(I_STC);
nkeynes@386
  2969
    check_priv();
nkeynes@995
  2970
    MOVL_rbpdisp_r32( REG_OFFSET(r_bank[Rm_BANK]), REG_EAX );
nkeynes@991
  2971
    store_reg( REG_EAX, Rn );
nkeynes@417
  2972
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2973
:}
nkeynes@374
  2974
STC.L SR, @-Rn {:
nkeynes@671
  2975
    COUNT_INST(I_STCSRM);
nkeynes@586
  2976
    check_priv();
nkeynes@995
  2977
    CALL_ptr( sh4_read_sr );
nkeynes@991
  2978
    MOVL_r32_r32( REG_EAX, REG_EDX );
nkeynes@991
  2979
    load_reg( REG_EAX, Rn );
nkeynes@991
  2980
    check_walign32( REG_EAX );
nkeynes@991
  2981
    LEAL_r32disp_r32( REG_EAX, -4, REG_EAX );
nkeynes@991
  2982
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  2983
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  2984
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2985
:}
nkeynes@359
  2986
STC.L VBR, @-Rn {:  
nkeynes@671
  2987
    COUNT_INST(I_STCM);
nkeynes@586
  2988
    check_priv();
nkeynes@991
  2989
    load_reg( REG_EAX, Rn );
nkeynes@991
  2990
    check_walign32( REG_EAX );
nkeynes@991
  2991
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@995
  2992
    MOVL_rbpdisp_r32( R_VBR, REG_EDX );
nkeynes@991
  2993
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  2994
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  2995
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  2996
:}
nkeynes@359
  2997
STC.L SSR, @-Rn {:  
nkeynes@671
  2998
    COUNT_INST(I_STCM);
nkeynes@586
  2999
    check_priv();
nkeynes@991
  3000
    load_reg( REG_EAX, Rn );
nkeynes@991
  3001
    check_walign32( REG_EAX );
nkeynes@991
  3002
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@995
  3003
    MOVL_rbpdisp_r32( R_SSR, REG_EDX );
nkeynes@991
  3004
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  3005
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  3006
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  3007
:}
nkeynes@416
  3008
STC.L SPC, @-Rn {:
nkeynes@671
  3009
    COUNT_INST(I_STCM);
nkeynes@586
  3010
    check_priv();
nkeynes@991
  3011
    load_reg( REG_EAX, Rn );
nkeynes@991
  3012
    check_walign32( REG_EAX );
nkeynes@991
  3013
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@995
  3014
    MOVL_rbpdisp_r32( R_SPC, REG_EDX );
nkeynes@991
  3015
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  3016
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  3017
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  3018
:}
nkeynes@359
  3019
STC.L SGR, @-Rn {:  
nkeynes@671
  3020
    COUNT_INST(I_STCM);
nkeynes@586
  3021
    check_priv();
nkeynes@991
  3022
    load_reg( REG_EAX, Rn );
nkeynes@991
  3023
    check_walign32( REG_EAX );
nkeynes@991
  3024
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@995
  3025
    MOVL_rbpdisp_r32( R_SGR, REG_EDX );
nkeynes@991
  3026
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  3027
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  3028
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  3029
:}
nkeynes@359
  3030
STC.L DBR, @-Rn {:  
nkeynes@671
  3031
    COUNT_INST(I_STCM);
nkeynes@586
  3032
    check_priv();
nkeynes@991
  3033
    load_reg( REG_EAX, Rn );
nkeynes@991
  3034
    check_walign32( REG_EAX );
nkeynes@991
  3035
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@995
  3036
    MOVL_rbpdisp_r32( R_DBR, REG_EDX );
nkeynes@991
  3037
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  3038
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  3039
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  3040
:}
nkeynes@374
  3041
STC.L Rm_BANK, @-Rn {:  
nkeynes@671
  3042
    COUNT_INST(I_STCM);
nkeynes@586
  3043
    check_priv();
nkeynes@991
  3044
    load_reg( REG_EAX, Rn );
nkeynes@991
  3045
    check_walign32( REG_EAX );
nkeynes@991
  3046
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@995
  3047
    MOVL_rbpdisp_r32( REG_OFFSET(r_bank[Rm_BANK]), REG_EDX );
nkeynes@991
  3048
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  3049
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  3050
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@374
  3051
:}
nkeynes@359
  3052
STC.L GBR, @-Rn {:  
nkeynes@671
  3053
    COUNT_INST(I_STCM);
nkeynes@991
  3054
    load_reg( REG_EAX, Rn );
nkeynes@991
  3055
    check_walign32( REG_EAX );
nkeynes@991
  3056
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@995
  3057
    MOVL_rbpdisp_r32( R_GBR, REG_EDX );
nkeynes@991
  3058
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  3059
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  3060
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  3061
:}
nkeynes@359
  3062
STS FPSCR, Rn {:  
nkeynes@673
  3063
    COUNT_INST(I_STSFPSCR);
nkeynes@626
  3064
    check_fpuen();
nkeynes@995
  3065
    MOVL_rbpdisp_r32( R_FPSCR, REG_EAX );
nkeynes@991
  3066
    store_reg( REG_EAX, Rn );
nkeynes@359
  3067
:}
nkeynes@359
  3068
STS.L FPSCR, @-Rn {:  
nkeynes@673
  3069
    COUNT_INST(I_STSFPSCRM);
nkeynes@626
  3070
    check_fpuen();
nkeynes@991
  3071
    load_reg( REG_EAX, Rn );
nkeynes@991
  3072
    check_walign32( REG_EAX );
nkeynes@991
  3073
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@995
  3074
    MOVL_rbpdisp_r32( R_FPSCR, REG_EDX );
nkeynes@991
  3075
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  3076
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  3077
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  3078
:}
nkeynes@359
  3079
STS FPUL, Rn {:  
nkeynes@671
  3080
    COUNT_INST(I_STS);
nkeynes@626
  3081
    check_fpuen();
nkeynes@995
  3082
    MOVL_rbpdisp_r32( R_FPUL, REG_EAX );
nkeynes@991
  3083
    store_reg( REG_EAX, Rn );
nkeynes@359
  3084
:}
nkeynes@359
  3085
STS.L FPUL, @-Rn {:  
nkeynes@671
  3086
    COUNT_INST(I_STSM);
nkeynes@626
  3087
    check_fpuen();
nkeynes@991
  3088
    load_reg( REG_EAX, Rn );
nkeynes@991
  3089
    check_walign32( REG_EAX );
nkeynes@991
  3090
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@995
  3091
    MOVL_rbpdisp_r32( R_FPUL, REG_EDX );
nkeynes@991
  3092
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  3093
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  3094
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  3095
:}
nkeynes@359
  3096
STS MACH, Rn {:  
nkeynes@671
  3097
    COUNT_INST(I_STS);
nkeynes@995
  3098
    MOVL_rbpdisp_r32( R_MACH, REG_EAX );
nkeynes@991
  3099
    store_reg( REG_EAX, Rn );
nkeynes@359
  3100
:}
nkeynes@359
  3101
STS.L MACH, @-Rn {:  
nkeynes@671
  3102
    COUNT_INST(I_STSM);
nkeynes@991
  3103
    load_reg( REG_EAX, Rn );
nkeynes@991
  3104
    check_walign32( REG_EAX );
nkeynes@991
  3105
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@995
  3106
    MOVL_rbpdisp_r32( R_MACH, REG_EDX );
nkeynes@991
  3107
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  3108
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  3109
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  3110
:}
nkeynes@359
  3111
STS MACL, Rn {:  
nkeynes@671
  3112
    COUNT_INST(I_STS);
nkeynes@995
  3113
    MOVL_rbpdisp_r32( R_MACL, REG_EAX );
nkeynes@991
  3114
    store_reg( REG_EAX, Rn );
nkeynes@359
  3115
:}
nkeynes@359
  3116
STS.L MACL, @-Rn {:  
nkeynes@671
  3117
    COUNT_INST(I_STSM);
nkeynes@991
  3118
    load_reg( REG_EAX, Rn );
nkeynes@991
  3119
    check_walign32( REG_EAX );
nkeynes@991
  3120
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@995
  3121
    MOVL_rbpdisp_r32( R_MACL, REG_EDX );
nkeynes@991
  3122
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  3123
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  3124
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  3125
:}
nkeynes@359
  3126
STS PR, Rn {:  
nkeynes@671
  3127
    COUNT_INST(I_STS);
nkeynes@995
  3128
    MOVL_rbpdisp_r32( R_PR, REG_EAX );
nkeynes@991
  3129
    store_reg( REG_EAX, Rn );
nkeynes@359
  3130
:}
nkeynes@359
  3131
STS.L PR, @-Rn {:  
nkeynes@671
  3132
    COUNT_INST(I_STSM);
nkeynes@991
  3133
    load_reg( REG_EAX, Rn );
nkeynes@991
  3134
    check_walign32( REG_EAX );
nkeynes@991
  3135
    ADDL_imms_r32( -4, REG_EAX );
nkeynes@995
  3136
    MOVL_rbpdisp_r32( R_PR, REG_EDX );
nkeynes@991
  3137
    MEM_WRITE_LONG( REG_EAX, REG_EDX );
nkeynes@991
  3138
    ADDL_imms_rbpdisp( -4, REG_OFFSET(r[Rn]) );
nkeynes@417
  3139
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@359
  3140
:}
nkeynes@359
  3141
nkeynes@671
  3142
NOP {: 
nkeynes@671
  3143
    COUNT_INST(I_NOP);
nkeynes@671
  3144
    /* Do nothing. Well, we could emit an 0x90, but what would really be the point? */ 
nkeynes@671
  3145
:}
nkeynes@359
  3146
%%
nkeynes@590
  3147
    sh4_x86.in_delay_slot = DELAY_NONE;
nkeynes@359
  3148
    return 0;
nkeynes@359
  3149
}
nkeynes@995
  3150
nkeynes@995
  3151
nkeynes@995
  3152
/**
nkeynes@995
  3153
 * The unwind methods only work if we compiled with DWARF2 frame information
nkeynes@995
  3154
 * (ie -fexceptions), otherwise we have to use the direct frame scan.
nkeynes@995
  3155
 */
nkeynes@995
  3156
#ifdef HAVE_EXCEPTIONS
nkeynes@995
  3157
#include <unwind.h>
nkeynes@995
  3158
nkeynes@995
  3159
struct UnwindInfo {
nkeynes@995
  3160
    uintptr_t block_start;
nkeynes@995
  3161
    uintptr_t block_end;
nkeynes@995
  3162
    void *pc;
nkeynes@995
  3163
};
nkeynes@995
  3164
nkeynes@995
  3165
static _Unwind_Reason_Code xlat_check_frame( struct _Unwind_Context *context, void *arg )
nkeynes@995
  3166
{
nkeynes@995
  3167
    struct UnwindInfo *info = arg;
nkeynes@995
  3168
    void *pc = (void *)_Unwind_GetIP(context);
nkeynes@995
  3169
    if( ((uintptr_t)pc) >= info->block_start && ((uintptr_t)pc) < info->block_end ) {
nkeynes@995
  3170
        info->pc = pc;
nkeynes@995
  3171
        return _URC_NORMAL_STOP;
nkeynes@995
  3172
    }
nkeynes@995
  3173
    return _URC_NO_REASON;
nkeynes@995
  3174
}
nkeynes@995
  3175
nkeynes@995
  3176
void *xlat_get_native_pc( void *code, uint32_t code_size )
nkeynes@995
  3177
{
nkeynes@995
  3178
    struct _Unwind_Exception exc;
nkeynes@995
  3179
    struct UnwindInfo info;
nkeynes@995
  3180
nkeynes@995
  3181
    info.pc = NULL;
nkeynes@995
  3182
    info.block_start = (uintptr_t)code;
nkeynes@995
  3183
    info.block_end = info.block_start + code_size;
nkeynes@995
  3184
    void *result = NULL;
nkeynes@995
  3185
    _Unwind_Backtrace( xlat_check_frame, &info );
nkeynes@995
  3186
    return info.pc;
nkeynes@995
  3187
}
nkeynes@995
  3188
#else
nkeynes@995
  3189
/* Assume this is an ia32 build - amd64 should always have dwarf information */
nkeynes@995
  3190
void *xlat_get_native_pc( void *code, uint32_t code_size )
nkeynes@995
  3191
{
nkeynes@995
  3192
    void *result = NULL;
nkeynes@1120
  3193
    __asm__(
nkeynes@995
  3194
        "mov %%ebp, %%eax\n\t"
nkeynes@995
  3195
        "mov $0x8, %%ecx\n\t"
nkeynes@995
  3196
        "mov %1, %%edx\n"
nkeynes@995
  3197
        "frame_loop: test %%eax, %%eax\n\t"
nkeynes@995
  3198
        "je frame_not_found\n\t"
nkeynes@995
  3199
        "cmp (%%eax), %%edx\n\t"
nkeynes@995
  3200
        "je frame_found\n\t"
nkeynes@995
  3201
        "sub $0x1, %%ecx\n\t"
nkeynes@995
  3202
        "je frame_not_found\n\t"
nkeynes@995
  3203
        "movl (%%eax), %%eax\n\t"
nkeynes@995
  3204
        "jmp frame_loop\n"
nkeynes@995
  3205
        "frame_found: movl 0x4(%%eax), %0\n"
nkeynes@995
  3206
        "frame_not_found:"
nkeynes@995
  3207
        : "=r" (result)
nkeynes@995
  3208
        : "r" (((uint8_t *)&sh4r) + 128 )
nkeynes@995
  3209
        : "eax", "ecx", "edx" );
nkeynes@995
  3210
    return result;
nkeynes@995
  3211
}
nkeynes@995
  3212
#endif
nkeynes@995
  3213
.