Search
lxdream.org :: lxdream/src/sh4/ia32mac.h
lxdream 0.9.1
released Jun 29
Download Now
filename src/sh4/ia32mac.h
changeset 561:533f6b478071
prev559:06714bc64271
next569:a1c49e1e8776
author nkeynes
date Tue Jan 01 05:08:38 2008 +0000 (12 years ago)
branchlxdream-mmu
permissions -rw-r--r--
last change Enable Id keyword on all source files
file annotate diff log raw
nkeynes@539
     1
/**
nkeynes@561
     2
 * $Id$
nkeynes@539
     3
 * 
nkeynes@539
     4
 * Provides the implementation for the ia32 ABI (eg prologue, epilogue, and
nkeynes@539
     5
 * calling conventions)
nkeynes@539
     6
 *
nkeynes@539
     7
 * Copyright (c) 2007 Nathan Keynes.
nkeynes@539
     8
 *
nkeynes@539
     9
 * This program is free software; you can redistribute it and/or modify
nkeynes@539
    10
 * it under the terms of the GNU General Public License as published by
nkeynes@539
    11
 * the Free Software Foundation; either version 2 of the License, or
nkeynes@539
    12
 * (at your option) any later version.
nkeynes@539
    13
 *
nkeynes@539
    14
 * This program is distributed in the hope that it will be useful,
nkeynes@539
    15
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
nkeynes@539
    16
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
nkeynes@539
    17
 * GNU General Public License for more details.
nkeynes@539
    18
 */
nkeynes@539
    19
nkeynes@539
    20
#ifndef __lxdream_ia32abi_H
nkeynes@539
    21
#define __lxdream_ia32abi_H 1
nkeynes@539
    22
nkeynes@539
    23
/*
 * Pass a host pointer to load_imm32() as a 32-bit immediate for register reg.
 * The argument is parenthesised so that the cast applies to the whole
 * expression rather than only to its first operand.
 * NOTE(review): the expansion still ends in ';' exactly as before, so that any
 * existing call site relying on it keeps compiling - do not use this macro as
 * the sole body of an unbraced if/else.
 */
#define load_ptr( reg, ptr ) load_imm32( reg, (uint32_t)(ptr) );
nkeynes@539
    24
nkeynes@539
    25
/**
nkeynes@539
    26
 * Note: clobbers EAX to make the indirect call - this isn't usually
nkeynes@539
    27
 * a problem since the callee will usually clobber it anyway.
nkeynes@539
    28
 */
nkeynes@539
    29
#define CALL_FUNC0_SIZE 13
nkeynes@539
    30
static inline void call_func0( void *ptr )
nkeynes@539
    31
{
nkeynes@539
    32
    int adj = (-sh4_x86.stack_posn)&0x0F;
nkeynes@539
    33
    SUB_imm8s_r32( adj, R_ESP );
nkeynes@539
    34
    load_imm32(R_EAX, (uint32_t)ptr);
nkeynes@539
    35
    CALL_r32(R_EAX);
nkeynes@539
    36
    ADD_imm8s_r32( adj, R_ESP );
nkeynes@539
    37
}
nkeynes@539
    38
nkeynes@539
    39
#define CALL_FUNC1_SIZE 14
nkeynes@539
    40
static inline void call_func1( void *ptr, int arg1 )
nkeynes@539
    41
{
nkeynes@539
    42
    int adj = (-4-sh4_x86.stack_posn)&0x0F;
nkeynes@539
    43
    SUB_imm8s_r32( adj, R_ESP );
nkeynes@539
    44
    PUSH_r32(arg1);
nkeynes@539
    45
    load_imm32(R_EAX, (uint32_t)ptr);
nkeynes@539
    46
    CALL_r32(R_EAX);
nkeynes@539
    47
    ADD_imm8s_r32( adj+4, R_ESP );
nkeynes@539
    48
    sh4_x86.stack_posn -= 4;
nkeynes@539
    49
}
nkeynes@539
    50
nkeynes@539
    51
#define CALL_FUNC2_SIZE 15
nkeynes@539
    52
static inline void call_func2( void *ptr, int arg1, int arg2 )
nkeynes@539
    53
{
nkeynes@539
    54
    int adj = (-8-sh4_x86.stack_posn)&0x0F;
nkeynes@539
    55
    SUB_imm8s_r32( adj, R_ESP );
nkeynes@539
    56
    PUSH_r32(arg2);
nkeynes@539
    57
    PUSH_r32(arg1);
nkeynes@539
    58
    load_imm32(R_EAX, (uint32_t)ptr);
nkeynes@539
    59
    CALL_r32(R_EAX);
nkeynes@539
    60
    ADD_imm8s_r32( adj+8, R_ESP );
nkeynes@539
    61
    sh4_x86.stack_posn -= 8;
nkeynes@539
    62
}
nkeynes@539
    63
nkeynes@539
    64
/**
nkeynes@539
    65
 * Write a double (64-bit) value into memory, with the first word in arg2a, and
nkeynes@539
    66
 * the second in arg2b
nkeynes@539
    67
 * NB: 30 bytes
nkeynes@539
    68
 */
nkeynes@539
    69
#define MEM_WRITE_DOUBLE_SIZE 36
nkeynes@539
    70
static inline void MEM_WRITE_DOUBLE( int addr, int arg2a, int arg2b )
nkeynes@539
    71
{
nkeynes@539
    72
    int adj = (-8-sh4_x86.stack_posn)&0x0F;
nkeynes@539
    73
    SUB_imm8s_r32( adj, R_ESP );
nkeynes@539
    74
    ADD_imm8s_r32( 4, addr );
nkeynes@539
    75
    PUSH_r32(arg2b);
nkeynes@539
    76
    PUSH_r32(addr);
nkeynes@539
    77
    ADD_imm8s_r32( -4, addr );
nkeynes@539
    78
    SUB_imm8s_r32( 8, R_ESP );
nkeynes@539
    79
    PUSH_r32(arg2a);
nkeynes@539
    80
    PUSH_r32(addr);
nkeynes@539
    81
    load_imm32(R_EAX, (uint32_t)sh4_write_long);
nkeynes@539
    82
    CALL_r32(R_EAX);
nkeynes@539
    83
    ADD_imm8s_r32( 16, R_ESP );
nkeynes@539
    84
    load_imm32(R_EAX, (uint32_t)sh4_write_long);
nkeynes@539
    85
    CALL_r32(R_EAX);
nkeynes@539
    86
    ADD_imm8s_r32( adj+8, R_ESP );
nkeynes@539
    87
    sh4_x86.stack_posn -= 16;
nkeynes@539
    88
}
nkeynes@539
    89
nkeynes@539
    90
/**
nkeynes@539
    91
 * Read a double (64-bit) value from memory, writing the first word into arg2a
nkeynes@539
    92
 * and the second into arg2b. The addr must not be in EAX
nkeynes@539
    93
 * NB: 27 bytes
nkeynes@539
    94
 */
nkeynes@539
    95
#define MEM_READ_DOUBLE_SIZE 36
nkeynes@539
    96
static inline void MEM_READ_DOUBLE( int addr, int arg2a, int arg2b )
nkeynes@539
    97
{
nkeynes@539
    98
    int adj = (-4-sh4_x86.stack_posn)&0x0F;
nkeynes@539
    99
    int adj2 = (-8-sh4_x86.stack_posn)&0x0F;
nkeynes@539
   100
    SUB_imm8s_r32( adj, R_ESP );
nkeynes@539
   101
    PUSH_r32(addr);
nkeynes@539
   102
    load_imm32(R_EAX, (uint32_t)sh4_read_long);
nkeynes@539
   103
    CALL_r32(R_EAX);
nkeynes@539
   104
    POP_r32(addr);
nkeynes@539
   105
    SUB_imm8s_r32( adj2-adj, R_ESP );
nkeynes@539
   106
    PUSH_r32(R_EAX);
nkeynes@539
   107
    ADD_imm8s_r32( 4, addr );
nkeynes@539
   108
    PUSH_r32(addr);
nkeynes@539
   109
    load_imm32(R_EAX, (uint32_t)sh4_read_long);
nkeynes@539
   110
    CALL_r32(R_EAX);
nkeynes@539
   111
    ADD_imm8s_r32( 4, R_ESP );
nkeynes@539
   112
    MOV_r32_r32( R_EAX, arg2b );
nkeynes@539
   113
    POP_r32(arg2a);
nkeynes@539
   114
    ADD_imm8s_r32( adj2, R_ESP );
nkeynes@539
   115
    sh4_x86.stack_posn -= 4;
nkeynes@539
   116
}
nkeynes@539
   117
nkeynes@539
   118
#define EXIT_BLOCK_SIZE 29
nkeynes@539
   119
nkeynes@539
   120
nkeynes@539
   121
/**
nkeynes@539
   122
 * Emit the 'start of block' assembly. Sets up the stack frame and save
nkeynes@539
   123
 * SI/DI as required
nkeynes@539
   124
 */
nkeynes@539
   125
void sh4_translate_begin_block( sh4addr_t pc ) 
nkeynes@539
   126
{
nkeynes@539
   127
    PUSH_r32(R_EBP);
nkeynes@539
   128
    /* mov &sh4r, ebp */
nkeynes@539
   129
    load_ptr( R_EBP, &sh4r );
nkeynes@539
   130
    
nkeynes@539
   131
    sh4_x86.in_delay_slot = FALSE;
nkeynes@539
   132
    sh4_x86.priv_checked = FALSE;
nkeynes@539
   133
    sh4_x86.fpuen_checked = FALSE;
nkeynes@539
   134
    sh4_x86.branch_taken = FALSE;
nkeynes@539
   135
    sh4_x86.backpatch_posn = 0;
nkeynes@539
   136
    sh4_x86.block_start_pc = pc;
nkeynes@539
   137
    sh4_x86.tstate = TSTATE_NONE;
nkeynes@539
   138
    sh4_x86.stack_posn = 8;
nkeynes@539
   139
}
nkeynes@539
   140
nkeynes@539
   141
/**
nkeynes@539
   142
 * Exit the block with sh4r.pc already written
nkeynes@539
   143
 * Bytes: 15
nkeynes@539
   144
 */
nkeynes@539
   145
void exit_block_pcset( pc )
nkeynes@539
   146
{
nkeynes@539
   147
    load_imm32( R_ECX, ((pc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
nkeynes@539
   148
    ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) );    // 6
nkeynes@539
   149
    load_spreg( R_EAX, REG_OFFSET(pc) );
nkeynes@539
   150
    call_func1(xlat_get_code,R_EAX);
nkeynes@539
   151
    POP_r32(R_EBP);
nkeynes@539
   152
    RET();
nkeynes@539
   153
}
nkeynes@539
   154
nkeynes@539
   155
/**
nkeynes@539
   156
 * Exit the block to an absolute PC
nkeynes@539
   157
 */
nkeynes@539
   158
void exit_block( sh4addr_t pc, sh4addr_t endpc )
nkeynes@539
   159
{
nkeynes@539
   160
    load_imm32( R_ECX, pc );                            // 5
nkeynes@539
   161
    store_spreg( R_ECX, REG_OFFSET(pc) );               // 3
nkeynes@539
   162
    MOV_moff32_EAX( xlat_get_lut_entry(pc) ); // 5
nkeynes@539
   163
    AND_imm8s_r32( 0xFC, R_EAX ); // 3
nkeynes@539
   164
    load_imm32( R_ECX, ((endpc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
nkeynes@539
   165
    ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) );     // 6
nkeynes@539
   166
    POP_r32(R_EBP);
nkeynes@539
   167
    RET();
nkeynes@539
   168
}
nkeynes@539
   169
nkeynes@539
   170
/**
nkeynes@539
   171
 * Write the block trailer (exception handling block)
nkeynes@539
   172
 */
nkeynes@539
   173
void sh4_translate_end_block( sh4addr_t pc ) {
nkeynes@539
   174
    if( sh4_x86.branch_taken == FALSE ) {
nkeynes@539
   175
	// Didn't exit unconditionally already, so write the termination here
nkeynes@539
   176
	exit_block( pc, pc );
nkeynes@539
   177
    }
nkeynes@539
   178
    if( sh4_x86.backpatch_posn != 0 ) {
nkeynes@559
   179
	unsigned int i;
nkeynes@559
   180
	// Raise exception
nkeynes@539
   181
	uint8_t *end_ptr = xlat_output;
nkeynes@539
   182
	load_spreg( R_ECX, REG_OFFSET(pc) );
nkeynes@539
   183
	ADD_r32_r32( R_EDX, R_ECX );
nkeynes@539
   184
	ADD_r32_r32( R_EDX, R_ECX );
nkeynes@539
   185
	store_spreg( R_ECX, REG_OFFSET(pc) );
nkeynes@539
   186
	MOV_moff32_EAX( &sh4_cpu_period );
nkeynes@539
   187
	MUL_r32( R_EDX );
nkeynes@539
   188
	ADD_r32_sh4r( R_EAX, REG_OFFSET(slice_cycle) );
nkeynes@539
   189
nkeynes@559
   190
        POP_r32(R_EDX);
nkeynes@559
   191
        call_func1( sh4_raise_exception, R_EDX );
nkeynes@539
   192
	load_spreg( R_EAX, REG_OFFSET(pc) );
nkeynes@539
   193
	call_func1(xlat_get_code,R_EAX);
nkeynes@539
   194
	POP_r32(R_EBP);
nkeynes@539
   195
	RET();
nkeynes@539
   196
nkeynes@559
   197
	// Exception already raised - just cleanup
nkeynes@559
   198
	uint8_t *preexc_ptr = xlat_output;
nkeynes@559
   199
	load_imm32( R_ECX, sh4_x86.block_start_pc );
nkeynes@559
   200
	ADD_r32_r32( R_EDX, R_ECX );
nkeynes@559
   201
	ADD_r32_r32( R_EDX, R_ECX );
nkeynes@559
   202
	store_spreg( R_ECX, REG_OFFSET(spc) );
nkeynes@559
   203
	MOV_moff32_EAX( &sh4_cpu_period );
nkeynes@559
   204
	MUL_r32( R_EDX );
nkeynes@559
   205
	ADD_r32_sh4r( R_EAX, REG_OFFSET(slice_cycle) );
nkeynes@559
   206
	load_spreg( R_EAX, REG_OFFSET(pc) );
nkeynes@559
   207
	call_func1(xlat_get_code,R_EAX);
nkeynes@559
   208
	POP_r32(R_EBP);
nkeynes@559
   209
	RET();
nkeynes@559
   210
nkeynes@559
   211
	for( i=0; i< sh4_x86.backpatch_posn; i++ ) {
nkeynes@559
   212
	    *sh4_x86.backpatch_list[i].fixup_addr =
nkeynes@559
   213
		xlat_output - ((uint8_t *)sh4_x86.backpatch_list[i].fixup_addr) - 4;
nkeynes@559
   214
	    if( sh4_x86.backpatch_list[i].exc_code == -1 ) {
nkeynes@559
   215
		load_imm32( R_EDX, sh4_x86.backpatch_list[i].fixup_icount );
nkeynes@559
   216
		int rel = preexc_ptr - xlat_output;
nkeynes@559
   217
		JMP_rel(rel);
nkeynes@559
   218
	    } else {
nkeynes@559
   219
		PUSH_imm32( sh4_x86.backpatch_list[i].exc_code );
nkeynes@559
   220
		load_imm32( R_EDX, sh4_x86.backpatch_list[i].fixup_icount );
nkeynes@559
   221
		int rel = end_ptr - xlat_output;
nkeynes@559
   222
		JMP_rel(rel);
nkeynes@559
   223
	    }
nkeynes@559
   224
	}
nkeynes@539
   225
    }
nkeynes@539
   226
}
nkeynes@539
   227
nkeynes@539
   228
#endif
nkeynes@539
   229
nkeynes@539
   230
.