Search
lxdream.org :: lxdream/src/sh4/sh4trans.c
lxdream 0.9.1
released Jun 29
Download Now
filename src/sh4/sh4trans.c
changeset 905:4c17ebd9ef5e
prev901:32c5cf5e206f
next906:268ea359f884
author nkeynes
date Wed Oct 29 23:51:58 2008 +0000 (15 years ago)
permissions -rw-r--r--
last change Use regparam calling conventions for all functions called from translated code,
along with a few other high-use functions. Can probably extend this to all functions,
but as it is this is a nice performance boost
file annotate diff log raw
nkeynes@359
     1
/**
nkeynes@586
     2
 * $Id$
nkeynes@359
     3
 * 
nkeynes@359
     4
 * SH4 translation core module. This part handles the non-target-specific
nkeynes@359
     5
 * section of the translation.
nkeynes@359
     6
 *
nkeynes@359
     7
 * Copyright (c) 2005 Nathan Keynes.
nkeynes@359
     8
 *
nkeynes@359
     9
 * This program is free software; you can redistribute it and/or modify
nkeynes@359
    10
 * it under the terms of the GNU General Public License as published by
nkeynes@359
    11
 * the Free Software Foundation; either version 2 of the License, or
nkeynes@359
    12
 * (at your option) any later version.
nkeynes@359
    13
 *
nkeynes@359
    14
 * This program is distributed in the hope that it will be useful,
nkeynes@359
    15
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
nkeynes@359
    16
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
nkeynes@359
    17
 * GNU General Public License for more details.
nkeynes@359
    18
 */
nkeynes@398
    19
#include <assert.h>
nkeynes@430
    20
#include "eventq.h"
nkeynes@430
    21
#include "syscall.h"
nkeynes@586
    22
#include "clock.h"
nkeynes@669
    23
#include "dreamcast.h"
nkeynes@430
    24
#include "sh4/sh4core.h"
nkeynes@430
    25
#include "sh4/sh4trans.h"
nkeynes@430
    26
#include "sh4/xltcache.h"
nkeynes@359
    27
nkeynes@586
    28
nkeynes@359
    29
/**
nkeynes@359
    30
 * Execute a timeslice using translated code only (ie translate/execute loop)
nkeynes@359
    31
 */
nkeynes@740
    32
uint32_t sh4_translate_run_slice( uint32_t nanosecs ) 
nkeynes@359
    33
{
nkeynes@408
    34
    void * (*code)() = NULL;
nkeynes@368
    35
    while( sh4r.slice_cycle < nanosecs ) {
nkeynes@736
    36
        if( sh4r.event_pending <= sh4r.slice_cycle ) {
nkeynes@736
    37
            if( sh4r.event_types & PENDING_EVENT ) {
nkeynes@736
    38
                event_execute();
nkeynes@736
    39
            }
nkeynes@736
    40
            /* Eventq execute may (quite likely) deliver an immediate IRQ */
nkeynes@736
    41
            if( sh4r.event_types & PENDING_IRQ ) {
nkeynes@736
    42
                sh4_accept_interrupt();
nkeynes@736
    43
                code = NULL;
nkeynes@736
    44
            }
nkeynes@736
    45
        }
nkeynes@359
    46
nkeynes@736
    47
        if( code == NULL ) {
nkeynes@736
    48
            if( sh4r.pc > 0xFFFFFF00 ) {
nkeynes@736
    49
                syscall_invoke( sh4r.pc );
nkeynes@736
    50
                sh4r.in_delay_slot = 0;
nkeynes@736
    51
                sh4r.pc = sh4r.pr;
nkeynes@736
    52
            }
nkeynes@736
    53
nkeynes@736
    54
            code = xlat_get_code_by_vma( sh4r.pc );
nkeynes@901
    55
            if( code == NULL || (sh4r.fpscr & (FPSCR_PR|FPSCR_SZ)) != XLAT_BLOCK_FPSCR(code) ) {
nkeynes@736
    56
                code = sh4_translate_basic_block( sh4r.pc );
nkeynes@736
    57
            }
nkeynes@736
    58
        }
nkeynes@736
    59
        code = code();
nkeynes@359
    60
    }
nkeynes@359
    61
    return nanosecs;
nkeynes@359
    62
}
nkeynes@359
    63
nkeynes@359
    64
uint8_t *xlat_output;
nkeynes@596
    65
xlat_cache_block_t xlat_current_block;
nkeynes@586
    66
struct xlat_recovery_record xlat_recovery[MAX_RECOVERY_SIZE];
nkeynes@586
    67
uint32_t xlat_recovery_posn;
nkeynes@359
    68
nkeynes@596
    69
void sh4_translate_add_recovery( uint32_t icount )
nkeynes@596
    70
{
nkeynes@596
    71
    xlat_recovery[xlat_recovery_posn].xlat_offset = 
nkeynes@736
    72
        ((uintptr_t)xlat_output) - ((uintptr_t)xlat_current_block->code);
nkeynes@596
    73
    xlat_recovery[xlat_recovery_posn].sh4_icount = icount;
nkeynes@596
    74
    xlat_recovery_posn++;
nkeynes@596
    75
}
nkeynes@596
    76
nkeynes@359
    77
/**
nkeynes@359
    78
 * Translate a linear basic block, ie all instructions from the start address
nkeynes@359
    79
 * (inclusive) until the next branch/jump instruction or the end of the page
nkeynes@359
    80
 * is reached.
nkeynes@359
    81
 * @return the address of the translated block
nkeynes@359
    82
 * eg due to lack of buffer space.
nkeynes@359
    83
 */
nkeynes@359
    84
void * sh4_translate_basic_block( sh4addr_t start )
nkeynes@359
    85
{
nkeynes@408
    86
    sh4addr_t pc = start;
nkeynes@410
    87
    sh4addr_t lastpc = (pc&0xFFFFF000)+0x1000;
nkeynes@586
    88
    int done, i;
nkeynes@596
    89
    xlat_current_block = xlat_start_block( start );
nkeynes@596
    90
    xlat_output = (uint8_t *)xlat_current_block->code;
nkeynes@586
    91
    xlat_recovery_posn = 0;
nkeynes@596
    92
    uint8_t *eob = xlat_output + xlat_current_block->size;
nkeynes@588
    93
nkeynes@588
    94
    if( GET_ICACHE_END() < lastpc ) {
nkeynes@711
    95
        lastpc = GET_ICACHE_END();
nkeynes@588
    96
    }
nkeynes@588
    97
nkeynes@408
    98
    sh4_translate_begin_block(pc);
nkeynes@359
    99
nkeynes@408
   100
    do {
nkeynes@711
   101
        /* check for breakpoints at this pc */
nkeynes@711
   102
        for( i=0; i<sh4_breakpoint_count; i++ ) {
nkeynes@711
   103
            if( sh4_breakpoints[i].address == pc ) {
nkeynes@711
   104
                sh4_translate_emit_breakpoint(pc);
nkeynes@711
   105
                break;
nkeynes@711
   106
            }
nkeynes@711
   107
        }
nkeynes@711
   108
        if( eob - xlat_output < MAX_INSTRUCTION_SIZE ) {
nkeynes@711
   109
            uint8_t *oldstart = xlat_current_block->code;
nkeynes@711
   110
            xlat_current_block = xlat_extend_block( xlat_output - oldstart + MAX_INSTRUCTION_SIZE );
nkeynes@711
   111
            xlat_output = xlat_current_block->code + (xlat_output - oldstart);
nkeynes@711
   112
            eob = xlat_current_block->code + xlat_current_block->size;
nkeynes@711
   113
        }
nkeynes@711
   114
        done = sh4_translate_instruction( pc ); 
nkeynes@711
   115
        assert( xlat_output <= eob );
nkeynes@711
   116
        pc += 2;
nkeynes@711
   117
        if ( pc >= lastpc ) {
nkeynes@711
   118
            done = 2;
nkeynes@711
   119
        }
nkeynes@408
   120
    } while( !done );
nkeynes@408
   121
    pc += (done - 2);
nkeynes@617
   122
nkeynes@617
   123
    // Add end-of-block recovery for post-instruction checks
nkeynes@617
   124
    sh4_translate_add_recovery( (pc - start)>>1 ); 
nkeynes@617
   125
nkeynes@593
   126
    int epilogue_size = sh4_translate_end_block_size();
nkeynes@593
   127
    uint32_t recovery_size = sizeof(struct xlat_recovery_record)*xlat_recovery_posn;
nkeynes@711
   128
    uint32_t finalsize = (xlat_output - xlat_current_block->code) + epilogue_size + recovery_size;
nkeynes@711
   129
    if( xlat_current_block->size < finalsize ) {
nkeynes@711
   130
        uint8_t *oldstart = xlat_current_block->code;
nkeynes@711
   131
        xlat_current_block = xlat_extend_block( finalsize );
nkeynes@711
   132
        xlat_output = xlat_current_block->code + (xlat_output - oldstart);
nkeynes@410
   133
    }	
nkeynes@368
   134
    sh4_translate_end_block(pc);
nkeynes@711
   135
    assert( xlat_output <= (xlat_current_block->code + xlat_current_block->size - recovery_size) );
nkeynes@736
   136
nkeynes@586
   137
    /* Write the recovery records onto the end of the code block */
nkeynes@586
   138
    memcpy( xlat_output, xlat_recovery, recovery_size);
nkeynes@596
   139
    xlat_current_block->recover_table_offset = xlat_output - (uint8_t *)xlat_current_block->code;
nkeynes@596
   140
    xlat_current_block->recover_table_size = xlat_recovery_posn;
nkeynes@901
   141
    xlat_current_block->fpscr = sh4r.fpscr & (FPSCR_PR|FPSCR_SZ);
nkeynes@901
   142
    xlat_current_block->fpscr_mask = (FPSCR_PR|FPSCR_SZ);
nkeynes@586
   143
    xlat_commit_block( finalsize, pc-start );
nkeynes@596
   144
    return xlat_current_block->code;
nkeynes@359
   145
}
nkeynes@359
   146
nkeynes@398
   147
/**
nkeynes@586
   148
 * "Execute" the supplied recovery record. Currently this only updates
nkeynes@586
   149
 * sh4r.pc and sh4r.slice_cycle according to the currently executing
nkeynes@586
   150
 * instruction. In future this may be more sophisticated (ie will
nkeynes@586
   151
 * call into generated code).
nkeynes@398
   152
 */
nkeynes@586
   153
void sh4_translate_run_recovery( xlat_recovery_record_t recovery )
nkeynes@398
   154
{
nkeynes@586
   155
    sh4r.slice_cycle += (recovery->sh4_icount * sh4_cpu_period);
nkeynes@586
   156
    sh4r.pc += (recovery->sh4_icount<<1);
nkeynes@586
   157
}
nkeynes@359
   158
nkeynes@740
   159
void sh4_translate_exit_recover( )
nkeynes@586
   160
{
nkeynes@586
   161
    void *pc = xlat_get_native_pc();
nkeynes@586
   162
    if( pc != NULL ) {
nkeynes@736
   163
        // could be null if we're not actually running inside the translator
nkeynes@736
   164
        void *code = xlat_get_code( sh4r.pc );
nkeynes@809
   165
        xlat_recovery_record_t recover = xlat_get_post_recovery(code, pc, TRUE);
nkeynes@736
   166
        if( recover != NULL ) {
nkeynes@736
   167
            // Can be null if there is no recovery necessary
nkeynes@736
   168
            sh4_translate_run_recovery(recover);
nkeynes@736
   169
        }
nkeynes@398
   170
    }
nkeynes@586
   171
}
nkeynes@398
   172
nkeynes@905
   173
/**
 * Handle a breakpoint at the given pc by exiting the core with
 * CORE_EXIT_BREAKPOINT. The breakpoint is ignored when the core is just
 * starting (sh4_starting set, no cycles run in this slice) and pc is the
 * address execution is starting from.
 * NOTE(review): presumably called from the code generated by
 * sh4_translate_emit_breakpoint() - confirm against the emitter.
 *
 * @param pc SH4 address of the breakpoint that was reached.
 */
void FASTCALL sh4_translate_breakpoint_hit(uint32_t pc)
{
    int starting_here = sh4_starting && sh4r.slice_cycle == 0 && pc == sh4r.pc;

    if( !starting_here ) {
        sh4_core_exit( CORE_EXIT_BREAKPOINT );
    }
}
nkeynes@591
   180
nkeynes@586
   181
/**
nkeynes@586
   182
 * Exit the current block at the end of the current instruction, flush the
nkeynes@586
   183
 * translation cache (completely) and return control to sh4_xlat_run_slice.
nkeynes@586
   184
 *
nkeynes@586
   185
 * As a special case, if the current instruction is actually the last 
nkeynes@586
   186
 * instruction in the block (ie it's in a delay slot), this function 
nkeynes@586
   187
 * returns to allow normal completion of the translation block. Otherwise
nkeynes@586
   188
 * this function never returns.
nkeynes@586
   189
 *
nkeynes@586
   190
 * Must only be invoked (indirectly) from within translated code.
nkeynes@586
   191
 */
nkeynes@740
   192
gboolean sh4_translate_flush_cache()
nkeynes@586
   193
{
nkeynes@586
   194
    void *pc = xlat_get_native_pc();
nkeynes@586
   195
    assert( pc != NULL );
nkeynes@586
   196
nkeynes@586
   197
    void *code = xlat_get_code( sh4r.pc );
nkeynes@809
   198
    xlat_recovery_record_t recover = xlat_get_post_recovery(code, pc, FALSE);
nkeynes@586
   199
    if( recover != NULL ) {
nkeynes@736
   200
        // Can be null if there is no recovery necessary
nkeynes@736
   201
        sh4_translate_run_recovery(recover);
nkeynes@736
   202
        xlat_flush_cache();
nkeynes@740
   203
        return TRUE;
nkeynes@586
   204
    } else {
nkeynes@736
   205
        xlat_flush_cache();
nkeynes@740
   206
        return FALSE;
nkeynes@586
   207
    }
nkeynes@398
   208
}
nkeynes@586
   209
nkeynes@905
   210
/**
 * Look up the translated code for a virtual address.
 *
 * If the address is not in the current icache range, the icache is updated
 * through the MMU. When that fails, the lookup is retried with sh4r.pc
 * (NOTE(review): presumably the failed update has redirected sh4r.pc to the
 * fault handler - confirm in mmu_update_icache). If the retry fails as well,
 * the core is halted.
 *
 * @param vma virtual address to look up.
 * @return the translated code for the address, or NULL if there is none, if
 *         the address is above 0xFFFFFF00 (lxdream hook), or on a double
 *         fault.
 */
void * FASTCALL xlat_get_code_by_vma( sh4vma_t vma )
{
    /* Fast path: the address is already covered by the icache */
    if( IS_IN_ICACHE(vma) ) {
        return xlat_get_code( GET_ICACHE_PHYS(vma) );
    }

    if( vma > 0xFFFFFF00 ) {
        // lxdream hook
        return NULL;
    }

    /* First failure: fault - off to the fault handler, retried via sh4r.pc.
     * Second failure: double fault - halt. */
    if( !mmu_update_icache(vma) && !mmu_update_icache(sh4r.pc) ) {
        ERROR( "Double fault - halting" );
        sh4_core_exit(CORE_EXIT_HALT);
        return NULL;
    }

    /* From here the lookup uses sh4r.pc rather than vma */
    assert( IS_IN_ICACHE(sh4r.pc) );
    return xlat_get_code( GET_ICACHE_PHYS(sh4r.pc) );
}
nkeynes@586
   237
.