Search
lxdream.org :: lxdream/src/sh4/sh4trans.c
lxdream 0.9.1
released Jun 29
Download Now
filename src/sh4/sh4trans.c
changeset 991:60c7fab9c880
prev978:eed5089fcfdb
next1003:7b2688cbbca3
author nkeynes
date Wed Mar 04 23:12:21 2009 +0000 (15 years ago)
permissions -rw-r--r--
last change Move xltcache to xlat/ src directory
Commit new and improved x86 opcode file - cleaned up and added support for amd64 extended registers
file annotate diff log raw
nkeynes@359
     1
/**
nkeynes@586
     2
 * $Id$
nkeynes@359
     3
 * 
nkeynes@359
     4
 * SH4 translation core module. This part handles the non-target-specific
nkeynes@359
     5
 * section of the translation.
nkeynes@359
     6
 *
nkeynes@359
     7
 * Copyright (c) 2005 Nathan Keynes.
nkeynes@359
     8
 *
nkeynes@359
     9
 * This program is free software; you can redistribute it and/or modify
nkeynes@359
    10
 * it under the terms of the GNU General Public License as published by
nkeynes@359
    11
 * the Free Software Foundation; either version 2 of the License, or
nkeynes@359
    12
 * (at your option) any later version.
nkeynes@359
    13
 *
nkeynes@359
    14
 * This program is distributed in the hope that it will be useful,
nkeynes@359
    15
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
nkeynes@359
    16
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
nkeynes@359
    17
 * GNU General Public License for more details.
nkeynes@359
    18
 */
nkeynes@398
    19
#include <assert.h>
nkeynes@430
    20
#include "eventq.h"
nkeynes@430
    21
#include "syscall.h"
nkeynes@586
    22
#include "clock.h"
nkeynes@669
    23
#include "dreamcast.h"
nkeynes@430
    24
#include "sh4/sh4core.h"
nkeynes@430
    25
#include "sh4/sh4trans.h"
nkeynes@975
    26
#include "sh4/sh4mmio.h"
nkeynes@975
    27
#include "sh4/mmu.h"
nkeynes@991
    28
#include "xlat/xltcache.h"
nkeynes@359
    29
nkeynes@359
    30
/**
nkeynes@359
    31
 * Execute a timeslice using translated code only (ie translate/execute loop)
nkeynes@359
    32
 */
nkeynes@740
    33
uint32_t sh4_translate_run_slice( uint32_t nanosecs ) 
nkeynes@359
    34
{
nkeynes@408
    35
    void * (*code)() = NULL;
nkeynes@368
    36
    while( sh4r.slice_cycle < nanosecs ) {
nkeynes@736
    37
        if( sh4r.event_pending <= sh4r.slice_cycle ) {
nkeynes@736
    38
            if( sh4r.event_types & PENDING_EVENT ) {
nkeynes@736
    39
                event_execute();
nkeynes@736
    40
            }
nkeynes@736
    41
            /* Eventq execute may (quite likely) deliver an immediate IRQ */
nkeynes@736
    42
            if( sh4r.event_types & PENDING_IRQ ) {
nkeynes@736
    43
                sh4_accept_interrupt();
nkeynes@736
    44
                code = NULL;
nkeynes@736
    45
            }
nkeynes@736
    46
        }
nkeynes@359
    47
nkeynes@736
    48
        if( code == NULL ) {
nkeynes@736
    49
            if( sh4r.pc > 0xFFFFFF00 ) {
nkeynes@736
    50
                syscall_invoke( sh4r.pc );
nkeynes@736
    51
                sh4r.in_delay_slot = 0;
nkeynes@736
    52
                sh4r.pc = sh4r.pr;
nkeynes@736
    53
            }
nkeynes@736
    54
nkeynes@736
    55
            code = xlat_get_code_by_vma( sh4r.pc );
nkeynes@953
    56
            if( code == NULL || sh4r.xlat_sh4_mode != XLAT_BLOCK_MODE(code) ) {
nkeynes@736
    57
                code = sh4_translate_basic_block( sh4r.pc );
nkeynes@736
    58
            }
nkeynes@953
    59
        } else if( sh4r.xlat_sh4_mode != XLAT_BLOCK_MODE(code) ) {
nkeynes@954
    60
            if( !IS_IN_ICACHE(sh4r.pc) ) {
nkeynes@954
    61
                /* If TLB is off, we may have gotten here without updating
nkeynes@954
    62
                 * the icache, so do it now. This should never fail, so...
nkeynes@954
    63
                 */
nkeynes@954
    64
                mmu_update_icache(sh4r.pc);
nkeynes@954
    65
                assert( IS_IN_ICACHE(sh4r.pc) ); 
nkeynes@954
    66
            }
nkeynes@953
    67
            code = sh4_translate_basic_block( sh4r.pc );
nkeynes@736
    68
        }
nkeynes@736
    69
        code = code();
nkeynes@359
    70
    }
nkeynes@359
    71
    return nanosecs;
nkeynes@359
    72
}
nkeynes@359
    73
nkeynes@359
    74
uint8_t *xlat_output;
nkeynes@596
    75
xlat_cache_block_t xlat_current_block;
nkeynes@586
    76
struct xlat_recovery_record xlat_recovery[MAX_RECOVERY_SIZE];
nkeynes@586
    77
uint32_t xlat_recovery_posn;
nkeynes@359
    78
nkeynes@596
    79
void sh4_translate_add_recovery( uint32_t icount )
nkeynes@596
    80
{
nkeynes@596
    81
    xlat_recovery[xlat_recovery_posn].xlat_offset = 
nkeynes@736
    82
        ((uintptr_t)xlat_output) - ((uintptr_t)xlat_current_block->code);
nkeynes@596
    83
    xlat_recovery[xlat_recovery_posn].sh4_icount = icount;
nkeynes@596
    84
    xlat_recovery_posn++;
nkeynes@596
    85
}
nkeynes@596
    86
nkeynes@359
    87
/**
nkeynes@359
    88
 * Translate a linear basic block, ie all instructions from the start address
nkeynes@359
    89
 * (inclusive) until the next branch/jump instruction or the end of the page
nkeynes@359
    90
 * is reached.
nkeynes@914
    91
 * @param start VMA of the block start (which must already be in the icache)
nkeynes@359
    92
 * @return the address of the translated block
nkeynes@359
    93
 * eg due to lack of buffer space.
nkeynes@359
    94
 */
nkeynes@359
    95
void * sh4_translate_basic_block( sh4addr_t start )
nkeynes@359
    96
{
nkeynes@408
    97
    sh4addr_t pc = start;
nkeynes@410
    98
    sh4addr_t lastpc = (pc&0xFFFFF000)+0x1000;
nkeynes@586
    99
    int done, i;
nkeynes@914
   100
    xlat_current_block = xlat_start_block( GET_ICACHE_PHYS(start) );
nkeynes@596
   101
    xlat_output = (uint8_t *)xlat_current_block->code;
nkeynes@586
   102
    xlat_recovery_posn = 0;
nkeynes@596
   103
    uint8_t *eob = xlat_output + xlat_current_block->size;
nkeynes@588
   104
nkeynes@588
   105
    if( GET_ICACHE_END() < lastpc ) {
nkeynes@711
   106
        lastpc = GET_ICACHE_END();
nkeynes@588
   107
    }
nkeynes@588
   108
nkeynes@408
   109
    sh4_translate_begin_block(pc);
nkeynes@359
   110
nkeynes@408
   111
    do {
nkeynes@711
   112
        /* check for breakpoints at this pc */
nkeynes@711
   113
        for( i=0; i<sh4_breakpoint_count; i++ ) {
nkeynes@711
   114
            if( sh4_breakpoints[i].address == pc ) {
nkeynes@711
   115
                sh4_translate_emit_breakpoint(pc);
nkeynes@711
   116
                break;
nkeynes@711
   117
            }
nkeynes@711
   118
        }
nkeynes@711
   119
        if( eob - xlat_output < MAX_INSTRUCTION_SIZE ) {
nkeynes@711
   120
            uint8_t *oldstart = xlat_current_block->code;
nkeynes@711
   121
            xlat_current_block = xlat_extend_block( xlat_output - oldstart + MAX_INSTRUCTION_SIZE );
nkeynes@711
   122
            xlat_output = xlat_current_block->code + (xlat_output - oldstart);
nkeynes@711
   123
            eob = xlat_current_block->code + xlat_current_block->size;
nkeynes@711
   124
        }
nkeynes@711
   125
        done = sh4_translate_instruction( pc ); 
nkeynes@711
   126
        assert( xlat_output <= eob );
nkeynes@711
   127
        pc += 2;
nkeynes@711
   128
        if ( pc >= lastpc ) {
nkeynes@711
   129
            done = 2;
nkeynes@711
   130
        }
nkeynes@408
   131
    } while( !done );
nkeynes@408
   132
    pc += (done - 2);
nkeynes@617
   133
nkeynes@617
   134
    // Add end-of-block recovery for post-instruction checks
nkeynes@617
   135
    sh4_translate_add_recovery( (pc - start)>>1 ); 
nkeynes@617
   136
nkeynes@593
   137
    int epilogue_size = sh4_translate_end_block_size();
nkeynes@593
   138
    uint32_t recovery_size = sizeof(struct xlat_recovery_record)*xlat_recovery_posn;
nkeynes@711
   139
    uint32_t finalsize = (xlat_output - xlat_current_block->code) + epilogue_size + recovery_size;
nkeynes@711
   140
    if( xlat_current_block->size < finalsize ) {
nkeynes@711
   141
        uint8_t *oldstart = xlat_current_block->code;
nkeynes@711
   142
        xlat_current_block = xlat_extend_block( finalsize );
nkeynes@711
   143
        xlat_output = xlat_current_block->code + (xlat_output - oldstart);
nkeynes@410
   144
    }	
nkeynes@368
   145
    sh4_translate_end_block(pc);
nkeynes@711
   146
    assert( xlat_output <= (xlat_current_block->code + xlat_current_block->size - recovery_size) );
nkeynes@736
   147
nkeynes@586
   148
    /* Write the recovery records onto the end of the code block */
nkeynes@586
   149
    memcpy( xlat_output, xlat_recovery, recovery_size);
nkeynes@596
   150
    xlat_current_block->recover_table_offset = xlat_output - (uint8_t *)xlat_current_block->code;
nkeynes@596
   151
    xlat_current_block->recover_table_size = xlat_recovery_posn;
nkeynes@953
   152
    xlat_current_block->xlat_sh4_mode = sh4r.xlat_sh4_mode;
nkeynes@586
   153
    xlat_commit_block( finalsize, pc-start );
nkeynes@596
   154
    return xlat_current_block->code;
nkeynes@359
   155
}
nkeynes@359
   156
nkeynes@398
   157
/**
nkeynes@586
   158
 * "Execute" the supplied recovery record. Currently this only updates
nkeynes@586
   159
 * sh4r.pc and sh4r.slice_cycle according to the currently executing
nkeynes@586
   160
 * instruction. In future this may be more sophisticated (ie will
nkeynes@586
   161
 * call into generated code).
nkeynes@398
   162
 */
nkeynes@586
   163
void sh4_translate_run_recovery( xlat_recovery_record_t recovery )
nkeynes@398
   164
{
nkeynes@586
   165
    sh4r.slice_cycle += (recovery->sh4_icount * sh4_cpu_period);
nkeynes@586
   166
    sh4r.pc += (recovery->sh4_icount<<1);
nkeynes@586
   167
}
nkeynes@359
   168
nkeynes@953
   169
/**
nkeynes@953
   170
 * Same as sh4_translate_run_recovery, but is used to recover from a taken
nkeynes@953
   171
 * exception - that is, it fixes sh4r.spc rather than sh4r.pc
nkeynes@953
   172
 */
nkeynes@953
   173
void sh4_translate_run_exception_recovery( xlat_recovery_record_t recovery )
nkeynes@953
   174
{
nkeynes@953
   175
    sh4r.slice_cycle += (recovery->sh4_icount * sh4_cpu_period);
nkeynes@953
   176
    sh4r.spc += (recovery->sh4_icount<<1);
nkeynes@953
   177
}    
nkeynes@953
   178
nkeynes@740
   179
void sh4_translate_exit_recover( )
nkeynes@586
   180
{
nkeynes@906
   181
    void *code = xlat_get_code_by_vma( sh4r.pc );
nkeynes@906
   182
    if( code != NULL ) {
nkeynes@906
   183
        uint32_t size = xlat_get_code_size( code );
nkeynes@906
   184
        void *pc = xlat_get_native_pc( code, size );
nkeynes@906
   185
        if( pc != NULL ) {
nkeynes@906
   186
            // could be null if we're not actually running inside the translator
nkeynes@953
   187
            xlat_recovery_record_t recover = xlat_get_pre_recovery(code, pc);
nkeynes@906
   188
            if( recover != NULL ) {
nkeynes@906
   189
                // Can be null if there is no recovery necessary
nkeynes@906
   190
                sh4_translate_run_recovery(recover);
nkeynes@906
   191
            }
nkeynes@736
   192
        }
nkeynes@398
   193
    }
nkeynes@586
   194
}
nkeynes@398
   195
nkeynes@953
   196
void sh4_translate_exception_exit_recover( )
nkeynes@953
   197
{
nkeynes@953
   198
    void *code = xlat_get_code_by_vma( sh4r.spc );
nkeynes@953
   199
    if( code != NULL ) {
nkeynes@953
   200
        uint32_t size = xlat_get_code_size( code );
nkeynes@953
   201
        void *pc = xlat_get_native_pc( code, size );
nkeynes@953
   202
        if( pc != NULL ) {
nkeynes@953
   203
            // could be null if we're not actually running inside the translator
nkeynes@953
   204
            xlat_recovery_record_t recover = xlat_get_pre_recovery(code, pc);
nkeynes@953
   205
            if( recover != NULL ) {
nkeynes@953
   206
                // Can be null if there is no recovery necessary
nkeynes@953
   207
                sh4_translate_run_exception_recovery(recover);
nkeynes@953
   208
            }
nkeynes@953
   209
        }
nkeynes@953
   210
    }
nkeynes@953
   211
    
nkeynes@953
   212
}
nkeynes@953
   213
nkeynes@905
   214
/**
 * Called when a breakpoint stub is reached at the given pc. Exits the core
 * with CORE_EXIT_BREAKPOINT, except when all of the following hold:
 * sh4_starting is set, no cycles of the slice have been consumed yet, and
 * pc equals sh4r.pc. In that case the hit is ignored.
 *
 * @param pc address of the breakpoint that was hit
 */
void FASTCALL sh4_translate_breakpoint_hit(uint32_t pc)
{
    if( !sh4_starting || sh4r.slice_cycle != 0 || pc != sh4r.pc ) {
        sh4_core_exit( CORE_EXIT_BREAKPOINT );
    }
}
nkeynes@591
   221
nkeynes@905
   222
/**
 * Look up translated code by virtual address.
 *
 * If vma is already covered by the icache the lookup is done directly.
 * Addresses above 0xFFFFFF00 (the lxdream hook range) never have code.
 * Otherwise the icache is updated for vma; if that fails, it is updated for
 * sh4r.pc instead, and if that fails as well the core is halted.
 *
 * NOTE(review): after a successful icache update the final lookup uses
 * sh4r.pc rather than vma, so callers passing a vma different from sh4r.pc
 * get the code for sh4r.pc - confirm this is intended.
 *
 * @param vma virtual address to look up
 * @return whatever xlat_get_code yields for the resolved address, or NULL
 *         for hook addresses and on double fault
 */
void * FASTCALL xlat_get_code_by_vma( sh4vma_t vma )
{
    if( IS_IN_ICACHE(vma) ) {
        return xlat_get_code( GET_ICACHE_PHYS(vma) );
    }

    if( vma > 0xFFFFFF00 ) {
        // lxdream hook
        return NULL;
    }

    // A failed update for vma is a fault (off to the fault handler); a second
    // failure, for sh4r.pc, is a double fault and halts the core.
    if( !mmu_update_icache(vma) && !mmu_update_icache(sh4r.pc) ) {
        ERROR( "Double fault - halting" );
        sh4_core_exit(CORE_EXIT_HALT);
        return NULL;
    }

    assert( IS_IN_ICACHE(sh4r.pc) );
    return xlat_get_code( GET_ICACHE_PHYS(sh4r.pc) );
}
nkeynes@586
   249
.