Search
lxdream.org :: lxdream/src/sh4/sh4trans.c
lxdream 0.9.1
released Jun 29
Download Now
filename src/sh4/sh4trans.c
changeset 1195:072131b61d2a
prev1188:1cc9bb0b3848
next1263:b3de98d19faf
author nkeynes
date Thu Feb 23 15:24:47 2012 +1000 (12 years ago)
permissions -rw-r--r--
last change Check for existence of glDrawBuffer (assuming that glReadBuffer will
follow). Note only need to guard the common code in gl_fbo.c
file annotate diff log raw
nkeynes@359
     1
/**
nkeynes@586
     2
 * $Id$
nkeynes@359
     3
 * 
nkeynes@359
     4
 * SH4 translation core module. This part handles the non-target-specific
nkeynes@359
     5
 * section of the translation.
nkeynes@359
     6
 *
nkeynes@359
     7
 * Copyright (c) 2005 Nathan Keynes.
nkeynes@359
     8
 *
nkeynes@359
     9
 * This program is free software; you can redistribute it and/or modify
nkeynes@359
    10
 * it under the terms of the GNU General Public License as published by
nkeynes@359
    11
 * the Free Software Foundation; either version 2 of the License, or
nkeynes@359
    12
 * (at your option) any later version.
nkeynes@359
    13
 *
nkeynes@359
    14
 * This program is distributed in the hope that it will be useful,
nkeynes@359
    15
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
nkeynes@359
    16
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
nkeynes@359
    17
 * GNU General Public License for more details.
nkeynes@359
    18
 */
nkeynes@398
    19
#include <assert.h>
nkeynes@430
    20
#include "eventq.h"
nkeynes@430
    21
#include "syscall.h"
nkeynes@586
    22
#include "clock.h"
nkeynes@669
    23
#include "dreamcast.h"
nkeynes@430
    24
#include "sh4/sh4core.h"
nkeynes@430
    25
#include "sh4/sh4trans.h"
nkeynes@975
    26
#include "sh4/sh4mmio.h"
nkeynes@975
    27
#include "sh4/mmu.h"
nkeynes@991
    28
#include "xlat/xltcache.h"
nkeynes@586
    29
nkeynes@1125
    30
//#define SINGLESTEP 1
nkeynes@1125
    31
nkeynes@359
    32
/**
nkeynes@359
    33
 * Execute a timeslice using translated code only (ie translate/execute loop)
nkeynes@359
    34
 */
nkeynes@740
    35
uint32_t sh4_translate_run_slice( uint32_t nanosecs ) 
nkeynes@359
    36
{
nkeynes@1112
    37
    event_schedule( EVENT_ENDTIMESLICE, nanosecs );
nkeynes@1112
    38
    for(;;) {
nkeynes@736
    39
        if( sh4r.event_pending <= sh4r.slice_cycle ) {
nkeynes@1187
    40
            sh4_handle_pending_events();
nkeynes@1112
    41
            if( sh4r.slice_cycle >= nanosecs )
nkeynes@1112
    42
                return nanosecs;
nkeynes@736
    43
        }
nkeynes@359
    44
nkeynes@1112
    45
        if( IS_SYSCALL(sh4r.pc) ) {
nkeynes@1112
    46
            uint32_t pc = sh4r.pc;
nkeynes@1112
    47
            sh4r.pc = sh4r.pr;
nkeynes@1112
    48
            sh4r.in_delay_slot = 0;
nkeynes@1112
    49
            syscall_invoke( pc );
nkeynes@1112
    50
        }
nkeynes@736
    51
nkeynes@1187
    52
        void * (*code)() = xlat_get_code_by_vma( sh4r.pc );
nkeynes@1149
    53
        if( code != NULL ) {
nkeynes@1149
    54
            while( sh4r.xlat_sh4_mode != XLAT_BLOCK_MODE(code) ) {
nkeynes@1149
    55
                code = XLAT_BLOCK_CHAIN(code);
nkeynes@1149
    56
                if( code == NULL ) {
nkeynes@1149
    57
                    code = sh4_translate_basic_block( sh4r.pc );
nkeynes@1149
    58
                    break;
nkeynes@1149
    59
                }
nkeynes@1149
    60
            }
nkeynes@1149
    61
        } else {
nkeynes@936
    62
            code = sh4_translate_basic_block( sh4r.pc );
nkeynes@736
    63
        }
nkeynes@1112
    64
        code();
nkeynes@359
    65
    }
nkeynes@359
    66
}
nkeynes@359
    67
nkeynes@359
    68
uint8_t *xlat_output;
nkeynes@596
    69
xlat_cache_block_t xlat_current_block;
nkeynes@586
    70
struct xlat_recovery_record xlat_recovery[MAX_RECOVERY_SIZE];
nkeynes@586
    71
uint32_t xlat_recovery_posn;
nkeynes@359
    72
nkeynes@596
    73
void sh4_translate_add_recovery( uint32_t icount )
nkeynes@596
    74
{
nkeynes@596
    75
    xlat_recovery[xlat_recovery_posn].xlat_offset = 
nkeynes@736
    76
        ((uintptr_t)xlat_output) - ((uintptr_t)xlat_current_block->code);
nkeynes@596
    77
    xlat_recovery[xlat_recovery_posn].sh4_icount = icount;
nkeynes@596
    78
    xlat_recovery_posn++;
nkeynes@596
    79
}
nkeynes@596
    80
nkeynes@359
    81
/**
nkeynes@359
    82
 * Translate a linear basic block, ie all instructions from the start address
nkeynes@359
    83
 * (inclusive) until the next branch/jump instruction or the end of the page
nkeynes@359
    84
 * is reached.
nkeynes@914
    85
 * @param start VMA of the block start (which must already be in the icache)
nkeynes@359
    86
 * @return the address of the translated block
nkeynes@359
    87
 * eg due to lack of buffer space.
nkeynes@359
    88
 */
nkeynes@359
    89
void * sh4_translate_basic_block( sh4addr_t start )
nkeynes@359
    90
{
nkeynes@408
    91
    sh4addr_t pc = start;
nkeynes@410
    92
    sh4addr_t lastpc = (pc&0xFFFFF000)+0x1000;
nkeynes@586
    93
    int done, i;
nkeynes@914
    94
    xlat_current_block = xlat_start_block( GET_ICACHE_PHYS(start) );
nkeynes@596
    95
    xlat_output = (uint8_t *)xlat_current_block->code;
nkeynes@586
    96
    xlat_recovery_posn = 0;
nkeynes@596
    97
    uint8_t *eob = xlat_output + xlat_current_block->size;
nkeynes@588
    98
nkeynes@588
    99
    if( GET_ICACHE_END() < lastpc ) {
nkeynes@711
   100
        lastpc = GET_ICACHE_END();
nkeynes@588
   101
    }
nkeynes@588
   102
nkeynes@408
   103
    sh4_translate_begin_block(pc);
nkeynes@359
   104
nkeynes@408
   105
    do {
nkeynes@711
   106
        if( eob - xlat_output < MAX_INSTRUCTION_SIZE ) {
nkeynes@711
   107
            uint8_t *oldstart = xlat_current_block->code;
nkeynes@711
   108
            xlat_current_block = xlat_extend_block( xlat_output - oldstart + MAX_INSTRUCTION_SIZE );
nkeynes@711
   109
            xlat_output = xlat_current_block->code + (xlat_output - oldstart);
nkeynes@711
   110
            eob = xlat_current_block->code + xlat_current_block->size;
nkeynes@711
   111
        }
nkeynes@711
   112
        done = sh4_translate_instruction( pc ); 
nkeynes@711
   113
        assert( xlat_output <= eob );
nkeynes@711
   114
        pc += 2;
nkeynes@1195
   115
        if ( pc >= lastpc && done == 0 ) {
nkeynes@711
   116
            done = 2;
nkeynes@711
   117
        }
nkeynes@1125
   118
#ifdef SINGLESTEP
nkeynes@1125
   119
        if( !done ) done = 2;
nkeynes@1125
   120
#endif
nkeynes@408
   121
    } while( !done );
nkeynes@408
   122
    pc += (done - 2);
nkeynes@617
   123
nkeynes@617
   124
    // Add end-of-block recovery for post-instruction checks
nkeynes@617
   125
    sh4_translate_add_recovery( (pc - start)>>1 ); 
nkeynes@617
   126
nkeynes@593
   127
    int epilogue_size = sh4_translate_end_block_size();
nkeynes@593
   128
    uint32_t recovery_size = sizeof(struct xlat_recovery_record)*xlat_recovery_posn;
nkeynes@711
   129
    uint32_t finalsize = (xlat_output - xlat_current_block->code) + epilogue_size + recovery_size;
nkeynes@711
   130
    if( xlat_current_block->size < finalsize ) {
nkeynes@711
   131
        uint8_t *oldstart = xlat_current_block->code;
nkeynes@711
   132
        xlat_current_block = xlat_extend_block( finalsize );
nkeynes@711
   133
        xlat_output = xlat_current_block->code + (xlat_output - oldstart);
nkeynes@410
   134
    }	
nkeynes@368
   135
    sh4_translate_end_block(pc);
nkeynes@711
   136
    assert( xlat_output <= (xlat_current_block->code + xlat_current_block->size - recovery_size) );
nkeynes@736
   137
nkeynes@586
   138
    /* Write the recovery records onto the end of the code block */
nkeynes@586
   139
    memcpy( xlat_output, xlat_recovery, recovery_size);
nkeynes@596
   140
    xlat_current_block->recover_table_offset = xlat_output - (uint8_t *)xlat_current_block->code;
nkeynes@596
   141
    xlat_current_block->recover_table_size = xlat_recovery_posn;
nkeynes@936
   142
    xlat_current_block->xlat_sh4_mode = sh4r.xlat_sh4_mode;
nkeynes@1195
   143
    xlat_commit_block( finalsize, start, pc );
nkeynes@596
   144
    return xlat_current_block->code;
nkeynes@359
   145
}
nkeynes@359
   146
nkeynes@398
   147
/**
nkeynes@586
   148
 * "Execute" the supplied recovery record. Currently this only updates
nkeynes@586
   149
 * sh4r.pc and sh4r.slice_cycle according to the currently executing
nkeynes@586
   150
 * instruction. In future this may be more sophisticated (ie will
nkeynes@586
   151
 * call into generated code).
nkeynes@398
   152
 */
nkeynes@586
   153
void sh4_translate_run_recovery( xlat_recovery_record_t recovery )
nkeynes@398
   154
{
nkeynes@586
   155
    sh4r.slice_cycle += (recovery->sh4_icount * sh4_cpu_period);
nkeynes@586
   156
    sh4r.pc += (recovery->sh4_icount<<1);
nkeynes@586
   157
}
nkeynes@359
   158
nkeynes@941
   159
/**
nkeynes@941
   160
 * Same as sh4_translate_run_recovery, but is used to recover from a taken
nkeynes@941
   161
 * exception - that is, it fixes sh4r.spc rather than sh4r.pc
nkeynes@941
   162
 */
nkeynes@941
   163
void sh4_translate_run_exception_recovery( xlat_recovery_record_t recovery )
nkeynes@941
   164
{
nkeynes@941
   165
    sh4r.slice_cycle += (recovery->sh4_icount * sh4_cpu_period);
nkeynes@941
   166
    sh4r.spc += (recovery->sh4_icount<<1);
nkeynes@941
   167
}    
nkeynes@941
   168
nkeynes@740
   169
void sh4_translate_exit_recover( )
nkeynes@586
   170
{
nkeynes@906
   171
    void *code = xlat_get_code_by_vma( sh4r.pc );
nkeynes@906
   172
    if( code != NULL ) {
nkeynes@906
   173
        uint32_t size = xlat_get_code_size( code );
nkeynes@906
   174
        void *pc = xlat_get_native_pc( code, size );
nkeynes@906
   175
        if( pc != NULL ) {
nkeynes@906
   176
            // could be null if we're not actually running inside the translator
nkeynes@949
   177
            xlat_recovery_record_t recover = xlat_get_pre_recovery(code, pc);
nkeynes@906
   178
            if( recover != NULL ) {
nkeynes@906
   179
                // Can be null if there is no recovery necessary
nkeynes@906
   180
                sh4_translate_run_recovery(recover);
nkeynes@906
   181
            }
nkeynes@736
   182
        }
nkeynes@398
   183
    }
nkeynes@586
   184
}
nkeynes@398
   185
nkeynes@941
   186
void sh4_translate_exception_exit_recover( )
nkeynes@941
   187
{
nkeynes@941
   188
    void *code = xlat_get_code_by_vma( sh4r.spc );
nkeynes@941
   189
    if( code != NULL ) {
nkeynes@941
   190
        uint32_t size = xlat_get_code_size( code );
nkeynes@941
   191
        void *pc = xlat_get_native_pc( code, size );
nkeynes@941
   192
        if( pc != NULL ) {
nkeynes@941
   193
            // could be null if we're not actually running inside the translator
nkeynes@941
   194
            xlat_recovery_record_t recover = xlat_get_pre_recovery(code, pc);
nkeynes@941
   195
            if( recover != NULL ) {
nkeynes@941
   196
                // Can be null if there is no recovery necessary
nkeynes@941
   197
                sh4_translate_run_exception_recovery(recover);
nkeynes@941
   198
            }
nkeynes@941
   199
        }
nkeynes@941
   200
    }
nkeynes@941
   201
    
nkeynes@941
   202
}
nkeynes@941
   203
nkeynes@905
   204
/**
 * Called when a breakpoint is reached at pc. Exits the core with
 * CORE_EXIT_BREAKPOINT, except when the core is just starting
 * (sh4_starting set, no cycles run yet in this slice) and pc is the current
 * sh4r.pc, in which case the breakpoint is ignored.
 */
void FASTCALL sh4_translate_breakpoint_hit(uint32_t pc)
{
    if( !sh4_starting || sh4r.slice_cycle != 0 || pc != sh4r.pc ) {
        sh4_core_exit( CORE_EXIT_BREAKPOINT );
    }
}
nkeynes@591
   211
nkeynes@905
   212
/**
 * Look up the translated code for a virtual address, refreshing the icache
 * through mmu_update_icache() when the address is not currently covered.
 *
 * @param vma virtual address to look up
 * @return the result of xlat_get_code() for the address, or NULL for a
 * syscall hook address or after a double fault.
 *
 * NOTE(review): after a refresh the lookup is done on sh4r.pc rather than
 * vma. That matches the fault path (where the original comment says control
 * goes to the fault handler), but callers passing an address other than
 * sh4r.pc should confirm this is what they expect.
 */
void * FASTCALL xlat_get_code_by_vma( sh4vma_t vma )
{
    /* Fast path: address already inside the current icache region */
    if( IS_IN_ICACHE(vma) ) {
        return xlat_get_code( GET_ICACHE_PHYS(vma) );
    }

    /* lxdream hook - there is no translated code for these */
    if( IS_SYSCALL(vma) ) {
        return NULL;
    }

    /* First refresh failing is the fault case; retry with sh4r.pc, and if
     * that fails as well it is a double fault, so halt. */
    if( !mmu_update_icache(vma) && !mmu_update_icache(sh4r.pc) ) {
        ERROR( "Double fault - halting" );
        sh4_core_exit(CORE_EXIT_HALT);
        return NULL;
    }

    assert( IS_IN_ICACHE(sh4r.pc) );
    return xlat_get_code( GET_ICACHE_PHYS(sh4r.pc) );
}
nkeynes@586
   239
nkeynes@1091
   240
/**
nkeynes@1091
   241
 * Crashdump translation information.
nkeynes@1091
   242
 *
nkeynes@1091
   243
 * Print out the currently executing block (if any), in source and target
nkeynes@1091
   244
 * assembly.
nkeynes@1091
   245
 *
nkeynes@1091
   246
 * Note: we want to be _really_ careful not to cause a second-level crash
nkeynes@1091
   247
 * at this point (e.g. if the lookup tables are corrupted...)
nkeynes@1091
   248
 */
nkeynes@1091
   249
void sh4_translate_crashdump()
nkeynes@1091
   250
{
nkeynes@1091
   251
    if( !IS_IN_ICACHE(sh4r.pc) ) {
nkeynes@1091
   252
        /** If we're crashing due to an icache lookup failure, we'll probably
nkeynes@1091
   253
         * hit this case - just complain and return.
nkeynes@1091
   254
         */
nkeynes@1091
   255
        fprintf( stderr, "** SH4 PC not in current instruction region **\n" );
nkeynes@1091
   256
        return;
nkeynes@1091
   257
    }
nkeynes@1091
   258
    uint32_t pma = GET_ICACHE_PHYS(sh4r.pc);
nkeynes@1091
   259
    void *code = xlat_get_code( pma );
nkeynes@1091
   260
    if( code == NULL ) {
nkeynes@1091
   261
        fprintf( stderr, "** No translated block for current SH4 PC **\n" );
nkeynes@1091
   262
        return;
nkeynes@1091
   263
    }
nkeynes@1091
   264
nkeynes@1091
   265
    /* Sanity check on the code pointer */
nkeynes@1091
   266
    if( !xlat_is_code_pointer(code) ) {
nkeynes@1091
   267
        fprintf( stderr, "** Possibly corrupt translation cache **\n" );
nkeynes@1091
   268
        return;
nkeynes@1091
   269
    }
nkeynes@1091
   270
nkeynes@1091
   271
    void *native_pc = xlat_get_native_pc( code, xlat_get_code_size(code) );
nkeynes@1091
   272
    sh4_translate_disasm_block( stderr, code, sh4r.pc, native_pc );
nkeynes@1091
   273
}
nkeynes@1094
   274
nkeynes@1094
   275
/**
 * Disassemble to stderr both the translated block and the original SH4 code
 * for the basic block beginning at sh4_pc. When the address is outside the
 * current icache region, or has no translated block, an error message is
 * printed instead.
 *
 * @param sh4_pc SH4 address of the start of the block
 */
void sh4_translate_dump_block( uint32_t sh4_pc )
{
    if( !IS_IN_ICACHE(sh4_pc) ) {
        fprintf( stderr, "** Address %08x not in current instruction region **\n", sh4_pc );
        return;
    }

    uint32_t phys_addr = GET_ICACHE_PHYS(sh4_pc);
    void *block = xlat_get_code( phys_addr );
    if( block != NULL ) {
        sh4_translate_disasm_block( stderr, block, sh4_pc, NULL );
    } else {
        fprintf( stderr, "** No translated block for address %08x **\n", sh4_pc );
    }
}
nkeynes@1094
   294
nkeynes@1188
   295
void sh4_translate_dump_cache_by_activity( unsigned int topN )
nkeynes@1188
   296
{
nkeynes@1188
   297
    struct xlat_block_ref blocks[topN];
nkeynes@1188
   298
    topN = xlat_get_cache_blocks_by_activity(blocks, topN);
nkeynes@1188
   299
    unsigned int i;
nkeynes@1188
   300
    for( i=0; i<topN; i++ ) {
nkeynes@1188
   301
        fprintf( stderr, "0x%08X (%p): %d \n", blocks[i].pc, blocks[i].block->code, blocks[i].block->active);
nkeynes@1188
   302
        sh4_translate_disasm_block( stderr, blocks[i].block->code, blocks[i].pc, NULL );
nkeynes@1188
   303
        fprintf( stderr, "\n" );
nkeynes@1188
   304
    }
nkeynes@1188
   305
}
.