filename | src/sh4/sh4trans.c |
changeset | 1195:072131b61d2a |
prev | 1188:1cc9bb0b3848 |
next | 1263:b3de98d19faf |
author | nkeynes |
date | Wed Feb 15 17:54:51 2012 +1000 (12 years ago) |
permissions | -rw-r--r-- |
last change | Use GL_TEXTURE_2D instead of GL_TEXTURE_RECTANGLE_ARB for frame buffers, for systems that don't provide the latter (and there's not really much difference anyway). Add macro wrangling for GL_DEPTH24_STENCIL8 format |
file | annotate | diff | log | raw |
nkeynes@359 | 1 | /** |
nkeynes@586 | 2 | * $Id$ |
nkeynes@359 | 3 | * |
nkeynes@359 | 4 | * SH4 translation core module. This part handles the non-target-specific |
nkeynes@359 | 5 | * section of the translation. |
nkeynes@359 | 6 | * |
nkeynes@359 | 7 | * Copyright (c) 2005 Nathan Keynes. |
nkeynes@359 | 8 | * |
nkeynes@359 | 9 | * This program is free software; you can redistribute it and/or modify |
nkeynes@359 | 10 | * it under the terms of the GNU General Public License as published by |
nkeynes@359 | 11 | * the Free Software Foundation; either version 2 of the License, or |
nkeynes@359 | 12 | * (at your option) any later version. |
nkeynes@359 | 13 | * |
nkeynes@359 | 14 | * This program is distributed in the hope that it will be useful, |
nkeynes@359 | 15 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
nkeynes@359 | 16 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
nkeynes@359 | 17 | * GNU General Public License for more details. |
nkeynes@359 | 18 | */ |
nkeynes@398 | 19 | #include <assert.h> |
nkeynes@430 | 20 | #include "eventq.h" |
nkeynes@430 | 21 | #include "syscall.h" |
nkeynes@586 | 22 | #include "clock.h" |
nkeynes@669 | 23 | #include "dreamcast.h" |
nkeynes@430 | 24 | #include "sh4/sh4core.h" |
nkeynes@430 | 25 | #include "sh4/sh4trans.h" |
nkeynes@975 | 26 | #include "sh4/sh4mmio.h" |
nkeynes@975 | 27 | #include "sh4/mmu.h" |
nkeynes@991 | 28 | #include "xlat/xltcache.h" |
nkeynes@586 | 29 | |
nkeynes@1125 | 30 | //#define SINGLESTEP 1 |
nkeynes@1125 | 31 | |
nkeynes@359 | 32 | /** |
nkeynes@359 | 33 | * Execute a timeslice using translated code only (ie translate/execute loop) |
nkeynes@359 | 34 | */ |
nkeynes@740 | 35 | uint32_t sh4_translate_run_slice( uint32_t nanosecs ) |
nkeynes@359 | 36 | { |
nkeynes@1112 | 37 | event_schedule( EVENT_ENDTIMESLICE, nanosecs ); |
nkeynes@1112 | 38 | for(;;) { |
nkeynes@736 | 39 | if( sh4r.event_pending <= sh4r.slice_cycle ) { |
nkeynes@1187 | 40 | sh4_handle_pending_events(); |
nkeynes@1112 | 41 | if( sh4r.slice_cycle >= nanosecs ) |
nkeynes@1112 | 42 | return nanosecs; |
nkeynes@736 | 43 | } |
nkeynes@359 | 44 | |
nkeynes@1112 | 45 | if( IS_SYSCALL(sh4r.pc) ) { |
nkeynes@1112 | 46 | uint32_t pc = sh4r.pc; |
nkeynes@1112 | 47 | sh4r.pc = sh4r.pr; |
nkeynes@1112 | 48 | sh4r.in_delay_slot = 0; |
nkeynes@1112 | 49 | syscall_invoke( pc ); |
nkeynes@1112 | 50 | } |
nkeynes@736 | 51 | |
nkeynes@1187 | 52 | void * (*code)() = xlat_get_code_by_vma( sh4r.pc ); |
nkeynes@1149 | 53 | if( code != NULL ) { |
nkeynes@1149 | 54 | while( sh4r.xlat_sh4_mode != XLAT_BLOCK_MODE(code) ) { |
nkeynes@1149 | 55 | code = XLAT_BLOCK_CHAIN(code); |
nkeynes@1149 | 56 | if( code == NULL ) { |
nkeynes@1149 | 57 | code = sh4_translate_basic_block( sh4r.pc ); |
nkeynes@1149 | 58 | break; |
nkeynes@1149 | 59 | } |
nkeynes@1149 | 60 | } |
nkeynes@1149 | 61 | } else { |
nkeynes@936 | 62 | code = sh4_translate_basic_block( sh4r.pc ); |
nkeynes@736 | 63 | } |
nkeynes@1112 | 64 | code(); |
nkeynes@359 | 65 | } |
nkeynes@359 | 66 | } |
nkeynes@359 | 67 | |
nkeynes@359 | 68 | uint8_t *xlat_output; |
nkeynes@596 | 69 | xlat_cache_block_t xlat_current_block; |
nkeynes@586 | 70 | struct xlat_recovery_record xlat_recovery[MAX_RECOVERY_SIZE]; |
nkeynes@586 | 71 | uint32_t xlat_recovery_posn; |
nkeynes@359 | 72 | |
nkeynes@596 | 73 | void sh4_translate_add_recovery( uint32_t icount ) |
nkeynes@596 | 74 | { |
nkeynes@596 | 75 | xlat_recovery[xlat_recovery_posn].xlat_offset = |
nkeynes@736 | 76 | ((uintptr_t)xlat_output) - ((uintptr_t)xlat_current_block->code); |
nkeynes@596 | 77 | xlat_recovery[xlat_recovery_posn].sh4_icount = icount; |
nkeynes@596 | 78 | xlat_recovery_posn++; |
nkeynes@596 | 79 | } |
nkeynes@596 | 80 | |
nkeynes@359 | 81 | /** |
nkeynes@359 | 82 | * Translate a linear basic block, ie all instructions from the start address |
nkeynes@359 | 83 | * (inclusive) until the next branch/jump instruction or the end of the page |
nkeynes@359 | 84 | * is reached. |
nkeynes@914 | 85 | * @param start VMA of the block start (which must already be in the icache) |
nkeynes@359 | 86 | * @return the address of the translated block |
nkeynes@359 | 87 | * eg due to lack of buffer space. |
nkeynes@359 | 88 | */ |
nkeynes@359 | 89 | void * sh4_translate_basic_block( sh4addr_t start ) |
nkeynes@359 | 90 | { |
nkeynes@408 | 91 | sh4addr_t pc = start; |
nkeynes@410 | 92 | sh4addr_t lastpc = (pc&0xFFFFF000)+0x1000; |
nkeynes@586 | 93 | int done, i; |
nkeynes@914 | 94 | xlat_current_block = xlat_start_block( GET_ICACHE_PHYS(start) ); |
nkeynes@596 | 95 | xlat_output = (uint8_t *)xlat_current_block->code; |
nkeynes@586 | 96 | xlat_recovery_posn = 0; |
nkeynes@596 | 97 | uint8_t *eob = xlat_output + xlat_current_block->size; |
nkeynes@588 | 98 | |
nkeynes@588 | 99 | if( GET_ICACHE_END() < lastpc ) { |
nkeynes@711 | 100 | lastpc = GET_ICACHE_END(); |
nkeynes@588 | 101 | } |
nkeynes@588 | 102 | |
nkeynes@408 | 103 | sh4_translate_begin_block(pc); |
nkeynes@359 | 104 | |
nkeynes@408 | 105 | do { |
nkeynes@711 | 106 | if( eob - xlat_output < MAX_INSTRUCTION_SIZE ) { |
nkeynes@711 | 107 | uint8_t *oldstart = xlat_current_block->code; |
nkeynes@711 | 108 | xlat_current_block = xlat_extend_block( xlat_output - oldstart + MAX_INSTRUCTION_SIZE ); |
nkeynes@711 | 109 | xlat_output = xlat_current_block->code + (xlat_output - oldstart); |
nkeynes@711 | 110 | eob = xlat_current_block->code + xlat_current_block->size; |
nkeynes@711 | 111 | } |
nkeynes@711 | 112 | done = sh4_translate_instruction( pc ); |
nkeynes@711 | 113 | assert( xlat_output <= eob ); |
nkeynes@711 | 114 | pc += 2; |
nkeynes@1195 | 115 | if ( pc >= lastpc && done == 0 ) { |
nkeynes@711 | 116 | done = 2; |
nkeynes@711 | 117 | } |
nkeynes@1125 | 118 | #ifdef SINGLESTEP |
nkeynes@1125 | 119 | if( !done ) done = 2; |
nkeynes@1125 | 120 | #endif |
nkeynes@408 | 121 | } while( !done ); |
nkeynes@408 | 122 | pc += (done - 2); |
nkeynes@617 | 123 | |
nkeynes@617 | 124 | // Add end-of-block recovery for post-instruction checks |
nkeynes@617 | 125 | sh4_translate_add_recovery( (pc - start)>>1 ); |
nkeynes@617 | 126 | |
nkeynes@593 | 127 | int epilogue_size = sh4_translate_end_block_size(); |
nkeynes@593 | 128 | uint32_t recovery_size = sizeof(struct xlat_recovery_record)*xlat_recovery_posn; |
nkeynes@711 | 129 | uint32_t finalsize = (xlat_output - xlat_current_block->code) + epilogue_size + recovery_size; |
nkeynes@711 | 130 | if( xlat_current_block->size < finalsize ) { |
nkeynes@711 | 131 | uint8_t *oldstart = xlat_current_block->code; |
nkeynes@711 | 132 | xlat_current_block = xlat_extend_block( finalsize ); |
nkeynes@711 | 133 | xlat_output = xlat_current_block->code + (xlat_output - oldstart); |
nkeynes@410 | 134 | } |
nkeynes@368 | 135 | sh4_translate_end_block(pc); |
nkeynes@711 | 136 | assert( xlat_output <= (xlat_current_block->code + xlat_current_block->size - recovery_size) ); |
nkeynes@736 | 137 | |
nkeynes@586 | 138 | /* Write the recovery records onto the end of the code block */ |
nkeynes@586 | 139 | memcpy( xlat_output, xlat_recovery, recovery_size); |
nkeynes@596 | 140 | xlat_current_block->recover_table_offset = xlat_output - (uint8_t *)xlat_current_block->code; |
nkeynes@596 | 141 | xlat_current_block->recover_table_size = xlat_recovery_posn; |
nkeynes@936 | 142 | xlat_current_block->xlat_sh4_mode = sh4r.xlat_sh4_mode; |
nkeynes@1195 | 143 | xlat_commit_block( finalsize, start, pc ); |
nkeynes@596 | 144 | return xlat_current_block->code; |
nkeynes@359 | 145 | } |
nkeynes@359 | 146 | |
nkeynes@398 | 147 | /** |
nkeynes@586 | 148 | * "Execute" the supplied recovery record. Currently this only updates |
nkeynes@586 | 149 | * sh4r.pc and sh4r.slice_cycle according to the currently executing |
nkeynes@586 | 150 | * instruction. In future this may be more sophisticated (ie will |
nkeynes@586 | 151 | * call into generated code). |
nkeynes@398 | 152 | */ |
nkeynes@586 | 153 | void sh4_translate_run_recovery( xlat_recovery_record_t recovery ) |
nkeynes@398 | 154 | { |
nkeynes@586 | 155 | sh4r.slice_cycle += (recovery->sh4_icount * sh4_cpu_period); |
nkeynes@586 | 156 | sh4r.pc += (recovery->sh4_icount<<1); |
nkeynes@586 | 157 | } |
nkeynes@359 | 158 | |
nkeynes@941 | 159 | /** |
nkeynes@941 | 160 | * Same as sh4_translate_run_recovery, but is used to recover from a taken |
nkeynes@941 | 161 | * exception - that is, it fixes sh4r.spc rather than sh4r.pc |
nkeynes@941 | 162 | */ |
nkeynes@941 | 163 | void sh4_translate_run_exception_recovery( xlat_recovery_record_t recovery ) |
nkeynes@941 | 164 | { |
nkeynes@941 | 165 | sh4r.slice_cycle += (recovery->sh4_icount * sh4_cpu_period); |
nkeynes@941 | 166 | sh4r.spc += (recovery->sh4_icount<<1); |
nkeynes@941 | 167 | } |
nkeynes@941 | 168 | |
nkeynes@740 | 169 | void sh4_translate_exit_recover( ) |
nkeynes@586 | 170 | { |
nkeynes@906 | 171 | void *code = xlat_get_code_by_vma( sh4r.pc ); |
nkeynes@906 | 172 | if( code != NULL ) { |
nkeynes@906 | 173 | uint32_t size = xlat_get_code_size( code ); |
nkeynes@906 | 174 | void *pc = xlat_get_native_pc( code, size ); |
nkeynes@906 | 175 | if( pc != NULL ) { |
nkeynes@906 | 176 | // could be null if we're not actually running inside the translator |
nkeynes@949 | 177 | xlat_recovery_record_t recover = xlat_get_pre_recovery(code, pc); |
nkeynes@906 | 178 | if( recover != NULL ) { |
nkeynes@906 | 179 | // Can be null if there is no recovery necessary |
nkeynes@906 | 180 | sh4_translate_run_recovery(recover); |
nkeynes@906 | 181 | } |
nkeynes@736 | 182 | } |
nkeynes@398 | 183 | } |
nkeynes@586 | 184 | } |
nkeynes@398 | 185 | |
nkeynes@941 | 186 | void sh4_translate_exception_exit_recover( ) |
nkeynes@941 | 187 | { |
nkeynes@941 | 188 | void *code = xlat_get_code_by_vma( sh4r.spc ); |
nkeynes@941 | 189 | if( code != NULL ) { |
nkeynes@941 | 190 | uint32_t size = xlat_get_code_size( code ); |
nkeynes@941 | 191 | void *pc = xlat_get_native_pc( code, size ); |
nkeynes@941 | 192 | if( pc != NULL ) { |
nkeynes@941 | 193 | // could be null if we're not actually running inside the translator |
nkeynes@941 | 194 | xlat_recovery_record_t recover = xlat_get_pre_recovery(code, pc); |
nkeynes@941 | 195 | if( recover != NULL ) { |
nkeynes@941 | 196 | // Can be null if there is no recovery necessary |
nkeynes@941 | 197 | sh4_translate_run_exception_recovery(recover); |
nkeynes@941 | 198 | } |
nkeynes@941 | 199 | } |
nkeynes@941 | 200 | } |
nkeynes@941 | 201 | |
nkeynes@941 | 202 | } |
nkeynes@941 | 203 | |
nkeynes@905 | 204 | void FASTCALL sh4_translate_breakpoint_hit(uint32_t pc) |
nkeynes@591 | 205 | { |
nkeynes@591 | 206 | if( sh4_starting && sh4r.slice_cycle == 0 && pc == sh4r.pc ) { |
nkeynes@736 | 207 | return; |
nkeynes@591 | 208 | } |
nkeynes@740 | 209 | sh4_core_exit( CORE_EXIT_BREAKPOINT ); |
nkeynes@591 | 210 | } |
nkeynes@591 | 211 | |
nkeynes@905 | 212 | void * FASTCALL xlat_get_code_by_vma( sh4vma_t vma ) |
nkeynes@586 | 213 | { |
nkeynes@586 | 214 | void *result = NULL; |
nkeynes@586 | 215 | |
nkeynes@588 | 216 | if( IS_IN_ICACHE(vma) ) { |
nkeynes@736 | 217 | return xlat_get_code( GET_ICACHE_PHYS(vma) ); |
nkeynes@586 | 218 | } |
nkeynes@586 | 219 | |
nkeynes@1014 | 220 | if( IS_SYSCALL(vma) ) { |
nkeynes@736 | 221 | // lxdream hook |
nkeynes@736 | 222 | return NULL; |
nkeynes@588 | 223 | } |
nkeynes@588 | 224 | |
nkeynes@588 | 225 | if( !mmu_update_icache(vma) ) { |
nkeynes@736 | 226 | // fault - off to the fault handler |
nkeynes@736 | 227 | if( !mmu_update_icache(sh4r.pc) ) { |
nkeynes@736 | 228 | // double fault - halt |
nkeynes@736 | 229 | ERROR( "Double fault - halting" ); |
nkeynes@740 | 230 | sh4_core_exit(CORE_EXIT_HALT); |
nkeynes@736 | 231 | return NULL; |
nkeynes@736 | 232 | } |
nkeynes@588 | 233 | } |
nkeynes@588 | 234 | |
nkeynes@588 | 235 | assert( IS_IN_ICACHE(sh4r.pc) ); |
nkeynes@588 | 236 | result = xlat_get_code( GET_ICACHE_PHYS(sh4r.pc) ); |
nkeynes@586 | 237 | return result; |
nkeynes@586 | 238 | } |
nkeynes@586 | 239 | |
nkeynes@1091 | 240 | /** |
nkeynes@1091 | 241 | * Crashdump translation information. |
nkeynes@1091 | 242 | * |
nkeynes@1091 | 243 | * Print out the currently executing block (if any), in source and target |
nkeynes@1091 | 244 | * assembly. |
nkeynes@1091 | 245 | * |
nkeynes@1091 | 246 | * Note: we want to be _really_ careful not to cause a second-level crash |
nkeynes@1091 | 247 | * at this point (e.g. if the lookup tables are corrupted...) |
nkeynes@1091 | 248 | */ |
nkeynes@1091 | 249 | void sh4_translate_crashdump() |
nkeynes@1091 | 250 | { |
nkeynes@1091 | 251 | if( !IS_IN_ICACHE(sh4r.pc) ) { |
nkeynes@1091 | 252 | /** If we're crashing due to an icache lookup failure, we'll probably |
nkeynes@1091 | 253 | * hit this case - just complain and return. |
nkeynes@1091 | 254 | */ |
nkeynes@1091 | 255 | fprintf( stderr, "** SH4 PC not in current instruction region **\n" ); |
nkeynes@1091 | 256 | return; |
nkeynes@1091 | 257 | } |
nkeynes@1091 | 258 | uint32_t pma = GET_ICACHE_PHYS(sh4r.pc); |
nkeynes@1091 | 259 | void *code = xlat_get_code( pma ); |
nkeynes@1091 | 260 | if( code == NULL ) { |
nkeynes@1091 | 261 | fprintf( stderr, "** No translated block for current SH4 PC **\n" ); |
nkeynes@1091 | 262 | return; |
nkeynes@1091 | 263 | } |
nkeynes@1091 | 264 | |
nkeynes@1091 | 265 | /* Sanity check on the code pointer */ |
nkeynes@1091 | 266 | if( !xlat_is_code_pointer(code) ) { |
nkeynes@1091 | 267 | fprintf( stderr, "** Possibly corrupt translation cache **\n" ); |
nkeynes@1091 | 268 | return; |
nkeynes@1091 | 269 | } |
nkeynes@1091 | 270 | |
nkeynes@1091 | 271 | void *native_pc = xlat_get_native_pc( code, xlat_get_code_size(code) ); |
nkeynes@1091 | 272 | sh4_translate_disasm_block( stderr, code, sh4r.pc, native_pc ); |
nkeynes@1091 | 273 | } |
nkeynes@1094 | 274 | |
/**
 * Dump the translated block starting at sh4_pc to stderr, alongside the
 * original SH4 code. If the address is outside the current icache region, or
 * has no translated block, an error line is printed instead.
 * @param sh4_pc SH4 address of the start of the block
 */
void sh4_translate_dump_block( uint32_t sh4_pc )
{
    if( !IS_IN_ICACHE(sh4_pc) ) {
        fprintf( stderr, "** Address %08x not in current instruction region **\n", sh4_pc );
        return;
    }

    void *block = xlat_get_code( GET_ICACHE_PHYS(sh4_pc) );
    if( block != NULL ) {
        sh4_translate_disasm_block( stderr, block, sh4_pc, NULL );
    } else {
        fprintf( stderr, "** No translated block for address %08x **\n", sh4_pc );
    }
}
nkeynes@1094 | 294 | |
nkeynes@1188 | 295 | void sh4_translate_dump_cache_by_activity( unsigned int topN ) |
nkeynes@1188 | 296 | { |
nkeynes@1188 | 297 | struct xlat_block_ref blocks[topN]; |
nkeynes@1188 | 298 | topN = xlat_get_cache_blocks_by_activity(blocks, topN); |
nkeynes@1188 | 299 | unsigned int i; |
nkeynes@1188 | 300 | for( i=0; i<topN; i++ ) { |
nkeynes@1188 | 301 | fprintf( stderr, "0x%08X (%p): %d \n", blocks[i].pc, blocks[i].block->code, blocks[i].block->active); |
nkeynes@1188 | 302 | sh4_translate_disasm_block( stderr, blocks[i].block->code, blocks[i].pc, NULL ); |
nkeynes@1188 | 303 | fprintf( stderr, "\n" ); |
nkeynes@1188 | 304 | } |
nkeynes@1188 | 305 | } |
.