nkeynes@539 | 1 | /**
|
nkeynes@586 | 2 | * $Id$
|
nkeynes@539 | 3 | *
|
nkeynes@736 | 4 | * Provides the implementation for the AMD64 ABI (eg prologue, epilogue, and
|
nkeynes@539 | 5 | * calling conventions)
|
nkeynes@539 | 6 | *
|
nkeynes@539 | 7 | * Copyright (c) 2007 Nathan Keynes.
|
nkeynes@539 | 8 | *
|
nkeynes@539 | 9 | * This program is free software; you can redistribute it and/or modify
|
nkeynes@539 | 10 | * it under the terms of the GNU General Public License as published by
|
nkeynes@539 | 11 | * the Free Software Foundation; either version 2 of the License, or
|
nkeynes@539 | 12 | * (at your option) any later version.
|
nkeynes@539 | 13 | *
|
nkeynes@539 | 14 | * This program is distributed in the hope that it will be useful,
|
nkeynes@539 | 15 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
|
nkeynes@539 | 16 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
nkeynes@539 | 17 | * GNU General Public License for more details.
|
nkeynes@539 | 18 | */
|
nkeynes@539 | 19 |
|
nkeynes@736 | 20 | #ifndef lxdream_ia64abi_H
|
nkeynes@736 | 21 | #define lxdream_ia64abi_H 1
|
nkeynes@539 | 22 |
|
nkeynes@586 | 23 | #include <unwind.h>
|
nkeynes@539 | 24 |
|
nkeynes@539 | 25 | #define load_ptr( reg, ptr ) load_imm64( reg, (uint64_t)ptr );
|
nkeynes@736 | 26 |
|
nkeynes@930 | 27 | static inline decode_address( int addr_reg )
|
nkeynes@930 | 28 | {
|
nkeynes@930 | 29 | MOV_r32_r32( addr_reg, R_ECX );
|
nkeynes@930 | 30 | SHR_imm8_r32( 12, R_ECX );
|
nkeynes@930 | 31 | load_ptr( R_EDI, sh4_address_space );
|
nkeynes@930 | 32 | REXW(); OP(0x8B); OP(0x0C); OP(0xCF); // mov.q [%rdi + %rcx*8], %rcx
|
nkeynes@930 | 33 | }
|
nkeynes@930 | 34 |
|
nkeynes@539 | 35 | /**
|
nkeynes@539 | 36 | * Note: clobbers EAX to make the indirect call - this isn't usually
|
nkeynes@539 | 37 | * a problem since the callee will usually clobber it anyway.
|
nkeynes@539 | 38 | * Size: 12 bytes
|
nkeynes@539 | 39 | */
|
nkeynes@539 | 40 | #define CALL_FUNC0_SIZE 12
|
nkeynes@539 | 41 | static inline void call_func0( void *ptr )
|
nkeynes@539 | 42 | {
|
nkeynes@539 | 43 | load_imm64(R_EAX, (uint64_t)ptr);
|
nkeynes@539 | 44 | CALL_r32(R_EAX);
|
nkeynes@539 | 45 | }
|
nkeynes@539 | 46 |
|
nkeynes@539 | 47 | #define CALL_FUNC1_SIZE 14
|
nkeynes@539 | 48 | static inline void call_func1( void *ptr, int arg1 )
|
nkeynes@539 | 49 | {
|
nkeynes@800 | 50 | REXW(); MOV_r32_r32(arg1, R_EDI);
|
nkeynes@539 | 51 | call_func0(ptr);
|
nkeynes@539 | 52 | }
|
nkeynes@539 | 53 |
|
nkeynes@927 | 54 | static inline void call_func1_exc( void *ptr, int arg1, int pc )
|
nkeynes@927 | 55 | {
|
nkeynes@927 | 56 | REXW(); MOV_r32_r32(arg1, R_EDI);
|
nkeynes@927 | 57 | load_exc_backpatch(R_ESI);
|
nkeynes@927 | 58 | call_func0(ptr);
|
nkeynes@927 | 59 | }
|
nkeynes@927 | 60 |
|
nkeynes@930 | 61 | static inline void call_func1_r32disp8( int preg, uint32_t disp8, int arg1 )
|
nkeynes@930 | 62 | {
|
nkeynes@930 | 63 | REXW(); MOV_r32_r32(arg1, R_EDI);
|
nkeynes@930 | 64 | CALL_r32disp8(preg, disp8);
|
nkeynes@930 | 65 | }
|
nkeynes@930 | 66 |
|
nkeynes@539 | 67 | #define CALL_FUNC2_SIZE 16
|
nkeynes@539 | 68 | static inline void call_func2( void *ptr, int arg1, int arg2 )
|
nkeynes@539 | 69 | {
|
nkeynes@800 | 70 | REXW(); MOV_r32_r32(arg1, R_EDI);
|
nkeynes@800 | 71 | REXW(); MOV_r32_r32(arg2, R_ESI);
|
nkeynes@539 | 72 | call_func0(ptr);
|
nkeynes@539 | 73 | }
|
nkeynes@539 | 74 |
|
nkeynes@930 | 75 | static inline void call_func2_r32disp8( int preg, uint32_t disp8, int arg1, int arg2 )
|
nkeynes@930 | 76 | {
|
nkeynes@930 | 77 | REXW(); MOV_r32_r32(arg1, R_EDI);
|
nkeynes@930 | 78 | REXW(); MOV_r32_r32(arg2, R_ESI);
|
nkeynes@930 | 79 | CALL_r32disp8(preg, disp8);
|
nkeynes@930 | 80 | }
|
nkeynes@930 | 81 |
|
nkeynes@930 | 82 |
|
nkeynes@586 | 83 | #define MEM_WRITE_DOUBLE_SIZE 35
|
nkeynes@539 | 84 | /**
|
nkeynes@539 | 85 | * Write a double (64-bit) value into memory, with the first word in arg2a, and
|
nkeynes@539 | 86 | * the second in arg2b
|
nkeynes@539 | 87 | */
|
nkeynes@539 | 88 | static inline void MEM_WRITE_DOUBLE( int addr, int arg2a, int arg2b )
|
nkeynes@539 | 89 | {
|
nkeynes@539 | 90 | PUSH_r32(arg2b);
|
nkeynes@539 | 91 | PUSH_r32(addr);
|
nkeynes@539 | 92 | call_func2(sh4_write_long, addr, arg2a);
|
nkeynes@586 | 93 | POP_r32(R_EDI);
|
nkeynes@586 | 94 | POP_r32(R_ESI);
|
nkeynes@586 | 95 | ADD_imm8s_r32(4, R_EDI);
|
nkeynes@586 | 96 | call_func0(sh4_write_long);
|
nkeynes@539 | 97 | }
|
nkeynes@539 | 98 |
|
nkeynes@547 | 99 | #define MEM_READ_DOUBLE_SIZE 43
|
nkeynes@539 | 100 | /**
|
nkeynes@539 | 101 | * Read a double (64-bit) value from memory, writing the first word into arg2a
|
nkeynes@539 | 102 | * and the second into arg2b. The addr must not be in EAX
|
nkeynes@539 | 103 | */
|
nkeynes@539 | 104 | static inline void MEM_READ_DOUBLE( int addr, int arg2a, int arg2b )
|
nkeynes@539 | 105 | {
|
nkeynes@547 | 106 | REXW(); SUB_imm8s_r32( 8, R_ESP );
|
nkeynes@539 | 107 | PUSH_r32(addr);
|
nkeynes@539 | 108 | call_func1(sh4_read_long, addr);
|
nkeynes@539 | 109 | POP_r32(R_EDI);
|
nkeynes@539 | 110 | PUSH_r32(R_EAX);
|
nkeynes@539 | 111 | ADD_imm8s_r32(4, R_EDI);
|
nkeynes@539 | 112 | call_func0(sh4_read_long);
|
nkeynes@539 | 113 | MOV_r32_r32(R_EAX, arg2b);
|
nkeynes@539 | 114 | POP_r32(arg2a);
|
nkeynes@547 | 115 | REXW(); ADD_imm8s_r32( 8, R_ESP );
|
nkeynes@539 | 116 | }
|
nkeynes@539 | 117 |
|
nkeynes@539 | 118 |
|
nkeynes@539 | 119 | /**
|
nkeynes@539 | 120 | * Emit the 'start of block' assembly. Sets up the stack frame and save
|
nkeynes@539 | 121 | * SI/DI as required
|
nkeynes@539 | 122 | */
|
nkeynes@901 | 123 | void enter_block( )
|
nkeynes@539 | 124 | {
|
nkeynes@539 | 125 | PUSH_r32(R_EBP);
|
nkeynes@669 | 126 | load_ptr( R_EBP, ((uint8_t *)&sh4r) + 128 );
|
nkeynes@926 | 127 | // Minimum aligned allocation is 16 bytes
|
nkeynes@926 | 128 | REXW(); SUB_imm8s_r32( 16, R_ESP );
|
nkeynes@926 | 129 | }
|
nkeynes@926 | 130 |
|
nkeynes@926 | 131 | static inline void exit_block( )
|
nkeynes@926 | 132 | {
|
nkeynes@926 | 133 | REXW(); ADD_imm8s_r32( 16, R_ESP );
|
nkeynes@926 | 134 | POP_r32(R_EBP);
|
nkeynes@926 | 135 | RET();
|
nkeynes@539 | 136 | }
|
nkeynes@908 | 137 |
|
nkeynes@539 | 138 | /**
|
nkeynes@539 | 139 | * Exit the block with sh4r.pc already written
|
nkeynes@539 | 140 | */
|
nkeynes@586 | 141 | void exit_block_pcset( sh4addr_t pc )
|
nkeynes@539 | 142 | {
|
nkeynes@539 | 143 | load_imm32( R_ECX, ((pc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
|
nkeynes@539 | 144 | ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) ); // 6
|
nkeynes@590 | 145 | load_spreg( R_EAX, R_PC );
|
nkeynes@590 | 146 | if( sh4_x86.tlb_on ) {
|
nkeynes@736 | 147 | call_func1(xlat_get_code_by_vma,R_EAX);
|
nkeynes@590 | 148 | } else {
|
nkeynes@736 | 149 | call_func1(xlat_get_code,R_EAX);
|
nkeynes@590 | 150 | }
|
nkeynes@926 | 151 | exit_block();
|
nkeynes@590 | 152 | }
|
nkeynes@590 | 153 |
|
nkeynes@590 | 154 | /**
|
nkeynes@590 | 155 | * Exit the block with sh4r.new_pc written with the target address
|
nkeynes@590 | 156 | */
|
nkeynes@590 | 157 | void exit_block_newpcset( sh4addr_t pc )
|
nkeynes@590 | 158 | {
|
nkeynes@590 | 159 | load_imm32( R_ECX, ((pc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
|
nkeynes@590 | 160 | ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) ); // 6
|
nkeynes@590 | 161 | load_spreg( R_EAX, R_NEW_PC );
|
nkeynes@590 | 162 | store_spreg( R_EAX, R_PC );
|
nkeynes@586 | 163 | if( sh4_x86.tlb_on ) {
|
nkeynes@736 | 164 | call_func1(xlat_get_code_by_vma,R_EAX);
|
nkeynes@586 | 165 | } else {
|
nkeynes@736 | 166 | call_func1(xlat_get_code,R_EAX);
|
nkeynes@586 | 167 | }
|
nkeynes@926 | 168 | exit_block();
|
nkeynes@539 | 169 | }
|
nkeynes@539 | 170 |
|
nkeynes@586 | 171 | #define EXIT_BLOCK_SIZE(pc) (25 + (IS_IN_ICACHE(pc)?10:CALL_FUNC1_SIZE))
|
nkeynes@539 | 172 | /**
|
nkeynes@539 | 173 | * Exit the block to an absolute PC
|
nkeynes@539 | 174 | */
|
nkeynes@926 | 175 | void exit_block_abs( sh4addr_t pc, sh4addr_t endpc )
|
nkeynes@539 | 176 | {
|
nkeynes@539 | 177 | load_imm32( R_ECX, pc ); // 5
|
nkeynes@539 | 178 | store_spreg( R_ECX, REG_OFFSET(pc) ); // 3
|
nkeynes@586 | 179 | if( IS_IN_ICACHE(pc) ) {
|
nkeynes@736 | 180 | REXW(); MOV_moff32_EAX( xlat_get_lut_entry(pc) );
|
nkeynes@926 | 181 | REXW(); AND_imm8s_r32( 0xFC, R_EAX ); // 4
|
nkeynes@586 | 182 | } else if( sh4_x86.tlb_on ) {
|
nkeynes@736 | 183 | call_func1(xlat_get_code_by_vma, R_ECX);
|
nkeynes@586 | 184 | } else {
|
nkeynes@736 | 185 | call_func1(xlat_get_code,R_ECX);
|
nkeynes@586 | 186 | }
|
nkeynes@539 | 187 | load_imm32( R_ECX, ((endpc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
|
nkeynes@539 | 188 | ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) ); // 6
|
nkeynes@926 | 189 | exit_block();
|
nkeynes@539 | 190 | }
|
nkeynes@539 | 191 |
|
nkeynes@539 | 192 |
|
nkeynes@586 | 193 | #define EXIT_BLOCK_REL_SIZE(pc) (28 + (IS_IN_ICACHE(pc)?10:CALL_FUNC1_SIZE))
|
nkeynes@586 | 194 |
|
nkeynes@586 | 195 | /**
|
nkeynes@586 | 196 | * Exit the block to a relative PC
|
nkeynes@586 | 197 | */
|
nkeynes@586 | 198 | void exit_block_rel( sh4addr_t pc, sh4addr_t endpc )
|
nkeynes@586 | 199 | {
|
nkeynes@586 | 200 | load_imm32( R_ECX, pc - sh4_x86.block_start_pc ); // 5
|
nkeynes@586 | 201 | ADD_sh4r_r32( R_PC, R_ECX );
|
nkeynes@586 | 202 | store_spreg( R_ECX, REG_OFFSET(pc) ); // 3
|
nkeynes@586 | 203 | if( IS_IN_ICACHE(pc) ) {
|
nkeynes@736 | 204 | REXW(); MOV_moff32_EAX( xlat_get_lut_entry(GET_ICACHE_PHYS(pc)) ); // 5
|
nkeynes@926 | 205 | REXW(); AND_imm8s_r32( 0xFC, R_EAX ); // 4
|
nkeynes@586 | 206 | } else if( sh4_x86.tlb_on ) {
|
nkeynes@736 | 207 | call_func1(xlat_get_code_by_vma,R_ECX);
|
nkeynes@586 | 208 | } else {
|
nkeynes@736 | 209 | call_func1(xlat_get_code,R_ECX);
|
nkeynes@586 | 210 | }
|
nkeynes@586 | 211 | load_imm32( R_ECX, ((endpc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
|
nkeynes@586 | 212 | ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) ); // 6
|
nkeynes@926 | 213 | exit_block();
|
nkeynes@586 | 214 | }
|
nkeynes@586 | 215 |
|
nkeynes@539 | 216 | /**
|
nkeynes@539 | 217 | * Write the block trailer (exception handling block)
|
nkeynes@539 | 218 | */
|
nkeynes@539 | 219 | void sh4_translate_end_block( sh4addr_t pc ) {
|
nkeynes@539 | 220 | if( sh4_x86.branch_taken == FALSE ) {
|
nkeynes@736 | 221 | // Didn't exit unconditionally already, so write the termination here
|
nkeynes@736 | 222 | exit_block_rel( pc, pc );
|
nkeynes@539 | 223 | }
|
nkeynes@539 | 224 | if( sh4_x86.backpatch_posn != 0 ) {
|
nkeynes@736 | 225 | unsigned int i;
|
nkeynes@736 | 226 | // Raise exception
|
nkeynes@736 | 227 | uint8_t *end_ptr = xlat_output;
|
nkeynes@736 | 228 | MOV_r32_r32( R_EDX, R_ECX );
|
nkeynes@736 | 229 | ADD_r32_r32( R_EDX, R_ECX );
|
nkeynes@736 | 230 | ADD_r32_sh4r( R_ECX, R_PC );
|
nkeynes@736 | 231 | MOV_moff32_EAX( &sh4_cpu_period );
|
nkeynes@736 | 232 | MUL_r32( R_EDX );
|
nkeynes@736 | 233 | ADD_r32_sh4r( R_EAX, REG_OFFSET(slice_cycle) );
|
nkeynes@539 | 234 |
|
nkeynes@736 | 235 | call_func0( sh4_raise_exception );
|
nkeynes@736 | 236 | load_spreg( R_EAX, R_PC );
|
nkeynes@736 | 237 | if( sh4_x86.tlb_on ) {
|
nkeynes@736 | 238 | call_func1(xlat_get_code_by_vma,R_EAX);
|
nkeynes@736 | 239 | } else {
|
nkeynes@736 | 240 | call_func1(xlat_get_code,R_EAX);
|
nkeynes@736 | 241 | }
|
nkeynes@926 | 242 | exit_block();
|
nkeynes@926 | 243 |
|
nkeynes@736 | 244 | // Exception already raised - just cleanup
|
nkeynes@736 | 245 | uint8_t *preexc_ptr = xlat_output;
|
nkeynes@736 | 246 | MOV_r32_r32( R_EDX, R_ECX );
|
nkeynes@736 | 247 | ADD_r32_r32( R_EDX, R_ECX );
|
nkeynes@736 | 248 | ADD_r32_sh4r( R_ECX, R_SPC );
|
nkeynes@736 | 249 | MOV_moff32_EAX( &sh4_cpu_period );
|
nkeynes@736 | 250 | MUL_r32( R_EDX );
|
nkeynes@736 | 251 | ADD_r32_sh4r( R_EAX, REG_OFFSET(slice_cycle) );
|
nkeynes@736 | 252 | load_spreg( R_EDI, R_PC );
|
nkeynes@736 | 253 | if( sh4_x86.tlb_on ) {
|
nkeynes@736 | 254 | call_func0(xlat_get_code_by_vma);
|
nkeynes@736 | 255 | } else {
|
nkeynes@736 | 256 | call_func0(xlat_get_code);
|
nkeynes@736 | 257 | }
|
nkeynes@926 | 258 | exit_block();
|
nkeynes@586 | 259 |
|
nkeynes@736 | 260 | for( i=0; i< sh4_x86.backpatch_posn; i++ ) {
|
nkeynes@736 | 261 | uint32_t *fixup_addr = (uint32_t *)&xlat_current_block->code[sh4_x86.backpatch_list[i].fixup_offset];
|
nkeynes@736 | 262 | if( sh4_x86.backpatch_list[i].exc_code < 0 ) {
|
nkeynes@927 | 263 | if( sh4_x86.backpatch_list[i].exc_code == -2 ) {
|
nkeynes@927 | 264 | *((uintptr_t *)fixup_addr) = (uintptr_t)xlat_output;
|
nkeynes@927 | 265 | } else {
|
nkeynes@927 | 266 | *fixup_addr = xlat_output - (uint8_t *)&xlat_current_block->code[sh4_x86.backpatch_list[i].fixup_offset] - 4;
|
nkeynes@927 | 267 | }
|
nkeynes@736 | 268 | load_imm32( R_EDX, sh4_x86.backpatch_list[i].fixup_icount );
|
nkeynes@736 | 269 | int rel = preexc_ptr - xlat_output;
|
nkeynes@736 | 270 | JMP_rel(rel);
|
nkeynes@736 | 271 | } else {
|
nkeynes@927 | 272 | *fixup_addr = xlat_output - (uint8_t *)&xlat_current_block->code[sh4_x86.backpatch_list[i].fixup_offset] - 4;
|
nkeynes@736 | 273 | load_imm32( R_EDI, sh4_x86.backpatch_list[i].exc_code );
|
nkeynes@736 | 274 | load_imm32( R_EDX, sh4_x86.backpatch_list[i].fixup_icount );
|
nkeynes@736 | 275 | int rel = end_ptr - xlat_output;
|
nkeynes@736 | 276 | JMP_rel(rel);
|
nkeynes@736 | 277 | }
|
nkeynes@736 | 278 | }
|
nkeynes@539 | 279 | }
|
nkeynes@539 | 280 | }
|
nkeynes@539 | 281 |
|
nkeynes@926 | 282 | struct UnwindInfo {
|
nkeynes@926 | 283 | uintptr_t block_start;
|
nkeynes@926 | 284 | uintptr_t block_end;
|
nkeynes@926 | 285 | void *pc;
|
nkeynes@926 | 286 | };
|
nkeynes@926 | 287 |
|
nkeynes@586 | 288 | _Unwind_Reason_Code xlat_check_frame( struct _Unwind_Context *context, void *arg )
|
nkeynes@586 | 289 | {
|
nkeynes@926 | 290 | struct UnwindInfo *info = arg;
|
nkeynes@926 | 291 | void *pc = (void *)_Unwind_GetIP(context);
|
nkeynes@926 | 292 | if( ((uintptr_t)pc) >= info->block_start && ((uintptr_t)pc) < info->block_end ) {
|
nkeynes@926 | 293 | info->pc = pc;
|
nkeynes@586 | 294 | return _URC_NORMAL_STOP;
|
nkeynes@586 | 295 | }
|
nkeynes@926 | 296 |
|
nkeynes@586 | 297 | return _URC_NO_REASON;
|
nkeynes@586 | 298 | }
|
nkeynes@586 | 299 |
|
nkeynes@926 | 300 | void *xlat_get_native_pc( void *code, uint32_t code_size )
|
nkeynes@586 | 301 | {
|
nkeynes@586 | 302 | struct _Unwind_Exception exc;
|
nkeynes@926 | 303 | struct UnwindInfo info;
|
nkeynes@736 | 304 |
|
nkeynes@926 | 305 | info.pc = NULL;
|
nkeynes@926 | 306 | info.block_start = (uintptr_t)code;
|
nkeynes@926 | 307 | info.block_end = info.block_start + code_size;
|
nkeynes@586 | 308 | void *result = NULL;
|
nkeynes@926 | 309 | _Unwind_Backtrace( xlat_check_frame, &info );
|
nkeynes@926 | 310 | return info.pc;
|
nkeynes@586 | 311 | }
|
nkeynes@586 | 312 |
|
nkeynes@736 | 313 | #endif /* !lxdream_ia64abi_H */
|