4 * Provides the implementation for the ia32 ABI (e.g. prologue, epilogue, and
7 * Copyright (c) 2007 Nathan Keynes.
9 * This program is free software; you can redistribute it and/or modify
10 * it under the terms of the GNU General Public License as published by
11 * the Free Software Foundation; either version 2 of the License, or
12 * (at your option) any later version.
14 * This program is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 * GNU General Public License for more details.
20 #ifndef __lxdream_ia32abi_H
21 #define __lxdream_ia32abi_H 1
/**
 * Pass the address ptr, cast to a 32-bit immediate, to load_imm32 for the
 * register reg. Both arguments are parenthesized so that compound
 * expressions are cast/evaluated as a whole, and the expansion carries no
 * trailing semicolon - the caller supplies it, which keeps the macro usable
 * as a single statement inside if/else.
 */
#define load_ptr( reg, ptr ) load_imm32( (reg), (uint32_t)(ptr) )
26 * Note: clobbers EAX to make the indirect call - this isn't usually
27 * a problem since the callee will usually clobber it anyway.
29 #define CALL_FUNC0_SIZE 7
30 static inline void call_func0( void *ptr )
32 load_imm32(R_EAX, (uint32_t)ptr);
36 #define CALL_FUNC1_SIZE 11
37 static inline void call_func1( void *ptr, int arg1 )
41 ADD_imm8s_r32( 4, R_ESP );
44 #define CALL_FUNC2_SIZE 12
45 static inline void call_func2( void *ptr, int arg1, int arg2 )
50 ADD_imm8s_r32( 8, R_ESP );
54 * Write a double (64-bit) value into memory, with the first word in arg2a, and
58 #define MEM_WRITE_DOUBLE_SIZE 30
59 static inline void MEM_WRITE_DOUBLE( int addr, int arg2a, int arg2b )
61 ADD_imm8s_r32( 4, addr );
64 ADD_imm8s_r32( -4, addr );
67 call_func0(sh4_write_long);
68 ADD_imm8s_r32( 8, R_ESP );
69 call_func0(sh4_write_long);
70 ADD_imm8s_r32( 8, R_ESP );
74 * Read a double (64-bit) value from memory, writing the first word into arg2a
75 * and the second into arg2b. The addr must not be in EAX
78 #define MEM_READ_DOUBLE_SIZE 27
79 static inline void MEM_READ_DOUBLE( int addr, int arg2a, int arg2b )
82 call_func0(sh4_read_long);
85 ADD_imm8s_r32( 4, R_ECX );
87 call_func0(sh4_read_long);
88 ADD_imm8s_r32( 4, R_ESP );
89 MOV_r32_r32( R_EAX, arg2b );
94 * Emit the 'start of block' assembly. Sets up the stack frame and saves
97 void sh4_translate_begin_block( sh4addr_t pc )
101 load_ptr( R_EBP, &sh4r );
103 sh4_x86.in_delay_slot = FALSE;
104 sh4_x86.priv_checked = FALSE;
105 sh4_x86.fpuen_checked = FALSE;
106 sh4_x86.branch_taken = FALSE;
107 sh4_x86.backpatch_posn = 0;
108 sh4_x86.recovery_posn = 0;
109 sh4_x86.block_start_pc = pc;
110 sh4_x86.tlb_on = IS_MMU_ENABLED();
111 sh4_x86.tstate = TSTATE_NONE;
113 sh4_x86.stack_posn = 8;
118 * Exit the block with sh4r.pc already written
120 void exit_block_pcset( sh4addr_t pc )
122 load_imm32( R_ECX, ((pc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
123 ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) ); // 6
124 load_spreg( R_EAX, R_PC );
125 if( sh4_x86.tlb_on ) {
126 call_func1(xlat_get_code_by_vma,R_EAX);
128 call_func1(xlat_get_code,R_EAX);
135 * Exit the block with sh4r.new_pc written with the target pc
137 void exit_block_newpcset( sh4addr_t pc )
139 load_imm32( R_ECX, ((pc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
140 ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) ); // 6
141 load_spreg( R_EAX, R_NEW_PC );
142 store_spreg( R_EAX, R_PC );
143 if( sh4_x86.tlb_on ) {
144 call_func1(xlat_get_code_by_vma,R_EAX);
146 call_func1(xlat_get_code,R_EAX);
152 #define EXIT_BLOCK_SIZE(pc) (24 + (IS_IN_ICACHE(pc)?5:CALL_FUNC1_SIZE))
156 * Exit the block to an absolute PC
158 void exit_block( sh4addr_t pc, sh4addr_t endpc )
160 load_imm32( R_ECX, pc ); // 5
161 store_spreg( R_ECX, REG_OFFSET(pc) ); // 3
162 if( IS_IN_ICACHE(pc) ) {
163 MOV_moff32_EAX( xlat_get_lut_entry(GET_ICACHE_PHYS(pc)) ); // 5
164 } else if( sh4_x86.tlb_on ) {
165 call_func1(xlat_get_code_by_vma,R_ECX);
167 call_func1(xlat_get_code,R_ECX);
169 AND_imm8s_r32( 0xFC, R_EAX ); // 3
170 load_imm32( R_ECX, ((endpc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
171 ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) ); // 6
176 #define EXIT_BLOCK_REL_SIZE(pc) (27 + (IS_IN_ICACHE(pc)?5:CALL_FUNC1_SIZE))
179 * Exit the block to a relative PC
181 void exit_block_rel( sh4addr_t pc, sh4addr_t endpc )
183 load_imm32( R_ECX, pc - sh4_x86.block_start_pc ); // 5
184 ADD_sh4r_r32( R_PC, R_ECX );
185 store_spreg( R_ECX, REG_OFFSET(pc) ); // 3
186 if( IS_IN_ICACHE(pc) ) {
187 MOV_moff32_EAX( xlat_get_lut_entry(GET_ICACHE_PHYS(pc)) ); // 5
188 } else if( sh4_x86.tlb_on ) {
189 call_func1(xlat_get_code_by_vma,R_ECX);
191 call_func1(xlat_get_code,R_ECX);
193 AND_imm8s_r32( 0xFC, R_EAX ); // 3
194 load_imm32( R_ECX, ((endpc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
195 ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) ); // 6
201 * Write the block trailer (exception handling block)
203 void sh4_translate_end_block( sh4addr_t pc ) {
204 if( sh4_x86.branch_taken == FALSE ) {
205 // Didn't exit unconditionally already, so write the termination here
206 exit_block_rel( pc, pc );
208 if( sh4_x86.backpatch_posn != 0 ) {
211 uint8_t *end_ptr = xlat_output;
212 MOV_r32_r32( R_EDX, R_ECX );
213 ADD_r32_r32( R_EDX, R_ECX );
214 ADD_r32_sh4r( R_ECX, R_PC );
215 MOV_moff32_EAX( &sh4_cpu_period );
217 ADD_r32_sh4r( R_EAX, REG_OFFSET(slice_cycle) );
219 call_func0( sh4_raise_exception );
220 ADD_imm8s_r32( 4, R_ESP );
221 load_spreg( R_EAX, R_PC );
222 if( sh4_x86.tlb_on ) {
223 call_func1(xlat_get_code_by_vma,R_EAX);
225 call_func1(xlat_get_code,R_EAX);
230 // Exception already raised - just cleanup
231 uint8_t *preexc_ptr = xlat_output;
232 MOV_r32_r32( R_EDX, R_ECX );
233 ADD_r32_r32( R_EDX, R_ECX );
234 ADD_r32_sh4r( R_ECX, R_SPC );
235 MOV_moff32_EAX( &sh4_cpu_period );
237 ADD_r32_sh4r( R_EAX, REG_OFFSET(slice_cycle) );
238 load_spreg( R_EAX, R_PC );
239 if( sh4_x86.tlb_on ) {
240 call_func1(xlat_get_code_by_vma,R_EAX);
242 call_func1(xlat_get_code,R_EAX);
247 for( i=0; i< sh4_x86.backpatch_posn; i++ ) {
248 *sh4_x86.backpatch_list[i].fixup_addr =
249 xlat_output - ((uint8_t *)sh4_x86.backpatch_list[i].fixup_addr) - 4;
250 if( sh4_x86.backpatch_list[i].exc_code == -1 ) {
251 load_imm32( R_EDX, sh4_x86.backpatch_list[i].fixup_icount );
252 int rel = preexc_ptr - xlat_output;
255 PUSH_imm32( sh4_x86.backpatch_list[i].exc_code );
256 load_imm32( R_EDX, sh4_x86.backpatch_list[i].fixup_icount );
257 int rel = end_ptr - xlat_output;
264 void *xlat_get_native_pc()
268 "mov %%ebp, %%eax\n\t"
269 "mov $0x8, %%ecx\n\t"
271 "frame_loop: test %%eax, %%eax\n\t"
272 "je frame_not_found\n\t"
273 "cmp (%%eax), %%edx\n\t"
275 "sub $0x1, %%ecx\n\t"
276 "je frame_not_found\n\t"
277 "movl (%%eax), %%eax\n\t"
279 "frame_found: movl 0x4(%%eax), %0\n"
283 : "eax", "ecx", "edx" );
.