Search
lxdream.org :: lxdream/src/sh4/ia64abi.h
lxdream 0.9.1
released Jun 29
Download Now
filename src/sh4/ia64abi.h
changeset 957:0f6131f6cc3a
prev953:f4a156508ad1
next991:60c7fab9c880
author nkeynes
date Thu Jan 15 04:15:11 2009 +0000 (15 years ago)
permissions -rw-r--r--
last change Add support for the Intel ICC compiler (C only, icc doesn't support Obj-C)
- Rename Obj-C source to .m
- Separate paths.c into paths_unix.c and paths_osx.m
- Add configuration detection of ICC, along with specific opt flags
file annotate diff log raw
nkeynes@539
     1
/**
nkeynes@586
     2
 * $Id$
nkeynes@539
     3
 * 
nkeynes@736
     4
 * Provides the implementation for the AMD64 ABI (eg prologue, epilogue, and
nkeynes@539
     5
 * calling conventions)
nkeynes@539
     6
 *
nkeynes@539
     7
 * Copyright (c) 2007 Nathan Keynes.
nkeynes@539
     8
 *
nkeynes@539
     9
 * This program is free software; you can redistribute it and/or modify
nkeynes@539
    10
 * it under the terms of the GNU General Public License as published by
nkeynes@539
    11
 * the Free Software Foundation; either version 2 of the License, or
nkeynes@539
    12
 * (at your option) any later version.
nkeynes@539
    13
 *
nkeynes@539
    14
 * This program is distributed in the hope that it will be useful,
nkeynes@539
    15
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
nkeynes@539
    16
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
nkeynes@539
    17
 * GNU General Public License for more details.
nkeynes@539
    18
 */
nkeynes@539
    19
nkeynes@736
    20
#ifndef lxdream_ia64abi_H
nkeynes@736
    21
#define lxdream_ia64abi_H 1
nkeynes@539
    22
nkeynes@586
    23
#include <unwind.h>
nkeynes@539
    24
nkeynes@539
    25
/*
 * Load a host pointer value into a register as a 64-bit immediate.
 * Expands to a single expression (no trailing ';') with both arguments
 * parenthesised, so it is safe inside unbraced if/else and the cast always
 * applies to the whole pointer expression.
 */
#define load_ptr( reg, ptr ) load_imm64( (reg), (uint64_t)(ptr) )
nkeynes@736
    26
nkeynes@953
    27
static inline decode_address( int addr_reg )
nkeynes@953
    28
{
nkeynes@953
    29
    uintptr_t base = (sh4r.xlat_sh4_mode&SR_MD) ? (uintptr_t)sh4_address_space : (uintptr_t)sh4_user_address_space;
nkeynes@953
    30
    MOV_r32_r32( addr_reg, R_ECX ); 
nkeynes@953
    31
    SHR_imm8_r32( 12, R_ECX ); 
nkeynes@953
    32
    load_ptr( R_EDI, base );
nkeynes@953
    33
    REXW(); OP(0x8B); OP(0x0C); OP(0xCF);   // mov.q [%rdi + %rcx*8], %rcx
nkeynes@953
    34
}
nkeynes@953
    35
nkeynes@539
    36
/**
nkeynes@539
    37
 * Note: clobbers EAX to make the indirect call - this isn't usually
nkeynes@539
    38
 * a problem since the callee will usually clobber it anyway.
nkeynes@539
    39
 * Size: 12 bytes
nkeynes@539
    40
 */
nkeynes@539
    41
#define CALL_FUNC0_SIZE 12
nkeynes@539
    42
static inline void call_func0( void *ptr )
nkeynes@539
    43
{
nkeynes@539
    44
    load_imm64(R_EAX, (uint64_t)ptr);
nkeynes@539
    45
    CALL_r32(R_EAX);
nkeynes@539
    46
}
nkeynes@539
    47
nkeynes@539
    48
#define CALL_FUNC1_SIZE 14
nkeynes@539
    49
static inline void call_func1( void *ptr, int arg1 )
nkeynes@539
    50
{
nkeynes@800
    51
    REXW(); MOV_r32_r32(arg1, R_EDI);
nkeynes@539
    52
    call_func0(ptr);
nkeynes@539
    53
}
nkeynes@539
    54
nkeynes@927
    55
static inline void call_func1_exc( void *ptr, int arg1, int pc )
nkeynes@927
    56
{
nkeynes@927
    57
    REXW(); MOV_r32_r32(arg1, R_EDI);
nkeynes@927
    58
    load_exc_backpatch(R_ESI);
nkeynes@927
    59
    call_func0(ptr);
nkeynes@927
    60
}
nkeynes@927
    61
nkeynes@953
    62
static inline void call_func1_r32disp8( int preg, uint32_t disp8, int arg1 )
nkeynes@953
    63
{
nkeynes@953
    64
    REXW(); MOV_r32_r32(arg1, R_EDI);
nkeynes@953
    65
    CALL_r32disp8(preg, disp8);    
nkeynes@953
    66
}
nkeynes@953
    67
nkeynes@953
    68
static inline void call_func1_r32disp8_exc( int preg, uint32_t disp8, int arg1, int pc )
nkeynes@953
    69
{
nkeynes@953
    70
    REXW(); MOV_r32_r32(arg1, R_EDI);
nkeynes@953
    71
    load_exc_backpatch(R_ESI);
nkeynes@953
    72
    CALL_r32disp8(preg, disp8);
nkeynes@953
    73
}
nkeynes@953
    74
nkeynes@539
    75
#define CALL_FUNC2_SIZE 16
nkeynes@539
    76
static inline void call_func2( void *ptr, int arg1, int arg2 )
nkeynes@539
    77
{
nkeynes@800
    78
    REXW(); MOV_r32_r32(arg1, R_EDI);
nkeynes@800
    79
    REXW(); MOV_r32_r32(arg2, R_ESI);
nkeynes@539
    80
    call_func0(ptr);
nkeynes@539
    81
}
nkeynes@539
    82
nkeynes@953
    83
static inline void call_func2_r32disp8( int preg, uint32_t disp8, int arg1, int arg2 )
nkeynes@539
    84
{
nkeynes@953
    85
    REXW(); MOV_r32_r32(arg1, R_EDI);
nkeynes@953
    86
    REXW(); MOV_r32_r32(arg2, R_ESI);
nkeynes@953
    87
    CALL_r32disp8(preg, disp8);    
nkeynes@539
    88
}
nkeynes@539
    89
nkeynes@953
    90
static inline void call_func2_r32disp8_exc( int preg, uint32_t disp8, int arg1, int arg2, int pc )
nkeynes@539
    91
{
nkeynes@953
    92
    REXW(); MOV_r32_r32(arg1, R_EDI);
nkeynes@953
    93
    REXW(); MOV_r32_r32(arg2, R_ESI);
nkeynes@953
    94
    load_exc_backpatch(R_EDX);
nkeynes@953
    95
    CALL_r32disp8(preg, disp8);
nkeynes@539
    96
}
nkeynes@539
    97
nkeynes@539
    98
nkeynes@953
    99
nkeynes@539
   100
/**
nkeynes@539
   101
 * Emit the 'start of block' assembly. Sets up the stack frame and save
nkeynes@539
   102
 * SI/DI as required
nkeynes@539
   103
 */
nkeynes@901
   104
void enter_block( ) 
nkeynes@539
   105
{
nkeynes@539
   106
    PUSH_r32(R_EBP);
nkeynes@669
   107
    load_ptr( R_EBP, ((uint8_t *)&sh4r) + 128 );
nkeynes@926
   108
    // Minimum aligned allocation is 16 bytes
nkeynes@926
   109
    REXW(); SUB_imm8s_r32( 16, R_ESP );
nkeynes@926
   110
}
nkeynes@926
   111
nkeynes@926
   112
static inline void exit_block( )
nkeynes@926
   113
{
nkeynes@926
   114
    REXW(); ADD_imm8s_r32( 16, R_ESP );
nkeynes@926
   115
    POP_r32(R_EBP);
nkeynes@926
   116
    RET();
nkeynes@539
   117
}
nkeynes@908
   118
nkeynes@539
   119
/**
nkeynes@539
   120
 * Exit the block with sh4r.pc already written
nkeynes@539
   121
 */
nkeynes@586
   122
void exit_block_pcset( sh4addr_t pc )
nkeynes@539
   123
{
nkeynes@539
   124
    load_imm32( R_ECX, ((pc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
nkeynes@539
   125
    ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) );    // 6
nkeynes@590
   126
    load_spreg( R_EAX, R_PC );
nkeynes@590
   127
    if( sh4_x86.tlb_on ) {
nkeynes@736
   128
        call_func1(xlat_get_code_by_vma,R_EAX);
nkeynes@590
   129
    } else {
nkeynes@736
   130
        call_func1(xlat_get_code,R_EAX);
nkeynes@590
   131
    }
nkeynes@926
   132
    exit_block();
nkeynes@590
   133
}
nkeynes@590
   134
nkeynes@590
   135
/**
nkeynes@590
   136
 * Exit the block with sh4r.new_pc written with the target address
nkeynes@590
   137
 */
nkeynes@590
   138
void exit_block_newpcset( sh4addr_t pc )
nkeynes@590
   139
{
nkeynes@590
   140
    load_imm32( R_ECX, ((pc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
nkeynes@590
   141
    ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) );    // 6
nkeynes@590
   142
    load_spreg( R_EAX, R_NEW_PC );
nkeynes@590
   143
    store_spreg( R_EAX, R_PC );
nkeynes@586
   144
    if( sh4_x86.tlb_on ) {
nkeynes@736
   145
        call_func1(xlat_get_code_by_vma,R_EAX);
nkeynes@586
   146
    } else {
nkeynes@736
   147
        call_func1(xlat_get_code,R_EAX);
nkeynes@586
   148
    }
nkeynes@926
   149
    exit_block();
nkeynes@539
   150
}
nkeynes@539
   151
nkeynes@586
   152
#define EXIT_BLOCK_SIZE(pc) (25 + (IS_IN_ICACHE(pc)?10:CALL_FUNC1_SIZE))
nkeynes@539
   153
/**
nkeynes@539
   154
 * Exit the block to an absolute PC
nkeynes@539
   155
 */
nkeynes@926
   156
void exit_block_abs( sh4addr_t pc, sh4addr_t endpc )
nkeynes@539
   157
{
nkeynes@539
   158
    load_imm32( R_ECX, pc );                            // 5
nkeynes@539
   159
    store_spreg( R_ECX, REG_OFFSET(pc) );               // 3
nkeynes@586
   160
    if( IS_IN_ICACHE(pc) ) {
nkeynes@736
   161
        REXW(); MOV_moff32_EAX( xlat_get_lut_entry(pc) );
nkeynes@926
   162
        REXW(); AND_imm8s_r32( 0xFC, R_EAX ); // 4
nkeynes@586
   163
    } else if( sh4_x86.tlb_on ) {
nkeynes@736
   164
        call_func1(xlat_get_code_by_vma, R_ECX);
nkeynes@586
   165
    } else {
nkeynes@736
   166
        call_func1(xlat_get_code,R_ECX);
nkeynes@586
   167
    }
nkeynes@539
   168
    load_imm32( R_ECX, ((endpc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
nkeynes@539
   169
    ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) );     // 6
nkeynes@926
   170
    exit_block();
nkeynes@539
   171
}
nkeynes@539
   172
nkeynes@539
   173
nkeynes@586
   174
#define EXIT_BLOCK_REL_SIZE(pc)  (28 + (IS_IN_ICACHE(pc)?10:CALL_FUNC1_SIZE))
nkeynes@586
   175
nkeynes@586
   176
/**
nkeynes@586
   177
 * Exit the block to a relative PC
nkeynes@586
   178
 */
nkeynes@586
   179
void exit_block_rel( sh4addr_t pc, sh4addr_t endpc )
nkeynes@586
   180
{
nkeynes@586
   181
    load_imm32( R_ECX, pc - sh4_x86.block_start_pc );   // 5
nkeynes@586
   182
    ADD_sh4r_r32( R_PC, R_ECX );
nkeynes@586
   183
    store_spreg( R_ECX, REG_OFFSET(pc) );               // 3
nkeynes@586
   184
    if( IS_IN_ICACHE(pc) ) {
nkeynes@736
   185
        REXW(); MOV_moff32_EAX( xlat_get_lut_entry(GET_ICACHE_PHYS(pc)) ); // 5
nkeynes@926
   186
        REXW(); AND_imm8s_r32( 0xFC, R_EAX ); // 4
nkeynes@586
   187
    } else if( sh4_x86.tlb_on ) {
nkeynes@736
   188
        call_func1(xlat_get_code_by_vma,R_ECX);
nkeynes@586
   189
    } else {
nkeynes@736
   190
        call_func1(xlat_get_code,R_ECX);
nkeynes@586
   191
    }
nkeynes@586
   192
    load_imm32( R_ECX, ((endpc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
nkeynes@586
   193
    ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) );     // 6
nkeynes@926
   194
    exit_block();
nkeynes@586
   195
}
nkeynes@586
   196
nkeynes@539
   197
/**
nkeynes@957
   198
 * Exit unconditionally with a general exception
nkeynes@957
   199
 */
nkeynes@957
   200
void exit_block_exc( int code, sh4addr_t pc )
nkeynes@957
   201
{
nkeynes@957
   202
    load_imm32( R_ECX, pc - sh4_x86.block_start_pc );   // 5
nkeynes@957
   203
    ADD_r32_sh4r( R_ECX, R_PC );
nkeynes@957
   204
    load_imm32( R_ECX, ((pc - sh4_x86.block_start_pc)>>1)*sh4_cpu_period ); // 5
nkeynes@957
   205
    ADD_r32_sh4r( R_ECX, REG_OFFSET(slice_cycle) );     // 6
nkeynes@957
   206
    load_imm32( R_EAX, code );
nkeynes@957
   207
    call_func1( sh4_raise_exception, R_EAX );
nkeynes@957
   208
    
nkeynes@957
   209
    load_spreg( R_EAX, R_PC );
nkeynes@957
   210
    if( sh4_x86.tlb_on ) {
nkeynes@957
   211
        call_func1(xlat_get_code_by_vma,R_EAX);
nkeynes@957
   212
    } else {
nkeynes@957
   213
        call_func1(xlat_get_code,R_EAX);
nkeynes@957
   214
    }
nkeynes@957
   215
nkeynes@957
   216
    exit_block();
nkeynes@957
   217
}    
nkeynes@957
   218
nkeynes@957
   219
nkeynes@957
   220
/**
nkeynes@539
   221
 * Write the block trailer (exception handling block)
nkeynes@539
   222
 */
nkeynes@539
   223
void sh4_translate_end_block( sh4addr_t pc ) {
nkeynes@539
   224
    if( sh4_x86.branch_taken == FALSE ) {
nkeynes@736
   225
        // Didn't exit unconditionally already, so write the termination here
nkeynes@736
   226
        exit_block_rel( pc, pc );
nkeynes@539
   227
    }
nkeynes@539
   228
    if( sh4_x86.backpatch_posn != 0 ) {
nkeynes@736
   229
        unsigned int i;
nkeynes@736
   230
        // Raise exception
nkeynes@736
   231
        uint8_t *end_ptr = xlat_output;
nkeynes@736
   232
        MOV_r32_r32( R_EDX, R_ECX );
nkeynes@736
   233
        ADD_r32_r32( R_EDX, R_ECX );
nkeynes@736
   234
        ADD_r32_sh4r( R_ECX, R_PC );
nkeynes@736
   235
        MOV_moff32_EAX( &sh4_cpu_period );
nkeynes@736
   236
        MUL_r32( R_EDX );
nkeynes@736
   237
        ADD_r32_sh4r( R_EAX, REG_OFFSET(slice_cycle) );
nkeynes@539
   238
nkeynes@736
   239
        call_func0( sh4_raise_exception );
nkeynes@736
   240
        load_spreg( R_EAX, R_PC );
nkeynes@736
   241
        if( sh4_x86.tlb_on ) {
nkeynes@736
   242
            call_func1(xlat_get_code_by_vma,R_EAX);
nkeynes@736
   243
        } else {
nkeynes@736
   244
            call_func1(xlat_get_code,R_EAX);
nkeynes@736
   245
        }
nkeynes@926
   246
        exit_block();
nkeynes@926
   247
        
nkeynes@736
   248
        // Exception already raised - just cleanup
nkeynes@736
   249
        uint8_t *preexc_ptr = xlat_output;
nkeynes@736
   250
        MOV_r32_r32( R_EDX, R_ECX );
nkeynes@736
   251
        ADD_r32_r32( R_EDX, R_ECX );
nkeynes@736
   252
        ADD_r32_sh4r( R_ECX, R_SPC );
nkeynes@736
   253
        MOV_moff32_EAX( &sh4_cpu_period );
nkeynes@736
   254
        MUL_r32( R_EDX );
nkeynes@736
   255
        ADD_r32_sh4r( R_EAX, REG_OFFSET(slice_cycle) );
nkeynes@736
   256
        load_spreg( R_EDI, R_PC );
nkeynes@736
   257
        if( sh4_x86.tlb_on ) {
nkeynes@736
   258
            call_func0(xlat_get_code_by_vma);
nkeynes@736
   259
        } else {
nkeynes@736
   260
            call_func0(xlat_get_code);
nkeynes@736
   261
        }
nkeynes@926
   262
        exit_block();
nkeynes@586
   263
nkeynes@736
   264
        for( i=0; i< sh4_x86.backpatch_posn; i++ ) {
nkeynes@736
   265
            uint32_t *fixup_addr = (uint32_t *)&xlat_current_block->code[sh4_x86.backpatch_list[i].fixup_offset];
nkeynes@736
   266
            if( sh4_x86.backpatch_list[i].exc_code < 0 ) {
nkeynes@927
   267
                if( sh4_x86.backpatch_list[i].exc_code == -2 ) {
nkeynes@927
   268
                    *((uintptr_t *)fixup_addr) = (uintptr_t)xlat_output; 
nkeynes@927
   269
                } else {
nkeynes@927
   270
                    *fixup_addr = xlat_output - (uint8_t *)&xlat_current_block->code[sh4_x86.backpatch_list[i].fixup_offset] - 4;
nkeynes@927
   271
                }
nkeynes@736
   272
                load_imm32( R_EDX, sh4_x86.backpatch_list[i].fixup_icount );
nkeynes@736
   273
                int rel = preexc_ptr - xlat_output;
nkeynes@736
   274
                JMP_rel(rel);
nkeynes@736
   275
            } else {
nkeynes@927
   276
                *fixup_addr = xlat_output - (uint8_t *)&xlat_current_block->code[sh4_x86.backpatch_list[i].fixup_offset] - 4;
nkeynes@736
   277
                load_imm32( R_EDI, sh4_x86.backpatch_list[i].exc_code );
nkeynes@736
   278
                load_imm32( R_EDX, sh4_x86.backpatch_list[i].fixup_icount );
nkeynes@736
   279
                int rel = end_ptr - xlat_output;
nkeynes@736
   280
                JMP_rel(rel);
nkeynes@736
   281
            }
nkeynes@736
   282
        }
nkeynes@539
   283
    }
nkeynes@539
   284
}
nkeynes@539
   285
nkeynes@926
   286
/**
 * State shared between xlat_get_native_pc() and its per-frame callback
 * xlat_check_frame().
 */
struct UnwindInfo {
    uintptr_t block_start;  /* first address of the code range searched for */
    uintptr_t block_end;    /* one past the last address of that range */
    void *pc;               /* out: matching instruction pointer, or NULL */
};

/**
 * _Unwind_Backtrace callback: stop at the first frame whose instruction
 * pointer lies in [block_start, block_end) and record that pointer.
 *
 * @param context unwinder context for the frame being visited
 * @param arg     pointer to the struct UnwindInfo describing the search
 * @return _URC_NORMAL_STOP when the frame matches (info->pc is set),
 *         _URC_NO_REASON to continue with the next frame
 */
_Unwind_Reason_Code xlat_check_frame( struct _Unwind_Context *context, void *arg )
{
    struct UnwindInfo *info = arg;
    uintptr_t ip = (uintptr_t)_Unwind_GetIP(context);

    if( ip < info->block_start || ip >= info->block_end ) {
        return _URC_NO_REASON;
    }
    info->pc = (void *)ip;
    return _URC_NORMAL_STOP;
}

/**
 * Walk the current call stack looking for a frame executing inside the
 * given code range.
 *
 * @param code      start of the code range
 * @param code_size size of the range in bytes
 * @return the instruction pointer of the first frame found inside
 *         [code, code + code_size), or NULL if no frame matches
 */
void *xlat_get_native_pc( void *code, uint32_t code_size )
{
    struct UnwindInfo info;

    info.block_start = (uintptr_t)code;
    info.block_end = info.block_start + code_size;
    info.pc = NULL;

    _Unwind_Backtrace( xlat_check_frame, &info );
    return info.pc;
}
nkeynes@586
   316
nkeynes@736
   317
#endif /* !lxdream_ia64abi_H */
.