Search
lxdream.org :: lxdream/src/pvr2/scene.c
lxdream 0.9.1
released Jun 29
Download Now
filename src/pvr2/scene.c
changeset 1142:fd82bfba61c4
prev1140:7dc1c71ece76
next1155:f9aefb4613e5
author nkeynes
date Thu Nov 11 17:51:37 2010 +1000 (13 years ago)
permissions -rw-r--r--
last change Add convenience gl_check_error() function
file annotate diff log raw
nkeynes@635
     1
/**
nkeynes@636
     2
 * $Id$
nkeynes@635
     3
 *
nkeynes@827
     4
 * Manage the internal vertex/polygon buffers and scene data structure.
nkeynes@635
     5
 * Where possible this uses VBOs for the vertex + index data.
nkeynes@635
     6
 *
nkeynes@635
     7
 * Copyright (c) 2005 Nathan Keynes.
nkeynes@635
     8
 *
nkeynes@635
     9
 * This program is free software; you can redistribute it and/or modify
nkeynes@635
    10
 * it under the terms of the GNU General Public License as published by
nkeynes@635
    11
 * the Free Software Foundation; either version 2 of the License, or
nkeynes@635
    12
 * (at your option) any later version.
nkeynes@635
    13
 *
nkeynes@635
    14
 * This program is distributed in the hope that it will be useful,
nkeynes@635
    15
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
nkeynes@635
    16
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
nkeynes@635
    17
 * GNU General Public License for more details.
nkeynes@635
    18
 */
nkeynes@635
    19
nkeynes@635
    20
#include <assert.h>
nkeynes@635
    21
#include <string.h>
nkeynes@645
    22
#include <math.h>
nkeynes@635
    23
#include "lxdream.h"
nkeynes@635
    24
#include "display.h"
nkeynes@635
    25
#include "pvr2/pvr2.h"
nkeynes@677
    26
#include "pvr2/pvr2mmio.h"
nkeynes@635
    27
#include "pvr2/glutil.h"
nkeynes@635
    28
#include "pvr2/scene.h"
nkeynes@635
    29
nkeynes@863
    30
/* Map an 8-bit channel value n onto (n+1)/256, so that 255 yields exactly 1.0 */
#define U8TOFLOAT(n)  ((float)((n) + 1) / 256.0)
nkeynes@863
    31
nkeynes@687
    32
/**
 * Expand a packed 32-bit colour (alpha in bits 31-24, red in 23-16, green in
 * 15-8, blue in 7-0) into four floats written in R, G, B, A order.
 * Each 8-bit channel c is converted as (c+1)/256.
 * @param bgra Packed colour word
 * @param rgba Output array of at least 4 floats
 */
static void unpack_bgra(uint32_t bgra, float *rgba)
{
    /* Bit position of the source byte for each output slot (R, G, B, A) */
    static const unsigned shifts[4] = { 16, 8, 0, 24 };
    unsigned ch;

    for( ch = 0; ch < 4; ch++ ) {
        uint32_t channel = (bgra >> shifts[ch]) & 0xFF;
        rgba[ch] = ((float)(channel + 1)) / 256.0;
    }
}
nkeynes@635
    39
nkeynes@639
    40
/**
 * Exchange the byte in bits 23-16 with the byte in bits 7-0 of a packed
 * colour word, leaving bits 31-24 and 15-8 where they are.
 */
static inline uint32_t bgra_to_rgba(uint32_t bgra)
{
    uint32_t unchanged = bgra & 0xFF00FF00;
    uint32_t moved_down = (bgra >> 16) & 0x000000FF;
    uint32_t moved_up = (bgra << 16) & 0x00FF0000;

    return unchanged | moved_down | moved_up;
}
nkeynes@639
    44
nkeynes@645
    45
/**
 * Widen a 16-bit packed FP value to a regular 32-bit float.
 * The 16 input bits are placed in the upper half of the 32-bit pattern and
 * the lower half is zero-filled. Assuming float is IEEE-754 single precision,
 * the input is therefore read as 1-bit sign, 8-bit exponent, 7-bit mantissa.
 * TODO: Check the correctness of this against the hardware format.
 */
static float halftofloat( uint16_t half )
{
    uint32_t bits = ((uint32_t)half) << 16;
    float value;

    /* Reinterpret the bit pattern as a float */
    memcpy( &value, &bits, sizeof(value) );
    return value;
}
nkeynes@645
    59
nkeynes@847
    60
/**
 * Build a float from a packed fog density value: bits 7-0 (plus a bias of
 * 127, wrapped to 8 bits) go into the float's exponent field, and bits 15-8
 * go into the top 8 bits of the float's mantissa field.
 */
static float parse_fog_density( uint32_t value )
{
    union {
        float f;
        uint32_t i;
    } bits;
    uint32_t exponent_field = ((value + 127) & 0xFF) << 23;
    uint32_t mantissa_field = (value & 0xFF00) << 7;

    bits.i = exponent_field | mantissa_field;
    return bits.f;
}
nkeynes@645
    69
nkeynes@635
    70
struct pvr2_scene_struct pvr2_scene;
nkeynes@635
    71
nkeynes@635
    72
static gboolean vbo_init = FALSE;
nkeynes@863
    73
static float scene_shadow_intensity = 0.0;
nkeynes@669
    74
nkeynes@669
    75
#ifdef ENABLE_VERTEX_BUFFER
nkeynes@635
    76
static gboolean vbo_supported = FALSE;
nkeynes@669
    77
#endif
nkeynes@635
    78
nkeynes@635
    79
/**
nkeynes@635
    80
 * Test for VBO support, and allocate all the system memory needed for the
nkeynes@635
    81
 * temporary structures. GL context must have been initialized before this
nkeynes@635
    82
 * point.
nkeynes@635
    83
 */
nkeynes@635
    84
void pvr2_scene_init()
nkeynes@635
    85
{
nkeynes@635
    86
    if( !vbo_init ) {
nkeynes@645
    87
#ifdef ENABLE_VERTEX_BUFFER
nkeynes@736
    88
        if( isGLVertexBufferSupported() ) {
nkeynes@736
    89
            vbo_supported = TRUE;
nkeynes@736
    90
            pvr2_scene.vbo_id = 1;
nkeynes@736
    91
        }
nkeynes@645
    92
#endif
nkeynes@736
    93
        pvr2_scene.vertex_array = NULL;
nkeynes@736
    94
        pvr2_scene.vertex_array_size = 0;
nkeynes@736
    95
        pvr2_scene.poly_array = g_malloc( MAX_POLY_BUFFER_SIZE );
nkeynes@736
    96
        pvr2_scene.buf_to_poly_map = g_malloc0( BUF_POLY_MAP_SIZE );
nkeynes@736
    97
        vbo_init = TRUE;
nkeynes@635
    98
    }
nkeynes@635
    99
}
nkeynes@635
   100
nkeynes@639
   101
/**
nkeynes@639
   102
 * Clear the scene data structures in preparation for fresh data
nkeynes@639
   103
 */
nkeynes@639
   104
void pvr2_scene_reset()
nkeynes@639
   105
{
nkeynes@639
   106
    pvr2_scene.poly_count = 0;
nkeynes@639
   107
    pvr2_scene.vertex_count = 0;
nkeynes@639
   108
    memset( pvr2_scene.buf_to_poly_map, 0, BUF_POLY_MAP_SIZE );
nkeynes@639
   109
}
nkeynes@639
   110
nkeynes@635
   111
void pvr2_scene_shutdown()
nkeynes@635
   112
{
nkeynes@645
   113
#ifdef ENABLE_VERTEX_BUFFER
nkeynes@635
   114
    if( vbo_supported ) {
nkeynes@736
   115
        glBindBufferARB( GL_ARRAY_BUFFER_ARB, 0 );
nkeynes@736
   116
        glDeleteBuffersARB( 1, &pvr2_scene.vbo_id );
nkeynes@736
   117
        pvr2_scene.vbo_id = 0;
nkeynes@635
   118
    } else {
nkeynes@645
   119
#endif
nkeynes@736
   120
        g_free( pvr2_scene.vertex_array );
nkeynes@736
   121
        pvr2_scene.vertex_array = NULL;
nkeynes@645
   122
#ifdef ENABLE_VERTEX_BUFFER
nkeynes@635
   123
    }
nkeynes@645
   124
#endif
nkeynes@645
   125
nkeynes@635
   126
    g_free( pvr2_scene.poly_array );
nkeynes@645
   127
    pvr2_scene.poly_array = NULL;
nkeynes@635
   128
    g_free( pvr2_scene.buf_to_poly_map );
nkeynes@645
   129
    pvr2_scene.buf_to_poly_map = NULL;
nkeynes@635
   130
    vbo_init = FALSE;
nkeynes@635
   131
}
nkeynes@635
   132
nkeynes@635
   133
void *vertex_buffer_map()
nkeynes@635
   134
{
nkeynes@687
   135
    // Allow 8 vertexes for the background (4+4)
nkeynes@687
   136
    uint32_t size = (pvr2_scene.vertex_count + 8) * sizeof(struct vertex_struct);
nkeynes@645
   137
#ifdef ENABLE_VERTEX_BUFFER
nkeynes@635
   138
    if( vbo_supported ) {
nkeynes@690
   139
        glGetError();
nkeynes@736
   140
        glBindBufferARB( GL_ARRAY_BUFFER_ARB, pvr2_scene.vbo_id );
nkeynes@736
   141
        if( size > pvr2_scene.vertex_array_size ) {
nkeynes@736
   142
            glBufferDataARB( GL_ARRAY_BUFFER_ARB, size, NULL, GL_DYNAMIC_DRAW_ARB );
nkeynes@736
   143
            int status = glGetError();
nkeynes@736
   144
            if( status != 0 ) {
nkeynes@736
   145
                fprintf( stderr, "Error %08X allocating vertex buffer\n", status );
nkeynes@736
   146
                abort();
nkeynes@736
   147
            }
nkeynes@736
   148
            pvr2_scene.vertex_array_size = size;
nkeynes@736
   149
        }
nkeynes@736
   150
        pvr2_scene.vertex_array = glMapBufferARB( GL_ARRAY_BUFFER_ARB, GL_WRITE_ONLY_ARB );
nkeynes@736
   151
        assert(pvr2_scene.vertex_array != NULL );
nkeynes@635
   152
    } else {
nkeynes@645
   153
#endif
nkeynes@736
   154
        if( size > pvr2_scene.vertex_array_size ) {
nkeynes@736
   155
            pvr2_scene.vertex_array = g_realloc( pvr2_scene.vertex_array, size );
nkeynes@736
   156
        }
nkeynes@645
   157
#ifdef ENABLE_VERTEX_BUFFER
nkeynes@635
   158
    }
nkeynes@645
   159
#endif
nkeynes@635
   160
    return pvr2_scene.vertex_array;
nkeynes@635
   161
}
nkeynes@635
   162
nkeynes@635
   163
gboolean vertex_buffer_unmap()
nkeynes@635
   164
{
nkeynes@645
   165
#ifdef ENABLE_VERTEX_BUFFER
nkeynes@635
   166
    if( vbo_supported ) {
nkeynes@736
   167
        pvr2_scene.vertex_array = NULL;
nkeynes@736
   168
        return glUnmapBufferARB( GL_ARRAY_BUFFER_ARB );
nkeynes@635
   169
    } else {
nkeynes@736
   170
        return TRUE;
nkeynes@635
   171
    }
nkeynes@645
   172
#else
nkeynes@645
   173
    return TRUE;
nkeynes@645
   174
#endif
nkeynes@635
   175
}
nkeynes@635
   176
nkeynes@639
   177
static struct polygon_struct *scene_add_polygon( pvraddr_t poly_idx, int vertex_count,
nkeynes@863
   178
                                                 shadow_mode_t is_modified )
nkeynes@635
   179
{
nkeynes@863
   180
    int vert_mul = is_modified != SHADOW_NONE ? 2 : 1;
nkeynes@635
   181
nkeynes@635
   182
    if( pvr2_scene.buf_to_poly_map[poly_idx] != NULL ) {
nkeynes@687
   183
        if( vertex_count > pvr2_scene.buf_to_poly_map[poly_idx]->vertex_count ) {
nkeynes@687
   184
            pvr2_scene.vertex_count += (vertex_count - pvr2_scene.buf_to_poly_map[poly_idx]->vertex_count) * vert_mul;
nkeynes@687
   185
            pvr2_scene.buf_to_poly_map[poly_idx]->vertex_count = vertex_count;
nkeynes@687
   186
        }
nkeynes@687
   187
        return pvr2_scene.buf_to_poly_map[poly_idx];
nkeynes@635
   188
    } else {
nkeynes@687
   189
        struct polygon_struct *poly = &pvr2_scene.poly_array[pvr2_scene.poly_count++];
nkeynes@687
   190
        poly->context = &pvr2_scene.pvr2_pbuf[poly_idx];
nkeynes@687
   191
        poly->vertex_count = vertex_count;
nkeynes@687
   192
        poly->vertex_index = -1;
nkeynes@687
   193
        poly->mod_vertex_index = -1;
nkeynes@687
   194
        poly->next = NULL;
nkeynes@1133
   195
        poly->sub_next = NULL;
nkeynes@687
   196
        pvr2_scene.buf_to_poly_map[poly_idx] = poly;
nkeynes@687
   197
        pvr2_scene.vertex_count += (vertex_count * vert_mul);
nkeynes@687
   198
        return poly;
nkeynes@635
   199
    }
nkeynes@635
   200
}
nkeynes@635
   201
nkeynes@635
   202
/**
nkeynes@1133
   203
 * Given a starting polygon, break it at the specified triangle so that the
nkeynes@1133
   204
 * preceding triangles are retained, and the remainder are contained in a
nkeynes@1133
   205
 * new sub-polygon. Does not preserve winding.
nkeynes@1133
   206
 */
nkeynes@1133
   207
static struct polygon_struct *scene_split_subpolygon( struct polygon_struct *parent, int split_offset )
nkeynes@1133
   208
{
nkeynes@1133
   209
    assert( split_offset > 0 && split_offset < (parent->vertex_count-2) );
nkeynes@1133
   210
    assert( pvr2_scene.poly_count < MAX_POLYGONS );
nkeynes@1133
   211
    struct polygon_struct *poly = &pvr2_scene.poly_array[pvr2_scene.poly_count++];
nkeynes@1133
   212
    poly->vertex_count = parent->vertex_count - split_offset;
nkeynes@1133
   213
    poly->vertex_index = parent->vertex_index + split_offset;
nkeynes@1133
   214
    if( parent->mod_vertex_index == -1 ) {
nkeynes@1133
   215
        poly->mod_vertex_index = -1;
nkeynes@1133
   216
    } else {
nkeynes@1133
   217
        poly->mod_vertex_index = parent->mod_vertex_index + split_offset;
nkeynes@1133
   218
    }
nkeynes@1133
   219
    poly->context = parent->context;
nkeynes@1133
   220
    poly->next = NULL;
nkeynes@1133
   221
    poly->sub_next = parent->sub_next;
nkeynes@1133
   222
nkeynes@1133
   223
    parent->sub_next = poly;
nkeynes@1133
   224
    parent->vertex_count = split_offset + 2;
nkeynes@1133
   225
nkeynes@1133
   226
    return poly;
nkeynes@1133
   227
}
nkeynes@1133
   228
nkeynes@1140
   229
static float scene_get_palette_offset( uint32_t tex )
nkeynes@1140
   230
{
nkeynes@1140
   231
    uint32_t fmt = (tex & PVR2_TEX_FORMAT_MASK);
nkeynes@1140
   232
    if( fmt == PVR2_TEX_FORMAT_IDX4 ) {
nkeynes@1140
   233
        return ((float)((tex & 0x07E00000) >> 17))/1024.0 + 0.0002;
nkeynes@1140
   234
    } else if( fmt == PVR2_TEX_FORMAT_IDX8 ) {
nkeynes@1140
   235
        return ((float)((tex & 0x06000000) >> 17))/1024.0 + 0.0002;
nkeynes@1140
   236
    } else {
nkeynes@1140
   237
        return -1.0;
nkeynes@1140
   238
    }
nkeynes@1140
   239
}
nkeynes@1140
   240
nkeynes@1133
   241
/**
nkeynes@635
   242
 * Decode a single PVR2 renderable vertex (opaque/trans/punch-out, but not shadow
nkeynes@635
   243
 * volume)
nkeynes@635
   244
 * @param vert Pointer to output vertex structure
nkeynes@635
   245
 * @param poly1 First word of polygon context (needed to understand vertex)
nkeynes@639
   246
 * @param poly2 Second word of polygon context
nkeynes@635
   247
 * @param pvr2_data Pointer to raw pvr2 vertex data (in VRAM)
nkeynes@635
   248
 * @param modify_offset Offset in 32-bit words to the tex/color data. 0 for
nkeynes@635
   249
 *        the normal vertex, half the vertex length for the modified vertex.
nkeynes@635
   250
 */
nkeynes@827
   251
static void pvr2_decode_render_vertex( struct vertex_struct *vert, uint32_t poly1,
nkeynes@1140
   252
                                       uint32_t poly2, uint32_t tex, uint32_t *pvr2_data,
nkeynes@736
   253
                                       int modify_offset )
nkeynes@635
   254
{
nkeynes@639
   255
    gboolean force_alpha = !POLY2_ALPHA_ENABLE(poly2);
nkeynes@635
   256
    union pvr2_data_type {
nkeynes@687
   257
        uint32_t *ival;
nkeynes@687
   258
        float *fval;
nkeynes@635
   259
    } data;
nkeynes@635
   260
nkeynes@635
   261
    data.ival = pvr2_data;
nkeynes@687
   262
nkeynes@635
   263
    vert->x = *data.fval++;
nkeynes@635
   264
    vert->y = *data.fval++;
nkeynes@635
   265
nkeynes@635
   266
    float z = *data.fval++;
nkeynes@645
   267
    if( !isfinite(z) ) {
nkeynes@687
   268
        z = 0;
nkeynes@648
   269
    } else if( z != 0 ) {
nkeynes@687
   270
        z = 1/z;
nkeynes@645
   271
    }
nkeynes@635
   272
    if( z > pvr2_scene.bounds[5] ) {
nkeynes@687
   273
        pvr2_scene.bounds[5] = z;
nkeynes@635
   274
    } else if( z < pvr2_scene.bounds[4] && z != 0 ) {
nkeynes@687
   275
        pvr2_scene.bounds[4] = z;
nkeynes@635
   276
    }
nkeynes@635
   277
    vert->z = z;
nkeynes@635
   278
    data.ival += modify_offset;
nkeynes@635
   279
nkeynes@687
   280
nkeynes@635
   281
    if( POLY1_TEXTURED(poly1) ) {
nkeynes@687
   282
        if( POLY1_UV16(poly1) ) {
nkeynes@687
   283
            vert->u = halftofloat( *data.ival>>16 );
nkeynes@687
   284
            vert->v = halftofloat( *data.ival );
nkeynes@687
   285
            data.ival++;
nkeynes@687
   286
        } else {
nkeynes@687
   287
            vert->u = *data.fval++;
nkeynes@687
   288
            vert->v = *data.fval++;
nkeynes@687
   289
        }
nkeynes@1139
   290
nkeynes@1139
   291
        switch( POLY2_TEX_BLEND(poly2) ) {
nkeynes@1139
   292
        case 0:/* Convert replace => modulate by setting colour values to 1.0 */
nkeynes@1139
   293
            vert->rgba[0] = vert->rgba[1] = vert->rgba[2] = vert->rgba[3] = 1.0;
nkeynes@1140
   294
            vert->tex_mode = 0.0;
nkeynes@1139
   295
            data.ival++; /* Skip the colour word */
nkeynes@1139
   296
            break;
nkeynes@1140
   297
        case 2: /* Decal */
nkeynes@1140
   298
            vert->tex_mode = 1.0;
nkeynes@1140
   299
            unpack_bgra(*data.ival++, vert->rgba);
nkeynes@1140
   300
            break;
nkeynes@1139
   301
        case 1:
nkeynes@687
   302
            force_alpha = TRUE;
nkeynes@1139
   303
            /* fall-through */
nkeynes@1140
   304
        default:
nkeynes@1140
   305
            vert->tex_mode = 0.0;
nkeynes@1139
   306
            unpack_bgra(*data.ival++, vert->rgba);
nkeynes@1139
   307
            break;
nkeynes@687
   308
        }
nkeynes@1140
   309
        vert->r = scene_get_palette_offset(tex);
nkeynes@1139
   310
    } else {
nkeynes@1140
   311
        vert->tex_mode = 2.0;
nkeynes@1140
   312
        vert->r = -1.0;
nkeynes@1139
   313
        unpack_bgra(*data.ival++, vert->rgba);
nkeynes@635
   314
    }
nkeynes@1139
   315
nkeynes@687
   316
    if( POLY1_SPECULAR(poly1) ) {
nkeynes@687
   317
        unpack_bgra(*data.ival++, vert->offset_rgba);
nkeynes@687
   318
    } else {
nkeynes@687
   319
        vert->offset_rgba[0] = 0.0;
nkeynes@687
   320
        vert->offset_rgba[1] = 0.0;
nkeynes@687
   321
        vert->offset_rgba[2] = 0.0;
nkeynes@827
   322
        vert->offset_rgba[3] = 0.0;
nkeynes@687
   323
    }
nkeynes@687
   324
nkeynes@639
   325
    if( force_alpha ) {
nkeynes@687
   326
        vert->rgba[3] = 1.0;
nkeynes@635
   327
    }
nkeynes@635
   328
}
nkeynes@635
   329
nkeynes@635
   330
/**
nkeynes@687
   331
 * Compute texture, colour, and z values for 1 or more result points by interpolating from
nkeynes@687
   332
 * a set of 3 input points. The result point(s) must define their x,y.
nkeynes@635
   333
 */
nkeynes@827
   334
static void scene_compute_vertexes( struct vertex_struct *result,
nkeynes@687
   335
                                    int result_count,
nkeynes@736
   336
                                    struct vertex_struct *input,
nkeynes@736
   337
                                    gboolean is_solid_shaded )
nkeynes@635
   338
{
nkeynes@687
   339
    int i,j;
nkeynes@635
   340
    float sx = input[2].x - input[1].x;
nkeynes@635
   341
    float sy = input[2].y - input[1].y;
nkeynes@635
   342
    float tx = input[0].x - input[1].x;
nkeynes@635
   343
    float ty = input[0].y - input[1].y;
nkeynes@635
   344
nkeynes@635
   345
    float detxy = ((sy) * (tx)) - ((ty) * (sx));
nkeynes@635
   346
    if( detxy == 0 ) {
nkeynes@827
   347
        // If the input points fall on a line, they don't define a usable
nkeynes@687
   348
        // polygon - the PVR2 takes the last input point as the result in
nkeynes@687
   349
        // this case.
nkeynes@687
   350
        for( i=0; i<result_count; i++ ) {
nkeynes@687
   351
            float x = result[i].x;
nkeynes@687
   352
            float y = result[i].y;
nkeynes@687
   353
            memcpy( &result[i], &input[2], sizeof(struct vertex_struct) );
nkeynes@687
   354
            result[i].x = x;
nkeynes@687
   355
            result[i].y = y;
nkeynes@687
   356
        }
nkeynes@687
   357
        return;
nkeynes@635
   358
    }
nkeynes@635
   359
    float sz = input[2].z - input[1].z;
nkeynes@635
   360
    float tz = input[0].z - input[1].z;
nkeynes@635
   361
    float su = input[2].u - input[1].u;
nkeynes@635
   362
    float tu = input[0].u - input[1].u;
nkeynes@635
   363
    float sv = input[2].v - input[1].v;
nkeynes@635
   364
    float tv = input[0].v - input[1].v;
nkeynes@635
   365
nkeynes@687
   366
    for( i=0; i<result_count; i++ ) {
nkeynes@687
   367
        float t = ((result[i].x - input[1].x) * sy -
nkeynes@687
   368
                (result[i].y - input[1].y) * sx) / detxy;
nkeynes@687
   369
        float s = ((result[i].y - input[1].y) * tx -
nkeynes@687
   370
                (result[i].x - input[1].x) * ty) / detxy;
nkeynes@687
   371
nkeynes@687
   372
        float rz = input[1].z + (t*tz) + (s*sz);
nkeynes@687
   373
        if( rz > pvr2_scene.bounds[5] ) {
nkeynes@687
   374
            pvr2_scene.bounds[5] = rz;
nkeynes@687
   375
        } else if( rz < pvr2_scene.bounds[4] ) {
nkeynes@827
   376
            pvr2_scene.bounds[4] = rz;
nkeynes@687
   377
        }
nkeynes@687
   378
        result[i].z = rz;
nkeynes@687
   379
        result[i].u = input[1].u + (t*tu) + (s*su);
nkeynes@687
   380
        result[i].v = input[1].v + (t*tv) + (s*sv);
nkeynes@1140
   381
        result[i].r = input[1].r; /* Last two components are flat */
nkeynes@1140
   382
        result[i].tex_mode = input[1].tex_mode;
nkeynes@687
   383
nkeynes@687
   384
        if( is_solid_shaded ) {
nkeynes@687
   385
            memcpy( result->rgba, input[2].rgba, sizeof(result->rgba) );
nkeynes@687
   386
            memcpy( result->offset_rgba, input[2].offset_rgba, sizeof(result->offset_rgba) );
nkeynes@687
   387
        } else {
nkeynes@687
   388
            float *rgba0 = input[0].rgba;
nkeynes@687
   389
            float *rgba1 = input[1].rgba;
nkeynes@687
   390
            float *rgba2 = input[2].rgba;
nkeynes@687
   391
            float *rgba3 = result[i].rgba;
nkeynes@687
   392
            for( j=0; j<8; j++ ) {
nkeynes@687
   393
                float tc = *rgba0++ - *rgba1;
nkeynes@687
   394
                float sc = *rgba2++ - *rgba1;
nkeynes@687
   395
                float rc = *rgba1++ + (t*tc) + (s*sc);
nkeynes@687
   396
                *rgba3++ = rc;
nkeynes@687
   397
            }
nkeynes@687
   398
        }
nkeynes@635
   399
    }
nkeynes@653
   400
}
nkeynes@635
   401
nkeynes@847
   402
/**
 * Look up the fog value for one vertex. z*fog_density is clamped to
 * [1.0, 255.9999] and a 7-bit table index is formed from the bits of the
 * resulting float: bits 18-21 become index bits 0-3, bits 23-25 become
 * index bits 4-6.
 * NOTE(review): bit 22 (the top mantissa bit) is not part of the index -
 * confirm that this is intended.
 *
 * @param z Vertex depth value
 * @param fog_density Scale factor applied to z
 * @param fog_table Table with at least 128 entries; column 0 is returned
 */
static float scene_compute_lut_fog_vertex( float z, float fog_density, float fog_table[][2] )
{
    union {
        float f;
        uint32_t i;
    } scaled;
    uint32_t low_bits, high_bits;

    scaled.f = z * fog_density;
    if( scaled.f < 1.0 ) {
        scaled.f = 1.0;
    } else if( scaled.f > 255.9999 ) {
        scaled.f = 255.9999;
    }

    low_bits = (scaled.i >> 18) & 0x0F;
    high_bits = (scaled.i >> 19) & 0x70;
    return fog_table[low_bits | high_bits][0];
}
nkeynes@847
   415
nkeynes@847
   416
/**
nkeynes@847
   417
 * Compute the fog coefficients for all polygons using lookup-table fog. It's 
nkeynes@847
   418
 * a little more convenient to do this as a separate pass, since we don't have
nkeynes@847
   419
 * to worry about computed vertexes.
nkeynes@847
   420
 */
nkeynes@847
   421
static void scene_compute_lut_fog( )
nkeynes@847
   422
{
nkeynes@847
   423
    int i,j;
nkeynes@847
   424
nkeynes@847
   425
    float fog_density = parse_fog_density(MMIO_READ( PVR2, RENDER_FOGCOEFF ));
nkeynes@847
   426
    float fog_table[128][2];
nkeynes@847
   427
    
nkeynes@847
   428
    /* Parse fog table out into floating-point format */
nkeynes@847
   429
    for( i=0; i<128; i++ ) {
nkeynes@847
   430
        uint32_t ent = MMIO_READ( PVR2, RENDER_FOGTABLE + (i<<2) );
nkeynes@847
   431
        fog_table[i][0] = ((float)(((ent&0x0000FF00)>>8) + 1)) / 256.0;
nkeynes@847
   432
        fog_table[i][1] = ((float)((ent&0x000000FF) + 1)) / 256.0;
nkeynes@847
   433
    }
nkeynes@847
   434
    
nkeynes@847
   435
    
nkeynes@847
   436
    for( i=0; i<pvr2_scene.poly_count; i++ ) {
nkeynes@847
   437
        int mode = POLY2_FOG_MODE(pvr2_scene.poly_array[i].context[1]);
nkeynes@1132
   438
        uint32_t index = pvr2_scene.poly_array[i].vertex_index;
nkeynes@847
   439
        if( mode == PVR2_POLY_FOG_LOOKUP ) {
nkeynes@1132
   440
            for( j=0; j<pvr2_scene.poly_array[i].vertex_count; j++ ) {
nkeynes@847
   441
                pvr2_scene.vertex_array[index+j].offset_rgba[3] = 
nkeynes@847
   442
                    scene_compute_lut_fog_vertex( pvr2_scene.vertex_array[index+j].z, fog_density, fog_table );
nkeynes@847
   443
            }
nkeynes@847
   444
        } else if( mode == PVR2_POLY_FOG_LOOKUP2 ) {
nkeynes@1132
   445
            for( j=0; j<pvr2_scene.poly_array[i].vertex_count; j++ ) {
nkeynes@847
   446
                pvr2_scene.vertex_array[index+j].rgba[0] = pvr2_scene.fog_lut_colour[0];
nkeynes@847
   447
                pvr2_scene.vertex_array[index+j].rgba[1] = pvr2_scene.fog_lut_colour[1];
nkeynes@847
   448
                pvr2_scene.vertex_array[index+j].rgba[2] = pvr2_scene.fog_lut_colour[2];
nkeynes@847
   449
                pvr2_scene.vertex_array[index+j].rgba[3] = 
nkeynes@847
   450
                    scene_compute_lut_fog_vertex( pvr2_scene.vertex_array[index+j].z, fog_density, fog_table );
nkeynes@1132
   451
                pvr2_scene.vertex_array[index+j].offset_rgba[3] = 0;
nkeynes@1132
   452
            }
nkeynes@1132
   453
        } else if( mode == PVR2_POLY_FOG_DISABLED ) {
nkeynes@1132
   454
            for( j=0; j<pvr2_scene.poly_array[i].vertex_count; j++ ) {
nkeynes@1132
   455
                pvr2_scene.vertex_array[index+j].offset_rgba[3] = 0;
nkeynes@847
   456
            }
nkeynes@847
   457
        }
nkeynes@635
   458
    }    
nkeynes@847
   459
}
nkeynes@635
   460
nkeynes@1133
   461
/**
nkeynes@1133
   462
 * Manually cull back-facing polygons where we can - this actually saves
nkeynes@1133
   463
 * us a lot of time vs passing everything to GL to do it.
nkeynes@1133
   464
 */
nkeynes@1133
   465
static void scene_backface_cull()
nkeynes@1133
   466
{
nkeynes@1133
   467
    unsigned poly_idx;
nkeynes@1133
   468
    unsigned poly_count = pvr2_scene.poly_count; /* Note: we don't want to process any sub-polygons created here */
nkeynes@1133
   469
    for( poly_idx = 0; poly_idx<poly_count; poly_idx++ ) {
nkeynes@1133
   470
        uint32_t poly1 = pvr2_scene.poly_array[poly_idx].context[0];
nkeynes@1133
   471
        if( POLY1_CULL_ENABLE(poly1) ) {
nkeynes@1133
   472
            struct polygon_struct *poly = &pvr2_scene.poly_array[poly_idx];
nkeynes@1133
   473
            unsigned vert_idx = poly->vertex_index;
nkeynes@1133
   474
            unsigned tri_count = poly->vertex_count-2;
nkeynes@1133
   475
            struct vertex_struct *vert = &pvr2_scene.vertex_array[vert_idx];
nkeynes@1133
   476
            unsigned i;
nkeynes@1133
   477
            gboolean ccw = (POLY1_CULL_MODE(poly1) == CULL_CCW);
nkeynes@1133
   478
            int first_visible = -1, last_visible = -1;
nkeynes@1133
   479
            for( i=0; i<tri_count; i++ ) {
nkeynes@1133
   480
                float ux = vert[i+1].x - vert[i].x;
nkeynes@1133
   481
                float uy = vert[i+1].y - vert[i].y;
nkeynes@1133
   482
                float vx = vert[i+2].x - vert[i].x;
nkeynes@1133
   483
                float vy = vert[i+2].y - vert[i].y;
nkeynes@1133
   484
                float nz = (ux*vy) - (uy*vx);
nkeynes@1133
   485
                if( ccw ? nz > 0 : nz < 0 ) {
nkeynes@1133
   486
                    /* Surface is visible */
nkeynes@1133
   487
                    if( first_visible == -1 ) {
nkeynes@1133
   488
                        first_visible = i;
nkeynes@1133
   489
                        /* Elide the initial hidden triangles (note we don't
nkeynes@1133
   490
                         * need to care about winding anymore here) */
nkeynes@1133
   491
                        poly->vertex_index += i;
nkeynes@1133
   492
                        poly->vertex_count -= i;
nkeynes@1133
   493
                        if( poly->mod_vertex_index != -1 )
nkeynes@1133
   494
                            poly->mod_vertex_index += i;
nkeynes@1133
   495
                    } else if( last_visible != i-1 ) {
nkeynes@1133
   496
                        /* And... here we have to split the polygon. Allocate a new
nkeynes@1133
   497
                         * sub-polygon to hold the vertex references */
nkeynes@1133
   498
                        struct polygon_struct *sub = scene_split_subpolygon(poly, (i-first_visible));
nkeynes@1133
   499
                        poly->vertex_count -= (i-first_visible-1) - last_visible;
nkeynes@1133
   500
                        first_visible = i;
nkeynes@1133
   501
                        poly = sub;
nkeynes@1133
   502
                    }
nkeynes@1133
   503
                    last_visible = i;
nkeynes@1133
   504
                } /* Else culled */
nkeynes@1133
   505
                /* Invert ccw flag for triangle strip processing */
nkeynes@1133
   506
                ccw = !ccw;
nkeynes@1133
   507
            }
nkeynes@1133
   508
            if( last_visible == -1 ) {
nkeynes@1133
   509
                /* No visible surfaces, so we can mark the whole polygon as being vertex-less */
nkeynes@1133
   510
                poly->vertex_count = 0;
nkeynes@1133
   511
            } else if( last_visible != tri_count-1 ) {
nkeynes@1133
   512
                /* Remove final hidden tris */
nkeynes@1133
   513
                poly->vertex_count -= (tri_count - 1 - last_visible);
nkeynes@1133
   514
            }
nkeynes@1133
   515
        }
nkeynes@1133
   516
    }
nkeynes@1133
   517
}
nkeynes@1133
   518
nkeynes@863
   519
static void scene_add_cheap_shadow_vertexes( struct vertex_struct *src, struct vertex_struct *dest, int count )
nkeynes@863
   520
{
nkeynes@863
   521
    unsigned int i, j;
nkeynes@863
   522
    
nkeynes@863
   523
    for( i=0; i<count; i++ ) {
nkeynes@863
   524
        dest->x = src->x;
nkeynes@863
   525
        dest->y = src->y;
nkeynes@863
   526
        dest->z = src->z;
nkeynes@863
   527
        dest->u = src->u;
nkeynes@863
   528
        dest->v = src->v;
nkeynes@1140
   529
        dest->r = src->r;
nkeynes@1140
   530
        dest->tex_mode = src->tex_mode;
nkeynes@863
   531
        dest->rgba[0] = src->rgba[0] * scene_shadow_intensity;
nkeynes@863
   532
        dest->rgba[1] = src->rgba[1] * scene_shadow_intensity;
nkeynes@863
   533
        dest->rgba[2] = src->rgba[2] * scene_shadow_intensity;
nkeynes@863
   534
        dest->rgba[3] = src->rgba[3] * scene_shadow_intensity;
nkeynes@863
   535
        dest->offset_rgba[0] = src->offset_rgba[0] * scene_shadow_intensity;
nkeynes@863
   536
        dest->offset_rgba[1] = src->offset_rgba[1] * scene_shadow_intensity;
nkeynes@863
   537
        dest->offset_rgba[2] = src->offset_rgba[2] * scene_shadow_intensity;
nkeynes@863
   538
        dest->offset_rgba[3] = src->offset_rgba[3];
nkeynes@863
   539
        dest++;
nkeynes@863
   540
        src++;
nkeynes@863
   541
    }
nkeynes@635
   542
}
nkeynes@635
   543
nkeynes@639
   544
static void scene_add_vertexes( pvraddr_t poly_idx, int vertex_length,
nkeynes@863
   545
                                shadow_mode_t is_modified )
nkeynes@635
   546
{
nkeynes@635
   547
    struct polygon_struct *poly = pvr2_scene.buf_to_poly_map[poly_idx];
nkeynes@635
   548
    uint32_t *ptr = &pvr2_scene.pvr2_pbuf[poly_idx];
nkeynes@635
   549
    uint32_t *context = ptr;
nkeynes@635
   550
    unsigned int i;
nkeynes@635
   551
nkeynes@635
   552
    if( poly->vertex_index == -1 ) {
nkeynes@863
   553
        ptr += (is_modified == SHADOW_FULL ? 5 : 3 );
nkeynes@687
   554
        poly->vertex_index = pvr2_scene.vertex_index;
nkeynes@687
   555
nkeynes@687
   556
        assert( poly != NULL );
nkeynes@687
   557
        assert( pvr2_scene.vertex_index + poly->vertex_count <= pvr2_scene.vertex_count );
nkeynes@687
   558
        for( i=0; i<poly->vertex_count; i++ ) {
nkeynes@1140
   559
            pvr2_decode_render_vertex( &pvr2_scene.vertex_array[pvr2_scene.vertex_index++], context[0], context[1], context[2], ptr, 0 );
nkeynes@687
   560
            ptr += vertex_length;
nkeynes@687
   561
        }
nkeynes@687
   562
        if( is_modified ) {
nkeynes@687
   563
            assert( pvr2_scene.vertex_index + poly->vertex_count <= pvr2_scene.vertex_count );
nkeynes@687
   564
            poly->mod_vertex_index = pvr2_scene.vertex_index;
nkeynes@863
   565
            if( is_modified == SHADOW_FULL ) {
nkeynes@863
   566
                int mod_offset = (vertex_length - 3)>>1;
nkeynes@863
   567
                ptr = &pvr2_scene.pvr2_pbuf[poly_idx] + 5;
nkeynes@863
   568
                for( i=0; i<poly->vertex_count; i++ ) {
nkeynes@1140
   569
                    pvr2_decode_render_vertex( &pvr2_scene.vertex_array[pvr2_scene.vertex_index++], context[0], context[3], context[4], ptr, mod_offset );
nkeynes@863
   570
                    ptr += vertex_length;
nkeynes@863
   571
                }
nkeynes@863
   572
            } else {
nkeynes@863
   573
                scene_add_cheap_shadow_vertexes( &pvr2_scene.vertex_array[poly->vertex_index], 
nkeynes@863
   574
                        &pvr2_scene.vertex_array[poly->mod_vertex_index], poly->vertex_count );
nkeynes@863
   575
                pvr2_scene.vertex_index += poly->vertex_count;
nkeynes@687
   576
            }
nkeynes@687
   577
        }
nkeynes@635
   578
    }
nkeynes@635
   579
}
nkeynes@635
   580
nkeynes@827
   581
static void scene_add_quad_vertexes( pvraddr_t poly_idx, int vertex_length,
nkeynes@863
   582
                                     shadow_mode_t is_modified )
nkeynes@635
   583
{
nkeynes@635
   584
    struct polygon_struct *poly = pvr2_scene.buf_to_poly_map[poly_idx];
nkeynes@635
   585
    uint32_t *ptr = &pvr2_scene.pvr2_pbuf[poly_idx];
nkeynes@635
   586
    uint32_t *context = ptr;
nkeynes@635
   587
    unsigned int i;
nkeynes@635
   588
nkeynes@635
   589
    if( poly->vertex_index == -1 ) {
nkeynes@827
   590
        // Construct it locally and copy to the vertex buffer, as the VBO is
nkeynes@736
   591
        // allowed to be horribly slow for reads (ie it could be direct-mapped
nkeynes@736
   592
        // vram).
nkeynes@736
   593
        struct vertex_struct quad[4];
nkeynes@736
   594
nkeynes@736
   595
        assert( poly != NULL );
nkeynes@736
   596
        assert( pvr2_scene.vertex_index + poly->vertex_count <= pvr2_scene.vertex_count );
nkeynes@863
   597
        ptr += (is_modified == SHADOW_FULL ? 5 : 3 );
nkeynes@736
   598
        poly->vertex_index = pvr2_scene.vertex_index;
nkeynes@736
   599
        for( i=0; i<4; i++ ) {
nkeynes@1140
   600
            pvr2_decode_render_vertex( &quad[i], context[0], context[1], context[2], ptr, 0 );
nkeynes@736
   601
            ptr += vertex_length;
nkeynes@736
   602
        }
nkeynes@687
   603
        scene_compute_vertexes( &quad[3], 1, &quad[0], !POLY1_GOURAUD_SHADED(context[0]) );
nkeynes@736
   604
        // Swap last two vertexes (quad arrangement => tri strip arrangement)
nkeynes@736
   605
        memcpy( &pvr2_scene.vertex_array[pvr2_scene.vertex_index], quad, sizeof(struct vertex_struct)*2 );
nkeynes@736
   606
        memcpy( &pvr2_scene.vertex_array[pvr2_scene.vertex_index+2], &quad[3], sizeof(struct vertex_struct) );
nkeynes@736
   607
        memcpy( &pvr2_scene.vertex_array[pvr2_scene.vertex_index+3], &quad[2], sizeof(struct vertex_struct) );
nkeynes@736
   608
        pvr2_scene.vertex_index += 4;
nkeynes@736
   609
nkeynes@736
   610
        if( is_modified ) {
nkeynes@736
   611
            assert( pvr2_scene.vertex_index + poly->vertex_count <= pvr2_scene.vertex_count );
nkeynes@736
   612
            poly->mod_vertex_index = pvr2_scene.vertex_index;
nkeynes@863
   613
            if( is_modified == SHADOW_FULL ) {
nkeynes@863
   614
                int mod_offset = (vertex_length - 3)>>1;
nkeynes@863
   615
                ptr = &pvr2_scene.pvr2_pbuf[poly_idx] + 5;
nkeynes@863
   616
                for( i=0; i<4; i++ ) {
nkeynes@1140
   617
                    pvr2_decode_render_vertex( &quad[4], context[0], context[3], context[4], ptr, mod_offset );
nkeynes@863
   618
                    ptr += vertex_length;
nkeynes@863
   619
                }
nkeynes@863
   620
                scene_compute_vertexes( &quad[3], 1, &quad[0], !POLY1_GOURAUD_SHADED(context[0]) );
nkeynes@863
   621
                memcpy( &pvr2_scene.vertex_array[pvr2_scene.vertex_index], quad, sizeof(struct vertex_struct)*2 );
nkeynes@863
   622
                memcpy( &pvr2_scene.vertex_array[pvr2_scene.vertex_index+2], &quad[3], sizeof(struct vertex_struct) );
nkeynes@863
   623
                memcpy( &pvr2_scene.vertex_array[pvr2_scene.vertex_index+3], &quad[2], sizeof(struct vertex_struct) );
nkeynes@863
   624
            } else {
nkeynes@863
   625
                scene_add_cheap_shadow_vertexes( &pvr2_scene.vertex_array[poly->vertex_index], 
nkeynes@863
   626
                        &pvr2_scene.vertex_array[poly->mod_vertex_index], poly->vertex_count );
nkeynes@863
   627
                pvr2_scene.vertex_index += poly->vertex_count;
nkeynes@736
   628
            }
nkeynes@736
   629
            pvr2_scene.vertex_index += 4;
nkeynes@736
   630
        }
nkeynes@635
   631
    }
nkeynes@635
   632
}
nkeynes@635
   633
nkeynes@639
   634
/**
 * Pass-1 walk of one tile object list: register every polygon the list
 * references via scene_add_polygon(), following link entries until the
 * end-of-list entry is reached.
 *
 * @param tile_entry byte offset of the list within pvr2_main_ram
 */
static void scene_extract_polygons( pvraddr_t tile_entry )
{
    uint32_t *list_ptr = (uint32_t *)(pvr2_main_ram+tile_entry);

    for(;;) {
        uint32_t entry = *list_ptr++;
        uint32_t tag = entry >> 28;

        if( tag == 0x0F ) {
            /* End of list */
            return;
        }
        if( tag == 0x0E ) {
            /* Link: continue reading from another location */
            list_ptr = (uint32_t *)(pvr2_main_ram + (entry&0x007FFFFF));
            continue;
        }

        pvraddr_t polyaddr = entry&0x000FFFFF;
        shadow_mode_t is_modified = SHADOW_NONE;
        if( entry & 0x01000000 ) {
            is_modified = pvr2_scene.shadow_mode;
        }

        /* Full shadow mode carries two extra context words and doubles the
         * per-vertex payload; every vertex also has 3 fixed words. */
        int context_length = 3;
        int vertex_length = (entry >> 21) & 0x07;
        if( is_modified == SHADOW_FULL ) {
            context_length = 5;
            vertex_length *= 2;
        }
        vertex_length += 3;

        uint32_t kind = entry & 0xE0000000;
        if( kind == 0x80000000 || kind == 0xA0000000 ) {
            /* Triangle(s) have 3 vertexes each, sprite(s) have 4 */
            int corners = (kind == 0x80000000) ? 3 : 4;
            int polygon_length = corners * vertex_length + context_length;
            int remaining = ((entry >> 25) & 0x0F)+1;
            struct polygon_struct *prev = NULL;

            while( remaining-- > 0 ) {
                struct polygon_struct *poly = scene_add_polygon( polyaddr, corners, is_modified );
                polyaddr += polygon_length;
                /* Chain consecutive polygons, without overwriting a link
                 * that is already set */
                if( prev != NULL && prev->next == NULL ) {
                    prev->next = poly;
                }
                prev = poly;
            }
        } else {
            /* Polygon: scan the six flag bits starting from 0x02000000 and
             * stop at the first one that is set */
            int top = 5;
            while( top >= 0 && !(entry & (0x40000000>>top)) ) {
                top--;
            }
            if( top >= 0 ) {
                scene_add_polygon( polyaddr, top+3, is_modified );
            }
        }
    }
}
nkeynes@635
   698
nkeynes@639
   699
/**
 * Pass-2 walk of one tile object list: for every polygon the list
 * references, emit its vertex data through scene_add_vertexes() or
 * scene_add_quad_vertexes(). Link entries are followed; the walk stops at
 * the end-of-list entry.
 *
 * @param tile_entry byte offset of the list within pvr2_main_ram
 */
static void scene_extract_vertexes( pvraddr_t tile_entry )
{
    uint32_t *list_ptr = (uint32_t *)(pvr2_main_ram+tile_entry);

    for(;;) {
        uint32_t entry = *list_ptr++;

        if( entry >> 28 == 0x0F ) {
            /* End of list */
            return;
        }
        if( entry >> 28 == 0x0E ) {
            /* Link: continue reading from another location */
            list_ptr = (uint32_t *)(pvr2_main_ram + (entry&0x007FFFFF));
            continue;
        }

        pvraddr_t polyaddr = entry&0x000FFFFF;
        shadow_mode_t is_modified = (entry & 0x01000000) ? pvr2_scene.shadow_mode : SHADOW_NONE;
        int has_full_shadow = (is_modified == SHADOW_FULL);
        int context_length = has_full_shadow ? 5 : 3;
        int vertex_length = (entry >> 21) & 0x07;
        int polygon_length, count;

        if( has_full_shadow ) {
            vertex_length += vertex_length;
        }
        vertex_length += 3;

        switch( entry & 0xE0000000 ) {
        case 0x80000000:
            /* Triangle(s) */
            polygon_length = 3 * vertex_length + context_length;
            for( count = ((entry >> 25) & 0x0F)+1; count > 0; count-- ) {
                scene_add_vertexes( polyaddr, vertex_length, is_modified );
                polyaddr += polygon_length;
            }
            break;
        case 0xA0000000:
            /* Sprite(s) */
            polygon_length = 4 * vertex_length + context_length;
            for( count = ((entry >> 25) & 0x0F)+1; count > 0; count-- ) {
                scene_add_quad_vertexes( polyaddr, vertex_length, is_modified );
                polyaddr += polygon_length;
            }
            break;
        default:
            /* Polygon: only emitted when at least one of the six flag bits
             * (0x40000000 down to 0x02000000) is set */
            if( (entry & 0x7E000000) != 0 ) {
                scene_add_vertexes( polyaddr, vertex_length, is_modified );
            }
            break;
        }
    }
}
nkeynes@635
   753
nkeynes@687
   754
static void scene_extract_background( void )
nkeynes@687
   755
{
nkeynes@687
   756
    uint32_t bgplane = MMIO_READ(PVR2, RENDER_BGPLANE);
nkeynes@687
   757
    int vertex_length = (bgplane >> 24) & 0x07;
nkeynes@687
   758
    int context_length = 3, i;
nkeynes@863
   759
    shadow_mode_t is_modified = (bgplane & 0x08000000) ? pvr2_scene.shadow_mode : SHADOW_NONE;
nkeynes@687
   760
nkeynes@687
   761
    struct polygon_struct *poly = &pvr2_scene.poly_array[pvr2_scene.poly_count++];
nkeynes@687
   762
    uint32_t *context = &pvr2_scene.pvr2_pbuf[(bgplane & 0x00FFFFFF)>>3];
nkeynes@687
   763
    poly->context = context;
nkeynes@687
   764
    poly->vertex_count = 4;
nkeynes@687
   765
    poly->vertex_index = pvr2_scene.vertex_count;
nkeynes@863
   766
    if( is_modified == SHADOW_FULL ) {
nkeynes@687
   767
        context_length = 5;
nkeynes@687
   768
        vertex_length <<= 1;
nkeynes@863
   769
    }
nkeynes@863
   770
    if( is_modified != SHADOW_NONE ) {
nkeynes@687
   771
        poly->mod_vertex_index = pvr2_scene.vertex_count + 4;
nkeynes@827
   772
        pvr2_scene.vertex_count += 8;
nkeynes@687
   773
    } else {
nkeynes@687
   774
        poly->mod_vertex_index = -1;
nkeynes@687
   775
        pvr2_scene.vertex_count += 4;
nkeynes@687
   776
    }
nkeynes@687
   777
    vertex_length += 3;
nkeynes@687
   778
    context_length += (bgplane & 0x07) * vertex_length;
nkeynes@687
   779
nkeynes@687
   780
    poly->next = NULL;
nkeynes@1133
   781
    poly->sub_next = NULL;
nkeynes@687
   782
    pvr2_scene.bkgnd_poly = poly;
nkeynes@736
   783
nkeynes@687
   784
    struct vertex_struct base_vertexes[3];
nkeynes@827
   785
    uint32_t *ptr = context + context_length;
nkeynes@687
   786
    for( i=0; i<3; i++ ) {
nkeynes@1140
   787
        pvr2_decode_render_vertex( &base_vertexes[i], context[0], context[1], context[2],
nkeynes@736
   788
                ptr, 0 );
nkeynes@687
   789
        ptr += vertex_length;
nkeynes@687
   790
    }
nkeynes@687
   791
    struct vertex_struct *result_vertexes = &pvr2_scene.vertex_array[poly->vertex_index];
nkeynes@687
   792
    result_vertexes[0].x = result_vertexes[0].y = 0;
nkeynes@687
   793
    result_vertexes[1].x = result_vertexes[3].x = pvr2_scene.buffer_width;
nkeynes@687
   794
    result_vertexes[1].y = result_vertexes[2].x = 0;
nkeynes@687
   795
    result_vertexes[2].y = result_vertexes[3].y  = pvr2_scene.buffer_height;
nkeynes@687
   796
    scene_compute_vertexes( result_vertexes, 4, base_vertexes, !POLY1_GOURAUD_SHADED(context[0]) );
nkeynes@687
   797
nkeynes@863
   798
    if( is_modified == SHADOW_FULL ) {
nkeynes@687
   799
        int mod_offset = (vertex_length - 3)>>1;
nkeynes@687
   800
        ptr = context + context_length;
nkeynes@687
   801
        for( i=0; i<3; i++ ) {
nkeynes@1140
   802
            pvr2_decode_render_vertex( &base_vertexes[i], context[0], context[3], context[4],
nkeynes@736
   803
                    ptr, mod_offset );
nkeynes@687
   804
            ptr += vertex_length;
nkeynes@687
   805
        }
nkeynes@687
   806
        result_vertexes = &pvr2_scene.vertex_array[poly->mod_vertex_index];
nkeynes@687
   807
        result_vertexes[0].x = result_vertexes[0].y = 0;
nkeynes@687
   808
        result_vertexes[1].x = result_vertexes[3].x = pvr2_scene.buffer_width;
nkeynes@687
   809
        result_vertexes[1].y = result_vertexes[2].x = 0;
nkeynes@687
   810
        result_vertexes[2].y = result_vertexes[3].y  = pvr2_scene.buffer_height;
nkeynes@687
   811
        scene_compute_vertexes( result_vertexes, 4, base_vertexes, !POLY1_GOURAUD_SHADED(context[0]) );
nkeynes@863
   812
    } else if( is_modified == SHADOW_CHEAP ) {
nkeynes@863
   813
        scene_add_cheap_shadow_vertexes( &pvr2_scene.vertex_array[poly->vertex_index], 
nkeynes@863
   814
                &pvr2_scene.vertex_array[poly->mod_vertex_index], poly->vertex_count );
nkeynes@863
   815
        pvr2_scene.vertex_index += poly->vertex_count;
nkeynes@687
   816
    }
nkeynes@736
   817
nkeynes@687
   818
}
nkeynes@687
   819
nkeynes@687
   820
nkeynes@639
   821
uint32_t pvr2_scene_buffer_width()
nkeynes@639
   822
{
nkeynes@639
   823
    return pvr2_scene.buffer_width;
nkeynes@639
   824
}
nkeynes@639
   825
nkeynes@639
   826
uint32_t pvr2_scene_buffer_height()
nkeynes@639
   827
{
nkeynes@639
   828
    return pvr2_scene.buffer_height;
nkeynes@639
   829
}
nkeynes@639
   830
nkeynes@635
   831
/**
nkeynes@635
   832
 * Extract the current scene into the rendering structures. We run two passes
nkeynes@827
   833
 * - first pass extracts the polygons into pvr2_scene.poly_array (finding vertex counts),
nkeynes@635
   834
 * second pass extracts the vertex data into the VBO/vertex array.
nkeynes@635
   835
 *
nkeynes@827
   836
 * Difficult to do in single pass as we don't generally know the size of a
nkeynes@635
   837
 * polygon for certain until we've seen all tiles containing it. It also means we
nkeynes@635
   838
 * can count the vertexes and allocate the appropriate size VBO.
nkeynes@635
   839
 *
nkeynes@635
   840
 * FIXME: accesses into VRAM need to be bounds-checked properly
nkeynes@635
   841
 */
nkeynes@635
   842
void pvr2_scene_read( void )
nkeynes@635
   843
{
nkeynes@635
   844
    pvr2_scene_init();
nkeynes@639
   845
    pvr2_scene_reset();
nkeynes@635
   846
nkeynes@635
   847
    pvr2_scene.bounds[0] = MMIO_READ( PVR2, RENDER_HCLIP ) & 0x03FF;
nkeynes@635
   848
    pvr2_scene.bounds[1] = ((MMIO_READ( PVR2, RENDER_HCLIP ) >> 16) & 0x03FF) + 1;
nkeynes@635
   849
    pvr2_scene.bounds[2] = MMIO_READ( PVR2, RENDER_VCLIP ) & 0x03FF;
nkeynes@635
   850
    pvr2_scene.bounds[3] = ((MMIO_READ( PVR2, RENDER_VCLIP ) >> 16) & 0x03FF) + 1;
nkeynes@635
   851
    pvr2_scene.bounds[4] = pvr2_scene.bounds[5] = MMIO_READF( PVR2, RENDER_FARCLIP );
nkeynes@635
   852
nkeynes@827
   853
    uint32_t scaler = MMIO_READ( PVR2, RENDER_SCALER );
nkeynes@827
   854
    if( scaler & SCALER_HSCALE ) {
nkeynes@827
   855
    	/* If the horizontal scaler is in use, we're (in principle) supposed to
nkeynes@827
   856
    	 * divide everything by 2. However in the interests of display quality,
nkeynes@827
   857
    	 * instead we want to render to the unscaled resolution and downsample
nkeynes@827
   858
    	 * only if/when required.
nkeynes@827
   859
    	 */
nkeynes@827
   860
    	pvr2_scene.bounds[1] *= 2;
nkeynes@827
   861
    }
nkeynes@847
   862
    
nkeynes@847
   863
    uint32_t fog_col = MMIO_READ( PVR2, RENDER_FOGTBLCOL );
nkeynes@847
   864
    unpack_bgra( fog_col, pvr2_scene.fog_lut_colour );
nkeynes@847
   865
    fog_col = MMIO_READ( PVR2, RENDER_FOGVRTCOL );
nkeynes@847
   866
    unpack_bgra( fog_col, pvr2_scene.fog_vert_colour );
nkeynes@847
   867
    
nkeynes@934
   868
    uint32_t *tilebuffer = (uint32_t *)(pvr2_main_ram + MMIO_READ( PVR2, RENDER_TILEBASE ));
nkeynes@635
   869
    uint32_t *segment = tilebuffer;
nkeynes@863
   870
    uint32_t shadow = MMIO_READ(PVR2,RENDER_SHADOW);
nkeynes@635
   871
    pvr2_scene.segment_list = (struct tile_segment *)tilebuffer;
nkeynes@934
   872
    pvr2_scene.pvr2_pbuf = (uint32_t *)(pvr2_main_ram + MMIO_READ(PVR2,RENDER_POLYBASE));
nkeynes@863
   873
    pvr2_scene.shadow_mode = shadow & 0x100 ? SHADOW_CHEAP : SHADOW_FULL;
nkeynes@863
   874
    scene_shadow_intensity = U8TOFLOAT(shadow&0xFF);
nkeynes@687
   875
nkeynes@635
   876
    int max_tile_x = 0;
nkeynes@635
   877
    int max_tile_y = 0;
nkeynes@635
   878
    int obj_config = MMIO_READ( PVR2, RENDER_OBJCFG );
nkeynes@635
   879
    int isp_config = MMIO_READ( PVR2, RENDER_ISPCFG );
nkeynes@635
   880
nkeynes@635
   881
    if( (obj_config & 0x00200000) == 0 ) {
nkeynes@687
   882
        if( isp_config & 1 ) {
nkeynes@687
   883
            pvr2_scene.sort_mode = SORT_NEVER;
nkeynes@687
   884
        } else {
nkeynes@687
   885
            pvr2_scene.sort_mode = SORT_ALWAYS;
nkeynes@687
   886
        }
nkeynes@635
   887
    } else {
nkeynes@687
   888
        pvr2_scene.sort_mode = SORT_TILEFLAG;
nkeynes@635
   889
    }
nkeynes@635
   890
nkeynes@827
   891
    // Pass 1: Extract polygon list
nkeynes@635
   892
    uint32_t control;
nkeynes@635
   893
    int i;
nkeynes@635
   894
    do {
nkeynes@687
   895
        control = *segment++;
nkeynes@687
   896
        int tile_x = SEGMENT_X(control);
nkeynes@687
   897
        int tile_y = SEGMENT_Y(control);
nkeynes@687
   898
        if( tile_x > max_tile_x ) {
nkeynes@687
   899
            max_tile_x = tile_x;
nkeynes@827
   900
        }
nkeynes@687
   901
        if( tile_y > max_tile_y ) {
nkeynes@687
   902
            max_tile_y = tile_y;
nkeynes@687
   903
        }
nkeynes@687
   904
        for( i=0; i<5; i++ ) {
nkeynes@687
   905
            if( (*segment & NO_POINTER) == 0 ) {
nkeynes@687
   906
                scene_extract_polygons( *segment );
nkeynes@687
   907
            }
nkeynes@687
   908
            segment++;
nkeynes@687
   909
        }
nkeynes@635
   910
    } while( (control & SEGMENT_END) == 0 );
nkeynes@635
   911
nkeynes@635
   912
    pvr2_scene.buffer_width = (max_tile_x+1)<<5;
nkeynes@635
   913
    pvr2_scene.buffer_height = (max_tile_y+1)<<5;
nkeynes@635
   914
nkeynes@687
   915
    // Pass 2: Extract vertex data
nkeynes@687
   916
    vertex_buffer_map();
nkeynes@687
   917
    pvr2_scene.vertex_index = 0;
nkeynes@687
   918
    segment = tilebuffer;
nkeynes@687
   919
    do {
nkeynes@687
   920
        control = *segment++;
nkeynes@687
   921
        for( i=0; i<5; i++ ) {
nkeynes@687
   922
            if( (*segment & NO_POINTER) == 0 ) {
nkeynes@687
   923
                scene_extract_vertexes( *segment );
nkeynes@687
   924
            }
nkeynes@687
   925
            segment++;
nkeynes@687
   926
        }
nkeynes@687
   927
    } while( (control & SEGMENT_END) == 0 );
nkeynes@736
   928
nkeynes@687
   929
    scene_extract_background();
nkeynes@847
   930
    scene_compute_lut_fog();
nkeynes@1133
   931
    scene_backface_cull();
nkeynes@736
   932
nkeynes@687
   933
    vertex_buffer_unmap();
nkeynes@635
   934
}
nkeynes@645
   935
nkeynes@645
   936
/**
nkeynes@645
   937
 * Dump the current scene to file in a (mostly) human readable form
nkeynes@645
   938
 */
nkeynes@1142
   939
void pvr2_scene_print( FILE *f )
nkeynes@645
   940
{
nkeynes@645
   941
    int i,j;
nkeynes@645
   942
nkeynes@645
   943
    fprintf( f, "Polygons: %d\n", pvr2_scene.poly_count );
nkeynes@645
   944
    for( i=0; i<pvr2_scene.poly_count; i++ ) {
nkeynes@736
   945
        struct polygon_struct *poly = &pvr2_scene.poly_array[i];
nkeynes@1074
   946
        fprintf( f, "  %08X ", (uint32_t)(((unsigned char *)poly->context) - pvr2_main_ram) );
nkeynes@736
   947
        switch( poly->vertex_count ) {
nkeynes@736
   948
        case 3: fprintf( f, "Tri     " ); break;
nkeynes@736
   949
        case 4: fprintf( f, "Quad    " ); break;
nkeynes@736
   950
        default: fprintf( f,"%d-Strip ", poly->vertex_count-2 ); break;
nkeynes@736
   951
        }
nkeynes@736
   952
        fprintf( f, "%08X %08X %08X ", poly->context[0], poly->context[1], poly->context[2] );
nkeynes@736
   953
        if( poly->mod_vertex_index != -1 ) {
nkeynes@736
   954
            fprintf( f, "%08X %08X\n", poly->context[3], poly->context[5] );
nkeynes@736
   955
        } else {
nkeynes@736
   956
            fprintf( f, "\n" );
nkeynes@736
   957
        }
nkeynes@736
   958
nkeynes@736
   959
        for( j=0; j<poly->vertex_count; j++ ) {
nkeynes@736
   960
            struct vertex_struct *v = &pvr2_scene.vertex_array[poly->vertex_index+j];
nkeynes@784
   961
            fprintf( f, "    %.5f %.5f %.5f, (%.5f,%.5f)  %.5f,%.5f,%.5f,%.5f  %.5f %.5f %.5f %.5f\n", v->x, v->y, v->z, v->u, v->v,
nkeynes@827
   962
                     v->rgba[0], v->rgba[1], v->rgba[2], v->rgba[3],
nkeynes@784
   963
                     v->offset_rgba[0], v->offset_rgba[1], v->offset_rgba[2], v->offset_rgba[3] );
nkeynes@736
   964
        }
nkeynes@736
   965
        if( poly->mod_vertex_index != -1 ) {
nkeynes@736
   966
            fprintf( f, "  ---\n" );
nkeynes@736
   967
            for( j=0; j<poly->vertex_count; j++ ) {
nkeynes@736
   968
                struct vertex_struct *v = &pvr2_scene.vertex_array[poly->mod_vertex_index+j];
nkeynes@784
   969
                fprintf( f, "    %.5f %.5f %.5f, (%.5f,%.5f)  %.5f,%.5f,%.5f,%.5f  %.5f %.5f %.5f %.5f\n", v->x, v->y, v->z, v->u, v->v,
nkeynes@827
   970
                         v->rgba[0], v->rgba[1], v->rgba[2], v->rgba[3],
nkeynes@784
   971
                         v->offset_rgba[0], v->offset_rgba[1], v->offset_rgba[2], v->offset_rgba[3] );
nkeynes@736
   972
            }
nkeynes@736
   973
        }
nkeynes@645
   974
    }
nkeynes@645
   975
nkeynes@645
   976
}
nkeynes@1142
   977
nkeynes@1142
   978
/**
 * Convenience wrapper: print the current scene to stdout using
 * pvr2_scene_print().
 */
void pvr2_scene_dump( void )
{
    pvr2_scene_print(stdout);
}
.