nkeynes@189 | 1 | /**
|
nkeynes@286 | 2 | * $Id: rendcore.c,v 1.8 2007-01-15 10:11:13 nkeynes Exp $
|
nkeynes@189 | 3 | *
|
nkeynes@189 | 4 | * PVR2 renderer core.
|
nkeynes@189 | 5 | *
|
nkeynes@189 | 6 | * Copyright (c) 2005 Nathan Keynes.
|
nkeynes@189 | 7 | *
|
nkeynes@189 | 8 | * This program is free software; you can redistribute it and/or modify
|
nkeynes@189 | 9 | * it under the terms of the GNU General Public License as published by
|
nkeynes@189 | 10 | * the Free Software Foundation; either version 2 of the License, or
|
nkeynes@189 | 11 | * (at your option) any later version.
|
nkeynes@189 | 12 | *
|
nkeynes@189 | 13 | * This program is distributed in the hope that it will be useful,
|
nkeynes@189 | 14 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
|
nkeynes@189 | 15 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
nkeynes@189 | 16 | * GNU General Public License for more details.
|
nkeynes@189 | 17 | */
|
nkeynes@215 | 18 | #include <sys/time.h>
|
nkeynes@189 | 19 | #include "pvr2/pvr2.h"
|
nkeynes@189 | 20 | #include "asic.h"
|
nkeynes@189 | 21 |
|
nkeynes@221 | 22 | int pvr2_poly_depthmode[8] = { GL_NEVER, GL_LESS, GL_EQUAL, GL_LEQUAL,
|
nkeynes@189 | 23 | GL_GREATER, GL_NOTEQUAL, GL_GEQUAL,
|
nkeynes@189 | 24 | GL_ALWAYS };
|
nkeynes@221 | 25 | int pvr2_poly_srcblend[8] = {
|
nkeynes@189 | 26 | GL_ZERO, GL_ONE, GL_DST_COLOR, GL_ONE_MINUS_DST_COLOR,
|
nkeynes@189 | 27 | GL_SRC_ALPHA, GL_ONE_MINUS_SRC_ALPHA, GL_DST_ALPHA,
|
nkeynes@189 | 28 | GL_ONE_MINUS_DST_ALPHA };
|
nkeynes@221 | 29 | int pvr2_poly_dstblend[8] = {
|
nkeynes@189 | 30 | GL_ZERO, GL_ONE, GL_SRC_COLOR, GL_ONE_MINUS_SRC_COLOR,
|
nkeynes@189 | 31 | GL_SRC_ALPHA, GL_ONE_MINUS_SRC_ALPHA, GL_DST_ALPHA,
|
nkeynes@189 | 32 | GL_ONE_MINUS_DST_ALPHA };
|
nkeynes@221 | 33 | int pvr2_poly_texblend[4] = {
|
nkeynes@189 | 34 | GL_REPLACE, GL_BLEND, GL_DECAL, GL_MODULATE };
|
nkeynes@221 | 35 | int pvr2_render_colour_format[8] = {
|
nkeynes@189 | 36 | COLFMT_ARGB1555, COLFMT_RGB565, COLFMT_ARGB4444, COLFMT_ARGB1555,
|
nkeynes@189 | 37 | COLFMT_RGB888, COLFMT_ARGB8888, COLFMT_ARGB8888, COLFMT_ARGB4444 };
|
nkeynes@189 | 38 |
|
nkeynes@189 | 39 |
|
/* Culling modes, compared against POLY1_CULL_MODE() in render_set_context(). */
#define CULL_NONE           0
#define CULL_SMALL          1
#define CULL_CCW            2
#define CULL_CW             3

/* Flag bits found in tile_segment.control. */
#define SEGMENT_END         0x80000000  /* set on the final segment of the list */
#define SEGMENT_SORT_TRANS  0x20000000  /* consulted when choosing the translucent renderer */
#define SEGMENT_START       0x10000000

/* Tile coordinates (6 bits each, in units of one tile) packed into the control word. */
#define SEGMENT_X(c)        (((c) >> 2) & 0x3F)
#define SEGMENT_Y(c)        (((c) >> 8) & 0x3F)

/* Set in a tile_segment list pointer when that list is absent. */
#define NO_POINTER          0x80000000

/* Base address against which all PVR2 offsets in this file are resolved. */
extern char *video_base;
|
nkeynes@189 | 53 |
|
nkeynes@189 | 54 | struct tile_segment {
|
nkeynes@189 | 55 | uint32_t control;
|
nkeynes@189 | 56 | pvraddr_t opaque_ptr;
|
nkeynes@189 | 57 | pvraddr_t opaquemod_ptr;
|
nkeynes@189 | 58 | pvraddr_t trans_ptr;
|
nkeynes@189 | 59 | pvraddr_t transmod_ptr;
|
nkeynes@189 | 60 | pvraddr_t punchout_ptr;
|
nkeynes@189 | 61 | };
|
nkeynes@189 | 62 |
|
/**
 * Convert a half-float (16-bit) FP number to a regular 32-bit float.
 * Source is 1-bit sign, 5-bit exponent (bias 15), 10-bit mantissa.
 *
 * All encodings of that layout are handled:
 *   - exponent 0, mantissa 0      -> signed zero
 *   - exponent 0, mantissa != 0   -> subnormal, renormalised for the wider format
 *   - exponent 31                 -> infinity / NaN (mantissa bits carried over)
 *   - anything else               -> normal number, exponent rebiased to 127
 *
 * NOTE(review): confirm that the PVR2 16-bit UV values passed in by
 * render_vertexes() really use this 1/5/10 layout rather than some other
 * 16-bit encoding (e.g. the top half of a 32-bit float).
 *
 * @param half the 16-bit encoded value
 * @return the same value as a 32-bit float
 */
float halftofloat( uint16_t half )
{
    union {
        float f;
        uint32_t i;
    } temp;
    /* Widen before shifting: shifting the promoted (signed) int into bit 31
     * would be undefined behaviour. */
    uint32_t sign = ((uint32_t)(half & 0x8000)) << 16;
    uint32_t exponent = ((uint32_t)half >> 10) & 0x1F;
    uint32_t mantissa = (uint32_t)half & 0x03FF;

    if( exponent == 0 ) {
        if( mantissa == 0 ) {
            /* Signed zero */
            temp.i = sign;
        } else {
            /* Subnormal: value is mantissa * 2^-24. Shift the mantissa up
             * until its implicit leading one appears, adjusting the exponent
             * by the same amount. */
            uint32_t e = 127 - 15 + 1;
            while( (mantissa & 0x0400) == 0 ) {
                mantissa <<= 1;
                e--;
            }
            mantissa &= 0x03FF;
            temp.i = sign | (e << 23) | (mantissa << 13);
        }
    } else if( exponent == 0x1F ) {
        /* Infinity (mantissa == 0) or NaN (mantissa != 0) */
        temp.i = sign | 0x7F800000 | (mantissa << 13);
    } else {
        /* Normal number: rebias the exponent from 15 to 127 */
        temp.i = sign | ((exponent + (127 - 15)) << 23) | (mantissa << 13);
    }
    return temp.f;
}
|
nkeynes@189 | 80 |
|
nkeynes@189 | 81 |
|
nkeynes@189 | 82 | /**
|
nkeynes@189 | 83 | * Setup the GL context for the supplied polygon context.
|
nkeynes@189 | 84 | * @param context pointer to 3 or 5 words of polygon context
|
nkeynes@189 | 85 | * @param modified boolean flag indicating that the modified
|
nkeynes@189 | 86 | * version should be used, rather than the normal version.
|
nkeynes@189 | 87 | */
|
nkeynes@189 | 88 | void render_set_context( uint32_t *context, int render_mode )
|
nkeynes@189 | 89 | {
|
nkeynes@189 | 90 | uint32_t poly1 = context[0], poly2, texture;
|
nkeynes@189 | 91 | if( render_mode == RENDER_FULLMOD ) {
|
nkeynes@189 | 92 | poly2 = context[3];
|
nkeynes@189 | 93 | texture = context[4];
|
nkeynes@189 | 94 | } else {
|
nkeynes@189 | 95 | poly2 = context[1];
|
nkeynes@189 | 96 | texture = context[2];
|
nkeynes@189 | 97 | }
|
nkeynes@189 | 98 |
|
nkeynes@189 | 99 | if( POLY1_DEPTH_ENABLE(poly1) ) {
|
nkeynes@189 | 100 | glEnable( GL_DEPTH_TEST );
|
nkeynes@189 | 101 | glDepthFunc( POLY1_DEPTH_MODE(poly1) );
|
nkeynes@189 | 102 | } else {
|
nkeynes@189 | 103 | glDisable( GL_DEPTH_TEST );
|
nkeynes@189 | 104 | }
|
nkeynes@189 | 105 |
|
nkeynes@189 | 106 | switch( POLY1_CULL_MODE(poly1) ) {
|
nkeynes@189 | 107 | case CULL_NONE:
|
nkeynes@189 | 108 | case CULL_SMALL:
|
nkeynes@189 | 109 | glDisable( GL_CULL_FACE );
|
nkeynes@189 | 110 | break;
|
nkeynes@189 | 111 | case CULL_CCW:
|
nkeynes@189 | 112 | glEnable( GL_CULL_FACE );
|
nkeynes@189 | 113 | glFrontFace( GL_CW );
|
nkeynes@189 | 114 | break;
|
nkeynes@189 | 115 | case CULL_CW:
|
nkeynes@189 | 116 | glEnable( GL_CULL_FACE );
|
nkeynes@189 | 117 | glFrontFace( GL_CCW );
|
nkeynes@189 | 118 | break;
|
nkeynes@189 | 119 | }
|
nkeynes@189 | 120 |
|
nkeynes@189 | 121 | if( POLY1_TEXTURED(poly1) ) {
|
nkeynes@189 | 122 | int width = POLY2_TEX_WIDTH(poly2);
|
nkeynes@189 | 123 | int height = POLY2_TEX_HEIGHT(poly2);
|
nkeynes@189 | 124 | glEnable(GL_TEXTURE_2D);
|
nkeynes@286 | 125 | texcache_get_texture( (texture&0x000FFFFF)<<3, width, height, texture );
|
nkeynes@189 | 126 | glTexEnvi( GL_TEXTURE_ENV, GL_TEXTURE_ENV_MODE, POLY2_TEX_BLEND(poly2) );
|
nkeynes@189 | 127 | } else {
|
nkeynes@189 | 128 | glDisable( GL_TEXTURE_2D );
|
nkeynes@189 | 129 | }
|
nkeynes@189 | 130 |
|
nkeynes@189 | 131 | glShadeModel( POLY1_SHADE_MODEL(poly1) );
|
nkeynes@189 | 132 |
|
nkeynes@221 | 133 | int srcblend = POLY2_SRC_BLEND(poly2);
|
nkeynes@221 | 134 | int destblend = POLY2_DEST_BLEND(poly2);
|
nkeynes@221 | 135 | glBlendFunc( srcblend, destblend );
|
nkeynes@189 | 136 | if( POLY2_TEX_ALPHA_ENABLE(poly2) ) {
|
nkeynes@189 | 137 | glEnable(GL_BLEND);
|
nkeynes@189 | 138 | } else {
|
nkeynes@189 | 139 | glDisable(GL_BLEND);
|
nkeynes@189 | 140 | }
|
nkeynes@189 | 141 | }
|
nkeynes@189 | 142 |
|
nkeynes@189 | 143 | void render_vertexes( uint32_t poly1, uint32_t *vertexes, int num_vertexes, int vertex_size,
|
nkeynes@189 | 144 | int render_mode )
|
nkeynes@189 | 145 | {
|
nkeynes@189 | 146 | int i, m=0;
|
nkeynes@189 | 147 |
|
nkeynes@189 | 148 | if( render_mode == RENDER_FULLMOD ) {
|
nkeynes@189 | 149 | m = (vertex_size - 3)/2;
|
nkeynes@189 | 150 | }
|
nkeynes@189 | 151 |
|
nkeynes@189 | 152 | glBegin( GL_TRIANGLE_STRIP );
|
nkeynes@189 | 153 |
|
nkeynes@189 | 154 | for( i=0; i<num_vertexes; i++ ) {
|
nkeynes@189 | 155 | float *vertexf = (float *)vertexes;
|
nkeynes@189 | 156 | uint32_t argb;
|
nkeynes@189 | 157 | if( POLY1_TEXTURED(poly1) ) {
|
nkeynes@189 | 158 | if( POLY1_UV16(poly1) ) {
|
nkeynes@189 | 159 | glTexCoord2f( halftofloat(vertexes[m+3]>>16),
|
nkeynes@189 | 160 | halftofloat(vertexes[m+3]) );
|
nkeynes@189 | 161 | argb = vertexes[m+4];
|
nkeynes@189 | 162 | } else {
|
nkeynes@189 | 163 | glTexCoord2f( vertexf[m+3], vertexf[m+4] );
|
nkeynes@189 | 164 | argb = vertexes[m+5];
|
nkeynes@189 | 165 | }
|
nkeynes@189 | 166 | } else {
|
nkeynes@189 | 167 | argb = vertexes[m+3];
|
nkeynes@189 | 168 | }
|
nkeynes@189 | 169 |
|
nkeynes@189 | 170 | glColor4ub( (GLubyte)(argb >> 16), (GLubyte)(argb >> 8),
|
nkeynes@189 | 171 | (GLubyte)argb, (GLubyte)(argb >> 24) );
|
nkeynes@189 | 172 | glVertex3f( vertexf[0], vertexf[1], vertexf[2] );
|
nkeynes@189 | 173 | vertexes += vertex_size;
|
nkeynes@189 | 174 | }
|
nkeynes@189 | 175 |
|
nkeynes@189 | 176 | glEnd();
|
nkeynes@189 | 177 | }
|
nkeynes@189 | 178 |
|
nkeynes@189 | 179 | /**
|
nkeynes@189 | 180 | * Render a simple (not auto-sorted) tile
|
nkeynes@189 | 181 | */
|
nkeynes@189 | 182 | void render_tile( pvraddr_t tile_entry, int render_mode, gboolean cheap_modifier_mode ) {
|
nkeynes@215 | 183 | uint32_t poly_bank = MMIO_READ(PVR2,RENDER_POLYBASE);
|
nkeynes@189 | 184 | uint32_t *tile_list = (uint32_t *)(video_base+tile_entry);
|
nkeynes@189 | 185 | do {
|
nkeynes@189 | 186 | uint32_t entry = *tile_list++;
|
nkeynes@189 | 187 | if( entry >> 28 == 0x0F ) {
|
nkeynes@189 | 188 | break;
|
nkeynes@189 | 189 | } else if( entry >> 28 == 0x0E ) {
|
nkeynes@189 | 190 | tile_list = (uint32_t *)(video_base + (entry&0x007FFFFF));
|
nkeynes@189 | 191 | } else {
|
nkeynes@215 | 192 | uint32_t *polygon = (uint32_t *)(video_base + poly_bank + ((entry & 0x000FFFFF) << 2));
|
nkeynes@189 | 193 | int is_modified = entry & 0x01000000;
|
nkeynes@189 | 194 | int vertex_length = (entry >> 21) & 0x07;
|
nkeynes@189 | 195 | int context_length = 3;
|
nkeynes@189 | 196 | if( is_modified && !cheap_modifier_mode ) {
|
nkeynes@189 | 197 | context_length = 5;
|
nkeynes@189 | 198 | vertex_length *= 2 ;
|
nkeynes@189 | 199 | }
|
nkeynes@189 | 200 | vertex_length += 3;
|
nkeynes@189 | 201 |
|
nkeynes@189 | 202 | if( (entry & 0xE0000000) == 0x80000000 ) {
|
nkeynes@189 | 203 | /* Triangle(s) */
|
nkeynes@189 | 204 | int strip_count = ((entry >> 25) & 0x0F)+1;
|
nkeynes@189 | 205 | int polygon_length = 3 * vertex_length + context_length;
|
nkeynes@189 | 206 | int i;
|
nkeynes@189 | 207 | for( i=0; i<strip_count; i++ ) {
|
nkeynes@189 | 208 | render_set_context( polygon, render_mode );
|
nkeynes@189 | 209 | render_vertexes( *polygon, polygon+context_length, 3, vertex_length,
|
nkeynes@189 | 210 | render_mode );
|
nkeynes@189 | 211 | polygon += polygon_length;
|
nkeynes@189 | 212 | }
|
nkeynes@189 | 213 | } else if( (entry & 0xE0000000) == 0xA0000000 ) {
|
nkeynes@189 | 214 | /* Sprite(s) */
|
nkeynes@189 | 215 | int strip_count = (entry >> 25) & 0x0F;
|
nkeynes@189 | 216 | int polygon_length = 4 * vertex_length + context_length;
|
nkeynes@189 | 217 | int i;
|
nkeynes@189 | 218 | for( i=0; i<strip_count; i++ ) {
|
nkeynes@189 | 219 | render_set_context( polygon, render_mode );
|
nkeynes@189 | 220 | render_vertexes( *polygon, polygon+context_length, 4, vertex_length,
|
nkeynes@189 | 221 | render_mode );
|
nkeynes@189 | 222 | polygon += polygon_length;
|
nkeynes@189 | 223 | }
|
nkeynes@189 | 224 | } else {
|
nkeynes@189 | 225 | /* Polygon */
|
nkeynes@189 | 226 | int i, first=-1, last = -1;
|
nkeynes@189 | 227 | for( i=0; i<6; i++ ) {
|
nkeynes@189 | 228 | if( entry & (0x40000000>>i) ) {
|
nkeynes@189 | 229 | if( first == -1 ) first = i;
|
nkeynes@189 | 230 | last = i;
|
nkeynes@189 | 231 | }
|
nkeynes@189 | 232 | }
|
nkeynes@189 | 233 | if( first != -1 ) {
|
nkeynes@189 | 234 | first = 0;
|
nkeynes@189 | 235 | render_set_context(polygon, render_mode);
|
nkeynes@189 | 236 | render_vertexes( *polygon, polygon+context_length + (first*vertex_length),
|
nkeynes@189 | 237 | (last-first+3), vertex_length, render_mode );
|
nkeynes@189 | 238 | }
|
nkeynes@189 | 239 | }
|
nkeynes@189 | 240 | }
|
nkeynes@189 | 241 | } while( 1 );
|
nkeynes@189 | 242 | }
|
nkeynes@189 | 243 |
|
nkeynes@189 | 244 | void pvr2_render_tilebuffer( int width, int height, int clipx1, int clipy1,
|
nkeynes@189 | 245 | int clipx2, int clipy2 ) {
|
nkeynes@189 | 246 |
|
nkeynes@191 | 247 | pvraddr_t segmentbase = MMIO_READ( PVR2, RENDER_TILEBASE );
|
nkeynes@189 | 248 | int tile_sort;
|
nkeynes@189 | 249 | gboolean cheap_shadow;
|
nkeynes@189 | 250 |
|
nkeynes@191 | 251 | int obj_config = MMIO_READ( PVR2, RENDER_OBJCFG );
|
nkeynes@191 | 252 | int isp_config = MMIO_READ( PVR2, RENDER_ISPCFG );
|
nkeynes@191 | 253 | int shadow_cfg = MMIO_READ( PVR2, RENDER_SHADOW );
|
nkeynes@189 | 254 |
|
nkeynes@222 | 255 | if( (obj_config & 0x00200000) == 0 ) {
|
nkeynes@189 | 256 | if( isp_config & 1 ) {
|
nkeynes@189 | 257 | tile_sort = 0;
|
nkeynes@189 | 258 | } else {
|
nkeynes@189 | 259 | tile_sort = 2;
|
nkeynes@189 | 260 | }
|
nkeynes@189 | 261 | } else {
|
nkeynes@189 | 262 | tile_sort = 1;
|
nkeynes@189 | 263 | }
|
nkeynes@189 | 264 |
|
nkeynes@189 | 265 | cheap_shadow = shadow_cfg & 0x100 ? TRUE : FALSE;
|
nkeynes@189 | 266 |
|
nkeynes@189 | 267 | struct tile_segment *segment = (struct tile_segment *)(video_base + segmentbase);
|
nkeynes@189 | 268 |
|
nkeynes@215 | 269 | struct timeval tv_start, tv_end;
|
nkeynes@215 | 270 | gettimeofday(&tv_start, NULL);
|
nkeynes@189 | 271 | glEnable( GL_SCISSOR_TEST );
|
nkeynes@268 | 272 | do {
|
nkeynes@221 | 273 | // fwrite_dump32v( (uint32_t *)segment, sizeof(struct tile_segment), 6, stderr );
|
nkeynes@189 | 274 | int tilex = SEGMENT_X(segment->control);
|
nkeynes@189 | 275 | int tiley = SEGMENT_Y(segment->control);
|
nkeynes@189 | 276 |
|
nkeynes@189 | 277 | int x1 = tilex << 5;
|
nkeynes@189 | 278 | int y1 = tiley << 5;
|
nkeynes@189 | 279 | if( x1 + 32 <= clipx1 ||
|
nkeynes@189 | 280 | y1 + 32 <= clipy1 ||
|
nkeynes@189 | 281 | x1 >= clipx2 ||
|
nkeynes@189 | 282 | y1 >= clipy2 ) {
|
nkeynes@189 | 283 | /* Tile completely clipped, skip */
|
nkeynes@189 | 284 | continue;
|
nkeynes@189 | 285 | }
|
nkeynes@215 | 286 |
|
nkeynes@189 | 287 | /* Set a scissor on the visible part of the tile */
|
nkeynes@189 | 288 | int w = MIN(x1+32, clipx2) - x1;
|
nkeynes@189 | 289 | int h = MIN(y1+32, clipy2) - y1;
|
nkeynes@189 | 290 | x1 = MAX(x1,clipx1);
|
nkeynes@189 | 291 | y1 = MAX(y1,clipy1);
|
nkeynes@189 | 292 | glScissor( x1, height-y1-h, w, h );
|
nkeynes@189 | 293 |
|
nkeynes@189 | 294 | if( (segment->opaque_ptr & NO_POINTER) == 0 ) {
|
nkeynes@189 | 295 | if( (segment->opaquemod_ptr & NO_POINTER) == 0 ) {
|
nkeynes@189 | 296 | /* TODO */
|
nkeynes@189 | 297 | }
|
nkeynes@189 | 298 | render_tile( segment->opaque_ptr, RENDER_NORMAL, cheap_shadow );
|
nkeynes@189 | 299 | }
|
nkeynes@189 | 300 |
|
nkeynes@189 | 301 | if( (segment->trans_ptr & NO_POINTER) == 0 ) {
|
nkeynes@189 | 302 | if( (segment->transmod_ptr & NO_POINTER) == 0 ) {
|
nkeynes@189 | 303 | /* TODO */
|
nkeynes@189 | 304 | }
|
nkeynes@222 | 305 | if( tile_sort == 2 ||
|
nkeynes@222 | 306 | (tile_sort == 1 && ((segment->control & SEGMENT_SORT_TRANS)==0)) ) {
|
nkeynes@189 | 307 | render_autosort_tile( segment->trans_ptr, RENDER_NORMAL, cheap_shadow );
|
nkeynes@189 | 308 | } else {
|
nkeynes@189 | 309 | render_tile( segment->trans_ptr, RENDER_NORMAL, cheap_shadow );
|
nkeynes@189 | 310 | }
|
nkeynes@189 | 311 | }
|
nkeynes@189 | 312 |
|
nkeynes@189 | 313 | if( (segment->punchout_ptr & NO_POINTER) == 0 ) {
|
nkeynes@189 | 314 | render_tile( segment->punchout_ptr, RENDER_NORMAL, cheap_shadow );
|
nkeynes@189 | 315 | }
|
nkeynes@268 | 316 | } while( ((segment++)->control & SEGMENT_END) == 0 );
|
nkeynes@189 | 317 | glDisable( GL_SCISSOR_TEST );
|
nkeynes@215 | 318 |
|
nkeynes@215 | 319 | gettimeofday(&tv_end, NULL);
|
nkeynes@215 | 320 | timersub(&tv_end,&tv_start, &tv_start);
|
nkeynes@189 | 321 | }
|