filename | src/pvr2/rendcore.c |
changeset | 308:10a5b5475fb0 |
prev | 298:44d94dd0e8aa |
next | 318:363935d31859 |
author | nkeynes |
date | Tue Jan 23 11:19:32 2007 +0000 (17 years ago) |
permissions | -rw-r--r-- |
last change | Refactor render buffer read/write to pvr2mem.c Implement 4-bit indexed textures (tentatively) Fix RGB24 support |
file | annotate | diff | log | raw |
nkeynes@189 | 1 | /** |
nkeynes@308 | 2 | * $Id: rendcore.c,v 1.10 2007-01-21 11:28:43 nkeynes Exp $ |
nkeynes@189 | 3 | * |
nkeynes@189 | 4 | * PVR2 renderer core. |
nkeynes@189 | 5 | * |
nkeynes@189 | 6 | * Copyright (c) 2005 Nathan Keynes. |
nkeynes@189 | 7 | * |
nkeynes@189 | 8 | * This program is free software; you can redistribute it and/or modify |
nkeynes@189 | 9 | * it under the terms of the GNU General Public License as published by |
nkeynes@189 | 10 | * the Free Software Foundation; either version 2 of the License, or |
nkeynes@189 | 11 | * (at your option) any later version. |
nkeynes@189 | 12 | * |
nkeynes@189 | 13 | * This program is distributed in the hope that it will be useful, |
nkeynes@189 | 14 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
nkeynes@189 | 15 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
nkeynes@189 | 16 | * GNU General Public License for more details. |
nkeynes@189 | 17 | */ |
nkeynes@215 | 18 | #include <sys/time.h> |
nkeynes@189 | 19 | #include "pvr2/pvr2.h" |
nkeynes@189 | 20 | #include "asic.h" |
nkeynes@189 | 21 | |
nkeynes@221 | 22 | int pvr2_poly_depthmode[8] = { GL_NEVER, GL_LESS, GL_EQUAL, GL_LEQUAL, |
nkeynes@189 | 23 | GL_GREATER, GL_NOTEQUAL, GL_GEQUAL, |
nkeynes@189 | 24 | GL_ALWAYS }; |
nkeynes@221 | 25 | int pvr2_poly_srcblend[8] = { |
nkeynes@189 | 26 | GL_ZERO, GL_ONE, GL_DST_COLOR, GL_ONE_MINUS_DST_COLOR, |
nkeynes@189 | 27 | GL_SRC_ALPHA, GL_ONE_MINUS_SRC_ALPHA, GL_DST_ALPHA, |
nkeynes@189 | 28 | GL_ONE_MINUS_DST_ALPHA }; |
nkeynes@221 | 29 | int pvr2_poly_dstblend[8] = { |
nkeynes@189 | 30 | GL_ZERO, GL_ONE, GL_SRC_COLOR, GL_ONE_MINUS_SRC_COLOR, |
nkeynes@189 | 31 | GL_SRC_ALPHA, GL_ONE_MINUS_SRC_ALPHA, GL_DST_ALPHA, |
nkeynes@189 | 32 | GL_ONE_MINUS_DST_ALPHA }; |
nkeynes@221 | 33 | int pvr2_poly_texblend[4] = { |
nkeynes@298 | 34 | GL_REPLACE, GL_MODULATE, GL_DECAL, GL_MODULATE }; |
nkeynes@221 | 35 | int pvr2_render_colour_format[8] = { |
nkeynes@189 | 36 | COLFMT_ARGB1555, COLFMT_RGB565, COLFMT_ARGB4444, COLFMT_ARGB1555, |
nkeynes@189 | 37 | COLFMT_RGB888, COLFMT_ARGB8888, COLFMT_ARGB8888, COLFMT_ARGB4444 }; |
nkeynes@189 | 38 | |
nkeynes@189 | 39 | |
/* Culling modes, as returned by POLY1_CULL_MODE() and switched on in
 * render_set_context(). */
#define CULL_NONE   0
#define CULL_SMALL  1
#define CULL_CCW    2
#define CULL_CW     3

/* Flag bits of tile_segment.control */
#define SEGMENT_END         0x80000000  /* Last segment of the table */
#define SEGMENT_ZCLEAR      0x40000000  /* Not used in this file */
#define SEGMENT_SORT_TRANS  0x20000000  /* When clear (and per-segment sorting is
                                         * selected) the translucent list is autosorted */
#define SEGMENT_START       0x10000000  /* Not used in this file */

/* Tile column / row (6 bits each) packed into tile_segment.control */
#define SEGMENT_X(c)  (((c) >> 2) & 0x3F)
#define SEGMENT_Y(c)  (((c) >> 8) & 0x3F)

/* Set in a tile_segment list pointer when that list is absent */
#define NO_POINTER  0x80000000

/* Base of video RAM; the PVR2 addresses used in this file are byte offsets
 * from this pointer. */
extern char *video_base;
nkeynes@189 | 54 | |
nkeynes@189 | 55 | struct tile_segment { |
nkeynes@189 | 56 | uint32_t control; |
nkeynes@189 | 57 | pvraddr_t opaque_ptr; |
nkeynes@189 | 58 | pvraddr_t opaquemod_ptr; |
nkeynes@189 | 59 | pvraddr_t trans_ptr; |
nkeynes@189 | 60 | pvraddr_t transmod_ptr; |
nkeynes@189 | 61 | pvraddr_t punchout_ptr; |
nkeynes@189 | 62 | }; |
nkeynes@189 | 63 | |
/**
 * Expand a 16-bit packed float into a regular 32-bit float.
 *
 * The 16 source bits are used verbatim as the upper 16 bits of the 32-bit
 * float's bit pattern; the lower 16 bits of the result are zero. In other
 * words the source is a 32-bit float truncated to its top half (sign,
 * exponent and the most significant mantissa bits), NOT a 1/5/10
 * sign/exponent/mantissa half-float.
 * TODO: Check the correctness of this.
 *
 * @param half the 16-bit packed value
 * @return the expanded 32-bit float
 */
float halftofloat( uint16_t half )
{
    union {
        uint32_t bits;
        float value;
    } pun;

    pun.bits = ((uint32_t)half) << 16;
    return pun.value;
}
nkeynes@189 | 82 | |
nkeynes@189 | 83 | |
nkeynes@189 | 84 | /** |
nkeynes@189 | 85 | * Setup the GL context for the supplied polygon context. |
nkeynes@189 | 86 | * @param context pointer to 3 or 5 words of polygon context |
nkeynes@189 | 87 | * @param modified boolean flag indicating that the modified |
nkeynes@189 | 88 | * version should be used, rather than the normal version. |
nkeynes@189 | 89 | */ |
nkeynes@189 | 90 | void render_set_context( uint32_t *context, int render_mode ) |
nkeynes@189 | 91 | { |
nkeynes@189 | 92 | uint32_t poly1 = context[0], poly2, texture; |
nkeynes@189 | 93 | if( render_mode == RENDER_FULLMOD ) { |
nkeynes@189 | 94 | poly2 = context[3]; |
nkeynes@189 | 95 | texture = context[4]; |
nkeynes@189 | 96 | } else { |
nkeynes@189 | 97 | poly2 = context[1]; |
nkeynes@189 | 98 | texture = context[2]; |
nkeynes@189 | 99 | } |
nkeynes@189 | 100 | |
nkeynes@189 | 101 | if( POLY1_DEPTH_ENABLE(poly1) ) { |
nkeynes@189 | 102 | glEnable( GL_DEPTH_TEST ); |
nkeynes@189 | 103 | glDepthFunc( POLY1_DEPTH_MODE(poly1) ); |
nkeynes@189 | 104 | } else { |
nkeynes@189 | 105 | glDisable( GL_DEPTH_TEST ); |
nkeynes@189 | 106 | } |
nkeynes@189 | 107 | |
nkeynes@189 | 108 | switch( POLY1_CULL_MODE(poly1) ) { |
nkeynes@189 | 109 | case CULL_NONE: |
nkeynes@189 | 110 | case CULL_SMALL: |
nkeynes@189 | 111 | glDisable( GL_CULL_FACE ); |
nkeynes@189 | 112 | break; |
nkeynes@189 | 113 | case CULL_CCW: |
nkeynes@189 | 114 | glEnable( GL_CULL_FACE ); |
nkeynes@189 | 115 | glFrontFace( GL_CW ); |
nkeynes@189 | 116 | break; |
nkeynes@189 | 117 | case CULL_CW: |
nkeynes@189 | 118 | glEnable( GL_CULL_FACE ); |
nkeynes@189 | 119 | glFrontFace( GL_CCW ); |
nkeynes@189 | 120 | break; |
nkeynes@189 | 121 | } |
nkeynes@189 | 122 | |
nkeynes@189 | 123 | if( POLY1_TEXTURED(poly1) ) { |
nkeynes@189 | 124 | int width = POLY2_TEX_WIDTH(poly2); |
nkeynes@189 | 125 | int height = POLY2_TEX_HEIGHT(poly2); |
nkeynes@189 | 126 | glEnable(GL_TEXTURE_2D); |
nkeynes@286 | 127 | texcache_get_texture( (texture&0x000FFFFF)<<3, width, height, texture ); |
nkeynes@189 | 128 | glTexEnvi( GL_TEXTURE_ENV, GL_TEXTURE_ENV_MODE, POLY2_TEX_BLEND(poly2) ); |
nkeynes@308 | 129 | if( POLY2_TEX_CLAMP_U(poly2) ) { |
nkeynes@308 | 130 | glTexParameteri( GL_TEXTURE_2D, GL_TEXTURE_WRAP_S, GL_CLAMP ); |
nkeynes@308 | 131 | } else { |
nkeynes@308 | 132 | glTexParameteri( GL_TEXTURE_2D, GL_TEXTURE_WRAP_S, GL_REPEAT ); |
nkeynes@308 | 133 | } |
nkeynes@308 | 134 | if( POLY2_TEX_CLAMP_V(poly2) ) { |
nkeynes@308 | 135 | glTexParameteri( GL_TEXTURE_2D, GL_TEXTURE_WRAP_T, GL_CLAMP ); |
nkeynes@308 | 136 | } else { |
nkeynes@308 | 137 | glTexParameteri( GL_TEXTURE_2D, GL_TEXTURE_WRAP_S, GL_REPEAT ); |
nkeynes@308 | 138 | } |
nkeynes@189 | 139 | } else { |
nkeynes@189 | 140 | glDisable( GL_TEXTURE_2D ); |
nkeynes@189 | 141 | } |
nkeynes@189 | 142 | |
nkeynes@189 | 143 | glShadeModel( POLY1_SHADE_MODEL(poly1) ); |
nkeynes@189 | 144 | |
nkeynes@221 | 145 | int srcblend = POLY2_SRC_BLEND(poly2); |
nkeynes@221 | 146 | int destblend = POLY2_DEST_BLEND(poly2); |
nkeynes@221 | 147 | glBlendFunc( srcblend, destblend ); |
nkeynes@189 | 148 | } |
nkeynes@189 | 149 | |
nkeynes@189 | 150 | void render_vertexes( uint32_t poly1, uint32_t *vertexes, int num_vertexes, int vertex_size, |
nkeynes@189 | 151 | int render_mode ) |
nkeynes@189 | 152 | { |
nkeynes@189 | 153 | int i, m=0; |
nkeynes@189 | 154 | |
nkeynes@189 | 155 | if( render_mode == RENDER_FULLMOD ) { |
nkeynes@189 | 156 | m = (vertex_size - 3)/2; |
nkeynes@189 | 157 | } |
nkeynes@189 | 158 | |
nkeynes@189 | 159 | glBegin( GL_TRIANGLE_STRIP ); |
nkeynes@189 | 160 | |
nkeynes@189 | 161 | for( i=0; i<num_vertexes; i++ ) { |
nkeynes@189 | 162 | float *vertexf = (float *)vertexes; |
nkeynes@189 | 163 | uint32_t argb; |
nkeynes@189 | 164 | if( POLY1_TEXTURED(poly1) ) { |
nkeynes@189 | 165 | if( POLY1_UV16(poly1) ) { |
nkeynes@189 | 166 | glTexCoord2f( halftofloat(vertexes[m+3]>>16), |
nkeynes@189 | 167 | halftofloat(vertexes[m+3]) ); |
nkeynes@189 | 168 | argb = vertexes[m+4]; |
nkeynes@189 | 169 | } else { |
nkeynes@189 | 170 | glTexCoord2f( vertexf[m+3], vertexf[m+4] ); |
nkeynes@189 | 171 | argb = vertexes[m+5]; |
nkeynes@189 | 172 | } |
nkeynes@189 | 173 | } else { |
nkeynes@189 | 174 | argb = vertexes[m+3]; |
nkeynes@189 | 175 | } |
nkeynes@189 | 176 | |
nkeynes@189 | 177 | glColor4ub( (GLubyte)(argb >> 16), (GLubyte)(argb >> 8), |
nkeynes@189 | 178 | (GLubyte)argb, (GLubyte)(argb >> 24) ); |
nkeynes@189 | 179 | glVertex3f( vertexf[0], vertexf[1], vertexf[2] ); |
nkeynes@189 | 180 | vertexes += vertex_size; |
nkeynes@189 | 181 | } |
nkeynes@189 | 182 | |
nkeynes@189 | 183 | glEnd(); |
nkeynes@189 | 184 | } |
nkeynes@189 | 185 | |
nkeynes@189 | 186 | /** |
nkeynes@189 | 187 | * Render a simple (not auto-sorted) tile |
nkeynes@189 | 188 | */ |
nkeynes@189 | 189 | void render_tile( pvraddr_t tile_entry, int render_mode, gboolean cheap_modifier_mode ) { |
nkeynes@215 | 190 | uint32_t poly_bank = MMIO_READ(PVR2,RENDER_POLYBASE); |
nkeynes@189 | 191 | uint32_t *tile_list = (uint32_t *)(video_base+tile_entry); |
nkeynes@189 | 192 | do { |
nkeynes@189 | 193 | uint32_t entry = *tile_list++; |
nkeynes@189 | 194 | if( entry >> 28 == 0x0F ) { |
nkeynes@189 | 195 | break; |
nkeynes@189 | 196 | } else if( entry >> 28 == 0x0E ) { |
nkeynes@189 | 197 | tile_list = (uint32_t *)(video_base + (entry&0x007FFFFF)); |
nkeynes@189 | 198 | } else { |
nkeynes@215 | 199 | uint32_t *polygon = (uint32_t *)(video_base + poly_bank + ((entry & 0x000FFFFF) << 2)); |
nkeynes@189 | 200 | int is_modified = entry & 0x01000000; |
nkeynes@189 | 201 | int vertex_length = (entry >> 21) & 0x07; |
nkeynes@189 | 202 | int context_length = 3; |
nkeynes@189 | 203 | if( is_modified && !cheap_modifier_mode ) { |
nkeynes@189 | 204 | context_length = 5; |
nkeynes@189 | 205 | vertex_length *= 2 ; |
nkeynes@189 | 206 | } |
nkeynes@189 | 207 | vertex_length += 3; |
nkeynes@308 | 208 | |
nkeynes@189 | 209 | if( (entry & 0xE0000000) == 0x80000000 ) { |
nkeynes@189 | 210 | /* Triangle(s) */ |
nkeynes@189 | 211 | int strip_count = ((entry >> 25) & 0x0F)+1; |
nkeynes@189 | 212 | int polygon_length = 3 * vertex_length + context_length; |
nkeynes@189 | 213 | int i; |
nkeynes@189 | 214 | for( i=0; i<strip_count; i++ ) { |
nkeynes@189 | 215 | render_set_context( polygon, render_mode ); |
nkeynes@189 | 216 | render_vertexes( *polygon, polygon+context_length, 3, vertex_length, |
nkeynes@189 | 217 | render_mode ); |
nkeynes@189 | 218 | polygon += polygon_length; |
nkeynes@189 | 219 | } |
nkeynes@189 | 220 | } else if( (entry & 0xE0000000) == 0xA0000000 ) { |
nkeynes@189 | 221 | /* Sprite(s) */ |
nkeynes@189 | 222 | int strip_count = (entry >> 25) & 0x0F; |
nkeynes@189 | 223 | int polygon_length = 4 * vertex_length + context_length; |
nkeynes@189 | 224 | int i; |
nkeynes@189 | 225 | for( i=0; i<strip_count; i++ ) { |
nkeynes@189 | 226 | render_set_context( polygon, render_mode ); |
nkeynes@189 | 227 | render_vertexes( *polygon, polygon+context_length, 4, vertex_length, |
nkeynes@189 | 228 | render_mode ); |
nkeynes@189 | 229 | polygon += polygon_length; |
nkeynes@189 | 230 | } |
nkeynes@189 | 231 | } else { |
nkeynes@189 | 232 | /* Polygon */ |
nkeynes@189 | 233 | int i, first=-1, last = -1; |
nkeynes@189 | 234 | for( i=0; i<6; i++ ) { |
nkeynes@189 | 235 | if( entry & (0x40000000>>i) ) { |
nkeynes@189 | 236 | if( first == -1 ) first = i; |
nkeynes@189 | 237 | last = i; |
nkeynes@189 | 238 | } |
nkeynes@189 | 239 | } |
nkeynes@189 | 240 | if( first != -1 ) { |
nkeynes@189 | 241 | first = 0; |
nkeynes@189 | 242 | render_set_context(polygon, render_mode); |
nkeynes@189 | 243 | render_vertexes( *polygon, polygon+context_length + (first*vertex_length), |
nkeynes@189 | 244 | (last-first+3), vertex_length, render_mode ); |
nkeynes@189 | 245 | } |
nkeynes@189 | 246 | } |
nkeynes@189 | 247 | } |
nkeynes@189 | 248 | } while( 1 ); |
nkeynes@189 | 249 | } |
nkeynes@189 | 250 | |
nkeynes@189 | 251 | void pvr2_render_tilebuffer( int width, int height, int clipx1, int clipy1, |
nkeynes@189 | 252 | int clipx2, int clipy2 ) { |
nkeynes@189 | 253 | |
nkeynes@191 | 254 | pvraddr_t segmentbase = MMIO_READ( PVR2, RENDER_TILEBASE ); |
nkeynes@189 | 255 | int tile_sort; |
nkeynes@189 | 256 | gboolean cheap_shadow; |
nkeynes@189 | 257 | |
nkeynes@191 | 258 | int obj_config = MMIO_READ( PVR2, RENDER_OBJCFG ); |
nkeynes@191 | 259 | int isp_config = MMIO_READ( PVR2, RENDER_ISPCFG ); |
nkeynes@191 | 260 | int shadow_cfg = MMIO_READ( PVR2, RENDER_SHADOW ); |
nkeynes@189 | 261 | |
nkeynes@222 | 262 | if( (obj_config & 0x00200000) == 0 ) { |
nkeynes@189 | 263 | if( isp_config & 1 ) { |
nkeynes@189 | 264 | tile_sort = 0; |
nkeynes@189 | 265 | } else { |
nkeynes@189 | 266 | tile_sort = 2; |
nkeynes@189 | 267 | } |
nkeynes@189 | 268 | } else { |
nkeynes@189 | 269 | tile_sort = 1; |
nkeynes@189 | 270 | } |
nkeynes@189 | 271 | |
nkeynes@189 | 272 | cheap_shadow = shadow_cfg & 0x100 ? TRUE : FALSE; |
nkeynes@189 | 273 | |
nkeynes@189 | 274 | struct tile_segment *segment = (struct tile_segment *)(video_base + segmentbase); |
nkeynes@189 | 275 | |
nkeynes@215 | 276 | struct timeval tv_start, tv_end; |
nkeynes@215 | 277 | gettimeofday(&tv_start, NULL); |
nkeynes@189 | 278 | glEnable( GL_SCISSOR_TEST ); |
nkeynes@268 | 279 | do { |
nkeynes@221 | 280 | // fwrite_dump32v( (uint32_t *)segment, sizeof(struct tile_segment), 6, stderr ); |
nkeynes@189 | 281 | int tilex = SEGMENT_X(segment->control); |
nkeynes@189 | 282 | int tiley = SEGMENT_Y(segment->control); |
nkeynes@189 | 283 | |
nkeynes@189 | 284 | int x1 = tilex << 5; |
nkeynes@189 | 285 | int y1 = tiley << 5; |
nkeynes@189 | 286 | if( x1 + 32 <= clipx1 || |
nkeynes@189 | 287 | y1 + 32 <= clipy1 || |
nkeynes@189 | 288 | x1 >= clipx2 || |
nkeynes@189 | 289 | y1 >= clipy2 ) { |
nkeynes@189 | 290 | /* Tile completely clipped, skip */ |
nkeynes@189 | 291 | continue; |
nkeynes@189 | 292 | } |
nkeynes@215 | 293 | |
nkeynes@189 | 294 | /* Set a scissor on the visible part of the tile */ |
nkeynes@189 | 295 | int w = MIN(x1+32, clipx2) - x1; |
nkeynes@189 | 296 | int h = MIN(y1+32, clipy2) - y1; |
nkeynes@189 | 297 | x1 = MAX(x1,clipx1); |
nkeynes@189 | 298 | y1 = MAX(y1,clipy1); |
nkeynes@189 | 299 | glScissor( x1, height-y1-h, w, h ); |
nkeynes@189 | 300 | |
nkeynes@189 | 301 | if( (segment->opaque_ptr & NO_POINTER) == 0 ) { |
nkeynes@189 | 302 | if( (segment->opaquemod_ptr & NO_POINTER) == 0 ) { |
nkeynes@189 | 303 | /* TODO */ |
nkeynes@189 | 304 | } |
nkeynes@189 | 305 | render_tile( segment->opaque_ptr, RENDER_NORMAL, cheap_shadow ); |
nkeynes@189 | 306 | } |
nkeynes@189 | 307 | |
nkeynes@189 | 308 | if( (segment->trans_ptr & NO_POINTER) == 0 ) { |
nkeynes@189 | 309 | if( (segment->transmod_ptr & NO_POINTER) == 0 ) { |
nkeynes@189 | 310 | /* TODO */ |
nkeynes@189 | 311 | } |
nkeynes@222 | 312 | if( tile_sort == 2 || |
nkeynes@222 | 313 | (tile_sort == 1 && ((segment->control & SEGMENT_SORT_TRANS)==0)) ) { |
nkeynes@189 | 314 | render_autosort_tile( segment->trans_ptr, RENDER_NORMAL, cheap_shadow ); |
nkeynes@189 | 315 | } else { |
nkeynes@189 | 316 | render_tile( segment->trans_ptr, RENDER_NORMAL, cheap_shadow ); |
nkeynes@189 | 317 | } |
nkeynes@189 | 318 | } |
nkeynes@189 | 319 | |
nkeynes@189 | 320 | if( (segment->punchout_ptr & NO_POINTER) == 0 ) { |
nkeynes@189 | 321 | render_tile( segment->punchout_ptr, RENDER_NORMAL, cheap_shadow ); |
nkeynes@189 | 322 | } |
nkeynes@268 | 323 | } while( ((segment++)->control & SEGMENT_END) == 0 ); |
nkeynes@189 | 324 | glDisable( GL_SCISSOR_TEST ); |
nkeynes@215 | 325 | |
nkeynes@215 | 326 | gettimeofday(&tv_end, NULL); |
nkeynes@215 | 327 | timersub(&tv_end,&tv_start, &tv_start); |
nkeynes@189 | 328 | } |
.