Home | History | Annotate | Download | only in r200
      1 /*
      2 Copyright (C) The Weather Channel, Inc.  2002.  All Rights Reserved.
      3 
      4 The Weather Channel (TM) funded Tungsten Graphics to develop the
      5 initial release of the Radeon 8500 driver under the XFree86 license.
      6 This notice must be preserved.
      7 
      8 Permission is hereby granted, free of charge, to any person obtaining
      9 a copy of this software and associated documentation files (the
     10 "Software"), to deal in the Software without restriction, including
     11 without limitation the rights to use, copy, modify, merge, publish,
     12 distribute, sublicense, and/or sell copies of the Software, and to
     13 permit persons to whom the Software is furnished to do so, subject to
     14 the following conditions:
     15 
     16 The above copyright notice and this permission notice (including the
     17 next paragraph) shall be included in all copies or substantial
     18 portions of the Software.
     19 
     20 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
     21 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
     22 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
     23 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
     24 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
     25 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
     26 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
     27 
     28 **************************************************************************/
     29 
     30 /*
     31  * Authors:
     32  *   Keith Whitwell <keithw (at) vmware.com>
     33  */
     34 
     35 #include "main/glheader.h"
     36 #include "main/imports.h"
     37 #include "main/mtypes.h"
     38 #include "main/enums.h"
     39 #include "main/light.h"
     40 #include "main/state.h"
     41 
     42 #include "vbo/vbo.h"
     43 #include "tnl/tnl.h"
     44 #include "tnl/t_pipeline.h"
     45 
     46 #include "r200_context.h"
     47 #include "r200_state.h"
     48 #include "r200_ioctl.h"
     49 #include "r200_tcl.h"
     50 #include "r200_swtcl.h"
     51 #include "r200_maos.h"
     52 
     53 #include "radeon_common_context.h"
     54 
     55 
     56 
/* Per-primitive feature switches.  Everything is enabled except line
 * loops.
 * NOTE(review): presumably consumed by the tnl_dd/t_dd_dmatmp2.h template
 * included further down -- confirm against that header.
 */
#define HAVE_POINTS      1
#define HAVE_LINES       1
#define HAVE_LINE_LOOP   0
#define HAVE_LINE_STRIPS 1
#define HAVE_TRIANGLES   1
#define HAVE_TRI_STRIPS  1
#define HAVE_TRI_FANS    1
#define HAVE_QUADS       1
#define HAVE_QUAD_STRIPS 1
#define HAVE_POLYGONS    1
#define HAVE_ELTS        1
     68 
     69 
/* Hardware primitive codes, one per primitive kind.
 *
 * HW_POINTS is evaluated where it is expanded and needs a `ctx` in scope:
 * it yields the point-sprite code unless point smoothing is enabled, in
 * which case the plain point code is used.
 * HW_LINE_LOOP and HW_TRIANGLE_STRIP_1 are defined as 0.
 */
#define HW_POINTS           ((!ctx->Point.SmoothFlag) ? \
				R200_VF_PRIM_POINT_SPRITES : R200_VF_PRIM_POINTS)
#define HW_LINES            R200_VF_PRIM_LINES
#define HW_LINE_LOOP        0
#define HW_LINE_STRIP       R200_VF_PRIM_LINE_STRIP
#define HW_TRIANGLES        R200_VF_PRIM_TRIANGLES
#define HW_TRIANGLE_STRIP_0 R200_VF_PRIM_TRIANGLE_STRIP
#define HW_TRIANGLE_STRIP_1 0
#define HW_TRIANGLE_FAN     R200_VF_PRIM_TRIANGLE_FAN
#define HW_QUADS            R200_VF_PRIM_QUADS
#define HW_QUAD_STRIP       R200_VF_PRIM_QUAD_STRIP
#define HW_POLYGON          R200_VF_PRIM_POLYGON
     82 
     83 
     84 static GLboolean discrete_prim[0x10] = {
     85    0,				/* 0 none */
     86    1,				/* 1 points */
     87    1,				/* 2 lines */
     88    0,				/* 3 line_strip */
     89    1,				/* 4 tri_list */
     90    0,				/* 5 tri_fan */
     91    0,				/* 6 tri_strip */
     92    0,				/* 7 tri_w_flags */
     93    1,				/* 8 rect list (unused) */
     94    1,				/* 9 3vert point */
     95    1,				/* a 3vert line */
     96    0,				/* b point sprite */
     97    0,				/* c line loop */
     98    1,				/* d quads */
     99    0,				/* e quad strip */
    100    0,				/* f polygon */
    101 };
    102 
    103 
/* Helper macros that all expect a `ctx` in scope:
 *   LOCAL_VARS      declares `rmesa`, the r200 context derived from `ctx`.
 *   ELT_TYPE        element (index) type: GLushort.
 *   ELT_INIT        selects `hw_prim` with the indexed-walk bit set via
 *                   r200TclPrimitive().
 *   GET_MESA_ELTS   element array of the current TNL vertex buffer.
 * NOTE(review): presumably these are the hooks expected by the
 * tnl_dd/t_dd_dmatmp2.h template included below -- confirm.
 */
#define LOCAL_VARS r200ContextPtr rmesa = R200_CONTEXT(ctx)
#define ELT_TYPE  GLushort

#define ELT_INIT(prim, hw_prim) \
   r200TclPrimitive( ctx, prim, hw_prim | R200_VF_PRIM_WALK_IND )

#define GET_MESA_ELTS() TNL_CONTEXT(ctx)->vb.Elts
    111 
    112 
/* Upper bound on the number of elts emitted in one go.
 *
 * It is not really known how many elts will fit in what is left of the
 * cmdbuf, as there is state to emit, etc.
 *
 * Testing on isosurf shows a maximum around this value.  It is unknown
 * whether the card, the driver or the kernel module causes the behaviour.
 */
#define GET_MAX_HW_ELTS() 300
    121 
/* Both macros need `rmesa` in scope.
 *
 * RESET_STIPPLE: marks the `lin` state atom as changed and emits state
 * immediately.
 */
#define RESET_STIPPLE() do {			\
   R200_STATECHANGE( rmesa, lin );		\
   radeonEmitState(&rmesa->radeon);			\
} while (0)

/* AUTO_STIPPLE: sets (mode != 0) or clears (mode == 0) the
 * R200_LINE_PATTERN_AUTO_RESET bit in the line-pattern register image,
 * then emits state immediately.
 */
#define AUTO_STIPPLE( mode )  do {		\
   R200_STATECHANGE( rmesa, lin );		\
   if (mode)					\
      rmesa->hw.lin.cmd[LIN_RE_LINE_PATTERN] |=	\
	 R200_LINE_PATTERN_AUTO_RESET;	\
   else						\
      rmesa->hw.lin.cmd[LIN_RE_LINE_PATTERN] &=	\
	 ~R200_LINE_PATTERN_AUTO_RESET;	\
   radeonEmitState(&rmesa->radeon);			\
} while (0)
    137 
    138 
    139 #define ALLOC_ELTS(nr)	r200AllocElts( rmesa, nr )
    140 
    141 static GLushort *r200AllocElts( r200ContextPtr rmesa, GLuint nr )
    142 {
    143    if (rmesa->radeon.dma.flush == r200FlushElts &&
    144        rmesa->tcl.elt_used + nr*2 < R200_ELT_BUF_SZ) {
    145 
    146       GLushort *dest = (GLushort *)(rmesa->radeon.tcl.elt_dma_bo->ptr +
    147 				    rmesa->radeon.tcl.elt_dma_offset + rmesa->tcl.elt_used);
    148 
    149       rmesa->tcl.elt_used += nr*2;
    150 
    151       return dest;
    152    }
    153    else {
    154       if (rmesa->radeon.dma.flush)
    155 	 rmesa->radeon.dma.flush( &rmesa->radeon.glCtx );
    156 
    157       r200EmitAOS( rmesa,
    158 		   rmesa->radeon.tcl.aos_count, 0 );
    159 
    160       r200EmitMaxVtxIndex(rmesa, rmesa->radeon.tcl.aos[0].count);
    161       return r200AllocEltsOpenEnded( rmesa, rmesa->tcl.hw_primitive, nr );
    162    }
    163 }
    164 
    165 
/* Effectively a no-op: the R200_NEWPRIM() call is guarded by `if (0)`, so
 * it is compiled but never executed.  It still references `rmesa`, which
 * must therefore be in scope at the point of use.
 */
#define CLOSE_ELTS() 				\
do {						\
   if (0) R200_NEWPRIM( rmesa );		\
}						\
while (0)
    171 
    172 
    173 /* TODO: Try to extend existing primitive if both are identical,
    174  * discrete and there are no intervening state changes.  (Somewhat
    175  * duplicates changes to DrawArrays code)
    176  */
    177 static void r200EmitPrim( struct gl_context *ctx,
    178 		          GLenum prim,
    179 		          GLuint hwprim,
    180 		          GLuint start,
    181 		          GLuint count)
    182 {
    183    r200ContextPtr rmesa = R200_CONTEXT( ctx );
    184    r200TclPrimitive( ctx, prim, hwprim );
    185 
    186    //   fprintf(stderr,"Emit prim %d\n", rmesa->radeon.tcl.aos_count);
    187 
    188    r200EmitAOS( rmesa,
    189 		rmesa->radeon.tcl.aos_count,
    190 		start );
    191 
    192    /* Why couldn't this packet have taken an offset param?
    193     */
    194    r200EmitVbufPrim( rmesa,
    195 		     rmesa->tcl.hw_primitive,
    196 		     count - start );
    197 }
    198 
/* Forwards to r200EmitPrim().  The `(void) rmesa` marks the caller's
 * `rmesa` local as used; `rmesa` must be in scope where this expands.
 */
#define EMIT_PRIM(ctx, prim, hwprim, start, count) do {         \
   r200EmitPrim( ctx, prim, hwprim, start, count );             \
   (void) rmesa; } while (0)
    202 
/* Primitives shorter than this may be converted to elts by the rendering
 * code; r200EnsureEmitSize() uses it for its pessimistic size prediction.
 */
#define MAX_CONVERSION_SIZE 40
/* Try & join small primitives.
 *
 * PREFER_DISCRETE_ELT_PRIM(NR, PRIM) is true when NR < 20, or when NR < 40
 * and the current hardware primitive is already PRIM with the TCL-output
 * and indexed-walk bits set.  Needs `rmesa` in scope.  The `#if 0` branch
 * is a disabled variant that always yields 0.
 */
#if 0
#define PREFER_DISCRETE_ELT_PRIM( NR, PRIM ) 0
#else
#define PREFER_DISCRETE_ELT_PRIM( NR, PRIM )			\
  ((NR) < 20 ||							\
   ((NR) < 40 &&						\
    rmesa->tcl.hw_primitive == (PRIM|				\
			    R200_VF_TCL_OUTPUT_VTX_ENABLE|	\
			        R200_VF_PRIM_WALK_IND)))
#endif
    216 
/* EMIT_ELT(dest, offset, x): store x as a GLushort at element index
 * `offset` relative to `dest`.  `rmesa` must be in scope (it is only
 * referenced to mark it as used).
 */
#ifdef MESA_BIG_ENDIAN
/* We could do without (most of) this ugliness if dest was always 32 bit word aligned...
 *
 * Big-endian variant: `dest` is rounded down to a 4-byte boundary (the
 * index is bumped by one when bit 1 of the address was set), and the
 * element is then written to the other half of its 32-bit word: even
 * indices go to index + 1, odd indices to index - 1.
 */
#define EMIT_ELT(dest, offset, x) do {                          \
        int off = offset + ( ( (uintptr_t)dest & 0x2 ) >> 1 );     \
        GLushort *des = (GLushort *)( (uintptr_t)dest & ~0x2 );    \
        (des)[ off + 1 - 2 * ( off & 1 ) ] = (GLushort)(x);	\
	(void)rmesa; } while (0)
#else
/* Little-endian variant: a plain indexed store. */
#define EMIT_ELT(dest, offset, x) do {				\
	(dest)[offset] = (GLushort) (x);			\
	(void)rmesa; } while (0)
#endif
    229 
    230 #define EMIT_TWO_ELTS(dest, offset, x, y)  *(GLuint *)((dest)+offset) = ((y)<<16)|(x);
    231 
    232 
    233 
    234 #define TAG(x) tcl_##x
    235 #include "tnl_dd/t_dd_dmatmp2.h"
    236 
    237 /**********************************************************************/
    238 /*                          External entrypoints                     */
    239 /**********************************************************************/
    240 
    241 void r200EmitPrimitive( struct gl_context *ctx,
    242 			  GLuint first,
    243 			  GLuint last,
    244 			  GLuint flags )
    245 {
    246    tcl_render_tab_verts[flags&PRIM_MODE_MASK]( ctx, first, last, flags );
    247 }
    248 
    249 void r200EmitEltPrimitive( struct gl_context *ctx,
    250 			     GLuint first,
    251 			     GLuint last,
    252 			     GLuint flags )
    253 {
    254    tcl_render_tab_elts[flags&PRIM_MODE_MASK]( ctx, first, last, flags );
    255 }
    256 
    257 void r200TclPrimitive( struct gl_context *ctx,
    258 			 GLenum prim,
    259 			 int hw_prim )
    260 {
    261    r200ContextPtr rmesa = R200_CONTEXT(ctx);
    262    GLuint newprim = hw_prim | R200_VF_TCL_OUTPUT_VTX_ENABLE;
    263 
    264    radeon_prepare_render(&rmesa->radeon);
    265    if (rmesa->radeon.NewGLState)
    266       r200ValidateState( ctx );
    267 
    268    if (newprim != rmesa->tcl.hw_primitive ||
    269        !discrete_prim[hw_prim&0xf]) {
    270       /* need to disable perspective-correct texturing for point sprites */
    271       if ((prim & PRIM_MODE_MASK) == GL_POINTS && ctx->Point.PointSprite) {
    272 	 if (rmesa->hw.set.cmd[SET_RE_CNTL] & R200_PERSPECTIVE_ENABLE) {
    273 	    R200_STATECHANGE( rmesa, set );
    274 	    rmesa->hw.set.cmd[SET_RE_CNTL] &= ~R200_PERSPECTIVE_ENABLE;
    275 	 }
    276       }
    277       else if (!(rmesa->hw.set.cmd[SET_RE_CNTL] & R200_PERSPECTIVE_ENABLE)) {
    278 	 R200_STATECHANGE( rmesa, set );
    279 	 rmesa->hw.set.cmd[SET_RE_CNTL] |= R200_PERSPECTIVE_ENABLE;
    280       }
    281       R200_NEWPRIM( rmesa );
    282       rmesa->tcl.hw_primitive = newprim;
    283    }
    284 }
    285 
    286 /**
    287  * Predict total emit size for next rendering operation so there is no flush in middle of rendering
    288  * Prediction has to aim towards the best possible value that is worse than worst case scenario
    289  */
    290 static GLuint r200EnsureEmitSize( struct gl_context * ctx , GLubyte* vimap_rev )
    291 {
    292   r200ContextPtr rmesa = R200_CONTEXT(ctx);
    293   TNLcontext *tnl = TNL_CONTEXT(ctx);
    294   struct vertex_buffer *VB = &tnl->vb;
    295   GLuint space_required;
    296   GLuint state_size;
    297   GLuint nr_aos = 0;
    298   int i;
    299   /* predict number of aos to emit */
    300   for (i = 0; i < 15; ++i)
    301   {
    302     if (vimap_rev[i] != 255)
    303     {
    304       ++nr_aos;
    305     }
    306   }
    307 
    308   {
    309     /* count the prediction for state size */
    310     space_required = 0;
    311     state_size = radeonCountStateEmitSize( &rmesa->radeon );
    312     /* vtx may be changed in r200EmitArrays so account for it if not dirty */
    313     if (!rmesa->hw.vtx.dirty)
    314       state_size += rmesa->hw.vtx.check(&rmesa->radeon.glCtx, &rmesa->hw.vtx);
    315     /* predict size for elements */
    316     for (i = 0; i < VB->PrimitiveCount; ++i)
    317     {
    318       if (!VB->Primitive[i].count)
    319 	continue;
    320       /* If primitive.count is less than MAX_CONVERSION_SIZE
    321          rendering code may decide convert to elts.
    322 	 In that case we have to make pessimistic prediction.
    323 	 and use larger of 2 paths. */
    324       const GLuint elt_count =(VB->Primitive[i].count/GET_MAX_HW_ELTS() + 1);
    325       const GLuint elts = ELTS_BUFSZ(nr_aos) * elt_count;
    326       const GLuint index = INDEX_BUFSZ * elt_count;
    327       const GLuint vbuf = VBUF_BUFSZ;
    328       if ( (!VB->Elts && VB->Primitive[i].count >= MAX_CONVERSION_SIZE)
    329 	  || vbuf > index + elts)
    330 	space_required += vbuf;
    331       else
    332 	space_required += index + elts;
    333       space_required += AOS_BUFSZ(nr_aos);
    334     }
    335   }
    336 
    337   radeon_print(RADEON_RENDER,RADEON_VERBOSE,
    338       "%s space %u, aos %d\n",
    339       __func__, space_required, AOS_BUFSZ(nr_aos) );
    340   /* flush the buffer in case we need more than is left. */
    341   if (rcommonEnsureCmdBufSpace(&rmesa->radeon, space_required + state_size, __func__))
    342     return space_required + radeonCountStateEmitSize( &rmesa->radeon );
    343   else
    344     return space_required + state_size;
    345 }
    346 
    347 
    348 /**********************************************************************/
    349 /*                          Render pipeline stage                     */
    350 /**********************************************************************/
    351 
    352 
    353 /* TCL render.
    354  */
    355 static GLboolean r200_run_tcl_render( struct gl_context *ctx,
    356 				      struct tnl_pipeline_stage *stage )
    357 {
    358    r200ContextPtr rmesa = R200_CONTEXT(ctx);
    359    TNLcontext *tnl = TNL_CONTEXT(ctx);
    360    struct vertex_buffer *VB = &tnl->vb;
    361    GLuint i;
    362    GLubyte *vimap_rev;
    363 /* use hw fixed order for simplicity, pos 0, weight 1, normal 2, fog 3,
    364    color0 - color3 4-7, texcoord0 - texcoord5 8-13, pos 1 14. Must not use
    365    more than 12 of those at the same time. */
    366    GLubyte map_rev_fixed[15] = {255, 255, 255, 255, 255, 255, 255, 255,
    367 			    255, 255, 255, 255, 255, 255, 255};
    368 
    369 
    370    /* TODO: separate this from the swtnl pipeline
    371     */
    372    if (rmesa->radeon.TclFallback)
    373       return GL_TRUE;	/* fallback to software t&l */
    374 
    375    radeon_print(RADEON_RENDER, RADEON_NORMAL, "%s\n", __func__);
    376 
    377    if (VB->Count == 0)
    378       return GL_FALSE;
    379 
    380    /* Validate state:
    381     */
    382    if (rmesa->radeon.NewGLState)
    383       if (!r200ValidateState( ctx ))
    384          return GL_TRUE; /* fallback to sw t&l */
    385 
    386    if (!ctx->VertexProgram._Enabled) {
    387    /* NOTE: inputs != tnl->render_inputs - these are the untransformed
    388     * inputs.
    389     */
    390       map_rev_fixed[0] = VERT_ATTRIB_POS;
    391       /* technically there is no reason we always need VA_COLOR0. In theory
    392          could disable it depending on lighting, color materials, texturing... */
    393       map_rev_fixed[4] = VERT_ATTRIB_COLOR0;
    394 
    395       if (ctx->Light.Enabled) {
    396 	 map_rev_fixed[2] = VERT_ATTRIB_NORMAL;
    397       }
    398 
    399       /* this also enables VA_COLOR1 when using separate specular
    400          lighting model, which is unnecessary.
    401          FIXME: OTOH, we're missing the case where a ATI_fragment_shader accesses
    402          the secondary color (if lighting is disabled). The chip seems
    403          misconfigured for that though elsewhere (tcl output, might lock up) */
    404       if (_mesa_need_secondary_color(ctx)) {
    405 	 map_rev_fixed[5] = VERT_ATTRIB_COLOR1;
    406       }
    407 
    408       if ( (ctx->Fog.FogCoordinateSource == GL_FOG_COORD) && ctx->Fog.Enabled ) {
    409 	 map_rev_fixed[3] = VERT_ATTRIB_FOG;
    410       }
    411 
    412       for (i = 0 ; i < ctx->Const.MaxTextureUnits; i++) {
    413 	 if (ctx->Texture.Unit[i]._Current) {
    414 	    if (rmesa->TexGenNeedNormals[i]) {
    415 	       map_rev_fixed[2] = VERT_ATTRIB_NORMAL;
    416 	    }
    417 	    map_rev_fixed[8 + i] = VERT_ATTRIB_TEX0 + i;
    418 	 }
    419       }
    420       vimap_rev = &map_rev_fixed[0];
    421    }
    422    else {
    423       /* vtx_tcl_output_vtxfmt_0/1 need to match configuration of "fragment
    424 	 part", since using some vertex interpolator later which is not in
    425 	 out_vtxfmt0/1 will lock up. It seems to be ok to write in vertex
    426 	 prog to a not enabled output however, so just don't mess with it.
    427 	 We only need to change compsel. */
    428       GLuint out_compsel = 0;
    429       const GLbitfield64 vp_out =
    430 	 rmesa->curr_vp_hw->mesa_program.info.outputs_written;
    431 
    432       vimap_rev = &rmesa->curr_vp_hw->inputmap_rev[0];
    433       assert(vp_out & BITFIELD64_BIT(VARYING_SLOT_POS));
    434       out_compsel = R200_OUTPUT_XYZW;
    435       if (vp_out & BITFIELD64_BIT(VARYING_SLOT_COL0)) {
    436 	 out_compsel |= R200_OUTPUT_COLOR_0;
    437       }
    438       if (vp_out & BITFIELD64_BIT(VARYING_SLOT_COL1)) {
    439 	 out_compsel |= R200_OUTPUT_COLOR_1;
    440       }
    441       if (vp_out & BITFIELD64_BIT(VARYING_SLOT_FOGC)) {
    442          out_compsel |= R200_OUTPUT_DISCRETE_FOG;
    443       }
    444       if (vp_out & BITFIELD64_BIT(VARYING_SLOT_PSIZ)) {
    445 	 out_compsel |= R200_OUTPUT_PT_SIZE;
    446       }
    447       for (i = VARYING_SLOT_TEX0; i < VARYING_SLOT_TEX6; i++) {
    448 	 if (vp_out & BITFIELD64_BIT(i)) {
    449 	    out_compsel |= R200_OUTPUT_TEX_0 << (i - VARYING_SLOT_TEX0);
    450 	 }
    451       }
    452       if (rmesa->hw.vtx.cmd[VTX_TCL_OUTPUT_COMPSEL] != out_compsel) {
    453 	 R200_STATECHANGE( rmesa, vtx );
    454 	 rmesa->hw.vtx.cmd[VTX_TCL_OUTPUT_COMPSEL] = out_compsel;
    455       }
    456    }
    457 
    458    /* Do the actual work:
    459     */
    460    radeonReleaseArrays( ctx, ~0 /* stage->changed_inputs */ );
    461    GLuint emit_end = r200EnsureEmitSize( ctx, vimap_rev )
    462      + rmesa->radeon.cmdbuf.cs->cdw;
    463    r200EmitArrays( ctx, vimap_rev );
    464 
    465    for (i = 0 ; i < VB->PrimitiveCount ; i++)
    466    {
    467       GLuint prim = _tnl_translate_prim(&VB->Primitive[i]);
    468       GLuint start = VB->Primitive[i].start;
    469       GLuint length = VB->Primitive[i].count;
    470 
    471       if (!length)
    472 	 continue;
    473 
    474       if (VB->Elts)
    475 	 r200EmitEltPrimitive( ctx, start, start+length, prim );
    476       else
    477 	 r200EmitPrimitive( ctx, start, start+length, prim );
    478    }
    479    if ( emit_end < rmesa->radeon.cmdbuf.cs->cdw )
    480      WARN_ONCE("Rendering was %d commands larger than predicted size."
    481 	 " We might overflow  command buffer.\n", rmesa->radeon.cmdbuf.cs->cdw - emit_end);
    482 
    483    return GL_FALSE;		/* finished the pipe */
    484 }
    485 
    486 
    487 
/* Initial state for tcl stage.
 *
 * Only the stage name and the run callback are populated; every other
 * slot is NULL.
 * NOTE(review): the three unlabeled NULL entries are presumably the
 * stage's remaining callbacks -- confirm against the definition of
 * struct tnl_pipeline_stage.
 */
const struct tnl_pipeline_stage _r200_tcl_stage =
{
   "r200 render",
   NULL,			/*  private */
   NULL,
   NULL,
   NULL,
   r200_run_tcl_render	/* run */
};
    499 
    500 
    501 
    502 /**********************************************************************/
    503 /*                 Validate state at pipeline start                   */
    504 /**********************************************************************/
    505 
    506 
    507 /*-----------------------------------------------------------------------
    508  * Manage TCL fallbacks
    509  */
    510 
    511 
    512 static void transition_to_swtnl( struct gl_context *ctx )
    513 {
    514    r200ContextPtr rmesa = R200_CONTEXT(ctx);
    515    TNLcontext *tnl = TNL_CONTEXT(ctx);
    516 
    517    R200_NEWPRIM( rmesa );
    518 
    519    r200ChooseVertexState( ctx );
    520    r200ChooseRenderState( ctx );
    521 
    522    _tnl_validate_shine_tables( ctx );
    523 
    524    tnl->Driver.NotifyMaterialChange =
    525       _tnl_validate_shine_tables;
    526 
    527    radeonReleaseArrays( ctx, ~0 );
    528 
    529    /* Still using the D3D based hardware-rasterizer from the radeon;
    530     * need to put the card into D3D mode to make it work:
    531     */
    532    R200_STATECHANGE( rmesa, vap );
    533    rmesa->hw.vap.cmd[VAP_SE_VAP_CNTL] &= ~(R200_VAP_TCL_ENABLE|R200_VAP_PROG_VTX_SHADER_ENABLE);
    534 }
    535 
    536 static void transition_to_hwtnl( struct gl_context *ctx )
    537 {
    538    r200ContextPtr rmesa = R200_CONTEXT(ctx);
    539    TNLcontext *tnl = TNL_CONTEXT(ctx);
    540 
    541    _tnl_need_projected_coords( ctx, GL_FALSE );
    542 
    543    r200UpdateMaterial( ctx );
    544 
    545    tnl->Driver.NotifyMaterialChange = r200UpdateMaterial;
    546 
    547    if ( rmesa->radeon.dma.flush )
    548       rmesa->radeon.dma.flush( &rmesa->radeon.glCtx );
    549 
    550    rmesa->radeon.dma.flush = NULL;
    551 
    552    R200_STATECHANGE( rmesa, vap );
    553    rmesa->hw.vap.cmd[VAP_SE_VAP_CNTL] |= R200_VAP_TCL_ENABLE;
    554    rmesa->hw.vap.cmd[VAP_SE_VAP_CNTL] &= ~R200_VAP_FORCE_W_TO_ONE;
    555 
    556    if (ctx->VertexProgram._Enabled) {
    557       rmesa->hw.vap.cmd[VAP_SE_VAP_CNTL] |= R200_VAP_PROG_VTX_SHADER_ENABLE;
    558    }
    559 
    560    if ( ((rmesa->hw.ctx.cmd[CTX_PP_FOG_COLOR] & R200_FOG_USE_MASK)
    561       == R200_FOG_USE_SPEC_ALPHA) &&
    562       (ctx->Fog.FogCoordinateSource == GL_FOG_COORD )) {
    563       R200_STATECHANGE( rmesa, ctx );
    564       rmesa->hw.ctx.cmd[CTX_PP_FOG_COLOR] &= ~R200_FOG_USE_MASK;
    565       rmesa->hw.ctx.cmd[CTX_PP_FOG_COLOR] |= R200_FOG_USE_VTX_FOG;
    566    }
    567 
    568    R200_STATECHANGE( rmesa, vte );
    569    rmesa->hw.vte.cmd[VTE_SE_VTE_CNTL] &= ~(R200_VTX_XY_FMT|R200_VTX_Z_FMT);
    570    rmesa->hw.vte.cmd[VTE_SE_VTE_CNTL] |= R200_VTX_W0_FMT;
    571 
    572    if (R200_DEBUG & RADEON_FALLBACKS)
    573       fprintf(stderr, "R200 end tcl fallback\n");
    574 }
    575 
    576 
    577 static char *fallbackStrings[] = {
    578    "Rasterization fallback",
    579    "Unfilled triangles",
    580    "Twosided lighting, differing materials",
    581    "Materials in VB (maybe between begin/end)",
    582    "Texgen unit 0",
    583    "Texgen unit 1",
    584    "Texgen unit 2",
    585    "Texgen unit 3",
    586    "Texgen unit 4",
    587    "Texgen unit 5",
    588    "User disable",
    589    "Bitmap as points",
    590    "Vertex program"
    591 };
    592 
    593 
    594 static char *getFallbackString(GLuint bit)
    595 {
    596    int i = 0;
    597    while (bit > 1) {
    598       i++;
    599       bit >>= 1;
    600    }
    601    return fallbackStrings[i];
    602 }
    603 
    604 
    605 
    606 void r200TclFallback( struct gl_context *ctx, GLuint bit, GLboolean mode )
    607 {
    608 	r200ContextPtr rmesa = R200_CONTEXT(ctx);
    609 	GLuint oldfallback = rmesa->radeon.TclFallback;
    610 
    611 	if (mode) {
    612 		if (oldfallback == 0) {
    613 			/* We have to flush before transition */
    614 			if ( rmesa->radeon.dma.flush )
    615 				rmesa->radeon.dma.flush( &rmesa->radeon.glCtx );
    616 
    617 			if (R200_DEBUG & RADEON_FALLBACKS)
    618 				fprintf(stderr, "R200 begin tcl fallback %s\n",
    619 						getFallbackString( bit ));
    620 			rmesa->radeon.TclFallback |= bit;
    621 			transition_to_swtnl( ctx );
    622 		} else
    623 			rmesa->radeon.TclFallback |= bit;
    624 	} else {
    625 		if (oldfallback == bit) {
    626 			/* We have to flush before transition */
    627 			if ( rmesa->radeon.dma.flush )
    628 				rmesa->radeon.dma.flush( &rmesa->radeon.glCtx );
    629 
    630 			if (R200_DEBUG & RADEON_FALLBACKS)
    631 				fprintf(stderr, "R200 end tcl fallback %s\n",
    632 						getFallbackString( bit ));
    633 			rmesa->radeon.TclFallback &= ~bit;
    634 			transition_to_hwtnl( ctx );
    635 		} else
    636 			rmesa->radeon.TclFallback &= ~bit;
    637 	}
    638 }
    639