diff options
| author | Keith Whitwell <keithw@vmware.com> | 2009-05-05 12:12:28 +0100 | 
|---|---|---|
| committer | Keith Whitwell <keithw@vmware.com> | 2009-05-05 13:14:53 +0100 | 
| commit | 113403ef51e2ec764db061aabf569d6f1a1a3ef0 (patch) | |
| tree | c21df3f7acaa4406a48200bb4dfa59073257c1a0 /src | |
| parent | 22b417b75ce0e6658a5d1e0e80cb6c3fdf631774 (diff) | |
mesa: more complete fix for transform_invarient glitches
Add a new flag mvp_with_dp4 in the context, and use that to switch
both ffvertex.c and programopt.c vertex transformation code to
either DP4 or MUL/MAD implementations.
Diffstat (limited to 'src')
| -rw-r--r-- | src/mesa/main/context.c | 13 | ||||
| -rw-r--r-- | src/mesa/main/context.h | 4 | ||||
| -rw-r--r-- | src/mesa/main/ffvertex_prog.c | 16 | ||||
| -rw-r--r-- | src/mesa/main/mtypes.h | 6 | ||||
| -rw-r--r-- | src/mesa/shader/programopt.c | 119 | ||||
| -rw-r--r-- | src/mesa/state_tracker/st_context.c | 6 | 
6 files changed, 153 insertions, 11 deletions
| diff --git a/src/mesa/main/context.c b/src/mesa/main/context.c index 016284de9a..d780f91f04 100644 --- a/src/mesa/main/context.c +++ b/src/mesa/main/context.c @@ -1522,4 +1522,17 @@ _mesa_Flush(void)  } +/** + * Set mvp_with_dp4 flag.  If a driver has a preference for DP4 over + * MUL/MAD, or vice versa, call this function to register that. + * Otherwise we default to MUL/MAD. + */ +void +_mesa_set_mvp_with_dp4( GLcontext *ctx, +                        GLboolean flag ) +{ +   ctx->mvp_with_dp4 = flag; +} + +  /*@}*/ diff --git a/src/mesa/main/context.h b/src/mesa/main/context.h index ecc1cec779..5b57d88029 100644 --- a/src/mesa/main/context.h +++ b/src/mesa/main/context.h @@ -151,6 +151,10 @@ extern struct _glapi_table *  _mesa_get_dispatch(GLcontext *ctx); +void +_mesa_set_mvp_with_dp4( GLcontext *ctx, +                        GLboolean flag ); +  /** \name Miscellaneous */  /*@{*/ diff --git a/src/mesa/main/ffvertex_prog.c b/src/mesa/main/ffvertex_prog.c index 82e1c4af66..43325b1352 100644 --- a/src/mesa/main/ffvertex_prog.c +++ b/src/mesa/main/ffvertex_prog.c @@ -315,12 +315,6 @@ static void make_state_key( GLcontext *ctx, struct state_key *key )   */  #define DISASSEM 0 -/* Should be tunable by the driver - do we want to do matrix - * multiplications with DP4's or with MUL/MAD's?  SSE works better - * with the latter, drivers may differ. - */ -#define PREFER_DP4 1 -  /* Use uregs to represent registers internally, translate to Mesa's   * expected formats on emit.   @@ -348,6 +342,7 @@ struct tnl_program {     const struct state_key *state;     struct gl_vertex_program *program;     GLint max_inst;  /** number of instructions allocated for program */ +   GLboolean mvp_with_dp4;     GLuint temp_in_use;     GLuint temp_reserved; @@ -775,7 +770,7 @@ static struct ureg get_eye_position( struct tnl_program *p )        p->eye_position = reserve_temp(p); -      if (PREFER_DP4) { +      if (p->mvp_with_dp4) {  	 register_matrix_param5( p, STATE_MODELVIEW_MATRIX, 0, 0, 3,                                   0, modelview ); @@ -881,7 +876,7 @@ static void build_hpos( struct tnl_program *p )     struct ureg hpos = register_output( p, VERT_RESULT_HPOS );     struct ureg mvp[4]; -   if (PREFER_DP4) { +   if (p->mvp_with_dp4) {        register_matrix_param5( p, STATE_MVP_MATRIX, 0, 0, 3,   			      0, mvp );        emit_matrix_transform_vec4( p, hpos, mvp, pos ); @@ -1574,7 +1569,7 @@ static void build_texture_transform( struct tnl_program *p )  	    struct ureg in = (!is_undef(out_texgen) ?   			      out_texgen :   			      register_input(p, VERT_ATTRIB_TEX0+i)); -	    if (PREFER_DP4) { +	    if (p->mvp_with_dp4) {  	       register_matrix_param5( p, STATE_TEXTURE_MATRIX, i, 0, 3,  				       0, texmat );  	       emit_matrix_transform_vec4( p, out, texmat, in ); @@ -1708,6 +1703,7 @@ static void build_tnl_program( struct tnl_program *p )  static void  create_new_program( const struct state_key *key,                      struct gl_vertex_program *program, +                    GLboolean mvp_with_dp4,                      GLuint max_temps)  {     struct tnl_program p; @@ -1721,6 +1717,7 @@ create_new_program( const struct state_key *key,     p.transformed_normal = undef;     p.identity = undef;     p.temp_in_use = 0; +   p.mvp_with_dp4 = mvp_with_dp4;     if (max_temps >= sizeof(int) * 8)        p.temp_reserved = 0; @@ -1776,6 +1773,7 @@ _mesa_get_fixed_func_vertex_program(GLcontext *ctx)           return NULL;        create_new_program( &key, prog, +                          ctx->mvp_with_dp4,                            ctx->Const.VertexProgram.MaxTemps );  #if 0 diff --git a/src/mesa/main/mtypes.h b/src/mesa/main/mtypes.h index cf71077728..587dc80146 100644 --- a/src/mesa/main/mtypes.h +++ b/src/mesa/main/mtypes.h @@ -2980,6 +2980,12 @@ struct __GLcontextRec     /** software compression/decompression supported or not */     GLboolean Mesa_DXTn; +   /**  +    * Use dp4 (rather than mul/mad) instructions for position +    * transformation? +    */ +   GLboolean mvp_with_dp4; +     /** Core tnl module support */     struct gl_tnl_module TnlModule; diff --git a/src/mesa/shader/programopt.c b/src/mesa/shader/programopt.c index ecd98dc85c..f70c75cec8 100644 --- a/src/mesa/shader/programopt.c +++ b/src/mesa/shader/programopt.c @@ -45,8 +45,8 @@   * into a vertex program.   * May be used to implement the position_invariant option.   */ -void -_mesa_insert_mvp_code(GLcontext *ctx, struct gl_vertex_program *vprog) +static void +_mesa_insert_mvp_dp4_code(GLcontext *ctx, struct gl_vertex_program *vprog)  {     struct prog_instruction *newInst;     const GLuint origLen = vprog->Base.NumInstructions; @@ -113,6 +113,121 @@ _mesa_insert_mvp_code(GLcontext *ctx, struct gl_vertex_program *vprog)  } +static void +_mesa_insert_mvp_mad_code(GLcontext *ctx, struct gl_vertex_program *vprog) +{ +   struct prog_instruction *newInst; +   const GLuint origLen = vprog->Base.NumInstructions; +   const GLuint newLen = origLen + 4; +   GLuint hposTemp; +   GLuint i; + +   /* +    * Setup state references for the modelview/projection matrix. +    * XXX we should check if these state vars are already declared. +    */ +   static const gl_state_index mvpState[4][STATE_LENGTH] = { +      { STATE_MVP_MATRIX, 0, 0, 0, STATE_MATRIX_TRANSPOSE }, +      { STATE_MVP_MATRIX, 0, 1, 1, STATE_MATRIX_TRANSPOSE }, +      { STATE_MVP_MATRIX, 0, 2, 2, STATE_MATRIX_TRANSPOSE }, +      { STATE_MVP_MATRIX, 0, 3, 3, STATE_MATRIX_TRANSPOSE }, +   }; +   GLint mvpRef[4]; + +   for (i = 0; i < 4; i++) { +      mvpRef[i] = _mesa_add_state_reference(vprog->Base.Parameters, +                                            mvpState[i]); +   } + +   /* Alloc storage for new instructions */ +   newInst = _mesa_alloc_instructions(newLen); +   if (!newInst) { +      _mesa_error(ctx, GL_OUT_OF_MEMORY, +                  "glProgramString(inserting position_invariant code)"); +      return; +   } + +   /* TEMP hposTemp; */ +   hposTemp = vprog->Base.NumTemporaries++; + +   /* +    * Generated instructions: +    *    emit_op2(p, OPCODE_MUL, tmp, 0, swizzle1(src,X), mat[0]); +    *    emit_op3(p, OPCODE_MAD, tmp, 0, swizzle1(src,Y), mat[1], tmp); +    *    emit_op3(p, OPCODE_MAD, tmp, 0, swizzle1(src,Z), mat[2], tmp); +    *    emit_op3(p, OPCODE_MAD, dest, 0, swizzle1(src,W), mat[3], tmp); +    */ +   _mesa_init_instructions(newInst, 4); + +   newInst[0].Opcode = OPCODE_MUL; +   newInst[0].DstReg.File = PROGRAM_TEMPORARY; +   newInst[0].DstReg.Index = hposTemp; +   newInst[0].DstReg.WriteMask = WRITEMASK_XYZW; +   newInst[0].SrcReg[0].File = PROGRAM_INPUT; +   newInst[0].SrcReg[0].Index = VERT_ATTRIB_POS; +   newInst[0].SrcReg[0].Swizzle = SWIZZLE_XXXX; +   newInst[0].SrcReg[1].File = PROGRAM_STATE_VAR; +   newInst[0].SrcReg[1].Index = mvpRef[0]; +   newInst[0].SrcReg[1].Swizzle = SWIZZLE_NOOP; + +   for (i = 1; i <= 2; i++) { +      newInst[i].Opcode = OPCODE_MAD; +      newInst[i].DstReg.File = PROGRAM_TEMPORARY; +      newInst[i].DstReg.Index = hposTemp; +      newInst[i].DstReg.WriteMask = WRITEMASK_XYZW; +      newInst[i].SrcReg[0].File = PROGRAM_INPUT; +      newInst[i].SrcReg[0].Index = VERT_ATTRIB_POS; +      newInst[i].SrcReg[0].Swizzle = MAKE_SWIZZLE4(i,i,i,i); +      newInst[i].SrcReg[1].File = PROGRAM_STATE_VAR; +      newInst[i].SrcReg[1].Index = mvpRef[i]; +      newInst[i].SrcReg[1].Swizzle = SWIZZLE_NOOP; +      newInst[i].SrcReg[2].File = PROGRAM_TEMPORARY; +      newInst[i].SrcReg[2].Index = hposTemp; +      newInst[1].SrcReg[2].Swizzle = SWIZZLE_NOOP; +   } + +   newInst[3].Opcode = OPCODE_MAD; +   newInst[3].DstReg.File = PROGRAM_OUTPUT; +   newInst[3].DstReg.Index = VERT_RESULT_HPOS; +   newInst[3].DstReg.WriteMask = WRITEMASK_XYZW; +   newInst[3].SrcReg[0].File = PROGRAM_INPUT; +   newInst[3].SrcReg[0].Index = VERT_ATTRIB_POS; +   newInst[3].SrcReg[0].Swizzle = SWIZZLE_WWWW; +   newInst[3].SrcReg[1].File = PROGRAM_STATE_VAR; +   newInst[3].SrcReg[1].Index = mvpRef[3]; +   newInst[3].SrcReg[1].Swizzle = SWIZZLE_NOOP; +   newInst[3].SrcReg[2].File = PROGRAM_TEMPORARY; +   newInst[3].SrcReg[2].Index = hposTemp; +   newInst[3].SrcReg[2].Swizzle = SWIZZLE_NOOP; + + +   /* Append original instructions after new instructions */ +   _mesa_copy_instructions (newInst + 4, vprog->Base.Instructions, origLen); + +   /* free old instructions */ +   _mesa_free_instructions(vprog->Base.Instructions, origLen); + +   /* install new instructions */ +   vprog->Base.Instructions = newInst; +   vprog->Base.NumInstructions = newLen; +   vprog->Base.InputsRead |= VERT_BIT_POS; +   vprog->Base.OutputsWritten |= (1 << VERT_RESULT_HPOS); +} + + +void +_mesa_insert_mvp_code(GLcontext *ctx, struct gl_vertex_program *vprog) +{ +   if (ctx->mvp_with_dp4)  +      _mesa_insert_mvp_dp4_code( ctx, vprog ); +   else +      _mesa_insert_mvp_mad_code( ctx, vprog ); +} +       + + + +  /**   * Append extra instructions onto the given fragment program to implement diff --git a/src/mesa/state_tracker/st_context.c b/src/mesa/state_tracker/st_context.c index 92a630eff9..2a1f21c51c 100644 --- a/src/mesa/state_tracker/st_context.c +++ b/src/mesa/state_tracker/st_context.c @@ -177,6 +177,12 @@ struct st_context *st_create_context(struct pipe_context *pipe,     ctx = _mesa_create_context(visual, shareCtx, &funcs, NULL); +   /* XXX: need a capability bit in gallium to query if the pipe +    * driver prefers DP4 or MUL/MAD for vertex transformation. +    */ +   if (debug_get_bool_option("MESA_MVP_DP4", FALSE)) +      _mesa_set_mvp_with_dp4( ctx, GL_TRUE ); +     return st_create_context_priv(ctx, pipe);  } | 
