diff options
Diffstat (limited to 'mesalib/src/mesa/program')
| -rw-r--r-- | mesalib/src/mesa/program/arbprogparse.c | 18 | ||||
| -rw-r--r-- | mesalib/src/mesa/program/hash_table.c | 19 | ||||
| -rw-r--r-- | mesalib/src/mesa/program/hash_table.h | 7 | ||||
| -rw-r--r-- | mesalib/src/mesa/program/prog_optimize.c | 89 | ||||
| -rw-r--r-- | mesalib/src/mesa/program/program.c | 2153 | ||||
| -rw-r--r-- | mesalib/src/mesa/program/program_parse.y | 11 | ||||
| -rw-r--r-- | mesalib/src/mesa/program/programopt.c | 33 | ||||
| -rw-r--r-- | mesalib/src/mesa/program/programopt.h | 4 | 
8 files changed, 1229 insertions, 1105 deletions
| diff --git a/mesalib/src/mesa/program/arbprogparse.c b/mesalib/src/mesa/program/arbprogparse.c index 7f778c3c3..dffc8abf7 100644 --- a/mesalib/src/mesa/program/arbprogparse.c +++ b/mesalib/src/mesa/program/arbprogparse.c @@ -116,20 +116,11 @@ _mesa_parse_arb_fragment_program(struct gl_context* ctx, GLenum target,           program->Base.SamplersUsed |= (1 << i);     }     program->Base.ShadowSamplers = prog.ShadowSamplers; -   switch (state.option.Fog) { -   case OPTION_FOG_EXP:    program->FogOption = GL_EXP;    break; -   case OPTION_FOG_EXP2:   program->FogOption = GL_EXP2;   break; -   case OPTION_FOG_LINEAR: program->FogOption = GL_LINEAR; break; -   default:                program->FogOption = GL_NONE;   break; -   }     program->OriginUpperLeft = state.option.OriginUpperLeft;     program->PixelCenterInteger = state.option.PixelCenterInteger;     program->UsesKill            = state.fragment.UsesKill; -   if (program->FogOption) -      program->Base.InputsRead |= FRAG_BIT_FOGC; -     if (program->Base.Instructions)        free(program->Base.Instructions);     program->Base.Instructions = prog.Instructions; @@ -143,12 +134,15 @@ _mesa_parse_arb_fragment_program(struct gl_context* ctx, GLenum target,      * there's no hardware that wants to do fog in a discrete stage separate      * from the fragment shader.      */ -   if (program->FogOption != GL_NONE) { +   if (state.option.Fog != OPTION_NONE) { +      static const GLenum fog_modes[4] = { +	 GL_NONE, GL_EXP, GL_EXP2, GL_LINEAR +      }; +        /* XXX: we should somehow recompile this to remove clamping if disabled         * On the ATI driver, this is unclampled if fragment clamping is disabled         */ -      _mesa_append_fog_code(ctx, program, GL_TRUE); -      program->FogOption = GL_NONE; +      _mesa_append_fog_code(ctx, program, fog_modes[state.option.Fog], GL_TRUE);     }  #if DEBUG_FP diff --git a/mesalib/src/mesa/program/hash_table.c b/mesalib/src/mesa/program/hash_table.c index f7ef366c1..877a9e2ff 100644 --- a/mesalib/src/mesa/program/hash_table.c +++ b/mesalib/src/mesa/program/hash_table.c @@ -160,6 +160,25 @@ hash_table_remove(struct hash_table *ht, const void *key)      }  } +void +hash_table_call_foreach(struct hash_table *ht, +			void (*callback)(const void *key, +					 void *data, +					 void *closure), +			void *closure) +{ +   int bucket; + +   for (bucket = 0; bucket < ht->num_buckets; bucket++) { +      struct node *node, *temp; +      foreach_s(node, temp, &ht->buckets[bucket]) { +	 struct hash_node *hn = (struct hash_node *) node; + +	 callback(hn->key, hn->data, closure); +      } +   } +} +  unsigned  hash_table_string_hash(const void *key)  { diff --git a/mesalib/src/mesa/program/hash_table.h b/mesalib/src/mesa/program/hash_table.h index f1c4fdcd1..e715bb1cc 100644 --- a/mesalib/src/mesa/program/hash_table.h +++ b/mesalib/src/mesa/program/hash_table.h @@ -144,6 +144,13 @@ hash_table_pointer_hash(const void *key);  int  hash_table_pointer_compare(const void *key1, const void *key2); +void +hash_table_call_foreach(struct hash_table *ht, +			void (*callback)(const void *key, +					 void *data, +					 void *closure), +			void *closure); +  #ifdef __cplusplus  }  #endif diff --git a/mesalib/src/mesa/program/prog_optimize.c b/mesalib/src/mesa/program/prog_optimize.c index 164297a34..11debc485 100644 --- a/mesalib/src/mesa/program/prog_optimize.c +++ b/mesalib/src/mesa/program/prog_optimize.c @@ -74,6 +74,17 @@ get_src_arg_mask(const struct prog_instruction *inst,        case OPCODE_MAD:        case OPCODE_MUL:        case OPCODE_SUB: +      case OPCODE_CMP: +      case OPCODE_FLR: +      case OPCODE_FRC: +      case OPCODE_LRP: +      case OPCODE_SEQ: +      case OPCODE_SGE: +      case OPCODE_SGT: +      case OPCODE_SLE: +      case OPCODE_SLT: +      case OPCODE_SNE: +      case OPCODE_SSG:           channel_mask = inst->DstReg.WriteMask & dst_mask;           break;        case OPCODE_RCP: @@ -1235,6 +1246,83 @@ print_it(struct gl_context *ctx, struct gl_program *program, const char *txt) {  }  #endif +/** + * This pass replaces CMP T0, T1 T2 T0 with MOV T0, T2 when the CMP + * instruction is the first instruction to write to register T0.  The are + * several lowering passes done in GLSL IR (e.g. branches and + * relative addressing) that create a large number of conditional assignments + * that ir_to_mesa converts to CMP instructions like the one mentioned above. + * + * Here is why this conversion is safe: + * CMP T0, T1 T2 T0 can be expanded to: + * if (T1 < 0.0) + * 	MOV T0, T2; + * else + * 	MOV T0, T0; + * + * If (T1 < 0.0) evaluates to true then our replacement MOV T0, T2 is the same + * as the original program.  If (T1 < 0.0) evaluates to false, executing + * MOV T0, T0 will store a garbage value in T0 since T0 is uninitialized. + * Therefore, it doesn't matter that we are replacing MOV T0, T0 with MOV T0, T2 + * because any instruction that was going to read from T0 after this was going + * to read a garbage value anyway. + */ +static void +_mesa_simplify_cmp(struct gl_program * program) +{ +   GLuint tempWrites[REG_ALLOCATE_MAX_PROGRAM_TEMPS]; +   GLuint outputWrites[MAX_PROGRAM_OUTPUTS]; +   GLuint i; + +   if (dbg) { +      printf("Optimize: Begin reads without writes\n"); +      _mesa_print_program(program); +   } + +   for (i = 0; i < REG_ALLOCATE_MAX_PROGRAM_TEMPS; i++) { +      tempWrites[i] = 0; +   } + +   for (i = 0; i < MAX_PROGRAM_OUTPUTS; i++) { +      outputWrites[i] = 0; +   } + +   for (i = 0; i < program->NumInstructions; i++) { +      struct prog_instruction *inst = program->Instructions + i; +      GLuint prevWriteMask; + +      /* Give up if we encounter relative addressing or flow control. */ +      if (_mesa_is_flow_control_opcode(inst->Opcode) || inst->DstReg.RelAddr) { +         return; +      } + +      if (inst->DstReg.File == PROGRAM_OUTPUT) { +         assert(inst->DstReg.Index < MAX_PROGRAM_OUTPUTS); +         prevWriteMask = outputWrites[inst->DstReg.Index]; +         outputWrites[inst->DstReg.Index] |= inst->DstReg.WriteMask; +      } else if (inst->DstReg.File == PROGRAM_TEMPORARY) { +         assert(inst->DstReg.Index < REG_ALLOCATE_MAX_PROGRAM_TEMPS); +         prevWriteMask = tempWrites[inst->DstReg.Index]; +         tempWrites[inst->DstReg.Index] |= inst->DstReg.WriteMask; +      } + +      /* For a CMP to be considered a conditional write, the destination +       * register and source register two must be the same. */ +      if (inst->Opcode == OPCODE_CMP +          && !(inst->DstReg.WriteMask & prevWriteMask) +          && inst->SrcReg[2].File == inst->DstReg.File +          && inst->SrcReg[2].Index == inst->DstReg.Index +          && inst->DstReg.WriteMask == get_src_arg_mask(inst, 2, NO_MASK)) { + +         inst->Opcode = OPCODE_MOV; +         inst->SrcReg[0] = inst->SrcReg[1]; +      } +   } +   if (dbg) { +      printf("Optimize: End reads without writes\n"); +      _mesa_print_program(program); +   } +}  /**   * Apply optimizations to the given program to eliminate unnecessary @@ -1245,6 +1333,7 @@ _mesa_optimize_program(struct gl_context *ctx, struct gl_program *program)  {     GLboolean any_change; +   _mesa_simplify_cmp(program);     /* Stop when no modifications were output */     do {        any_change = GL_FALSE; diff --git a/mesalib/src/mesa/program/program.c b/mesalib/src/mesa/program/program.c index 812c0dc50..78efca9f1 100644 --- a/mesalib/src/mesa/program/program.c +++ b/mesalib/src/mesa/program/program.c @@ -1,1077 +1,1076 @@ -/*
 - * Mesa 3-D graphics library
 - * Version:  6.5.3
 - *
 - * Copyright (C) 1999-2007  Brian Paul   All Rights Reserved.
 - *
 - * Permission is hereby granted, free of charge, to any person obtaining a
 - * copy of this software and associated documentation files (the "Software"),
 - * to deal in the Software without restriction, including without limitation
 - * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 - * and/or sell copies of the Software, and to permit persons to whom the
 - * Software is furnished to do so, subject to the following conditions:
 - *
 - * The above copyright notice and this permission notice shall be included
 - * in all copies or substantial portions of the Software.
 - *
 - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 - * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 - * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 - * BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
 - * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 - * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 - */
 -
 -/**
 - * \file program.c
 - * Vertex and fragment program support functions.
 - * \author Brian Paul
 - */
 -
 -
 -#include "main/glheader.h"
 -#include "main/context.h"
 -#include "main/hash.h"
 -#include "main/mfeatures.h"
 -#include "program.h"
 -#include "prog_cache.h"
 -#include "prog_parameter.h"
 -#include "prog_instruction.h"
 -
 -
 -/**
 - * A pointer to this dummy program is put into the hash table when
 - * glGenPrograms is called.
 - */
 -struct gl_program _mesa_DummyProgram;
 -
 -
 -/**
 - * Init context's vertex/fragment program state
 - */
 -void
 -_mesa_init_program(struct gl_context *ctx)
 -{
 -   GLuint i;
 -
 -   /*
 -    * If this assertion fails, we need to increase the field
 -    * size for register indexes (see INST_INDEX_BITS).
 -    */
 -   ASSERT(ctx->Const.VertexProgram.MaxUniformComponents / 4
 -          <= (1 << INST_INDEX_BITS));
 -   ASSERT(ctx->Const.FragmentProgram.MaxUniformComponents / 4
 -          <= (1 << INST_INDEX_BITS));
 -
 -   ASSERT(ctx->Const.VertexProgram.MaxTemps <= (1 << INST_INDEX_BITS));
 -   ASSERT(ctx->Const.VertexProgram.MaxLocalParams <= (1 << INST_INDEX_BITS));
 -   ASSERT(ctx->Const.FragmentProgram.MaxTemps <= (1 << INST_INDEX_BITS));
 -   ASSERT(ctx->Const.FragmentProgram.MaxLocalParams <= (1 << INST_INDEX_BITS));
 -
 -   ASSERT(ctx->Const.VertexProgram.MaxUniformComponents <= 4 * MAX_UNIFORMS);
 -   ASSERT(ctx->Const.FragmentProgram.MaxUniformComponents <= 4 * MAX_UNIFORMS);
 -
 -   ASSERT(ctx->Const.VertexProgram.MaxAddressOffset <= (1 << INST_INDEX_BITS));
 -   ASSERT(ctx->Const.FragmentProgram.MaxAddressOffset <= (1 << INST_INDEX_BITS));
 -
 -   /* If this fails, increase prog_instruction::TexSrcUnit size */
 -   ASSERT(MAX_TEXTURE_UNITS <= (1 << 5));
 -
 -   /* If this fails, increase prog_instruction::TexSrcTarget size */
 -   ASSERT(NUM_TEXTURE_TARGETS <= (1 << 3));
 -
 -   ctx->Program.ErrorPos = -1;
 -   ctx->Program.ErrorString = _mesa_strdup("");
 -
 -#if FEATURE_NV_vertex_program || FEATURE_ARB_vertex_program
 -   ctx->VertexProgram.Enabled = GL_FALSE;
 -#if FEATURE_es2_glsl
 -   ctx->VertexProgram.PointSizeEnabled =
 -      (ctx->API == API_OPENGLES2) ? GL_TRUE : GL_FALSE;
 -#else
 -   ctx->VertexProgram.PointSizeEnabled = GL_FALSE;
 -#endif
 -   ctx->VertexProgram.TwoSideEnabled = GL_FALSE;
 -   _mesa_reference_vertprog(ctx, &ctx->VertexProgram.Current,
 -                            ctx->Shared->DefaultVertexProgram);
 -   assert(ctx->VertexProgram.Current);
 -   for (i = 0; i < MAX_NV_VERTEX_PROGRAM_PARAMS / 4; i++) {
 -      ctx->VertexProgram.TrackMatrix[i] = GL_NONE;
 -      ctx->VertexProgram.TrackMatrixTransform[i] = GL_IDENTITY_NV;
 -   }
 -   ctx->VertexProgram.Cache = _mesa_new_program_cache();
 -#endif
 -
 -#if FEATURE_NV_fragment_program || FEATURE_ARB_fragment_program
 -   ctx->FragmentProgram.Enabled = GL_FALSE;
 -   _mesa_reference_fragprog(ctx, &ctx->FragmentProgram.Current,
 -                            ctx->Shared->DefaultFragmentProgram);
 -   assert(ctx->FragmentProgram.Current);
 -   ctx->FragmentProgram.Cache = _mesa_new_program_cache();
 -#endif
 -
 -#if FEATURE_ARB_geometry_shader4
 -   ctx->GeometryProgram.Enabled = GL_FALSE;
 -   /* right now by default we don't have a geometry program */
 -   _mesa_reference_geomprog(ctx, &ctx->GeometryProgram.Current,
 -                            NULL);
 -   ctx->GeometryProgram.Cache = _mesa_new_program_cache();
 -#endif
 -
 -   /* XXX probably move this stuff */
 -#if FEATURE_ATI_fragment_shader
 -   ctx->ATIFragmentShader.Enabled = GL_FALSE;
 -   ctx->ATIFragmentShader.Current = ctx->Shared->DefaultFragmentShader;
 -   assert(ctx->ATIFragmentShader.Current);
 -   ctx->ATIFragmentShader.Current->RefCount++;
 -#endif
 -}
 -
 -
 -/**
 - * Free a context's vertex/fragment program state
 - */
 -void
 -_mesa_free_program_data(struct gl_context *ctx)
 -{
 -#if FEATURE_NV_vertex_program || FEATURE_ARB_vertex_program
 -   _mesa_reference_vertprog(ctx, &ctx->VertexProgram.Current, NULL);
 -   _mesa_delete_program_cache(ctx, ctx->VertexProgram.Cache);
 -#endif
 -#if FEATURE_NV_fragment_program || FEATURE_ARB_fragment_program
 -   _mesa_reference_fragprog(ctx, &ctx->FragmentProgram.Current, NULL);
 -   _mesa_delete_program_cache(ctx, ctx->FragmentProgram.Cache);
 -#endif
 -#if FEATURE_ARB_geometry_shader4
 -   _mesa_reference_geomprog(ctx, &ctx->GeometryProgram.Current, NULL);
 -   _mesa_delete_program_cache(ctx, ctx->GeometryProgram.Cache);
 -#endif
 -   /* XXX probably move this stuff */
 -#if FEATURE_ATI_fragment_shader
 -   if (ctx->ATIFragmentShader.Current) {
 -      ctx->ATIFragmentShader.Current->RefCount--;
 -      if (ctx->ATIFragmentShader.Current->RefCount <= 0) {
 -         free(ctx->ATIFragmentShader.Current);
 -      }
 -   }
 -#endif
 -   free((void *) ctx->Program.ErrorString);
 -}
 -
 -
 -/**
 - * Update the default program objects in the given context to reference those
 - * specified in the shared state and release those referencing the old
 - * shared state.
 - */
 -void
 -_mesa_update_default_objects_program(struct gl_context *ctx)
 -{
 -#if FEATURE_NV_vertex_program || FEATURE_ARB_vertex_program
 -   _mesa_reference_vertprog(ctx, &ctx->VertexProgram.Current,
 -                            (struct gl_vertex_program *)
 -                            ctx->Shared->DefaultVertexProgram);
 -   assert(ctx->VertexProgram.Current);
 -#endif
 -
 -#if FEATURE_NV_fragment_program || FEATURE_ARB_fragment_program
 -   _mesa_reference_fragprog(ctx, &ctx->FragmentProgram.Current,
 -                            (struct gl_fragment_program *)
 -                            ctx->Shared->DefaultFragmentProgram);
 -   assert(ctx->FragmentProgram.Current);
 -#endif
 -
 -#if FEATURE_ARB_geometry_shader4
 -   _mesa_reference_geomprog(ctx, &ctx->GeometryProgram.Current,
 -                            (struct gl_geometry_program *)
 -                            ctx->Shared->DefaultGeometryProgram);
 -#endif
 -
 -   /* XXX probably move this stuff */
 -#if FEATURE_ATI_fragment_shader
 -   if (ctx->ATIFragmentShader.Current) {
 -      ctx->ATIFragmentShader.Current->RefCount--;
 -      if (ctx->ATIFragmentShader.Current->RefCount <= 0) {
 -         free(ctx->ATIFragmentShader.Current);
 -      }
 -   }
 -   ctx->ATIFragmentShader.Current = (struct ati_fragment_shader *) ctx->Shared->DefaultFragmentShader;
 -   assert(ctx->ATIFragmentShader.Current);
 -   ctx->ATIFragmentShader.Current->RefCount++;
 -#endif
 -}
 -
 -
 -/**
 - * Set the vertex/fragment program error state (position and error string).
 - * This is generally called from within the parsers.
 - */
 -void
 -_mesa_set_program_error(struct gl_context *ctx, GLint pos, const char *string)
 -{
 -   ctx->Program.ErrorPos = pos;
 -   free((void *) ctx->Program.ErrorString);
 -   if (!string)
 -      string = "";
 -   ctx->Program.ErrorString = _mesa_strdup(string);
 -}
 -
 -
 -/**
 - * Find the line number and column for 'pos' within 'string'.
 - * Return a copy of the line which contains 'pos'.  Free the line with
 - * free().
 - * \param string  the program string
 - * \param pos     the position within the string
 - * \param line    returns the line number corresponding to 'pos'.
 - * \param col     returns the column number corresponding to 'pos'.
 - * \return copy of the line containing 'pos'.
 - */
 -const GLubyte *
 -_mesa_find_line_column(const GLubyte *string, const GLubyte *pos,
 -                       GLint *line, GLint *col)
 -{
 -   const GLubyte *lineStart = string;
 -   const GLubyte *p = string;
 -   GLubyte *s;
 -   int len;
 -
 -   *line = 1;
 -
 -   while (p != pos) {
 -      if (*p == (GLubyte) '\n') {
 -         (*line)++;
 -         lineStart = p + 1;
 -      }
 -      p++;
 -   }
 -
 -   *col = (pos - lineStart) + 1;
 -
 -   /* return copy of this line */
 -   while (*p != 0 && *p != '\n')
 -      p++;
 -   len = p - lineStart;
 -   s = (GLubyte *) malloc(len + 1);
 -   memcpy(s, lineStart, len);
 -   s[len] = 0;
 -
 -   return s;
 -}
 -
 -
 -/**
 - * Initialize a new vertex/fragment program object.
 - */
 -static struct gl_program *
 -_mesa_init_program_struct( struct gl_context *ctx, struct gl_program *prog,
 -                           GLenum target, GLuint id)
 -{
 -   (void) ctx;
 -   if (prog) {
 -      GLuint i;
 -      memset(prog, 0, sizeof(*prog));
 -      prog->Id = id;
 -      prog->Target = target;
 -      prog->Resident = GL_TRUE;
 -      prog->RefCount = 1;
 -      prog->Format = GL_PROGRAM_FORMAT_ASCII_ARB;
 -
 -      /* default mapping from samplers to texture units */
 -      for (i = 0; i < MAX_SAMPLERS; i++)
 -         prog->SamplerUnits[i] = i;
 -   }
 -
 -   return prog;
 -}
 -
 -
 -/**
 - * Initialize a new fragment program object.
 - */
 -struct gl_program *
 -_mesa_init_fragment_program( struct gl_context *ctx, struct gl_fragment_program *prog,
 -                             GLenum target, GLuint id)
 -{
 -   if (prog)
 -      return _mesa_init_program_struct( ctx, &prog->Base, target, id );
 -   else
 -      return NULL;
 -}
 -
 -
 -/**
 - * Initialize a new vertex program object.
 - */
 -struct gl_program *
 -_mesa_init_vertex_program( struct gl_context *ctx, struct gl_vertex_program *prog,
 -                           GLenum target, GLuint id)
 -{
 -   if (prog)
 -      return _mesa_init_program_struct( ctx, &prog->Base, target, id );
 -   else
 -      return NULL;
 -}
 -
 -
 -/**
 - * Initialize a new geometry program object.
 - */
 -struct gl_program *
 -_mesa_init_geometry_program( struct gl_context *ctx, struct gl_geometry_program *prog,
 -                             GLenum target, GLuint id)
 -{
 -   if (prog)
 -      return _mesa_init_program_struct( ctx, &prog->Base, target, id );
 -   else
 -      return NULL;
 -}
 -
 -
 -/**
 - * Allocate and initialize a new fragment/vertex program object but
 - * don't put it into the program hash table.  Called via
 - * ctx->Driver.NewProgram.  May be overridden (ie. replaced) by a
 - * device driver function to implement OO deriviation with additional
 - * types not understood by this function.
 - *
 - * \param ctx  context
 - * \param id   program id/number
 - * \param target  program target/type
 - * \return  pointer to new program object
 - */
 -struct gl_program *
 -_mesa_new_program(struct gl_context *ctx, GLenum target, GLuint id)
 -{
 -   struct gl_program *prog;
 -   switch (target) {
 -   case GL_VERTEX_PROGRAM_ARB: /* == GL_VERTEX_PROGRAM_NV */
 -   case GL_VERTEX_STATE_PROGRAM_NV:
 -      prog = _mesa_init_vertex_program(ctx, CALLOC_STRUCT(gl_vertex_program),
 -                                       target, id );
 -      break;
 -   case GL_FRAGMENT_PROGRAM_NV:
 -   case GL_FRAGMENT_PROGRAM_ARB:
 -      prog =_mesa_init_fragment_program(ctx,
 -                                         CALLOC_STRUCT(gl_fragment_program),
 -                                         target, id );
 -      break;
 -   case MESA_GEOMETRY_PROGRAM:
 -      prog = _mesa_init_geometry_program(ctx,
 -                                         CALLOC_STRUCT(gl_geometry_program),
 -                                         target, id);
 -      break;
 -   default:
 -      _mesa_problem(ctx, "bad target in _mesa_new_program");
 -      prog = NULL;
 -   }
 -   return prog;
 -}
 -
 -
 -/**
 - * Delete a program and remove it from the hash table, ignoring the
 - * reference count.
 - * Called via ctx->Driver.DeleteProgram.  May be wrapped (OO deriviation)
 - * by a device driver function.
 - */
 -void
 -_mesa_delete_program(struct gl_context *ctx, struct gl_program *prog)
 -{
 -   (void) ctx;
 -   ASSERT(prog);
 -   ASSERT(prog->RefCount==0);
 -
 -   if (prog == &_mesa_DummyProgram)
 -      return;
 -
 -   if (prog->String)
 -      free(prog->String);
 -
 -   _mesa_free_instructions(prog->Instructions, prog->NumInstructions);
 -
 -   if (prog->Parameters) {
 -      _mesa_free_parameter_list(prog->Parameters);
 -   }
 -   if (prog->Varying) {
 -      _mesa_free_parameter_list(prog->Varying);
 -   }
 -   if (prog->Attributes) {
 -      _mesa_free_parameter_list(prog->Attributes);
 -   }
 -
 -   free(prog);
 -}
 -
 -
 -/**
 - * Return the gl_program object for a given ID.
 - * Basically just a wrapper for _mesa_HashLookup() to avoid a lot of
 - * casts elsewhere.
 - */
 -struct gl_program *
 -_mesa_lookup_program(struct gl_context *ctx, GLuint id)
 -{
 -   if (id)
 -      return (struct gl_program *) _mesa_HashLookup(ctx->Shared->Programs, id);
 -   else
 -      return NULL;
 -}
 -
 -
 -/**
 - * Reference counting for vertex/fragment programs
 - */
 -void
 -_mesa_reference_program(struct gl_context *ctx,
 -                        struct gl_program **ptr,
 -                        struct gl_program *prog)
 -{
 -   assert(ptr);
 -   if (*ptr && prog) {
 -      /* sanity check */
 -      if ((*ptr)->Target == GL_VERTEX_PROGRAM_ARB)
 -         ASSERT(prog->Target == GL_VERTEX_PROGRAM_ARB);
 -      else if ((*ptr)->Target == GL_FRAGMENT_PROGRAM_ARB)
 -         ASSERT(prog->Target == GL_FRAGMENT_PROGRAM_ARB ||
 -                prog->Target == GL_FRAGMENT_PROGRAM_NV);
 -      else if ((*ptr)->Target == MESA_GEOMETRY_PROGRAM)
 -         ASSERT(prog->Target == MESA_GEOMETRY_PROGRAM);
 -   }
 -   if (*ptr == prog) {
 -      return;  /* no change */
 -   }
 -   if (*ptr) {
 -      GLboolean deleteFlag;
 -
 -      /*_glthread_LOCK_MUTEX((*ptr)->Mutex);*/
 -#if 0
 -      printf("Program %p ID=%u Target=%s  Refcount-- to %d\n",
 -             *ptr, (*ptr)->Id,
 -             ((*ptr)->Target == GL_VERTEX_PROGRAM_ARB ? "VP" :
 -              ((*ptr)->Target == MESA_GEOMETRY_PROGRAM ? "GP" : "FP")),
 -             (*ptr)->RefCount - 1);
 -#endif
 -      ASSERT((*ptr)->RefCount > 0);
 -      (*ptr)->RefCount--;
 -
 -      deleteFlag = ((*ptr)->RefCount == 0);
 -      /*_glthread_UNLOCK_MUTEX((*ptr)->Mutex);*/
 -
 -      if (deleteFlag) {
 -         ASSERT(ctx);
 -         ctx->Driver.DeleteProgram(ctx, *ptr);
 -      }
 -
 -      *ptr = NULL;
 -   }
 -
 -   assert(!*ptr);
 -   if (prog) {
 -      /*_glthread_LOCK_MUTEX(prog->Mutex);*/
 -      prog->RefCount++;
 -#if 0
 -      printf("Program %p ID=%u Target=%s  Refcount++ to %d\n",
 -             prog, prog->Id,
 -             (prog->Target == GL_VERTEX_PROGRAM_ARB ? "VP" :
 -              (prog->Target == MESA_GEOMETRY_PROGRAM ? "GP" : "FP")),
 -             prog->RefCount);
 -#endif
 -      /*_glthread_UNLOCK_MUTEX(prog->Mutex);*/
 -   }
 -
 -   *ptr = prog;
 -}
 -
 -
 -/**
 - * Return a copy of a program.
 - * XXX Problem here if the program object is actually OO-derivation
 - * made by a device driver.
 - */
 -struct gl_program *
 -_mesa_clone_program(struct gl_context *ctx, const struct gl_program *prog)
 -{
 -   struct gl_program *clone;
 -
 -   clone = ctx->Driver.NewProgram(ctx, prog->Target, prog->Id);
 -   if (!clone)
 -      return NULL;
 -
 -   assert(clone->Target == prog->Target);
 -   assert(clone->RefCount == 1);
 -
 -   clone->String = (GLubyte *) _mesa_strdup((char *) prog->String);
 -   clone->Format = prog->Format;
 -   clone->Instructions = _mesa_alloc_instructions(prog->NumInstructions);
 -   if (!clone->Instructions) {
 -      _mesa_reference_program(ctx, &clone, NULL);
 -      return NULL;
 -   }
 -   _mesa_copy_instructions(clone->Instructions, prog->Instructions,
 -                           prog->NumInstructions);
 -   clone->InputsRead = prog->InputsRead;
 -   clone->OutputsWritten = prog->OutputsWritten;
 -   clone->SamplersUsed = prog->SamplersUsed;
 -   clone->ShadowSamplers = prog->ShadowSamplers;
 -   memcpy(clone->TexturesUsed, prog->TexturesUsed, sizeof(prog->TexturesUsed));
 -
 -   if (prog->Parameters)
 -      clone->Parameters = _mesa_clone_parameter_list(prog->Parameters);
 -   memcpy(clone->LocalParams, prog->LocalParams, sizeof(clone->LocalParams));
 -   if (prog->Varying)
 -      clone->Varying = _mesa_clone_parameter_list(prog->Varying);
 -   if (prog->Attributes)
 -      clone->Attributes = _mesa_clone_parameter_list(prog->Attributes);
 -   memcpy(clone->LocalParams, prog->LocalParams, sizeof(clone->LocalParams));
 -   clone->IndirectRegisterFiles = prog->IndirectRegisterFiles;
 -   clone->NumInstructions = prog->NumInstructions;
 -   clone->NumTemporaries = prog->NumTemporaries;
 -   clone->NumParameters = prog->NumParameters;
 -   clone->NumAttributes = prog->NumAttributes;
 -   clone->NumAddressRegs = prog->NumAddressRegs;
 -   clone->NumNativeInstructions = prog->NumNativeInstructions;
 -   clone->NumNativeTemporaries = prog->NumNativeTemporaries;
 -   clone->NumNativeParameters = prog->NumNativeParameters;
 -   clone->NumNativeAttributes = prog->NumNativeAttributes;
 -   clone->NumNativeAddressRegs = prog->NumNativeAddressRegs;
 -   clone->NumAluInstructions = prog->NumAluInstructions;
 -   clone->NumTexInstructions = prog->NumTexInstructions;
 -   clone->NumTexIndirections = prog->NumTexIndirections;
 -   clone->NumNativeAluInstructions = prog->NumNativeAluInstructions;
 -   clone->NumNativeTexInstructions = prog->NumNativeTexInstructions;
 -   clone->NumNativeTexIndirections = prog->NumNativeTexIndirections;
 -
 -   switch (prog->Target) {
 -   case GL_VERTEX_PROGRAM_ARB:
 -      {
 -         const struct gl_vertex_program *vp
 -            = (const struct gl_vertex_program *) prog;
 -         struct gl_vertex_program *vpc = (struct gl_vertex_program *) clone;
 -         vpc->IsPositionInvariant = vp->IsPositionInvariant;
 -         vpc->IsNVProgram = vp->IsNVProgram;
 -      }
 -      break;
 -   case GL_FRAGMENT_PROGRAM_ARB:
 -      {
 -         const struct gl_fragment_program *fp
 -            = (const struct gl_fragment_program *) prog;
 -         struct gl_fragment_program *fpc = (struct gl_fragment_program *) clone;
 -         fpc->FogOption = fp->FogOption;
 -         fpc->UsesKill = fp->UsesKill;
 -         fpc->OriginUpperLeft = fp->OriginUpperLeft;
 -         fpc->PixelCenterInteger = fp->PixelCenterInteger;
 -      }
 -      break;
 -   case MESA_GEOMETRY_PROGRAM:
 -      {
 -         const struct gl_geometry_program *gp
 -            = (const struct gl_geometry_program *) prog;
 -         struct gl_geometry_program *gpc = (struct gl_geometry_program *) clone;
 -         gpc->VerticesOut = gp->VerticesOut;
 -         gpc->InputType = gp->InputType;
 -         gpc->OutputType = gp->OutputType;
 -      }
 -      break;
 -   default:
 -      _mesa_problem(NULL, "Unexpected target in _mesa_clone_program");
 -   }
 -
 -   return clone;
 -}
 -
 -
 -/**
 - * Insert 'count' NOP instructions at 'start' in the given program.
 - * Adjust branch targets accordingly.
 - */
 -GLboolean
 -_mesa_insert_instructions(struct gl_program *prog, GLuint start, GLuint count)
 -{
 -   const GLuint origLen = prog->NumInstructions;
 -   const GLuint newLen = origLen + count;
 -   struct prog_instruction *newInst;
 -   GLuint i;
 -
 -   /* adjust branches */
 -   for (i = 0; i < prog->NumInstructions; i++) {
 -      struct prog_instruction *inst = prog->Instructions + i;
 -      if (inst->BranchTarget > 0) {
 -         if ((GLuint)inst->BranchTarget >= start) {
 -            inst->BranchTarget += count;
 -         }
 -      }
 -   }
 -
 -   /* Alloc storage for new instructions */
 -   newInst = _mesa_alloc_instructions(newLen);
 -   if (!newInst) {
 -      return GL_FALSE;
 -   }
 -
 -   /* Copy 'start' instructions into new instruction buffer */
 -   _mesa_copy_instructions(newInst, prog->Instructions, start);
 -
 -   /* init the new instructions */
 -   _mesa_init_instructions(newInst + start, count);
 -
 -   /* Copy the remaining/tail instructions to new inst buffer */
 -   _mesa_copy_instructions(newInst + start + count,
 -                           prog->Instructions + start,
 -                           origLen - start);
 -
 -   /* free old instructions */
 -   _mesa_free_instructions(prog->Instructions, origLen);
 -
 -   /* install new instructions */
 -   prog->Instructions = newInst;
 -   prog->NumInstructions = newLen;
 -
 -   return GL_TRUE;
 -}
 -
 -/**
 - * Delete 'count' instructions at 'start' in the given program.
 - * Adjust branch targets accordingly.
 - */
 -GLboolean
 -_mesa_delete_instructions(struct gl_program *prog, GLuint start, GLuint count)
 -{
 -   const GLuint origLen = prog->NumInstructions;
 -   const GLuint newLen = origLen - count;
 -   struct prog_instruction *newInst;
 -   GLuint i;
 -
 -   /* adjust branches */
 -   for (i = 0; i < prog->NumInstructions; i++) {
 -      struct prog_instruction *inst = prog->Instructions + i;
 -      if (inst->BranchTarget > 0) {
 -         if (inst->BranchTarget > (GLint) start) {
 -            inst->BranchTarget -= count;
 -         }
 -      }
 -   }
 -
 -   /* Alloc storage for new instructions */
 -   newInst = _mesa_alloc_instructions(newLen);
 -   if (!newInst) {
 -      return GL_FALSE;
 -   }
 -
 -   /* Copy 'start' instructions into new instruction buffer */
 -   _mesa_copy_instructions(newInst, prog->Instructions, start);
 -
 -   /* Copy the remaining/tail instructions to new inst buffer */
 -   _mesa_copy_instructions(newInst + start,
 -                           prog->Instructions + start + count,
 -                           newLen - start);
 -
 -   /* free old instructions */
 -   _mesa_free_instructions(prog->Instructions, origLen);
 -
 -   /* install new instructions */
 -   prog->Instructions = newInst;
 -   prog->NumInstructions = newLen;
 -
 -   return GL_TRUE;
 -}
 -
 -
 -/**
 - * Search instructions for registers that match (oldFile, oldIndex),
 - * replacing them with (newFile, newIndex).
 - */
 -static void
 -replace_registers(struct prog_instruction *inst, GLuint numInst,
 -                  GLuint oldFile, GLuint oldIndex,
 -                  GLuint newFile, GLuint newIndex)
 -{
 -   GLuint i, j;
 -   for (i = 0; i < numInst; i++) {
 -      /* src regs */
 -      for (j = 0; j < _mesa_num_inst_src_regs(inst[i].Opcode); j++) {
 -         if (inst[i].SrcReg[j].File == oldFile &&
 -             inst[i].SrcReg[j].Index == oldIndex) {
 -            inst[i].SrcReg[j].File = newFile;
 -            inst[i].SrcReg[j].Index = newIndex;
 -         }
 -      }
 -      /* dst reg */
 -      if (inst[i].DstReg.File == oldFile && inst[i].DstReg.Index == oldIndex) {
 -         inst[i].DstReg.File = newFile;
 -         inst[i].DstReg.Index = newIndex;
 -      }
 -   }
 -}
 -
 -
 -/**
 - * Search instructions for references to program parameters.  When found,
 - * increment the parameter index by 'offset'.
 - * Used when combining programs.
 - */
 -static void
 -adjust_param_indexes(struct prog_instruction *inst, GLuint numInst,
 -                     GLuint offset)
 -{
 -   GLuint i, j;
 -   for (i = 0; i < numInst; i++) {
 -      for (j = 0; j < _mesa_num_inst_src_regs(inst[i].Opcode); j++) {
 -         GLuint f = inst[i].SrcReg[j].File;
 -         if (f == PROGRAM_CONSTANT ||
 -             f == PROGRAM_UNIFORM ||
 -             f == PROGRAM_STATE_VAR) {
 -            inst[i].SrcReg[j].Index += offset;
 -         }
 -      }
 -   }
 -}
 -
 -
 -/**
 - * Combine two programs into one.  Fix instructions so the outputs of
 - * the first program go to the inputs of the second program.
 - */
 -struct gl_program *
 -_mesa_combine_programs(struct gl_context *ctx,
 -                       const struct gl_program *progA,
 -                       const struct gl_program *progB)
 -{
 -   struct prog_instruction *newInst;
 -   struct gl_program *newProg;
 -   const GLuint lenA = progA->NumInstructions - 1; /* omit END instr */
 -   const GLuint lenB = progB->NumInstructions;
 -   const GLuint numParamsA = _mesa_num_parameters(progA->Parameters);
 -   const GLuint newLength = lenA + lenB;
 -   GLboolean usedTemps[MAX_PROGRAM_TEMPS];
 -   GLuint firstTemp = 0;
 -   GLbitfield inputsB;
 -   GLuint i;
 -
 -   ASSERT(progA->Target == progB->Target);
 -
 -   newInst = _mesa_alloc_instructions(newLength);
 -   if (!newInst)
 -      return GL_FALSE;
 -
 -   _mesa_copy_instructions(newInst, progA->Instructions, lenA);
 -   _mesa_copy_instructions(newInst + lenA, progB->Instructions, lenB);
 -
 -   /* adjust branch / instruction addresses for B's instructions */
 -   for (i = 0; i < lenB; i++) {
 -      newInst[lenA + i].BranchTarget += lenA;
 -   }
 -
 -   newProg = ctx->Driver.NewProgram(ctx, progA->Target, 0);
 -   newProg->Instructions = newInst;
 -   newProg->NumInstructions = newLength;
 -
 -   /* find used temp regs (we may need new temps below) */
 -   _mesa_find_used_registers(newProg, PROGRAM_TEMPORARY,
 -                             usedTemps, MAX_PROGRAM_TEMPS);
 -
 -   if (newProg->Target == GL_FRAGMENT_PROGRAM_ARB) {
 -      struct gl_fragment_program *fprogA, *fprogB, *newFprog;
 -      GLbitfield progB_inputsRead = progB->InputsRead;
 -      GLint progB_colorFile, progB_colorIndex;
 -
 -      fprogA = (struct gl_fragment_program *) progA;
 -      fprogB = (struct gl_fragment_program *) progB;
 -      newFprog = (struct gl_fragment_program *) newProg;
 -
 -      newFprog->UsesKill = fprogA->UsesKill || fprogB->UsesKill;
 -
 -      /* We'll do a search and replace for instances
 -       * of progB_colorFile/progB_colorIndex below...
 -       */
 -      progB_colorFile = PROGRAM_INPUT;
 -      progB_colorIndex = FRAG_ATTRIB_COL0;
 -
 -      /*
 -       * The fragment program may get color from a state var rather than
 -       * a fragment input (vertex output) if it's constant.
 -       * See the texenvprogram.c code.
 -       * So, search the program's parameter list now to see if the program
 -       * gets color from a state var instead of a conventional fragment
 -       * input register.
 -       */
 -      for (i = 0; i < progB->Parameters->NumParameters; i++) {
 -         struct gl_program_parameter *p = &progB->Parameters->Parameters[i];
 -         if (p->Type == PROGRAM_STATE_VAR &&
 -             p->StateIndexes[0] == STATE_INTERNAL &&
 -             p->StateIndexes[1] == STATE_CURRENT_ATTRIB &&
 -             (int) p->StateIndexes[2] == (int) VERT_ATTRIB_COLOR0) {
 -            progB_inputsRead |= FRAG_BIT_COL0;
 -            progB_colorFile = PROGRAM_STATE_VAR;
 -            progB_colorIndex = i;
 -            break;
 -         }
 -      }
 -
 -      /* Connect color outputs of fprogA to color inputs of fprogB, via a
 -       * new temporary register.
 -       */
 -      if ((progA->OutputsWritten & BITFIELD64_BIT(FRAG_RESULT_COLOR)) &&
 -          (progB_inputsRead & FRAG_BIT_COL0)) {
 -         GLint tempReg = _mesa_find_free_register(usedTemps, MAX_PROGRAM_TEMPS,
 -                                                  firstTemp);
 -         if (tempReg < 0) {
 -            _mesa_problem(ctx, "No free temp regs found in "
 -                          "_mesa_combine_programs(), using 31");
 -            tempReg = 31;
 -         }
 -         firstTemp = tempReg + 1;
 -
 -         /* replace writes to result.color[0] with tempReg */
 -         replace_registers(newInst, lenA,
 -                           PROGRAM_OUTPUT, FRAG_RESULT_COLOR,
 -                           PROGRAM_TEMPORARY, tempReg);
 -         /* replace reads from the input color with tempReg */
 -         replace_registers(newInst + lenA, lenB,
 -                           progB_colorFile, progB_colorIndex, /* search for */
 -                           PROGRAM_TEMPORARY, tempReg  /* replace with */ );
 -      }
 -
 -      /* compute combined program's InputsRead */
 -      inputsB = progB_inputsRead;
 -      if (progA->OutputsWritten & BITFIELD64_BIT(FRAG_RESULT_COLOR)) {
 -         inputsB &= ~(1 << FRAG_ATTRIB_COL0);
 -      }
 -      newProg->InputsRead = progA->InputsRead | inputsB;
 -      newProg->OutputsWritten = progB->OutputsWritten;
 -      newProg->SamplersUsed = progA->SamplersUsed | progB->SamplersUsed;
 -   }
 -   else {
 -      /* vertex program */
 -      assert(0);      /* XXX todo */
 -   }
 -
 -   /*
 -    * Merge parameters (uniforms, constants, etc)
 -    */
 -   newProg->Parameters = _mesa_combine_parameter_lists(progA->Parameters,
 -                                                       progB->Parameters);
 -
 -   adjust_param_indexes(newInst + lenA, lenB, numParamsA);
 -
 -
 -   return newProg;
 -}
 -
 -
 -/**
 - * Populate the 'used' array with flags indicating which registers (TEMPs,
 - * INPUTs, OUTPUTs, etc, are used by the given program.
 - * \param file  type of register to scan for
 - * \param used  returns true/false flags for in use / free
 - * \param usedSize  size of the 'used' array
 - */
 -void
 -_mesa_find_used_registers(const struct gl_program *prog,
 -                          gl_register_file file,
 -                          GLboolean used[], GLuint usedSize)
 -{
 -   GLuint i, j;
 -
 -   memset(used, 0, usedSize);
 -
 -   for (i = 0; i < prog->NumInstructions; i++) {
 -      const struct prog_instruction *inst = prog->Instructions + i;
 -      const GLuint n = _mesa_num_inst_src_regs(inst->Opcode);
 -
 -      if (inst->DstReg.File == file) {
 -         ASSERT(inst->DstReg.Index < usedSize);
 -         if(inst->DstReg.Index < usedSize)
 -            used[inst->DstReg.Index] = GL_TRUE;
 -      }
 -
 -      for (j = 0; j < n; j++) {
 -         if (inst->SrcReg[j].File == file) {
 -            ASSERT(inst->SrcReg[j].Index < usedSize);
 -            if(inst->SrcReg[j].Index < usedSize)
 -               used[inst->SrcReg[j].Index] = GL_TRUE;
 -         }
 -      }
 -   }
 -}
 -
 -
 -/**
 - * Scan the given 'used' register flag array for the first entry
 - * that's >= firstReg.
 - * \param used  vector of flags indicating registers in use (as returned
 - *              by _mesa_find_used_registers())
 - * \param usedSize  size of the 'used' array
 - * \param firstReg  first register to start searching at
 - * \return index of unused register, or -1 if none.
 - */
 -GLint
 -_mesa_find_free_register(const GLboolean used[],
 -                         GLuint usedSize, GLuint firstReg)
 -{
 -   GLuint i;
 -
 -   assert(firstReg < usedSize);
 -
 -   for (i = firstReg; i < usedSize; i++)
 -      if (!used[i])
 -         return i;
 -
 -   return -1;
 -}
 -
 -
 -
 -/**
 - * Check if the given register index is valid (doesn't exceed implementation-
 - * dependent limits).
 - * \return GL_TRUE if OK, GL_FALSE if bad index
 - */
 -GLboolean
 -_mesa_valid_register_index(const struct gl_context *ctx,
 -                           gl_shader_type shaderType,
 -                           gl_register_file file, GLint index)
 -{
 -   const struct gl_program_constants *c;
 -
 -   switch (shaderType) {
 -   case MESA_SHADER_VERTEX:
 -      c = &ctx->Const.VertexProgram;
 -      break;
 -   case MESA_SHADER_FRAGMENT:
 -      c = &ctx->Const.FragmentProgram;
 -      break;
 -   case MESA_SHADER_GEOMETRY:
 -      c = &ctx->Const.GeometryProgram;
 -      break;
 -   default:
 -      _mesa_problem(ctx,
 -                    "unexpected shader type in _mesa_valid_register_index()");
 -      return GL_FALSE;
 -   }
 -
 -   switch (file) {
 -   case PROGRAM_UNDEFINED:
 -      return GL_TRUE;  /* XXX or maybe false? */
 -
 -   case PROGRAM_TEMPORARY:
 -      return index >= 0 && index < c->MaxTemps;
 -
 -   case PROGRAM_ENV_PARAM:
 -      return index >= 0 && index < c->MaxEnvParams;
 -
 -   case PROGRAM_LOCAL_PARAM:
 -      return index >= 0 && index < c->MaxLocalParams;
 -
 -   case PROGRAM_NAMED_PARAM:
 -      return index >= 0 && index < c->MaxParameters;
 -
 -   case PROGRAM_UNIFORM:
 -   case PROGRAM_STATE_VAR:
 -      /* aka constant buffer */
 -      return index >= 0 && index < c->MaxUniformComponents / 4;
 -
 -   case PROGRAM_CONSTANT:
 -      /* constant buffer w/ possible relative negative addressing */
 -      return (index > (int) c->MaxUniformComponents / -4 &&
 -              index < c->MaxUniformComponents / 4);
 -
 -   case PROGRAM_INPUT:
 -      if (index < 0)
 -         return GL_FALSE;
 -
 -      switch (shaderType) {
 -      case MESA_SHADER_VERTEX:
 -         return index < VERT_ATTRIB_GENERIC0 + c->MaxAttribs;
 -      case MESA_SHADER_FRAGMENT:
 -         return index < FRAG_ATTRIB_VAR0 + ctx->Const.MaxVarying;
 -      case MESA_SHADER_GEOMETRY:
 -         return index < GEOM_ATTRIB_VAR0 + ctx->Const.MaxVarying;
 -      default:
 -         return GL_FALSE;
 -      }
 -
 -   case PROGRAM_OUTPUT:
 -      if (index < 0)
 -         return GL_FALSE;
 -
 -      switch (shaderType) {
 -      case MESA_SHADER_VERTEX:
 -         return index < VERT_RESULT_VAR0 + ctx->Const.MaxVarying;
 -      case MESA_SHADER_FRAGMENT:
 -         return index < FRAG_RESULT_DATA0 + ctx->Const.MaxDrawBuffers;
 -      case MESA_SHADER_GEOMETRY:
 -         return index < GEOM_RESULT_VAR0 + ctx->Const.MaxVarying;
 -      default:
 -         return GL_FALSE;
 -      }
 -
 -   case PROGRAM_ADDRESS:
 -      return index >= 0 && index < c->MaxAddressRegs;
 -
 -   default:
 -      _mesa_problem(ctx,
 -                    "unexpected register file in _mesa_valid_register_index()");
 -      return GL_FALSE;
 -   }
 -}
 -
 -
 -
 -/**
 - * "Post-process" a GPU program.  This is intended to be used for debugging.
 - * Example actions include no-op'ing instructions or changing instruction
 - * behaviour.
 - */
 -void
 -_mesa_postprocess_program(struct gl_context *ctx, struct gl_program *prog)
 -{
 -   static const GLfloat white[4] = { 0.5, 0.5, 0.5, 0.5 };
 -   GLuint i;
 -   GLuint whiteSwizzle;
 -   GLint whiteIndex = _mesa_add_unnamed_constant(prog->Parameters,
 -                                                 white, 4, &whiteSwizzle);
 -
 -   (void) whiteIndex;
 -
 -   for (i = 0; i < prog->NumInstructions; i++) {
 -      struct prog_instruction *inst = prog->Instructions + i;
 -      const GLuint n = _mesa_num_inst_src_regs(inst->Opcode);
 -
 -      (void) n;
 -
 -      if (_mesa_is_tex_instruction(inst->Opcode)) {
 -#if 0
 -         /* replace TEX/TXP/TXB with MOV */
 -         inst->Opcode = OPCODE_MOV;
 -         inst->DstReg.WriteMask = WRITEMASK_XYZW;
 -         inst->SrcReg[0].Swizzle = SWIZZLE_XYZW;
 -         inst->SrcReg[0].Negate = NEGATE_NONE;
 -#endif
 -
 -#if 0
 -         /* disable shadow texture mode */
 -         inst->TexShadow = 0;
 -#endif
 -      }
 -
 -      if (inst->Opcode == OPCODE_TXP) {
 -#if 0
 -         inst->Opcode = OPCODE_MOV;
 -         inst->DstReg.WriteMask = WRITEMASK_XYZW;
 -         inst->SrcReg[0].File = PROGRAM_CONSTANT;
 -         inst->SrcReg[0].Index = whiteIndex;
 -         inst->SrcReg[0].Swizzle = SWIZZLE_XYZW;
 -         inst->SrcReg[0].Negate = NEGATE_NONE;
 -#endif
 -#if 0
 -         inst->TexShadow = 0;
 -#endif
 -#if 0
 -         inst->Opcode = OPCODE_TEX;
 -         inst->TexShadow = 0;
 -#endif
 -      }
 -
 -   }
 -}
 +/* + * Mesa 3-D graphics library + * Version:  6.5.3 + * + * Copyright (C) 1999-2007  Brian Paul   All Rights Reserved. + * + * Permission is hereby granted, free of charge, to any person obtaining a + * copy of this software and associated documentation files (the "Software"), + * to deal in the Software without restriction, including without limitation + * the rights to use, copy, modify, merge, publish, distribute, sublicense, + * and/or sell copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice shall be included + * in all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS + * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL + * BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN + * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN + * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. + */ + +/** + * \file program.c + * Vertex and fragment program support functions. + * \author Brian Paul + */ + + +#include "main/glheader.h" +#include "main/context.h" +#include "main/hash.h" +#include "main/mfeatures.h" +#include "program.h" +#include "prog_cache.h" +#include "prog_parameter.h" +#include "prog_instruction.h" + + +/** + * A pointer to this dummy program is put into the hash table when + * glGenPrograms is called. + */ +struct gl_program _mesa_DummyProgram; + + +/** + * Init context's vertex/fragment program state + */ +void +_mesa_init_program(struct gl_context *ctx) +{ +   GLuint i; + +   /* +    * If this assertion fails, we need to increase the field +    * size for register indexes (see INST_INDEX_BITS). +    */ +   ASSERT(ctx->Const.VertexProgram.MaxUniformComponents / 4 +          <= (1 << INST_INDEX_BITS)); +   ASSERT(ctx->Const.FragmentProgram.MaxUniformComponents / 4 +          <= (1 << INST_INDEX_BITS)); + +   ASSERT(ctx->Const.VertexProgram.MaxTemps <= (1 << INST_INDEX_BITS)); +   ASSERT(ctx->Const.VertexProgram.MaxLocalParams <= (1 << INST_INDEX_BITS)); +   ASSERT(ctx->Const.FragmentProgram.MaxTemps <= (1 << INST_INDEX_BITS)); +   ASSERT(ctx->Const.FragmentProgram.MaxLocalParams <= (1 << INST_INDEX_BITS)); + +   ASSERT(ctx->Const.VertexProgram.MaxUniformComponents <= 4 * MAX_UNIFORMS); +   ASSERT(ctx->Const.FragmentProgram.MaxUniformComponents <= 4 * MAX_UNIFORMS); + +   ASSERT(ctx->Const.VertexProgram.MaxAddressOffset <= (1 << INST_INDEX_BITS)); +   ASSERT(ctx->Const.FragmentProgram.MaxAddressOffset <= (1 << INST_INDEX_BITS)); + +   /* If this fails, increase prog_instruction::TexSrcUnit size */ +   ASSERT(MAX_TEXTURE_UNITS <= (1 << 5)); + +   /* If this fails, increase prog_instruction::TexSrcTarget size */ +   ASSERT(NUM_TEXTURE_TARGETS <= (1 << 3)); + +   ctx->Program.ErrorPos = -1; +   ctx->Program.ErrorString = _mesa_strdup(""); + +#if FEATURE_NV_vertex_program || FEATURE_ARB_vertex_program +   ctx->VertexProgram.Enabled = GL_FALSE; +#if FEATURE_es2_glsl +   ctx->VertexProgram.PointSizeEnabled = +      (ctx->API == API_OPENGLES2) ? GL_TRUE : GL_FALSE; +#else +   ctx->VertexProgram.PointSizeEnabled = GL_FALSE; +#endif +   ctx->VertexProgram.TwoSideEnabled = GL_FALSE; +   _mesa_reference_vertprog(ctx, &ctx->VertexProgram.Current, +                            ctx->Shared->DefaultVertexProgram); +   assert(ctx->VertexProgram.Current); +   for (i = 0; i < MAX_NV_VERTEX_PROGRAM_PARAMS / 4; i++) { +      ctx->VertexProgram.TrackMatrix[i] = GL_NONE; +      ctx->VertexProgram.TrackMatrixTransform[i] = GL_IDENTITY_NV; +   } +   ctx->VertexProgram.Cache = _mesa_new_program_cache(); +#endif + +#if FEATURE_NV_fragment_program || FEATURE_ARB_fragment_program +   ctx->FragmentProgram.Enabled = GL_FALSE; +   _mesa_reference_fragprog(ctx, &ctx->FragmentProgram.Current, +                            ctx->Shared->DefaultFragmentProgram); +   assert(ctx->FragmentProgram.Current); +   ctx->FragmentProgram.Cache = _mesa_new_program_cache(); +#endif + +#if FEATURE_ARB_geometry_shader4 +   ctx->GeometryProgram.Enabled = GL_FALSE; +   /* right now by default we don't have a geometry program */ +   _mesa_reference_geomprog(ctx, &ctx->GeometryProgram.Current, +                            NULL); +   ctx->GeometryProgram.Cache = _mesa_new_program_cache(); +#endif + +   /* XXX probably move this stuff */ +#if FEATURE_ATI_fragment_shader +   ctx->ATIFragmentShader.Enabled = GL_FALSE; +   ctx->ATIFragmentShader.Current = ctx->Shared->DefaultFragmentShader; +   assert(ctx->ATIFragmentShader.Current); +   ctx->ATIFragmentShader.Current->RefCount++; +#endif +} + + +/** + * Free a context's vertex/fragment program state + */ +void +_mesa_free_program_data(struct gl_context *ctx) +{ +#if FEATURE_NV_vertex_program || FEATURE_ARB_vertex_program +   _mesa_reference_vertprog(ctx, &ctx->VertexProgram.Current, NULL); +   _mesa_delete_program_cache(ctx, ctx->VertexProgram.Cache); +#endif +#if FEATURE_NV_fragment_program || FEATURE_ARB_fragment_program +   _mesa_reference_fragprog(ctx, &ctx->FragmentProgram.Current, NULL); +   _mesa_delete_program_cache(ctx, ctx->FragmentProgram.Cache); +#endif +#if FEATURE_ARB_geometry_shader4 +   _mesa_reference_geomprog(ctx, &ctx->GeometryProgram.Current, NULL); +   _mesa_delete_program_cache(ctx, ctx->GeometryProgram.Cache); +#endif +   /* XXX probably move this stuff */ +#if FEATURE_ATI_fragment_shader +   if (ctx->ATIFragmentShader.Current) { +      ctx->ATIFragmentShader.Current->RefCount--; +      if (ctx->ATIFragmentShader.Current->RefCount <= 0) { +         free(ctx->ATIFragmentShader.Current); +      } +   } +#endif +   free((void *) ctx->Program.ErrorString); +} + + +/** + * Update the default program objects in the given context to reference those + * specified in the shared state and release those referencing the old + * shared state. + */ +void +_mesa_update_default_objects_program(struct gl_context *ctx) +{ +#if FEATURE_NV_vertex_program || FEATURE_ARB_vertex_program +   _mesa_reference_vertprog(ctx, &ctx->VertexProgram.Current, +                            (struct gl_vertex_program *) +                            ctx->Shared->DefaultVertexProgram); +   assert(ctx->VertexProgram.Current); +#endif + +#if FEATURE_NV_fragment_program || FEATURE_ARB_fragment_program +   _mesa_reference_fragprog(ctx, &ctx->FragmentProgram.Current, +                            (struct gl_fragment_program *) +                            ctx->Shared->DefaultFragmentProgram); +   assert(ctx->FragmentProgram.Current); +#endif + +#if FEATURE_ARB_geometry_shader4 +   _mesa_reference_geomprog(ctx, &ctx->GeometryProgram.Current, +                            (struct gl_geometry_program *) +                            ctx->Shared->DefaultGeometryProgram); +#endif + +   /* XXX probably move this stuff */ +#if FEATURE_ATI_fragment_shader +   if (ctx->ATIFragmentShader.Current) { +      ctx->ATIFragmentShader.Current->RefCount--; +      if (ctx->ATIFragmentShader.Current->RefCount <= 0) { +         free(ctx->ATIFragmentShader.Current); +      } +   } +   ctx->ATIFragmentShader.Current = (struct ati_fragment_shader *) ctx->Shared->DefaultFragmentShader; +   assert(ctx->ATIFragmentShader.Current); +   ctx->ATIFragmentShader.Current->RefCount++; +#endif +} + + +/** + * Set the vertex/fragment program error state (position and error string). + * This is generally called from within the parsers. + */ +void +_mesa_set_program_error(struct gl_context *ctx, GLint pos, const char *string) +{ +   ctx->Program.ErrorPos = pos; +   free((void *) ctx->Program.ErrorString); +   if (!string) +      string = ""; +   ctx->Program.ErrorString = _mesa_strdup(string); +} + + +/** + * Find the line number and column for 'pos' within 'string'. + * Return a copy of the line which contains 'pos'.  Free the line with + * free(). + * \param string  the program string + * \param pos     the position within the string + * \param line    returns the line number corresponding to 'pos'. + * \param col     returns the column number corresponding to 'pos'. + * \return copy of the line containing 'pos'. + */ +const GLubyte * +_mesa_find_line_column(const GLubyte *string, const GLubyte *pos, +                       GLint *line, GLint *col) +{ +   const GLubyte *lineStart = string; +   const GLubyte *p = string; +   GLubyte *s; +   int len; + +   *line = 1; + +   while (p != pos) { +      if (*p == (GLubyte) '\n') { +         (*line)++; +         lineStart = p + 1; +      } +      p++; +   } + +   *col = (pos - lineStart) + 1; + +   /* return copy of this line */ +   while (*p != 0 && *p != '\n') +      p++; +   len = p - lineStart; +   s = (GLubyte *) malloc(len + 1); +   memcpy(s, lineStart, len); +   s[len] = 0; + +   return s; +} + + +/** + * Initialize a new vertex/fragment program object. + */ +static struct gl_program * +_mesa_init_program_struct( struct gl_context *ctx, struct gl_program *prog, +                           GLenum target, GLuint id) +{ +   (void) ctx; +   if (prog) { +      GLuint i; +      memset(prog, 0, sizeof(*prog)); +      prog->Id = id; +      prog->Target = target; +      prog->Resident = GL_TRUE; +      prog->RefCount = 1; +      prog->Format = GL_PROGRAM_FORMAT_ASCII_ARB; + +      /* default mapping from samplers to texture units */ +      for (i = 0; i < MAX_SAMPLERS; i++) +         prog->SamplerUnits[i] = i; +   } + +   return prog; +} + + +/** + * Initialize a new fragment program object. + */ +struct gl_program * +_mesa_init_fragment_program( struct gl_context *ctx, struct gl_fragment_program *prog, +                             GLenum target, GLuint id) +{ +   if (prog) +      return _mesa_init_program_struct( ctx, &prog->Base, target, id ); +   else +      return NULL; +} + + +/** + * Initialize a new vertex program object. + */ +struct gl_program * +_mesa_init_vertex_program( struct gl_context *ctx, struct gl_vertex_program *prog, +                           GLenum target, GLuint id) +{ +   if (prog) +      return _mesa_init_program_struct( ctx, &prog->Base, target, id ); +   else +      return NULL; +} + + +/** + * Initialize a new geometry program object. + */ +struct gl_program * +_mesa_init_geometry_program( struct gl_context *ctx, struct gl_geometry_program *prog, +                             GLenum target, GLuint id) +{ +   if (prog) +      return _mesa_init_program_struct( ctx, &prog->Base, target, id ); +   else +      return NULL; +} + + +/** + * Allocate and initialize a new fragment/vertex program object but + * don't put it into the program hash table.  Called via + * ctx->Driver.NewProgram.  May be overridden (ie. replaced) by a + * device driver function to implement OO deriviation with additional + * types not understood by this function. + * + * \param ctx  context + * \param id   program id/number + * \param target  program target/type + * \return  pointer to new program object + */ +struct gl_program * +_mesa_new_program(struct gl_context *ctx, GLenum target, GLuint id) +{ +   struct gl_program *prog; +   switch (target) { +   case GL_VERTEX_PROGRAM_ARB: /* == GL_VERTEX_PROGRAM_NV */ +   case GL_VERTEX_STATE_PROGRAM_NV: +      prog = _mesa_init_vertex_program(ctx, CALLOC_STRUCT(gl_vertex_program), +                                       target, id ); +      break; +   case GL_FRAGMENT_PROGRAM_NV: +   case GL_FRAGMENT_PROGRAM_ARB: +      prog =_mesa_init_fragment_program(ctx, +                                         CALLOC_STRUCT(gl_fragment_program), +                                         target, id ); +      break; +   case MESA_GEOMETRY_PROGRAM: +      prog = _mesa_init_geometry_program(ctx, +                                         CALLOC_STRUCT(gl_geometry_program), +                                         target, id); +      break; +   default: +      _mesa_problem(ctx, "bad target in _mesa_new_program"); +      prog = NULL; +   } +   return prog; +} + + +/** + * Delete a program and remove it from the hash table, ignoring the + * reference count. + * Called via ctx->Driver.DeleteProgram.  May be wrapped (OO deriviation) + * by a device driver function. + */ +void +_mesa_delete_program(struct gl_context *ctx, struct gl_program *prog) +{ +   (void) ctx; +   ASSERT(prog); +   ASSERT(prog->RefCount==0); + +   if (prog == &_mesa_DummyProgram) +      return; + +   if (prog->String) +      free(prog->String); + +   _mesa_free_instructions(prog->Instructions, prog->NumInstructions); + +   if (prog->Parameters) { +      _mesa_free_parameter_list(prog->Parameters); +   } +   if (prog->Varying) { +      _mesa_free_parameter_list(prog->Varying); +   } +   if (prog->Attributes) { +      _mesa_free_parameter_list(prog->Attributes); +   } + +   free(prog); +} + + +/** + * Return the gl_program object for a given ID. + * Basically just a wrapper for _mesa_HashLookup() to avoid a lot of + * casts elsewhere. + */ +struct gl_program * +_mesa_lookup_program(struct gl_context *ctx, GLuint id) +{ +   if (id) +      return (struct gl_program *) _mesa_HashLookup(ctx->Shared->Programs, id); +   else +      return NULL; +} + + +/** + * Reference counting for vertex/fragment programs + */ +void +_mesa_reference_program(struct gl_context *ctx, +                        struct gl_program **ptr, +                        struct gl_program *prog) +{ +   assert(ptr); +   if (*ptr && prog) { +      /* sanity check */ +      if ((*ptr)->Target == GL_VERTEX_PROGRAM_ARB) +         ASSERT(prog->Target == GL_VERTEX_PROGRAM_ARB); +      else if ((*ptr)->Target == GL_FRAGMENT_PROGRAM_ARB) +         ASSERT(prog->Target == GL_FRAGMENT_PROGRAM_ARB || +                prog->Target == GL_FRAGMENT_PROGRAM_NV); +      else if ((*ptr)->Target == MESA_GEOMETRY_PROGRAM) +         ASSERT(prog->Target == MESA_GEOMETRY_PROGRAM); +   } +   if (*ptr == prog) { +      return;  /* no change */ +   } +   if (*ptr) { +      GLboolean deleteFlag; + +      /*_glthread_LOCK_MUTEX((*ptr)->Mutex);*/ +#if 0 +      printf("Program %p ID=%u Target=%s  Refcount-- to %d\n", +             *ptr, (*ptr)->Id, +             ((*ptr)->Target == GL_VERTEX_PROGRAM_ARB ? "VP" : +              ((*ptr)->Target == MESA_GEOMETRY_PROGRAM ? "GP" : "FP")), +             (*ptr)->RefCount - 1); +#endif +      ASSERT((*ptr)->RefCount > 0); +      (*ptr)->RefCount--; + +      deleteFlag = ((*ptr)->RefCount == 0); +      /*_glthread_UNLOCK_MUTEX((*ptr)->Mutex);*/ + +      if (deleteFlag) { +         ASSERT(ctx); +         ctx->Driver.DeleteProgram(ctx, *ptr); +      } + +      *ptr = NULL; +   } + +   assert(!*ptr); +   if (prog) { +      /*_glthread_LOCK_MUTEX(prog->Mutex);*/ +      prog->RefCount++; +#if 0 +      printf("Program %p ID=%u Target=%s  Refcount++ to %d\n", +             prog, prog->Id, +             (prog->Target == GL_VERTEX_PROGRAM_ARB ? "VP" : +              (prog->Target == MESA_GEOMETRY_PROGRAM ? "GP" : "FP")), +             prog->RefCount); +#endif +      /*_glthread_UNLOCK_MUTEX(prog->Mutex);*/ +   } + +   *ptr = prog; +} + + +/** + * Return a copy of a program. + * XXX Problem here if the program object is actually OO-derivation + * made by a device driver. + */ +struct gl_program * +_mesa_clone_program(struct gl_context *ctx, const struct gl_program *prog) +{ +   struct gl_program *clone; + +   clone = ctx->Driver.NewProgram(ctx, prog->Target, prog->Id); +   if (!clone) +      return NULL; + +   assert(clone->Target == prog->Target); +   assert(clone->RefCount == 1); + +   clone->String = (GLubyte *) _mesa_strdup((char *) prog->String); +   clone->Format = prog->Format; +   clone->Instructions = _mesa_alloc_instructions(prog->NumInstructions); +   if (!clone->Instructions) { +      _mesa_reference_program(ctx, &clone, NULL); +      return NULL; +   } +   _mesa_copy_instructions(clone->Instructions, prog->Instructions, +                           prog->NumInstructions); +   clone->InputsRead = prog->InputsRead; +   clone->OutputsWritten = prog->OutputsWritten; +   clone->SamplersUsed = prog->SamplersUsed; +   clone->ShadowSamplers = prog->ShadowSamplers; +   memcpy(clone->TexturesUsed, prog->TexturesUsed, sizeof(prog->TexturesUsed)); + +   if (prog->Parameters) +      clone->Parameters = _mesa_clone_parameter_list(prog->Parameters); +   memcpy(clone->LocalParams, prog->LocalParams, sizeof(clone->LocalParams)); +   if (prog->Varying) +      clone->Varying = _mesa_clone_parameter_list(prog->Varying); +   if (prog->Attributes) +      clone->Attributes = _mesa_clone_parameter_list(prog->Attributes); +   memcpy(clone->LocalParams, prog->LocalParams, sizeof(clone->LocalParams)); +   clone->IndirectRegisterFiles = prog->IndirectRegisterFiles; +   clone->NumInstructions = prog->NumInstructions; +   clone->NumTemporaries = prog->NumTemporaries; +   clone->NumParameters = prog->NumParameters; +   clone->NumAttributes = prog->NumAttributes; +   clone->NumAddressRegs = prog->NumAddressRegs; +   clone->NumNativeInstructions = prog->NumNativeInstructions; +   clone->NumNativeTemporaries = prog->NumNativeTemporaries; +   clone->NumNativeParameters = prog->NumNativeParameters; +   clone->NumNativeAttributes = prog->NumNativeAttributes; +   clone->NumNativeAddressRegs = prog->NumNativeAddressRegs; +   clone->NumAluInstructions = prog->NumAluInstructions; +   clone->NumTexInstructions = prog->NumTexInstructions; +   clone->NumTexIndirections = prog->NumTexIndirections; +   clone->NumNativeAluInstructions = prog->NumNativeAluInstructions; +   clone->NumNativeTexInstructions = prog->NumNativeTexInstructions; +   clone->NumNativeTexIndirections = prog->NumNativeTexIndirections; + +   switch (prog->Target) { +   case GL_VERTEX_PROGRAM_ARB: +      { +         const struct gl_vertex_program *vp +            = (const struct gl_vertex_program *) prog; +         struct gl_vertex_program *vpc = (struct gl_vertex_program *) clone; +         vpc->IsPositionInvariant = vp->IsPositionInvariant; +         vpc->IsNVProgram = vp->IsNVProgram; +      } +      break; +   case GL_FRAGMENT_PROGRAM_ARB: +      { +         const struct gl_fragment_program *fp +            = (const struct gl_fragment_program *) prog; +         struct gl_fragment_program *fpc = (struct gl_fragment_program *) clone; +         fpc->UsesKill = fp->UsesKill; +         fpc->OriginUpperLeft = fp->OriginUpperLeft; +         fpc->PixelCenterInteger = fp->PixelCenterInteger; +      } +      break; +   case MESA_GEOMETRY_PROGRAM: +      { +         const struct gl_geometry_program *gp +            = (const struct gl_geometry_program *) prog; +         struct gl_geometry_program *gpc = (struct gl_geometry_program *) clone; +         gpc->VerticesOut = gp->VerticesOut; +         gpc->InputType = gp->InputType; +         gpc->OutputType = gp->OutputType; +      } +      break; +   default: +      _mesa_problem(NULL, "Unexpected target in _mesa_clone_program"); +   } + +   return clone; +} + + +/** + * Insert 'count' NOP instructions at 'start' in the given program. + * Adjust branch targets accordingly. + */ +GLboolean +_mesa_insert_instructions(struct gl_program *prog, GLuint start, GLuint count) +{ +   const GLuint origLen = prog->NumInstructions; +   const GLuint newLen = origLen + count; +   struct prog_instruction *newInst; +   GLuint i; + +   /* adjust branches */ +   for (i = 0; i < prog->NumInstructions; i++) { +      struct prog_instruction *inst = prog->Instructions + i; +      if (inst->BranchTarget > 0) { +         if ((GLuint)inst->BranchTarget >= start) { +            inst->BranchTarget += count; +         } +      } +   } + +   /* Alloc storage for new instructions */ +   newInst = _mesa_alloc_instructions(newLen); +   if (!newInst) { +      return GL_FALSE; +   } + +   /* Copy 'start' instructions into new instruction buffer */ +   _mesa_copy_instructions(newInst, prog->Instructions, start); + +   /* init the new instructions */ +   _mesa_init_instructions(newInst + start, count); + +   /* Copy the remaining/tail instructions to new inst buffer */ +   _mesa_copy_instructions(newInst + start + count, +                           prog->Instructions + start, +                           origLen - start); + +   /* free old instructions */ +   _mesa_free_instructions(prog->Instructions, origLen); + +   /* install new instructions */ +   prog->Instructions = newInst; +   prog->NumInstructions = newLen; + +   return GL_TRUE; +} + +/** + * Delete 'count' instructions at 'start' in the given program. + * Adjust branch targets accordingly. + */ +GLboolean +_mesa_delete_instructions(struct gl_program *prog, GLuint start, GLuint count) +{ +   const GLuint origLen = prog->NumInstructions; +   const GLuint newLen = origLen - count; +   struct prog_instruction *newInst; +   GLuint i; + +   /* adjust branches */ +   for (i = 0; i < prog->NumInstructions; i++) { +      struct prog_instruction *inst = prog->Instructions + i; +      if (inst->BranchTarget > 0) { +         if (inst->BranchTarget > (GLint) start) { +            inst->BranchTarget -= count; +         } +      } +   } + +   /* Alloc storage for new instructions */ +   newInst = _mesa_alloc_instructions(newLen); +   if (!newInst) { +      return GL_FALSE; +   } + +   /* Copy 'start' instructions into new instruction buffer */ +   _mesa_copy_instructions(newInst, prog->Instructions, start); + +   /* Copy the remaining/tail instructions to new inst buffer */ +   _mesa_copy_instructions(newInst + start, +                           prog->Instructions + start + count, +                           newLen - start); + +   /* free old instructions */ +   _mesa_free_instructions(prog->Instructions, origLen); + +   /* install new instructions */ +   prog->Instructions = newInst; +   prog->NumInstructions = newLen; + +   return GL_TRUE; +} + + +/** + * Search instructions for registers that match (oldFile, oldIndex), + * replacing them with (newFile, newIndex). + */ +static void +replace_registers(struct prog_instruction *inst, GLuint numInst, +                  GLuint oldFile, GLuint oldIndex, +                  GLuint newFile, GLuint newIndex) +{ +   GLuint i, j; +   for (i = 0; i < numInst; i++) { +      /* src regs */ +      for (j = 0; j < _mesa_num_inst_src_regs(inst[i].Opcode); j++) { +         if (inst[i].SrcReg[j].File == oldFile && +             inst[i].SrcReg[j].Index == oldIndex) { +            inst[i].SrcReg[j].File = newFile; +            inst[i].SrcReg[j].Index = newIndex; +         } +      } +      /* dst reg */ +      if (inst[i].DstReg.File == oldFile && inst[i].DstReg.Index == oldIndex) { +         inst[i].DstReg.File = newFile; +         inst[i].DstReg.Index = newIndex; +      } +   } +} + + +/** + * Search instructions for references to program parameters.  When found, + * increment the parameter index by 'offset'. + * Used when combining programs. + */ +static void +adjust_param_indexes(struct prog_instruction *inst, GLuint numInst, +                     GLuint offset) +{ +   GLuint i, j; +   for (i = 0; i < numInst; i++) { +      for (j = 0; j < _mesa_num_inst_src_regs(inst[i].Opcode); j++) { +         GLuint f = inst[i].SrcReg[j].File; +         if (f == PROGRAM_CONSTANT || +             f == PROGRAM_UNIFORM || +             f == PROGRAM_STATE_VAR) { +            inst[i].SrcReg[j].Index += offset; +         } +      } +   } +} + + +/** + * Combine two programs into one.  Fix instructions so the outputs of + * the first program go to the inputs of the second program. + */ +struct gl_program * +_mesa_combine_programs(struct gl_context *ctx, +                       const struct gl_program *progA, +                       const struct gl_program *progB) +{ +   struct prog_instruction *newInst; +   struct gl_program *newProg; +   const GLuint lenA = progA->NumInstructions - 1; /* omit END instr */ +   const GLuint lenB = progB->NumInstructions; +   const GLuint numParamsA = _mesa_num_parameters(progA->Parameters); +   const GLuint newLength = lenA + lenB; +   GLboolean usedTemps[MAX_PROGRAM_TEMPS]; +   GLuint firstTemp = 0; +   GLbitfield inputsB; +   GLuint i; + +   ASSERT(progA->Target == progB->Target); + +   newInst = _mesa_alloc_instructions(newLength); +   if (!newInst) +      return GL_FALSE; + +   _mesa_copy_instructions(newInst, progA->Instructions, lenA); +   _mesa_copy_instructions(newInst + lenA, progB->Instructions, lenB); + +   /* adjust branch / instruction addresses for B's instructions */ +   for (i = 0; i < lenB; i++) { +      newInst[lenA + i].BranchTarget += lenA; +   } + +   newProg = ctx->Driver.NewProgram(ctx, progA->Target, 0); +   newProg->Instructions = newInst; +   newProg->NumInstructions = newLength; + +   /* find used temp regs (we may need new temps below) */ +   _mesa_find_used_registers(newProg, PROGRAM_TEMPORARY, +                             usedTemps, MAX_PROGRAM_TEMPS); + +   if (newProg->Target == GL_FRAGMENT_PROGRAM_ARB) { +      struct gl_fragment_program *fprogA, *fprogB, *newFprog; +      GLbitfield progB_inputsRead = progB->InputsRead; +      GLint progB_colorFile, progB_colorIndex; + +      fprogA = (struct gl_fragment_program *) progA; +      fprogB = (struct gl_fragment_program *) progB; +      newFprog = (struct gl_fragment_program *) newProg; + +      newFprog->UsesKill = fprogA->UsesKill || fprogB->UsesKill; + +      /* We'll do a search and replace for instances +       * of progB_colorFile/progB_colorIndex below... +       */ +      progB_colorFile = PROGRAM_INPUT; +      progB_colorIndex = FRAG_ATTRIB_COL0; + +      /* +       * The fragment program may get color from a state var rather than +       * a fragment input (vertex output) if it's constant. +       * See the texenvprogram.c code. +       * So, search the program's parameter list now to see if the program +       * gets color from a state var instead of a conventional fragment +       * input register. +       */ +      for (i = 0; i < progB->Parameters->NumParameters; i++) { +         struct gl_program_parameter *p = &progB->Parameters->Parameters[i]; +         if (p->Type == PROGRAM_STATE_VAR && +             p->StateIndexes[0] == STATE_INTERNAL && +             p->StateIndexes[1] == STATE_CURRENT_ATTRIB && +             (int) p->StateIndexes[2] == (int) VERT_ATTRIB_COLOR0) { +            progB_inputsRead |= FRAG_BIT_COL0; +            progB_colorFile = PROGRAM_STATE_VAR; +            progB_colorIndex = i; +            break; +         } +      } + +      /* Connect color outputs of fprogA to color inputs of fprogB, via a +       * new temporary register. +       */ +      if ((progA->OutputsWritten & BITFIELD64_BIT(FRAG_RESULT_COLOR)) && +          (progB_inputsRead & FRAG_BIT_COL0)) { +         GLint tempReg = _mesa_find_free_register(usedTemps, MAX_PROGRAM_TEMPS, +                                                  firstTemp); +         if (tempReg < 0) { +            _mesa_problem(ctx, "No free temp regs found in " +                          "_mesa_combine_programs(), using 31"); +            tempReg = 31; +         } +         firstTemp = tempReg + 1; + +         /* replace writes to result.color[0] with tempReg */ +         replace_registers(newInst, lenA, +                           PROGRAM_OUTPUT, FRAG_RESULT_COLOR, +                           PROGRAM_TEMPORARY, tempReg); +         /* replace reads from the input color with tempReg */ +         replace_registers(newInst + lenA, lenB, +                           progB_colorFile, progB_colorIndex, /* search for */ +                           PROGRAM_TEMPORARY, tempReg  /* replace with */ ); +      } + +      /* compute combined program's InputsRead */ +      inputsB = progB_inputsRead; +      if (progA->OutputsWritten & BITFIELD64_BIT(FRAG_RESULT_COLOR)) { +         inputsB &= ~(1 << FRAG_ATTRIB_COL0); +      } +      newProg->InputsRead = progA->InputsRead | inputsB; +      newProg->OutputsWritten = progB->OutputsWritten; +      newProg->SamplersUsed = progA->SamplersUsed | progB->SamplersUsed; +   } +   else { +      /* vertex program */ +      assert(0);      /* XXX todo */ +   } + +   /* +    * Merge parameters (uniforms, constants, etc) +    */ +   newProg->Parameters = _mesa_combine_parameter_lists(progA->Parameters, +                                                       progB->Parameters); + +   adjust_param_indexes(newInst + lenA, lenB, numParamsA); + + +   return newProg; +} + + +/** + * Populate the 'used' array with flags indicating which registers (TEMPs, + * INPUTs, OUTPUTs, etc, are used by the given program. + * \param file  type of register to scan for + * \param used  returns true/false flags for in use / free + * \param usedSize  size of the 'used' array + */ +void +_mesa_find_used_registers(const struct gl_program *prog, +                          gl_register_file file, +                          GLboolean used[], GLuint usedSize) +{ +   GLuint i, j; + +   memset(used, 0, usedSize); + +   for (i = 0; i < prog->NumInstructions; i++) { +      const struct prog_instruction *inst = prog->Instructions + i; +      const GLuint n = _mesa_num_inst_src_regs(inst->Opcode); + +      if (inst->DstReg.File == file) { +         ASSERT(inst->DstReg.Index < usedSize); +         if(inst->DstReg.Index < usedSize) +            used[inst->DstReg.Index] = GL_TRUE; +      } + +      for (j = 0; j < n; j++) { +         if (inst->SrcReg[j].File == file) { +            ASSERT(inst->SrcReg[j].Index < usedSize); +            if(inst->SrcReg[j].Index < usedSize) +               used[inst->SrcReg[j].Index] = GL_TRUE; +         } +      } +   } +} + + +/** + * Scan the given 'used' register flag array for the first entry + * that's >= firstReg. + * \param used  vector of flags indicating registers in use (as returned + *              by _mesa_find_used_registers()) + * \param usedSize  size of the 'used' array + * \param firstReg  first register to start searching at + * \return index of unused register, or -1 if none. + */ +GLint +_mesa_find_free_register(const GLboolean used[], +                         GLuint usedSize, GLuint firstReg) +{ +   GLuint i; + +   assert(firstReg < usedSize); + +   for (i = firstReg; i < usedSize; i++) +      if (!used[i]) +         return i; + +   return -1; +} + + + +/** + * Check if the given register index is valid (doesn't exceed implementation- + * dependent limits). + * \return GL_TRUE if OK, GL_FALSE if bad index + */ +GLboolean +_mesa_valid_register_index(const struct gl_context *ctx, +                           gl_shader_type shaderType, +                           gl_register_file file, GLint index) +{ +   const struct gl_program_constants *c; + +   switch (shaderType) { +   case MESA_SHADER_VERTEX: +      c = &ctx->Const.VertexProgram; +      break; +   case MESA_SHADER_FRAGMENT: +      c = &ctx->Const.FragmentProgram; +      break; +   case MESA_SHADER_GEOMETRY: +      c = &ctx->Const.GeometryProgram; +      break; +   default: +      _mesa_problem(ctx, +                    "unexpected shader type in _mesa_valid_register_index()"); +      return GL_FALSE; +   } + +   switch (file) { +   case PROGRAM_UNDEFINED: +      return GL_TRUE;  /* XXX or maybe false? */ + +   case PROGRAM_TEMPORARY: +      return index >= 0 && index < c->MaxTemps; + +   case PROGRAM_ENV_PARAM: +      return index >= 0 && index < c->MaxEnvParams; + +   case PROGRAM_LOCAL_PARAM: +      return index >= 0 && index < c->MaxLocalParams; + +   case PROGRAM_NAMED_PARAM: +      return index >= 0 && index < c->MaxParameters; + +   case PROGRAM_UNIFORM: +   case PROGRAM_STATE_VAR: +      /* aka constant buffer */ +      return index >= 0 && index < c->MaxUniformComponents / 4; + +   case PROGRAM_CONSTANT: +      /* constant buffer w/ possible relative negative addressing */ +      return (index > (int) c->MaxUniformComponents / -4 && +              index < c->MaxUniformComponents / 4); + +   case PROGRAM_INPUT: +      if (index < 0) +         return GL_FALSE; + +      switch (shaderType) { +      case MESA_SHADER_VERTEX: +         return index < VERT_ATTRIB_GENERIC0 + c->MaxAttribs; +      case MESA_SHADER_FRAGMENT: +         return index < FRAG_ATTRIB_VAR0 + ctx->Const.MaxVarying; +      case MESA_SHADER_GEOMETRY: +         return index < GEOM_ATTRIB_VAR0 + ctx->Const.MaxVarying; +      default: +         return GL_FALSE; +      } + +   case PROGRAM_OUTPUT: +      if (index < 0) +         return GL_FALSE; + +      switch (shaderType) { +      case MESA_SHADER_VERTEX: +         return index < VERT_RESULT_VAR0 + ctx->Const.MaxVarying; +      case MESA_SHADER_FRAGMENT: +         return index < FRAG_RESULT_DATA0 + ctx->Const.MaxDrawBuffers; +      case MESA_SHADER_GEOMETRY: +         return index < GEOM_RESULT_VAR0 + ctx->Const.MaxVarying; +      default: +         return GL_FALSE; +      } + +   case PROGRAM_ADDRESS: +      return index >= 0 && index < c->MaxAddressRegs; + +   default: +      _mesa_problem(ctx, +                    "unexpected register file in _mesa_valid_register_index()"); +      return GL_FALSE; +   } +} + + + +/** + * "Post-process" a GPU program.  This is intended to be used for debugging. + * Example actions include no-op'ing instructions or changing instruction + * behaviour. + */ +void +_mesa_postprocess_program(struct gl_context *ctx, struct gl_program *prog) +{ +   static const GLfloat white[4] = { 0.5, 0.5, 0.5, 0.5 }; +   GLuint i; +   GLuint whiteSwizzle; +   GLint whiteIndex = _mesa_add_unnamed_constant(prog->Parameters, +                                                 white, 4, &whiteSwizzle); + +   (void) whiteIndex; + +   for (i = 0; i < prog->NumInstructions; i++) { +      struct prog_instruction *inst = prog->Instructions + i; +      const GLuint n = _mesa_num_inst_src_regs(inst->Opcode); + +      (void) n; + +      if (_mesa_is_tex_instruction(inst->Opcode)) { +#if 0 +         /* replace TEX/TXP/TXB with MOV */ +         inst->Opcode = OPCODE_MOV; +         inst->DstReg.WriteMask = WRITEMASK_XYZW; +         inst->SrcReg[0].Swizzle = SWIZZLE_XYZW; +         inst->SrcReg[0].Negate = NEGATE_NONE; +#endif + +#if 0 +         /* disable shadow texture mode */ +         inst->TexShadow = 0; +#endif +      } + +      if (inst->Opcode == OPCODE_TXP) { +#if 0 +         inst->Opcode = OPCODE_MOV; +         inst->DstReg.WriteMask = WRITEMASK_XYZW; +         inst->SrcReg[0].File = PROGRAM_CONSTANT; +         inst->SrcReg[0].Index = whiteIndex; +         inst->SrcReg[0].Swizzle = SWIZZLE_XYZW; +         inst->SrcReg[0].Negate = NEGATE_NONE; +#endif +#if 0 +         inst->TexShadow = 0; +#endif +#if 0 +         inst->Opcode = OPCODE_TEX; +         inst->TexShadow = 0; +#endif +      } + +   } +} diff --git a/mesalib/src/mesa/program/program_parse.y b/mesalib/src/mesa/program/program_parse.y index b35bc5a7c..85c783dd6 100644 --- a/mesalib/src/mesa/program/program_parse.y +++ b/mesalib/src/mesa/program/program_parse.y @@ -2060,9 +2060,14 @@ resultColBinding: COLOR optResultFaceType optResultColorType  optResultFaceType:  	{ -	   $$ = (state->mode == ARB_vertex) -	      ? VERT_RESULT_COL0 -	      : FRAG_RESULT_COLOR; +	   if (state->mode == ARB_vertex) { +	      $$ = VERT_RESULT_COL0; +	   } else { +	      if (state->option.DrawBuffers) +		 $$ = FRAG_RESULT_DATA0; +	      else +		 $$ = FRAG_RESULT_COLOR; +	   }  	}  	| '[' INTEGER ']'  	{ diff --git a/mesalib/src/mesa/program/programopt.c b/mesalib/src/mesa/program/programopt.c index 5ad9571f7..a239da2c6 100644 --- a/mesalib/src/mesa/program/programopt.c +++ b/mesalib/src/mesa/program/programopt.c @@ -230,15 +230,25 @@ _mesa_insert_mvp_code(struct gl_context *ctx, struct gl_vertex_program *vprog)  /** - * Append extra instructions onto the given fragment program to implement - * the fog mode specified by fprog->FogOption. - * The fragment.fogcoord input is used to compute the fog blend factor. + * Append instructions to implement fog   * - * XXX with a little work, this function could be adapted to add fog code + * The \c fragment.fogcoord input is used to compute the fog blend factor. + * + * \param ctx      The GL context + * \param fprog    Fragment program that fog instructions will be appended to. + * \param fog_mode Fog mode.  One of \c GL_EXP, \c GL_EXP2, or \c GL_LINEAR. + * \param saturate True if writes to color outputs should be clamped to [0, 1] + * + * \note + * This function sets \c FRAG_BIT_FOGC in \c fprog->Base.InputsRead. + * + * \todo With a little work, this function could be adapted to add fog code   * to vertex programs too.   */  void -_mesa_append_fog_code(struct gl_context *ctx, struct gl_fragment_program *fprog, GLboolean saturate) +_mesa_append_fog_code(struct gl_context *ctx, +		      struct gl_fragment_program *fprog, GLenum fog_mode, +		      GLboolean saturate)  {     static const gl_state_index fogPStateOpt[STATE_LENGTH]        = { STATE_INTERNAL, STATE_FOG_PARAMS_OPTIMIZED, 0, 0, 0 }; @@ -251,9 +261,9 @@ _mesa_append_fog_code(struct gl_context *ctx, struct gl_fragment_program *fprog,     GLint fogPRefOpt, fogColorRef; /* state references */     GLuint colorTemp, fogFactorTemp; /* temporary registerss */ -   if (fprog->FogOption == GL_NONE) { +   if (fog_mode == GL_NONE) {        _mesa_problem(ctx, "_mesa_append_fog_code() called for fragment program" -                    " with FogOption == GL_NONE"); +                    " with fog_mode == GL_NONE");        return;     } @@ -301,7 +311,7 @@ _mesa_append_fog_code(struct gl_context *ctx, struct gl_fragment_program *fprog,     /* emit instructions to compute fog blending factor */     /* this is always clamped to [0, 1] regardless of fragment clamping */ -   if (fprog->FogOption == GL_LINEAR) { +   if (fog_mode == GL_LINEAR) {        /* MAD fogFactorTemp.x, fragment.fogcoord.x, fogPRefOpt.x, fogPRefOpt.y; */        inst->Opcode = OPCODE_MAD;        inst->DstReg.File = PROGRAM_TEMPORARY; @@ -320,7 +330,7 @@ _mesa_append_fog_code(struct gl_context *ctx, struct gl_fragment_program *fprog,        inst++;     }     else { -      ASSERT(fprog->FogOption == GL_EXP || fprog->FogOption == GL_EXP2); +      ASSERT(fog_mode == GL_EXP || fog_mode == GL_EXP2);        /* fogPRefOpt.z = d/ln(2), fogPRefOpt.w = d/sqrt(ln(2) */        /* EXP: MUL fogFactorTemp.x, fogPRefOpt.z, fragment.fogcoord.x; */        /* EXP2: MUL fogFactorTemp.x, fogPRefOpt.w, fragment.fogcoord.x; */ @@ -331,12 +341,12 @@ _mesa_append_fog_code(struct gl_context *ctx, struct gl_fragment_program *fprog,        inst->SrcReg[0].File = PROGRAM_STATE_VAR;        inst->SrcReg[0].Index = fogPRefOpt;        inst->SrcReg[0].Swizzle -         = (fprog->FogOption == GL_EXP) ? SWIZZLE_ZZZZ : SWIZZLE_WWWW; +         = (fog_mode == GL_EXP) ? SWIZZLE_ZZZZ : SWIZZLE_WWWW;        inst->SrcReg[1].File = PROGRAM_INPUT;        inst->SrcReg[1].Index = FRAG_ATTRIB_FOGC;        inst->SrcReg[1].Swizzle = SWIZZLE_XXXX;        inst++; -      if (fprog->FogOption == GL_EXP2) { +      if (fog_mode == GL_EXP2) {           /* MUL fogFactorTemp.x, fogFactorTemp.x, fogFactorTemp.x; */           inst->Opcode = OPCODE_MUL;           inst->DstReg.File = PROGRAM_TEMPORARY; @@ -397,7 +407,6 @@ _mesa_append_fog_code(struct gl_context *ctx, struct gl_fragment_program *fprog,     fprog->Base.Instructions = newInst;     fprog->Base.NumInstructions = inst - newInst;     fprog->Base.InputsRead |= FRAG_BIT_FOGC; -   /* XXX do this?  fprog->FogOption = GL_NONE; */  } diff --git a/mesalib/src/mesa/program/programopt.h b/mesalib/src/mesa/program/programopt.h index 79631aa58..b9205823c 100644 --- a/mesalib/src/mesa/program/programopt.h +++ b/mesalib/src/mesa/program/programopt.h @@ -32,7 +32,9 @@ extern void  _mesa_insert_mvp_code(struct gl_context *ctx, struct gl_vertex_program *vprog);  extern void -_mesa_append_fog_code(struct gl_context *ctx, struct gl_fragment_program *fprog, GLboolean saturate); +_mesa_append_fog_code(struct gl_context *ctx, +		      struct gl_fragment_program *fprog, GLenum fog_mode, +		      GLboolean saturate);  extern void  _mesa_count_texture_indirections(struct gl_program *prog); | 
