src/mesa/tnl/t_draw.c - platform/external/mesa3d - Gitiles

 /*
  * Mesa 3-D graphics library
  * Version:  7.1
  *
  * Copyright (C) 1999-2007  Brian Paul   All Rights Reserved.
  *
  * Permission is hereby granted, free of charge, to any person obtaining a
  * copy of this software and associated documentation files (the "Software"),
  * to deal in the Software without restriction, including without limitation
  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  * and/or sell copies of the Software, and to permit persons to whom the
  * Software is furnished to do so, subject to the following conditions:
  *
  * The above copyright notice and this permission notice shall be included
  * in all copies or substantial portions of the Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  * BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
  * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  *
  * Authors:
  *    Keith Whitwell <keith@tungstengraphics.com>
  */

 #include "main/glheader.h"
 #include "main/condrender.h"
 #include "main/context.h"
 #include "main/imports.h"
 #include "main/mtypes.h"
 #include "main/macros.h"
 #include "main/enums.h"

 #include "t_context.h"
 #include "tnl.h"


 static GLubyte *get_space(struct gl_context *ctx, GLuint bytes)
 {
    TNLcontext *tnl = TNL_CONTEXT(ctx);
    GLubyte *space = malloc(bytes);

    tnl->block[tnl->nr_blocks++] = space;
    return space;
 }


 static void free_space(struct gl_context *ctx)
 {
    TNLcontext *tnl = TNL_CONTEXT(ctx);
    GLuint i;
    for (i = 0; i < tnl->nr_blocks; i++)
       free(tnl->block[i]);
    tnl->nr_blocks = 0;
 }


 /* Convert the incoming array to GLfloats.  Understands the
  * array->Normalized flag and selects the correct conversion method.
  */
 #define CONVERT( TYPE, MACRO ) do {		\
    GLuint i, j;					\
    if (input->Normalized) {			\
       for (i = 0; i < count; i++) {		\
 	 const TYPE *in = (TYPE *)ptr;		\
 	 for (j = 0; j < sz; j++) {		\
 	    *fptr++ = MACRO(*in);		\
 	    in++;				\
 	 }					\
 	 ptr += input->StrideB;			\
       }						\
    } else {					\
       for (i = 0; i < count; i++) {		\
 	 const TYPE *in = (TYPE *)ptr;		\
 	 for (j = 0; j < sz; j++) {		\
 	    *fptr++ = (GLfloat)(*in);		\
 	    in++;				\
 	 }					\
 	 ptr += input->StrideB;			\
       }						\
    }						\
 } while (0)


 /**
  * Convert array of BGRA/GLubyte[4] values to RGBA/float[4]
  * \param ptr  input/ubyte array
  * \param fptr  output/float array
  */
 static void
 convert_bgra_to_float(const struct gl_client_array *input,
                       const GLubyte *ptr, GLfloat *fptr,
                       GLuint count )
 {
    GLuint i;
    assert(input->Normalized);
    assert(input->Size == 4);
    for (i = 0; i < count; i++) {
       const GLubyte *in = (GLubyte *) ptr;  /* in is in BGRA order */
       *fptr++ = UBYTE_TO_FLOAT(in[2]);  /* red */
       *fptr++ = UBYTE_TO_FLOAT(in[1]);  /* green */
       *fptr++ = UBYTE_TO_FLOAT(in[0]);  /* blue */
       *fptr++ = UBYTE_TO_FLOAT(in[3]);  /* alpha */
       ptr += input->StrideB;
    }
 }

 static void
 convert_half_to_float(const struct gl_client_array *input,
 		      const GLubyte *ptr, GLfloat *fptr,
 		      GLuint count, GLuint sz)
 {
    GLuint i, j;

    for (i = 0; i < count; i++) {
       GLhalfARB *in = (GLhalfARB *)ptr;

       for (j = 0; j < sz; j++) {
 	 *fptr++ = _mesa_half_to_float(in[j]);
       }
       ptr += input->StrideB;
    }
 }

 /**
  * \brief Convert fixed-point to floating-point.
  *
  * In OpenGL, a fixed-point number is a "signed 2's complement 16.16 scaled
  * integer" (Table 2.2 of the OpenGL ES 2.0 spec).
  *
  * If the buffer has the \c normalized flag set, the formula
  *     \code normalize(x) := (2*x + 1) / (2^16 - 1) \endcode
  * is used to map the fixed-point numbers into the range [-1, 1].
  */
 static void
 convert_fixed_to_float(const struct gl_client_array *input,
                        const GLubyte *ptr, GLfloat *fptr,
                        GLuint count)
 {
    GLuint i, j;
    const GLint size = input->Size;

    if (input->Normalized) {
       for (i = 0; i < count; ++i) {
          const GLfixed *in = (GLfixed *) ptr;
          for (j = 0; j < size; ++j) {
             *fptr++ = (GLfloat) (2 * in[j] + 1) / (GLfloat) ((1 << 16) - 1);
          }
          ptr += input->StrideB;
       }
    } else {
       for (i = 0; i < count; ++i) {
          const GLfixed *in = (GLfixed *) ptr;
          for (j = 0; j < size; ++j) {
             *fptr++ = in[j] / (GLfloat) (1 << 16);
          }
          ptr += input->StrideB;
       }
    }
 }

 /* Adjust pointer to point at first requested element, convert to
  * floating point, populate VB->AttribPtr[].
  */
 static void _tnl_import_array( struct gl_context *ctx,
 			       GLuint attrib,
 			       GLuint count,
 			       const struct gl_client_array *input,
 			       const GLubyte *ptr )
 {
    TNLcontext *tnl = TNL_CONTEXT(ctx);
    struct vertex_buffer *VB = &tnl->vb;
    GLuint stride = input->StrideB;

    if (input->Type != GL_FLOAT) {
       const GLuint sz = input->Size;
       GLubyte *buf = get_space(ctx, count * sz * sizeof(GLfloat));
       GLfloat *fptr = (GLfloat *)buf;

       switch (input->Type) {
       case GL_BYTE:
 	 CONVERT(GLbyte, BYTE_TO_FLOAT);
 	 break;
       case GL_UNSIGNED_BYTE:
          if (input->Format == GL_BGRA) {
             /* See GL_EXT_vertex_array_bgra */
             convert_bgra_to_float(input, ptr, fptr, count);
          }
          else {
             CONVERT(GLubyte, UBYTE_TO_FLOAT);
          }
 	 break;
       case GL_SHORT:
 	 CONVERT(GLshort, SHORT_TO_FLOAT);
 	 break;
       case GL_UNSIGNED_SHORT:
 	 CONVERT(GLushort, USHORT_TO_FLOAT);
 	 break;
       case GL_INT:
 	 CONVERT(GLint, INT_TO_FLOAT);
 	 break;
       case GL_UNSIGNED_INT:
 	 CONVERT(GLuint, UINT_TO_FLOAT);
 	 break;
       case GL_DOUBLE:
 	 CONVERT(GLdouble, (GLfloat));
 	 break;
       case GL_HALF_FLOAT:
 	 convert_half_to_float(input, ptr, fptr, count, sz);
 	 break;
       case GL_FIXED:
          convert_fixed_to_float(input, ptr, fptr, count);
          break;
       default:
 	 assert(0);
 	 break;
       }

       ptr = buf;
       stride = sz * sizeof(GLfloat);
    }

    VB->AttribPtr[attrib] = &tnl->tmp_inputs[attrib];
    VB->AttribPtr[attrib]->data = (GLfloat (*)[4])ptr;
    VB->AttribPtr[attrib]->start = (GLfloat *)ptr;
    VB->AttribPtr[attrib]->count = count;
    VB->AttribPtr[attrib]->stride = stride;
    VB->AttribPtr[attrib]->size = input->Size;

    /* This should die, but so should the whole GLvector4f concept:
     */
    VB->AttribPtr[attrib]->flags = (((1<<input->Size)-1) |
 				   VEC_NOT_WRITEABLE |
 				   (stride == 4*sizeof(GLfloat) ? 0 : VEC_BAD_STRIDE));

    VB->AttribPtr[attrib]->storage = NULL;
 }

 #define CLIPVERTS  ((6 + MAX_CLIP_PLANES) * 2)


 static GLboolean *_tnl_import_edgeflag( struct gl_context *ctx,
 					const GLvector4f *input,
 					GLuint count)
 {
    const GLubyte *ptr = (const GLubyte *)input->data;
    const GLuint stride = input->stride;
    GLboolean *space = (GLboolean *)get_space(ctx, count + CLIPVERTS);
    GLboolean *bptr = space;
    GLuint i;

    for (i = 0; i < count; i++) {
       *bptr++ = ((GLfloat *)ptr)[0] == 1.0;
       ptr += stride;
    }

    return space;
 }


 static void bind_inputs( struct gl_context *ctx,
 			 const struct gl_client_array *inputs[],
 			 GLint count,
 			 struct gl_buffer_object **bo,
 			 GLuint *nr_bo )
 {
    TNLcontext *tnl = TNL_CONTEXT(ctx);
    struct vertex_buffer *VB = &tnl->vb;
    GLuint i;

    /* Map all the VBOs
     */
    for (i = 0; i < VERT_ATTRIB_MAX; i++) {
       const void *ptr;

       if (inputs[i]->BufferObj->Name) {
 	 if (!inputs[i]->BufferObj->Pointer) {
 	    bo[*nr_bo] = inputs[i]->BufferObj;
 	    (*nr_bo)++;
 	    ctx->Driver.MapBuffer(ctx,
 				  GL_ARRAY_BUFFER,
 				  GL_READ_ONLY_ARB,
 				  inputs[i]->BufferObj);

 	    assert(inputs[i]->BufferObj->Pointer);
 	 }

 	 ptr = ADD_POINTERS(inputs[i]->BufferObj->Pointer,
 			    inputs[i]->Ptr);
       }
       else
 	 ptr = inputs[i]->Ptr;

       /* Just make sure the array is floating point, otherwise convert to
        * temporary storage.
        *
        * XXX: remove the GLvector4f type at some stage and just use
        * client arrays.
        */
       _tnl_import_array(ctx, i, count, inputs[i], ptr);
    }

    /* We process only the vertices between min & max index:
     */
    VB->Count = count;

    /* These should perhaps be part of _TNL_ATTRIB_* */
    VB->BackfaceColorPtr = NULL;
    VB->BackfaceIndexPtr = NULL;
    VB->BackfaceSecondaryColorPtr = NULL;

    /* Clipping and drawing code still requires this to be a packed
     * array of ubytes which can be written into.  TODO: Fix and
     * remove.
     */
    if (ctx->Polygon.FrontMode != GL_FILL ||
        ctx->Polygon.BackMode != GL_FILL)
    {
       VB->EdgeFlag = _tnl_import_edgeflag( ctx,
 					   VB->AttribPtr[_TNL_ATTRIB_EDGEFLAG],
 					   VB->Count );
    }
    else {
       /* the data previously pointed to by EdgeFlag may have been freed */
       VB->EdgeFlag = NULL;
    }
 }


 /* Translate indices to GLuints and store in VB->Elts.
  */
 static void bind_indices( struct gl_context *ctx,
 			  const struct _mesa_index_buffer *ib,
 			  struct gl_buffer_object **bo,
 			  GLuint *nr_bo)
 {
    TNLcontext *tnl = TNL_CONTEXT(ctx);
    struct vertex_buffer *VB = &tnl->vb;
    GLuint i;
    void *ptr;

    if (!ib) {
       VB->Elts = NULL;
       return;
    }

    if (ib->obj->Name && !ib->obj->Pointer) {
       bo[*nr_bo] = ib->obj;
       (*nr_bo)++;
       ctx->Driver.MapBuffer(ctx,
 			    GL_ELEMENT_ARRAY_BUFFER,
 			    GL_READ_ONLY_ARB,
 			    ib->obj);

       assert(ib->obj->Pointer);
    }

    ptr = ADD_POINTERS(ib->obj->Pointer, ib->ptr);

    if (ib->type == GL_UNSIGNED_INT && VB->Primitive[0].basevertex == 0) {
       VB->Elts = (GLuint *) ptr;
    }
    else {
       GLuint *elts = (GLuint *)get_space(ctx, ib->count * sizeof(GLuint));
       VB->Elts = elts;

       if (ib->type == GL_UNSIGNED_INT) {
 	 const GLuint *in = (GLuint *)ptr;
 	 for (i = 0; i < ib->count; i++)
 	    *elts++ = (GLuint)(*in++) + VB->Primitive[0].basevertex;
       }
       else if (ib->type == GL_UNSIGNED_SHORT) {
 	 const GLushort *in = (GLushort *)ptr;
 	 for (i = 0; i < ib->count; i++)
 	    *elts++ = (GLuint)(*in++) + VB->Primitive[0].basevertex;
       }
       else {
 	 const GLubyte *in = (GLubyte *)ptr;
 	 for (i = 0; i < ib->count; i++)
 	    *elts++ = (GLuint)(*in++) + VB->Primitive[0].basevertex;
       }
    }
 }

 static void bind_prims( struct gl_context *ctx,
 			const struct _mesa_prim *prim,
 			GLuint nr_prims )
 {
    TNLcontext *tnl = TNL_CONTEXT(ctx);
    struct vertex_buffer *VB = &tnl->vb;

    VB->Primitive = prim;
    VB->PrimitiveCount = nr_prims;
 }

 static void unmap_vbos( struct gl_context *ctx,
 			struct gl_buffer_object **bo,
 			GLuint nr_bo )
 {
    GLuint i;
    for (i = 0; i < nr_bo; i++) {
       ctx->Driver.UnmapBuffer(ctx, bo[i]);
    }
 }


 void _tnl_vbo_draw_prims(struct gl_context *ctx,
 			 const struct gl_client_array *arrays[],
 			 const struct _mesa_prim *prim,
 			 GLuint nr_prims,
 			 const struct _mesa_index_buffer *ib,
 			 GLboolean index_bounds_valid,
 			 GLuint min_index,
 			 GLuint max_index)
 {
    if (!index_bounds_valid)
       vbo_get_minmax_index(ctx, prim, ib, &min_index, &max_index);

    _tnl_draw_prims(ctx, arrays, prim, nr_prims, ib, min_index, max_index);
 }

 /* This is the main entrypoint into the slimmed-down software tnl
  * module.  In a regular swtnl driver, this can be plugged straight
  * into the vbo->Driver.DrawPrims() callback.
  */
 void _tnl_draw_prims( struct gl_context *ctx,
 		      const struct gl_client_array *arrays[],
 		      const struct _mesa_prim *prim,
 		      GLuint nr_prims,
 		      const struct _mesa_index_buffer *ib,
 		      GLuint min_index,
 		      GLuint max_index)
 {
    TNLcontext *tnl = TNL_CONTEXT(ctx);
    const GLuint TEST_SPLIT = 0;
    const GLint max = TEST_SPLIT ? 8 : tnl->vb.Size - MAX_CLIPPED_VERTICES;
    GLint max_basevertex = prim->basevertex;
    GLuint i;

    /* Mesa core state should have been validated already */
    assert(ctx->NewState == 0x0);

    if (!_mesa_check_conditional_render(ctx))
       return; /* don't draw */

    for (i = 1; i < nr_prims; i++)
       max_basevertex = MAX2(max_basevertex, prim[i].basevertex);

    if (0)
    {
       printf("%s %d..%d\n", __FUNCTION__, min_index, max_index);
       for (i = 0; i < nr_prims; i++)
 	 printf("prim %d: %s start %d count %d\n", i,
 		_mesa_lookup_enum_by_nr(prim[i].mode),
 		prim[i].start,
 		prim[i].count);
    }

    if (min_index) {
       /* We always translate away calls with min_index != 0.
        */
       vbo_rebase_prims( ctx, arrays, prim, nr_prims, ib,
 			min_index, max_index,
 			_tnl_vbo_draw_prims );
       return;
    }
    else if ((GLint)max_index + max_basevertex > max) {
       /* The software TNL pipeline has a fixed amount of storage for
        * vertices and it is necessary to split incoming drawing commands
        * if they exceed that limit.
        */
       struct split_limits limits;
       limits.max_verts = max;
       limits.max_vb_size = ~0;
       limits.max_indices = ~0;

       /* This will split the buffers one way or another and
        * recursively call back into this function.
        */
       vbo_split_prims( ctx, arrays, prim, nr_prims, ib,
 		       0, max_index + prim->basevertex,
 		       _tnl_vbo_draw_prims,
 		       &limits );
    }
    else {
       /* May need to map a vertex buffer object for every attribute plus
        * one for the index buffer.
        */
       struct gl_buffer_object *bo[VERT_ATTRIB_MAX + 1];
       GLuint nr_bo = 0;
       GLuint inst;

       for (i = 0; i < nr_prims;) {
 	 GLuint this_nr_prims;

 	 /* Our SW TNL pipeline doesn't handle basevertex yet, so bind_indices
 	  * will rebase the elements to the basevertex, and we'll only
 	  * emit strings of prims with the same basevertex in one draw call.
 	  */
 	 for (this_nr_prims = 1; i + this_nr_prims < nr_prims;
 	      this_nr_prims++) {
 	    if (prim[i].basevertex != prim[i + this_nr_prims].basevertex)
 	       break;
 	 }

          assert(prim[i].num_instances > 0);

 	 /* Binding inputs may imply mapping some vertex buffer objects.
 	  * They will need to be unmapped below.
 	  */
          for (inst = 0; inst < prim[i].num_instances; inst++) {

             bind_prims(ctx, &prim[i], this_nr_prims);
             bind_inputs(ctx, arrays, max_index + prim[i].basevertex + 1,
                         bo, &nr_bo);
             bind_indices(ctx, ib, bo, &nr_bo);

             tnl->CurInstance = inst;
             TNL_CONTEXT(ctx)->Driver.RunPipeline(ctx);

             unmap_vbos(ctx, bo, nr_bo);
             free_space(ctx);
          }

 	 i += this_nr_prims;
       }
    }
 }
	/*
	* Mesa 3-D graphics library
	* Version: 7.1
	*
	* Copyright (C) 1999-2007 Brian Paul All Rights Reserved.
	*
	* Permission is hereby granted, free of charge, to any person obtaining a
	* copy of this software and associated documentation files (the "Software"),
	* to deal in the Software without restriction, including without limitation
	* the rights to use, copy, modify, merge, publish, distribute, sublicense,
	* and/or sell copies of the Software, and to permit persons to whom the
	* Software is furnished to do so, subject to the following conditions:
	*
	* The above copyright notice and this permission notice shall be included
	* in all copies or substantial portions of the Software.
	*
	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
	* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
	* BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
	* AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
	* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
	*
	* Authors:
	* Keith Whitwell <keith@tungstengraphics.com>
	*/

	#include "main/glheader.h"
	#include "main/condrender.h"
	#include "main/context.h"
	#include "main/imports.h"
	#include "main/mtypes.h"
	#include "main/macros.h"
	#include "main/enums.h"

	#include "t_context.h"
	#include "tnl.h"



	static GLubyte get_space(struct gl_context ctx, GLuint bytes)
	{
	TNLcontext *tnl = TNL_CONTEXT(ctx);
	GLubyte *space = malloc(bytes);

	tnl->block[tnl->nr_blocks++] = space;
	return space;
	}


	static void free_space(struct gl_context *ctx)
	{
	TNLcontext *tnl = TNL_CONTEXT(ctx);
	GLuint i;
	for (i = 0; i < tnl->nr_blocks; i++)
	free(tnl->block[i]);
	tnl->nr_blocks = 0;
	}


	/* Convert the incoming array to GLfloats. Understands the
	* array->Normalized flag and selects the correct conversion method.
	*/
	#define CONVERT( TYPE, MACRO ) do { \
	GLuint i, j; \
	if (input->Normalized) { \
	for (i = 0; i < count; i++) { \
	const TYPE in = (TYPE )ptr; \
	for (j = 0; j < sz; j++) { \
	fptr++ = MACRO(in); \
	in++; \
	} \
	ptr += input->StrideB; \
	} \
	} else { \
	for (i = 0; i < count; i++) { \
	const TYPE in = (TYPE )ptr; \
	for (j = 0; j < sz; j++) { \
	fptr++ = (GLfloat)(in); \
	in++; \
	} \
	ptr += input->StrideB; \
	} \
	} \
	} while (0)


	/**
	* Convert array of BGRA/GLubyte[4] values to RGBA/float[4]
	* \param ptr input/ubyte array
	* \param fptr output/float array
	*/
	static void
	convert_bgra_to_float(const struct gl_client_array *input,
	const GLubyte ptr, GLfloat fptr,
	GLuint count )
	{
	GLuint i;
	assert(input->Normalized);
	assert(input->Size == 4);
	for (i = 0; i < count; i++) {
	const GLubyte in = (GLubyte ) ptr; /* in is in BGRA order */
	fptr++ = UBYTE_TO_FLOAT(in[2]); / red */
	fptr++ = UBYTE_TO_FLOAT(in[1]); / green */
	fptr++ = UBYTE_TO_FLOAT(in[0]); / blue */
	fptr++ = UBYTE_TO_FLOAT(in[3]); / alpha */
	ptr += input->StrideB;
	}
	}

	static void
	convert_half_to_float(const struct gl_client_array *input,
	const GLubyte ptr, GLfloat fptr,
	GLuint count, GLuint sz)
	{
	GLuint i, j;

	for (i = 0; i < count; i++) {
	GLhalfARB in = (GLhalfARB )ptr;

	for (j = 0; j < sz; j++) {
	*fptr++ = _mesa_half_to_float(in[j]);
	}
	ptr += input->StrideB;
	}
	}

	/**
	* \brief Convert fixed-point to floating-point.
	*
	* In OpenGL, a fixed-point number is a "signed 2's complement 16.16 scaled
	* integer" (Table 2.2 of the OpenGL ES 2.0 spec).
	*
	* If the buffer has the \c normalized flag set, the formula
	* \code normalize(x) := (2*x + 1) / (2^16 - 1) \endcode
	* is used to map the fixed-point numbers into the range [-1, 1].
	*/
	static void
	convert_fixed_to_float(const struct gl_client_array *input,
	const GLubyte ptr, GLfloat fptr,
	GLuint count)
	{
	GLuint i, j;
	const GLint size = input->Size;

	if (input->Normalized) {
	for (i = 0; i < count; ++i) {
	const GLfixed in = (GLfixed ) ptr;
	for (j = 0; j < size; ++j) {
	fptr++ = (GLfloat) (2 in[j] + 1) / (GLfloat) ((1 << 16) - 1);
	}
	ptr += input->StrideB;
	}
	} else {
	for (i = 0; i < count; ++i) {
	const GLfixed in = (GLfixed ) ptr;
	for (j = 0; j < size; ++j) {
	*fptr++ = in[j] / (GLfloat) (1 << 16);
	}
	ptr += input->StrideB;
	}
	}
	}

	/* Adjust pointer to point at first requested element, convert to
	* floating point, populate VB->AttribPtr[].
	*/
	static void _tnl_import_array( struct gl_context *ctx,
	GLuint attrib,
	GLuint count,
	const struct gl_client_array *input,
	const GLubyte *ptr )
	{
	TNLcontext *tnl = TNL_CONTEXT(ctx);
	struct vertex_buffer *VB = &tnl->vb;
	GLuint stride = input->StrideB;

	if (input->Type != GL_FLOAT) {
	const GLuint sz = input->Size;
	GLubyte buf = get_space(ctx, count sz * sizeof(GLfloat));
	GLfloat fptr = (GLfloat )buf;

	switch (input->Type) {
	case GL_BYTE:
	CONVERT(GLbyte, BYTE_TO_FLOAT);
	break;
	case GL_UNSIGNED_BYTE:
	if (input->Format == GL_BGRA) {
	/* See GL_EXT_vertex_array_bgra */
	convert_bgra_to_float(input, ptr, fptr, count);
	}
	else {
	CONVERT(GLubyte, UBYTE_TO_FLOAT);
	}
	break;
	case GL_SHORT:
	CONVERT(GLshort, SHORT_TO_FLOAT);
	break;
	case GL_UNSIGNED_SHORT:
	CONVERT(GLushort, USHORT_TO_FLOAT);
	break;
	case GL_INT:
	CONVERT(GLint, INT_TO_FLOAT);
	break;
	case GL_UNSIGNED_INT:
	CONVERT(GLuint, UINT_TO_FLOAT);
	break;
	case GL_DOUBLE:
	CONVERT(GLdouble, (GLfloat));
	break;
	case GL_HALF_FLOAT:
	convert_half_to_float(input, ptr, fptr, count, sz);
	break;
	case GL_FIXED:
	convert_fixed_to_float(input, ptr, fptr, count);
	break;
	default:
	assert(0);
	break;
	}

	ptr = buf;
	stride = sz * sizeof(GLfloat);
	}

	VB->AttribPtr[attrib] = &tnl->tmp_inputs[attrib];
	VB->AttribPtr[attrib]->data = (GLfloat (*)[4])ptr;
	VB->AttribPtr[attrib]->start = (GLfloat *)ptr;
	VB->AttribPtr[attrib]->count = count;
	VB->AttribPtr[attrib]->stride = stride;
	VB->AttribPtr[attrib]->size = input->Size;

	/* This should die, but so should the whole GLvector4f concept:
	*/
	VB->AttribPtr[attrib]->flags = (((1<<input->Size)-1) \|
	VEC_NOT_WRITEABLE \|
	(stride == 4*sizeof(GLfloat) ? 0 : VEC_BAD_STRIDE));

	VB->AttribPtr[attrib]->storage = NULL;
	}

	#define CLIPVERTS ((6 + MAX_CLIP_PLANES) * 2)


	static GLboolean _tnl_import_edgeflag( struct gl_context ctx,
	const GLvector4f *input,
	GLuint count)
	{
	const GLubyte ptr = (const GLubyte )input->data;
	const GLuint stride = input->stride;
	GLboolean space = (GLboolean )get_space(ctx, count + CLIPVERTS);
	GLboolean *bptr = space;
	GLuint i;

	for (i = 0; i < count; i++) {
	bptr++ = ((GLfloat )ptr)[0] == 1.0;
	ptr += stride;
	}

	return space;
	}


	static void bind_inputs( struct gl_context *ctx,
	const struct gl_client_array *inputs[],
	GLint count,
	struct gl_buffer_object **bo,
	GLuint *nr_bo )
	{
	TNLcontext *tnl = TNL_CONTEXT(ctx);
	struct vertex_buffer *VB = &tnl->vb;
	GLuint i;

	/* Map all the VBOs
	*/
	for (i = 0; i < VERT_ATTRIB_MAX; i++) {
	const void *ptr;

	if (inputs[i]->BufferObj->Name) {
	if (!inputs[i]->BufferObj->Pointer) {
	bo[*nr_bo] = inputs[i]->BufferObj;
	(*nr_bo)++;
	ctx->Driver.MapBuffer(ctx,
	GL_ARRAY_BUFFER,
	GL_READ_ONLY_ARB,
	inputs[i]->BufferObj);

	assert(inputs[i]->BufferObj->Pointer);
	}

	ptr = ADD_POINTERS(inputs[i]->BufferObj->Pointer,
	inputs[i]->Ptr);
	}
	else
	ptr = inputs[i]->Ptr;

	/* Just make sure the array is floating point, otherwise convert to
	* temporary storage.
	*
	* XXX: remove the GLvector4f type at some stage and just use
	* client arrays.
	*/
	_tnl_import_array(ctx, i, count, inputs[i], ptr);
	}

	/* We process only the vertices between min & max index:
	*/
	VB->Count = count;

	/* These should perhaps be part of _TNL_ATTRIB_* */
	VB->BackfaceColorPtr = NULL;
	VB->BackfaceIndexPtr = NULL;
	VB->BackfaceSecondaryColorPtr = NULL;

	/* Clipping and drawing code still requires this to be a packed
	* array of ubytes which can be written into. TODO: Fix and
	* remove.
	*/
	if (ctx->Polygon.FrontMode != GL_FILL \|\|
	ctx->Polygon.BackMode != GL_FILL)
	{
	VB->EdgeFlag = _tnl_import_edgeflag( ctx,
	VB->AttribPtr[_TNL_ATTRIB_EDGEFLAG],
	VB->Count );
	}
	else {
	/* the data previously pointed to by EdgeFlag may have been freed */
	VB->EdgeFlag = NULL;
	}
	}


	/* Translate indices to GLuints and store in VB->Elts.
	*/
	static void bind_indices( struct gl_context *ctx,
	const struct _mesa_index_buffer *ib,
	struct gl_buffer_object **bo,
	GLuint *nr_bo)
	{
	TNLcontext *tnl = TNL_CONTEXT(ctx);
	struct vertex_buffer *VB = &tnl->vb;
	GLuint i;
	void *ptr;

	if (!ib) {
	VB->Elts = NULL;
	return;
	}

	if (ib->obj->Name && !ib->obj->Pointer) {
	bo[*nr_bo] = ib->obj;
	(*nr_bo)++;
	ctx->Driver.MapBuffer(ctx,
	GL_ELEMENT_ARRAY_BUFFER,
	GL_READ_ONLY_ARB,
	ib->obj);

	assert(ib->obj->Pointer);
	}

	ptr = ADD_POINTERS(ib->obj->Pointer, ib->ptr);

	if (ib->type == GL_UNSIGNED_INT && VB->Primitive[0].basevertex == 0) {
	VB->Elts = (GLuint *) ptr;
	}
	else {
	GLuint elts = (GLuint )get_space(ctx, ib->count * sizeof(GLuint));
	VB->Elts = elts;

	if (ib->type == GL_UNSIGNED_INT) {
	const GLuint in = (GLuint )ptr;
	for (i = 0; i < ib->count; i++)
	elts++ = (GLuint)(in++) + VB->Primitive[0].basevertex;
	}
	else if (ib->type == GL_UNSIGNED_SHORT) {
	const GLushort in = (GLushort )ptr;
	for (i = 0; i < ib->count; i++)
	elts++ = (GLuint)(in++) + VB->Primitive[0].basevertex;
	}
	else {
	const GLubyte in = (GLubyte )ptr;
	for (i = 0; i < ib->count; i++)
	elts++ = (GLuint)(in++) + VB->Primitive[0].basevertex;
	}
	}
	}

	static void bind_prims( struct gl_context *ctx,
	const struct _mesa_prim *prim,
	GLuint nr_prims )
	{
	TNLcontext *tnl = TNL_CONTEXT(ctx);
	struct vertex_buffer *VB = &tnl->vb;

	VB->Primitive = prim;
	VB->PrimitiveCount = nr_prims;
	}

	static void unmap_vbos( struct gl_context *ctx,
	struct gl_buffer_object **bo,
	GLuint nr_bo )
	{
	GLuint i;
	for (i = 0; i < nr_bo; i++) {
	ctx->Driver.UnmapBuffer(ctx, bo[i]);
	}
	}


	void _tnl_vbo_draw_prims(struct gl_context *ctx,
	const struct gl_client_array *arrays[],
	const struct _mesa_prim *prim,
	GLuint nr_prims,
	const struct _mesa_index_buffer *ib,
	GLboolean index_bounds_valid,
	GLuint min_index,
	GLuint max_index)
	{
	if (!index_bounds_valid)
	vbo_get_minmax_index(ctx, prim, ib, &min_index, &max_index);

	_tnl_draw_prims(ctx, arrays, prim, nr_prims, ib, min_index, max_index);
	}

	/* This is the main entrypoint into the slimmed-down software tnl
	* module. In a regular swtnl driver, this can be plugged straight
	* into the vbo->Driver.DrawPrims() callback.
	*/
	void _tnl_draw_prims( struct gl_context *ctx,
	const struct gl_client_array *arrays[],
	const struct _mesa_prim *prim,
	GLuint nr_prims,
	const struct _mesa_index_buffer *ib,
	GLuint min_index,
	GLuint max_index)
	{
	TNLcontext *tnl = TNL_CONTEXT(ctx);
	const GLuint TEST_SPLIT = 0;
	const GLint max = TEST_SPLIT ? 8 : tnl->vb.Size - MAX_CLIPPED_VERTICES;
	GLint max_basevertex = prim->basevertex;
	GLuint i;

	/* Mesa core state should have been validated already */
	assert(ctx->NewState == 0x0);

	if (!_mesa_check_conditional_render(ctx))
	return; /* don't draw */

	for (i = 1; i < nr_prims; i++)
	max_basevertex = MAX2(max_basevertex, prim[i].basevertex);

	if (0)
	{
	printf("%s %d..%d\n", __FUNCTION__, min_index, max_index);
	for (i = 0; i < nr_prims; i++)
	printf("prim %d: %s start %d count %d\n", i,
	_mesa_lookup_enum_by_nr(prim[i].mode),
	prim[i].start,
	prim[i].count);
	}

	if (min_index) {
	/* We always translate away calls with min_index != 0.
	*/
	vbo_rebase_prims( ctx, arrays, prim, nr_prims, ib,
	min_index, max_index,
	_tnl_vbo_draw_prims );
	return;
	}
	else if ((GLint)max_index + max_basevertex > max) {
	/* The software TNL pipeline has a fixed amount of storage for
	* vertices and it is necessary to split incoming drawing commands
	* if they exceed that limit.
	*/
	struct split_limits limits;
	limits.max_verts = max;
	limits.max_vb_size = ~0;
	limits.max_indices = ~0;

	/* This will split the buffers one way or another and
	* recursively call back into this function.
	*/
	vbo_split_prims( ctx, arrays, prim, nr_prims, ib,
	0, max_index + prim->basevertex,
	_tnl_vbo_draw_prims,
	&limits );
	}
	else {
	/* May need to map a vertex buffer object for every attribute plus
	* one for the index buffer.
	*/
	struct gl_buffer_object *bo[VERT_ATTRIB_MAX + 1];
	GLuint nr_bo = 0;
	GLuint inst;

	for (i = 0; i < nr_prims;) {
	GLuint this_nr_prims;

	/* Our SW TNL pipeline doesn't handle basevertex yet, so bind_indices
	* will rebase the elements to the basevertex, and we'll only
	* emit strings of prims with the same basevertex in one draw call.
	*/
	for (this_nr_prims = 1; i + this_nr_prims < nr_prims;
	this_nr_prims++) {
	if (prim[i].basevertex != prim[i + this_nr_prims].basevertex)
	break;
	}

	assert(prim[i].num_instances > 0);

	/* Binding inputs may imply mapping some vertex buffer objects.
	* They will need to be unmapped below.
	*/
	for (inst = 0; inst < prim[i].num_instances; inst++) {

	bind_prims(ctx, &prim[i], this_nr_prims);
	bind_inputs(ctx, arrays, max_index + prim[i].basevertex + 1,
	bo, &nr_bo);
	bind_indices(ctx, ib, bo, &nr_bo);

	tnl->CurInstance = inst;
	TNL_CONTEXT(ctx)->Driver.RunPipeline(ctx);

	unmap_vbos(ctx, bo, nr_bo);
	free_space(ctx);
	}

	i += this_nr_prims;
	}
	}
	}