/************************************************************************** * * Copyright 2007 Tungsten Graphics, Inc., Cedar Park, Texas. * All Rights Reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the * "Software"), to deal in the Software without restriction, including * without limitation the rights to use, copy, modify, merge, publish, * distribute, sub license, and/or sell copies of the Software, and to * permit persons to whom the Software is furnished to do so, subject to * the following conditions: * * The above copyright notice and this permission notice (including the * next paragraph) shall be included in all copies or substantial portions * of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. * **************************************************************************/ /** * \file * Vertex buffer drawing stage. * * \author José Fonseca * \author Keith Whitwell */ #include "pipe/p_debug.h" #include "pipe/p_util.h" #include "draw_vbuf.h" #include "draw_private.h" #include "draw_vertex.h" #include "draw_pipe.h" #include "translate/translate.h" /** * Vertex buffer emit stage. */ struct vbuf_stage { struct draw_stage stage; /**< This must be first (base class) */ struct vbuf_render *render; const struct vertex_info *vinfo; /** Vertex size in bytes */ unsigned vertex_size; struct translate *translate; /* FIXME: we have no guarantee that 'unsigned' is 32bit */ /** Vertices in hardware format */ unsigned *vertices; unsigned *vertex_ptr; unsigned max_vertices; unsigned nr_vertices; /** Indices */ ushort *indices; unsigned max_indices; unsigned nr_indices; /* Cache point size somewhere it's address won't change: */ float point_size; }; /** * Basically a cast wrapper. */ static INLINE struct vbuf_stage * vbuf_stage( struct draw_stage *stage ) { assert(stage); return (struct vbuf_stage *)stage; } static void vbuf_flush_indices( struct vbuf_stage *vbuf ); static void vbuf_flush_vertices( struct vbuf_stage *vbuf ); static void vbuf_alloc_vertices( struct vbuf_stage *vbuf ); static INLINE boolean overflow( void *map, void *ptr, unsigned bytes, unsigned bufsz ) { unsigned long used = (unsigned long) ((char *)ptr - (char *)map); return (used + bytes) > bufsz; } static INLINE void check_space( struct vbuf_stage *vbuf, unsigned nr ) { if (vbuf->nr_vertices + nr > vbuf->max_vertices ) { vbuf_flush_vertices(vbuf); vbuf_alloc_vertices(vbuf); } if (vbuf->nr_indices + nr > vbuf->max_indices ) vbuf_flush_indices(vbuf); } static INLINE void dump_emitted_vertex(const struct vertex_info *vinfo, const uint8_t *data) { // assert(vinfo == vbuf->render->get_vertex_info(vbuf->render)); unsigned i, j; for (i = 0; i < vinfo->num_attribs; i++) { j = vinfo->src_index[i]; switch (vinfo->emit[i]) { case EMIT_OMIT: debug_printf("EMIT_OMIT:"); break; case EMIT_1F: debug_printf("EMIT_1F:\t"); debug_printf("%f ", *(float *)data); data += sizeof(float); break; case EMIT_1F_PSIZE: debug_printf("EMIT_1F_PSIZE:\t"); debug_printf("%f ", *(float *)data); data += sizeof(float); break; case EMIT_2F: debug_printf("EMIT_2F:\t"); debug_printf("%f ", *(float *)data); data += sizeof(float); debug_printf("%f ", *(float *)data); data += sizeof(float); break; case EMIT_3F: debug_printf("EMIT_3F:\t"); debug_printf("%f ", *(float *)data); data += sizeof(float); debug_printf("%f ", *(float *)data); data += sizeof(float); debug_printf("%f ", *(float *)data); data += sizeof(float); data += sizeof(float); break; case EMIT_4F: debug_printf("EMIT_4F:\t"); debug_printf("%f ", *(float *)data); data += sizeof(float); debug_printf("%f ", *(float *)data); data += sizeof(float); debug_printf("%f ", *(float *)data); data += sizeof(float); debug_printf("%f ", *(float *)data); data += sizeof(float); break; case EMIT_4UB: debug_printf("EMIT_4UB:\t"); debug_printf("%u ", *data++); debug_printf("%u ", *data++); debug_printf("%u ", *data++); debug_printf("%u ", *data++); break; default: assert(0); } debug_printf("\n"); } debug_printf("\n"); } /** * Extract the needed fields from post-transformed vertex and emit * a hardware(driver) vertex. * Recall that the vertices are constructed by the 'draw' module and * have a couple of slots at the beginning (1-dword header, 4-dword * clip pos) that we ignore here. We only use the vertex->data[] fields. */ static INLINE ushort emit_vertex( struct vbuf_stage *vbuf, struct vertex_header *vertex ) { if(vertex->vertex_id == UNDEFINED_VERTEX_ID) { /* Hmm - vertices are emitted one at a time - better make sure * set_buffer is efficient. Consider a special one-shot mode for * translate. */ vbuf->translate->set_buffer(vbuf->translate, 0, vertex->data[0], 0); vbuf->translate->run(vbuf->translate, 0, 1, vbuf->vertex_ptr); if (0) dump_emitted_vertex(vbuf->vinfo, (uint8_t *)vbuf->vertex_ptr); vbuf->vertex_ptr += vbuf->vertex_size/4; vertex->vertex_id = vbuf->nr_vertices++; } return vertex->vertex_id; } static void vbuf_tri( struct draw_stage *stage, struct prim_header *prim ) { struct vbuf_stage *vbuf = vbuf_stage( stage ); unsigned i; check_space( vbuf, 3 ); for (i = 0; i < 3; i++) { vbuf->indices[vbuf->nr_indices++] = emit_vertex( vbuf, prim->v[i] ); } } static void vbuf_line( struct draw_stage *stage, struct prim_header *prim ) { struct vbuf_stage *vbuf = vbuf_stage( stage ); unsigned i; check_space( vbuf, 2 ); for (i = 0; i < 2; i++) { vbuf->indices[vbuf->nr_indices++] = emit_vertex( vbuf, prim->v[i] ); } } static void vbuf_point( struct draw_stage *stage, struct prim_header *prim ) { struct vbuf_stage *vbuf = vbuf_stage( stage ); check_space( vbuf, 1 ); vbuf->indices[vbuf->nr_indices++] = emit_vertex( vbuf, prim->v[0] ); } /** * Set the prim type for subsequent vertices. * This may result in a new vertex size. The existing vbuffer (if any) * will be flushed if needed and a new one allocated. */ static void vbuf_set_prim( struct vbuf_stage *vbuf, uint prim ) { struct translate_key hw_key; unsigned dst_offset; unsigned i; vbuf->render->set_primitive(vbuf->render, prim); /* Must do this after set_primitive() above: * * XXX: need some state managment to track when this needs to be * recalculated. The driver should tell us whether there was a * state change. */ vbuf->vinfo = vbuf->render->get_vertex_info(vbuf->render); if (vbuf->vertex_size != vbuf->vinfo->size * sizeof(float)) { vbuf_flush_vertices(vbuf); vbuf->vertex_size = vbuf->vinfo->size * sizeof(float); } /* Translate from pipeline vertices to hw vertices. */ dst_offset = 0; memset(&hw_key, 0, sizeof(hw_key)); for (i = 0; i < vbuf->vinfo->num_attribs; i++) { unsigned emit_sz = 0; unsigned src_buffer = 0; unsigned output_format; unsigned src_offset = (vbuf->vinfo->src_index[i] * 4 * sizeof(float) ); switch (vbuf->vinfo->emit[i]) { case EMIT_4F: output_format = PIPE_FORMAT_R32G32B32A32_FLOAT; emit_sz = 4 * sizeof(float); break; case EMIT_3F: output_format = PIPE_FORMAT_R32G32B32_FLOAT; emit_sz = 3 * sizeof(float); break; case EMIT_2F: output_format = PIPE_FORMAT_R32G32_FLOAT; emit_sz = 2 * sizeof(float); break; case EMIT_1F: output_format = PIPE_FORMAT_R32_FLOAT; emit_sz = 1 * sizeof(float); break; case EMIT_1F_PSIZE: output_format = PIPE_FORMAT_R32_FLOAT; emit_sz = 1 * sizeof(float); src_buffer = 1; src_offset = 0; break; case EMIT_4UB: output_format = PIPE_FORMAT_B8G8R8A8_UNORM; emit_sz = 4 * sizeof(ubyte); default: assert(0); output_format = PIPE_FORMAT_NONE; emit_sz = 0; break; } hw_key.element[i].input_format = PIPE_FORMAT_R32G32B32A32_FLOAT; hw_key.element[i].input_buffer = src_buffer; hw_key.element[i].input_offset = src_offset; hw_key.element[i].output_format = output_format; hw_key.element[i].output_offset = dst_offset; dst_offset += emit_sz; } hw_key.nr_elements = vbuf->vinfo->num_attribs; hw_key.output_stride = vbuf->vinfo->size * 4; /* Don't bother with caching at this stage: */ if (!vbuf->translate || memcmp(&vbuf->translate->key, &hw_key, sizeof(hw_key)) != 0) { if (vbuf->translate) vbuf->translate->release(vbuf->translate); vbuf->translate = translate_create( &hw_key ); vbuf->translate->set_buffer(vbuf->translate, 1, &vbuf->point_size, 0); } vbuf->point_size = vbuf->stage.draw->rasterizer->point_size; /* Allocate new buffer? */ if (!vbuf->vertices) vbuf_alloc_vertices(vbuf); } static void vbuf_first_tri( struct draw_stage *stage, struct prim_header *prim ) { struct vbuf_stage *vbuf = vbuf_stage( stage ); vbuf_flush_indices( vbuf ); stage->tri = vbuf_tri; vbuf_set_prim(vbuf, PIPE_PRIM_TRIANGLES); stage->tri( stage, prim ); } static void vbuf_first_line( struct draw_stage *stage, struct prim_header *prim ) { struct vbuf_stage *vbuf = vbuf_stage( stage ); vbuf_flush_indices( vbuf ); stage->line = vbuf_line; vbuf_set_prim(vbuf, PIPE_PRIM_LINES); stage->line( stage, prim ); } static void vbuf_first_point( struct draw_stage *stage, struct prim_header *prim ) { struct vbuf_stage *vbuf = vbuf_stage( stage ); vbuf_flush_indices( vbuf ); stage->point = vbuf_point; vbuf_set_prim(vbuf, PIPE_PRIM_POINTS); stage->point( stage, prim ); } static void vbuf_flush_indices( struct vbuf_stage *vbuf ) { if(!vbuf->nr_indices) return; assert((uint) (vbuf->vertex_ptr - vbuf->vertices) == vbuf->nr_vertices * vbuf->vertex_size / sizeof(unsigned)); vbuf->render->draw(vbuf->render, vbuf->indices, vbuf->nr_indices); vbuf->nr_indices = 0; } /** * Flush existing vertex buffer and allocate a new one. * * XXX: We separate flush-on-index-full and flush-on-vb-full, but may * raise issues uploading vertices if the hardware wants to flush when * we flush. */ static void vbuf_flush_vertices( struct vbuf_stage *vbuf ) { if(vbuf->vertices) { vbuf_flush_indices(vbuf); /* Reset temporary vertices ids */ if(vbuf->nr_vertices) draw_reset_vertex_ids( vbuf->stage.draw ); /* Free the vertex buffer */ vbuf->render->release_vertices(vbuf->render, vbuf->vertices, vbuf->vertex_size, vbuf->nr_vertices); vbuf->max_vertices = vbuf->nr_vertices = 0; vbuf->vertex_ptr = vbuf->vertices = NULL; } } static void vbuf_alloc_vertices( struct vbuf_stage *vbuf ) { assert(!vbuf->nr_indices); assert(!vbuf->vertices); /* Allocate a new vertex buffer */ vbuf->max_vertices = vbuf->render->max_vertex_buffer_bytes / vbuf->vertex_size; vbuf->vertices = (uint *) vbuf->render->allocate_vertices(vbuf->render, (ushort) vbuf->vertex_size, (ushort) vbuf->max_vertices); vbuf->vertex_ptr = vbuf->vertices; } static void vbuf_flush( struct draw_stage *stage, unsigned flags ) { struct vbuf_stage *vbuf = vbuf_stage( stage ); vbuf_flush_indices( vbuf ); stage->point = vbuf_first_point; stage->line = vbuf_first_line; stage->tri = vbuf_first_tri; if (flags & DRAW_FLUSH_BACKEND) vbuf_flush_vertices( vbuf ); } static void vbuf_reset_stipple_counter( struct draw_stage *stage ) { /* XXX: Need to do something here for hardware with linestipple. */ (void) stage; } static void vbuf_destroy( struct draw_stage *stage ) { struct vbuf_stage *vbuf = vbuf_stage( stage ); if(vbuf->indices) align_free( vbuf->indices ); if(vbuf->translate) vbuf->translate->release( vbuf->translate ); if (vbuf->render) vbuf->render->destroy( vbuf->render ); FREE( stage ); } /** * Create a new primitive vbuf/render stage. */ struct draw_stage *draw_vbuf_stage( struct draw_context *draw, struct vbuf_render *render ) { struct vbuf_stage *vbuf = CALLOC_STRUCT(vbuf_stage); if(!vbuf) goto fail; vbuf->stage.draw = draw; vbuf->stage.point = vbuf_first_point; vbuf->stage.line = vbuf_first_line; vbuf->stage.tri = vbuf_first_tri; vbuf->stage.flush = vbuf_flush; vbuf->stage.reset_stipple_counter = vbuf_reset_stipple_counter; vbuf->stage.destroy = vbuf_destroy; vbuf->render = render; vbuf->max_indices = MAX2(render->max_indices, UNDEFINED_VERTEX_ID-1); vbuf->indices = (ushort *) align_malloc( vbuf->max_indices * sizeof(vbuf->indices[0]), 16 ); if(!vbuf->indices) goto fail; vbuf->vertices = NULL; vbuf->vertex_ptr = vbuf->vertices; return &vbuf->stage; fail: if (vbuf) vbuf_destroy(&vbuf->stage); return NULL; }