/* Copyright (C) Intel Corp. 2006. All Rights Reserved. Intel funded Tungsten Graphics (http://www.tungstengraphics.com) to develop this 3D driver. Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice (including the next paragraph) shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. **********************************************************************/ /* * Authors: * Keith Whitwell */ #include "main/mtypes.h" #include "main/texstore.h" #include "program/prog_parameter.h" #include "intel_mipmap_tree.h" #include "intel_batchbuffer.h" #include "intel_tex.h" #include "intel_fbo.h" #include "brw_context.h" #include "brw_state.h" #include "brw_defines.h" static GLuint translate_tex_target( GLenum target ) { switch (target) { case GL_TEXTURE_1D: return BRW_SURFACE_1D; case GL_TEXTURE_RECTANGLE_NV: return BRW_SURFACE_2D; case GL_TEXTURE_2D: return BRW_SURFACE_2D; case GL_TEXTURE_3D: return BRW_SURFACE_3D; case GL_TEXTURE_CUBE_MAP: return BRW_SURFACE_CUBE; default: assert(0); return 0; } } static GLuint translate_tex_format( gl_format mesa_format, GLenum internal_format, GLenum depth_mode ) { switch( mesa_format ) { case MESA_FORMAT_L8: return BRW_SURFACEFORMAT_L8_UNORM; case MESA_FORMAT_I8: return BRW_SURFACEFORMAT_I8_UNORM; case MESA_FORMAT_A8: return BRW_SURFACEFORMAT_A8_UNORM; case MESA_FORMAT_AL88: return BRW_SURFACEFORMAT_L8A8_UNORM; case MESA_FORMAT_AL1616: return BRW_SURFACEFORMAT_L16A16_UNORM; case MESA_FORMAT_R8: return BRW_SURFACEFORMAT_R8_UNORM; case MESA_FORMAT_R16: return BRW_SURFACEFORMAT_R16_UNORM; case MESA_FORMAT_RG88: return BRW_SURFACEFORMAT_R8G8_UNORM; case MESA_FORMAT_RG1616: return BRW_SURFACEFORMAT_R16G16_UNORM; case MESA_FORMAT_RGB888: assert(0); /* not supported for sampling */ return BRW_SURFACEFORMAT_R8G8B8_UNORM; case MESA_FORMAT_ARGB8888: return BRW_SURFACEFORMAT_B8G8R8A8_UNORM; case MESA_FORMAT_XRGB8888: return BRW_SURFACEFORMAT_B8G8R8X8_UNORM; case MESA_FORMAT_RGBA8888_REV: _mesa_problem(NULL, "unexpected format in i965:translate_tex_format()"); return BRW_SURFACEFORMAT_R8G8B8A8_UNORM; case MESA_FORMAT_RGB565: return BRW_SURFACEFORMAT_B5G6R5_UNORM; case MESA_FORMAT_ARGB1555: return BRW_SURFACEFORMAT_B5G5R5A1_UNORM; case MESA_FORMAT_ARGB4444: return BRW_SURFACEFORMAT_B4G4R4A4_UNORM; case MESA_FORMAT_YCBCR_REV: return BRW_SURFACEFORMAT_YCRCB_NORMAL; case MESA_FORMAT_YCBCR: return BRW_SURFACEFORMAT_YCRCB_SWAPUVY; case MESA_FORMAT_RGB_FXT1: case MESA_FORMAT_RGBA_FXT1: return BRW_SURFACEFORMAT_FXT1; case MESA_FORMAT_Z16: if (depth_mode == GL_INTENSITY) return BRW_SURFACEFORMAT_I16_UNORM; else if (depth_mode == GL_ALPHA) return BRW_SURFACEFORMAT_A16_UNORM; else return BRW_SURFACEFORMAT_L16_UNORM; case MESA_FORMAT_RGB_DXT1: return BRW_SURFACEFORMAT_DXT1_RGB; case MESA_FORMAT_RGBA_DXT1: return BRW_SURFACEFORMAT_BC1_UNORM; case MESA_FORMAT_RGBA_DXT3: return BRW_SURFACEFORMAT_BC2_UNORM; case MESA_FORMAT_RGBA_DXT5: return BRW_SURFACEFORMAT_BC3_UNORM; case MESA_FORMAT_SARGB8: return BRW_SURFACEFORMAT_B8G8R8A8_UNORM_SRGB; case MESA_FORMAT_SLA8: return BRW_SURFACEFORMAT_L8A8_UNORM_SRGB; case MESA_FORMAT_SL8: return BRW_SURFACEFORMAT_L8_UNORM_SRGB; case MESA_FORMAT_SRGB_DXT1: return BRW_SURFACEFORMAT_BC1_UNORM_SRGB; case MESA_FORMAT_S8_Z24: /* XXX: these different surface formats don't seem to * make any difference for shadow sampler/compares. */ if (depth_mode == GL_INTENSITY) return BRW_SURFACEFORMAT_I24X8_UNORM; else if (depth_mode == GL_ALPHA) return BRW_SURFACEFORMAT_A24X8_UNORM; else return BRW_SURFACEFORMAT_L24X8_UNORM; case MESA_FORMAT_DUDV8: return BRW_SURFACEFORMAT_R8G8_SNORM; case MESA_FORMAT_SIGNED_RGBA8888_REV: return BRW_SURFACEFORMAT_R8G8B8A8_SNORM; default: assert(0); return 0; } } static void brw_set_surface_tiling(struct brw_surface_state *surf, uint32_t tiling) { switch (tiling) { case I915_TILING_NONE: surf->ss3.tiled_surface = 0; surf->ss3.tile_walk = 0; break; case I915_TILING_X: surf->ss3.tiled_surface = 1; surf->ss3.tile_walk = BRW_TILEWALK_XMAJOR; break; case I915_TILING_Y: surf->ss3.tiled_surface = 1; surf->ss3.tile_walk = BRW_TILEWALK_YMAJOR; break; } } static void brw_update_texture_surface( struct gl_context *ctx, GLuint unit ) { struct brw_context *brw = brw_context(ctx); struct gl_texture_object *tObj = ctx->Texture.Unit[unit]._Current; struct intel_texture_object *intelObj = intel_texture_object(tObj); struct gl_texture_image *firstImage = tObj->Image[0][intelObj->firstLevel]; const GLuint surf_index = SURF_INDEX_TEXTURE(unit); struct brw_surface_state surf; void *map; memset(&surf, 0, sizeof(surf)); surf.ss0.mipmap_layout_mode = BRW_SURFACE_MIPMAPLAYOUT_BELOW; surf.ss0.surface_type = translate_tex_target(tObj->Target); surf.ss0.surface_format = translate_tex_format(firstImage->TexFormat, firstImage->InternalFormat, tObj->DepthMode); /* This is ok for all textures with channel width 8bit or less: */ /* surf.ss0.data_return_format = BRW_SURFACERETURNFORMAT_S1; */ surf.ss1.base_addr = intelObj->mt->region->buffer->offset; /* reloc */ surf.ss2.mip_count = intelObj->lastLevel - intelObj->firstLevel; surf.ss2.width = firstImage->Width - 1; surf.ss2.height = firstImage->Height - 1; brw_set_surface_tiling(&surf, intelObj->mt->region->tiling); surf.ss3.pitch = (intelObj->mt->region->pitch * intelObj->mt->cpp) - 1; surf.ss3.depth = firstImage->Depth - 1; surf.ss4.min_lod = 0; if (tObj->Target == GL_TEXTURE_CUBE_MAP) { surf.ss0.cube_pos_x = 1; surf.ss0.cube_pos_y = 1; surf.ss0.cube_pos_z = 1; surf.ss0.cube_neg_x = 1; surf.ss0.cube_neg_y = 1; surf.ss0.cube_neg_z = 1; } map = brw_state_batch(brw, sizeof(surf), 32, &brw->wm.surf_bo[surf_index], &brw->wm.surf_offset[surf_index]); memcpy(map, &surf, sizeof(surf)); /* Emit relocation to surface contents */ drm_intel_bo_emit_reloc(brw->wm.surf_bo[surf_index], brw->wm.surf_offset[surf_index] + offsetof(struct brw_surface_state, ss1), intelObj->mt->region->buffer, 0, I915_GEM_DOMAIN_SAMPLER, 0); } /** * Create the constant buffer surface. Vertex/fragment shader constants will be * read from this buffer with Data Port Read instructions/messages. */ void brw_create_constant_surface(struct brw_context *brw, drm_intel_bo *bo, int width, drm_intel_bo **out_bo, uint32_t *out_offset) { const GLint w = width - 1; struct brw_surface_state surf; void *map; memset(&surf, 0, sizeof(surf)); surf.ss0.mipmap_layout_mode = BRW_SURFACE_MIPMAPLAYOUT_BELOW; surf.ss0.surface_type = BRW_SURFACE_BUFFER; surf.ss0.surface_format = BRW_SURFACEFORMAT_R32G32B32A32_FLOAT; assert(bo); surf.ss1.base_addr = bo->offset; /* reloc */ surf.ss2.width = w & 0x7f; /* bits 6:0 of size or width */ surf.ss2.height = (w >> 7) & 0x1fff; /* bits 19:7 of size or width */ surf.ss3.depth = (w >> 20) & 0x7f; /* bits 26:20 of size or width */ surf.ss3.pitch = (width * 16) - 1; /* ignored?? */ brw_set_surface_tiling(&surf, I915_TILING_NONE); /* tiling now allowed */ map = brw_state_batch(brw, sizeof(surf), 32, out_bo, out_offset); memcpy(map, &surf, sizeof(surf)); /* Emit relocation to surface contents. Section 5.1.1 of the gen4 * bspec ("Data Cache") says that the data cache does not exist as * a separate cache and is just the sampler cache. */ drm_intel_bo_emit_reloc(*out_bo, (*out_offset + offsetof(struct brw_surface_state, ss1)), bo, 0, I915_GEM_DOMAIN_SAMPLER, 0); } /* Creates a new WM constant buffer reflecting the current fragment program's * constants, if needed by the fragment program. * * Otherwise, constants go through the CURBEs using the brw_constant_buffer * state atom. */ static void prepare_wm_constants(struct brw_context *brw) { struct gl_context *ctx = &brw->intel.ctx; struct intel_context *intel = &brw->intel; struct brw_fragment_program *fp = (struct brw_fragment_program *) brw->fragment_program; const int size = brw->wm.prog_data->nr_pull_params * sizeof(float); float *constants; unsigned int i; _mesa_load_state_parameters(ctx, fp->program.Base.Parameters); /* BRW_NEW_FRAGMENT_PROGRAM */ if (brw->wm.prog_data->nr_pull_params == 0) { if (brw->wm.const_bo) { drm_intel_bo_unreference(brw->wm.const_bo); brw->wm.const_bo = NULL; brw->state.dirty.brw |= BRW_NEW_WM_CONSTBUF; } return; } drm_intel_bo_unreference(brw->wm.const_bo); brw->wm.const_bo = drm_intel_bo_alloc(intel->bufmgr, "WM const bo", size, 64); /* _NEW_PROGRAM_CONSTANTS */ drm_intel_gem_bo_map_gtt(brw->wm.const_bo); constants = brw->wm.const_bo->virtual; for (i = 0; i < brw->wm.prog_data->nr_pull_params; i++) { constants[i] = convert_param(brw->wm.prog_data->pull_param_convert[i], *brw->wm.prog_data->pull_param[i]); } drm_intel_gem_bo_unmap_gtt(brw->wm.const_bo); brw->state.dirty.brw |= BRW_NEW_WM_CONSTBUF; } const struct brw_tracked_state brw_wm_constants = { .dirty = { .mesa = (_NEW_PROGRAM_CONSTANTS), .brw = (BRW_NEW_FRAGMENT_PROGRAM), .cache = 0 }, .prepare = prepare_wm_constants, }; /** * Updates surface / buffer for fragment shader constant buffer, if * one is required. * * This consumes the state updates for the constant buffer, and produces * BRW_NEW_WM_SURFACES to get picked up by brw_prepare_wm_surfaces for * inclusion in the binding table. */ static void upload_wm_constant_surface(struct brw_context *brw ) { GLuint surf = SURF_INDEX_FRAG_CONST_BUFFER; struct brw_fragment_program *fp = (struct brw_fragment_program *) brw->fragment_program; const struct gl_program_parameter_list *params = fp->program.Base.Parameters; /* If there's no constant buffer, then no surface BO is needed to point at * it. */ if (brw->wm.const_bo == 0) { if (brw->wm.surf_bo[surf] != NULL) { drm_intel_bo_unreference(brw->wm.surf_bo[surf]); brw->wm.surf_bo[surf] = NULL; brw->state.dirty.brw |= BRW_NEW_WM_SURFACES; } return; } brw_create_constant_surface(brw, brw->wm.const_bo, params->NumParameters, &brw->wm.surf_bo[surf], &brw->wm.surf_offset[surf]); brw->state.dirty.brw |= BRW_NEW_WM_SURFACES; } const struct brw_tracked_state brw_wm_constant_surface = { .dirty = { .mesa = 0, .brw = (BRW_NEW_WM_CONSTBUF | BRW_NEW_BATCH), .cache = 0 }, .emit = upload_wm_constant_surface, }; /** * Sets up a surface state structure to point at the given region. * While it is only used for the front/back buffer currently, it should be * usable for further buffers when doing ARB_draw_buffer support. */ static void brw_update_renderbuffer_surface(struct brw_context *brw, struct gl_renderbuffer *rb, unsigned int unit) { struct intel_context *intel = &brw->intel; struct gl_context *ctx = &intel->ctx; drm_intel_bo *region_bo = NULL; struct intel_renderbuffer *irb = intel_renderbuffer(rb); struct intel_region *region = irb ? irb->region : NULL; struct { unsigned int surface_type; unsigned int surface_format; unsigned int width, height, pitch, cpp; GLubyte color_mask[4]; GLboolean color_blend; uint32_t tiling; uint32_t draw_x; uint32_t draw_y; } key; struct brw_surface_state surf; void *map; memset(&key, 0, sizeof(key)); if (region != NULL) { region_bo = region->buffer; key.surface_type = BRW_SURFACE_2D; switch (irb->Base.Format) { /* XRGB and ARGB are treated the same here because the chips in this * family cannot render to XRGB targets. This means that we have to * mask writes to alpha (ala glColorMask) and reconfigure the alpha * blending hardware to use GL_ONE (or GL_ZERO) for cases where * GL_DST_ALPHA (or GL_ONE_MINUS_DST_ALPHA) is used. */ case MESA_FORMAT_ARGB8888: case MESA_FORMAT_XRGB8888: key.surface_format = BRW_SURFACEFORMAT_B8G8R8A8_UNORM; break; case MESA_FORMAT_SARGB8: key.surface_format = BRW_SURFACEFORMAT_B8G8R8A8_UNORM_SRGB; break; case MESA_FORMAT_RGB565: key.surface_format = BRW_SURFACEFORMAT_B5G6R5_UNORM; break; case MESA_FORMAT_ARGB1555: key.surface_format = BRW_SURFACEFORMAT_B5G5R5A1_UNORM; break; case MESA_FORMAT_ARGB4444: key.surface_format = BRW_SURFACEFORMAT_B4G4R4A4_UNORM; break; case MESA_FORMAT_A8: key.surface_format = BRW_SURFACEFORMAT_A8_UNORM; break; case MESA_FORMAT_R8: key.surface_format = BRW_SURFACEFORMAT_R8_UNORM; break; case MESA_FORMAT_R16: key.surface_format = BRW_SURFACEFORMAT_R16_UNORM; break; case MESA_FORMAT_RG88: key.surface_format = BRW_SURFACEFORMAT_R8G8_UNORM; break; case MESA_FORMAT_RG1616: key.surface_format = BRW_SURFACEFORMAT_R16G16_UNORM; break; default: _mesa_problem(ctx, "Bad renderbuffer format: %d\n", irb->Base.Format); } key.tiling = region->tiling; key.width = rb->Width; key.height = rb->Height; key.pitch = region->pitch; key.cpp = region->cpp; key.draw_x = region->draw_x; key.draw_y = region->draw_y; } else { key.surface_type = BRW_SURFACE_NULL; key.surface_format = BRW_SURFACEFORMAT_B8G8R8A8_UNORM; key.tiling = I915_TILING_X; key.width = 1; key.height = 1; key.cpp = 4; key.draw_x = 0; key.draw_y = 0; } if (intel->gen < 6) { /* _NEW_COLOR */ memcpy(key.color_mask, ctx->Color.ColorMask[unit], sizeof(key.color_mask)); /* As mentioned above, disable writes to the alpha component when the * renderbuffer is XRGB. */ if (ctx->DrawBuffer->Visual.alphaBits == 0) key.color_mask[3] = GL_FALSE; key.color_blend = (!ctx->Color._LogicOpEnabled && (ctx->Color.BlendEnabled & (1 << unit))); } memset(&surf, 0, sizeof(surf)); surf.ss0.surface_format = key.surface_format; surf.ss0.surface_type = key.surface_type; if (key.tiling == I915_TILING_NONE) { surf.ss1.base_addr = (key.draw_x + key.draw_y * key.pitch) * key.cpp; } else { uint32_t tile_base, tile_x, tile_y; uint32_t pitch = key.pitch * key.cpp; if (key.tiling == I915_TILING_X) { tile_x = key.draw_x % (512 / key.cpp); tile_y = key.draw_y % 8; tile_base = ((key.draw_y / 8) * (8 * pitch)); tile_base += (key.draw_x - tile_x) / (512 / key.cpp) * 4096; } else { /* Y */ tile_x = key.draw_x % (128 / key.cpp); tile_y = key.draw_y % 32; tile_base = ((key.draw_y / 32) * (32 * pitch)); tile_base += (key.draw_x - tile_x) / (128 / key.cpp) * 4096; } assert(brw->has_surface_tile_offset || (tile_x == 0 && tile_y == 0)); assert(tile_x % 4 == 0); assert(tile_y % 2 == 0); /* Note that the low bits of these fields are missing, so * there's the possibility of getting in trouble. */ surf.ss1.base_addr = tile_base; surf.ss5.x_offset = tile_x / 4; surf.ss5.y_offset = tile_y / 2; } if (region_bo != NULL) surf.ss1.base_addr += region_bo->offset; /* reloc */ surf.ss2.width = key.width - 1; surf.ss2.height = key.height - 1; brw_set_surface_tiling(&surf, key.tiling); surf.ss3.pitch = (key.pitch * key.cpp) - 1; if (intel->gen < 6) { /* _NEW_COLOR */ surf.ss0.color_blend = key.color_blend; surf.ss0.writedisable_red = !key.color_mask[0]; surf.ss0.writedisable_green = !key.color_mask[1]; surf.ss0.writedisable_blue = !key.color_mask[2]; surf.ss0.writedisable_alpha = !key.color_mask[3]; } map = brw_state_batch(brw, sizeof(surf), 32, &brw->wm.surf_bo[unit], &brw->wm.surf_offset[unit]); memcpy(map, &surf, sizeof(surf)); if (region_bo != NULL) { drm_intel_bo_emit_reloc(brw->wm.surf_bo[unit], brw->wm.surf_offset[unit] + offsetof(struct brw_surface_state, ss1), region_bo, surf.ss1.base_addr - region_bo->offset, I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER); } } static void prepare_wm_surfaces(struct brw_context *brw) { struct gl_context *ctx = &brw->intel.ctx; int i; int nr_surfaces = 0; if (ctx->DrawBuffer->_NumColorDrawBuffers >= 1) { for (i = 0; i < ctx->DrawBuffer->_NumColorDrawBuffers; i++) { struct gl_renderbuffer *rb = ctx->DrawBuffer->_ColorDrawBuffers[i]; struct intel_renderbuffer *irb = intel_renderbuffer(rb); struct intel_region *region = irb ? irb->region : NULL; brw_add_validated_bo(brw, region->buffer); nr_surfaces = SURF_INDEX_DRAW(i) + 1; } } if (brw->wm.const_bo) { brw_add_validated_bo(brw, brw->wm.const_bo); nr_surfaces = SURF_INDEX_FRAG_CONST_BUFFER + 1; } for (i = 0; i < BRW_MAX_TEX_UNIT; i++) { const struct gl_texture_unit *texUnit = &ctx->Texture.Unit[i]; struct gl_texture_object *tObj = texUnit->_Current; struct intel_texture_object *intelObj = intel_texture_object(tObj); if (texUnit->_ReallyEnabled) { brw_add_validated_bo(brw, intelObj->mt->region->buffer); nr_surfaces = SURF_INDEX_TEXTURE(i) + 1; } } /* Have to update this in our prepare, since the unit's prepare * relies on it. */ if (brw->wm.nr_surfaces != nr_surfaces) { brw->wm.nr_surfaces = nr_surfaces; brw->state.dirty.brw |= BRW_NEW_NR_WM_SURFACES; } } /** * Constructs the set of surface state objects pointed to by the * binding table. */ static void upload_wm_surfaces(struct brw_context *brw) { struct gl_context *ctx = &brw->intel.ctx; GLuint i; /* _NEW_BUFFERS | _NEW_COLOR */ /* Update surfaces for drawing buffers */ if (ctx->DrawBuffer->_NumColorDrawBuffers >= 1) { for (i = 0; i < ctx->DrawBuffer->_NumColorDrawBuffers; i++) { brw_update_renderbuffer_surface(brw, ctx->DrawBuffer->_ColorDrawBuffers[i], i); } } else { brw_update_renderbuffer_surface(brw, NULL, 0); } /* Update surfaces for textures */ for (i = 0; i < BRW_MAX_TEX_UNIT; i++) { const struct gl_texture_unit *texUnit = &ctx->Texture.Unit[i]; const GLuint surf = SURF_INDEX_TEXTURE(i); /* _NEW_TEXTURE */ if (texUnit->_ReallyEnabled) { brw_update_texture_surface(ctx, i); } else { drm_intel_bo_unreference(brw->wm.surf_bo[surf]); brw->wm.surf_bo[surf] = NULL; } } brw->state.dirty.brw |= BRW_NEW_WM_SURFACES; } const struct brw_tracked_state brw_wm_surfaces = { .dirty = { .mesa = (_NEW_COLOR | _NEW_TEXTURE | _NEW_BUFFERS), .brw = (BRW_NEW_BATCH), .cache = 0 }, .prepare = prepare_wm_surfaces, .emit = upload_wm_surfaces, }; /** * Constructs the binding table for the WM surface state, which maps unit * numbers to surface state objects. */ static void brw_wm_upload_binding_table(struct brw_context *brw) { uint32_t *bind; int i; /* Might want to calculate nr_surfaces first, to avoid taking up so much * space for the binding table. */ bind = brw_state_batch(brw, sizeof(uint32_t) * BRW_WM_MAX_SURF, 32, &brw->wm.bind_bo, &brw->wm.bind_bo_offset); for (i = 0; i < BRW_WM_MAX_SURF; i++) { /* BRW_NEW_WM_SURFACES */ bind[i] = brw->wm.surf_offset[i]; if (brw->wm.surf_bo[i]) { bind[i] = brw->wm.surf_offset[i]; } else { bind[i] = 0; } } brw->state.dirty.brw |= BRW_NEW_BINDING_TABLE; } const struct brw_tracked_state brw_wm_binding_table = { .dirty = { .mesa = 0, .brw = (BRW_NEW_BATCH | BRW_NEW_WM_SURFACES), .cache = 0 }, .emit = brw_wm_upload_binding_table, };