/************************************************************************** * * Copyright 2008 Tungsten Graphics, Inc., Cedar Park, Texas. * All Rights Reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the * "Software"), to deal in the Software without restriction, including * without limitation the rights to use, copy, modify, merge, publish, * distribute, sub license, and/or sell copies of the Software, and to * permit persons to whom the Software is furnished to do so, subject to * the following conditions: * * The above copyright notice and this permission notice (including the * next paragraph) shall be included in all copies or substantial portions * of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. * **************************************************************************/ #include "pipe/p_compiler.h" #include "pipe/p_format.h" #include "pipe/p_state.h" #include "util/u_inlines.h" #include "util/u_format.h" #include "util/u_tile.h" #include "util/u_math.h" #include "util/u_memory.h" #include "st_device.h" #include "st_sample.h" /** * Use our own pseudo random generator to ensure consistent runs among * multiple runs and platforms. * * @sa http://en.wikipedia.org/wiki/Linear_congruential_generator */ static uint32_t st_random(void) { static uint64_t seed = UINT64_C(0xbb9a063afb0a739d); seed = UINT64_C(134775813) * seed + UINT64_C(1); return (uint32_t)(seed >> 32); } /** * We don't want to include the patent-encumbered DXT code here, so instead * we store several uncompressed/compressed data pairs for hardware testing * purposes. */ struct dxt_data { uint8_t rgba[16*4]; uint8_t raw[16]; }; static const struct dxt_data dxt1_rgb_data[] = { { { 0x99, 0xb0, 0x8e, 0xff, 0x5d, 0x62, 0x89, 0xff, 0x99, 0xb0, 0x8e, 0xff, 0x99, 0xb0, 0x8e, 0xff, 0xd6, 0xff, 0x94, 0xff, 0x5d, 0x62, 0x89, 0xff, 0x99, 0xb0, 0x8e, 0xff, 0xd6, 0xff, 0x94, 0xff, 0x5d, 0x62, 0x89, 0xff, 0x5d, 0x62, 0x89, 0xff, 0x99, 0xb0, 0x8e, 0xff, 0x21, 0x14, 0x84, 0xff, 0x5d, 0x62, 0x89, 0xff, 0x21, 0x14, 0x84, 0xff, 0x21, 0x14, 0x84, 0xff, 0x99, 0xb0, 0x8e, 0xff }, {0xf2, 0xd7, 0xb0, 0x20, 0xae, 0x2c, 0x6f, 0x97} }, { { 0xb5, 0xcf, 0x9c, 0xff, 0x83, 0x8c, 0x8b, 0xff, 0x21, 0x08, 0x6b, 0xff, 0x83, 0x8c, 0x8b, 0xff, 0x52, 0x4a, 0x7b, 0xff, 0x83, 0x8c, 0x8b, 0xff, 0x83, 0x8c, 0x8b, 0xff, 0xb5, 0xcf, 0x9c, 0xff, 0x21, 0x08, 0x6b, 0xff, 0xb5, 0xcf, 0x9c, 0xff, 0x83, 0x8c, 0x8b, 0xff, 0x52, 0x4a, 0x7b, 0xff, 0xb5, 0xcf, 0x9c, 0xff, 0x83, 0x8c, 0x8b, 0xff, 0x52, 0x4a, 0x7b, 0xff, 0x83, 0x8c, 0x8b, 0xff }, {0x73, 0xb6, 0x4d, 0x20, 0x98, 0x2b, 0xe1, 0xb8} }, { { 0x00, 0x2c, 0xff, 0xff, 0x94, 0x8d, 0x7b, 0xff, 0x4a, 0x5c, 0xbd, 0xff, 0x4a, 0x5c, 0xbd, 0xff, 0x4a, 0x5c, 0xbd, 0xff, 0x94, 0x8d, 0x7b, 0xff, 0x94, 0x8d, 0x7b, 0xff, 0x94, 0x8d, 0x7b, 0xff, 0xde, 0xbe, 0x39, 0xff, 0x94, 0x8d, 0x7b, 0xff, 0xde, 0xbe, 0x39, 0xff, 0xde, 0xbe, 0x39, 0xff, 0xde, 0xbe, 0x39, 0xff, 0xde, 0xbe, 0x39, 0xff, 0xde, 0xbe, 0x39, 0xff, 0x94, 0x8d, 0x7b, 0xff }, {0xe7, 0xdd, 0x7f, 0x01, 0xf9, 0xab, 0x08, 0x80} }, { { 0x6b, 0x24, 0x21, 0xff, 0x7b, 0x4f, 0x5d, 0xff, 0x7b, 0x4f, 0x5d, 0xff, 0x8b, 0x7a, 0x99, 0xff, 0x7b, 0x4f, 0x5d, 0xff, 0x7b, 0x4f, 0x5d, 0xff, 0x6b, 0x24, 0x21, 0xff, 0x8b, 0x7a, 0x99, 0xff, 0x9c, 0xa6, 0xd6, 0xff, 0x6b, 0x24, 0x21, 0xff, 0x7b, 0x4f, 0x5d, 0xff, 0x8b, 0x7a, 0x99, 0xff, 0x6b, 0x24, 0x21, 0xff, 0x8b, 0x7a, 0x99, 0xff, 0x7b, 0x4f, 0x5d, 0xff, 0x9c, 0xa6, 0xd6, 0xff }, {0x3a, 0x9d, 0x24, 0x69, 0xbd, 0x9f, 0xb4, 0x39} } }; static const struct dxt_data dxt1_rgba_data[] = { { { 0x00, 0x00, 0x00, 0x00, 0x4e, 0xaa, 0x90, 0xff, 0x4e, 0xaa, 0x90, 0xff, 0x00, 0x00, 0x00, 0x00, 0x4e, 0xaa, 0x90, 0xff, 0x29, 0xff, 0xff, 0xff, 0x00, 0x00, 0x00, 0x00, 0x4e, 0xaa, 0x90, 0xff, 0x73, 0x55, 0x21, 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x4e, 0xaa, 0x90, 0xff, 0x4e, 0xaa, 0x90, 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x4e, 0xaa, 0x90, 0xff }, {0xff, 0x2f, 0xa4, 0x72, 0xeb, 0xb2, 0xbd, 0xbe} }, { { 0xb5, 0xe3, 0x63, 0xff, 0x00, 0x00, 0x00, 0x00, 0x6b, 0x24, 0x84, 0xff, 0xb5, 0xe3, 0x63, 0xff, 0x00, 0x00, 0x00, 0x00, 0xb5, 0xe3, 0x63, 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x6b, 0x24, 0x84, 0xff, 0x6b, 0x24, 0x84, 0xff, 0x00, 0x00, 0x00, 0x00, 0xb5, 0xe3, 0x63, 0xff, 0x90, 0x83, 0x73, 0xff, 0xb5, 0xe3, 0x63, 0xff }, {0x30, 0x69, 0x0c, 0xb7, 0x4d, 0xf7, 0x0f, 0x67} }, { { 0x00, 0x00, 0x00, 0x00, 0xc6, 0x86, 0x8c, 0xff, 0xc6, 0x86, 0x8c, 0xff, 0x21, 0x65, 0x42, 0xff, 0x21, 0x65, 0x42, 0xff, 0x21, 0x65, 0x42, 0xff, 0x21, 0x65, 0x42, 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x21, 0x65, 0x42, 0xff, 0xc6, 0x86, 0x8c, 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xc6, 0x86, 0x8c, 0xff }, {0x28, 0x23, 0x31, 0xc4, 0x17, 0xc0, 0xd3, 0x7f} }, { { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xc6, 0xe3, 0x9c, 0xff, 0x7b, 0x1c, 0x52, 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x7b, 0x1c, 0x52, 0xff, 0x00, 0x00, 0x00, 0x00, 0x7b, 0x1c, 0x52, 0xff, 0xa0, 0x7f, 0x77, 0xff, 0xc6, 0xe3, 0x9c, 0xff, 0x00, 0x00, 0x00, 0x00, 0xa0, 0x7f, 0x77, 0xff }, {0xea, 0x78, 0x13, 0xc7, 0x7f, 0xfc, 0x33, 0xb6} }, }; static const struct dxt_data dxt3_rgba_data[] = { { { 0x6d, 0xc6, 0x96, 0x77, 0x6d, 0xc6, 0x96, 0xee, 0x6d, 0xc6, 0x96, 0xaa, 0x8c, 0xff, 0xb5, 0x44, 0x6d, 0xc6, 0x96, 0xff, 0x6d, 0xc6, 0x96, 0x88, 0x31, 0x55, 0x5a, 0x66, 0x6d, 0xc6, 0x96, 0x99, 0x31, 0x55, 0x5a, 0xbb, 0x31, 0x55, 0x5a, 0x55, 0x31, 0x55, 0x5a, 0x11, 0x6d, 0xc6, 0x96, 0xcc, 0x6d, 0xc6, 0x96, 0xcc, 0x6d, 0xc6, 0x96, 0x11, 0x31, 0x55, 0x5a, 0x44, 0x31, 0x55, 0x5a, 0x88 }, {0xe7, 0x4a, 0x8f, 0x96, 0x5b, 0xc1, 0x1c, 0x84, 0xf6, 0x8f, 0xab, 0x32, 0x2a, 0x9a, 0x95, 0x5a} }, { { 0xad, 0xeb, 0x73, 0x99, 0x97, 0xaa, 0x86, 0x66, 0x6b, 0x28, 0xad, 0x99, 0xad, 0xeb, 0x73, 0x99, 0x6b, 0x28, 0xad, 0x22, 0xad, 0xeb, 0x73, 0xff, 0x97, 0xaa, 0x86, 0x55, 0x6b, 0x28, 0xad, 0x55, 0x6b, 0x28, 0xad, 0x44, 0xad, 0xeb, 0x73, 0x33, 0x6b, 0x28, 0xad, 0xee, 0x6b, 0x28, 0xad, 0x99, 0x97, 0xaa, 0x86, 0x66, 0xad, 0xeb, 0x73, 0xbb, 0x97, 0xaa, 0x86, 0x99, 0xad, 0xeb, 0x73, 0xbb }, {0x69, 0x99, 0xf2, 0x55, 0x34, 0x9e, 0xb6, 0xb9, 0x4e, 0xaf, 0x55, 0x69, 0x18, 0x61, 0x51, 0x22} }, { { 0x63, 0xd7, 0xd6, 0x00, 0x57, 0x62, 0x5d, 0xdd, 0x57, 0x62, 0x5d, 0xcc, 0x57, 0x62, 0x5d, 0xbb, 0x52, 0x28, 0x21, 0xaa, 0x57, 0x62, 0x5d, 0xcc, 0x57, 0x62, 0x5d, 0xcc, 0x57, 0x62, 0x5d, 0x66, 0x57, 0x62, 0x5d, 0x22, 0x57, 0x62, 0x5d, 0xdd, 0x63, 0xd7, 0xd6, 0xee, 0x57, 0x62, 0x5d, 0x33, 0x63, 0xd7, 0xd6, 0x55, 0x52, 0x28, 0x21, 0x55, 0x57, 0x62, 0x5d, 0x11, 0x5d, 0x9c, 0x99, 0xee }, {0xd0, 0xbc, 0xca, 0x6c, 0xd2, 0x3e, 0x55, 0xe1, 0xba, 0x66, 0x44, 0x51, 0xfc, 0xfd, 0xcf, 0xb4} }, { { 0x94, 0x6f, 0x60, 0x22, 0x94, 0x6f, 0x60, 0x22, 0xc5, 0xab, 0x76, 0x11, 0xc5, 0xab, 0x76, 0xee, 0x63, 0x34, 0x4a, 0xdd, 0x63, 0x34, 0x4a, 0x33, 0x94, 0x6f, 0x60, 0x77, 0xf7, 0xe7, 0x8c, 0x00, 0x94, 0x6f, 0x60, 0x33, 0x63, 0x34, 0x4a, 0xaa, 0x94, 0x6f, 0x60, 0x77, 0x63, 0x34, 0x4a, 0xcc, 0x94, 0x6f, 0x60, 0xaa, 0xf7, 0xe7, 0x8c, 0x99, 0x63, 0x34, 0x4a, 0x44, 0xc5, 0xab, 0x76, 0xaa }, {0x22, 0xe1, 0x3d, 0x07, 0xa3, 0xc7, 0x9a, 0xa4, 0x31, 0xf7, 0xa9, 0x61, 0xaf, 0x35, 0x77, 0x93} }, }; static const struct dxt_data dxt5_rgba_data[] = { { { 0x6d, 0xc6, 0x96, 0x74, 0x6d, 0xc6, 0x96, 0xf8, 0x6d, 0xc6, 0x96, 0xb6, 0x8c, 0xff, 0xb5, 0x53, 0x6d, 0xc6, 0x96, 0xf8, 0x6d, 0xc6, 0x96, 0x95, 0x31, 0x55, 0x5a, 0x53, 0x6d, 0xc6, 0x96, 0x95, 0x31, 0x55, 0x5a, 0xb6, 0x31, 0x55, 0x5a, 0x53, 0x31, 0x55, 0x5a, 0x11, 0x6d, 0xc6, 0x96, 0xd7, 0x6d, 0xc6, 0x96, 0xb6, 0x6d, 0xc6, 0x96, 0x11, 0x31, 0x55, 0x5a, 0x32, 0x31, 0x55, 0x5a, 0x95 }, {0xf8, 0x11, 0xc5, 0x0c, 0x9a, 0x73, 0xb4, 0x9c, 0xf6, 0x8f, 0xab, 0x32, 0x2a, 0x9a, 0x95, 0x5a} }, { { 0xad, 0xeb, 0x73, 0xa1, 0x97, 0xaa, 0x86, 0x65, 0x6b, 0x28, 0xad, 0xa1, 0xad, 0xeb, 0x73, 0xa1, 0x6b, 0x28, 0xad, 0x2a, 0xad, 0xeb, 0x73, 0xfb, 0x97, 0xaa, 0x86, 0x47, 0x6b, 0x28, 0xad, 0x65, 0x6b, 0x28, 0xad, 0x47, 0xad, 0xeb, 0x73, 0x47, 0x6b, 0x28, 0xad, 0xdd, 0x6b, 0x28, 0xad, 0xa1, 0x97, 0xaa, 0x86, 0x65, 0xad, 0xeb, 0x73, 0xbf, 0x97, 0xaa, 0x86, 0xa1, 0xad, 0xeb, 0x73, 0xbf }, {0xfb, 0x2a, 0x34, 0x19, 0xdc, 0xbf, 0xe8, 0x71, 0x4e, 0xaf, 0x55, 0x69, 0x18, 0x61, 0x51, 0x22} }, { { 0x63, 0xd7, 0xd6, 0x00, 0x57, 0x62, 0x5d, 0xf5, 0x57, 0x62, 0x5d, 0xd2, 0x57, 0x62, 0x5d, 0xaf, 0x52, 0x28, 0x21, 0xaf, 0x57, 0x62, 0x5d, 0xd2, 0x57, 0x62, 0x5d, 0xd2, 0x57, 0x62, 0x5d, 0x69, 0x57, 0x62, 0x5d, 0x23, 0x57, 0x62, 0x5d, 0xd2, 0x63, 0xd7, 0xd6, 0xf5, 0x57, 0x62, 0x5d, 0x46, 0x63, 0xd7, 0xd6, 0x46, 0x52, 0x28, 0x21, 0x69, 0x57, 0x62, 0x5d, 0x23, 0x5d, 0x9c, 0x99, 0xf5 }, {0xf5, 0x00, 0x81, 0x36, 0xa9, 0x17, 0xec, 0x1e, 0xba, 0x66, 0x44, 0x51, 0xfc, 0xfd, 0xcf, 0xb4} }, { { 0x94, 0x6f, 0x60, 0x25, 0x94, 0x6f, 0x60, 0x25, 0xc5, 0xab, 0x76, 0x05, 0xc5, 0xab, 0x76, 0xe8, 0x63, 0x34, 0x4a, 0xe8, 0x63, 0x34, 0x4a, 0x25, 0x94, 0x6f, 0x60, 0x86, 0xf7, 0xe7, 0x8c, 0x05, 0x94, 0x6f, 0x60, 0x25, 0x63, 0x34, 0x4a, 0xa7, 0x94, 0x6f, 0x60, 0x66, 0x63, 0x34, 0x4a, 0xc7, 0x94, 0x6f, 0x60, 0xa7, 0xf7, 0xe7, 0x8c, 0xa7, 0x63, 0x34, 0x4a, 0x45, 0xc5, 0xab, 0x76, 0xa7 }, {0xe8, 0x05, 0x7f, 0x80, 0x33, 0x5f, 0xb5, 0x79, 0x31, 0xf7, 0xa9, 0x61, 0xaf, 0x35, 0x77, 0x93} }, }; static INLINE void st_sample_dxt_pixel_block(enum pipe_format format, uint8_t *raw, float *rgba, unsigned rgba_stride, unsigned w, unsigned h) { const struct dxt_data *data; unsigned n; unsigned i; unsigned x, y, ch; switch(format) { case PIPE_FORMAT_DXT1_RGB: data = dxt1_rgb_data; n = sizeof(dxt1_rgb_data)/sizeof(dxt1_rgb_data[0]); break; case PIPE_FORMAT_DXT1_RGBA: data = dxt1_rgba_data; n = sizeof(dxt1_rgba_data)/sizeof(dxt1_rgba_data[0]); break; case PIPE_FORMAT_DXT3_RGBA: data = dxt3_rgba_data; n = sizeof(dxt3_rgba_data)/sizeof(dxt3_rgba_data[0]); break; case PIPE_FORMAT_DXT5_RGBA: data = dxt5_rgba_data; n = sizeof(dxt5_rgba_data)/sizeof(dxt5_rgba_data[0]); break; default: assert(0); return; } i = st_random() % n; for(y = 0; y < h; ++y) for(x = 0; x < w; ++x) for(ch = 0; ch < 4; ++ch) rgba[y*rgba_stride + x*4 + ch] = (float)(data[i].rgba[y*4*4 + x*4 + ch])/255.0f; memcpy(raw, data[i].raw, util_format_get_blocksize(format)); } static INLINE void st_sample_generic_pixel_block(enum pipe_format format, uint8_t *raw, float *rgba, unsigned rgba_stride, unsigned w, unsigned h, boolean norm) { unsigned i; unsigned x, y, ch; int blocksize = util_format_get_blocksize(format); if (norm) { for (y = 0; y < h; ++y) { for (x = 0; x < w; ++x) { for (ch = 0; ch < 4; ++ch) { unsigned offset = y*rgba_stride + x*4 + ch; rgba[offset] = (st_random() & 0xff) / (double)0xff; } } } util_format_write_4f(format, rgba, rgba_stride * sizeof(float), raw, util_format_get_stride(format, w), 0, 0, w, h); } else { for (i = 0; i < blocksize; ++i) raw[i] = (uint8_t)st_random(); } util_format_read_4f(format, rgba, rgba_stride * sizeof(float), raw, util_format_get_stride(format, w), 0, 0, w, h); if (format == PIPE_FORMAT_UYVY || format == PIPE_FORMAT_YUYV) { for (y = 0; y < h; ++y) { for (x = 0; x < w; ++x) { for (ch = 0; ch < 4; ++ch) { unsigned offset = y*rgba_stride + x*4 + ch; rgba[offset] = CLAMP(rgba[offset], 0.0f, 1.0f); } } } } } /** * Randomly sample pixels. */ void st_sample_pixel_block(enum pipe_format format, void *raw, float *rgba, unsigned rgba_stride, unsigned w, unsigned h, boolean norm) { switch(format) { case PIPE_FORMAT_DXT1_RGB: case PIPE_FORMAT_DXT1_RGBA: case PIPE_FORMAT_DXT3_RGBA: case PIPE_FORMAT_DXT5_RGBA: st_sample_dxt_pixel_block(format, raw, rgba, rgba_stride, w, h); break; default: st_sample_generic_pixel_block(format, raw, rgba, rgba_stride, w, h, norm); break; } } void st_sample_surface(struct pipe_context *pipe, struct st_surface *surface, float *rgba, boolean norm) { struct pipe_resource *texture = surface->texture; unsigned width = u_minify(texture->width0, surface->level); unsigned height = u_minify(texture->height0, surface->level); uint rgba_stride = width * 4; struct pipe_transfer *transfer; void *raw; transfer = pipe_get_transfer(pipe, surface->texture, surface->level, surface->layer, PIPE_TRANSFER_WRITE, 0, 0, width, height); if (!transfer) return; raw = pipe->transfer_map(pipe, transfer); if (raw) { enum pipe_format format = texture->format; uint x, y; int nblocksx = util_format_get_nblocksx(format, width); int nblocksy = util_format_get_nblocksy(format, height); int blockwidth = util_format_get_blockwidth(format); int blockheight = util_format_get_blockheight(format); int blocksize = util_format_get_blocksize(format); for (y = 0; y < nblocksy; ++y) { for (x = 0; x < nblocksx; ++x) { st_sample_pixel_block(format, (uint8_t *) raw + y * transfer->stride + x * blocksize, rgba + y * blockheight * rgba_stride + x * blockwidth * 4, rgba_stride, MIN2(blockwidth, width - x*blockwidth), MIN2(blockheight, height - y*blockheight), norm); } } pipe->transfer_unmap(pipe, transfer); } pipe->transfer_destroy(pipe, transfer); }