/* * Copyright 2009 Corbin Simpson * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * on the rights to use, copy, modify, merge, publish, distribute, sub * license, and/or sell copies of the Software, and to permit persons to whom * the Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice (including the next * paragraph) shall be included in all copies or substantial portions of the * Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM, * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE * USE OR OTHER DEALINGS IN THE SOFTWARE. */ #include "r300_vs.h" static void r300_vs_declare(struct r300_vs_asm* assembler, struct tgsi_full_declaration* decl) { switch (decl->Declaration.File) { case TGSI_FILE_INPUT: break; case TGSI_FILE_OUTPUT: switch (decl->Semantic.SemanticName) { case TGSI_SEMANTIC_POSITION: assembler->tab[decl->DeclarationRange.First] = 0; break; case TGSI_SEMANTIC_COLOR: assembler->tab[decl->DeclarationRange.First] = (assembler->point_size ? 1 : 0) + assembler->out_colors; break; case TGSI_SEMANTIC_FOG: case TGSI_SEMANTIC_GENERIC: /* XXX multiple? */ assembler->tab[decl->DeclarationRange.First] = (assembler->point_size ? 1 : 0) + assembler->out_colors + assembler->out_texcoords; break; case TGSI_SEMANTIC_PSIZE: assembler->tab[decl->DeclarationRange.First] = 1; break; default: debug_printf("r300: vs: Bad semantic declaration %d\n", decl->Semantic.SemanticName); break; } break; case TGSI_FILE_CONSTANT: break; case TGSI_FILE_TEMPORARY: assembler->temp_count++; break; default: debug_printf("r300: vs: Bad file %d\n", decl->Declaration.File); break; } } static INLINE unsigned r300_vs_src_type(struct r300_vs_asm* assembler, struct tgsi_src_register* src) { switch (src->File) { case TGSI_FILE_NULL: case TGSI_FILE_INPUT: /* Probably a zero or one swizzle */ return R300_PVS_SRC_REG_INPUT; case TGSI_FILE_TEMPORARY: return R300_PVS_SRC_REG_TEMPORARY; case TGSI_FILE_CONSTANT: case TGSI_FILE_IMMEDIATE: return R300_PVS_SRC_REG_CONSTANT; default: debug_printf("r300: vs: Unimplemented src type %d\n", src->File); break; } return 0; } static INLINE unsigned r300_vs_src(struct r300_vs_asm* assembler, struct tgsi_src_register* src) { switch (src->File) { case TGSI_FILE_NULL: case TGSI_FILE_INPUT: case TGSI_FILE_TEMPORARY: case TGSI_FILE_CONSTANT: return src->Index; case TGSI_FILE_IMMEDIATE: return src->Index + assembler->imm_offset; default: debug_printf("r300: vs: Unimplemented src type %d\n", src->File); break; } return 0; } static INLINE unsigned r300_vs_dst_type(struct r300_vs_asm* assembler, struct tgsi_dst_register* dst) { switch (dst->File) { case TGSI_FILE_TEMPORARY: return R300_PVS_DST_REG_TEMPORARY; case TGSI_FILE_OUTPUT: return R300_PVS_DST_REG_OUT; default: debug_printf("r300: vs: Unimplemented dst type %d\n", dst->File); break; } return 0; } static INLINE unsigned r300_vs_dst(struct r300_vs_asm* assembler, struct tgsi_dst_register* dst) { switch (dst->File) { case TGSI_FILE_TEMPORARY: return dst->Index; case TGSI_FILE_OUTPUT: return assembler->tab[dst->Index]; default: debug_printf("r300: vs: Unimplemented dst %d\n", dst->File); break; } return 0; } static uint32_t r300_vs_op(unsigned op) { switch (op) { case TGSI_OPCODE_DP3: case TGSI_OPCODE_DP4: return R300_VE_DOT_PRODUCT; case TGSI_OPCODE_MUL: return R300_VE_MULTIPLY; case TGSI_OPCODE_ADD: case TGSI_OPCODE_MOV: case TGSI_OPCODE_SUB: case TGSI_OPCODE_SWZ: return R300_VE_ADD; case TGSI_OPCODE_MAX: return R300_VE_MAXIMUM; case TGSI_OPCODE_SLT: return R300_VE_SET_LESS_THAN; case TGSI_OPCODE_RSQ: return R300_PVS_DST_MATH_INST | R300_ME_RECIP_DX; case TGSI_OPCODE_MAD: return R300_PVS_DST_MACRO_INST | R300_PVS_MACRO_OP_2CLK_MADD; default: break; } return 0; } static uint32_t r300_vs_swiz(struct tgsi_full_src_register* reg) { if (reg->SrcRegister.Extended) { return (reg->SrcRegister.Negate ? (0xf << 12) : 0) | reg->SrcRegisterExtSwz.ExtSwizzleX | (reg->SrcRegisterExtSwz.ExtSwizzleY << 3) | (reg->SrcRegisterExtSwz.ExtSwizzleZ << 6) | (reg->SrcRegisterExtSwz.ExtSwizzleW << 9); } else { return (reg->SrcRegister.Negate ? (0xf << 12) : 0) | reg->SrcRegister.SwizzleX | (reg->SrcRegister.SwizzleY << 3) | (reg->SrcRegister.SwizzleZ << 6) | (reg->SrcRegister.SwizzleW << 9); } } /* XXX icky icky icky icky */ static uint32_t r300_vs_scalar_swiz(struct tgsi_full_src_register* reg) { if (reg->SrcRegister.Extended) { return (reg->SrcRegister.Negate ? (0xf << 12) : 0) | reg->SrcRegisterExtSwz.ExtSwizzleX | (reg->SrcRegisterExtSwz.ExtSwizzleX << 3) | (reg->SrcRegisterExtSwz.ExtSwizzleX << 6) | (reg->SrcRegisterExtSwz.ExtSwizzleX << 9); } else { return (reg->SrcRegister.Negate ? (0xf << 12) : 0) | reg->SrcRegister.SwizzleX | (reg->SrcRegister.SwizzleX << 3) | (reg->SrcRegister.SwizzleX << 6) | (reg->SrcRegister.SwizzleX << 9); } } /* XXX scalar stupidity */ static void r300_vs_emit_inst(struct r300_vertex_shader* vs, struct r300_vs_asm* assembler, struct tgsi_full_src_register* src, struct tgsi_full_dst_register* dst, unsigned op, unsigned count, boolean is_scalar) { int i = vs->instruction_count; vs->instructions[i].inst0 = R300_PVS_DST_OPCODE(r300_vs_op(op)) | R300_PVS_DST_REG_TYPE(r300_vs_dst_type(assembler, &dst->DstRegister)) | R300_PVS_DST_OFFSET(r300_vs_dst(assembler, &dst->DstRegister)) | R300_PVS_DST_WE(dst->DstRegister.WriteMask); switch (count) { case 3: vs->instructions[i].inst3 = R300_PVS_SRC_REG_TYPE(r300_vs_src_type(assembler, &src[2].SrcRegister)) | R300_PVS_SRC_OFFSET(r300_vs_src(assembler, &src[2].SrcRegister)) | R300_PVS_SRC_SWIZZLE(r300_vs_swiz(&src[2])); /* Fall through */ case 2: vs->instructions[i].inst2 = R300_PVS_SRC_REG_TYPE(r300_vs_src_type(assembler, &src[1].SrcRegister)) | R300_PVS_SRC_OFFSET(r300_vs_src(assembler, &src[1].SrcRegister)) | R300_PVS_SRC_SWIZZLE(r300_vs_swiz(&src[1])); /* Fall through */ case 1: vs->instructions[i].inst1 = R300_PVS_SRC_REG_TYPE(r300_vs_src_type(assembler, &src[0].SrcRegister)) | R300_PVS_SRC_OFFSET(r300_vs_src(assembler, &src[0].SrcRegister)) | /* XXX the icky, it burns */ R300_PVS_SRC_SWIZZLE(is_scalar ? r300_vs_scalar_swiz(&src[0]) : r300_vs_swiz(&src[0])); break; } vs->instruction_count++; } static void r300_vs_instruction(struct r300_vertex_shader* vs, struct r300_vs_asm* assembler, struct tgsi_full_instruction* inst) { switch (inst->Instruction.Opcode) { case TGSI_OPCODE_RSQ: r300_vs_emit_inst(vs, assembler, inst->FullSrcRegisters, &inst->FullDstRegisters[0], inst->Instruction.Opcode, 1, TRUE); break; case TGSI_OPCODE_SUB: inst->FullSrcRegisters[1].SrcRegister.Negate = !inst->FullSrcRegisters[1].SrcRegister.Negate; /* Fall through */ case TGSI_OPCODE_ADD: case TGSI_OPCODE_MUL: case TGSI_OPCODE_MAX: case TGSI_OPCODE_SLT: r300_vs_emit_inst(vs, assembler, inst->FullSrcRegisters, &inst->FullDstRegisters[0], inst->Instruction.Opcode, 2, FALSE); break; case TGSI_OPCODE_DP3: /* Set alpha swizzle to zero for src0 and src1 */ if (!inst->FullSrcRegisters[0].SrcRegister.Extended) { inst->FullSrcRegisters[0].SrcRegister.Extended = TRUE; inst->FullSrcRegisters[0].SrcRegisterExtSwz.ExtSwizzleX = inst->FullSrcRegisters[0].SrcRegister.SwizzleX; inst->FullSrcRegisters[0].SrcRegisterExtSwz.ExtSwizzleY = inst->FullSrcRegisters[0].SrcRegister.SwizzleY; inst->FullSrcRegisters[0].SrcRegisterExtSwz.ExtSwizzleZ = inst->FullSrcRegisters[0].SrcRegister.SwizzleZ; } inst->FullSrcRegisters[0].SrcRegisterExtSwz.ExtSwizzleW = TGSI_EXTSWIZZLE_ZERO; if (!inst->FullSrcRegisters[1].SrcRegister.Extended) { inst->FullSrcRegisters[1].SrcRegister.Extended = TRUE; inst->FullSrcRegisters[1].SrcRegisterExtSwz.ExtSwizzleX = inst->FullSrcRegisters[1].SrcRegister.SwizzleX; inst->FullSrcRegisters[1].SrcRegisterExtSwz.ExtSwizzleY = inst->FullSrcRegisters[1].SrcRegister.SwizzleY; inst->FullSrcRegisters[1].SrcRegisterExtSwz.ExtSwizzleZ = inst->FullSrcRegisters[1].SrcRegister.SwizzleZ; } inst->FullSrcRegisters[1].SrcRegisterExtSwz.ExtSwizzleW = TGSI_EXTSWIZZLE_ZERO; /* Fall through */ case TGSI_OPCODE_DP4: r300_vs_emit_inst(vs, assembler, inst->FullSrcRegisters, &inst->FullDstRegisters[0], inst->Instruction.Opcode, 2, FALSE); break; case TGSI_OPCODE_MOV: case TGSI_OPCODE_SWZ: inst->FullSrcRegisters[1] = r300_constant_zero; r300_vs_emit_inst(vs, assembler, inst->FullSrcRegisters, &inst->FullDstRegisters[0], inst->Instruction.Opcode, 2, FALSE); break; case TGSI_OPCODE_MAD: r300_vs_emit_inst(vs, assembler, inst->FullSrcRegisters, &inst->FullDstRegisters[0], inst->Instruction.Opcode, 3, FALSE); break; case TGSI_OPCODE_END: break; default: debug_printf("r300: vs: Bad opcode %d\n", inst->Instruction.Opcode); break; } } static void r300_vs_init(struct r300_vertex_shader* vs, struct r300_vs_asm* assembler) { struct tgsi_shader_info* info = &vs->info; int i; for (i = 0; i < info->num_outputs; i++) { switch (info->output_semantic_name[i]) { case TGSI_SEMANTIC_PSIZE: assembler->point_size = TRUE; break; case TGSI_SEMANTIC_COLOR: assembler->out_colors++; break; case TGSI_SEMANTIC_FOG: case TGSI_SEMANTIC_GENERIC: assembler->out_texcoords++; break; } } vs->instruction_count = 0; } void r300_translate_vertex_shader(struct r300_context* r300, struct r300_vertex_shader* vs) { struct tgsi_parse_context parser; int i; struct r300_constant_buffer* consts = &r300->shader_constants[PIPE_SHADER_VERTEX]; struct r300_vs_asm* assembler = CALLOC_STRUCT(r300_vs_asm); if (assembler == NULL) { return; } /* Init assembler. */ r300_vs_init(vs, assembler); /* Setup starting offset for immediates. */ assembler->imm_offset = consts->user_count; tgsi_parse_init(&parser, vs->state.tokens); while (!tgsi_parse_end_of_tokens(&parser)) { tgsi_parse_token(&parser); /* This is seriously the lamest way to create fragment programs ever. * I blame TGSI. */ switch (parser.FullToken.Token.Type) { case TGSI_TOKEN_TYPE_DECLARATION: /* Allocated registers sitting at the beginning * of the program. */ r300_vs_declare(assembler, &parser.FullToken.FullDeclaration); break; case TGSI_TOKEN_TYPE_IMMEDIATE: debug_printf("r300: Emitting immediate to constant buffer, " "position %d\n", assembler->imm_offset + assembler->imm_count); /* I am not amused by the length of these. */ for (i = 0; i < 4; i++) { consts->constants[assembler->imm_offset + assembler->imm_count][i] = parser.FullToken.FullImmediate.u[i].Float; } assembler->imm_count++; break; case TGSI_TOKEN_TYPE_INSTRUCTION: r300_vs_instruction(vs, assembler, &parser.FullToken.FullInstruction); break; } } debug_printf("r300: vs: %d texs and %d colors, first free reg is %d\n", assembler->tex_count, assembler->color_count, assembler->tex_count + assembler->color_count); consts->count = consts->user_count + assembler->imm_count; vs->uses_imms = assembler->imm_count; debug_printf("r300: vs: %d total constants, " "%d from user and %d from immediates\n", consts->count, consts->user_count, assembler->imm_count); debug_printf("r300: vs: tab: %d %d %d %d\n", assembler->tab[0], assembler->tab[1], assembler->tab[2], assembler->tab[3]); tgsi_dump(vs->state.tokens, 0); /* XXX finish r300 vertex shader dumper */ r300_vs_dump(vs); tgsi_parse_free(&parser); FREE(assembler); }