/* * Copyright (C) 2008-2009 Advanced Micro Devices, Inc. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included * in all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE COPYRIGHT HOLDER(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */ /* * Authors: * Richard Li , * CooperYuan , */ #include #include #include #include #include #include "main/imports.h" #include "shader/prog_parameter.h" #include "shader/prog_statevars.h" #include "r600_context.h" #include "r600_cmdbuf.h" #include "r700_chip.h" #include "r700_fragprog.h" #include "r700_debug.h" //TODO : Validate FP input with VP output. void Map_Fragment_Program(r700_AssemblerBase *pAsm, struct gl_fragment_program *mesa_fp) { unsigned int unBit; unsigned int i; GLuint ui; pAsm->number_used_registers = 0; //Input mapping : mesa_fp->Base.InputsRead set the flag, set in //The flags parsed in parse_attrib_binding. FRAG_ATTRIB_COLx, FRAG_ATTRIB_TEXx, ... //MUST match order in Map_Vertex_Output unBit = 1 << FRAG_ATTRIB_COL0; if(mesa_fp->Base.InputsRead & unBit) { pAsm->uiFP_AttributeMap[FRAG_ATTRIB_COL0] = pAsm->number_used_registers++; } unBit = 1 << FRAG_ATTRIB_COL1; if(mesa_fp->Base.InputsRead & unBit) { pAsm->uiFP_AttributeMap[FRAG_ATTRIB_COL1] = pAsm->number_used_registers++; } for(i=0; i<8; i++) { unBit = 1 << (FRAG_ATTRIB_TEX0 + i); if(mesa_fp->Base.InputsRead & unBit) { pAsm->uiFP_AttributeMap[FRAG_ATTRIB_TEX0 + i] = pAsm->number_used_registers++; } } /* Map temporary registers (GPRs) */ pAsm->starting_temp_register_number = pAsm->number_used_registers; if(mesa_fp->Base.NumNativeTemporaries >= mesa_fp->Base.NumTemporaries) { pAsm->number_used_registers += mesa_fp->Base.NumNativeTemporaries; } else { pAsm->number_used_registers += mesa_fp->Base.NumTemporaries; } /* Output mapping */ pAsm->number_of_exports = 0; pAsm->number_of_colorandz_exports = 0; /* don't include stencil and mask out. */ pAsm->starting_export_register_number = pAsm->number_used_registers; unBit = 1 << FRAG_RESULT_COLOR; if(mesa_fp->Base.OutputsWritten & unBit) { pAsm->uiFP_OutputMap[FRAG_RESULT_COLOR] = pAsm->number_used_registers++; pAsm->number_of_exports++; pAsm->number_of_colorandz_exports++; } unBit = 1 << FRAG_RESULT_DEPTH; if(mesa_fp->Base.OutputsWritten & unBit) { pAsm->depth_export_register_number = pAsm->number_used_registers; pAsm->uiFP_OutputMap[FRAG_RESULT_DEPTH] = pAsm->number_used_registers++; pAsm->number_of_exports++; pAsm->number_of_colorandz_exports++; } pAsm->pucOutMask = (unsigned char*) MALLOC(pAsm->number_of_exports); for(ui=0; uinumber_of_exports; ui++) { pAsm->pucOutMask[ui] = 0x0; } pAsm->uFirstHelpReg = pAsm->number_used_registers; } GLboolean Find_Instruction_Dependencies_fp(struct r700_fragment_program *fp, struct gl_fragment_program *mesa_fp) { GLuint i, j; GLint * puiTEMPwrites; struct prog_instruction * pILInst; InstDeps *pInstDeps; struct prog_instruction * texcoord_DepInst; GLint nDepInstID; puiTEMPwrites = (GLint*) MALLOC(sizeof(GLuint)*mesa_fp->Base.NumTemporaries); for(i=0; iBase.NumTemporaries; i++) { puiTEMPwrites[i] = -1; } pInstDeps = (InstDeps*)MALLOC(sizeof(InstDeps)*mesa_fp->Base.NumInstructions); for(i=0; iBase.NumInstructions; i++) { pInstDeps[i].nDstDep = -1; pILInst = &(mesa_fp->Base.Instructions[i]); //Dst if(pILInst->DstReg.File == PROGRAM_TEMPORARY) { //Set lastwrite for the temp puiTEMPwrites[pILInst->DstReg.Index] = i; } //Src for(j=0; j<3; j++) { if(pILInst->SrcReg[j].File == PROGRAM_TEMPORARY) { //Set dep. pInstDeps[i].nSrcDeps[j] = puiTEMPwrites[pILInst->SrcReg[j].Index]; } else { pInstDeps[i].nSrcDeps[j] = -1; } } } fp->r700AsmCode.pInstDeps = pInstDeps; FREE(puiTEMPwrites); //Find dep for tex inst for(i=0; iBase.NumInstructions; i++) { pILInst = &(mesa_fp->Base.Instructions[i]); if(GL_TRUE == IsTex(pILInst->Opcode)) { //src0 is the tex coord register, src1 is texunit, src2 is textype nDepInstID = pInstDeps[i].nSrcDeps[0]; if(nDepInstID >= 0) { texcoord_DepInst = &(mesa_fp->Base.Instructions[nDepInstID]); if(GL_TRUE == IsAlu(texcoord_DepInst->Opcode) ) { pInstDeps[nDepInstID].nDstDep = i; pInstDeps[i].nDstDep = i; } else if(GL_TRUE == IsTex(texcoord_DepInst->Opcode) ) { pInstDeps[i].nDstDep = i; } else { //... other deps? } } } } return GL_TRUE; } GLboolean r700TranslateFragmentShader(struct r700_fragment_program *fp, struct gl_fragment_program *mesa_fp) { GLuint number_of_colors_exported; GLboolean z_enabled = GL_FALSE; GLuint unBit; //Init_Program Init_r700_AssemblerBase( SPT_FP, &(fp->r700AsmCode), &(fp->r700Shader) ); Map_Fragment_Program(&(fp->r700AsmCode), mesa_fp); if( GL_FALSE == Find_Instruction_Dependencies_fp(fp, mesa_fp) ) { return GL_FALSE; } if( GL_FALSE == AssembleInstr(mesa_fp->Base.NumInstructions, &(mesa_fp->Base.Instructions[0]), &(fp->r700AsmCode)) ) { return GL_FALSE; } if(GL_FALSE == Process_Fragment_Exports(&(fp->r700AsmCode), mesa_fp->Base.OutputsWritten) ) { return GL_FALSE; } fp->r700Shader.nRegs = (fp->r700AsmCode.number_used_registers == 0) ? 0 : (fp->r700AsmCode.number_used_registers - 1); fp->r700Shader.nParamExports = fp->r700AsmCode.number_of_exports; number_of_colors_exported = fp->r700AsmCode.number_of_colorandz_exports; unBit = 1 << FRAG_RESULT_DEPTH; if(mesa_fp->Base.OutputsWritten & unBit) { z_enabled = GL_TRUE; number_of_colors_exported--; } fp->r700Shader.exportMode = number_of_colors_exported << 1 | z_enabled; fp->translated = GL_TRUE; return GL_TRUE; } void * r700GetActiveFpShaderBo(GLcontext * ctx) { struct r700_fragment_program *fp = (struct r700_fragment_program *) (ctx->FragmentProgram._Current); return fp->shaderbo; } GLboolean r700SetupFragmentProgram(GLcontext * ctx) { context_t *context = R700_CONTEXT(ctx); BATCH_LOCALS(&context->radeon); R700_CHIP_CONTEXT *r700 = (R700_CHIP_CONTEXT*)(context->chipobj.pvChipObj); struct r700_fragment_program *fp = (struct r700_fragment_program *) (ctx->FragmentProgram._Current); struct gl_program_parameter_list *paramList; unsigned int unNumParamData; unsigned int ui; unsigned int unNumOfReg; if(GL_FALSE == fp->loaded) { if(fp->r700Shader.bNeedsAssembly == GL_TRUE) { Assemble( &(fp->r700Shader) ); } /* Load fp to gpu */ r600EmitShader(ctx, &(fp->shaderbo), (GLvoid *)(fp->r700Shader.pProgram), fp->r700Shader.uShaderBinaryDWORDSize, "FS"); fp->loaded = GL_TRUE; } DumpHwBinary(DUMP_PIXEL_SHADER, (GLvoid *)(fp->r700Shader.pProgram), fp->r700Shader.uShaderBinaryDWORDSize); /* TODO : enable this after MemUse fixed *= (context->chipobj.MemUse)(context, fp->shadercode.buf->id); */ r700->SQ_PGM_START_PS.u32All = 0; /* set from buffer obj */ unNumOfReg = fp->r700Shader.nRegs + 1; ui = (r700->SPI_PS_IN_CONTROL_0.u32All & NUM_INTERP_mask) / (1 << NUM_INTERP_shift); ui = ui ? unNumOfReg : ui; SETfield(r700->SQ_PGM_RESOURCES_PS.u32All, ui, NUM_GPRS_shift, NUM_GPRS_mask); CLEARbit(r700->SQ_PGM_RESOURCES_PS.u32All, UNCACHED_FIRST_INST_bit); if(fp->r700Shader.uStackSize) /* we don't use branch for now, it should be zero. */ { SETfield(r700->SQ_PGM_RESOURCES_PS.u32All, fp->r700Shader.uStackSize, STACK_SIZE_shift, STACK_SIZE_mask); } SETfield(r700->SQ_PGM_EXPORTS_PS.u32All, fp->r700Shader.exportMode, EXPORT_MODE_shift, EXPORT_MODE_mask); if(fp->r700Shader.killIsUsed) { SETbit(r700->DB_SHADER_CONTROL.u32All, KILL_ENABLE_bit); } else { CLEARbit(r700->DB_SHADER_CONTROL.u32All, KILL_ENABLE_bit); } if(fp->r700Shader.depthIsExported) { SETbit(r700->DB_SHADER_CONTROL.u32All, Z_EXPORT_ENABLE_bit); } else { CLEARbit(r700->DB_SHADER_CONTROL.u32All, Z_EXPORT_ENABLE_bit); } /* sent out shader constants. */ paramList = fp->mesa_program.Base.Parameters; if(NULL != paramList) { _mesa_load_state_parameters(ctx, paramList); unNumParamData = paramList->NumParameters * 4; BEGIN_BATCH_NO_AUTOSTATE(2 + unNumParamData); R600_OUT_BATCH(CP_PACKET3(R600_IT_SET_ALU_CONST, unNumParamData)); /* assembler map const from very beginning. */ R600_OUT_BATCH(SQ_ALU_CONSTANT_PS_OFFSET * 4); unNumParamData = paramList->NumParameters; for(ui=0; uiParameterValues[ui][0]))); R600_OUT_BATCH(*((unsigned int*)&(paramList->ParameterValues[ui][1]))); R600_OUT_BATCH(*((unsigned int*)&(paramList->ParameterValues[ui][2]))); R600_OUT_BATCH(*((unsigned int*)&(paramList->ParameterValues[ui][3]))); } END_BATCH(); COMMIT_BATCH(); } return GL_TRUE; }