
Also avoids empty shader for "END" - seems to be somewhat valid fp Maybe this can be done differently in the future (fake FRAG_RESULT_COLOR already in Map_Fragment_Program() or is there a way to program the chip to not hang in case of no exports.
490 lines
15 KiB
C
490 lines
15 KiB
C
/*
|
|
* Copyright (C) 2008-2009 Advanced Micro Devices, Inc.
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included
|
|
* in all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
|
|
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE COPYRIGHT HOLDER(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
|
|
* AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
|
|
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
|
*/
|
|
|
|
/*
|
|
* Authors:
|
|
* Richard Li <RichardZ.Li@amd.com>, <richardradeon@gmail.com>
|
|
* CooperYuan <cooper.yuan@amd.com>, <cooperyuan@gmail.com>
|
|
*/
|
|
|
|
#include <stdio.h>
|
|
#include <stdarg.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <math.h>
|
|
|
|
#include "main/imports.h"
|
|
#include "shader/prog_parameter.h"
|
|
#include "shader/prog_statevars.h"
|
|
|
|
#include "r600_context.h"
|
|
#include "r600_cmdbuf.h"
|
|
|
|
#include "r700_fragprog.h"
|
|
|
|
#include "r700_debug.h"
|
|
|
|
//TODO : Validate FP input with VP output.
|
|
void Map_Fragment_Program(r700_AssemblerBase *pAsm,
|
|
struct gl_fragment_program *mesa_fp)
|
|
{
|
|
unsigned int unBit;
|
|
unsigned int i;
|
|
GLuint ui;
|
|
|
|
pAsm->number_used_registers = 0;
|
|
|
|
//Input mapping : mesa_fp->Base.InputsRead set the flag, set in
|
|
//The flags parsed in parse_attrib_binding. FRAG_ATTRIB_COLx, FRAG_ATTRIB_TEXx, ...
|
|
//MUST match order in Map_Vertex_Output
|
|
unBit = 1 << FRAG_ATTRIB_WPOS;
|
|
if(mesa_fp->Base.InputsRead & unBit)
|
|
{
|
|
pAsm->uiFP_AttributeMap[FRAG_ATTRIB_WPOS] = pAsm->number_used_registers++;
|
|
}
|
|
|
|
unBit = 1 << FRAG_ATTRIB_COL0;
|
|
if(mesa_fp->Base.InputsRead & unBit)
|
|
{
|
|
pAsm->uiFP_AttributeMap[FRAG_ATTRIB_COL0] = pAsm->number_used_registers++;
|
|
}
|
|
|
|
unBit = 1 << FRAG_ATTRIB_COL1;
|
|
if(mesa_fp->Base.InputsRead & unBit)
|
|
{
|
|
pAsm->uiFP_AttributeMap[FRAG_ATTRIB_COL1] = pAsm->number_used_registers++;
|
|
}
|
|
|
|
unBit = 1 << FRAG_ATTRIB_FOGC;
|
|
if(mesa_fp->Base.InputsRead & unBit)
|
|
{
|
|
pAsm->uiFP_AttributeMap[FRAG_ATTRIB_FOGC] = pAsm->number_used_registers++;
|
|
}
|
|
|
|
for(i=0; i<8; i++)
|
|
{
|
|
unBit = 1 << (FRAG_ATTRIB_TEX0 + i);
|
|
if(mesa_fp->Base.InputsRead & unBit)
|
|
{
|
|
pAsm->uiFP_AttributeMap[FRAG_ATTRIB_TEX0 + i] = pAsm->number_used_registers++;
|
|
}
|
|
}
|
|
|
|
/* Map temporary registers (GPRs) */
|
|
pAsm->starting_temp_register_number = pAsm->number_used_registers;
|
|
|
|
if(mesa_fp->Base.NumNativeTemporaries >= mesa_fp->Base.NumTemporaries)
|
|
{
|
|
pAsm->number_used_registers += mesa_fp->Base.NumNativeTemporaries;
|
|
}
|
|
else
|
|
{
|
|
pAsm->number_used_registers += mesa_fp->Base.NumTemporaries;
|
|
}
|
|
|
|
/* Output mapping */
|
|
pAsm->number_of_exports = 0;
|
|
pAsm->number_of_colorandz_exports = 0; /* don't include stencil and mask out. */
|
|
pAsm->starting_export_register_number = pAsm->number_used_registers;
|
|
unBit = 1 << FRAG_RESULT_COLOR;
|
|
if(mesa_fp->Base.OutputsWritten & unBit)
|
|
{
|
|
pAsm->uiFP_OutputMap[FRAG_RESULT_COLOR] = pAsm->number_used_registers++;
|
|
pAsm->number_of_exports++;
|
|
pAsm->number_of_colorandz_exports++;
|
|
}
|
|
unBit = 1 << FRAG_RESULT_DEPTH;
|
|
if(mesa_fp->Base.OutputsWritten & unBit)
|
|
{
|
|
pAsm->depth_export_register_number = pAsm->number_used_registers;
|
|
pAsm->uiFP_OutputMap[FRAG_RESULT_DEPTH] = pAsm->number_used_registers++;
|
|
pAsm->number_of_exports++;
|
|
pAsm->number_of_colorandz_exports++;
|
|
pAsm->pR700Shader->depthIsExported = 1;
|
|
}
|
|
|
|
pAsm->pucOutMask = (unsigned char*) MALLOC(pAsm->number_of_exports);
|
|
for(ui=0; ui<pAsm->number_of_exports; ui++)
|
|
{
|
|
pAsm->pucOutMask[ui] = 0x0;
|
|
}
|
|
|
|
pAsm->uFirstHelpReg = pAsm->number_used_registers;
|
|
}
|
|
|
|
GLboolean Find_Instruction_Dependencies_fp(struct r700_fragment_program *fp,
|
|
struct gl_fragment_program *mesa_fp)
|
|
{
|
|
GLuint i, j;
|
|
GLint * puiTEMPwrites;
|
|
struct prog_instruction * pILInst;
|
|
InstDeps *pInstDeps;
|
|
struct prog_instruction * texcoord_DepInst;
|
|
GLint nDepInstID;
|
|
|
|
puiTEMPwrites = (GLint*) MALLOC(sizeof(GLuint)*mesa_fp->Base.NumTemporaries);
|
|
for(i=0; i<mesa_fp->Base.NumTemporaries; i++)
|
|
{
|
|
puiTEMPwrites[i] = -1;
|
|
}
|
|
|
|
pInstDeps = (InstDeps*)MALLOC(sizeof(InstDeps)*mesa_fp->Base.NumInstructions);
|
|
|
|
for(i=0; i<mesa_fp->Base.NumInstructions; i++)
|
|
{
|
|
pInstDeps[i].nDstDep = -1;
|
|
pILInst = &(mesa_fp->Base.Instructions[i]);
|
|
|
|
//Dst
|
|
if(pILInst->DstReg.File == PROGRAM_TEMPORARY)
|
|
{
|
|
//Set lastwrite for the temp
|
|
puiTEMPwrites[pILInst->DstReg.Index] = i;
|
|
}
|
|
|
|
//Src
|
|
for(j=0; j<3; j++)
|
|
{
|
|
if(pILInst->SrcReg[j].File == PROGRAM_TEMPORARY)
|
|
{
|
|
//Set dep.
|
|
pInstDeps[i].nSrcDeps[j] = puiTEMPwrites[pILInst->SrcReg[j].Index];
|
|
}
|
|
else
|
|
{
|
|
pInstDeps[i].nSrcDeps[j] = -1;
|
|
}
|
|
}
|
|
}
|
|
|
|
fp->r700AsmCode.pInstDeps = pInstDeps;
|
|
|
|
FREE(puiTEMPwrites);
|
|
|
|
//Find dep for tex inst
|
|
for(i=0; i<mesa_fp->Base.NumInstructions; i++)
|
|
{
|
|
pILInst = &(mesa_fp->Base.Instructions[i]);
|
|
|
|
if(GL_TRUE == IsTex(pILInst->Opcode))
|
|
{ //src0 is the tex coord register, src1 is texunit, src2 is textype
|
|
nDepInstID = pInstDeps[i].nSrcDeps[0];
|
|
if(nDepInstID >= 0)
|
|
{
|
|
texcoord_DepInst = &(mesa_fp->Base.Instructions[nDepInstID]);
|
|
if(GL_TRUE == IsAlu(texcoord_DepInst->Opcode) )
|
|
{
|
|
pInstDeps[nDepInstID].nDstDep = i;
|
|
pInstDeps[i].nDstDep = i;
|
|
}
|
|
else if(GL_TRUE == IsTex(texcoord_DepInst->Opcode) )
|
|
{
|
|
pInstDeps[i].nDstDep = i;
|
|
}
|
|
else
|
|
{ //... other deps?
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
return GL_TRUE;
|
|
}
|
|
|
|
GLboolean r700TranslateFragmentShader(struct r700_fragment_program *fp,
|
|
struct gl_fragment_program *mesa_fp)
|
|
{
|
|
GLuint number_of_colors_exported;
|
|
GLboolean z_enabled = GL_FALSE;
|
|
GLuint unBit;
|
|
|
|
//Init_Program
|
|
Init_r700_AssemblerBase( SPT_FP, &(fp->r700AsmCode), &(fp->r700Shader) );
|
|
Map_Fragment_Program(&(fp->r700AsmCode), mesa_fp);
|
|
|
|
if( GL_FALSE == Find_Instruction_Dependencies_fp(fp, mesa_fp) )
|
|
{
|
|
return GL_FALSE;
|
|
}
|
|
|
|
if( GL_FALSE == AssembleInstr(mesa_fp->Base.NumInstructions,
|
|
&(mesa_fp->Base.Instructions[0]),
|
|
&(fp->r700AsmCode)) )
|
|
{
|
|
return GL_FALSE;
|
|
}
|
|
|
|
if(GL_FALSE == Process_Fragment_Exports(&(fp->r700AsmCode), mesa_fp->Base.OutputsWritten) )
|
|
{
|
|
return GL_FALSE;
|
|
}
|
|
|
|
fp->r700Shader.nRegs = (fp->r700AsmCode.number_used_registers == 0) ? 0
|
|
: (fp->r700AsmCode.number_used_registers - 1);
|
|
|
|
fp->r700Shader.nParamExports = fp->r700AsmCode.number_of_exports;
|
|
|
|
number_of_colors_exported = fp->r700AsmCode.number_of_colorandz_exports;
|
|
|
|
unBit = 1 << FRAG_RESULT_DEPTH;
|
|
if(mesa_fp->Base.OutputsWritten & unBit)
|
|
{
|
|
z_enabled = GL_TRUE;
|
|
number_of_colors_exported--;
|
|
}
|
|
|
|
/* illegal to set this to 0 */
|
|
if(number_of_colors_exported || z_enabled)
|
|
{
|
|
fp->r700Shader.exportMode = number_of_colors_exported << 1 | z_enabled;
|
|
}
|
|
else
|
|
{
|
|
fp->r700Shader.exportMode = (1 << 1);
|
|
}
|
|
|
|
fp->translated = GL_TRUE;
|
|
|
|
return GL_TRUE;
|
|
}
|
|
|
|
void r700SelectFragmentShader(GLcontext *ctx)
|
|
{
|
|
context_t *context = R700_CONTEXT(ctx);
|
|
struct r700_fragment_program *fp = (struct r700_fragment_program *)
|
|
(ctx->FragmentProgram._Current);
|
|
if (context->radeon.radeonScreen->chip_family < CHIP_FAMILY_RV770)
|
|
{
|
|
fp->r700AsmCode.bR6xx = 1;
|
|
}
|
|
|
|
if (GL_FALSE == fp->translated)
|
|
r700TranslateFragmentShader(fp, &(fp->mesa_program));
|
|
}
|
|
|
|
void * r700GetActiveFpShaderBo(GLcontext * ctx)
|
|
{
|
|
struct r700_fragment_program *fp = (struct r700_fragment_program *)
|
|
(ctx->FragmentProgram._Current);
|
|
|
|
return fp->shaderbo;
|
|
}
|
|
|
|
GLboolean r700SetupFragmentProgram(GLcontext * ctx)
|
|
{
|
|
context_t *context = R700_CONTEXT(ctx);
|
|
R700_CHIP_CONTEXT *r700 = (R700_CHIP_CONTEXT*)(&context->hw);
|
|
struct r700_fragment_program *fp = (struct r700_fragment_program *)
|
|
(ctx->FragmentProgram._Current);
|
|
r700_AssemblerBase *pAsm = &(fp->r700AsmCode);
|
|
struct gl_fragment_program *mesa_fp = &(fp->mesa_program);
|
|
struct gl_program_parameter_list *paramList;
|
|
unsigned int unNumParamData;
|
|
unsigned int ui, i;
|
|
unsigned int unNumOfReg;
|
|
unsigned int unBit;
|
|
GLuint exportCount;
|
|
|
|
if(GL_FALSE == fp->loaded)
|
|
{
|
|
if(fp->r700Shader.bNeedsAssembly == GL_TRUE)
|
|
{
|
|
Assemble( &(fp->r700Shader) );
|
|
}
|
|
|
|
/* Load fp to gpu */
|
|
r600EmitShader(ctx,
|
|
&(fp->shaderbo),
|
|
(GLvoid *)(fp->r700Shader.pProgram),
|
|
fp->r700Shader.uShaderBinaryDWORDSize,
|
|
"FS");
|
|
|
|
fp->loaded = GL_TRUE;
|
|
}
|
|
|
|
DumpHwBinary(DUMP_PIXEL_SHADER, (GLvoid *)(fp->r700Shader.pProgram),
|
|
fp->r700Shader.uShaderBinaryDWORDSize);
|
|
|
|
/* TODO : enable this after MemUse fixed *=
|
|
(context->chipobj.MemUse)(context, fp->shadercode.buf->id);
|
|
*/
|
|
|
|
R600_STATECHANGE(context, ps);
|
|
|
|
r700->ps.SQ_PGM_RESOURCES_PS.u32All = 0;
|
|
SETbit(r700->ps.SQ_PGM_RESOURCES_PS.u32All, PGM_RESOURCES__PRIME_CACHE_ON_DRAW_bit);
|
|
|
|
r700->ps.SQ_PGM_START_PS.u32All = 0; /* set from buffer obj */
|
|
|
|
R600_STATECHANGE(context, spi);
|
|
|
|
unNumOfReg = fp->r700Shader.nRegs + 1;
|
|
|
|
ui = (r700->SPI_PS_IN_CONTROL_0.u32All & NUM_INTERP_mask) / (1 << NUM_INTERP_shift);
|
|
|
|
/* PS uses fragment.position */
|
|
if (mesa_fp->Base.InputsRead & (1 << FRAG_ATTRIB_WPOS))
|
|
{
|
|
ui += 1;
|
|
SETfield(r700->SPI_PS_IN_CONTROL_0.u32All, ui, NUM_INTERP_shift, NUM_INTERP_mask);
|
|
SETfield(r700->SPI_PS_IN_CONTROL_0.u32All, CENTERS_ONLY, BARYC_SAMPLE_CNTL_shift, BARYC_SAMPLE_CNTL_mask);
|
|
SETbit(r700->SPI_PS_IN_CONTROL_0.u32All, POSITION_ENA_bit);
|
|
SETbit(r700->SPI_INPUT_Z.u32All, PROVIDE_Z_TO_SPI_bit);
|
|
}
|
|
else
|
|
{
|
|
CLEARbit(r700->SPI_PS_IN_CONTROL_0.u32All, POSITION_ENA_bit);
|
|
CLEARbit(r700->SPI_INPUT_Z.u32All, PROVIDE_Z_TO_SPI_bit);
|
|
}
|
|
|
|
ui = (unNumOfReg < ui) ? ui : unNumOfReg;
|
|
|
|
SETfield(r700->ps.SQ_PGM_RESOURCES_PS.u32All, ui, NUM_GPRS_shift, NUM_GPRS_mask);
|
|
|
|
CLEARbit(r700->ps.SQ_PGM_RESOURCES_PS.u32All, UNCACHED_FIRST_INST_bit);
|
|
|
|
if(fp->r700Shader.uStackSize) /* we don't use branch for now, it should be zero. */
|
|
{
|
|
SETfield(r700->ps.SQ_PGM_RESOURCES_PS.u32All, fp->r700Shader.uStackSize,
|
|
STACK_SIZE_shift, STACK_SIZE_mask);
|
|
}
|
|
|
|
SETfield(r700->ps.SQ_PGM_EXPORTS_PS.u32All, fp->r700Shader.exportMode,
|
|
EXPORT_MODE_shift, EXPORT_MODE_mask);
|
|
|
|
R600_STATECHANGE(context, db);
|
|
|
|
if(fp->r700Shader.killIsUsed)
|
|
{
|
|
SETbit(r700->DB_SHADER_CONTROL.u32All, KILL_ENABLE_bit);
|
|
}
|
|
else
|
|
{
|
|
CLEARbit(r700->DB_SHADER_CONTROL.u32All, KILL_ENABLE_bit);
|
|
}
|
|
|
|
if(fp->r700Shader.depthIsExported)
|
|
{
|
|
SETbit(r700->DB_SHADER_CONTROL.u32All, Z_EXPORT_ENABLE_bit);
|
|
}
|
|
else
|
|
{
|
|
CLEARbit(r700->DB_SHADER_CONTROL.u32All, Z_EXPORT_ENABLE_bit);
|
|
}
|
|
|
|
// emit ps input map
|
|
unBit = 1 << FRAG_ATTRIB_WPOS;
|
|
if(mesa_fp->Base.InputsRead & unBit)
|
|
{
|
|
ui = pAsm->uiFP_AttributeMap[FRAG_ATTRIB_WPOS];
|
|
SETbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, SEL_CENTROID_bit);
|
|
SETfield(r700->SPI_PS_INPUT_CNTL[ui].u32All, ui,
|
|
SEMANTIC_shift, SEMANTIC_mask);
|
|
if (r700->SPI_INTERP_CONTROL_0.u32All & FLAT_SHADE_ENA_bit)
|
|
SETbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, FLAT_SHADE_bit);
|
|
else
|
|
CLEARbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, FLAT_SHADE_bit);
|
|
}
|
|
|
|
unBit = 1 << FRAG_ATTRIB_COL0;
|
|
if(mesa_fp->Base.InputsRead & unBit)
|
|
{
|
|
ui = pAsm->uiFP_AttributeMap[FRAG_ATTRIB_COL0];
|
|
SETbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, SEL_CENTROID_bit);
|
|
SETfield(r700->SPI_PS_INPUT_CNTL[ui].u32All, ui,
|
|
SEMANTIC_shift, SEMANTIC_mask);
|
|
if (r700->SPI_INTERP_CONTROL_0.u32All & FLAT_SHADE_ENA_bit)
|
|
SETbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, FLAT_SHADE_bit);
|
|
else
|
|
CLEARbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, FLAT_SHADE_bit);
|
|
}
|
|
|
|
unBit = 1 << FRAG_ATTRIB_COL1;
|
|
if(mesa_fp->Base.InputsRead & unBit)
|
|
{
|
|
ui = pAsm->uiFP_AttributeMap[FRAG_ATTRIB_COL1];
|
|
SETbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, SEL_CENTROID_bit);
|
|
SETfield(r700->SPI_PS_INPUT_CNTL[ui].u32All, ui,
|
|
SEMANTIC_shift, SEMANTIC_mask);
|
|
if (r700->SPI_INTERP_CONTROL_0.u32All & FLAT_SHADE_ENA_bit)
|
|
SETbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, FLAT_SHADE_bit);
|
|
else
|
|
CLEARbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, FLAT_SHADE_bit);
|
|
}
|
|
|
|
unBit = 1 << FRAG_ATTRIB_FOGC;
|
|
if(mesa_fp->Base.InputsRead & unBit)
|
|
{
|
|
ui = pAsm->uiFP_AttributeMap[FRAG_ATTRIB_FOGC];
|
|
SETbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, SEL_CENTROID_bit);
|
|
SETfield(r700->SPI_PS_INPUT_CNTL[ui].u32All, ui,
|
|
SEMANTIC_shift, SEMANTIC_mask);
|
|
if (r700->SPI_INTERP_CONTROL_0.u32All & FLAT_SHADE_ENA_bit)
|
|
SETbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, FLAT_SHADE_bit);
|
|
else
|
|
CLEARbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, FLAT_SHADE_bit);
|
|
}
|
|
|
|
for(i=0; i<8; i++)
|
|
{
|
|
unBit = 1 << (FRAG_ATTRIB_TEX0 + i);
|
|
if(mesa_fp->Base.InputsRead & unBit)
|
|
{
|
|
ui = pAsm->uiFP_AttributeMap[FRAG_ATTRIB_TEX0 + i];
|
|
SETbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, SEL_CENTROID_bit);
|
|
SETfield(r700->SPI_PS_INPUT_CNTL[ui].u32All, ui,
|
|
SEMANTIC_shift, SEMANTIC_mask);
|
|
CLEARbit(r700->SPI_PS_INPUT_CNTL[ui].u32All, FLAT_SHADE_bit);
|
|
}
|
|
}
|
|
|
|
R600_STATECHANGE(context, cb);
|
|
exportCount = (r700->ps.SQ_PGM_EXPORTS_PS.u32All & EXPORT_MODE_mask) / (1 << EXPORT_MODE_shift);
|
|
r700->CB_SHADER_CONTROL.u32All = (1 << exportCount) - 1;
|
|
|
|
/* sent out shader constants. */
|
|
paramList = fp->mesa_program.Base.Parameters;
|
|
|
|
if(NULL != paramList) {
|
|
_mesa_load_state_parameters(ctx, paramList);
|
|
|
|
if (paramList->NumParameters > R700_MAX_DX9_CONSTS)
|
|
return GL_FALSE;
|
|
|
|
R600_STATECHANGE(context, ps_consts);
|
|
|
|
r700->ps.num_consts = paramList->NumParameters;
|
|
|
|
unNumParamData = paramList->NumParameters;
|
|
|
|
for(ui=0; ui<unNumParamData; ui++) {
|
|
r700->ps.consts[ui][0].f32All = paramList->ParameterValues[ui][0];
|
|
r700->ps.consts[ui][1].f32All = paramList->ParameterValues[ui][1];
|
|
r700->ps.consts[ui][2].f32All = paramList->ParameterValues[ui][2];
|
|
r700->ps.consts[ui][3].f32All = paramList->ParameterValues[ui][3];
|
|
}
|
|
} else
|
|
r700->ps.num_consts = 0;
|
|
|
|
return GL_TRUE;
|
|
}
|
|
|