gallium: add TGSI_SEMANTIC_TEXCOORD,PCOORD v3

This makes it possible to identify gl_TexCoord and gl_PointCoord
for drivers where sprite coordinate replacement is restricted.

The new PIPE_CAP_TGSI_TEXCOORD decides whether these varyings
should be hidden behind the GENERIC semantic or not.

With this patch only nvc0 and nv30 will request that they be used.

v2: introduce a CAP so other drivers don't have to bother with
the new semantic

v3: adapt to the introduction of the gl_varying_slot enum
This commit is contained in:
Christoph Bumiller
2013-03-15 22:11:31 +01:00
parent 3eaf823b90
commit 8acaf862df
28 changed files with 170 additions and 91 deletions

View File

@@ -52,6 +52,7 @@
*/ */
#include "pipe/p_screen.h"
#include "pipe/p_context.h" #include "pipe/p_context.h"
#include "util/u_math.h" #include "util/u_math.h"
#include "util/u_memory.h" #include "util/u_memory.h"
@@ -74,6 +75,9 @@ struct widepoint_stage {
uint num_texcoord_gen; uint num_texcoord_gen;
uint texcoord_gen_slot[PIPE_MAX_SHADER_OUTPUTS]; uint texcoord_gen_slot[PIPE_MAX_SHADER_OUTPUTS];
/* TGSI_SEMANTIC to which sprite_coord_enable applies */
unsigned sprite_coord_semantic;
int psize_slot; int psize_slot;
}; };
@@ -233,28 +237,29 @@ widepoint_first_point(struct draw_stage *stage,
wide->num_texcoord_gen = 0; wide->num_texcoord_gen = 0;
/* Loop over fragment shader inputs looking for generic inputs /* Loop over fragment shader inputs looking for the PCOORD input or inputs
* for which bit 'k' in sprite_coord_enable is set. * for which bit 'k' in sprite_coord_enable is set.
*/ */
for (i = 0; i < fs->info.num_inputs; i++) { for (i = 0; i < fs->info.num_inputs; i++) {
if (fs->info.input_semantic_name[i] == TGSI_SEMANTIC_GENERIC) { int slot;
const int generic_index = fs->info.input_semantic_index[i]; const unsigned sn = fs->info.input_semantic_name[i];
/* Note that sprite_coord enable is a bitfield of const unsigned si = fs->info.input_semantic_index[i];
* PIPE_MAX_SHADER_OUTPUTS bits.
*/
if (generic_index < PIPE_MAX_SHADER_OUTPUTS &&
(rast->sprite_coord_enable & (1 << generic_index))) {
/* OK, this generic attribute needs to be replaced with a
* texcoord (see above).
*/
int slot = draw_alloc_extra_vertex_attrib(draw,
TGSI_SEMANTIC_GENERIC,
generic_index);
/* add this slot to the texcoord-gen list */ if (sn == wide->sprite_coord_semantic) {
wide->texcoord_gen_slot[wide->num_texcoord_gen++] = slot; /* Note that sprite_coord_enable is a bitfield of 32 bits. */
} if (si >= 32 || !(rast->sprite_coord_enable & (1 << si)))
continue;
} else if (sn != TGSI_SEMANTIC_PCOORD) {
continue;
} }
/* OK, this generic attribute needs to be replaced with a
* sprite coord (see above).
*/
slot = draw_alloc_extra_vertex_attrib(draw, sn, si);
/* add this slot to the texcoord-gen list */
wide->texcoord_gen_slot[wide->num_texcoord_gen++] = slot;
} }
} }
@@ -326,6 +331,11 @@ struct draw_stage *draw_wide_point_stage( struct draw_context *draw )
if (!draw_alloc_temp_verts( &wide->stage, 4 )) if (!draw_alloc_temp_verts( &wide->stage, 4 ))
goto fail; goto fail;
wide->sprite_coord_semantic =
draw->pipe->screen->get_param(draw->pipe->screen, PIPE_CAP_TGSI_TEXCOORD)
?
TGSI_SEMANTIC_TEXCOORD : TGSI_SEMANTIC_GENERIC;
return &wide->stage; return &wide->stage;
fail: fail:

View File

@@ -305,6 +305,7 @@ iter_declaration(
TXT( ", " ); TXT( ", " );
ENM( decl->Semantic.Name, tgsi_semantic_names ); ENM( decl->Semantic.Name, tgsi_semantic_names );
if (decl->Semantic.Index != 0 || if (decl->Semantic.Index != 0 ||
decl->Semantic.Name == TGSI_SEMANTIC_TEXCOORD ||
decl->Semantic.Name == TGSI_SEMANTIC_GENERIC) { decl->Semantic.Name == TGSI_SEMANTIC_GENERIC) {
CHR( '[' ); CHR( '[' );
UID( decl->Semantic.Index ); UID( decl->Semantic.Index );

View File

@@ -76,7 +76,9 @@ const char *tgsi_semantic_names[TGSI_SEMANTIC_COUNT] =
"GRID_SIZE", "GRID_SIZE",
"BLOCK_ID", "BLOCK_ID",
"BLOCK_SIZE", "BLOCK_SIZE",
"THREAD_ID" "THREAD_ID",
"TEXCOORD",
"PCOORD"
}; };
const char *tgsi_texture_names[TGSI_TEXTURE_COUNT] = const char *tgsi_texture_names[TGSI_TEXTURE_COUNT] =

View File

@@ -159,13 +159,18 @@ Points
sprite_coord_enable sprite_coord_enable
^^^^^^^^^^^^^^^^^^^ ^^^^^^^^^^^^^^^^^^^
The effect of this state depends on PIPE_CAP_TGSI_TEXCOORD!
Controls automatic texture coordinate generation for rendering sprite points. Controls automatic texture coordinate generation for rendering sprite points.
If PIPE_CAP_TGSI_TEXCOORD is false:
When bit k in the sprite_coord_enable bitfield is set, then generic When bit k in the sprite_coord_enable bitfield is set, then generic
input k to the fragment shader will get an automatically computed input k to the fragment shader will get an automatically computed
texture coordinate. texture coordinate.
If PIPE_CAP_TGSI_TEXCOORD is true:
The bitfield refers to inputs with the TEXCOORD semantic instead of generic inputs.
The texture coordinate will be of the form (s, t, 0, 1) where s varies The texture coordinate will be of the form (s, t, 0, 1) where s varies
from 0 to 1 from left to right while t varies from 0 to 1 according to from 0 to 1 from left to right while t varies from 0 to 1 according to
the state of 'sprite_coord_mode' (see below). the state of 'sprite_coord_mode' (see below).

View File

@@ -137,6 +137,14 @@ The integer capabilities:
* ``PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT``: Describes the required * ``PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT``: Describes the required
alignment for pipe_sampler_view::u.buf.first_element, in bytes. alignment for pipe_sampler_view::u.buf.first_element, in bytes.
If a driver does not support first/last_element, it should return 0. If a driver does not support first/last_element, it should return 0.
* ``PIPE_CAP_TGSI_TEXCOORD``: This CAP describes a hw limitation.
If true, the hardware cannot replace arbitrary shader inputs with sprite
coordinates and hence the inputs that are desired to be replaceable must
be declared with TGSI_SEMANTIC_TEXCOORD instead of TGSI_SEMANTIC_GENERIC.
The rasterizer's sprite_coord_enable state therefore also applies to the
TEXCOORD semantic.
Also, TGSI_SEMANTIC_PCOORD becomes available, which labels a fragment shader
input that will always be replaced with sprite coordinates.
.. _pipe_capf: .. _pipe_capf:

View File

@@ -1949,6 +1949,35 @@ When using this semantic, be sure to set the appropriate state in the
:ref:`rasterizer` first. :ref:`rasterizer` first.
TGSI_SEMANTIC_TEXCOORD
""""""""""""""""""""""
Only available if PIPE_CAP_TGSI_TEXCOORD is exposed!
Vertex shader outputs and fragment shader inputs may be labeled with
this semantic to make them replaceable by sprite coordinates via the
sprite_coord_enable state in the :ref:`rasterizer`.
The semantic index used with this semantic must be in the range 0 to 7.
If the driver does not support TEXCOORD, sprite coordinate replacement
applies to inputs with the GENERIC semantic instead.
The intended use case for this semantic is gl_TexCoord.
TGSI_SEMANTIC_PCOORD
""""""""""""""""""""
Only available if PIPE_CAP_TGSI_TEXCOORD is exposed!
Fragment shader inputs may be labeled with TGSI_SEMANTIC_PCOORD to indicate
that the register contains sprite coordinates in the form (x, y, 0, 1), if
the current primitive is a point and point sprites are enabled. Otherwise,
the contents of the register are undefined.
The intended use case for this semantic is gl_PointCoord.
TGSI_SEMANTIC_GENERIC TGSI_SEMANTIC_GENERIC
""""""""""""""""""""" """""""""""""""""""""

View File

@@ -165,6 +165,8 @@ fd_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
case PIPE_CAP_TEXTURE_MULTISAMPLE: case PIPE_CAP_TEXTURE_MULTISAMPLE:
case PIPE_CAP_USER_CONSTANT_BUFFERS: case PIPE_CAP_USER_CONSTANT_BUFFERS:
return 1; return 1;
case PIPE_CAP_TGSI_TEXCOORD:
return 0;
case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT: case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
return 256; return 256;

View File

@@ -184,6 +184,8 @@ i915_get_param(struct pipe_screen *screen, enum pipe_cap cap)
case PIPE_CAP_USER_INDEX_BUFFERS: case PIPE_CAP_USER_INDEX_BUFFERS:
case PIPE_CAP_USER_CONSTANT_BUFFERS: case PIPE_CAP_USER_CONSTANT_BUFFERS:
return 1; return 1;
case PIPE_CAP_TGSI_TEXCOORD:
return 0;
/* Unsupported features (boolean caps). */ /* Unsupported features (boolean caps). */
case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS: case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:

View File

@@ -208,6 +208,7 @@ llvmpipe_get_param(struct pipe_screen *screen, enum pipe_cap param)
case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY: case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY: case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY: case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
case PIPE_CAP_TGSI_TEXCOORD:
return 0; return 0;
case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT: case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:

View File

@@ -79,6 +79,7 @@ nv30_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT: case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER: case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER: case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
case PIPE_CAP_TGSI_TEXCOORD:
case PIPE_CAP_USER_CONSTANT_BUFFERS: case PIPE_CAP_USER_CONSTANT_BUFFERS:
case PIPE_CAP_USER_INDEX_BUFFERS: case PIPE_CAP_USER_INDEX_BUFFERS:
return 1; return 1;

View File

@@ -927,15 +927,17 @@ nvfx_fragprog_parse_decl_input(struct nv30_context *nvfx, struct nvfx_fpc *fpc,
case TGSI_SEMANTIC_FACE: case TGSI_SEMANTIC_FACE:
hw = NV40_FP_OP_INPUT_SRC_FACING; hw = NV40_FP_OP_INPUT_SRC_FACING;
break; break;
case TGSI_SEMANTIC_GENERIC: case TGSI_SEMANTIC_TEXCOORD:
if (fdec->Semantic.Index >= 8) assert(fdec->Semantic.Index < 8);
return TRUE;
fpc->fp->texcoord[fdec->Semantic.Index] = fdec->Semantic.Index; fpc->fp->texcoord[fdec->Semantic.Index] = fdec->Semantic.Index;
fpc->fp->texcoords |= (1 << fdec->Semantic.Index); fpc->fp->texcoords |= (1 << fdec->Semantic.Index);
fpc->fp->vp_or |= (0x00004000 << fdec->Semantic.Index); fpc->fp->vp_or |= (0x00004000 << fdec->Semantic.Index);
hw = NVFX_FP_OP_INPUT_SRC_TC(fdec->Semantic.Index); hw = NVFX_FP_OP_INPUT_SRC_TC(fdec->Semantic.Index);
break; break;
case TGSI_SEMANTIC_GENERIC:
case TGSI_SEMANTIC_PCOORD:
/* will be assigned to remaining TC slots later */
return TRUE;
default: default:
assert(0); assert(0);
return FALSE; return FALSE;
@@ -955,22 +957,24 @@ nvfx_fragprog_assign_generic(struct nv30_context *nvfx, struct nvfx_fpc *fpc,
switch (fdec->Semantic.Name) { switch (fdec->Semantic.Name) {
case TGSI_SEMANTIC_GENERIC: case TGSI_SEMANTIC_GENERIC:
if (fdec->Semantic.Index >= 8) { case TGSI_SEMANTIC_PCOORD:
for (hw = 0; hw < num_texcoords; hw++) { for (hw = 0; hw < num_texcoords; hw++) {
if (fpc->fp->texcoord[hw] == 0xffff) { if (fpc->fp->texcoord[hw] == 0xffff) {
fpc->fp->texcoord[hw] = fdec->Semantic.Index; if (hw <= 7) {
if (hw <= 7) { fpc->fp->texcoords |= (0x1 << hw);
fpc->fp->texcoords |= (0x1 << hw); fpc->fp->vp_or |= (0x00004000 << hw);
fpc->fp->vp_or |= (0x00004000 << hw); } else {
} else { fpc->fp->vp_or |= (0x00001000 << (hw - 8));
fpc->fp->vp_or |= (0x00001000 << (hw - 8));
}
if (fdec->Semantic.Index == 9)
fpc->fp->point_sprite_control |= (0x00000100 << hw);
hw = NVFX_FP_OP_INPUT_SRC_TC(hw);
fpc->r_input[idx] = nvfx_reg(NVFXSR_INPUT, hw);
return TRUE;
} }
if (fdec->Semantic.Name == TGSI_SEMANTIC_PCOORD) {
fpc->fp->texcoord[hw] = 0xfffe;
fpc->fp->point_sprite_control |= (0x00000100 << hw);
} else {
fpc->fp->texcoord[hw] = fdec->Semantic.Index + 8;
}
hw = NVFX_FP_OP_INPUT_SRC_TC(hw);
fpc->r_input[idx] = nvfx_reg(NVFXSR_INPUT, hw);
return TRUE;
} }
return FALSE; return FALSE;
} }

View File

@@ -819,6 +819,7 @@ nvfx_vertprog_parse_decl_output(struct nv30_context *nv30, struct nvfx_vpc *vpc,
{ {
unsigned num_texcoords = nv30->is_nv4x ? 10 : 8; unsigned num_texcoords = nv30->is_nv4x ? 10 : 8;
unsigned idx = fdec->Range.First; unsigned idx = fdec->Range.First;
unsigned semantic_index = fdec->Semantic.Index;
int hw = 0, i; int hw = 0, i;
switch (fdec->Semantic.Name) { switch (fdec->Semantic.Name) {
@@ -860,8 +861,12 @@ nvfx_vertprog_parse_decl_output(struct nv30_context *nv30, struct nvfx_vpc *vpc,
hw = NVFX_VP(INST_DEST_PSZ); hw = NVFX_VP(INST_DEST_PSZ);
break; break;
case TGSI_SEMANTIC_GENERIC: case TGSI_SEMANTIC_GENERIC:
/* this is really an identifier for VP/FP linkage */
semantic_index += 8;
/* fall through */
case TGSI_SEMANTIC_TEXCOORD:
for (i = 0; i < num_texcoords; i++) { for (i = 0; i < num_texcoords; i++) {
if (vpc->vp->texcoord[i] == fdec->Semantic.Index) { if (vpc->vp->texcoord[i] == semantic_index) {
hw = NVFX_VP(INST_DEST_TC(i)); hw = NVFX_VP(INST_DEST_TC(i));
break; break;
} }

View File

@@ -70,8 +70,6 @@ struct nv50_ir_varying
#endif #endif
#define NV50_SEMANTIC_CLIPDISTANCE (TGSI_SEMANTIC_COUNT + 0) #define NV50_SEMANTIC_CLIPDISTANCE (TGSI_SEMANTIC_COUNT + 0)
#define NV50_SEMANTIC_TEXCOORD (TGSI_SEMANTIC_COUNT + 1)
#define NV50_SEMANTIC_POINTCOORD (TGSI_SEMANTIC_COUNT + 2)
#define NV50_SEMANTIC_VIEWPORTINDEX (TGSI_SEMANTIC_COUNT + 4) #define NV50_SEMANTIC_VIEWPORTINDEX (TGSI_SEMANTIC_COUNT + 4)
#define NV50_SEMANTIC_LAYER (TGSI_SEMANTIC_COUNT + 5) #define NV50_SEMANTIC_LAYER (TGSI_SEMANTIC_COUNT + 5)
#define NV50_SEMANTIC_INVOCATIONID (TGSI_SEMANTIC_COUNT + 6) #define NV50_SEMANTIC_INVOCATIONID (TGSI_SEMANTIC_COUNT + 6)

View File

@@ -184,6 +184,7 @@ nv50_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY: case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY: case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY: case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
case PIPE_CAP_TGSI_TEXCOORD:
case PIPE_CAP_TEXTURE_MULTISAMPLE: case PIPE_CAP_TEXTURE_MULTISAMPLE:
return 0; return 0;
default: default:

View File

@@ -494,7 +494,7 @@ nv50_blitter_make_vp(struct nv50_blitter *blit)
blit->vp.out[1].hw = 2; blit->vp.out[1].hw = 2;
blit->vp.out[1].mask = 0x7; blit->vp.out[1].mask = 0x7;
blit->vp.out[1].sn = TGSI_SEMANTIC_GENERIC; blit->vp.out[1].sn = TGSI_SEMANTIC_GENERIC;
blit->vp.out[1].si = 8; blit->vp.out[1].si = 0;
blit->vp.vp.attrs[0] = 0x73; blit->vp.vp.attrs[0] = 0x73;
blit->vp.vp.psiz = 0x40; blit->vp.vp.psiz = 0x40;
blit->vp.vp.edgeflag = 0x40; blit->vp.vp.edgeflag = 0x40;
@@ -536,9 +536,8 @@ nv50_blitter_make_fp(struct pipe_context *pipe,
return NULL; return NULL;
out = ureg_DECL_output(ureg, TGSI_SEMANTIC_COLOR, 0); out = ureg_DECL_output(ureg, TGSI_SEMANTIC_COLOR, 0);
/* NOTE: use GENERIC[8] so we don't use the TEXCOORD slots on nvc0 */
tc = ureg_DECL_fs_input( tc = ureg_DECL_fs_input(
ureg, TGSI_SEMANTIC_GENERIC, 8, TGSI_INTERPOLATE_LINEAR); ureg, TGSI_SEMANTIC_GENERIC, 0, TGSI_INTERPOLATE_LINEAR);
data = ureg_DECL_temporary(ureg); data = ureg_DECL_temporary(ureg);

View File

@@ -27,33 +27,6 @@
#include "nv50/codegen/nv50_ir_driver.h" #include "nv50/codegen/nv50_ir_driver.h"
#include "nve4_compute.h" #include "nve4_compute.h"
/* If only they told use the actual semantic instead of just GENERIC ... */
static void
nvc0_mesa_varying_hack(struct nv50_ir_varying *var)
{
unsigned c;
if (var->sn != TGSI_SEMANTIC_GENERIC)
return;
if (var->si <= 7) /* gl_TexCoord */
for (c = 0; c < 4; ++c)
var->slot[c] = (0x300 + var->si * 0x10 + c * 0x4) / 4;
else
if (var->si == 9) /* gl_PointCoord */
for (c = 0; c < 4; ++c)
var->slot[c] = (0x2e0 + c * 0x4) / 4;
else
if (var->si <= 39)
for (c = 0; c < 4; ++c) /* move down user varyings (first has index 8) */
var->slot[c] -= 0x80 / 4;
else {
NOUVEAU_ERR("too many varyings / invalid location: %u !\n", var->si);
for (c = 0; c < 4; ++c)
var->slot[c] = (0x270 + c * 0x4) / 4; /* catch invalid indices */
}
}
static uint32_t static uint32_t
nvc0_shader_input_address(unsigned sn, unsigned si, unsigned ubase) nvc0_shader_input_address(unsigned sn, unsigned si, unsigned ubase)
{ {
@@ -69,11 +42,11 @@ nvc0_shader_input_address(unsigned sn, unsigned si, unsigned ubase)
case NV50_SEMANTIC_CLIPDISTANCE: return 0x2c0 + si * 0x4; case NV50_SEMANTIC_CLIPDISTANCE: return 0x2c0 + si * 0x4;
case TGSI_SEMANTIC_CLIPDIST: return 0x2c0 + si * 0x10; case TGSI_SEMANTIC_CLIPDIST: return 0x2c0 + si * 0x10;
case TGSI_SEMANTIC_CLIPVERTEX: return 0x260; case TGSI_SEMANTIC_CLIPVERTEX: return 0x260;
case NV50_SEMANTIC_POINTCOORD: return 0x2e0; case TGSI_SEMANTIC_PCOORD: return 0x2e0;
case NV50_SEMANTIC_TESSCOORD: return 0x2f0; case NV50_SEMANTIC_TESSCOORD: return 0x2f0;
case TGSI_SEMANTIC_INSTANCEID: return 0x2f8; case TGSI_SEMANTIC_INSTANCEID: return 0x2f8;
case TGSI_SEMANTIC_VERTEXID: return 0x2fc; case TGSI_SEMANTIC_VERTEXID: return 0x2fc;
case NV50_SEMANTIC_TEXCOORD: return 0x300 + si * 0x10; case TGSI_SEMANTIC_TEXCOORD: return 0x300 + si * 0x10;
case TGSI_SEMANTIC_FACE: return 0x3fc; case TGSI_SEMANTIC_FACE: return 0x3fc;
case NV50_SEMANTIC_INVOCATIONID: return ~0; case NV50_SEMANTIC_INVOCATIONID: return ~0;
default: default:
@@ -99,7 +72,7 @@ nvc0_shader_output_address(unsigned sn, unsigned si, unsigned ubase)
case NV50_SEMANTIC_CLIPDISTANCE: return 0x2c0 + si * 0x4; case NV50_SEMANTIC_CLIPDISTANCE: return 0x2c0 + si * 0x4;
case TGSI_SEMANTIC_CLIPDIST: return 0x2c0 + si * 0x10; case TGSI_SEMANTIC_CLIPDIST: return 0x2c0 + si * 0x10;
case TGSI_SEMANTIC_CLIPVERTEX: return 0x260; case TGSI_SEMANTIC_CLIPVERTEX: return 0x260;
case NV50_SEMANTIC_TEXCOORD: return 0x300 + si * 0x10; case TGSI_SEMANTIC_TEXCOORD: return 0x300 + si * 0x10;
case TGSI_SEMANTIC_EDGEFLAG: return ~0; case TGSI_SEMANTIC_EDGEFLAG: return ~0;
default: default:
assert(!"invalid TGSI output semantic"); assert(!"invalid TGSI output semantic");
@@ -149,8 +122,6 @@ nvc0_sp_assign_input_slots(struct nv50_ir_prog_info *info)
for (c = 0; c < 4; ++c) for (c = 0; c < 4; ++c)
info->in[i].slot[c] = (offset + c * 0x4) / 4; info->in[i].slot[c] = (offset + c * 0x4) / 4;
nvc0_mesa_varying_hack(&info->in[i]);
} }
return 0; return 0;
@@ -194,8 +165,6 @@ nvc0_sp_assign_output_slots(struct nv50_ir_prog_info *info)
for (c = 0; c < 4; ++c) for (c = 0; c < 4; ++c)
info->out[i].slot[c] = (offset + c * 0x4) / 4; info->out[i].slot[c] = (offset + c * 0x4) / 4;
nvc0_mesa_varying_hack(&info->out[i]);
} }
return 0; return 0;

View File

@@ -114,6 +114,7 @@ nvc0_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
case PIPE_CAP_TWO_SIDED_STENCIL: case PIPE_CAP_TWO_SIDED_STENCIL:
case PIPE_CAP_DEPTH_CLIP_DISABLE: case PIPE_CAP_DEPTH_CLIP_DISABLE:
case PIPE_CAP_POINT_SPRITE: case PIPE_CAP_POINT_SPRITE:
case PIPE_CAP_TGSI_TEXCOORD:
return 1; return 1;
case PIPE_CAP_SM3: case PIPE_CAP_SM3:
return 1; return 1;

View File

@@ -172,6 +172,8 @@ static int r300_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY: case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY: case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
return r300screen->caps.has_tcl; return r300screen->caps.has_tcl;
case PIPE_CAP_TGSI_TEXCOORD:
return 0;
/* Texturing. */ /* Texturing. */
case PIPE_CAP_MAX_COMBINED_SAMPLERS: case PIPE_CAP_MAX_COMBINED_SAMPLERS:

View File

@@ -565,6 +565,8 @@ static int r600_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS: case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
case PIPE_CAP_TEXTURE_BUFFER_OBJECTS: case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
return 1; return 1;
case PIPE_CAP_TGSI_TEXCOORD:
return 0;
case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT: case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
return R600_MAP_BUFFER_ALIGNMENT; return R600_MAP_BUFFER_ALIGNMENT;

View File

@@ -330,6 +330,8 @@ static int r600_get_param(struct pipe_screen* pscreen, enum pipe_cap param)
case PIPE_CAP_START_INSTANCE: case PIPE_CAP_START_INSTANCE:
case PIPE_CAP_NPOT_TEXTURES: case PIPE_CAP_NPOT_TEXTURES:
return 1; return 1;
case PIPE_CAP_TGSI_TEXCOORD:
return 0;
case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT: case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
return 64; return 64;

View File

@@ -173,6 +173,8 @@ softpipe_get_param(struct pipe_screen *screen, enum pipe_cap param)
return 1; return 1;
case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT: case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
return 0; return 0;
case PIPE_CAP_TGSI_TEXCOORD:
return 0;
} }
/* should only get here on unhandled cases */ /* should only get here on unhandled cases */
debug_printf("Unexpected PIPE_CAP %d query\n", param); debug_printf("Unexpected PIPE_CAP %d query\n", param);

View File

@@ -150,6 +150,8 @@ svga_get_param(struct pipe_screen *screen, enum pipe_cap param)
return 1; return 1;
case PIPE_CAP_POINT_SPRITE: case PIPE_CAP_POINT_SPRITE:
return 1; return 1;
case PIPE_CAP_TGSI_TEXCOORD:
return 0;
case PIPE_CAP_MAX_RENDER_TARGETS: case PIPE_CAP_MAX_RENDER_TARGETS:
if(!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_RENDER_TARGETS, &result)) if(!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_RENDER_TARGETS, &result))
return 1; return 1;

View File

@@ -498,7 +498,8 @@ enum pipe_cap {
PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT = 75, PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT = 75,
PIPE_CAP_CUBE_MAP_ARRAY = 76, PIPE_CAP_CUBE_MAP_ARRAY = 76,
PIPE_CAP_TEXTURE_BUFFER_OBJECTS = 77, PIPE_CAP_TEXTURE_BUFFER_OBJECTS = 77,
PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT = 78 PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT = 78,
PIPE_CAP_TGSI_TEXCOORD = 79
}; };
/** /**

View File

@@ -162,7 +162,9 @@ struct tgsi_declaration_interp
#define TGSI_SEMANTIC_BLOCK_ID 16 /**< id of the current block */ #define TGSI_SEMANTIC_BLOCK_ID 16 /**< id of the current block */
#define TGSI_SEMANTIC_BLOCK_SIZE 17 /**< block size in threads */ #define TGSI_SEMANTIC_BLOCK_SIZE 17 /**< block size in threads */
#define TGSI_SEMANTIC_THREAD_ID 18 /**< block-relative id of the current thread */ #define TGSI_SEMANTIC_THREAD_ID 18 /**< block-relative id of the current thread */
#define TGSI_SEMANTIC_COUNT 19 /**< number of semantic values */ #define TGSI_SEMANTIC_TEXCOORD 19 /**< texture or sprite coordinates */
#define TGSI_SEMANTIC_PCOORD 20 /**< point sprite coordinate */
#define TGSI_SEMANTIC_COUNT 21 /**< number of semantic values */
struct tgsi_declaration_semantic struct tgsi_declaration_semantic
{ {

View File

@@ -145,7 +145,7 @@ struct pipe_rasterizer_state
unsigned line_stipple_factor:8; /**< [1..256] actually */ unsigned line_stipple_factor:8; /**< [1..256] actually */
unsigned line_stipple_pattern:16; unsigned line_stipple_pattern:16;
unsigned sprite_coord_enable; /* bitfield referring to 32 GENERIC inputs */ uint32_t sprite_coord_enable; /* referring to 32 TEXCOORD/GENERIC inputs */
float line_width; float line_width;
float point_size; /**< used when no per-vertex size */ float point_size; /**< used when no per-vertex size */

View File

@@ -183,6 +183,9 @@ st_create_context_priv( struct gl_context *ctx, struct pipe_context *pipe,
screen->get_param(screen, PIPE_CAP_SHADER_STENCIL_EXPORT); screen->get_param(screen, PIPE_CAP_SHADER_STENCIL_EXPORT);
st->has_shader_model3 = screen->get_param(screen, PIPE_CAP_SM3); st->has_shader_model3 = screen->get_param(screen, PIPE_CAP_SM3);
st->needs_texcoord_semantic =
screen->get_param(screen, PIPE_CAP_TGSI_TEXCOORD);
/* GL limits and extensions */ /* GL limits and extensions */
st_init_limits(st); st_init_limits(st);
st_init_extensions(st); st_init_extensions(st);

View File

@@ -85,6 +85,8 @@ struct st_context
boolean has_time_elapsed; boolean has_time_elapsed;
boolean has_shader_model3; boolean has_shader_model3;
boolean needs_texcoord_semantic;
/* On old libGL's for linux we need to invalidate the drawables /* On old libGL's for linux we need to invalidate the drawables
* on glViewport calls; this is set via an option. * on glViewport calls; this is set via an option.
*/ */

View File

@@ -177,6 +177,7 @@ void
st_prepare_vertex_program(struct gl_context *ctx, st_prepare_vertex_program(struct gl_context *ctx,
struct st_vertex_program *stvp) struct st_vertex_program *stvp)
{ {
struct st_context *st = st_context(ctx);
GLuint attr; GLuint attr;
stvp->num_inputs = 0; stvp->num_inputs = 0;
@@ -267,7 +268,8 @@ st_prepare_vertex_program(struct gl_context *ctx,
case VARYING_SLOT_TEX5: case VARYING_SLOT_TEX5:
case VARYING_SLOT_TEX6: case VARYING_SLOT_TEX6:
case VARYING_SLOT_TEX7: case VARYING_SLOT_TEX7:
stvp->output_semantic_name[slot] = TGSI_SEMANTIC_GENERIC; stvp->output_semantic_name[slot] = st->needs_texcoord_semantic ?
TGSI_SEMANTIC_TEXCOORD : TGSI_SEMANTIC_GENERIC;
stvp->output_semantic_index[slot] = attr - VARYING_SLOT_TEX0; stvp->output_semantic_index[slot] = attr - VARYING_SLOT_TEX0;
break; break;
@@ -275,10 +277,8 @@ st_prepare_vertex_program(struct gl_context *ctx,
default: default:
assert(attr < VARYING_SLOT_MAX); assert(attr < VARYING_SLOT_MAX);
stvp->output_semantic_name[slot] = TGSI_SEMANTIC_GENERIC; stvp->output_semantic_name[slot] = TGSI_SEMANTIC_GENERIC;
stvp->output_semantic_index[slot] = (VARYING_SLOT_VAR0 - stvp->output_semantic_index[slot] = st->needs_texcoord_semantic ?
VARYING_SLOT_TEX0 + (attr - VARYING_SLOT_VAR0) : (attr - VARYING_SLOT_TEX0);
attr -
VARYING_SLOT_VAR0);
break; break;
} }
} }
@@ -585,11 +585,18 @@ st_translate_fragment_program(struct st_context *st,
* fragment shader plus fixed-function hardware (such as * fragment shader plus fixed-function hardware (such as
* BFC). * BFC).
* *
* There is no requirement that semantic indexes start at * However, some drivers may need us to identify the PNTC and TEXi
* zero or be restricted to a particular range -- nobody * varyings if, for example, their capability to replace them with
* should be building tables based on semantic index. * sprite coordinates is limited.
*/ */
case VARYING_SLOT_PNTC: case VARYING_SLOT_PNTC:
if (st->needs_texcoord_semantic) {
input_semantic_name[slot] = TGSI_SEMANTIC_PCOORD;
input_semantic_index[slot] = 0;
interpMode[slot] = TGSI_INTERPOLATE_LINEAR;
break;
}
/* fall through */
case VARYING_SLOT_TEX0: case VARYING_SLOT_TEX0:
case VARYING_SLOT_TEX1: case VARYING_SLOT_TEX1:
case VARYING_SLOT_TEX2: case VARYING_SLOT_TEX2:
@@ -598,13 +605,29 @@ st_translate_fragment_program(struct st_context *st,
case VARYING_SLOT_TEX5: case VARYING_SLOT_TEX5:
case VARYING_SLOT_TEX6: case VARYING_SLOT_TEX6:
case VARYING_SLOT_TEX7: case VARYING_SLOT_TEX7:
if (st->needs_texcoord_semantic) {
input_semantic_name[slot] = TGSI_SEMANTIC_TEXCOORD;
input_semantic_index[slot] = attr - VARYING_SLOT_TEX0;
interpMode[slot] =
st_translate_interp(stfp->Base.InterpQualifier[attr], FALSE);
break;
}
/* fall through */
case VARYING_SLOT_VAR0: case VARYING_SLOT_VAR0:
default: default:
/* Actually, let's try and zero-base this just for /* Semantic indices should be zero-based because drivers may choose
* readability of the generated TGSI. * to assign a fixed slot determined by that index.
* This is useful because ARB_separate_shader_objects uses location
* qualifiers for linkage, and if the semantic index corresponds to
* these locations, linkage passes in the driver become unnecessary.
*
* If needs_texcoord_semantic is true, no semantic indices will be
* consumed for the TEXi varyings, and we can base the locations of
* the user varyings on VAR0. Otherwise, we use TEX0 as base index.
*/ */
assert(attr >= VARYING_SLOT_TEX0); assert(attr >= VARYING_SLOT_TEX0);
input_semantic_index[slot] = (attr - VARYING_SLOT_TEX0); input_semantic_index[slot] = st->needs_texcoord_semantic ?
(attr - VARYING_SLOT_VAR0) : (attr - VARYING_SLOT_TEX0);
input_semantic_name[slot] = TGSI_SEMANTIC_GENERIC; input_semantic_name[slot] = TGSI_SEMANTIC_GENERIC;
if (attr == VARYING_SLOT_PNTC) if (attr == VARYING_SLOT_PNTC)
interpMode[slot] = TGSI_INTERPOLATE_LINEAR; interpMode[slot] = TGSI_INTERPOLATE_LINEAR;