intel/nir: Extract add_const_offset_to_base
Pretty much every driver using nir_lower_io_to_temporaries followed by nir_lower_io is going to want this. In particular, radv and radeonsi in the next commits. Reviewed-by: Bas Nieuwenhuizen <bas@basnieuwenhuizen.nl>
This commit is contained in:
@@ -3171,6 +3171,8 @@ bool nir_lower_io(nir_shader *shader,
|
|||||||
int (*type_size)(const struct glsl_type *, bool),
|
int (*type_size)(const struct glsl_type *, bool),
|
||||||
nir_lower_io_options);
|
nir_lower_io_options);
|
||||||
|
|
||||||
|
bool nir_io_add_const_offset_to_base(nir_shader *nir, nir_variable_mode mode);
|
||||||
|
|
||||||
typedef enum {
|
typedef enum {
|
||||||
/**
|
/**
|
||||||
* An address format which is a simple 32-bit global GPU address.
|
* An address format which is a simple 32-bit global GPU address.
|
||||||
|
@@ -1307,3 +1307,78 @@ nir_build_addr_isub(nir_builder *b, nir_ssa_def *addr0, nir_ssa_def *addr1,
|
|||||||
|
|
||||||
unreachable("Invalid address format");
|
unreachable("Invalid address format");
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static bool
|
||||||
|
is_input(nir_intrinsic_instr *intrin)
|
||||||
|
{
|
||||||
|
return intrin->intrinsic == nir_intrinsic_load_input ||
|
||||||
|
intrin->intrinsic == nir_intrinsic_load_per_vertex_input ||
|
||||||
|
intrin->intrinsic == nir_intrinsic_load_interpolated_input ||
|
||||||
|
intrin->intrinsic == nir_intrinsic_load_fs_input_interp_deltas;
|
||||||
|
}
|
||||||
|
|
||||||
|
static bool
|
||||||
|
is_output(nir_intrinsic_instr *intrin)
|
||||||
|
{
|
||||||
|
return intrin->intrinsic == nir_intrinsic_load_output ||
|
||||||
|
intrin->intrinsic == nir_intrinsic_load_per_vertex_output ||
|
||||||
|
intrin->intrinsic == nir_intrinsic_store_output ||
|
||||||
|
intrin->intrinsic == nir_intrinsic_store_per_vertex_output;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/**
|
||||||
|
* This pass adds constant offsets to instr->const_index[0] for input/output
|
||||||
|
* intrinsics, and resets the offset source to 0. Non-constant offsets remain
|
||||||
|
* unchanged - since we don't know what part of a compound variable is
|
||||||
|
* accessed, we allocate storage for the entire thing. For drivers that use
|
||||||
|
* nir_lower_io_to_temporaries() before nir_lower_io(), this guarantees that
|
||||||
|
* the offset source will be 0, so that they don't have to add it in manually.
|
||||||
|
*/
|
||||||
|
|
||||||
|
static bool
|
||||||
|
add_const_offset_to_base_block(nir_block *block, nir_builder *b,
|
||||||
|
nir_variable_mode mode)
|
||||||
|
{
|
||||||
|
bool progress = false;
|
||||||
|
nir_foreach_instr_safe(instr, block) {
|
||||||
|
if (instr->type != nir_instr_type_intrinsic)
|
||||||
|
continue;
|
||||||
|
|
||||||
|
nir_intrinsic_instr *intrin = nir_instr_as_intrinsic(instr);
|
||||||
|
|
||||||
|
if ((mode == nir_var_shader_in && is_input(intrin)) ||
|
||||||
|
(mode == nir_var_shader_out && is_output(intrin))) {
|
||||||
|
nir_src *offset = nir_get_io_offset_src(intrin);
|
||||||
|
|
||||||
|
if (nir_src_is_const(*offset)) {
|
||||||
|
intrin->const_index[0] += nir_src_as_uint(*offset);
|
||||||
|
b->cursor = nir_before_instr(&intrin->instr);
|
||||||
|
nir_instr_rewrite_src(&intrin->instr, offset,
|
||||||
|
nir_src_for_ssa(nir_imm_int(b, 0)));
|
||||||
|
progress = true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return progress;
|
||||||
|
}
|
||||||
|
|
||||||
|
bool
|
||||||
|
nir_io_add_const_offset_to_base(nir_shader *nir, nir_variable_mode mode)
|
||||||
|
{
|
||||||
|
bool progress = false;
|
||||||
|
|
||||||
|
nir_foreach_function(f, nir) {
|
||||||
|
if (f->impl) {
|
||||||
|
nir_builder b;
|
||||||
|
nir_builder_init(&b, f->impl);
|
||||||
|
nir_foreach_block(block, f->impl) {
|
||||||
|
progress |= add_const_offset_to_base_block(block, &b, mode);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return progress;
|
||||||
|
}
|
||||||
|
|
||||||
|
@@ -28,75 +28,6 @@
|
|||||||
#include "compiler/nir/nir_builder.h"
|
#include "compiler/nir/nir_builder.h"
|
||||||
#include "util/u_math.h"
|
#include "util/u_math.h"
|
||||||
|
|
||||||
static bool
|
|
||||||
is_input(nir_intrinsic_instr *intrin)
|
|
||||||
{
|
|
||||||
return intrin->intrinsic == nir_intrinsic_load_input ||
|
|
||||||
intrin->intrinsic == nir_intrinsic_load_per_vertex_input ||
|
|
||||||
intrin->intrinsic == nir_intrinsic_load_interpolated_input ||
|
|
||||||
intrin->intrinsic == nir_intrinsic_load_fs_input_interp_deltas;
|
|
||||||
}
|
|
||||||
|
|
||||||
static bool
|
|
||||||
is_output(nir_intrinsic_instr *intrin)
|
|
||||||
{
|
|
||||||
return intrin->intrinsic == nir_intrinsic_load_output ||
|
|
||||||
intrin->intrinsic == nir_intrinsic_load_per_vertex_output ||
|
|
||||||
intrin->intrinsic == nir_intrinsic_store_output ||
|
|
||||||
intrin->intrinsic == nir_intrinsic_store_per_vertex_output;
|
|
||||||
}
|
|
||||||
|
|
||||||
/**
|
|
||||||
* In many cases, we just add the base and offset together, so there's no
|
|
||||||
* reason to keep them separate. Sometimes, combining them is essential:
|
|
||||||
* if a shader only accesses part of a compound variable (such as a matrix
|
|
||||||
* or array), the variable's base may not actually exist in the VUE map.
|
|
||||||
*
|
|
||||||
* This pass adds constant offsets to instr->const_index[0], and resets
|
|
||||||
* the offset source to 0. Non-constant offsets remain unchanged - since
|
|
||||||
* we don't know what part of a compound variable is accessed, we allocate
|
|
||||||
* storage for the entire thing.
|
|
||||||
*/
|
|
||||||
|
|
||||||
static bool
|
|
||||||
add_const_offset_to_base_block(nir_block *block, nir_builder *b,
|
|
||||||
nir_variable_mode mode)
|
|
||||||
{
|
|
||||||
nir_foreach_instr_safe(instr, block) {
|
|
||||||
if (instr->type != nir_instr_type_intrinsic)
|
|
||||||
continue;
|
|
||||||
|
|
||||||
nir_intrinsic_instr *intrin = nir_instr_as_intrinsic(instr);
|
|
||||||
|
|
||||||
if ((mode == nir_var_shader_in && is_input(intrin)) ||
|
|
||||||
(mode == nir_var_shader_out && is_output(intrin))) {
|
|
||||||
nir_src *offset = nir_get_io_offset_src(intrin);
|
|
||||||
|
|
||||||
if (nir_src_is_const(*offset)) {
|
|
||||||
intrin->const_index[0] += nir_src_as_uint(*offset);
|
|
||||||
b->cursor = nir_before_instr(&intrin->instr);
|
|
||||||
nir_instr_rewrite_src(&intrin->instr, offset,
|
|
||||||
nir_src_for_ssa(nir_imm_int(b, 0)));
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
return true;
|
|
||||||
}
|
|
||||||
|
|
||||||
static void
|
|
||||||
add_const_offset_to_base(nir_shader *nir, nir_variable_mode mode)
|
|
||||||
{
|
|
||||||
nir_foreach_function(f, nir) {
|
|
||||||
if (f->impl) {
|
|
||||||
nir_builder b;
|
|
||||||
nir_builder_init(&b, f->impl);
|
|
||||||
nir_foreach_block(block, f->impl) {
|
|
||||||
add_const_offset_to_base_block(block, &b, mode);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
static bool
|
static bool
|
||||||
remap_tess_levels(nir_builder *b, nir_intrinsic_instr *intr,
|
remap_tess_levels(nir_builder *b, nir_intrinsic_instr *intr,
|
||||||
GLenum primitive_mode)
|
GLenum primitive_mode)
|
||||||
@@ -152,6 +83,24 @@ remap_tess_levels(nir_builder *b, nir_intrinsic_instr *intr,
|
|||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static bool
|
||||||
|
is_input(nir_intrinsic_instr *intrin)
|
||||||
|
{
|
||||||
|
return intrin->intrinsic == nir_intrinsic_load_input ||
|
||||||
|
intrin->intrinsic == nir_intrinsic_load_per_vertex_input ||
|
||||||
|
intrin->intrinsic == nir_intrinsic_load_interpolated_input;
|
||||||
|
}
|
||||||
|
|
||||||
|
static bool
|
||||||
|
is_output(nir_intrinsic_instr *intrin)
|
||||||
|
{
|
||||||
|
return intrin->intrinsic == nir_intrinsic_load_output ||
|
||||||
|
intrin->intrinsic == nir_intrinsic_load_per_vertex_output ||
|
||||||
|
intrin->intrinsic == nir_intrinsic_store_output ||
|
||||||
|
intrin->intrinsic == nir_intrinsic_store_per_vertex_output;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
static bool
|
static bool
|
||||||
remap_patch_urb_offsets(nir_block *block, nir_builder *b,
|
remap_patch_urb_offsets(nir_block *block, nir_builder *b,
|
||||||
const struct brw_vue_map *vue_map,
|
const struct brw_vue_map *vue_map,
|
||||||
@@ -227,7 +176,7 @@ brw_nir_lower_vs_inputs(nir_shader *nir,
|
|||||||
/* This pass needs actual constants */
|
/* This pass needs actual constants */
|
||||||
nir_opt_constant_folding(nir);
|
nir_opt_constant_folding(nir);
|
||||||
|
|
||||||
add_const_offset_to_base(nir, nir_var_shader_in);
|
nir_io_add_const_offset_to_base(nir, nir_var_shader_in);
|
||||||
|
|
||||||
brw_nir_apply_attribute_workarounds(nir, vs_attrib_wa_flags);
|
brw_nir_apply_attribute_workarounds(nir, vs_attrib_wa_flags);
|
||||||
|
|
||||||
@@ -350,7 +299,7 @@ brw_nir_lower_vue_inputs(nir_shader *nir,
|
|||||||
/* This pass needs actual constants */
|
/* This pass needs actual constants */
|
||||||
nir_opt_constant_folding(nir);
|
nir_opt_constant_folding(nir);
|
||||||
|
|
||||||
add_const_offset_to_base(nir, nir_var_shader_in);
|
nir_io_add_const_offset_to_base(nir, nir_var_shader_in);
|
||||||
|
|
||||||
nir_foreach_function(function, nir) {
|
nir_foreach_function(function, nir) {
|
||||||
if (!function->impl)
|
if (!function->impl)
|
||||||
@@ -401,7 +350,7 @@ brw_nir_lower_tes_inputs(nir_shader *nir, const struct brw_vue_map *vue_map)
|
|||||||
/* This pass needs actual constants */
|
/* This pass needs actual constants */
|
||||||
nir_opt_constant_folding(nir);
|
nir_opt_constant_folding(nir);
|
||||||
|
|
||||||
add_const_offset_to_base(nir, nir_var_shader_in);
|
nir_io_add_const_offset_to_base(nir, nir_var_shader_in);
|
||||||
|
|
||||||
nir_foreach_function(function, nir) {
|
nir_foreach_function(function, nir) {
|
||||||
if (function->impl) {
|
if (function->impl) {
|
||||||
@@ -458,7 +407,7 @@ brw_nir_lower_fs_inputs(nir_shader *nir,
|
|||||||
/* This pass needs actual constants */
|
/* This pass needs actual constants */
|
||||||
nir_opt_constant_folding(nir);
|
nir_opt_constant_folding(nir);
|
||||||
|
|
||||||
add_const_offset_to_base(nir, nir_var_shader_in);
|
nir_io_add_const_offset_to_base(nir, nir_var_shader_in);
|
||||||
}
|
}
|
||||||
|
|
||||||
void
|
void
|
||||||
@@ -484,7 +433,7 @@ brw_nir_lower_tcs_outputs(nir_shader *nir, const struct brw_vue_map *vue_map,
|
|||||||
/* This pass needs actual constants */
|
/* This pass needs actual constants */
|
||||||
nir_opt_constant_folding(nir);
|
nir_opt_constant_folding(nir);
|
||||||
|
|
||||||
add_const_offset_to_base(nir, nir_var_shader_out);
|
nir_io_add_const_offset_to_base(nir, nir_var_shader_out);
|
||||||
|
|
||||||
nir_foreach_function(function, nir) {
|
nir_foreach_function(function, nir) {
|
||||||
if (function->impl) {
|
if (function->impl) {
|
||||||
|
Reference in New Issue
Block a user