i965/fs: Add a shader_stats struct.

It'll grow further, and we'd like to avoid adding an additional
parameter to fs_generator() for each new piece of data.

v2 (idr): Rebase on 17 months.  Track a visitor instead of a cfg.

Reviewed-by: Kenneth Graunke <kenneth@whitecape.org>
Reviewed-by: Matt Turner <mattst88@gmail.com>
This commit is contained in:
Matt Turner
2016-10-17 14:10:26 -07:00
committed by Ian Romanick
parent 11a49f289d
commit dabb5d4bee
9 changed files with 29 additions and 27 deletions

View File

@@ -8108,7 +8108,7 @@ brw_compile_fs(const struct brw_compiler *compiler, void *log_data,
} }
fs_generator g(compiler, log_data, mem_ctx, &prog_data->base, fs_generator g(compiler, log_data, mem_ctx, &prog_data->base,
v8.promoted_constants, v8.runtime_check_aads_emit, v8.shader_stats, v8.runtime_check_aads_emit,
MESA_SHADER_FRAGMENT); MESA_SHADER_FRAGMENT);
if (unlikely(INTEL_DEBUG & DEBUG_WM)) { if (unlikely(INTEL_DEBUG & DEBUG_WM)) {
@@ -8258,9 +8258,8 @@ brw_compile_cs(const struct brw_compiler *compiler, void *log_data,
unsigned max_dispatch_width = 32; unsigned max_dispatch_width = 32;
fs_visitor *v8 = NULL, *v16 = NULL, *v32 = NULL; fs_visitor *v8 = NULL, *v16 = NULL, *v32 = NULL;
cfg_t *cfg = NULL; fs_visitor *v = NULL;
const char *fail_msg = NULL; const char *fail_msg = NULL;
unsigned promoted_constants = 0;
if ((int)key->base.subgroup_size_type >= (int)BRW_SUBGROUP_SIZE_REQUIRE_8) { if ((int)key->base.subgroup_size_type >= (int)BRW_SUBGROUP_SIZE_REQUIRE_8) {
/* These enum values are expressly chosen to be equal to the subgroup /* These enum values are expressly chosen to be equal to the subgroup
@@ -8294,10 +8293,9 @@ brw_compile_cs(const struct brw_compiler *compiler, void *log_data,
/* We should always be able to do SIMD32 for compute shaders */ /* We should always be able to do SIMD32 for compute shaders */
assert(v8->max_dispatch_width >= 32); assert(v8->max_dispatch_width >= 32);
cfg = v8->cfg; v = v8;
cs_set_simd_size(prog_data, 8); cs_set_simd_size(prog_data, 8);
cs_fill_push_const_info(compiler->devinfo, prog_data); cs_fill_push_const_info(compiler->devinfo, prog_data);
promoted_constants = v8->promoted_constants;
} }
} }
@@ -8317,7 +8315,7 @@ brw_compile_cs(const struct brw_compiler *compiler, void *log_data,
compiler->shader_perf_log(log_data, compiler->shader_perf_log(log_data,
"SIMD16 shader failed to compile: %s", "SIMD16 shader failed to compile: %s",
v16->fail_msg); v16->fail_msg);
if (!cfg) { if (!v) {
fail_msg = fail_msg =
"Couldn't generate SIMD16 program and not " "Couldn't generate SIMD16 program and not "
"enough threads for SIMD8"; "enough threads for SIMD8";
@@ -8326,10 +8324,9 @@ brw_compile_cs(const struct brw_compiler *compiler, void *log_data,
/* We should always be able to do SIMD32 for compute shaders */ /* We should always be able to do SIMD32 for compute shaders */
assert(v16->max_dispatch_width >= 32); assert(v16->max_dispatch_width >= 32);
cfg = v16->cfg; v = v16;
cs_set_simd_size(prog_data, 16); cs_set_simd_size(prog_data, 16);
cs_fill_push_const_info(compiler->devinfo, prog_data); cs_fill_push_const_info(compiler->devinfo, prog_data);
promoted_constants = v16->promoted_constants;
} }
} }
@@ -8354,27 +8351,27 @@ brw_compile_cs(const struct brw_compiler *compiler, void *log_data,
compiler->shader_perf_log(log_data, compiler->shader_perf_log(log_data,
"SIMD32 shader failed to compile: %s", "SIMD32 shader failed to compile: %s",
v16->fail_msg); v16->fail_msg);
if (!cfg) { if (!v) {
fail_msg = fail_msg =
"Couldn't generate SIMD32 program and not " "Couldn't generate SIMD32 program and not "
"enough threads for SIMD16"; "enough threads for SIMD16";
} }
} else { } else {
cfg = v32->cfg; v = v32;
cs_set_simd_size(prog_data, 32); cs_set_simd_size(prog_data, 32);
cs_fill_push_const_info(compiler->devinfo, prog_data); cs_fill_push_const_info(compiler->devinfo, prog_data);
promoted_constants = v32->promoted_constants;
} }
} }
const unsigned *ret = NULL; const unsigned *ret = NULL;
if (unlikely(cfg == NULL)) { if (unlikely(v == NULL)) {
assert(fail_msg); assert(fail_msg);
if (error_str) if (error_str)
*error_str = ralloc_strdup(mem_ctx, fail_msg); *error_str = ralloc_strdup(mem_ctx, fail_msg);
} else { } else {
fs_generator g(compiler, log_data, mem_ctx, &prog_data->base, fs_generator g(compiler, log_data, mem_ctx, &prog_data->base,
promoted_constants, false, MESA_SHADER_COMPUTE); v->shader_stats, v->runtime_check_aads_emit,
MESA_SHADER_COMPUTE);
if (INTEL_DEBUG & DEBUG_CS) { if (INTEL_DEBUG & DEBUG_CS) {
char *name = ralloc_asprintf(mem_ctx, "%s compute shader %s", char *name = ralloc_asprintf(mem_ctx, "%s compute shader %s",
src_shader->info.label ? src_shader->info.label ?
@@ -8383,7 +8380,7 @@ brw_compile_cs(const struct brw_compiler *compiler, void *log_data,
g.enable_debug(name); g.enable_debug(name);
} }
g.generate_code(cfg, prog_data->simd_size); g.generate_code(v->cfg, prog_data->simd_size);
ret = g.get_assembly(); ret = g.get_assembly();
} }

View File

@@ -52,6 +52,10 @@ offset(const fs_reg &reg, const brw::fs_builder &bld, unsigned delta)
#define UBO_START ((1 << 16) - 4) #define UBO_START ((1 << 16) - 4)
struct shader_stats {
unsigned promoted_constants;
};
/** /**
* The fragment shader front-end. * The fragment shader front-end.
* *
@@ -389,7 +393,8 @@ public:
int shader_time_index; int shader_time_index;
unsigned promoted_constants; struct shader_stats shader_stats;
brw::fs_builder bld; brw::fs_builder bld;
private: private:
@@ -413,7 +418,7 @@ public:
fs_generator(const struct brw_compiler *compiler, void *log_data, fs_generator(const struct brw_compiler *compiler, void *log_data,
void *mem_ctx, void *mem_ctx,
struct brw_stage_prog_data *prog_data, struct brw_stage_prog_data *prog_data,
unsigned promoted_constants, struct shader_stats shader_stats,
bool runtime_check_aads_emit, bool runtime_check_aads_emit,
gl_shader_stage stage); gl_shader_stage stage);
~fs_generator(); ~fs_generator();
@@ -517,7 +522,7 @@ private:
unsigned dispatch_width; /**< 8, 16 or 32 */ unsigned dispatch_width; /**< 8, 16 or 32 */
exec_list discard_halt_patches; exec_list discard_halt_patches;
unsigned promoted_constants; struct shader_stats shader_stats;
bool runtime_check_aads_emit; bool runtime_check_aads_emit;
bool debug_flag; bool debug_flag;
const char *shader_name; const char *shader_name;

View File

@@ -442,7 +442,7 @@ fs_visitor::opt_combine_constants()
reg.offset += imm->size * width; reg.offset += imm->size * width;
} }
promoted_constants = table.len; shader_stats.promoted_constants = table.len;
/* Rewrite the immediate sources to refer to the new GRFs. */ /* Rewrite the immediate sources to refer to the new GRFs. */
for (int i = 0; i < table.len; i++) { for (int i = 0; i < table.len; i++) {

View File

@@ -183,14 +183,14 @@ brw_reg_from_fs_reg(const struct gen_device_info *devinfo, fs_inst *inst,
fs_generator::fs_generator(const struct brw_compiler *compiler, void *log_data, fs_generator::fs_generator(const struct brw_compiler *compiler, void *log_data,
void *mem_ctx, void *mem_ctx,
struct brw_stage_prog_data *prog_data, struct brw_stage_prog_data *prog_data,
unsigned promoted_constants, struct shader_stats shader_stats,
bool runtime_check_aads_emit, bool runtime_check_aads_emit,
gl_shader_stage stage) gl_shader_stage stage)
: compiler(compiler), log_data(log_data), : compiler(compiler), log_data(log_data),
devinfo(compiler->devinfo), devinfo(compiler->devinfo),
prog_data(prog_data), prog_data(prog_data),
promoted_constants(promoted_constants), shader_stats(shader_stats),
runtime_check_aads_emit(runtime_check_aads_emit), debug_flag(false), runtime_check_aads_emit(runtime_check_aads_emit), debug_flag(false),
stage(stage), mem_ctx(mem_ctx) stage(stage), mem_ctx(mem_ctx)
{ {
@@ -2253,7 +2253,7 @@ fs_generator::generate_code(const cfg_t *cfg, int dispatch_width)
"SIMD%d shader: %d instructions. %d loops. %u cycles. %d:%d spills:fills. Promoted %u constants. Compacted %d to %d" "SIMD%d shader: %d instructions. %d loops. %u cycles. %d:%d spills:fills. Promoted %u constants. Compacted %d to %d"
" bytes (%.0f%%)\n", " bytes (%.0f%%)\n",
shader_name, dispatch_width, before_size / 16, loop_count, cfg->cycle_count, shader_name, dispatch_width, before_size / 16, loop_count, cfg->cycle_count,
spill_count, fill_count, promoted_constants, before_size, after_size, spill_count, fill_count, shader_stats.promoted_constants, before_size, after_size,
100.0f * (before_size - after_size) / before_size); 100.0f * (before_size - after_size) / before_size);
dump_assembly(p->store, disasm_info); dump_assembly(p->store, disasm_info);
@@ -2268,7 +2268,7 @@ fs_generator::generate_code(const cfg_t *cfg, int dispatch_width)
_mesa_shader_stage_to_abbrev(stage), _mesa_shader_stage_to_abbrev(stage),
dispatch_width, before_size / 16, dispatch_width, before_size / 16,
loop_count, cfg->cycle_count, spill_count, loop_count, cfg->cycle_count, spill_count,
fill_count, promoted_constants, before_size, fill_count, shader_stats.promoted_constants, before_size,
after_size); after_size);
return start_offset; return start_offset;

View File

@@ -952,7 +952,7 @@ fs_visitor::init()
this->pull_constant_loc = NULL; this->pull_constant_loc = NULL;
this->push_constant_loc = NULL; this->push_constant_loc = NULL;
this->promoted_constants = 0, this->shader_stats.promoted_constants = 0,
this->grf_used = 0; this->grf_used = 0;
this->spilled_any_registers = false; this->spilled_any_registers = false;

View File

@@ -1335,7 +1335,7 @@ brw_compile_tes(const struct brw_compiler *compiler,
prog_data->base.dispatch_mode = DISPATCH_MODE_SIMD8; prog_data->base.dispatch_mode = DISPATCH_MODE_SIMD8;
fs_generator g(compiler, log_data, mem_ctx, fs_generator g(compiler, log_data, mem_ctx,
&prog_data->base.base, v.promoted_constants, false, &prog_data->base.base, v.shader_stats, false,
MESA_SHADER_TESS_EVAL); MESA_SHADER_TESS_EVAL);
if (unlikely(INTEL_DEBUG & DEBUG_TES)) { if (unlikely(INTEL_DEBUG & DEBUG_TES)) {
g.enable_debug(ralloc_asprintf(mem_ctx, g.enable_debug(ralloc_asprintf(mem_ctx,

View File

@@ -2975,7 +2975,7 @@ brw_compile_vs(const struct brw_compiler *compiler, void *log_data,
prog_data->base.base.dispatch_grf_start_reg = v.payload.num_regs; prog_data->base.base.dispatch_grf_start_reg = v.payload.num_regs;
fs_generator g(compiler, log_data, mem_ctx, fs_generator g(compiler, log_data, mem_ctx,
&prog_data->base.base, v.promoted_constants, &prog_data->base.base, v.shader_stats,
v.runtime_check_aads_emit, MESA_SHADER_VERTEX); v.runtime_check_aads_emit, MESA_SHADER_VERTEX);
if (INTEL_DEBUG & DEBUG_VS) { if (INTEL_DEBUG & DEBUG_VS) {
const char *debug_name = const char *debug_name =

View File

@@ -856,7 +856,7 @@ brw_compile_gs(const struct brw_compiler *compiler, void *log_data,
prog_data->base.base.dispatch_grf_start_reg = v.payload.num_regs; prog_data->base.base.dispatch_grf_start_reg = v.payload.num_regs;
fs_generator g(compiler, log_data, mem_ctx, fs_generator g(compiler, log_data, mem_ctx,
&prog_data->base.base, v.promoted_constants, &prog_data->base.base, v.shader_stats,
false, MESA_SHADER_GEOMETRY); false, MESA_SHADER_GEOMETRY);
if (unlikely(INTEL_DEBUG & DEBUG_GS)) { if (unlikely(INTEL_DEBUG & DEBUG_GS)) {
const char *label = const char *label =

View File

@@ -487,7 +487,7 @@ brw_compile_tcs(const struct brw_compiler *compiler,
prog_data->base.base.dispatch_grf_start_reg = v.payload.num_regs; prog_data->base.base.dispatch_grf_start_reg = v.payload.num_regs;
fs_generator g(compiler, log_data, mem_ctx, fs_generator g(compiler, log_data, mem_ctx,
&prog_data->base.base, v.promoted_constants, false, &prog_data->base.base, v.shader_stats, false,
MESA_SHADER_TESS_CTRL); MESA_SHADER_TESS_CTRL);
if (unlikely(INTEL_DEBUG & DEBUG_TCS)) { if (unlikely(INTEL_DEBUG & DEBUG_TCS)) {
g.enable_debug(ralloc_asprintf(mem_ctx, g.enable_debug(ralloc_asprintf(mem_ctx,