intel/ir: Use brw::performance object instead of CFG cycle counts for codegen stats.
These should be more accurate than the current cycle counts, since, among other things, they consider the effect of post-scheduling passes like the software scoreboard on TGL. In addition, it will enable us to clean up some of the now-redundant cycle-count estimation functionality in the instruction scheduler.

Reviewed-by: Kenneth Graunke <kenneth@whitecape.org>
This commit is contained in:
@@ -1371,7 +1371,8 @@ brw_compile_tes(const struct brw_compiler *compiler,
|
||||
nir->info.name));
|
||||
}
|
||||
|
||||
g.generate_code(v.cfg, 8, v.shader_stats, stats);
|
||||
g.generate_code(v.cfg, 8, v.shader_stats,
|
||||
v.performance_analysis.require(), stats);
|
||||
|
||||
assembly = g.get_assembly();
|
||||
} else {
|
||||
@@ -1387,7 +1388,9 @@ brw_compile_tes(const struct brw_compiler *compiler,
|
||||
v.dump_instructions();
|
||||
|
||||
assembly = brw_vec4_generate_assembly(compiler, log_data, mem_ctx, nir,
|
||||
&prog_data->base, v.cfg, stats);
|
||||
&prog_data->base, v.cfg,
|
||||
v.performance_analysis.require(),
|
||||
stats);
|
||||
}
|
||||
|
||||
return assembly;
|
||||
|
Reference in New Issue
Block a user