radv: Move radv_optimize_nir_algebraic to a separate function.

Signed-off-by: Timur Kristóf <timur.kristof@gmail.com> Reviewed-by: Samuel Pitoiset <samuel.pitoiset@gmail.com> Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/11711>
2021-07-05 09:05:43 +02:00
parent 00d11c2065
commit fd64c18214
3 changed files with 35 additions and 29 deletions
--- a/src/amd/vulkan/radv_pipeline.c
+++ b/src/amd/vulkan/radv_pipeline.c
@@ -3449,35 +3449,7 @@ radv_create_shaders(struct radv_pipeline *pipeline, struct radv_device *device,
         if (lowered_ngg)
            radv_lower_ngg(device, nir[i], &infos[i], pipeline_key, &keys[i]);
-         /* optimize the lowered ALU operations */
+         radv_optimize_nir_algebraic(nir[i], io_to_mem || lowered_ngg || i == MESA_SHADER_COMPUTE);
         bool more_algebraic = true;
         while (more_algebraic) {
            more_algebraic = false;
            NIR_PASS_V(nir[i], nir_copy_prop);
            NIR_PASS_V(nir[i], nir_opt_dce);
            NIR_PASS_V(nir[i], nir_opt_constant_folding);
            NIR_PASS_V(nir[i], nir_opt_cse);
            NIR_PASS(more_algebraic, nir[i], nir_opt_algebraic);
         }
         if (io_to_mem || lowered_ngg || i == MESA_SHADER_COMPUTE)
            NIR_PASS_V(nir[i], nir_opt_offsets);
         /* Do late algebraic optimization to turn add(a,
          * neg(b)) back into subs, then the mandatory cleanup
          * after algebraic.  Note that it may produce fnegs,
          * and if so then we need to keep running to squash
          * fneg(fneg(a)).
          */
         bool more_late_algebraic = true;
         while (more_late_algebraic) {
            more_late_algebraic = false;
            NIR_PASS(more_late_algebraic, nir[i], nir_opt_algebraic_late);
            NIR_PASS_V(nir[i], nir_opt_constant_folding);
            NIR_PASS_V(nir[i], nir_copy_prop);
            NIR_PASS_V(nir[i], nir_opt_dce);
            NIR_PASS_V(nir[i], nir_opt_cse);
         }
         if (nir[i]->info.bit_sizes_int & (8 | 16)) {
            if (device->physical_device->rad_info.chip_class >= GFX8) {
--- a/src/amd/vulkan/radv_shader.c
+++ b/src/amd/vulkan/radv_shader.c
@@ -189,6 +189,39 @@ radv_optimize_nir(const struct radv_device *device, struct nir_shader *shader,
   NIR_PASS(progress, shader, nir_opt_move, nir_move_load_ubo);
 }
 void
 radv_optimize_nir_algebraic(nir_shader *nir, bool opt_offsets)
 {
   bool more_algebraic = true;
   while (more_algebraic) {
      more_algebraic = false;
      NIR_PASS_V(nir, nir_copy_prop);
      NIR_PASS_V(nir, nir_opt_dce);
      NIR_PASS_V(nir, nir_opt_constant_folding);
      NIR_PASS_V(nir, nir_opt_cse);
      NIR_PASS(more_algebraic, nir, nir_opt_algebraic);
   }
   if (opt_offsets)
      NIR_PASS_V(nir, nir_opt_offsets);
   /* Do late algebraic optimization to turn add(a,
    * neg(b)) back into subs, then the mandatory cleanup
    * after algebraic.  Note that it may produce fnegs,
    * and if so then we need to keep running to squash
    * fneg(fneg(a)).
    */
   bool more_late_algebraic = true;
   while (more_late_algebraic) {
      more_late_algebraic = false;
      NIR_PASS(more_late_algebraic, nir, nir_opt_algebraic_late);
      NIR_PASS_V(nir, nir_opt_constant_folding);
      NIR_PASS_V(nir, nir_copy_prop);
      NIR_PASS_V(nir, nir_opt_dce);
      NIR_PASS_V(nir, nir_opt_cse);
   }
 }
 static void
 shared_var_info(const struct glsl_type *type, unsigned *size, unsigned *align)
 {
--- a/src/amd/vulkan/radv_shader.h
+++ b/src/amd/vulkan/radv_shader.h
@@ -425,6 +425,7 @@ struct radv_shader_slab {
 void radv_optimize_nir(const struct radv_device *device, struct nir_shader *shader,
                       bool optimize_conservatively, bool allow_copies);
 void radv_optimize_nir_algebraic(nir_shader *shader, bool opt_offsets);
 bool radv_nir_lower_ycbcr_textures(nir_shader *shader, const struct radv_pipeline_layout *layout);
 nir_shader *radv_shader_compile_to_nir(struct radv_device *device, struct vk_shader_module *module,