intel/fs: prevent large vector ops generated by peephole_ffma

author Lionel Landwerlin <lionel.g.landwerlin@intel.com>

Thu, 9 Mar 2023 10:12:54 +0000 (12:12 +0200)

committer Marge Bot <emma+marge@anholt.net>

Tue, 14 Mar 2023 10:38:50 +0000 (10:38 +0000)
author Lionel Landwerlin <lionel.g.landwerlin@intel.com>
Thu, 9 Mar 2023 10:12:54 +0000 (12:12 +0200)
committer Marge Bot <emma+marge@anholt.net>
Tue, 14 Mar 2023 10:38:50 +0000 (10:38 +0000)
diff --git a/src/intel/compiler/brw_nir.c b/src/intel/compiler/brw_nir.c

index b340c09..6c9feaf 100644 (file)
--- a/src/intel/compiler/brw_nir.c
+++ b/src/intel/compiler/brw_nir.c
@@ -1458,8 +1458,19 @@ brw_postprocess_nir(nir_shader *nir, const struct brw_compiler *compiler,
        brw_nir_optimize(nir, compiler, is_scalar);
  
     if (devinfo->ver >= 6) {
-      /* Try and fuse multiply-adds */
-      OPT(brw_nir_opt_peephole_ffma);
+      /* Try to fuse multiply-adds. If successful, run shrink_vectors to
+       * prevent peephole_ffma from generating things like this:
+       *    vec16 ssa_0 = ...
+       *    vec16 ssa_1 = fneg ssa_0
+       *    vec1  ssa_2 = ffma ssa_1, ...
+       *
+       * We want this instead:
+       *    vec16 ssa_0 = ...
+       *    vec1  ssa_1 = fneg ssa_0.x
+       *    vec1  ssa_2 = ffma ssa_1, ...
+       */
+      if (OPT(brw_nir_opt_peephole_ffma))
+         OPT(nir_opt_shrink_vectors);
     }
  
     if (is_scalar)
author	Lionel Landwerlin <lionel.g.landwerlin@intel.com>
	Thu, 9 Mar 2023 10:12:54 +0000 (12:12 +0200)
committer	Marge Bot <emma+marge@anholt.net>
	Tue, 14 Mar 2023 10:38:50 +0000 (10:38 +0000)