Fix SSA update when vectorisation adds a vdef to a read-only loop

author Richard Sandiford <richard.sandiford@arm.com>

Tue, 31 Dec 2019 08:28:24 +0000 (08:28 +0000)

committer Richard Sandiford <rsandifo@gcc.gnu.org>

Tue, 31 Dec 2019 08:28:24 +0000 (08:28 +0000)
author Richard Sandiford <richard.sandiford@arm.com>
Tue, 31 Dec 2019 08:28:24 +0000 (08:28 +0000)
committer Richard Sandiford <rsandifo@gcc.gnu.org>
Tue, 31 Dec 2019 08:28:24 +0000 (08:28 +0000)
diff --git a/gcc/ChangeLog b/gcc/ChangeLog

index 03e3f80..a75b901 100644 (file)
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,3 +1,12 @@
+2019-12-31  Richard Sandiford  <richard.sandiford@arm.com>
+
+       * tree-vect-loop-manip.c (create_lcssa_for_virtual_phi): Return
+       the incoming virtual operand definition.
+       (vect_do_peeling): When vectorizing an epilogue loop, handle the
+       case in which the main loop has a virtual phi and the epilogue
+       and scalar loops don't.  Restore an earlier comment about the
+       update_ssa call.
+
  2019-12-30  Olivier Hainque  <hainque@adacore.com>
  
         * config/vxworks/stdint.h: New file.  Include _yvals.h
diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog

index 76bcf82..097c61d 100644 (file)
--- a/gcc/testsuite/ChangeLog
+++ b/gcc/testsuite/ChangeLog
@@ -1,3 +1,7 @@
+2019-12-31  Richard Sandiford  <richard.sandiford@arm.com>
+
+       * gcc.dg/vect/vect-epilogues-2.c: New test.
+
  2019-12-30  Olivier Hainque  <hainque@adacore.com>
  
         * gcc.dg/vect/tree-vect.h: #undef OFFSET.
diff --git a/gcc/testsuite/gcc.dg/vect/vect-epilogues-2.c b/gcc/testsuite/gcc.dg/vect/vect-epilogues-2.c

new file mode 100644 (file)

index 0000000..b251e1f
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/vect/vect-epilogues-2.c
@@ -0,0 +1,57 @@
+/* { dg-do compile } */
+
+int
+f1 (int *x, int n)
+{
+  int res = 0;
+  for (int i = 0; i < n; ++i)
+    res += x[i * 2] == 1 ? 2 : 3;
+  return res;
+}
+
+int
+f2 (int *x)
+{
+  int res = 0;
+  for (int i = 0; i < 0x83; ++i)
+    res += x[i * 2] == 1 ? 2 : 3;
+  return res;
+}
+
+int
+f3 (int *x, int n)
+{
+  int res = 0;
+  for (int i = 0; i < n; ++i)
+    res += x[i * 2] == 1 ? 2 : 3;
+  return res + x[0x100];
+}
+
+int
+f4 (int *x)
+{
+  int res = 0;
+  for (int i = 0; i < 0x83; ++i)
+    res += x[i * 2] == 1 ? 2 : 3;
+  return res + x[0x100];
+}
+
+int
+f5 (int *x, int n, int a)
+{
+  int res = 0;
+  for (int i = 0; i < n; ++i)
+    res += x[i * 2] == 1 ? 2 : 3;
+  x[a] += 1;
+  return res;
+}
+
+int
+f6 (int *x, int a)
+{
+  int res = 0;
+  for (int i = 0; i < 0x83; ++i)
+    res += x[i * 2] == 1 ? 2 : 3;
+  x[a] += 1;
+  return res;
+}
diff --git a/gcc/tree-vect-loop-manip.c b/gcc/tree-vect-loop-manip.c

index b4dda97..dd2d943 100644 (file)
--- a/gcc/tree-vect-loop-manip.c
+++ b/gcc/tree-vect-loop-manip.c
@@ -1249,9 +1249,12 @@ slpeel_can_duplicate_loop_p (const class loop *loop, const_edge e)
     the *guard[12] routines, which assume loop closed SSA form for all PHIs
     (but normally loop closed SSA form doesn't require virtual PHIs to be
     in the same form).  Doing this early simplifies the checking what
-   uses should be renamed.  */
+   uses should be renamed.
  
-static void
+   If we create a new phi after the loop, return the definition that
+   applies on entry to the loop, otherwise return null.  */
+
+static tree
  create_lcssa_for_virtual_phi (class loop *loop)
  {
    gphi_iterator gsi;
@@ -1283,10 +1286,12 @@ create_lcssa_for_virtual_phi (class loop *loop)
                   && !flow_bb_inside_loop_p (loop, gimple_bb (stmt)))
                 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
                   SET_USE (use_p, new_vop);
+
+           return PHI_ARG_DEF_FROM_EDGE (phi, loop_preheader_edge (loop));
           }
         break;
        }
-
+  return NULL_TREE;
  }
  
  /* Function vect_get_loop_location.
@@ -2483,9 +2488,42 @@ vect_do_peeling (loop_vec_info loop_vinfo, tree niters, tree nitersm1,
    class loop *prolog, *epilog = NULL, *loop = LOOP_VINFO_LOOP (loop_vinfo);
    class loop *first_loop = loop;
    bool irred_flag = loop_preheader_edge (loop)->flags & EDGE_IRREDUCIBLE_LOOP;
-  create_lcssa_for_virtual_phi (loop);
+
+  /* We might have a queued need to update virtual SSA form.  As we
+     delete the update SSA machinery below after doing a regular
+     incremental SSA update during loop copying make sure we don't
+     lose that fact.
+     ???  Needing to update virtual SSA form by renaming is unfortunate
+     but not all of the vectorizer code inserting new loads / stores
+     properly assigns virtual operands to those statements.  */
    update_ssa (TODO_update_ssa_only_virtuals);
  
+  create_lcssa_for_virtual_phi (loop);
+
+  /* If we're vectorizing an epilogue loop, the update_ssa above will
+     have ensured that the virtual operand is in SSA form throughout the
+     vectorized main loop.  Normally it is possible to trace the updated
+     vector-stmt vdefs back to scalar-stmt vdefs and vector-stmt vuses
+     back to scalar-stmt vuses, meaning that the effect of the SSA update
+     remains local to the main loop.  However, there are rare cases in
+     which the vectorized loop has vdefs even when the original scalar
+     loop didn't.  For example, vectorizing a load with IFN_LOAD_LANES
+     introduces clobbers of the temporary vector array, which in turn
+     needs new vdefs.  If the scalar loop doesn't write to memory, these
+     new vdefs will be the only ones in the vector loop.
+
+     In that case, update_ssa will have added a new virtual phi to the
+     main loop, which previously didn't need one.  Ensure that we (locally)
+     maintain LCSSA form for the virtual operand, just as we would have
+     done if the virtual phi had existed from the outset.  This makes it
+     easier to duplicate the scalar epilogue loop below.  */
+  tree vop_to_rename = NULL_TREE;
+  if (loop_vec_info orig_loop_vinfo = LOOP_VINFO_ORIG_LOOP_INFO (loop_vinfo))
+    {
+      class loop *orig_loop = LOOP_VINFO_LOOP (orig_loop_vinfo);
+      vop_to_rename = create_lcssa_for_virtual_phi (orig_loop);
+    }
+
    if (MAY_HAVE_DEBUG_BIND_STMTS)
      {
        gcc_assert (!adjust_vec.exists ());
@@ -2706,6 +2744,26 @@ vect_do_peeling (loop_vec_info loop_vinfo, tree niters, tree nitersm1,
          as the transformations mentioned above make less or no sense when not
          vectorizing.  */
        epilog = vect_epilogues ? get_loop_copy (loop) : scalar_loop;
+      if (vop_to_rename)
+       {
+         /* Vectorizing the main loop can sometimes introduce a vdef to
+            a loop that previously didn't have one; see the comment above
+            the definition of VOP_TO_RENAME for details.  The definition
+            D that holds on E will then be different from the definition
+            VOP_TO_RENAME that holds during SCALAR_LOOP, so we need to
+            rename VOP_TO_RENAME to D when copying the loop.
+
+            The virtual operand is in LCSSA form for the main loop,
+            and no stmt between the main loop and E needs a vdef,
+            so we know that D is provided by a phi rather than by a
+            vdef on a normal gimple stmt.  */
+         basic_block vdef_bb = e->src;
+         gphi *vphi;
+         while (!(vphi = get_virtual_phi (vdef_bb)))
+           vdef_bb = get_immediate_dominator (CDI_DOMINATORS, vdef_bb);
+         gcc_assert (vop_to_rename != gimple_phi_result (vphi));
+         set_current_def (vop_to_rename, gimple_phi_result (vphi));
+       }
        epilog = slpeel_tree_duplicate_loop_to_edge_cfg (loop, epilog, e);
        if (!epilog)
         {
author	Richard Sandiford <richard.sandiford@arm.com>
	Tue, 31 Dec 2019 08:28:24 +0000 (08:28 +0000)
committer	Richard Sandiford <rsandifo@gcc.gnu.org>
	Tue, 31 Dec 2019 08:28:24 +0000 (08:28 +0000)
gcc/ChangeLog		patch \| blob \| history
gcc/testsuite/ChangeLog		patch \| blob \| history
gcc/testsuite/gcc.dg/vect/vect-epilogues-2.c	[new file with mode: 0644]	patch \| blob
gcc/tree-vect-loop-manip.c		patch \| blob \| history