aco: don't emit parallelcopy when switching to WQM.

author Daniel Schürmann <daniel@schuermann.dev>

Wed, 12 Aug 2020 12:52:04 +0000 (14:52 +0200)

committer Daniel Schürmann <daniel@schuermann.dev>

Tue, 22 Dec 2020 14:08:40 +0000 (15:08 +0100)
author Daniel Schürmann <daniel@schuermann.dev>
Wed, 12 Aug 2020 12:52:04 +0000 (14:52 +0200)
committer Daniel Schürmann <daniel@schuermann.dev>
Tue, 22 Dec 2020 14:08:40 +0000 (15:08 +0100)
diff --git a/src/amd/compiler/aco_insert_exec_mask.cpp b/src/amd/compiler/aco_insert_exec_mask.cpp
index ff89fbf..1ce9d46 100644
--- a/src/amd/compiler/aco_insert_exec_mask.cpp
+++ b/src/amd/compiler/aco_insert_exec_mask.cpp
@@ -323,14 +323,7 @@ void transition_to_WQM(exec_ctx& ctx, Builder bld, unsigned idx)
        return;
     if (ctx.info[idx].exec.back().second & mask_type_global) {
        Temp exec_mask = ctx.info[idx].exec.back().first;
-      /* TODO: we might generate better code if we pass the uncopied "exec_mask"
-       * directly to the s_wqm (we still need to keep this parallelcopy for
-       * potential later uses of exec_mask though). We currently can't do this
-       * because of a RA bug. */
-      exec_mask = bld.pseudo(aco_opcode::p_parallelcopy, bld.def(bld.lm), bld.exec(exec_mask));
-      ctx.info[idx].exec.back().first = exec_mask;
-
-      exec_mask = bld.sop1(Builder::s_wqm, bld.def(bld.lm, exec), bld.def(s1, scc), exec_mask);
+      exec_mask = bld.sop1(Builder::s_wqm, bld.def(bld.lm, exec), bld.def(s1, scc), bld.exec(exec_mask));
        ctx.info[idx].exec.emplace_back(exec_mask, mask_type_global | mask_type_wqm);
        return;
     }
author	Daniel Schürmann <daniel@schuermann.dev>
	Wed, 12 Aug 2020 12:52:04 +0000 (14:52 +0200)
committer	Daniel Schürmann <daniel@schuermann.dev>
	Tue, 22 Dec 2020 14:08:40 +0000 (15:08 +0100)