aco: propagate SGPRs into VOP1 instructions early.

author Daniel Schürmann <daniel@schuermann.dev>

Thu, 17 Sep 2020 23:00:38 +0000 (00:00 +0100)

committer Marge Bot <eric+marge@anholt.net>

Wed, 14 Oct 2020 15:31:38 +0000 (15:31 +0000)
author Daniel Schürmann <daniel@schuermann.dev>
Thu, 17 Sep 2020 23:00:38 +0000 (00:00 +0100)
committer Marge Bot <eric+marge@anholt.net>
Wed, 14 Oct 2020 15:31:38 +0000 (15:31 +0000)
diff --git a/src/amd/compiler/aco_optimizer.cpp b/src/amd/compiler/aco_optimizer.cpp

index a2640bd..1b8674a 100644 (file)
--- a/src/amd/compiler/aco_optimizer.cpp
+++ b/src/amd/compiler/aco_optimizer.cpp
@@ -877,6 +877,11 @@ void label_instruction(opt_ctx &ctx, Block& block, aco_ptr<Instruction>& instr)
              instr->operands[i].setTemp(info.temp);
              info = ctx.info[info.temp.id()];
           }
+         /* applying SGPRs to VOP1 doesn't increase code size and DCE is helped by doing it earlier */
+         if (info.is_temp() && info.temp.type() == RegType::sgpr && can_apply_sgprs(instr) && instr->operands.size() == 1) {
+            instr->operands[i].setTemp(info.temp);
+            info = ctx.info[info.temp.id()];
+         }
  
           /* for instructions other than v_cndmask_b32, the size of the instruction should match the operand size */
           unsigned can_use_mod = instr->opcode != aco_opcode::v_cndmask_b32 || instr->operands[i].getTemp().bytes() == 4;
author	Daniel Schürmann <daniel@schuermann.dev>
	Thu, 17 Sep 2020 23:00:38 +0000 (00:00 +0100)
committer	Marge Bot <eric+marge@anholt.net>
	Wed, 14 Oct 2020 15:31:38 +0000 (15:31 +0000)