aco: Don't allow any VALU instruction to write m0.
authorTimur Kristóf <timur.kristof@gmail.com>
Sat, 6 May 2023 15:03:22 +0000 (17:03 +0200)
committerMarge Bot <emma+marge@anholt.net>
Wed, 10 May 2023 12:41:25 +0000 (12:41 +0000)
Fixes: d5398b62da1913e7224c826da0dbd5fa88436f18
Signed-off-by: Timur Kristóf <timur.kristof@gmail.com>
Reviewed-by: Georg Lehmann <dadschoorse@gmail.com>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/22885>

src/amd/compiler/aco_ir.cpp
src/amd/compiler/aco_ir.h
src/amd/compiler/aco_register_allocation.cpp

index 03f6931..6c9e64f 100644 (file)
@@ -480,22 +480,23 @@ can_use_opsel(amd_gfx_level gfx_level, aco_opcode op, int idx)
 }
 
 bool
-can_write_m0(amd_gfx_level gfx_level, const aco_ptr<Instruction>& instr)
+can_write_m0(const aco_ptr<Instruction>& instr)
 {
    if (instr->isSALU())
       return true;
 
+   /* VALU can't write m0 on any GPU generations. */
    if (instr->isVALU())
-      return gfx_level >= GFX9;
+      return false;
 
    switch (instr->opcode) {
    case aco_opcode::p_parallelcopy:
    case aco_opcode::p_extract:
    case aco_opcode::p_insert:
+      /* These pseudo instructions are implemented with SALU when writing m0. */
       return true;
-   case aco_opcode::p_reload:
-      return gfx_level >= GFX9;
    default:
+      /* Assume that no other instructions can write m0. */
       return false;
    }
 }
index a39e949..528e0c3 100644 (file)
@@ -1804,7 +1804,7 @@ bool instr_is_16bit(amd_gfx_level gfx_level, aco_opcode op);
 uint8_t get_gfx11_true16_mask(aco_opcode op);
 bool can_use_SDWA(amd_gfx_level gfx_level, const aco_ptr<Instruction>& instr, bool pre_ra);
 bool can_use_DPP(const aco_ptr<Instruction>& instr, bool pre_ra, bool dpp8);
-bool can_write_m0(amd_gfx_level gfx_level, const aco_ptr<Instruction>& instr);
+bool can_write_m0(const aco_ptr<Instruction>& instr);
 /* updates "instr" and returns the old instruction (or NULL if no update was needed) */
 aco_ptr<Instruction> convert_to_SDWA(amd_gfx_level gfx_level, aco_ptr<Instruction>& instr);
 aco_ptr<Instruction> convert_to_DPP(aco_ptr<Instruction>& instr, bool dpp8);
index fba6e1c..0b36010 100644 (file)
@@ -1656,7 +1656,7 @@ get_reg(ra_ctx& ctx, RegisterFile& reg_file, Temp temp,
    }
    if (ctx.assignments[temp.id()].m0) {
       if (get_reg_specified(ctx, reg_file, temp.regClass(), instr, m0) &&
-          can_write_m0(ctx.program->gfx_level, instr))
+          can_write_m0(instr))
          return m0;
    }