r600/sfn: tie in 64 lowering code

author Gert Wollny <gert.wollny@collabora.com>

Sat, 28 Nov 2020 15:37:09 +0000 (16:37 +0100)

committer Marge Bot <eric+marge@anholt.net>

Tue, 12 Jan 2021 19:29:40 +0000 (19:29 +0000)
author Gert Wollny <gert.wollny@collabora.com>
Sat, 28 Nov 2020 15:37:09 +0000 (16:37 +0100)
committer Marge Bot <eric+marge@anholt.net>
Tue, 12 Jan 2021 19:29:40 +0000 (19:29 +0000)
diff --git a/src/gallium/drivers/r600/sfn/sfn_nir.cpp b/src/gallium/drivers/r600/sfn/sfn_nir.cpp

index 5c950da..8379dc8 100644 (file)
--- a/src/gallium/drivers/r600/sfn/sfn_nir.cpp
+++ b/src/gallium/drivers/r600/sfn/sfn_nir.cpp
@@ -844,6 +844,7 @@ static bool
  optimize_once(nir_shader *shader, bool vectorize)
  {
     bool progress = false;
+   NIR_PASS(progress, shader, nir_lower_vars_to_ssa);
     NIR_PASS(progress, shader, nir_copy_prop);
     NIR_PASS(progress, shader, nir_opt_dce);
     NIR_PASS(progress, shader, nir_opt_algebraic);
@@ -885,6 +886,35 @@ bool has_saturate(const nir_function *func)
     return false;
  }
  
+bool r600_lower_to_scalar_instr_filter(const nir_instr *instr, const void *)
+{
+   if (instr->type != nir_instr_type_alu)
+      return true;
+
+   auto alu = nir_instr_as_alu(instr);
+   switch (alu->op) {
+   case nir_op_bany_fnequal3:
+   case nir_op_bany_fnequal4:
+   case nir_op_ball_fequal3:
+   case nir_op_ball_fequal4:
+   case nir_op_bany_inequal3:
+   case nir_op_bany_inequal4:
+   case nir_op_ball_iequal3:
+   case nir_op_ball_iequal4:
+   case nir_op_fdot2:
+   case nir_op_fdot3:
+   case nir_op_fdot4:
+      return false;
+   case nir_op_bany_fnequal2:
+   case nir_op_ball_fequal2:
+   case nir_op_bany_inequal2:
+   case nir_op_ball_iequal2:
+      return nir_src_bit_size(alu->src[0].src) != 64;
+   default:
+      return true;
+   }
+}
+
  int r600_shader_from_nir(struct r600_context *rctx,
                           struct r600_pipe_shader *pipeshader,
                           r600_shader_key *key)
@@ -892,6 +922,10 @@ int r600_shader_from_nir(struct r600_context *rctx,
     char filename[4000];
     struct r600_pipe_shader_selector *sel = pipeshader->selector;
  
+   bool lower_64bit = ((sel->nir->options->lower_int64_options ||
+                        sel->nir->options->lower_doubles_options) &&
+                       (sel->nir->info.bit_sizes_float | sel->nir->info.bit_sizes_int) & 64);
+
     r600::ShaderFromNir convert;
  
     if (rctx->screen->b.debug_flags & DBG_PREOPT_IR) {
@@ -906,6 +940,12 @@ int r600_shader_from_nir(struct r600_context *rctx,
     NIR_PASS_V(sel->nir, nir_lower_regs_to_ssa);
     NIR_PASS_V(sel->nir, nir_lower_phis_to_scalar);
  
+   if (lower_64bit)
+      NIR_PASS_V(sel->nir, nir_lower_int64);
+   while(optimize_once(sel->nir, false));
+
+   NIR_PASS_V(sel->nir, nir_lower_alu_to_scalar, r600_lower_to_scalar_instr_filter, NULL);
+
     NIR_PASS_V(sel->nir, r600_lower_shared_io);
     NIR_PASS_V(sel->nir, r600_nir_lower_atomics);
  
@@ -928,9 +968,23 @@ int r600_shader_from_nir(struct r600_context *rctx,
     NIR_PASS_V(sel->nir, nir_lower_io, io_modes, r600_glsl_type_size,
                   nir_lower_io_lower_64bit_to_32);
  
+   /**/
+   if (lower_64bit)
+      NIR_PASS_V(sel->nir, nir_lower_indirect_derefs, nir_var_function_temp, 10);
+
     NIR_PASS_V(sel->nir, nir_opt_constant_folding);
     NIR_PASS_V(sel->nir, nir_io_add_const_offset_to_base, io_modes);
  
+   NIR_PASS_V(sel->nir, nir_lower_alu_to_scalar, r600_lower_to_scalar_instr_filter, NULL);
+   NIR_PASS_V(sel->nir, nir_lower_phis_to_scalar);
+   if (lower_64bit)
+      NIR_PASS_V(sel->nir, r600::r600_nir_split_64bit_io);
+   NIR_PASS_V(sel->nir, nir_lower_alu_to_scalar, r600_lower_to_scalar_instr_filter, NULL);
+   NIR_PASS_V(sel->nir, nir_lower_phis_to_scalar);
+   NIR_PASS_V(sel->nir, nir_lower_alu_to_scalar, r600_lower_to_scalar_instr_filter, NULL);
+   NIR_PASS_V(sel->nir, nir_copy_prop);
+   NIR_PASS_V(sel->nir, nir_opt_dce);
+
     if (sel->nir->info.stage == MESA_SHADER_VERTEX)
        NIR_PASS_V(sel->nir, r600_vectorize_vs_inputs);
  
@@ -952,11 +1006,14 @@ int r600_shader_from_nir(struct r600_context *rctx,
                   (pipe_prim_type)key->tcs.prim_mode);
  
     NIR_PASS_V(sel->nir, nir_lower_ubo_vec4);
+   if (lower_64bit)
+      NIR_PASS_V(sel->nir, r600::r600_nir_64_to_vec2);
  
     /* Lower to scalar to let some optimization work out better */
-   NIR_PASS_V(sel->nir, nir_lower_alu_to_scalar, NULL, NULL);
     while(optimize_once(sel->nir, false));
  
+   NIR_PASS_V(sel->nir, r600::r600_merge_vec2_stores);
+
     NIR_PASS_V(sel->nir, nir_remove_dead_variables, nir_var_shader_in, NULL);
     NIR_PASS_V(sel->nir, nir_remove_dead_variables,  nir_var_shader_out, NULL);
  
diff --git a/src/gallium/drivers/r600/sfn/sfn_shader_base.cpp b/src/gallium/drivers/r600/sfn/sfn_shader_base.cpp

index 12d4487..e33884a 100644 (file)
--- a/src/gallium/drivers/r600/sfn/sfn_shader_base.cpp
+++ b/src/gallium/drivers/r600/sfn/sfn_shader_base.cpp
@@ -978,8 +978,7 @@ bool ShaderFromNirProcessor::load_uniform(nir_intrinsic_instr* instr)
  
     if (literal) {
        AluInstruction *ir = nullptr;
-
-      for (int i = 0; i < instr->num_components ; ++i) {
+      for (unsigned i = 0; i < nir_dest_num_components(instr->dest); ++i) {
           PValue u = PValue(new UniformValue(512 + literal->u32 + base, i));
           sfn_log << SfnLog::io << "uniform "
                   << instr->dest.ssa.index << " const["<< i << "]: "<< instr->const_index[i] << "\n";
author	Gert Wollny <gert.wollny@collabora.com>
	Sat, 28 Nov 2020 15:37:09 +0000 (16:37 +0100)
committer	Marge Bot <eric+marge@anholt.net>
	Tue, 12 Jan 2021 19:29:40 +0000 (19:29 +0000)
src/gallium/drivers/r600/sfn/sfn_nir.cpp		patch \| blob \| history
src/gallium/drivers/r600/sfn/sfn_shader_base.cpp		patch \| blob \| history