glsl: Retire ldexp lowering in favor of the nir lowering flag.

author Emma Anholt <emma@anholt.net>

Wed, 22 Mar 2023 20:20:03 +0000 (13:20 -0700)

committer Marge Bot <emma+marge@anholt.net>

Thu, 6 Apr 2023 02:32:00 +0000 (02:32 +0000)
author Emma Anholt <emma@anholt.net>
Wed, 22 Mar 2023 20:20:03 +0000 (13:20 -0700)
committer Marge Bot <emma+marge@anholt.net>
Thu, 6 Apr 2023 02:32:00 +0000 (02:32 +0000)
diff --git a/docs/gallium/screen.rst b/docs/gallium/screen.rst

index a7ab998..8714b98 100644 (file)
--- a/docs/gallium/screen.rst
+++ b/docs/gallium/screen.rst
@@ -752,7 +752,6 @@ support different features.
    is supported. If it is, DTRUNC/DCEIL/DFLR/DROUND opcodes may be used.
  * ``PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED``: Whether DFRACEXP and
    DLDEXP are supported.
-* ``PIPE_SHADER_CAP_LDEXP_SUPPORTED``: Whether LDEXP is supported.
  * ``PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE``: Whether the driver doesn't
    ignore tgsi_declaration_range::Last for shader inputs and outputs.
  * ``PIPE_SHADER_CAP_MAX_SHADER_BUFFERS``: Maximum number of memory buffers
diff --git a/src/asahi/compiler/agx_compile.h b/src/asahi/compiler/agx_compile.h

index 397eef1..7d977f7 100644 (file)
--- a/src/asahi/compiler/agx_compile.h
+++ b/src/asahi/compiler/agx_compile.h
@@ -185,6 +185,7 @@ static const nir_shader_compiler_options agx_nir_options = {
     .lower_iabs = true,
     .lower_fdph = true,
     .lower_ffract = true,
+   .lower_ldexp = true,
     .lower_pack_half_2x16 = true,
     .lower_pack_64_2x32 = true,
     .lower_unpack_half_2x16 = true,
diff --git a/src/compiler/glsl/ir_optimization.h b/src/compiler/glsl/ir_optimization.h

index f895f1c..abea3bd 100644 (file)
--- a/src/compiler/glsl/ir_optimization.h
+++ b/src/compiler/glsl/ir_optimization.h
@@ -59,7 +59,7 @@ bool do_tree_grafting(exec_list *instructions);
  bool do_vec_index_to_cond_assign(exec_list *instructions);
  bool lower_discard(exec_list *instructions);
  void lower_discard_flow(exec_list *instructions);
-bool lower_instructions(exec_list *instructions, bool have_ldexp,
+bool lower_instructions(exec_list *instructions,
                          bool have_dfrexp, bool have_dround,
                          bool have_gpu_shader5);
  bool lower_clip_cull_distance(struct gl_shader_program *prog,
diff --git a/src/compiler/glsl/lower_instructions.cpp b/src/compiler/glsl/lower_instructions.cpp

index 7e47dfc..18a229d 100644 (file)
--- a/src/compiler/glsl/lower_instructions.cpp
+++ b/src/compiler/glsl/lower_instructions.cpp
@@ -30,13 +30,8 @@
   * rather than in each driver backend.
   *
   * Currently supported transformations:
- * - LDEXP_TO_ARITH
   * - DOPS_TO_DFRAC
   *
- * LDEXP_TO_ARITH:
- * -------------
- * Converts ir_binop_ldexp to arithmetic and bit operations for float sources.
- *
   * DFREXP_DLDEXP_TO_ARITH:
   * ---------------
   * Converts ir_binop_ldexp, ir_unop_frexp_sig, and ir_unop_frexp_exp to
@@ -57,7 +52,6 @@
  #include <math.h>
  
  /* Operations for lower_instructions() */
-#define LDEXP_TO_ARITH     0x80
  #define DOPS_TO_DFRAC      0x800
  #define DFREXP_DLDEXP_TO_ARITH    0x1000
  #define FIND_LSB_TO_FLOAT_CAST    0x20000
@@ -80,7 +74,6 @@ public:
  private:
     unsigned lower; /** Bitfield of which operations to lower */
  
-   void ldexp_to_arith(ir_expression *);
     void dldexp_to_arith(ir_expression *);
     void dfrexp_sig_to_arith(ir_expression *);
     void dfrexp_exp_to_arith(ir_expression *);
@@ -111,11 +104,10 @@ private:
  #define lowering(x) (this->lower & x)
  
  bool
-lower_instructions(exec_list *instructions, bool have_ldexp, bool have_dfrexp,
+lower_instructions(exec_list *instructions, bool have_dfrexp,
                     bool have_dround, bool have_gpu_shader5)
  {
     unsigned what_to_lower =
-      (have_ldexp ? 0 : LDEXP_TO_ARITH) |
        (have_dfrexp ? 0 : DFREXP_DLDEXP_TO_ARITH) |
        (have_dround ? 0 : DOPS_TO_DFRAC) |
        /* Assume that if ARB_gpu_shader5 is not supported then all of the
@@ -133,170 +125,6 @@ lower_instructions(exec_list *instructions, bool have_ldexp, bool have_dfrexp,
  }
  
  void
-lower_instructions_visitor::ldexp_to_arith(ir_expression *ir)
-{
-   /* Translates
-    *    ir_binop_ldexp x exp
-    * into
-    *
-    *    extracted_biased_exp = rshift(bitcast_f2i(abs(x)), exp_shift);
-    *    resulting_biased_exp = min(extracted_biased_exp + exp, 255);
-    *
-    *    if (extracted_biased_exp >= 255)
-    *       return x; // +/-inf, NaN
-    *
-    *    sign_mantissa = bitcast_f2u(x) & sign_mantissa_mask;
-    *
-    *    if (min(resulting_biased_exp, extracted_biased_exp) < 1)
-    *       resulting_biased_exp = 0;
-    *    if (resulting_biased_exp >= 255 ||
-    *        min(resulting_biased_exp, extracted_biased_exp) < 1) {
-    *       sign_mantissa &= sign_mask;
-    *    }
-    *
-    *    return bitcast_u2f(sign_mantissa |
-    *                       lshift(i2u(resulting_biased_exp), exp_shift));
-    *
-    * which we can't actually implement as such, since the GLSL IR doesn't
-    * have vectorized if-statements. We actually implement it without branches
-    * using conditional-select:
-    *
-    *    extracted_biased_exp = rshift(bitcast_f2i(abs(x)), exp_shift);
-    *    resulting_biased_exp = min(extracted_biased_exp + exp, 255);
-    *
-    *    sign_mantissa = bitcast_f2u(x) & sign_mantissa_mask;
-    *
-    *    flush_to_zero = lequal(min(resulting_biased_exp, extracted_biased_exp), 0);
-    *    resulting_biased_exp = csel(flush_to_zero, 0, resulting_biased_exp)
-    *    zero_mantissa = logic_or(flush_to_zero,
-    *                             gequal(resulting_biased_exp, 255));
-    *    sign_mantissa = csel(zero_mantissa, sign_mantissa & sign_mask, sign_mantissa);
-    *
-    *    result = sign_mantissa |
-    *             lshift(i2u(resulting_biased_exp), exp_shift));
-    *
-    *    return csel(extracted_biased_exp >= 255, x, bitcast_u2f(result));
-    *
-    * The definition of ldexp in the GLSL spec says:
-    *
-    *    "If this product is too large to be represented in the
-    *     floating-point type, the result is undefined."
-    *
-    * However, the definition of ldexp in the GLSL ES spec does not contain
-    * this sentence, so we do need to handle overflow correctly.
-    *
-    * There is additional language limiting the defined range of exp, but this
-    * is merely to allow implementations that store 2^exp in a temporary
-    * variable.
-    */
-
-   const unsigned vec_elem = ir->type->vector_elements;
-
-   /* Types */
-   const glsl_type *ivec = glsl_type::get_instance(GLSL_TYPE_INT, vec_elem, 1);
-   const glsl_type *uvec = glsl_type::get_instance(GLSL_TYPE_UINT, vec_elem, 1);
-   const glsl_type *bvec = glsl_type::get_instance(GLSL_TYPE_BOOL, vec_elem, 1);
-
-   /* Temporary variables */
-   ir_variable *x = new(ir) ir_variable(ir->type, "x", ir_var_temporary);
-   ir_variable *exp = new(ir) ir_variable(ivec, "exp", ir_var_temporary);
-   ir_variable *result = new(ir) ir_variable(uvec, "result", ir_var_temporary);
-
-   ir_variable *extracted_biased_exp =
-      new(ir) ir_variable(ivec, "extracted_biased_exp", ir_var_temporary);
-   ir_variable *resulting_biased_exp =
-      new(ir) ir_variable(ivec, "resulting_biased_exp", ir_var_temporary);
-
-   ir_variable *sign_mantissa =
-      new(ir) ir_variable(uvec, "sign_mantissa", ir_var_temporary);
-
-   ir_variable *flush_to_zero =
-      new(ir) ir_variable(bvec, "flush_to_zero", ir_var_temporary);
-   ir_variable *zero_mantissa =
-      new(ir) ir_variable(bvec, "zero_mantissa", ir_var_temporary);
-
-   ir_instruction &i = *base_ir;
-
-   /* Copy <x> and <exp> arguments. */
-   i.insert_before(x);
-   i.insert_before(assign(x, ir->operands[0]));
-   i.insert_before(exp);
-   i.insert_before(assign(exp, ir->operands[1]));
-
-   /* Extract the biased exponent from <x>. */
-   i.insert_before(extracted_biased_exp);
-   i.insert_before(assign(extracted_biased_exp,
-                          rshift(bitcast_f2i(abs(x)),
-                                 new(ir) ir_constant(23, vec_elem))));
-
-   /* The definition of ldexp in the GLSL 4.60 spec says:
-    *
-    *    "If exp is greater than +128 (single-precision) or +1024
-    *     (double-precision), the value returned is undefined. If exp is less
-    *     than -126 (single-precision) or -1022 (double-precision), the value
-    *     returned may be flushed to zero."
-    *
-    * So we do not have to guard against the possibility of addition overflow,
-    * which could happen when exp is close to INT_MAX. Addition underflow
-    * cannot happen (the worst case is 0 + (-INT_MAX)).
-    */
-   i.insert_before(resulting_biased_exp);
-   i.insert_before(assign(resulting_biased_exp,
-                          min2(add(extracted_biased_exp, exp),
-                               new(ir) ir_constant(255, vec_elem))));
-
-   i.insert_before(sign_mantissa);
-   i.insert_before(assign(sign_mantissa,
-                          bit_and(bitcast_f2u(x),
-                                  new(ir) ir_constant(0x807fffffu, vec_elem))));
-
-   /* We flush to zero if the original or resulting biased exponent is 0,
-    * indicating a +/-0.0 or subnormal input or output.
-    *
-    * The mantissa is set to 0 if the resulting biased exponent is 255, since
-    * an overflow should produce a +/-inf result.
-    *
-    * Note that NaN inputs are handled separately.
-    */
-   i.insert_before(flush_to_zero);
-   i.insert_before(assign(flush_to_zero,
-                          lequal(min2(resulting_biased_exp,
-                                      extracted_biased_exp),
-                                 ir_constant::zero(ir, ivec))));
-   i.insert_before(assign(resulting_biased_exp,
-                          csel(flush_to_zero,
-                               ir_constant::zero(ir, ivec),
-                               resulting_biased_exp)));
-
-   i.insert_before(zero_mantissa);
-   i.insert_before(assign(zero_mantissa,
-                          logic_or(flush_to_zero,
-                                   equal(resulting_biased_exp,
-                                         new(ir) ir_constant(255, vec_elem)))));
-   i.insert_before(assign(sign_mantissa,
-                          csel(zero_mantissa,
-                               bit_and(sign_mantissa,
-                                       new(ir) ir_constant(0x80000000u, vec_elem)),
-                               sign_mantissa)));
-
-   i.insert_before(result);
-   i.insert_before(assign(result,
-                          bitfield_insert(sign_mantissa,
-                                          i2u(resulting_biased_exp),
-                                          new(ir) ir_constant(23u, vec_elem),
-                                          new(ir) ir_constant(8u, vec_elem))));
-
-   ir->operation = ir_triop_csel;
-   ir->init_num_operands();
-   ir->operands[0] = gequal(extracted_biased_exp,
-                            new(ir) ir_constant(255, vec_elem));
-   ir->operands[1] = new(ir) ir_dereference_variable(x);
-   ir->operands[2] = bitcast_u2f(result);
-
-   this->progress = true;
-}
-
-void
  lower_instructions_visitor::dldexp_to_arith(ir_expression *ir)
  {
     /* See ldexp_to_arith for structure. Uses frexp_exp to extract the exponent
@@ -1100,8 +928,6 @@ lower_instructions_visitor::visit_leave(ir_expression *ir)
        break;
  
     case ir_binop_ldexp:
-      if (lowering(LDEXP_TO_ARITH) && ir->type->is_float())
-         ldexp_to_arith(ir);
        if (lowering(DFREXP_DLDEXP_TO_ARITH) && ir->type->is_double())
           dldexp_to_arith(ir);
        break;
diff --git a/src/compiler/glsl/test_optpass.cpp b/src/compiler/glsl/test_optpass.cpp

index fc289ae..ea2e260 100644 (file)
--- a/src/compiler/glsl/test_optpass.cpp
+++ b/src/compiler/glsl/test_optpass.cpp
@@ -93,7 +93,7 @@ do_optimization(struct exec_list *ir, const char *optimization,
        return lower_discard(ir);
     } else if (sscanf(optimization, "lower_instructions ( %d ) ",
                       &int_0) == 1) {
-      return lower_instructions(ir, false, false, false, false);
+      return lower_instructions(ir, false, false, false);
     } else {
        printf("Unrecognized optimization %s\n", optimization);
        exit(EXIT_FAILURE);
diff --git a/src/gallium/auxiliary/gallivm/lp_bld_limits.h b/src/gallium/auxiliary/gallivm/lp_bld_limits.h

index b0b854a..4acd9e9 100644 (file)
--- a/src/gallium/auxiliary/gallivm/lp_bld_limits.h
+++ b/src/gallium/auxiliary/gallivm/lp_bld_limits.h
@@ -151,7 +151,6 @@ gallivm_get_shader_param(enum pipe_shader_cap param)
        return 1;
     case PIPE_SHADER_CAP_DROUND_SUPPORTED:
     case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
     case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
        return 0;
diff --git a/src/gallium/auxiliary/tgsi/tgsi_exec.h b/src/gallium/auxiliary/tgsi/tgsi_exec.h

index 9604d73..72ffe47 100644 (file)
--- a/src/gallium/auxiliary/tgsi/tgsi_exec.h
+++ b/src/gallium/auxiliary/tgsi/tgsi_exec.h
@@ -483,7 +483,6 @@ tgsi_exec_get_shader_param(enum pipe_shader_cap param)
     case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
        return 1;
     case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
        return 1;
     case PIPE_SHADER_CAP_DROUND_SUPPORTED:
diff --git a/src/gallium/drivers/asahi/agx_pipe.c b/src/gallium/drivers/asahi/agx_pipe.c

index 1426ed3..ea4296f 100644 (file)
--- a/src/gallium/drivers/asahi/agx_pipe.c
+++ b/src/gallium/drivers/asahi/agx_pipe.c
@@ -1591,7 +1591,6 @@ agx_get_shader_param(struct pipe_screen *pscreen, enum pipe_shader_type shader,
     case PIPE_SHADER_CAP_INT64_ATOMICS:
     case PIPE_SHADER_CAP_DROUND_SUPPORTED:
     case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
        return 0;
  
diff --git a/src/gallium/drivers/crocus/crocus_screen.c b/src/gallium/drivers/crocus/crocus_screen.c

index 434e857..0e59773 100644 (file)
--- a/src/gallium/drivers/crocus/crocus_screen.c
+++ b/src/gallium/drivers/crocus/crocus_screen.c
@@ -522,7 +522,6 @@ crocus_get_shader_param(struct pipe_screen *pscreen,
     case PIPE_SHADER_CAP_SUPPORTED_IRS:
        return 1 << PIPE_SHADER_IR_NIR;
     case PIPE_SHADER_CAP_DROUND_SUPPORTED:
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
        return 1;
     case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
diff --git a/src/gallium/drivers/d3d12/d3d12_screen.cpp b/src/gallium/drivers/d3d12/d3d12_screen.cpp

index 665df77..b7623d3 100644 (file)
--- a/src/gallium/drivers/d3d12/d3d12_screen.cpp
+++ b/src/gallium/drivers/d3d12/d3d12_screen.cpp
@@ -496,7 +496,6 @@ d3d12_get_shader_param(struct pipe_screen *pscreen,
            screen->opts.ResourceBindingTier >= D3D12_RESOURCE_BINDING_TIER_3) ?
           PIPE_MAX_SHADER_IMAGES : D3D12_PS_CS_UAV_REGISTER_COUNT;
  
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
     case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
     case PIPE_SHADER_CAP_CONT_SUPPORTED:
diff --git a/src/gallium/drivers/etnaviv/etnaviv_compiler.c b/src/gallium/drivers/etnaviv/etnaviv_compiler.c

index 0e26795..a182b2e 100644 (file)
--- a/src/gallium/drivers/etnaviv/etnaviv_compiler.c
+++ b/src/gallium/drivers/etnaviv/etnaviv_compiler.c
@@ -44,6 +44,7 @@ etna_compiler_create(const char *renderer, const struct etna_specs *specs)
        .fuse_ffma64 = true,
        .lower_uadd_carry = true,
        .lower_usub_borrow = true,
+      .lower_ldexp = true,
        .lower_mul_high = true,
        .lower_bitops = true,
        .lower_all_io_to_temps = true,
diff --git a/src/gallium/drivers/etnaviv/etnaviv_screen.c b/src/gallium/drivers/etnaviv/etnaviv_screen.c

index c811f08..1b402aa 100644 (file)
--- a/src/gallium/drivers/etnaviv/etnaviv_screen.c
+++ b/src/gallium/drivers/etnaviv/etnaviv_screen.c
@@ -418,7 +418,6 @@ etna_screen_get_shader_param(struct pipe_screen *pscreen,
                  : screen->specs.max_vs_uniforms * sizeof(float[4]);
     case PIPE_SHADER_CAP_DROUND_SUPPORTED:
     case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
        return false;
     case PIPE_SHADER_CAP_SUPPORTED_IRS:
diff --git a/src/gallium/drivers/freedreno/freedreno_screen.c b/src/gallium/drivers/freedreno/freedreno_screen.c

index e6b1cb3..984c803 100644 (file)
--- a/src/gallium/drivers/freedreno/freedreno_screen.c
+++ b/src/gallium/drivers/freedreno/freedreno_screen.c
@@ -686,7 +686,6 @@ fd_screen_get_shader_param(struct pipe_screen *pscreen,
     case PIPE_SHADER_CAP_SUBROUTINES:
     case PIPE_SHADER_CAP_DROUND_SUPPORTED:
     case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
     case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
     case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
diff --git a/src/gallium/drivers/i915/i915_screen.c b/src/gallium/drivers/i915/i915_screen.c

index 1240da0..80a425b 100644 (file)
--- a/src/gallium/drivers/i915/i915_screen.c
+++ b/src/gallium/drivers/i915/i915_screen.c
@@ -366,7 +366,6 @@ i915_get_shader_param(struct pipe_screen *screen, enum pipe_shader_type shader,
           return I915_TEX_UNITS;
        case PIPE_SHADER_CAP_DROUND_SUPPORTED:
        case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-      case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
        case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
        case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
        case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
diff --git a/src/gallium/drivers/iris/iris_screen.c b/src/gallium/drivers/iris/iris_screen.c

index 3b81089..c71e857 100644 (file)
--- a/src/gallium/drivers/iris/iris_screen.c
+++ b/src/gallium/drivers/iris/iris_screen.c
@@ -549,7 +549,6 @@ iris_get_shader_param(struct pipe_screen *pscreen,
        return irs;
     }
     case PIPE_SHADER_CAP_DROUND_SUPPORTED:
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
        return 1;
     case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
diff --git a/src/gallium/drivers/nouveau/nv30/nv30_screen.c b/src/gallium/drivers/nouveau/nv30/nv30_screen.c

index 09b707d..7134f04 100644 (file)
--- a/src/gallium/drivers/nouveau/nv30/nv30_screen.c
+++ b/src/gallium/drivers/nouveau/nv30/nv30_screen.c
@@ -365,7 +365,6 @@ nv30_screen_get_shader_param(struct pipe_screen *pscreen,
        case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
        case PIPE_SHADER_CAP_DROUND_SUPPORTED:
        case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-      case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
        case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
        case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
        case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
@@ -418,7 +417,6 @@ nv30_screen_get_shader_param(struct pipe_screen *pscreen,
        case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
        case PIPE_SHADER_CAP_DROUND_SUPPORTED:
        case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-      case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
        case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
        case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
        case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
diff --git a/src/gallium/drivers/nouveau/nv50/nv50_screen.c b/src/gallium/drivers/nouveau/nv50/nv50_screen.c

index 028b763..6151883 100644 (file)
--- a/src/gallium/drivers/nouveau/nv50/nv50_screen.c
+++ b/src/gallium/drivers/nouveau/nv50/nv50_screen.c
@@ -517,7 +517,6 @@ nv50_screen_get_shader_param(struct pipe_screen *pscreen,
        return (1 << PIPE_SHADER_IR_TGSI) | (1 << PIPE_SHADER_IR_NIR);
     case PIPE_SHADER_CAP_DROUND_SUPPORTED:
     case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
     case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
     case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
diff --git a/src/gallium/drivers/nouveau/nvc0/nvc0_screen.c b/src/gallium/drivers/nouveau/nvc0/nvc0_screen.c

index d3f5339..b301326 100644 (file)
--- a/src/gallium/drivers/nouveau/nvc0/nvc0_screen.c
+++ b/src/gallium/drivers/nouveau/nvc0/nvc0_screen.c
@@ -539,7 +539,6 @@ nvc0_screen_get_shader_param(struct pipe_screen *pscreen,
     case PIPE_SHADER_CAP_DROUND_SUPPORTED:
        return 1;
     case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
     case PIPE_SHADER_CAP_INT64_ATOMICS:
     case PIPE_SHADER_CAP_FP16:
diff --git a/src/gallium/drivers/panfrost/pan_screen.c b/src/gallium/drivers/panfrost/pan_screen.c

index 9f3a1cb..bfcca51 100644 (file)
--- a/src/gallium/drivers/panfrost/pan_screen.c
+++ b/src/gallium/drivers/panfrost/pan_screen.c
@@ -459,7 +459,6 @@ panfrost_get_shader_param(struct pipe_screen *screen,
     case PIPE_SHADER_CAP_INT64_ATOMICS:
     case PIPE_SHADER_CAP_DROUND_SUPPORTED:
     case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
        return 0;
  
diff --git a/src/gallium/drivers/r300/r300_screen.c b/src/gallium/drivers/r300/r300_screen.c

index 82e5e7e..e0653ba 100644 (file)
--- a/src/gallium/drivers/r300/r300_screen.c
+++ b/src/gallium/drivers/r300/r300_screen.c
@@ -312,7 +312,6 @@ static int r300_get_shader_param(struct pipe_screen *pscreen,
          case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
          case PIPE_SHADER_CAP_DROUND_SUPPORTED:
          case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-        case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
          case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
          case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
          case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
@@ -403,7 +402,6 @@ static int r300_get_shader_param(struct pipe_screen *pscreen,
          case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
          case PIPE_SHADER_CAP_DROUND_SUPPORTED:
          case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-        case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
          case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
          case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
          case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
diff --git a/src/gallium/drivers/r600/r600_pipe.c b/src/gallium/drivers/r600/r600_pipe.c

index b404ecf..29e590b 100644 (file)
--- a/src/gallium/drivers/r600/r600_pipe.c
+++ b/src/gallium/drivers/r600/r600_pipe.c
@@ -638,7 +638,6 @@ static int r600_get_shader_param(struct pipe_screen* pscreen,
         }
         case PIPE_SHADER_CAP_DROUND_SUPPORTED:
         case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-       case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
                 return 0;
         case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
         case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
diff --git a/src/gallium/drivers/r600/r600_pipe_common.c b/src/gallium/drivers/r600/r600_pipe_common.c

index 4eb2ac7..e5762c7 100644 (file)
--- a/src/gallium/drivers/r600/r600_pipe_common.c
+++ b/src/gallium/drivers/r600/r600_pipe_common.c
@@ -1348,6 +1348,7 @@ bool r600_common_screen_init(struct r600_common_screen *rscreen,
                 .lower_extract_word = true,
                 .lower_insert_byte = true,
                 .lower_insert_word = true,
+               .lower_ldexp = true,
                 .lower_rotate = true,
                 /* due to a bug in the shader compiler, some loops hang
                  * if they are not unrolled, see:
diff --git a/src/gallium/drivers/radeonsi/si_get.c b/src/gallium/drivers/radeonsi/si_get.c

index 26f36bb..e7bd4d4 100644 (file)
--- a/src/gallium/drivers/radeonsi/si_get.c
+++ b/src/gallium/drivers/radeonsi/si_get.c
@@ -498,7 +498,6 @@ static int si_get_shader_param(struct pipe_screen *pscreen, enum pipe_shader_typ
     case PIPE_SHADER_CAP_INT64_ATOMICS:
     case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
     case PIPE_SHADER_CAP_DROUND_SUPPORTED:
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
     case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR: /* lowered in finalize_nir */
     case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR: /* lowered in finalize_nir */
diff --git a/src/gallium/drivers/svga/svga_screen.c b/src/gallium/drivers/svga/svga_screen.c

index eac5475..b50e84f 100644 (file)
--- a/src/gallium/drivers/svga/svga_screen.c
+++ b/src/gallium/drivers/svga/svga_screen.c
@@ -537,7 +537,6 @@ vgpu9_get_shader_param(struct pipe_screen *screen,
           return (1 << PIPE_SHADER_IR_TGSI) | (svgascreen->debug.nir ? (1 << PIPE_SHADER_IR_NIR) : 0);
        case PIPE_SHADER_CAP_DROUND_SUPPORTED:
        case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-      case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
        case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
        case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
        case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
@@ -603,7 +602,6 @@ vgpu9_get_shader_param(struct pipe_screen *screen,
           return (1 << PIPE_SHADER_IR_TGSI) | (svgascreen->debug.nir ? (1 << PIPE_SHADER_IR_NIR) : 0);
        case PIPE_SHADER_CAP_DROUND_SUPPORTED:
        case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-      case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
        case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
        case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
        case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
@@ -714,7 +712,6 @@ vgpu10_get_shader_param(struct pipe_screen *screen,
           return 0;
     case PIPE_SHADER_CAP_DROUND_SUPPORTED:
     case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
        /* For the above cases, we rely on the GLSL compiler to translate/lower
         * the TGIS instruction into other instructions we do support.
         */
@@ -748,6 +745,7 @@ vgpu10_get_shader_param(struct pipe_screen *screen,
     .lower_int64_options = nir_lower_imul_2x32_64,                             \
     .lower_fdph = true,                                                        \
     .lower_flrp64 = true,                                                      \
+   .lower_ldexp = true,                                                       \
     .lower_rotate = true,                                                      \
     .lower_uniforms_to_ubo = true,                                             \
     .lower_vector_cmp = true,                                                  \
diff --git a/src/gallium/drivers/svga/svga_tgsi_vgpu10.c b/src/gallium/drivers/svga/svga_tgsi_vgpu10.c

index cf22757..7a462cd 100644 (file)
--- a/src/gallium/drivers/svga/svga_tgsi_vgpu10.c
+++ b/src/gallium/drivers/svga/svga_tgsi_vgpu10.c
@@ -11116,8 +11116,7 @@ emit_instruction(struct svga_shader_emitter_v10 *emit,
        return emit_dtrunc(emit, inst);
  
     /* The following opcodes should never be seen here.  We return zero
-    * for all the PIPE_CAP_TGSI_DROUND_SUPPORTED, DFRACEXP_DLDEXP_SUPPORTED,
-    * LDEXP_SUPPORTED queries.
+    * for all the PIPE_CAP_TGSI_DROUND_SUPPORTED, DFRACEXP_DLDEXP_SUPPORTED queries.
      */
     case TGSI_OPCODE_LDEXP:
     case TGSI_OPCODE_DSSG:
diff --git a/src/gallium/drivers/v3d/v3d_screen.c b/src/gallium/drivers/v3d/v3d_screen.c

index 3ca1674..916c6ff 100644 (file)
--- a/src/gallium/drivers/v3d/v3d_screen.c
+++ b/src/gallium/drivers/v3d/v3d_screen.c
@@ -432,7 +432,6 @@ v3d_screen_get_shader_param(struct pipe_screen *pscreen, enum pipe_shader_type s
          case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
          case PIPE_SHADER_CAP_DROUND_SUPPORTED:
          case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-        case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
          case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
          case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
          case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
diff --git a/src/gallium/drivers/vc4/vc4_program.c b/src/gallium/drivers/vc4/vc4_program.c

index 0f2e92a..2a35af6 100644 (file)
--- a/src/gallium/drivers/vc4/vc4_program.c
+++ b/src/gallium/drivers/vc4/vc4_program.c
@@ -2183,6 +2183,7 @@ static const nir_shader_compiler_options nir_options = {
          .lower_ldexp = true,
          .lower_fneg = true,
          .lower_ineg = true,
+        .lower_ldexp = true,
          .lower_rotate = true,
          .lower_to_scalar = true,
          .lower_umax = true,
diff --git a/src/gallium/drivers/vc4/vc4_screen.c b/src/gallium/drivers/vc4/vc4_screen.c

index 448391f..5b7ae10 100644 (file)
--- a/src/gallium/drivers/vc4/vc4_screen.c
+++ b/src/gallium/drivers/vc4/vc4_screen.c
@@ -295,7 +295,6 @@ vc4_screen_get_shader_param(struct pipe_screen *pscreen,
          case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
          case PIPE_SHADER_CAP_DROUND_SUPPORTED:
          case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
-        case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
          case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
                  return 0;
          case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
diff --git a/src/gallium/drivers/virgl/virgl_screen.c b/src/gallium/drivers/virgl/virgl_screen.c

index 87aedd9..ff04d40 100644 (file)
--- a/src/gallium/drivers/virgl/virgl_screen.c
+++ b/src/gallium/drivers/virgl/virgl_screen.c
@@ -1195,6 +1195,7 @@ virgl_create_screen(struct virgl_winsys *vws, const struct pipe_screen_config *c
     }
     screen->compiler_options.lower_ffma32 = true;
     screen->compiler_options.fuse_ffma32 = false;
+   screen->compiler_options.lower_ldexp = true;
     screen->compiler_options.lower_image_offset_to_range_base = true;
     screen->compiler_options.lower_atomic_offset_to_range_base = true;
  
diff --git a/src/gallium/drivers/zink/zink_screen.c b/src/gallium/drivers/zink/zink_screen.c

index 39f08ee..eeed588 100644 (file)
--- a/src/gallium/drivers/zink/zink_screen.c
+++ b/src/gallium/drivers/zink/zink_screen.c
@@ -1242,9 +1242,6 @@ zink_get_shader_param(struct pipe_screen *pscreen,
                       ZINK_MAX_SHADER_IMAGES);
        return 0;
  
-   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
-      return 1;
-
     case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
     case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
        return 0; /* not implemented */
diff --git a/src/gallium/include/pipe/p_defines.h b/src/gallium/include/pipe/p_defines.h

index b122cc5..90f72a5 100644 (file)
--- a/src/gallium/include/pipe/p_defines.h
+++ b/src/gallium/include/pipe/p_defines.h
@@ -1121,7 +1121,6 @@ enum pipe_shader_cap
     PIPE_SHADER_CAP_MAX_SHADER_BUFFERS,
     PIPE_SHADER_CAP_SUPPORTED_IRS,
     PIPE_SHADER_CAP_MAX_SHADER_IMAGES,
-   PIPE_SHADER_CAP_LDEXP_SUPPORTED,
     PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS,
     PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS,
  };
diff --git a/src/mesa/state_tracker/st_glsl_to_ir.cpp b/src/mesa/state_tracker/st_glsl_to_ir.cpp

index 3d56410..457cc14 100644 (file)
--- a/src/mesa/state_tracker/st_glsl_to_ir.cpp
+++ b/src/mesa/state_tracker/st_glsl_to_ir.cpp
@@ -66,8 +66,6 @@ link_shader(struct gl_context *ctx, struct gl_shader_program *prog)
                                                     PIPE_SHADER_CAP_DROUND_SUPPORTED);
        bool have_dfrexp = pscreen->get_shader_param(pscreen, ptarget,
                                                     PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED);
-      bool have_ldexp = pscreen->get_shader_param(pscreen, ptarget,
-                                                  PIPE_SHADER_CAP_LDEXP_SUPPORTED);
  
        if (!pscreen->get_param(pscreen, PIPE_CAP_INT64_DIVMOD))
           lower_64bit_integer_instructions(ir, DIV64 | MOD64);
@@ -81,7 +79,7 @@ link_shader(struct gl_context *ctx, struct gl_shader_program *prog)
           lower_blend_equation_advanced(
              shader, ctx->Extensions.KHR_blend_equation_advanced_coherent);
  
-      lower_instructions(ir, have_ldexp, have_dfrexp, have_dround,
+      lower_instructions(ir, have_dfrexp, have_dround,
                           ctx->Extensions.ARB_gpu_shader5);
  
        do_vec_index_to_cond_assign(ir);
diff --git a/src/panfrost/midgard/midgard_compile.h b/src/panfrost/midgard/midgard_compile.h

index d2a1cd0..e2fb10b 100644 (file)
--- a/src/panfrost/midgard/midgard_compile.h
+++ b/src/panfrost/midgard/midgard_compile.h
@@ -71,6 +71,7 @@ static const nir_shader_compiler_options midgard_nir_options = {
     .lower_extract_word = true,
     .lower_insert_byte = true,
     .lower_insert_word = true,
+   .lower_ldexp = true,
     .lower_rotate = true,
  
     .lower_pack_half_2x16 = true,
author	Emma Anholt <emma@anholt.net>
	Wed, 22 Mar 2023 20:20:03 +0000 (13:20 -0700)
committer	Marge Bot <emma+marge@anholt.net>
	Thu, 6 Apr 2023 02:32:00 +0000 (02:32 +0000)
docs/gallium/screen.rst		patch \| blob \| history
src/asahi/compiler/agx_compile.h		patch \| blob \| history
src/compiler/glsl/ir_optimization.h		patch \| blob \| history
src/compiler/glsl/lower_instructions.cpp		patch \| blob \| history
src/compiler/glsl/test_optpass.cpp		patch \| blob \| history
src/gallium/auxiliary/gallivm/lp_bld_limits.h		patch \| blob \| history
src/gallium/auxiliary/tgsi/tgsi_exec.h		patch \| blob \| history
src/gallium/drivers/asahi/agx_pipe.c		patch \| blob \| history
src/gallium/drivers/crocus/crocus_screen.c		patch \| blob \| history
src/gallium/drivers/d3d12/d3d12_screen.cpp		patch \| blob \| history
src/gallium/drivers/etnaviv/etnaviv_compiler.c		patch \| blob \| history
src/gallium/drivers/etnaviv/etnaviv_screen.c		patch \| blob \| history
src/gallium/drivers/freedreno/freedreno_screen.c		patch \| blob \| history
src/gallium/drivers/i915/i915_screen.c		patch \| blob \| history
src/gallium/drivers/iris/iris_screen.c		patch \| blob \| history
src/gallium/drivers/nouveau/nv30/nv30_screen.c		patch \| blob \| history
src/gallium/drivers/nouveau/nv50/nv50_screen.c		patch \| blob \| history
src/gallium/drivers/nouveau/nvc0/nvc0_screen.c		patch \| blob \| history
src/gallium/drivers/panfrost/pan_screen.c		patch \| blob \| history
src/gallium/drivers/r300/r300_screen.c		patch \| blob \| history
src/gallium/drivers/r600/r600_pipe.c		patch \| blob \| history
src/gallium/drivers/r600/r600_pipe_common.c		patch \| blob \| history
src/gallium/drivers/radeonsi/si_get.c		patch \| blob \| history
src/gallium/drivers/svga/svga_screen.c		patch \| blob \| history
src/gallium/drivers/svga/svga_tgsi_vgpu10.c		patch \| blob \| history
src/gallium/drivers/v3d/v3d_screen.c		patch \| blob \| history
src/gallium/drivers/vc4/vc4_program.c		patch \| blob \| history
src/gallium/drivers/vc4/vc4_screen.c		patch \| blob \| history
src/gallium/drivers/virgl/virgl_screen.c		patch \| blob \| history
src/gallium/drivers/zink/zink_screen.c		patch \| blob \| history
src/gallium/include/pipe/p_defines.h		patch \| blob \| history
src/mesa/state_tracker/st_glsl_to_ir.cpp		patch \| blob \| history
src/panfrost/midgard/midgard_compile.h		patch \| blob \| history