There are a lot of optimizations in opt_algebraic that match ('ine', a,
0), but there are almost none that match i2b. Instead of adding a huge
pile of additional patterns (including variations that include both ine
and i2b), always lower i2b to a != 0.
At this point in the series, it should be impossible for anything to
generate i2b, so there /should not/ be any changes.
The failing test on d3d12 is a pre-existing bug that is triggered by
this change. I talked to Jesse about it, and, after some analysis, he
suggested just adding it to the list of known failures.
v2: Don't rematerialize i2b instructions in dxil_nir_lower_x2b.
v3: Don't rematerialize i2b instructions in zink_nir_algebraic.py.
v4: Fix zink-on-TGL CI failures by calling nir_opt_algebraic after
nir_lower_doubles makes progress. The latter can generate i2b
instructions, but nir_lower_int64 can't handle them (anymore).
v5: Add back most of the hunk at line 2125 of nir_opt_algebraic.py. I
had accidentally removed the f2b(bf2(x)) optimization.
v6: Just eliminate the i2b instruction.
v7: Remove missed i2b32 in midgard_compile.c. Remove (now unused)
emit_alu_i2orf2_b1 function from sfn_instr_alu.cpp. Previously this
function was still used. :shrug:
No shader-db changes on any Intel platform.
All Intel platforms had similar results. (Ice Lake shown)
Instructions in all programs:
141165875 ->
141165873 (-0.0%)
Instructions helped: 2
Cycles in all programs:
9098956382 ->
9098956350 (-0.0%)
Cycles helped: 2
The two Vulkan shaders are helped because of the "new" (('b2i32',
('ine', ('ubfe', a, b, 1), 0)), ('ubfe', a, b, 1)) algebraic pattern.
Acked-by: Jesse Natalie <jenatali@microsoft.com> [earlier version]
Acked-by: Alyssa Rosenzweig <alyssa.rosenzweig@collabora.com>
Tested-by: Daniel Schürmann <daniel@schuermann.dev> [earlier version]
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/15121>
bld.pseudo(aco_opcode::p_create_vector, Definition(dst), tmp, Operand::zero());
break;
}
- case nir_op_b2b1:
- case nir_op_i2b1: {
+ case nir_op_b2b1: {
Temp src = get_alu_src(ctx, instr->src[0]);
assert(dst.regClass() == bld.lm);
case nir_op_b2i64:
result = emit_b2i(&ctx->ac, src[0], instr->dest.dest.ssa.bit_size);
break;
- case nir_op_i2b1:
case nir_op_b2b1: /* after loads */
result = emit_i2b(&ctx->ac, src[0]);
break;
case nir_op_bit_count:
case nir_op_find_lsb:
case nir_op_ufind_msb:
- case nir_op_i2b1:
return 32;
case nir_op_ilt:
case nir_op_ige:
case nir_op_inot: return agx_xor_to(b, dst, s0, t);
case nir_op_f2b1: return agx_fcmpsel_to(b, dst, s0, f, f, t, AGX_FCOND_EQ);
- case nir_op_i2b1: return agx_icmpsel_to(b, dst, s0, f, f, t, AGX_ICOND_UEQ);
case nir_op_b2b1: return agx_icmpsel_to(b, dst, s0, f, f, t, AGX_ICOND_UEQ);
case nir_op_bcsel:
vir_set_pf(c, vir_SUB_dest(c, nop, src0, src1), V3D_QPU_PF_PUSHC);
break;
- case nir_op_i2b32:
- vir_set_pf(c, vir_MOV_dest(c, nop, src0), V3D_QPU_PF_PUSHZ);
- cond_invert = true;
- break;
-
case nir_op_f2b32:
vir_set_pf(c, vir_FMOV_dest(c, nop, src0), V3D_QPU_PF_PUSHZ);
cond_invert = true;
break;
}
- case nir_op_i2b32:
case nir_op_f2b32:
case nir_op_feq32:
case nir_op_fneu32:
CASE_ALL_SIZES(nir_op_uge)
CASE_ALL_SIZES(nir_op_ieq)
CASE_ALL_SIZES(nir_op_ine)
- case nir_op_i2b1:
- case nir_op_i2b8:
- case nir_op_i2b16:
- case nir_op_i2b32:
case nir_op_f2b1:
case nir_op_f2b8:
case nir_op_f2b16:
bit_size == 16 ? nir_op_f2b16 : nir_op_f2b32;
break;
- case nir_op_i2b1:
- opcode = bit_size == 8 ? nir_op_i2b8 :
- bit_size == 16 ? nir_op_i2b16 : nir_op_i2b32;
- break;
-
case nir_op_b2b1:
/* Since the canonical bit size is the size of the src, it's a no-op */
opcode = nir_op_mov;
case nir_op_b2f32: alu->op = nir_op_mov; break;
case nir_op_b2i32: alu->op = nir_op_mov; break;
case nir_op_f2b1:
- case nir_op_i2b1:
rep = nir_sne(b, nir_ssa_for_alu_src(b, alu, 0),
nir_imm_float(b, 0));
break;
break;
case nir_op_f2b1: alu->op = nir_op_f2b32; break;
- case nir_op_i2b1: alu->op = nir_op_i2b32; break;
case nir_op_b2b32:
case nir_op_b2b1:
}
static nir_ssa_def *
-lower_i2b(nir_builder *b, nir_ssa_def *x)
-{
- return nir_ine(b, nir_ior(b, nir_unpack_64_2x32_split_x(b, x),
- nir_unpack_64_2x32_split_y(b, x)),
- nir_imm_int(b, 0));
-}
-
-static nir_ssa_def *
lower_i2i8(nir_builder *b, nir_ssa_def *x)
{
return nir_i2i8(b, nir_unpack_64_2x32_split_x(b, x));
case nir_op_irem:
return nir_lower_divmod64;
case nir_op_b2i64:
- case nir_op_i2b1:
case nir_op_i2i8:
case nir_op_i2i16:
case nir_op_i2i32:
return lower_irem64(b, src[0], src[1]);
case nir_op_b2i64:
return lower_b2i64(b, src[0]);
- case nir_op_i2b1:
- return lower_i2b(b, src[0]);
case nir_op_i2i8:
return lower_i2i8(b, src[0]);
case nir_op_i2i16:
const nir_shader_compiler_options *options)
{
switch (alu->op) {
- case nir_op_i2b1:
case nir_op_i2i8:
case nir_op_i2i16:
case nir_op_i2i32:
}
case nir_op_f2u32: alu->op = nir_op_ffloor; break;
- case nir_op_i2b1: alu->op = nir_op_f2b1; break;
case nir_op_ilt: alu->op = nir_op_flt; break;
case nir_op_ige: alu->op = nir_op_fge; break;
if src_t == tbool:
dst_types = [tfloat, tint, tbool]
elif src_t == tint:
- dst_types = [tfloat, tint, tbool]
+ dst_types = [tfloat, tint]
elif src_t == tuint:
dst_types = [tfloat, tuint]
elif src_t == tfloat:
return nir_op_mov;
}
+ /* i2b and u2b do not exist. Use ine (via nir_type_conversion) instead */
+ assert((src_base != nir_type_int && src_base != nir_type_uint) ||
+ dst_base != nir_type_bool);
+
switch (src_base) {
% for src_t in ['int', 'uint', 'float', 'bool']:
case nir_type_${src_t}:
% else:
<% dst_t = 'int' %>
% endif
-% elif src_t == 'uint' and dst_t == 'bool':
-<% src_t = 'int' %>
+% elif src_t in ['int', 'uint'] and dst_t == 'bool':
+<% continue %>
% endif
switch (dst_bit_size) {
% for dst_bits in type_sizes(dst_t):
(('bcsel', ('ilt', a, b), b, a), ('imax', a, b)),
(('bcsel', ('ige', a, b), b, a), ('imin', a, b)),
(('bcsel', ('ige', b, a), b, a), ('imax', a, b)),
- (('bcsel', ('i2b', a), b, c), ('bcsel', ('ine', a, 0), b, c)),
(('bcsel', ('inot', a), b, c), ('bcsel', a, c, b)),
(('bcsel', a, ('bcsel', a, b, c), d), ('bcsel', a, b, d)),
(('bcsel', a, b, ('bcsel', a, c, d)), ('bcsel', a, b, d)),
(('fsin', a), lowered_sincos(0.5), 'options->lower_sincos'),
(('fcos', a), lowered_sincos(0.75), 'options->lower_sincos'),
# Boolean simplifications
- (('i2b16(is_used_by_if)', a), ('ine16', a, 0)),
- (('i2b32(is_used_by_if)', a), ('ine32', a, 0)),
- (('i2b1(is_used_by_if)', a), ('ine', a, 0)),
(('ieq', a, True), a),
(('ine(is_not_used_by_if)', a, True), ('inot', a)),
(('ine', a, False), a),
# Conversions
(('f2i', ('ftrunc', a)), ('f2i', a)),
(('f2u', ('ftrunc', a)), ('f2u', a)),
- (('i2b', ('ineg', a)), ('i2b', a)),
- (('i2b', ('iabs', a)), ('i2b', a)),
(('inot', ('f2b1', a)), ('feq', a, 0.0)),
# Conversions from 16 bits to 32 bits and back can always be removed
(('ubfe', a, 0, '#b'), ('iand', a, ('ushr', 0xffffffff, ('ineg', b)))),
- (('b2i32', ('i2b', ('ubfe', a, b, 1))), ('ubfe', a, b, 1)),
- (('b2i32', ('i2b', ('ibfe', a, b, 1))), ('ubfe', a, b, 1)), # ubfe in the replacement is correct
+ (('b2i32', ('ine', ('ubfe', a, b, 1), 0)), ('ubfe', a, b, 1)),
+ (('b2i32', ('ine', ('ibfe', a, b, 1), 0)), ('ubfe', a, b, 1)), # ubfe in the replacement is correct
(('ine', ('ibfe(is_used_once)', a, '#b', '#c'), 0), ('ine', ('iand', a, ('ishl', ('ushr', 0xffffffff, ('ineg', c)), b)), 0)),
(('ieq', ('ibfe(is_used_once)', a, '#b', '#c'), 0), ('ieq', ('iand', a, ('ishl', ('ushr', 0xffffffff, ('ineg', c)), b)), 0)),
(('ine', ('ubfe(is_used_once)', a, '#b', '#c'), 0), ('ine', ('iand', a, ('ishl', ('ushr', 0xffffffff, ('ineg', c)), b)), 0)),
optimizations.append((('inot', ('iand(is_used_once)', (left, a, b), (right, c, d))),
('ior', (invert[left], a, b), (invert[right], c, d))))
-# Optimize x2bN(b2x(x)) -> x
+# Optimize f2bN(b2f(x)) -> x
for size in type_sizes('bool'):
aN = 'a@' + str(size)
f2bN = 'f2b' + str(size)
- i2bN = 'i2b' + str(size)
optimizations.append(((f2bN, ('b2f', aN)), a))
- optimizations.append(((i2bN, ('b2i', aN)), a))
# Optimize x2yN(b2x(x)) -> b2y
for x, y in itertools.product(['f', 'u', 'i'], ['f', 'u', 'i']):
MATCH_ICONV_CASE(i2i)
MATCH_FCONV_CASE(b2f)
MATCH_ICONV_CASE(b2i)
- MATCH_BCONV_CASE(i2b)
MATCH_BCONV_CASE(f2b)
default:
unreachable("Invalid nir_search_op");
MATCH_ICONV_CASE(i2i)
MATCH_FCONV_CASE(b2f)
MATCH_ICONV_CASE(b2i)
- MATCH_BCONV_CASE(i2b)
MATCH_BCONV_CASE(f2b)
default:
return nop;
RET_ICONV_CASE(i2i)
RET_FCONV_CASE(b2f)
RET_ICONV_CASE(b2i)
- RET_BCONV_CASE(i2b)
RET_BCONV_CASE(f2b)
default:
unreachable("Invalid nir_search_op");
CASE(f2b)
CASE(b2f)
CASE(b2i)
- CASE(i2b)
CASE(i2i)
CASE(f2i)
CASE(i2f)
nir_search_op_i2i,
nir_search_op_b2f,
nir_search_op_b2i,
- nir_search_op_i2b,
nir_search_op_f2b,
nir_num_search_ops,
};
dst[0]->cat2.condition = IR3_COND_NE;
break;
- case nir_op_i2b1:
- /* i2b1 will appear when translating from nir_load_ubo or
- * nir_intrinsic_load_ssbo, where any non-zero value is true.
- */
- dst[0] = ir3_CMPS_S(
- b, src[0], 0,
- create_immed_typed(b, 0, type_uint_size(bs[0])), 0);
- dst[0]->cat2.condition = IR3_COND_NE;
- break;
-
case nir_op_b2b1:
/* b2b1 will appear when translating from
*
assign_reg(bld_base, &dest->dest.reg, dest->write_mask, vals);
}
-
-static LLVMValueRef
-int_to_bool32(struct lp_build_nir_context *bld_base,
- uint32_t src_bit_size,
- bool is_unsigned,
- LLVMValueRef val)
-{
- LLVMBuilderRef builder = bld_base->base.gallivm->builder;
- struct lp_build_context *int_bld =
- get_int_bld(bld_base, is_unsigned, src_bit_size);
- LLVMValueRef result = lp_build_compare(bld_base->base.gallivm,
- int_bld->type, PIPE_FUNC_NOTEQUAL,
- val, int_bld->zero);
- if (src_bit_size == 16)
- result = LLVMBuildSExt(builder, result, bld_base->int_bld.vec_type, "");
- else if (src_bit_size == 64)
- result = LLVMBuildTrunc(builder, result, bld_base->int_bld.vec_type, "");
- return result;
-}
-
-
static LLVMValueRef
flt_to_bool32(struct lp_build_nir_context *bld_base,
uint32_t src_bit_size,
case nir_op_ftrunc:
result = lp_build_trunc(get_flt_bld(bld_base, src_bit_size[0]), src[0]);
break;
- case nir_op_i2b32:
- result = int_to_bool32(bld_base, src_bit_size[0], false, src[0]);
- break;
case nir_op_i2f16:
result = LLVMBuildSIToFP(builder, src[0],
bld_base->half_bld.vec_type, "");
ntt_FSNE(c, dst, src[0], ureg_imm1f(c->ureg, 0));
break;
- case nir_op_i2b32:
- if (src_64) {
- ntt_U64SNE(c, dst, src[0], ureg_imm1u(c->ureg, 0));
- } else
- ntt_USNE(c, dst, src[0], ureg_imm1u(c->ureg, 0));
- break;
-
case nir_op_b2i32:
ntt_AND(c, dst, src[0], ureg_imm1u(c->ureg, 1));
break;
spec/arb_tessellation_shader/execution/variable-indexing/tcs-patch-output-array-vec3-index-wr: crash
spec/arb_tessellation_shader/execution/variable-indexing/tcs-patch-output-array-vec4-index-wr: crash
spec/arb_tessellation_shader/execution/variable-indexing/tcs-patch-vec4-index-wr: crash
+spec/arb_tessellation_shader/execution/variable-indexing/tcs-patch-vec4-swiz-index-wr: crash
spec/arb_tessellation_shader/execution/variable-indexing/tes-both-input-array-float-index-rd: crash
spec/arb_tessellation_shader/execution/variable-indexing/tes-both-input-array-vec2-index-rd: crash
spec/arb_tessellation_shader/execution/variable-indexing/tes-both-input-array-vec3-index-rd: crash
summary:
name: results
---- --------
- pass: 17231
+ pass: 17230
fail: 20
- crash: 40
+ crash: 41
skip: 2925
timeout: 0
warn: 25
UOP(b2f32, AND, 0_X_X), /* AND with fui(1.0f) */
UOP(b2i32, AND, 0_X_X), /* AND with 1 */
OPC(f2b32, CMP, 0_X_X, NE), /* != 0.0 */
- UOPC(i2b32, CMP, 0_X_X, NE), /* != 0 */
/* arithmetic */
IOP(iadd, ADD, 0_X_1),
case nir_op_f2b32:
inst.src[1] = etna_immediate_float(0.0f);
break;
- case nir_op_i2b32:
- inst.src[1] = etna_immediate_int(0);
- break;
case nir_op_ineg:
inst.src[0] = etna_immediate_int(0);
src[0].neg = 1;
const nir_alu_instr& alu, EAluOp opcode, int nc, bool all, Shader& shader);
static bool
-emit_alu_i2orf2_b1(const nir_alu_instr& alu, EAluOp opcode, Shader& shader);
-
-static bool
emit_alu_comb_with_zero(const nir_alu_instr& alu, EAluOp opcode, Shader& shader);
static bool
emit_unpack_64_2x32_split(const nir_alu_instr& alu, int comp, Shader& shader);
return emit_alu_op2(*alu, op2_add, shader, op2_opt_neg_src1);
case nir_op_ftrunc:
return emit_alu_op1(*alu, op1_trunc, shader);
- case nir_op_i2b1:
- case nir_op_i2b32:
- return emit_alu_i2orf2_b1(*alu, op2_setne_int, shader);
case nir_op_iadd:
return emit_alu_op2_int(*alu, op2_add_int, shader);
case nir_op_iand:
}
static bool
-emit_alu_i2orf2_b1(const nir_alu_instr& alu, EAluOp opcode, Shader& shader)
-{
- auto& value_factory = shader.value_factory();
- AluInstr *ir = nullptr;
- Pin pin = nir_dest_num_components(alu.dest.dest) == 1 ? pin_free : pin_none;
-
- for (int i = 0; i < 4; ++i) {
- if (alu.dest.write_mask & (1 << i)) {
- ir = new AluInstr(opcode,
- value_factory.dest(alu.dest, i, pin),
- value_factory.src(alu.src[0], i),
- value_factory.zero(),
- AluInstr::write);
- shader.emit_instruction(ir);
- }
- }
- if (ir)
- ir->set_alu_flag(alu_last_instr);
- return true;
-}
-
-static bool
emit_alu_comb_with_zero(const nir_alu_instr& alu, EAluOp opcode, Shader& shader)
{
auto& value_factory = shader.value_factory();
case nir_op_b2i32:
result = qir_AND(c, src[0], qir_uniform_ui(c, 1));
break;
- case nir_op_i2b32:
case nir_op_f2b32:
qir_SF(c, src[0]);
result = qir_MOV(c, qir_SEL(c, QPU_COND_ZC,
nir_src_bit_size(alu->src[0].src),
num_components, 0));
break;
- case nir_op_i2b1:
- assert(nir_op_infos[alu->op].num_inputs == 1);
- result = emit_binop(ctx, SpvOpINotEqual, dest_type, src[0],
- get_ivec_constant(ctx,
- nir_src_bit_size(alu->src[0].src),
- num_components, 0));
- break;
#define BINOP(nir_op, spirv_op) \
lower_b2b = [
(('b2b32', 'a'), ('b2i32', 'a')),
- (('b2b1', 'a'), ('i2b1', 'a')),
+ (('b2b1', 'a'), ('ine', 'a', 0)),
]
def main():
inst = bld.emit(SHADER_OPCODE_RSQ, result, op[0]);
break;
- case nir_op_i2b32:
case nir_op_f2b32: {
uint32_t bit_size = nir_src_bit_size(instr->src[0].src);
if (bit_size == 64) {
/* two-argument instructions can't take 64-bit immediates */
- fs_reg zero;
- fs_reg tmp;
+ fs_reg zero = vgrf(glsl_type::double_type);
+ fs_reg tmp = vgrf(glsl_type::double_type);
- if (instr->op == nir_op_f2b32) {
- zero = vgrf(glsl_type::double_type);
- tmp = vgrf(glsl_type::double_type);
- bld.MOV(zero, setup_imm_df(bld, 0.0));
- } else {
- zero = vgrf(glsl_type::int64_t_type);
- tmp = vgrf(glsl_type::int64_t_type);
- bld.MOV(zero, brw_imm_q(0));
- }
+ bld.MOV(zero, setup_imm_df(bld, 0.0));
/* A SIMD16 execution needs to be split in two instructions, so use
* a vgrf instead of the flag register as dst so instruction splitting
} else {
fs_reg zero;
if (bit_size == 32) {
- zero = instr->op == nir_op_f2b32 ? brw_imm_f(0.0f) : brw_imm_d(0);
+ zero = brw_imm_f(0.0f);
} else {
assert(bit_size == 16);
- zero = instr->op == nir_op_f2b32 ?
- retype(brw_imm_w(0), BRW_REGISTER_TYPE_HF) : brw_imm_w(0);
+ zero = retype(brw_imm_w(0), BRW_REGISTER_TYPE_HF);
}
bld.CMP(result, op[0], zero, BRW_CONDITIONAL_NZ);
}
}
break;
- case nir_op_i2b32:
- emit(CMP(dst, op[0], brw_imm_d(0), BRW_CONDITIONAL_NZ));
- break;
-
case nir_op_unpack_half_2x16_split_x:
case nir_op_unpack_half_2x16_split_y:
case nir_op_pack_half_2x16_split:
lower_x2b = [
(('b2b32', 'a'), ('b2i32', 'a')),
- (('b2b1', 'a'), ('i2b1', 'a')),
- (('i2b1', 'a'), ('ine', a, 0)),
+ (('b2b1', 'a'), ('ine', ('b2i32', a), 0)),
(('f2b1', 'a'), ('fneu', a, 0)),
]
mkOp2(OP_MERGE, TYPE_U64, newDefs[0], loadImm(NULL, 0), tmp);
break;
}
- case nir_op_f2b32:
- case nir_op_i2b32: {
+ case nir_op_f2b32: {
DEFAULT_CHECKS;
LValues &newDefs = convert(&insn->dest);
- Value *src1;
- if (typeSizeof(sTypes[0]) == 8) {
- src1 = loadImm(getSSA(8), 0.0);
- } else {
- src1 = zero;
- }
- CondCode cc = op == nir_op_f2b32 ? CC_NEU : CC_NE;
- mkCmp(OP_SET, cc, TYPE_U32, newDefs[0], sTypes[0], getSrc(&insn->src[0]), src1);
+ mkCmp(OP_SET, CC_NEU, TYPE_U32, newDefs[0], sTypes[0], getSrc(&insn->src[0]), zero);
break;
}
case nir_op_b2i8:
bi_mux_i32_to(b, dst, bi_imm_u32(0), bi_imm_u32(~0), s0, BI_MUX_FP_ZERO);
break;
- case nir_op_i2b8:
- bi_mux_v4i8_to(b, dst, bi_imm_u8(0), bi_imm_u8(~0), s0, BI_MUX_INT_ZERO);
- break;
- case nir_op_i2b16:
- bi_mux_v2i16_to(b, dst, bi_imm_u16(0), bi_imm_u16(~0), s0, BI_MUX_INT_ZERO);
- break;
- case nir_op_i2b32:
- bi_mux_i32_to(b, dst, bi_imm_u32(0), bi_imm_u32(~0), s0, BI_MUX_INT_ZERO);
- break;
-
case nir_op_ieq8:
case nir_op_ine8:
case nir_op_ilt8:
* we can do a "not equal to 0.0" test. */
ALU_CASE_CMP(f2b32, fne);
- ALU_CASE_CMP(i2b32, ine);
ALU_CASE(frcp, frcp);
ALU_CASE(frsq, frsqrt);