freedreno/ir3: no need to count bits 16b at a time for a4xx

author Ilia Mirkin <imirkin@alum.mit.edu>

Fri, 3 Dec 2021 08:04:19 +0000 (03:04 -0500)

committer Marge Bot <emma+marge@anholt.net>

Tue, 8 Mar 2022 01:23:05 +0000 (01:23 +0000)
author Ilia Mirkin <imirkin@alum.mit.edu>
Fri, 3 Dec 2021 08:04:19 +0000 (03:04 -0500)
committer Marge Bot <emma+marge@anholt.net>
Tue, 8 Mar 2022 01:23:05 +0000 (01:23 +0000)
diff --git a/src/freedreno/ir3/ir3_compiler_nir.c b/src/freedreno/ir3/ir3_compiler_nir.c

index c6bd72c..228cfbd 100644 (file)
--- a/src/freedreno/ir3/ir3_compiler_nir.c
+++ b/src/freedreno/ir3/ir3_compiler_nir.c
@@ -769,9 +769,13 @@ emit_alu(struct ir3_context *ctx, nir_alu_instr *alu)
        break;
     }
     case nir_op_bit_count: {
-      // TODO, we need to do this 16b at a time on a5xx+a6xx.. need to
-      // double check on earlier gen's.  Once half-precision support is
-      // in place, this should probably move to a NIR lowering pass:
+      if (ctx->compiler->gen < 5) {
+         dst[0] = ir3_CBITS_B(b, src[0], 0);
+         break;
+      }
+
+      // We need to do this 16b at a time on a5xx+a6xx.  Once half-precision
+      // support is in place, this should probably move to a NIR lowering pass:
        struct ir3_instruction *hi, *lo;
  
        hi = ir3_COV(b, ir3_SHR_B(b, src[0], 0, create_immed(b, 16), 0), TYPE_U32,
author	Ilia Mirkin <imirkin@alum.mit.edu>
	Fri, 3 Dec 2021 08:04:19 +0000 (03:04 -0500)
committer	Marge Bot <emma+marge@anholt.net>
	Tue, 8 Mar 2022 01:23:05 +0000 (01:23 +0000)