intel/compiler/gfx12.5+: Lower 64-bit cluster_broadcast with 32-bit ops

author Jordan Justen <jordan.l.justen@intel.com>

Wed, 19 Apr 2023 00:11:41 +0000 (20:11 -0400)

committer Jordan Justen <jordan.l.justen@intel.com>

Thu, 20 Apr 2023 18:41:10 +0000 (11:41 -0700)
author Jordan Justen <jordan.l.justen@intel.com>
Wed, 19 Apr 2023 00:11:41 +0000 (20:11 -0400)
committer Jordan Justen <jordan.l.justen@intel.com>
Thu, 20 Apr 2023 18:41:10 +0000 (11:41 -0700)
diff --git a/src/intel/compiler/brw_fs_lower_regioning.cpp b/src/intel/compiler/brw_fs_lower_regioning.cpp

index a30d183..a86e092 100644 (file)
--- a/src/intel/compiler/brw_fs_lower_regioning.cpp
+++ b/src/intel/compiler/brw_fs_lower_regioning.cpp
@@ -174,10 +174,17 @@ namespace {
            *    integer DWord multiply, indirect addressing must not be
            *    used."
            *
+          * MTL (verx10 == 125) supports float64 but not int64, so a 64-bit
+          * cluster broadcast has to be lowered to 32-bit integer ops there.
+          *
+          * For gfx12.5+ platforms that support int64, the register regions
+          * used by cluster broadcast aren't supported by the 64-bit pipeline.
+          *
            * Work around the above and handle platforms that don't
            * support 64-bit types at all.
            */
-         if ((!has_64bit || devinfo->platform == INTEL_PLATFORM_CHV ||
+         if ((!has_64bit || devinfo->verx10 >= 125 ||
+              devinfo->platform == INTEL_PLATFORM_CHV ||
                intel_device_info_is_9lp(devinfo)) && type_sz(t) > 4)
              return BRW_REGISTER_TYPE_UD;
           else
author	Jordan Justen <jordan.l.justen@intel.com>
	Wed, 19 Apr 2023 00:11:41 +0000 (20:11 -0400)
committer	Jordan Justen <jordan.l.justen@intel.com>
	Thu, 20 Apr 2023 18:41:10 +0000 (11:41 -0700)