drm/i915/dg2: Add initial gt/ctx/engine workarounds
authorMatt Roper <matthew.d.roper@intel.com>
Tue, 2 Nov 2021 22:25:10 +0000 (15:25 -0700)
committerMatt Roper <matthew.d.roper@intel.com>
Thu, 11 Nov 2021 19:09:10 +0000 (11:09 -0800)
Bspec: 54077,68173,54833
Cc: Anusha Srivatsa <anusha.srivatsa@intel.com>
Signed-off-by: Matt Roper <matthew.d.roper@intel.com>
Reviewed-by: Anusha Srivatsa <anusha.srivatsa@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20211102222511.534310-3-matthew.d.roper@intel.com
drivers/gpu/drm/i915/gt/intel_workarounds.c
drivers/gpu/drm/i915/i915_reg.h
drivers/gpu/drm/i915/intel_pm.c

index 4aaa210..37fd541 100644 (file)
@@ -644,6 +644,42 @@ static void dg1_ctx_workarounds_init(struct intel_engine_cs *engine,
                     DG1_HZ_READ_SUPPRESSION_OPTIMIZATION_DISABLE);
 }
 
+static void dg2_ctx_workarounds_init(struct intel_engine_cs *engine,
+                                    struct i915_wa_list *wal)
+{
+       gen12_ctx_gt_tuning_init(engine, wal);
+
+       /* Wa_16011186671:dg2_g11 */
+       if (IS_DG2_GRAPHICS_STEP(engine->i915, G11, STEP_A0, STEP_B0)) {
+               wa_masked_dis(wal, VFLSKPD, DIS_MULT_MISS_RD_SQUASH);
+               wa_masked_en(wal, VFLSKPD, DIS_OVER_FETCH_CACHE);
+       }
+
+       if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0, STEP_B0)) {
+               /* Wa_14010469329:dg2_g10 */
+               wa_masked_en(wal, GEN11_COMMON_SLICE_CHICKEN3,
+                            XEHP_DUAL_SIMD8_SEQ_MERGE_DISABLE);
+
+               /*
+                * Wa_22010465075:dg2_g10
+                * Wa_22010613112:dg2_g10
+                * Wa_14010698770:dg2_g10
+                */
+               wa_masked_en(wal, GEN11_COMMON_SLICE_CHICKEN3,
+                            GEN12_DISABLE_CPS_AWARE_COLOR_PIPE);
+       }
+
+       /* Wa_16013271637:dg2 */
+       wa_masked_en(wal, SLICE_COMMON_ECO_CHICKEN1,
+                    MSC_MSAA_REODER_BUF_BYPASS_DISABLE);
+
+       /* Wa_22012532006:dg2 */
+       if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0, STEP_C0) ||
+           IS_DG2_GRAPHICS_STEP(engine->i915, G11, STEP_A0, STEP_B0))
+               wa_masked_en(wal, GEN9_HALF_SLICE_CHICKEN7,
+                            DG2_DISABLE_ROUND_ENABLE_ALLOW_FOR_SSLA);
+}
+
 static void fakewa_disable_nestedbb_mode(struct intel_engine_cs *engine,
                                         struct i915_wa_list *wal)
 {
@@ -730,7 +766,9 @@ __intel_engine_init_ctx_wa(struct intel_engine_cs *engine,
        if (engine->class != RENDER_CLASS)
                goto done;
 
-       if (IS_XEHPSDV(i915))
+       if (IS_DG2(i915))
+               dg2_ctx_workarounds_init(engine, wal);
+       else if (IS_XEHPSDV(i915))
                ; /* noop; none at this time */
        else if (IS_DG1(i915))
                dg1_ctx_workarounds_init(engine, wal);
@@ -1344,11 +1382,116 @@ xehpsdv_gt_workarounds_init(struct intel_gt *gt, struct i915_wa_list *wal)
 }
 
 static void
+dg2_gt_workarounds_init(struct intel_gt *gt, struct i915_wa_list *wal)
+{
+       struct intel_engine_cs *engine;
+       int id;
+
+       xehp_init_mcr(gt, wal);
+
+       /* Wa_14011060649:dg2 */
+       wa_14011060649(gt, wal);
+
+       /*
+        * Although there are per-engine instances of these registers,
+        * they technically exist outside the engine itself and are not
+        * impacted by engine resets.  Furthermore, they're part of the
+        * GuC blacklist so trying to treat them as engine workarounds
+        * will result in GuC initialization failure and a wedged GPU.
+        */
+       for_each_engine(engine, gt, id) {
+               if (engine->class != VIDEO_DECODE_CLASS)
+                       continue;
+
+               /* Wa_16010515920:dg2_g10 */
+               if (IS_DG2_GRAPHICS_STEP(gt->i915, G10, STEP_A0, STEP_B0))
+                       wa_write_or(wal, VDBOX_CGCTL3F18(engine->mmio_base),
+                                   ALNUNIT_CLKGATE_DIS);
+       }
+
+       if (IS_DG2_G10(gt->i915)) {
+               /* Wa_22010523718:dg2 */
+               wa_write_or(wal, UNSLICE_UNIT_LEVEL_CLKGATE,
+                           CG3DDISCFEG_CLKGATE_DIS);
+
+               /* Wa_14011006942:dg2 */
+               wa_write_or(wal, SUBSLICE_UNIT_LEVEL_CLKGATE,
+                           DSS_ROUTER_CLKGATE_DIS);
+       }
+
+       if (IS_DG2_GRAPHICS_STEP(gt->i915, G10, STEP_A0, STEP_B0)) {
+               /* Wa_14010680813:dg2_g10 */
+               wa_write_or(wal, GEN12_GAMSTLB_CTRL, CONTROL_BLOCK_CLKGATE_DIS |
+                           EGRESS_BLOCK_CLKGATE_DIS | TAG_BLOCK_CLKGATE_DIS);
+
+               /* Wa_14010948348:dg2_g10 */
+               wa_write_or(wal, UNSLCGCTL9430, MSQDUNIT_CLKGATE_DIS);
+
+               /* Wa_14011037102:dg2_g10 */
+               wa_write_or(wal, UNSLCGCTL9444, LTCDD_CLKGATE_DIS);
+
+               /* Wa_14011371254:dg2_g10 */
+               wa_write_or(wal, SLICE_UNIT_LEVEL_CLKGATE, NODEDSS_CLKGATE_DIS);
+
+               /* Wa_14011431319:dg2_g10 */
+               wa_write_or(wal, UNSLCGCTL9440, GAMTLBOACS_CLKGATE_DIS |
+                           GAMTLBVDBOX7_CLKGATE_DIS |
+                           GAMTLBVDBOX6_CLKGATE_DIS |
+                           GAMTLBVDBOX5_CLKGATE_DIS |
+                           GAMTLBVDBOX4_CLKGATE_DIS |
+                           GAMTLBVDBOX3_CLKGATE_DIS |
+                           GAMTLBVDBOX2_CLKGATE_DIS |
+                           GAMTLBVDBOX1_CLKGATE_DIS |
+                           GAMTLBVDBOX0_CLKGATE_DIS |
+                           GAMTLBKCR_CLKGATE_DIS |
+                           GAMTLBGUC_CLKGATE_DIS |
+                           GAMTLBBLT_CLKGATE_DIS);
+               wa_write_or(wal, UNSLCGCTL9444, GAMTLBGFXA0_CLKGATE_DIS |
+                           GAMTLBGFXA1_CLKGATE_DIS |
+                           GAMTLBCOMPA0_CLKGATE_DIS |
+                           GAMTLBCOMPA1_CLKGATE_DIS |
+                           GAMTLBCOMPB0_CLKGATE_DIS |
+                           GAMTLBCOMPB1_CLKGATE_DIS |
+                           GAMTLBCOMPC0_CLKGATE_DIS |
+                           GAMTLBCOMPC1_CLKGATE_DIS |
+                           GAMTLBCOMPD0_CLKGATE_DIS |
+                           GAMTLBCOMPD1_CLKGATE_DIS |
+                           GAMTLBMERT_CLKGATE_DIS   |
+                           GAMTLBVEBOX3_CLKGATE_DIS |
+                           GAMTLBVEBOX2_CLKGATE_DIS |
+                           GAMTLBVEBOX1_CLKGATE_DIS |
+                           GAMTLBVEBOX0_CLKGATE_DIS);
+
+               /* Wa_14010569222:dg2_g10 */
+               wa_write_or(wal, UNSLICE_UNIT_LEVEL_CLKGATE,
+                           GAMEDIA_CLKGATE_DIS);
+
+               /* Wa_14011028019:dg2_g10 */
+               wa_write_or(wal, SSMCGCTL9530, RTFUNIT_CLKGATE_DIS);
+       }
+
+       if (IS_DG2_GRAPHICS_STEP(gt->i915, G10, STEP_A0, STEP_B0) ||
+           IS_DG2_GRAPHICS_STEP(gt->i915, G11, STEP_A0, STEP_B0)) {
+               /* Wa_14012362059:dg2 */
+               wa_write_or(wal, GEN12_MERT_MOD_CTRL, FORCE_MISS_FTLB);
+       }
+
+       /* Wa_1509235366:dg2 */
+       wa_write_or(wal, GEN12_GAMCNTRL_CTRL, INVALIDATION_BROADCAST_MODE_DIS |
+                   GLOBAL_INVALIDATION_MODE);
+
+       /* Wa_14014830051:dg2 */
+       wa_write_clr(wal, SARB_CHICKEN1, COMP_CKN_IN);
+}
+
+static void
 gt_init_workarounds(struct intel_gt *gt, struct i915_wa_list *wal)
 {
        struct drm_i915_private *i915 = gt->i915;
 
-       if (IS_XEHPSDV(i915))
+       if (IS_DG2(i915))
+               dg2_gt_workarounds_init(gt, wal);
+       else if (IS_XEHPSDV(i915))
                xehpsdv_gt_workarounds_init(gt, wal);
        else if (IS_DG1(i915))
                dg1_gt_workarounds_init(gt, wal);
@@ -1739,6 +1882,34 @@ static void xehpsdv_whitelist_build(struct intel_engine_cs *engine)
        allow_read_ctx_timestamp(engine);
 }
 
+static void dg2_whitelist_build(struct intel_engine_cs *engine)
+{
+       struct i915_wa_list *w = &engine->whitelist;
+
+       allow_read_ctx_timestamp(engine);
+
+       switch (engine->class) {
+       case RENDER_CLASS:
+               /*
+                * Wa_1507100340:dg2_g10
+                *
+                * This covers 4 registers which are next to one another :
+                *   - PS_INVOCATION_COUNT
+                *   - PS_INVOCATION_COUNT_UDW
+                *   - PS_DEPTH_COUNT
+                *   - PS_DEPTH_COUNT_UDW
+                */
+               if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0, STEP_B0))
+                       whitelist_reg_ext(w, PS_INVOCATION_COUNT,
+                                         RING_FORCE_TO_NONPRIV_ACCESS_RD |
+                                         RING_FORCE_TO_NONPRIV_RANGE_4);
+
+               break;
+       default:
+               break;
+       }
+}
+
 void intel_engine_init_whitelist(struct intel_engine_cs *engine)
 {
        struct drm_i915_private *i915 = engine->i915;
@@ -1746,7 +1917,9 @@ void intel_engine_init_whitelist(struct intel_engine_cs *engine)
 
        wa_init_start(w, "whitelist", engine->name);
 
-       if (IS_XEHPSDV(i915))
+       if (IS_DG2(i915))
+               dg2_whitelist_build(engine);
+       else if (IS_XEHPSDV(i915))
                xehpsdv_whitelist_build(engine);
        else if (IS_DG1(i915))
                dg1_whitelist_build(engine);
@@ -1826,6 +1999,105 @@ static void
 rcs_engine_wa_init(struct intel_engine_cs *engine, struct i915_wa_list *wal)
 {
        struct drm_i915_private *i915 = engine->i915;
+       u64 dss_mask = intel_sseu_get_subslices(&engine->gt->info.sseu, 0);
+
+       if (IS_DG2_GRAPHICS_STEP(engine->i915, G11, STEP_A0, STEP_B0)) {
+               /* Wa_14013392000:dg2_g11 */
+               wa_masked_en(wal, GEN7_ROW_CHICKEN2, GEN12_ENABLE_LARGE_GRF_MODE);
+
+               /* Wa_16011620976:dg2_g11 */
+               wa_write_or(wal, LSC_CHICKEN_BIT_0_UDW, DIS_CHAIN_2XSIMD8);
+       }
+
+       if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0, STEP_B0) ||
+           IS_DG2_GRAPHICS_STEP(engine->i915, G11, STEP_A0, STEP_B0)) {
+               /* Wa_14012419201:dg2 */
+               wa_masked_en(wal, GEN9_ROW_CHICKEN4,
+                            GEN12_DISABLE_HDR_PAST_PAYLOAD_HOLD_FIX);
+       }
+
+       if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_B0, STEP_C0) ||
+           IS_DG2_G11(engine->i915)) {
+               /*
+                * Wa_22012826095:dg2
+                * Wa_22013059131:dg2
+                */
+               wa_write_clr_set(wal, LSC_CHICKEN_BIT_0_UDW,
+                                MAXREQS_PER_BANK,
+                                REG_FIELD_PREP(MAXREQS_PER_BANK, 2));
+
+               /* Wa_22013059131:dg2 */
+               wa_write_or(wal, LSC_CHICKEN_BIT_0,
+                           FORCE_1_SUB_MESSAGE_PER_FRAGMENT);
+       }
+
+       /* Wa_1308578152:dg2_g10 when first gslice is fused off */
+       if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_B0, STEP_C0) &&
+           (dss_mask & GENMASK(GEN_DSS_PER_GSLICE - 1, 0)) == 0) {
+               wa_masked_dis(wal, GEN12_CS_DEBUG_MODE1_CCCSUNIT_BE_COMMON,
+                             GEN12_REPLAY_MODE_GRANULARITY);
+       }
+
+       if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_B0, STEP_FOREVER) ||
+           IS_DG2_G11(engine->i915)) {
+               /* Wa_22013037850:dg2 */
+               wa_write_or(wal, LSC_CHICKEN_BIT_0_UDW,
+                           DISABLE_128B_EVICTION_COMMAND_UDW);
+
+               /* Wa_22012856258:dg2 */
+               wa_masked_en(wal, GEN7_ROW_CHICKEN2,
+                            GEN12_DISABLE_READ_SUPPRESSION);
+
+               /*
+                * Wa_22010960976:dg2
+                * Wa_14013347512:dg2
+                */
+               wa_masked_dis(wal, GEN12_HDC_CHICKEN0,
+                             LSC_L1_FLUSH_CTL_3D_DATAPORT_FLUSH_EVENTS_MASK);
+       }
+
+       if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0, STEP_B0)) {
+               /*
+                * Wa_1608949956:dg2_g10
+                * Wa_14010198302:dg2_g10
+                */
+               wa_masked_en(wal, GEN8_ROW_CHICKEN,
+                            MDQ_ARBITRATION_MODE | UGM_BACKUP_MODE);
+
+               /*
+                * Wa_14010918519:dg2_g10
+                *
+                * LSC_CHICKEN_BIT_0 always reads back as 0 is this stepping,
+                * so ignoring verification.
+                */
+               wa_add(wal, LSC_CHICKEN_BIT_0_UDW, 0,
+                      FORCE_SLM_FENCE_SCOPE_TO_TILE | FORCE_UGM_FENCE_SCOPE_TO_TILE,
+                      0, false);
+       }
+
+       if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0, STEP_B0)) {
+               /* Wa_22010430635:dg2 */
+               wa_masked_en(wal,
+                            GEN9_ROW_CHICKEN4,
+                            GEN12_DISABLE_GRF_CLEAR);
+
+               /* Wa_14010648519:dg2 */
+               wa_write_or(wal, XEHP_L3NODEARBCFG, XEHP_LNESPARE);
+       }
+
+       if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_A0, STEP_C0) ||
+           IS_DG2_G11(engine->i915)) {
+               /* Wa_22012654132:dg2 */
+               wa_add(wal, GEN10_CACHE_MODE_SS, 0,
+                      _MASKED_BIT_ENABLE(ENABLE_PREFETCH_INTO_IC),
+                      0 /* write-only, so skip validation */,
+                      true);
+       }
+
+       /* Wa_14013202645:dg2 */
+       if (IS_DG2_GRAPHICS_STEP(engine->i915, G10, STEP_B0, STEP_C0) ||
+           IS_DG2_GRAPHICS_STEP(engine->i915, G11, STEP_A0, STEP_B0))
+               wa_write_or(wal, RT_CTRL, DIS_NULL_QUERY);
 
        if (IS_DG1_GRAPHICS_STEP(i915, STEP_A0, STEP_B0) ||
            IS_TGL_UY_GRAPHICS_STEP(i915, STEP_A0, STEP_B0)) {
index 1da522d..24a3f6f 100644 (file)
@@ -502,6 +502,11 @@ static inline bool i915_mmio_reg_valid(i915_reg_t reg)
 #define   INVALIDATION_BROADCAST_MODE_DIS      REG_BIT(12)
 #define   GLOBAL_INVALIDATION_MODE             REG_BIT(2)
 
+#define GEN12_GAMSTLB_CTRL             _MMIO(0xcf4c)
+#define   CONTROL_BLOCK_CLKGATE_DIS    REG_BIT(12)
+#define   EGRESS_BLOCK_CLKGATE_DIS     REG_BIT(11)
+#define   TAG_BLOCK_CLKGATE_DIS                REG_BIT(7)
+
 #define GEN12_MERT_MOD_CTRL            _MMIO(0xcf28)
 #define   FORCE_MISS_FTLB              REG_BIT(3)
 
@@ -777,6 +782,9 @@ static inline bool i915_mmio_reg_valid(i915_reg_t reg)
 #define EU_PERF_CNTL5      _MMIO(0xe55c)
 #define EU_PERF_CNTL6      _MMIO(0xe65c)
 
+#define RT_CTRL                        _MMIO(0xe530)
+#define  DIS_NULL_QUERY                REG_BIT(10)
+
 /*
  * OA Boolean state
  */
@@ -2781,6 +2789,9 @@ static inline bool i915_mmio_reg_valid(i915_reg_t reg)
 #define VDBOX_CGCTL3F10(base)          _MMIO((base) + 0x3f10)
 #define   IECPUNIT_CLKGATE_DIS         REG_BIT(22)
 
+#define VDBOX_CGCTL3F18(base)          _MMIO((base) + 0x3f18)
+#define   ALNUNIT_CLKGATE_DIS          REG_BIT(13)
+
 #define ERROR_GEN6     _MMIO(0x40a0)
 #define GEN7_ERR_INT   _MMIO(0x44040)
 #define   ERR_INT_POISON               (1 << 31)
@@ -3124,7 +3135,8 @@ static inline bool i915_mmio_reg_valid(i915_reg_t reg)
 #define GEN9_RCS_FE_FSM2 _MMIO(0x22a4)
 
 #define GEN10_CACHE_MODE_SS                    _MMIO(0xe420)
-#define   FLOAT_BLEND_OPTIMIZATION_ENABLE      (1 << 4)
+#define   ENABLE_PREFETCH_INTO_IC              REG_BIT(3)
+#define   FLOAT_BLEND_OPTIMIZATION_ENABLE      REG_BIT(4)
 
 /* Fuse readout registers for GT */
 #define HSW_PAVP_FUSE1                 _MMIO(0x911C)
@@ -4333,18 +4345,25 @@ enum {
 #define  SARBUNIT_CLKGATE_DIS          (1 << 5)
 #define  RCCUNIT_CLKGATE_DIS           (1 << 7)
 #define  MSCUNIT_CLKGATE_DIS           (1 << 10)
+#define  NODEDSS_CLKGATE_DIS           REG_BIT(12)
 #define  L3_CLKGATE_DIS                        REG_BIT(16)
 #define  L3_CR2X_CLKGATE_DIS           REG_BIT(17)
 
 #define SUBSLICE_UNIT_LEVEL_CLKGATE    _MMIO(0x9524)
-#define  GWUNIT_CLKGATE_DIS            (1 << 16)
+#define   DSS_ROUTER_CLKGATE_DIS       REG_BIT(28)
+#define   GWUNIT_CLKGATE_DIS           REG_BIT(16)
 
 #define SUBSLICE_UNIT_LEVEL_CLKGATE2   _MMIO(0x9528)
 #define  CPSSUNIT_CLKGATE_DIS          REG_BIT(9)
 
+#define SSMCGCTL9530                   _MMIO(0x9530)
+#define   RTFUNIT_CLKGATE_DIS          REG_BIT(18)
+
 #define UNSLICE_UNIT_LEVEL_CLKGATE     _MMIO(0x9434)
 #define   VFUNIT_CLKGATE_DIS           REG_BIT(20)
-#define   TSGUNIT_CLKGATE_DIS          REG_BIT(17)
+#define   TSGUNIT_CLKGATE_DIS          REG_BIT(17) /* XEHPSDV */
+#define   CG3DDISCFEG_CLKGATE_DIS      REG_BIT(17) /* DG2 */
+#define   GAMEDIA_CLKGATE_DIS          REG_BIT(11)
 #define   HSUNIT_CLKGATE_DIS           REG_BIT(8)
 #define   VSUNIT_CLKGATE_DIS           REG_BIT(3)
 
@@ -8403,6 +8422,9 @@ enum {
 #define GEN9_CTX_PREEMPT_REG           _MMIO(0x2248)
 #define   GEN12_DISABLE_POSH_BUSY_FF_DOP_CG REG_BIT(11)
 
+#define GEN12_CS_DEBUG_MODE1_CCCSUNIT_BE_COMMON                _MMIO(0x20EC)
+#define   GEN12_REPLAY_MODE_GRANULARITY                        REG_BIT(0)
+
 #define GEN8_CS_CHICKEN1               _MMIO(0x2580)
 #define GEN9_PREEMPT_3D_OBJECT_LEVEL           (1 << 0)
 #define GEN9_PREEMPT_GPGPU_LEVEL(hi, lo)       (((hi) << 2) | ((lo) << 1))
@@ -8426,9 +8448,10 @@ enum {
   #define GEN8_ERRDETBCTRL (1 << 9)
 
 #define GEN11_COMMON_SLICE_CHICKEN3                    _MMIO(0x7304)
-  #define DG1_FLOAT_POINT_BLEND_OPT_STRICT_MODE_EN     REG_BIT(12)
-  #define GEN11_BLEND_EMB_FIX_DISABLE_IN_RCC           REG_BIT(11)
-  #define GEN12_DISABLE_CPS_AWARE_COLOR_PIPE           REG_BIT(9)
+#define   DG1_FLOAT_POINT_BLEND_OPT_STRICT_MODE_EN     REG_BIT(12)
+#define   XEHP_DUAL_SIMD8_SEQ_MERGE_DISABLE            REG_BIT(12)
+#define   GEN11_BLEND_EMB_FIX_DISABLE_IN_RCC           REG_BIT(11)
+#define   GEN12_DISABLE_CPS_AWARE_COLOR_PIPE           REG_BIT(9)
 
 #define HIZ_CHICKEN                                    _MMIO(0x7018)
 # define CHV_HZ_8X8_MODE_IN_1X                         REG_BIT(15)
@@ -8492,6 +8515,12 @@ enum {
 #define  HDC_FORCE_NON_COHERENT                        (1 << 4)
 #define  HDC_BARRIER_PERFORMANCE_DISABLE       (1 << 10)
 
+#define GEN12_HDC_CHICKEN0                                     _MMIO(0xE5F0)
+#define   LSC_L1_FLUSH_CTL_3D_DATAPORT_FLUSH_EVENTS_MASK       REG_GENMASK(13, 11)
+
+#define SARB_CHICKEN1                          _MMIO(0xe90c)
+#define   COMP_CKN_IN                          REG_GENMASK(30, 29)
+
 #define GEN8_HDC_CHICKEN1                      _MMIO(0x7304)
 
 /* GEN9 chicken */
@@ -8522,6 +8551,10 @@ enum {
 #define   PIXEL_ROUNDING_TRUNC_FB_PASSTHRU     (1 << 15)
 #define   PER_PIXEL_ALPHA_BYPASS_EN            (1 << 7)
 
+#define VFLSKPD                                _MMIO(0x62a8)
+#define   DIS_OVER_FETCH_CACHE         REG_BIT(1)
+#define   DIS_MULT_MISS_RD_SQUASH      REG_BIT(0)
+
 #define FF_MODE2                       _MMIO(0x6604)
 #define   FF_MODE2_GS_TIMER_MASK       REG_GENMASK(31, 24)
 #define   FF_MODE2_GS_TIMER_224                REG_FIELD_PREP(FF_MODE2_GS_TIMER_MASK, 224)
@@ -9345,6 +9378,9 @@ enum {
 #define   GEN8_SDEUNIT_CLOCK_GATE_DISABLE      (1 << 14)
 #define   GEN8_HDCUNIT_CLOCK_GATE_DISABLE_HDCREQ (1 << 28)
 
+#define UNSLCGCTL9430                          _MMIO(0x9430)
+#define   MSQDUNIT_CLKGATE_DIS                 REG_BIT(3)
+
 #define GEN6_GFXPAUSE                          _MMIO(0xA000)
 #define GEN6_RPNSWREQ                          _MMIO(0xA008)
 #define   GEN6_TURBO_DISABLE                   (1 << 31)
@@ -9660,24 +9696,39 @@ enum {
 #define   GEN9_CCS_TLB_PREFETCH_ENABLE (1 << 3)
 
 #define GEN8_ROW_CHICKEN               _MMIO(0xe4f0)
-#define   FLOW_CONTROL_ENABLE          (1 << 15)
-#define   PARTIAL_INSTRUCTION_SHOOTDOWN_DISABLE        (1 << 8)
-#define   STALL_DOP_GATING_DISABLE             (1 << 5)
-#define   THROTTLE_12_5                                (7 << 2)
-#define   DISABLE_EARLY_EOT                    (1 << 1)
+#define   FLOW_CONTROL_ENABLE                  REG_BIT(15)
+#define   UGM_BACKUP_MODE                      REG_BIT(13)
+#define   MDQ_ARBITRATION_MODE                 REG_BIT(12)
+#define   PARTIAL_INSTRUCTION_SHOOTDOWN_DISABLE        REG_BIT(8)
+#define   STALL_DOP_GATING_DISABLE             REG_BIT(5)
+#define   THROTTLE_12_5                                REG_GENMASK(4, 2)
+#define   DISABLE_EARLY_EOT                    REG_BIT(1)
 
 #define GEN7_ROW_CHICKEN2                      _MMIO(0xe4f4)
+#define   GEN12_DISABLE_READ_SUPPRESSION       REG_BIT(15)
 #define   GEN12_DISABLE_EARLY_READ             REG_BIT(14)
+#define   GEN12_ENABLE_LARGE_GRF_MODE          REG_BIT(12)
 #define   GEN12_PUSH_CONST_DEREF_HOLD_DIS      REG_BIT(8)
 
+#define LSC_CHICKEN_BIT_0                      _MMIO(0xe7c8)
+#define   FORCE_1_SUB_MESSAGE_PER_FRAGMENT     REG_BIT(15)
+#define LSC_CHICKEN_BIT_0_UDW                  _MMIO(0xe7c8 + 4)
+#define   DIS_CHAIN_2XSIMD8                    REG_BIT(55 - 32)
+#define   FORCE_SLM_FENCE_SCOPE_TO_TILE                REG_BIT(42 - 32)
+#define   FORCE_UGM_FENCE_SCOPE_TO_TILE                REG_BIT(41 - 32)
+#define   MAXREQS_PER_BANK                     REG_GENMASK(39 - 32, 37 - 32)
+#define   DISABLE_128B_EVICTION_COMMAND_UDW    REG_BIT(36 - 32)
+
 #define GEN7_ROW_CHICKEN2_GT2          _MMIO(0xf4f4)
 #define   DOP_CLOCK_GATING_DISABLE     (1 << 0)
 #define   PUSH_CONSTANT_DEREF_DISABLE  (1 << 8)
 #define   GEN11_TDL_CLOCK_GATING_FIX_DISABLE   (1 << 1)
 
-#define GEN9_ROW_CHICKEN4              _MMIO(0xe48c)
-#define   GEN12_DISABLE_TDL_PUSH       REG_BIT(9)
-#define   GEN11_DIS_PICK_2ND_EU                REG_BIT(7)
+#define GEN9_ROW_CHICKEN4                              _MMIO(0xe48c)
+#define   GEN12_DISABLE_GRF_CLEAR                      REG_BIT(13)
+#define   GEN12_DISABLE_TDL_PUSH                       REG_BIT(9)
+#define   GEN11_DIS_PICK_2ND_EU                                REG_BIT(7)
+#define   GEN12_DISABLE_HDR_PAST_PAYLOAD_HOLD_FIX      REG_BIT(4)
 
 #define HSW_ROW_CHICKEN3               _MMIO(0xe49c)
 #define  HSW_ROW_CHICKEN3_L3_GLOBAL_ATOMICS_DISABLE    (1 << 6)
@@ -9692,9 +9743,10 @@ enum {
 #define   GEN8_SAMPLER_POWER_BYPASS_DIS        (1 << 1)
 
 #define GEN9_HALF_SLICE_CHICKEN7       _MMIO(0xe194)
-#define   GEN9_SAMPLER_HASH_COMPRESSED_READ_ADDR       (1 << 8)
-#define   GEN9_ENABLE_YV12_BUGFIX      (1 << 4)
-#define   GEN9_ENABLE_GPGPU_PREEMPTION (1 << 2)
+#define   DG2_DISABLE_ROUND_ENABLE_ALLOW_FOR_SSLA      REG_BIT(15)
+#define   GEN9_SAMPLER_HASH_COMPRESSED_READ_ADDR       REG_BIT(8)
+#define   GEN9_ENABLE_YV12_BUGFIX                      REG_BIT(4)
+#define   GEN9_ENABLE_GPGPU_PREEMPTION                 REG_BIT(2)
 
 /* Audio */
 #define G4X_AUD_VID_DID                        _MMIO(DISPLAY_MMIO_BASE(dev_priv) + 0x62020)
@@ -12516,12 +12568,17 @@ enum skl_power_gate {
 #define   PMFLUSH_GAPL3UNBLOCK         (1 << 21)
 #define   PMFLUSHDONE_LNEBLK           (1 << 22)
 
+#define XEHP_L3NODEARBCFG              _MMIO(0xb0b4)
+#define   XEHP_LNESPARE                        REG_BIT(19)
+
 #define GEN12_GLOBAL_MOCS(i)   _MMIO(0x4000 + (i) * 4) /* Global MOCS regs */
 
 #define GEN12_GSMBASE                  _MMIO(0x108100)
 #define GEN12_DSMBASE                  _MMIO(0x1080C0)
 
 #define XEHP_CLOCK_GATE_DIS            _MMIO(0x101014)
+#define   SGSI_SIDECLK_DIS             REG_BIT(17)
+#define   SGGI_DIS                     REG_BIT(15)
 #define   SGR_DIS                      REG_BIT(13)
 
 /* gamt regs */
@@ -12900,4 +12957,7 @@ enum skl_power_gate {
 #define CLKGATE_DIS_MISC                       _MMIO(0x46534)
 #define  CLKGATE_DIS_MISC_DMASC_GATING_DIS     REG_BIT(21)
 
+#define SLICE_COMMON_ECO_CHICKEN1              _MMIO(0x731C)
+#define   MSC_MSAA_REODER_BUF_BYPASS_DISABLE   REG_BIT(14)
+
 #endif /* _I915_REG_H_ */
index a133419..6b122dc 100644 (file)
@@ -7473,6 +7473,22 @@ static void xehpsdv_init_clock_gating(struct drm_i915_private *dev_priv)
                intel_uncore_rmw(&dev_priv->uncore, XEHP_CLOCK_GATE_DIS, 0, SGR_DIS);
 }
 
+static void dg2_init_clock_gating(struct drm_i915_private *i915)
+{
+       /* Wa_22010954014:dg2_g10 */
+       if (IS_DG2_G10(i915))
+               intel_uncore_rmw(&i915->uncore, XEHP_CLOCK_GATE_DIS, 0,
+                                SGSI_SIDECLK_DIS);
+
+       /*
+        * Wa_14010733611:dg2_g10
+        * Wa_22010146351:dg2_g10
+        */
+       if (IS_DG2_GRAPHICS_STEP(i915, G10, STEP_A0, STEP_B0))
+               intel_uncore_rmw(&i915->uncore, XEHP_CLOCK_GATE_DIS, 0,
+                                SGR_DIS | SGGI_DIS);
+}
+
 static void cnp_init_clock_gating(struct drm_i915_private *dev_priv)
 {
        if (!HAS_PCH_CNP(dev_priv))
@@ -7883,6 +7899,7 @@ static const struct drm_i915_clock_gating_funcs platform##_clock_gating_funcs =
        .init_clock_gating = platform##_init_clock_gating,              \
 }
 
+CG_FUNCS(dg2);
 CG_FUNCS(xehpsdv);
 CG_FUNCS(adlp);
 CG_FUNCS(dg1);
@@ -7920,7 +7937,9 @@ CG_FUNCS(nop);
  */
 void intel_init_clock_gating_hooks(struct drm_i915_private *dev_priv)
 {
-       if (IS_XEHPSDV(dev_priv))
+       if (IS_DG2(dev_priv))
+               dev_priv->clock_gating_funcs = &dg2_clock_gating_funcs;
+       else if (IS_XEHPSDV(dev_priv))
                dev_priv->clock_gating_funcs = &xehpsdv_clock_gating_funcs;
        else if (IS_ALDERLAKE_P(dev_priv))
                dev_priv->clock_gating_funcs = &adlp_clock_gating_funcs;