drm/amd/display: Add check for DET fetch latency hiding for dcn32
authorDillon Varone <Dillon.Varone@amd.com>
Tue, 8 Nov 2022 23:45:33 +0000 (18:45 -0500)
committerGreg Kroah-Hartman <gregkh@linuxfoundation.org>
Thu, 12 Jan 2023 11:02:54 +0000 (12:02 +0100)
[ Upstream commit 6d4727c80947de0e6fad58b196a9d215e3b32608 ]

[WHY?]
Some configurations are constructed with very marginal DET buffers relative to
the worst possible time required to fetch a swath.

[HOW?]
Add a check to see that the DET buffer allocated for each pipe can hide the
latency for all pipes to fetch at least one swath.

Reviewed-by: Alvin Lee <Alvin.Lee2@amd.com>
Reviewed-by: Jun Lei <Jun.Lei@amd.com>
Acked-by: Brian Chang <Brian.Chang@amd.com>
Signed-off-by: Dillon Varone <Dillon.Varone@amd.com>
Tested-by: Daniel Wheeler <daniel.wheeler@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
Stable-dep-of: f3c23bea598a ("drm/amd/display: Uninitialized variables causing 4k60 UCLK to stay at DPM1 and not DPM0")
Signed-off-by: Sasha Levin <sashal@kernel.org>
drivers/gpu/drm/amd/display/dc/dml/dcn32/display_mode_vba_32.c
drivers/gpu/drm/amd/display/dc/dml/dcn32/display_mode_vba_util_32.c
drivers/gpu/drm/amd/display/dc/dml/dcn32/display_mode_vba_util_32.h
drivers/gpu/drm/amd/display/dc/dml/display_mode_vba.h

index 9afd9ba..820042f 100644 (file)
@@ -670,6 +670,25 @@ static void DISPCLKDPPCLKDCFCLKDeepSleepPrefetchParametersWatermarksAndPerforman
                v->cursor_bw[k] = mode_lib->vba.NumberOfCursors[k] * mode_lib->vba.CursorWidth[k][0] * mode_lib->vba.CursorBPP[k][0] / 8 / (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) * mode_lib->vba.VRatio[k];
        }
 
+       v->NotEnoughDETSwathFillLatencyHiding = dml32_CalculateDETSwathFillLatencyHiding(
+                                               mode_lib->vba.NumberOfActiveSurfaces,
+                                               mode_lib->vba.ReturnBW,
+                                               v->UrgentLatency,
+                                               mode_lib->vba.SwathHeightY,
+                                               mode_lib->vba.SwathHeightC,
+                                               v->swath_width_luma_ub,
+                                               v->swath_width_chroma_ub,
+                                               v->BytePerPixelDETY,
+                                               v->BytePerPixelDETC,
+                                               mode_lib->vba.DETBufferSizeY,
+                                               mode_lib->vba.DETBufferSizeC,
+                                               mode_lib->vba.DPPPerPlane,
+                                               mode_lib->vba.HTotal,
+                                               mode_lib->vba.PixelClock,
+                                               mode_lib->vba.VRatio,
+                                               mode_lib->vba.VRatioChroma,
+                                               mode_lib->vba.UsesMALLForPStateChange);
+
        for (k = 0; k < mode_lib->vba.NumberOfActiveSurfaces; ++k) {
                v->MaxVStartupLines[k] = ((mode_lib->vba.Interlace[k] &&
                                !mode_lib->vba.ProgressiveToInterlaceUnitInOPP) ?
@@ -1664,6 +1683,7 @@ static void mode_support_configuration(struct vba_vars_st *v,
                                && mode_lib->vba.PTEBufferSizeNotExceeded[i][j] == true
                                && mode_lib->vba.DCCMetaBufferSizeNotExceeded[i][j] == true
                                && mode_lib->vba.NonsupportedDSCInputBPC == false
+                               && mode_lib->vba.NotEnoughDETSwathFillLatencyHidingPerState[i][j] == false
                                && !mode_lib->vba.ExceededMALLSize
                                && ((mode_lib->vba.HostVMEnable == false
                                && !mode_lib->vba.ImmediateFlipRequiredFinal)
@@ -3158,6 +3178,25 @@ void dml32_ModeSupportAndSystemConfigurationFull(struct display_mode_lib *mode_l
                                        mode_lib->vba.UrgentBurstFactorChroma,
                                        mode_lib->vba.UrgentBurstFactorCursor);
 
+                       mode_lib->vba.NotEnoughDETSwathFillLatencyHidingPerState[i][j] = dml32_CalculateDETSwathFillLatencyHiding(
+                                       mode_lib->vba.NumberOfActiveSurfaces,
+                                       mode_lib->vba.ReturnBWPerState[i][j],
+                                       mode_lib->vba.UrgLatency[i],
+                                       mode_lib->vba.SwathHeightYThisState,
+                                       mode_lib->vba.SwathHeightCThisState,
+                                       mode_lib->vba.swath_width_luma_ub_this_state,
+                                       mode_lib->vba.swath_width_chroma_ub_this_state,
+                                       mode_lib->vba.BytePerPixelInDETY,
+                                       mode_lib->vba.BytePerPixelInDETC,
+                                       mode_lib->vba.DETBufferSizeYThisState,
+                                       mode_lib->vba.DETBufferSizeCThisState,
+                                       mode_lib->vba.NoOfDPPThisState,
+                                       mode_lib->vba.HTotal,
+                                       mode_lib->vba.PixelClock,
+                                       mode_lib->vba.VRatio,
+                                       mode_lib->vba.VRatioChroma,
+                                       mode_lib->vba.UsesMALLForPStateChange);
+
                        v->dummy_vars.dml32_ModeSupportAndSystemConfigurationFull.VMDataOnlyReturnBWPerState = dml32_get_return_bw_mbps_vm_only(&mode_lib->vba.soc, i,
                                        mode_lib->vba.DCFCLKState[i][j], mode_lib->vba.FabricClockPerState[i],
                                        mode_lib->vba.DRAMSpeedPerState[i]);
index debe46b..5af601c 100644 (file)
@@ -6228,3 +6228,72 @@ void dml32_CalculateImmediateFlipBandwithSupport(unsigned int NumberOfActiveSurf
        *ImmediateFlipBandwidthSupport = (*TotalBandwidth <= ReturnBW);
        *FractionOfUrgentBandwidth = *TotalBandwidth / ReturnBW;
 }
+
+bool dml32_CalculateDETSwathFillLatencyHiding(unsigned int NumberOfActiveSurfaces,
+               double ReturnBW,
+               double UrgentLatency,
+               unsigned int SwathHeightY[],
+               unsigned int SwathHeightC[],
+               unsigned int SwathWidthY[],
+               unsigned int SwathWidthC[],
+               double  BytePerPixelInDETY[],
+               double  BytePerPixelInDETC[],
+               unsigned int    DETBufferSizeY[],
+               unsigned int    DETBufferSizeC[],
+               unsigned int    NumOfDPP[],
+               unsigned int    HTotal[],
+               double  PixelClock[],
+               double  VRatioY[],
+               double  VRatioC[],
+               enum dm_use_mall_for_pstate_change_mode UsesMALLForPStateChange[DC__NUM_DPP__MAX])
+{
+       int k;
+       double SwathSizeAllSurfaces = 0;
+       double SwathSizeAllSurfacesInFetchTimeUs;
+       double DETSwathLatencyHidingUs;
+       double DETSwathLatencyHidingYUs;
+       double DETSwathLatencyHidingCUs;
+       double SwathSizePerSurfaceY[DC__NUM_DPP__MAX];
+       double SwathSizePerSurfaceC[DC__NUM_DPP__MAX];
+       bool NotEnoughDETSwathFillLatencyHiding = false;
+
+       /* calculate sum of single swath size for all pipes in bytes*/
+       for (k = 0; k < NumberOfActiveSurfaces; k++) {
+               SwathSizePerSurfaceY[k] += SwathHeightY[k] * SwathWidthY[k] * BytePerPixelInDETY[k] * NumOfDPP[k];
+
+               if (SwathHeightC[k] != 0)
+                       SwathSizePerSurfaceC[k] += SwathHeightC[k] * SwathWidthC[k] * BytePerPixelInDETC[k] * NumOfDPP[k];
+               else
+                       SwathSizePerSurfaceC[k] = 0;
+
+               SwathSizeAllSurfaces += SwathSizePerSurfaceY[k] + SwathSizePerSurfaceC[k];
+       }
+
+       SwathSizeAllSurfacesInFetchTimeUs = SwathSizeAllSurfaces / ReturnBW + UrgentLatency;
+
+       /* ensure all DET - 1 swath can hide a fetch for all surfaces */
+       for (k = 0; k < NumberOfActiveSurfaces; k++) {
+               double LineTime = HTotal[k] / PixelClock[k];
+
+               /* only care if surface is not phantom */
+               if (UsesMALLForPStateChange[k] != dm_use_mall_pstate_change_phantom_pipe) {
+                       DETSwathLatencyHidingYUs = (dml_floor(DETBufferSizeY[k] / BytePerPixelInDETY[k] / SwathWidthY[k], 1.0) - SwathHeightY[k]) / VRatioY[k] * LineTime;
+
+                       if (SwathHeightC[k] != 0) {
+                               DETSwathLatencyHidingCUs = (dml_floor(DETBufferSizeC[k] / BytePerPixelInDETC[k] / SwathWidthC[k], 1.0) - SwathHeightC[k]) / VRatioC[k] * LineTime;
+
+                               DETSwathLatencyHidingUs = dml_min(DETSwathLatencyHidingYUs, DETSwathLatencyHidingCUs);
+                       } else {
+                               DETSwathLatencyHidingUs = DETSwathLatencyHidingYUs;
+                       }
+
+                       /* DET must be able to hide time to fetch 1 swath for each surface */
+                       if (DETSwathLatencyHidingUs < SwathSizeAllSurfacesInFetchTimeUs) {
+                               NotEnoughDETSwathFillLatencyHiding = true;
+                               break;
+                       }
+               }
+       }
+
+       return NotEnoughDETSwathFillLatencyHiding;
+}
index 3989c2a..779c680 100644 (file)
@@ -1141,4 +1141,22 @@ void dml32_CalculateImmediateFlipBandwithSupport(unsigned int NumberOfActiveSurf
                double  *FractionOfUrgentBandwidth,
                bool *ImmediateFlipBandwidthSupport);
 
+bool dml32_CalculateDETSwathFillLatencyHiding(unsigned int NumberOfActiveSurfaces,
+               double ReturnBW,
+               double UrgentLatency,
+               unsigned int SwathHeightY[],
+               unsigned int SwathHeightC[],
+               unsigned int SwathWidthY[],
+               unsigned int SwathWidthC[],
+               double  BytePerPixelInDETY[],
+               double  BytePerPixelInDETC[],
+               unsigned int    DETBufferSizeY[],
+               unsigned int    DETBufferSizeC[],
+               unsigned int    NumOfDPP[],
+               unsigned int    HTotal[],
+               double  PixelClock[],
+               double  VRatioY[],
+               double  VRatioC[],
+               enum dm_use_mall_for_pstate_change_mode UsesMALLForPStateChange[DC__NUM_DPP__MAX]);
+
 #endif
index a0207a8..2b34b02 100644 (file)
@@ -1041,6 +1041,7 @@ struct vba_vars_st {
        double MinFullDETBufferingTime;
        double AverageReadBandwidthGBytePerSecond;
        bool   FirstMainPlane;
+       bool NotEnoughDETSwathFillLatencyHiding;
 
        unsigned int ViewportWidthChroma[DC__NUM_DPP__MAX];
        unsigned int ViewportHeightChroma[DC__NUM_DPP__MAX];
@@ -1224,6 +1225,7 @@ struct vba_vars_st {
        unsigned int BlockWidthC[DC__NUM_DPP__MAX];
        unsigned int SubViewportLinesNeededInMALL[DC__NUM_DPP__MAX];
        bool VActiveBandwithSupport[DC__VOLTAGE_STATES][2];
+       bool NotEnoughDETSwathFillLatencyHidingPerState[DC__VOLTAGE_STATES][2];
        struct dummy_vars dummy_vars;
 };