/* * Copyright 2018 Advanced Micro Devices, Inc. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included in * all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR * OTHER DEALINGS IN THE SOFTWARE. * * Authors: AMD * */ #include "../display_mode_lib.h" #include "display_mode_vba_20v2.h" #include "../dml_inline_defs.h" /* * NOTE: * This file is gcc-parseable HW gospel, coming straight from HW engineers. * * It doesn't adhere to Linux kernel style and sometimes will do things in odd * ways. Unless there is something clearly wrong with it the code should * remain as-is as it provides us with a guarantee from HW that it is correct. */ #define BPP_INVALID 0 #define BPP_BLENDED_PIPE 0xffffffff static double adjust_ReturnBW( struct display_mode_lib *mode_lib, double ReturnBW, bool DCCEnabledAnyPlane, double ReturnBandwidthToDCN); static unsigned int dscceComputeDelay( unsigned int bpc, double bpp, unsigned int sliceWidth, unsigned int numSlices, enum output_format_class pixelFormat); static unsigned int dscComputeDelay(enum output_format_class pixelFormat); static bool CalculateDelayAfterScaler( struct display_mode_lib *mode_lib, double ReturnBW, double ReadBandwidthPlaneLuma, double ReadBandwidthPlaneChroma, double TotalDataReadBandwidth, double DisplayPipeLineDeliveryTimeLuma, double DisplayPipeLineDeliveryTimeChroma, double DPPCLK, double DISPCLK, double PixelClock, unsigned int DSCDelay, unsigned int DPPPerPlane, bool ScalerEnabled, unsigned int NumberOfCursors, double DPPCLKDelaySubtotal, double DPPCLKDelaySCL, double DPPCLKDelaySCLLBOnly, double DPPCLKDelayCNVCFormater, double DPPCLKDelayCNVCCursor, double DISPCLKDelaySubtotal, unsigned int ScalerRecoutWidth, enum output_format_class OutputFormat, unsigned int HTotal, unsigned int SwathWidthSingleDPPY, double BytePerPixelDETY, double BytePerPixelDETC, unsigned int SwathHeightY, unsigned int SwathHeightC, bool Interlace, bool ProgressiveToInterlaceUnitInOPP, double *DSTXAfterScaler, double *DSTYAfterScaler ); // Super monster function with some 45 argument static bool CalculatePrefetchSchedule( struct display_mode_lib *mode_lib, double DPPCLK, double DISPCLK, double PixelClock, double DCFCLKDeepSleep, unsigned int DPPPerPlane, unsigned int NumberOfCursors, unsigned int VBlank, unsigned int HTotal, unsigned int MaxInterDCNTileRepeaters, unsigned int VStartup, unsigned int PageTableLevels, bool GPUVMEnable, bool DynamicMetadataEnable, unsigned int DynamicMetadataLinesBeforeActiveRequired, unsigned int DynamicMetadataTransmittedBytes, bool DCCEnable, double UrgentLatencyPixelDataOnly, double UrgentExtraLatency, double TCalc, unsigned int PDEAndMetaPTEBytesFrame, unsigned int MetaRowByte, unsigned int PixelPTEBytesPerRow, double PrefetchSourceLinesY, unsigned int SwathWidthY, double BytePerPixelDETY, double VInitPreFillY, unsigned int MaxNumSwathY, double PrefetchSourceLinesC, double BytePerPixelDETC, double VInitPreFillC, unsigned int MaxNumSwathC, unsigned int SwathHeightY, unsigned int SwathHeightC, double TWait, bool XFCEnabled, double XFCRemoteSurfaceFlipDelay, bool InterlaceEnable, bool ProgressiveToInterlaceUnitInOPP, double DSTXAfterScaler, double DSTYAfterScaler, double *DestinationLinesForPrefetch, double *PrefetchBandwidth, double *DestinationLinesToRequestVMInVBlank, double *DestinationLinesToRequestRowInVBlank, double *VRatioPrefetchY, double *VRatioPrefetchC, double *RequiredPrefetchPixDataBW, double *Tno_bw, unsigned int *VUpdateOffsetPix, double *VUpdateWidthPix, double *VReadyOffsetPix); static double RoundToDFSGranularityUp(double Clock, double VCOSpeed); static double RoundToDFSGranularityDown(double Clock, double VCOSpeed); static double CalculatePrefetchSourceLines( struct display_mode_lib *mode_lib, double VRatio, double vtaps, bool Interlace, bool ProgressiveToInterlaceUnitInOPP, unsigned int SwathHeight, unsigned int ViewportYStart, double *VInitPreFill, unsigned int *MaxNumSwath); static unsigned int CalculateVMAndRowBytes( struct display_mode_lib *mode_lib, bool DCCEnable, unsigned int BlockHeight256Bytes, unsigned int BlockWidth256Bytes, enum source_format_class SourcePixelFormat, unsigned int SurfaceTiling, unsigned int BytePerPixel, enum scan_direction_class ScanDirection, unsigned int ViewportWidth, unsigned int ViewportHeight, unsigned int SwathWidthY, bool GPUVMEnable, unsigned int VMMPageSize, unsigned int PTEBufferSizeInRequestsLuma, unsigned int PDEProcessingBufIn64KBReqs, unsigned int Pitch, unsigned int DCCMetaPitch, unsigned int *MacroTileWidth, unsigned int *MetaRowByte, unsigned int *PixelPTEBytesPerRow, bool *PTEBufferSizeNotExceeded, unsigned int *dpte_row_height, unsigned int *meta_row_height); static double CalculateTWait( unsigned int PrefetchMode, double DRAMClockChangeLatency, double UrgentLatencyPixelDataOnly, double SREnterPlusExitTime); static double CalculateRemoteSurfaceFlipDelay( struct display_mode_lib *mode_lib, double VRatio, double SwathWidth, double Bpp, double LineTime, double XFCTSlvVupdateOffset, double XFCTSlvVupdateWidth, double XFCTSlvVreadyOffset, double XFCXBUFLatencyTolerance, double XFCFillBWOverhead, double XFCSlvChunkSize, double XFCBusTransportTime, double TCalc, double TWait, double *SrcActiveDrainRate, double *TInitXFill, double *TslvChk); static void CalculateActiveRowBandwidth( bool GPUVMEnable, enum source_format_class SourcePixelFormat, double VRatio, bool DCCEnable, double LineTime, unsigned int MetaRowByteLuma, unsigned int MetaRowByteChroma, unsigned int meta_row_height_luma, unsigned int meta_row_height_chroma, unsigned int PixelPTEBytesPerRowLuma, unsigned int PixelPTEBytesPerRowChroma, unsigned int dpte_row_height_luma, unsigned int dpte_row_height_chroma, double *meta_row_bw, double *dpte_row_bw, double *qual_row_bw); static void CalculateFlipSchedule( struct display_mode_lib *mode_lib, double UrgentExtraLatency, double UrgentLatencyPixelDataOnly, unsigned int GPUVMMaxPageTableLevels, bool GPUVMEnable, double BandwidthAvailableForImmediateFlip, unsigned int TotImmediateFlipBytes, enum source_format_class SourcePixelFormat, unsigned int ImmediateFlipBytes, double LineTime, double VRatio, double Tno_bw, double PDEAndMetaPTEBytesFrame, unsigned int MetaRowByte, unsigned int PixelPTEBytesPerRow, bool DCCEnable, unsigned int dpte_row_height, unsigned int meta_row_height, double qual_row_bw, double *DestinationLinesToRequestVMInImmediateFlip, double *DestinationLinesToRequestRowInImmediateFlip, double *final_flip_bw, bool *ImmediateFlipSupportedForPipe); static double CalculateWriteBackDelay( enum source_format_class WritebackPixelFormat, double WritebackHRatio, double WritebackVRatio, unsigned int WritebackLumaHTaps, unsigned int WritebackLumaVTaps, unsigned int WritebackChromaHTaps, unsigned int WritebackChromaVTaps, unsigned int WritebackDestinationWidth); static void dml20v2_DisplayPipeConfiguration(struct display_mode_lib *mode_lib); static void dml20v2_DISPCLKDPPCLKDCFCLKDeepSleepPrefetchParametersWatermarksAndPerformanceCalculation( struct display_mode_lib *mode_lib); void dml20v2_recalculate(struct display_mode_lib *mode_lib) { ModeSupportAndSystemConfiguration(mode_lib); mode_lib->vba.FabricAndDRAMBandwidth = dml_min( mode_lib->vba.DRAMSpeed * mode_lib->vba.NumberOfChannels * mode_lib->vba.DRAMChannelWidth, mode_lib->vba.FabricClock * mode_lib->vba.FabricDatapathToDCNDataReturn) / 1000.0; PixelClockAdjustmentForProgressiveToInterlaceUnit(mode_lib); dml20v2_DisplayPipeConfiguration(mode_lib); dml20v2_DISPCLKDPPCLKDCFCLKDeepSleepPrefetchParametersWatermarksAndPerformanceCalculation(mode_lib); } static double adjust_ReturnBW( struct display_mode_lib *mode_lib, double ReturnBW, bool DCCEnabledAnyPlane, double ReturnBandwidthToDCN) { double CriticalCompression; if (DCCEnabledAnyPlane && ReturnBandwidthToDCN > mode_lib->vba.DCFCLK * mode_lib->vba.ReturnBusWidth / 4.0) ReturnBW = dml_min( ReturnBW, ReturnBandwidthToDCN * 4 * (1.0 - mode_lib->vba.UrgentLatencyPixelDataOnly / ((mode_lib->vba.ROBBufferSizeInKByte - mode_lib->vba.PixelChunkSizeInKByte) * 1024 / ReturnBandwidthToDCN - mode_lib->vba.DCFCLK * mode_lib->vba.ReturnBusWidth / 4) + mode_lib->vba.UrgentLatencyPixelDataOnly)); CriticalCompression = 2.0 * mode_lib->vba.ReturnBusWidth * mode_lib->vba.DCFCLK * mode_lib->vba.UrgentLatencyPixelDataOnly / (ReturnBandwidthToDCN * mode_lib->vba.UrgentLatencyPixelDataOnly + (mode_lib->vba.ROBBufferSizeInKByte - mode_lib->vba.PixelChunkSizeInKByte) * 1024); if (DCCEnabledAnyPlane && CriticalCompression > 1.0 && CriticalCompression < 4.0) ReturnBW = dml_min( ReturnBW, 4.0 * ReturnBandwidthToDCN * (mode_lib->vba.ROBBufferSizeInKByte - mode_lib->vba.PixelChunkSizeInKByte) * 1024 * mode_lib->vba.ReturnBusWidth * mode_lib->vba.DCFCLK * mode_lib->vba.UrgentLatencyPixelDataOnly / dml_pow( (ReturnBandwidthToDCN * mode_lib->vba.UrgentLatencyPixelDataOnly + (mode_lib->vba.ROBBufferSizeInKByte - mode_lib->vba.PixelChunkSizeInKByte) * 1024), 2)); return ReturnBW; } static unsigned int dscceComputeDelay( unsigned int bpc, double bpp, unsigned int sliceWidth, unsigned int numSlices, enum output_format_class pixelFormat) { // valid bpc = source bits per component in the set of {8, 10, 12} // valid bpp = increments of 1/16 of a bit // min = 6/7/8 in N420/N422/444, respectively // max = such that compression is 1:1 //valid sliceWidth = number of pixels per slice line, must be less than or equal to 5184/numSlices (or 4096/numSlices in 420 mode) //valid numSlices = number of slices in the horiziontal direction per DSC engine in the set of {1, 2, 3, 4} //valid pixelFormat = pixel/color format in the set of {:N444_RGB, :S422, :N422, :N420} // fixed value unsigned int rcModelSize = 8192; // N422/N420 operate at 2 pixels per clock unsigned int pixelsPerClock, lstall, D, initalXmitDelay, w, s, ix, wx, p, l0, a, ax, l, Delay, pixels; if (pixelFormat == dm_n422 || pixelFormat == dm_420) pixelsPerClock = 2; // #all other modes operate at 1 pixel per clock else pixelsPerClock = 1; //initial transmit delay as per PPS initalXmitDelay = dml_round(rcModelSize / 2.0 / bpp / pixelsPerClock); //compute ssm delay if (bpc == 8) D = 81; else if (bpc == 10) D = 89; else D = 113; //divide by pixel per cycle to compute slice width as seen by DSC w = sliceWidth / pixelsPerClock; //422 mode has an additional cycle of delay if (pixelFormat == dm_s422) s = 1; else s = 0; //main calculation for the dscce ix = initalXmitDelay + 45; wx = (w + 2) / 3; p = 3 * wx - w; l0 = ix / w; a = ix + p * l0; ax = (a + 2) / 3 + D + 6 + 1; l = (ax + wx - 1) / wx; if ((ix % w) == 0 && p != 0) lstall = 1; else lstall = 0; Delay = l * wx * (numSlices - 1) + ax + s + lstall + 22; //dsc processes 3 pixel containers per cycle and a container can contain 1 or 2 pixels pixels = Delay * 3 * pixelsPerClock; return pixels; } static unsigned int dscComputeDelay(enum output_format_class pixelFormat) { unsigned int Delay = 0; if (pixelFormat == dm_420) { // sfr Delay = Delay + 2; // dsccif Delay = Delay + 0; // dscc - input deserializer Delay = Delay + 3; // dscc gets pixels every other cycle Delay = Delay + 2; // dscc - input cdc fifo Delay = Delay + 12; // dscc gets pixels every other cycle Delay = Delay + 13; // dscc - cdc uncertainty Delay = Delay + 2; // dscc - output cdc fifo Delay = Delay + 7; // dscc gets pixels every other cycle Delay = Delay + 3; // dscc - cdc uncertainty Delay = Delay + 2; // dscc - output serializer Delay = Delay + 1; // sft Delay = Delay + 1; } else if (pixelFormat == dm_n422) { // sfr Delay = Delay + 2; // dsccif Delay = Delay + 1; // dscc - input deserializer Delay = Delay + 5; // dscc - input cdc fifo Delay = Delay + 25; // dscc - cdc uncertainty Delay = Delay + 2; // dscc - output cdc fifo Delay = Delay + 10; // dscc - cdc uncertainty Delay = Delay + 2; // dscc - output serializer Delay = Delay + 1; // sft Delay = Delay + 1; } else { // sfr Delay = Delay + 2; // dsccif Delay = Delay + 0; // dscc - input deserializer Delay = Delay + 3; // dscc - input cdc fifo Delay = Delay + 12; // dscc - cdc uncertainty Delay = Delay + 2; // dscc - output cdc fifo Delay = Delay + 7; // dscc - output serializer Delay = Delay + 1; // dscc - cdc uncertainty Delay = Delay + 2; // sft Delay = Delay + 1; } return Delay; } static bool CalculateDelayAfterScaler( struct display_mode_lib *mode_lib, double ReturnBW, double ReadBandwidthPlaneLuma, double ReadBandwidthPlaneChroma, double TotalDataReadBandwidth, double DisplayPipeLineDeliveryTimeLuma, double DisplayPipeLineDeliveryTimeChroma, double DPPCLK, double DISPCLK, double PixelClock, unsigned int DSCDelay, unsigned int DPPPerPlane, bool ScalerEnabled, unsigned int NumberOfCursors, double DPPCLKDelaySubtotal, double DPPCLKDelaySCL, double DPPCLKDelaySCLLBOnly, double DPPCLKDelayCNVCFormater, double DPPCLKDelayCNVCCursor, double DISPCLKDelaySubtotal, unsigned int ScalerRecoutWidth, enum output_format_class OutputFormat, unsigned int HTotal, unsigned int SwathWidthSingleDPPY, double BytePerPixelDETY, double BytePerPixelDETC, unsigned int SwathHeightY, unsigned int SwathHeightC, bool Interlace, bool ProgressiveToInterlaceUnitInOPP, double *DSTXAfterScaler, double *DSTYAfterScaler ) { unsigned int DPPCycles, DISPCLKCycles; double DataFabricLineDeliveryTimeLuma; double DataFabricLineDeliveryTimeChroma; double DSTTotalPixelsAfterScaler; DataFabricLineDeliveryTimeLuma = SwathWidthSingleDPPY * SwathHeightY * dml_ceil(BytePerPixelDETY, 1) / (mode_lib->vba.ReturnBW * ReadBandwidthPlaneLuma / TotalDataReadBandwidth); mode_lib->vba.LastPixelOfLineExtraWatermark = dml_max(mode_lib->vba.LastPixelOfLineExtraWatermark, DataFabricLineDeliveryTimeLuma - DisplayPipeLineDeliveryTimeLuma); if (BytePerPixelDETC != 0) { DataFabricLineDeliveryTimeChroma = SwathWidthSingleDPPY / 2 * SwathHeightC * dml_ceil(BytePerPixelDETC, 2) / (mode_lib->vba.ReturnBW * ReadBandwidthPlaneChroma / TotalDataReadBandwidth); mode_lib->vba.LastPixelOfLineExtraWatermark = dml_max(mode_lib->vba.LastPixelOfLineExtraWatermark, DataFabricLineDeliveryTimeChroma - DisplayPipeLineDeliveryTimeChroma); } if (ScalerEnabled) DPPCycles = DPPCLKDelaySubtotal + DPPCLKDelaySCL; else DPPCycles = DPPCLKDelaySubtotal + DPPCLKDelaySCLLBOnly; DPPCycles = DPPCycles + DPPCLKDelayCNVCFormater + NumberOfCursors * DPPCLKDelayCNVCCursor; DISPCLKCycles = DISPCLKDelaySubtotal; if (DPPCLK == 0.0 || DISPCLK == 0.0) return true; *DSTXAfterScaler = DPPCycles * PixelClock / DPPCLK + DISPCLKCycles * PixelClock / DISPCLK + DSCDelay; if (DPPPerPlane > 1) *DSTXAfterScaler = *DSTXAfterScaler + ScalerRecoutWidth; if (OutputFormat == dm_420 || (Interlace && ProgressiveToInterlaceUnitInOPP)) *DSTYAfterScaler = 1; else *DSTYAfterScaler = 0; DSTTotalPixelsAfterScaler = ((double) (*DSTYAfterScaler * HTotal)) + *DSTXAfterScaler; *DSTYAfterScaler = dml_floor(DSTTotalPixelsAfterScaler / HTotal, 1); *DSTXAfterScaler = DSTTotalPixelsAfterScaler - ((double) (*DSTYAfterScaler * HTotal)); return true; } static bool CalculatePrefetchSchedule( struct display_mode_lib *mode_lib, double DPPCLK, double DISPCLK, double PixelClock, double DCFCLKDeepSleep, unsigned int DPPPerPlane, unsigned int NumberOfCursors, unsigned int VBlank, unsigned int HTotal, unsigned int MaxInterDCNTileRepeaters, unsigned int VStartup, unsigned int PageTableLevels, bool GPUVMEnable, bool DynamicMetadataEnable, unsigned int DynamicMetadataLinesBeforeActiveRequired, unsigned int DynamicMetadataTransmittedBytes, bool DCCEnable, double UrgentLatencyPixelDataOnly, double UrgentExtraLatency, double TCalc, unsigned int PDEAndMetaPTEBytesFrame, unsigned int MetaRowByte, unsigned int PixelPTEBytesPerRow, double PrefetchSourceLinesY, unsigned int SwathWidthY, double BytePerPixelDETY, double VInitPreFillY, unsigned int MaxNumSwathY, double PrefetchSourceLinesC, double BytePerPixelDETC, double VInitPreFillC, unsigned int MaxNumSwathC, unsigned int SwathHeightY, unsigned int SwathHeightC, double TWait, bool XFCEnabled, double XFCRemoteSurfaceFlipDelay, bool InterlaceEnable, bool ProgressiveToInterlaceUnitInOPP, double DSTXAfterScaler, double DSTYAfterScaler, double *DestinationLinesForPrefetch, double *PrefetchBandwidth, double *DestinationLinesToRequestVMInVBlank, double *DestinationLinesToRequestRowInVBlank, double *VRatioPrefetchY, double *VRatioPrefetchC, double *RequiredPrefetchPixDataBW, double *Tno_bw, unsigned int *VUpdateOffsetPix, double *VUpdateWidthPix, double *VReadyOffsetPix) { bool MyError = false; double TotalRepeaterDelayTime; double Tdm, LineTime, Tsetup; double dst_y_prefetch_equ; double Tsw_oto; double prefetch_bw_oto; double Tvm_oto; double Tr0_oto; double Tpre_oto; double dst_y_prefetch_oto; double TimeForFetchingMetaPTE = 0; double TimeForFetchingRowInVBlank = 0; double LinesToRequestPrefetchPixelData = 0; *VUpdateOffsetPix = dml_ceil(HTotal / 4.0, 1); TotalRepeaterDelayTime = MaxInterDCNTileRepeaters * (2.0 / DPPCLK + 3.0 / DISPCLK); *VUpdateWidthPix = (14.0 / DCFCLKDeepSleep + 12.0 / DPPCLK + TotalRepeaterDelayTime) * PixelClock; *VReadyOffsetPix = dml_max( 150.0 / DPPCLK, TotalRepeaterDelayTime + 20.0 / DCFCLKDeepSleep + 10.0 / DPPCLK) * PixelClock; Tsetup = (double) (*VUpdateOffsetPix + *VUpdateWidthPix + *VReadyOffsetPix) / PixelClock; LineTime = (double) HTotal / PixelClock; if (DynamicMetadataEnable) { double Tdmbf, Tdmec, Tdmsks; Tdm = dml_max(0.0, UrgentExtraLatency - TCalc); Tdmbf = DynamicMetadataTransmittedBytes / 4.0 / DISPCLK; Tdmec = LineTime; if (DynamicMetadataLinesBeforeActiveRequired == 0) Tdmsks = VBlank * LineTime / 2.0; else Tdmsks = DynamicMetadataLinesBeforeActiveRequired * LineTime; if (InterlaceEnable && !ProgressiveToInterlaceUnitInOPP) Tdmsks = Tdmsks / 2; if (VStartup * LineTime < Tsetup + TWait + UrgentExtraLatency + Tdmbf + Tdmec + Tdmsks) { MyError = true; } } else Tdm = 0; if (GPUVMEnable) { if (PageTableLevels == 4) *Tno_bw = UrgentExtraLatency + UrgentLatencyPixelDataOnly; else if (PageTableLevels == 3) *Tno_bw = UrgentExtraLatency; else *Tno_bw = 0; } else if (DCCEnable) *Tno_bw = LineTime; else *Tno_bw = LineTime / 4; dst_y_prefetch_equ = VStartup - dml_max(TCalc + TWait, XFCRemoteSurfaceFlipDelay) / LineTime - (Tsetup + Tdm) / LineTime - (DSTYAfterScaler + DSTXAfterScaler / HTotal); Tsw_oto = dml_max(PrefetchSourceLinesY, PrefetchSourceLinesC) * LineTime; prefetch_bw_oto = (MetaRowByte + PixelPTEBytesPerRow + PrefetchSourceLinesY * SwathWidthY * dml_ceil(BytePerPixelDETY, 1) + PrefetchSourceLinesC * SwathWidthY / 2 * dml_ceil(BytePerPixelDETC, 2)) / Tsw_oto; if (GPUVMEnable == true) { Tvm_oto = dml_max( *Tno_bw + PDEAndMetaPTEBytesFrame / prefetch_bw_oto, dml_max( UrgentExtraLatency + UrgentLatencyPixelDataOnly * (PageTableLevels - 1), LineTime / 4.0)); } else Tvm_oto = LineTime / 4.0; if ((GPUVMEnable == true || DCCEnable == true)) { Tr0_oto = dml_max( (MetaRowByte + PixelPTEBytesPerRow) / prefetch_bw_oto, dml_max(UrgentLatencyPixelDataOnly, dml_max(LineTime - Tvm_oto, LineTime / 4))); } else Tr0_oto = LineTime - Tvm_oto; Tpre_oto = Tvm_oto + Tr0_oto + Tsw_oto; dst_y_prefetch_oto = Tpre_oto / LineTime; if (dst_y_prefetch_oto < dst_y_prefetch_equ) *DestinationLinesForPrefetch = dst_y_prefetch_oto; else *DestinationLinesForPrefetch = dst_y_prefetch_equ; *DestinationLinesForPrefetch = dml_floor(4.0 * (*DestinationLinesForPrefetch + 0.125), 1) / 4; dml_print("DML: VStartup: %d\n", VStartup); dml_print("DML: TCalc: %f\n", TCalc); dml_print("DML: TWait: %f\n", TWait); dml_print("DML: XFCRemoteSurfaceFlipDelay: %f\n", XFCRemoteSurfaceFlipDelay); dml_print("DML: LineTime: %f\n", LineTime); dml_print("DML: Tsetup: %f\n", Tsetup); dml_print("DML: Tdm: %f\n", Tdm); dml_print("DML: DSTYAfterScaler: %f\n", DSTYAfterScaler); dml_print("DML: DSTXAfterScaler: %f\n", DSTXAfterScaler); dml_print("DML: HTotal: %d\n", HTotal); *PrefetchBandwidth = 0; *DestinationLinesToRequestVMInVBlank = 0; *DestinationLinesToRequestRowInVBlank = 0; *VRatioPrefetchY = 0; *VRatioPrefetchC = 0; *RequiredPrefetchPixDataBW = 0; if (*DestinationLinesForPrefetch > 1) { *PrefetchBandwidth = (PDEAndMetaPTEBytesFrame + 2 * MetaRowByte + 2 * PixelPTEBytesPerRow + PrefetchSourceLinesY * SwathWidthY * dml_ceil(BytePerPixelDETY, 1) + PrefetchSourceLinesC * SwathWidthY / 2 * dml_ceil(BytePerPixelDETC, 2)) / (*DestinationLinesForPrefetch * LineTime - *Tno_bw); if (GPUVMEnable) { TimeForFetchingMetaPTE = dml_max( *Tno_bw + (double) PDEAndMetaPTEBytesFrame / *PrefetchBandwidth, dml_max( UrgentExtraLatency + UrgentLatencyPixelDataOnly * (PageTableLevels - 1), LineTime / 4)); } else { if (NumberOfCursors > 0 || XFCEnabled) TimeForFetchingMetaPTE = LineTime / 4; else TimeForFetchingMetaPTE = 0.0; } if ((GPUVMEnable == true || DCCEnable == true)) { TimeForFetchingRowInVBlank = dml_max( (MetaRowByte + PixelPTEBytesPerRow) / *PrefetchBandwidth, dml_max( UrgentLatencyPixelDataOnly, dml_max( LineTime - TimeForFetchingMetaPTE, LineTime / 4.0))); } else { if (NumberOfCursors > 0 || XFCEnabled) TimeForFetchingRowInVBlank = LineTime - TimeForFetchingMetaPTE; else TimeForFetchingRowInVBlank = 0.0; } *DestinationLinesToRequestVMInVBlank = dml_floor( 4.0 * (TimeForFetchingMetaPTE / LineTime + 0.125), 1) / 4.0; *DestinationLinesToRequestRowInVBlank = dml_floor( 4.0 * (TimeForFetchingRowInVBlank / LineTime + 0.125), 1) / 4.0; LinesToRequestPrefetchPixelData = *DestinationLinesForPrefetch - ((NumberOfCursors > 0 || GPUVMEnable || DCCEnable) ? (*DestinationLinesToRequestVMInVBlank + *DestinationLinesToRequestRowInVBlank) : 0.0); if (LinesToRequestPrefetchPixelData > 0) { *VRatioPrefetchY = (double) PrefetchSourceLinesY / LinesToRequestPrefetchPixelData; *VRatioPrefetchY = dml_max(*VRatioPrefetchY, 1.0); if ((SwathHeightY > 4) && (VInitPreFillY > 3)) { if (LinesToRequestPrefetchPixelData > (VInitPreFillY - 3.0) / 2.0) { *VRatioPrefetchY = dml_max( (double) PrefetchSourceLinesY / LinesToRequestPrefetchPixelData, (double) MaxNumSwathY * SwathHeightY / (LinesToRequestPrefetchPixelData - (VInitPreFillY - 3.0) / 2.0)); *VRatioPrefetchY = dml_max(*VRatioPrefetchY, 1.0); } else { MyError = true; *VRatioPrefetchY = 0; } } *VRatioPrefetchC = (double) PrefetchSourceLinesC / LinesToRequestPrefetchPixelData; *VRatioPrefetchC = dml_max(*VRatioPrefetchC, 1.0); if ((SwathHeightC > 4)) { if (LinesToRequestPrefetchPixelData > (VInitPreFillC - 3.0) / 2.0) { *VRatioPrefetchC = dml_max( *VRatioPrefetchC, (double) MaxNumSwathC * SwathHeightC / (LinesToRequestPrefetchPixelData - (VInitPreFillC - 3.0) / 2.0)); *VRatioPrefetchC = dml_max(*VRatioPrefetchC, 1.0); } else { MyError = true; *VRatioPrefetchC = 0; } } *RequiredPrefetchPixDataBW = DPPPerPlane * ((double) PrefetchSourceLinesY / LinesToRequestPrefetchPixelData * dml_ceil( BytePerPixelDETY, 1) + (double) PrefetchSourceLinesC / LinesToRequestPrefetchPixelData * dml_ceil( BytePerPixelDETC, 2) / 2) * SwathWidthY / LineTime; } else { MyError = true; *VRatioPrefetchY = 0; *VRatioPrefetchC = 0; *RequiredPrefetchPixDataBW = 0; } } else { MyError = true; } if (MyError) { *PrefetchBandwidth = 0; TimeForFetchingMetaPTE = 0; TimeForFetchingRowInVBlank = 0; *DestinationLinesToRequestVMInVBlank = 0; *DestinationLinesToRequestRowInVBlank = 0; *DestinationLinesForPrefetch = 0; LinesToRequestPrefetchPixelData = 0; *VRatioPrefetchY = 0; *VRatioPrefetchC = 0; *RequiredPrefetchPixDataBW = 0; } return MyError; } static double RoundToDFSGranularityUp(double Clock, double VCOSpeed) { return VCOSpeed * 4 / dml_floor(VCOSpeed * 4 / Clock, 1); } static double RoundToDFSGranularityDown(double Clock, double VCOSpeed) { return VCOSpeed * 4 / dml_ceil(VCOSpeed * 4 / Clock, 1); } static double CalculatePrefetchSourceLines( struct display_mode_lib *mode_lib, double VRatio, double vtaps, bool Interlace, bool ProgressiveToInterlaceUnitInOPP, unsigned int SwathHeight, unsigned int ViewportYStart, double *VInitPreFill, unsigned int *MaxNumSwath) { unsigned int MaxPartialSwath; if (ProgressiveToInterlaceUnitInOPP) *VInitPreFill = dml_floor((VRatio + vtaps + 1) / 2.0, 1); else *VInitPreFill = dml_floor((VRatio + vtaps + 1 + Interlace * 0.5 * VRatio) / 2.0, 1); if (!mode_lib->vba.IgnoreViewportPositioning) { *MaxNumSwath = dml_ceil((*VInitPreFill - 1.0) / SwathHeight, 1) + 1.0; if (*VInitPreFill > 1.0) MaxPartialSwath = (unsigned int) (*VInitPreFill - 2) % SwathHeight; else MaxPartialSwath = (unsigned int) (*VInitPreFill + SwathHeight - 2) % SwathHeight; MaxPartialSwath = dml_max(1U, MaxPartialSwath); } else { if (ViewportYStart != 0) dml_print( "WARNING DML: using viewport y position of 0 even though actual viewport y position is non-zero in prefetch source lines calculation\n"); *MaxNumSwath = dml_ceil(*VInitPreFill / SwathHeight, 1); if (*VInitPreFill > 1.0) MaxPartialSwath = (unsigned int) (*VInitPreFill - 1) % SwathHeight; else MaxPartialSwath = (unsigned int) (*VInitPreFill + SwathHeight - 1) % SwathHeight; } return *MaxNumSwath * SwathHeight + MaxPartialSwath; } static unsigned int CalculateVMAndRowBytes( struct display_mode_lib *mode_lib, bool DCCEnable, unsigned int BlockHeight256Bytes, unsigned int BlockWidth256Bytes, enum source_format_class SourcePixelFormat, unsigned int SurfaceTiling, unsigned int BytePerPixel, enum scan_direction_class ScanDirection, unsigned int ViewportWidth, unsigned int ViewportHeight, unsigned int SwathWidth, bool GPUVMEnable, unsigned int VMMPageSize, unsigned int PTEBufferSizeInRequestsLuma, unsigned int PDEProcessingBufIn64KBReqs, unsigned int Pitch, unsigned int DCCMetaPitch, unsigned int *MacroTileWidth, unsigned int *MetaRowByte, unsigned int *PixelPTEBytesPerRow, bool *PTEBufferSizeNotExceeded, unsigned int *dpte_row_height, unsigned int *meta_row_height) { unsigned int MetaRequestHeight; unsigned int MetaRequestWidth; unsigned int MetaSurfWidth; unsigned int MetaSurfHeight; unsigned int MPDEBytesFrame; unsigned int MetaPTEBytesFrame; unsigned int DCCMetaSurfaceBytes; unsigned int MacroTileSizeBytes; unsigned int MacroTileHeight; unsigned int DPDE0BytesFrame; unsigned int ExtraDPDEBytesFrame; unsigned int PDEAndMetaPTEBytesFrame; if (DCCEnable == true) { MetaRequestHeight = 8 * BlockHeight256Bytes; MetaRequestWidth = 8 * BlockWidth256Bytes; if (ScanDirection == dm_horz) { *meta_row_height = MetaRequestHeight; MetaSurfWidth = dml_ceil((double) SwathWidth - 1, MetaRequestWidth) + MetaRequestWidth; *MetaRowByte = MetaSurfWidth * MetaRequestHeight * BytePerPixel / 256.0; } else { *meta_row_height = MetaRequestWidth; MetaSurfHeight = dml_ceil((double) SwathWidth - 1, MetaRequestHeight) + MetaRequestHeight; *MetaRowByte = MetaSurfHeight * MetaRequestWidth * BytePerPixel / 256.0; } if (ScanDirection == dm_horz) { DCCMetaSurfaceBytes = DCCMetaPitch * (dml_ceil(ViewportHeight - 1, 64 * BlockHeight256Bytes) + 64 * BlockHeight256Bytes) * BytePerPixel / 256; } else { DCCMetaSurfaceBytes = DCCMetaPitch * (dml_ceil( (double) ViewportHeight - 1, 64 * BlockHeight256Bytes) + 64 * BlockHeight256Bytes) * BytePerPixel / 256; } if (GPUVMEnable == true) { MetaPTEBytesFrame = (dml_ceil( (double) (DCCMetaSurfaceBytes - VMMPageSize) / (8 * VMMPageSize), 1) + 1) * 64; MPDEBytesFrame = 128 * (mode_lib->vba.GPUVMMaxPageTableLevels - 1); } else { MetaPTEBytesFrame = 0; MPDEBytesFrame = 0; } } else { MetaPTEBytesFrame = 0; MPDEBytesFrame = 0; *MetaRowByte = 0; } if (SurfaceTiling == dm_sw_linear || SurfaceTiling == dm_sw_gfx7_2d_thin_gl || SurfaceTiling == dm_sw_gfx7_2d_thin_lvp) { MacroTileSizeBytes = 256; MacroTileHeight = BlockHeight256Bytes; } else if (SurfaceTiling == dm_sw_4kb_s || SurfaceTiling == dm_sw_4kb_s_x || SurfaceTiling == dm_sw_4kb_d || SurfaceTiling == dm_sw_4kb_d_x) { MacroTileSizeBytes = 4096; MacroTileHeight = 4 * BlockHeight256Bytes; } else if (SurfaceTiling == dm_sw_64kb_s || SurfaceTiling == dm_sw_64kb_s_t || SurfaceTiling == dm_sw_64kb_s_x || SurfaceTiling == dm_sw_64kb_d || SurfaceTiling == dm_sw_64kb_d_t || SurfaceTiling == dm_sw_64kb_d_x || SurfaceTiling == dm_sw_64kb_r_x) { MacroTileSizeBytes = 65536; MacroTileHeight = 16 * BlockHeight256Bytes; } else { MacroTileSizeBytes = 262144; MacroTileHeight = 32 * BlockHeight256Bytes; } *MacroTileWidth = MacroTileSizeBytes / BytePerPixel / MacroTileHeight; if (GPUVMEnable == true && mode_lib->vba.GPUVMMaxPageTableLevels > 1) { if (ScanDirection == dm_horz) { DPDE0BytesFrame = 64 * (dml_ceil( ((Pitch * (dml_ceil( ViewportHeight - 1, MacroTileHeight) + MacroTileHeight) * BytePerPixel) - MacroTileSizeBytes) / (8 * 2097152), 1) + 1); } else { DPDE0BytesFrame = 64 * (dml_ceil( ((Pitch * (dml_ceil( (double) SwathWidth - 1, MacroTileHeight) + MacroTileHeight) * BytePerPixel) - MacroTileSizeBytes) / (8 * 2097152), 1) + 1); } ExtraDPDEBytesFrame = 128 * (mode_lib->vba.GPUVMMaxPageTableLevels - 2); } else { DPDE0BytesFrame = 0; ExtraDPDEBytesFrame = 0; } PDEAndMetaPTEBytesFrame = MetaPTEBytesFrame + MPDEBytesFrame + DPDE0BytesFrame + ExtraDPDEBytesFrame; if (GPUVMEnable == true) { unsigned int PTERequestSize; unsigned int PixelPTEReqHeight; unsigned int PixelPTEReqWidth; double FractionOfPTEReturnDrop; unsigned int EffectivePDEProcessingBufIn64KBReqs; if (SurfaceTiling == dm_sw_linear) { PixelPTEReqHeight = 1; PixelPTEReqWidth = 8.0 * VMMPageSize / BytePerPixel; PTERequestSize = 64; FractionOfPTEReturnDrop = 0; } else if (MacroTileSizeBytes == 4096) { PixelPTEReqHeight = MacroTileHeight; PixelPTEReqWidth = 8 * *MacroTileWidth; PTERequestSize = 64; if (ScanDirection == dm_horz) FractionOfPTEReturnDrop = 0; else FractionOfPTEReturnDrop = 7 / 8; } else if (VMMPageSize == 4096 && MacroTileSizeBytes > 4096) { PixelPTEReqHeight = 16 * BlockHeight256Bytes; PixelPTEReqWidth = 16 * BlockWidth256Bytes; PTERequestSize = 128; FractionOfPTEReturnDrop = 0; } else { PixelPTEReqHeight = MacroTileHeight; PixelPTEReqWidth = 8 * *MacroTileWidth; PTERequestSize = 64; FractionOfPTEReturnDrop = 0; } if (SourcePixelFormat == dm_420_8 || SourcePixelFormat == dm_420_10) EffectivePDEProcessingBufIn64KBReqs = PDEProcessingBufIn64KBReqs / 2; else EffectivePDEProcessingBufIn64KBReqs = PDEProcessingBufIn64KBReqs; if (SurfaceTiling == dm_sw_linear) { *dpte_row_height = dml_min( 128, 1 << (unsigned int) dml_floor( dml_log2( dml_min( (double) PTEBufferSizeInRequestsLuma * PixelPTEReqWidth, EffectivePDEProcessingBufIn64KBReqs * 65536.0 / BytePerPixel) / Pitch), 1)); *PixelPTEBytesPerRow = PTERequestSize * (dml_ceil( (double) (Pitch * *dpte_row_height - 1) / PixelPTEReqWidth, 1) + 1); } else if (ScanDirection == dm_horz) { *dpte_row_height = PixelPTEReqHeight; *PixelPTEBytesPerRow = PTERequestSize * (dml_ceil(((double) SwathWidth - 1) / PixelPTEReqWidth, 1) + 1); } else { *dpte_row_height = dml_min(PixelPTEReqWidth, *MacroTileWidth); *PixelPTEBytesPerRow = PTERequestSize * (dml_ceil( ((double) SwathWidth - 1) / PixelPTEReqHeight, 1) + 1); } if (*PixelPTEBytesPerRow * (1 - FractionOfPTEReturnDrop) <= 64 * PTEBufferSizeInRequestsLuma) { *PTEBufferSizeNotExceeded = true; } else { *PTEBufferSizeNotExceeded = false; } } else { *PixelPTEBytesPerRow = 0; *PTEBufferSizeNotExceeded = true; } return PDEAndMetaPTEBytesFrame; } static void dml20v2_DISPCLKDPPCLKDCFCLKDeepSleepPrefetchParametersWatermarksAndPerformanceCalculation( struct display_mode_lib *mode_lib) { unsigned int j, k; mode_lib->vba.WritebackDISPCLK = 0.0; mode_lib->vba.DISPCLKWithRamping = 0; mode_lib->vba.DISPCLKWithoutRamping = 0; mode_lib->vba.GlobalDPPCLK = 0.0; // dml_ml->vba.DISPCLK and dml_ml->vba.DPPCLK Calculation // for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.WritebackEnable[k]) { mode_lib->vba.WritebackDISPCLK = dml_max( mode_lib->vba.WritebackDISPCLK, CalculateWriteBackDISPCLK( mode_lib->vba.WritebackPixelFormat[k], mode_lib->vba.PixelClock[k], mode_lib->vba.WritebackHRatio[k], mode_lib->vba.WritebackVRatio[k], mode_lib->vba.WritebackLumaHTaps[k], mode_lib->vba.WritebackLumaVTaps[k], mode_lib->vba.WritebackChromaHTaps[k], mode_lib->vba.WritebackChromaVTaps[k], mode_lib->vba.WritebackDestinationWidth[k], mode_lib->vba.HTotal[k], mode_lib->vba.WritebackChromaLineBufferWidth)); } } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.HRatio[k] > 1) { mode_lib->vba.PSCL_THROUGHPUT_LUMA[k] = dml_min( mode_lib->vba.MaxDCHUBToPSCLThroughput, mode_lib->vba.MaxPSCLToLBThroughput * mode_lib->vba.HRatio[k] / dml_ceil( mode_lib->vba.htaps[k] / 6.0, 1)); } else { mode_lib->vba.PSCL_THROUGHPUT_LUMA[k] = dml_min( mode_lib->vba.MaxDCHUBToPSCLThroughput, mode_lib->vba.MaxPSCLToLBThroughput); } mode_lib->vba.DPPCLKUsingSingleDPPLuma = mode_lib->vba.PixelClock[k] * dml_max( mode_lib->vba.vtaps[k] / 6.0 * dml_min( 1.0, mode_lib->vba.HRatio[k]), dml_max( mode_lib->vba.HRatio[k] * mode_lib->vba.VRatio[k] / mode_lib->vba.PSCL_THROUGHPUT_LUMA[k], 1.0)); if ((mode_lib->vba.htaps[k] > 6 || mode_lib->vba.vtaps[k] > 6) && mode_lib->vba.DPPCLKUsingSingleDPPLuma < 2 * mode_lib->vba.PixelClock[k]) { mode_lib->vba.DPPCLKUsingSingleDPPLuma = 2 * mode_lib->vba.PixelClock[k]; } if ((mode_lib->vba.SourcePixelFormat[k] != dm_420_8 && mode_lib->vba.SourcePixelFormat[k] != dm_420_10)) { mode_lib->vba.PSCL_THROUGHPUT_CHROMA[k] = 0.0; mode_lib->vba.DPPCLKUsingSingleDPP[k] = mode_lib->vba.DPPCLKUsingSingleDPPLuma; } else { if (mode_lib->vba.HRatio[k] > 1) { mode_lib->vba.PSCL_THROUGHPUT_CHROMA[k] = dml_min( mode_lib->vba.MaxDCHUBToPSCLThroughput, mode_lib->vba.MaxPSCLToLBThroughput * mode_lib->vba.HRatio[k] / 2 / dml_ceil( mode_lib->vba.HTAPsChroma[k] / 6.0, 1.0)); } else { mode_lib->vba.PSCL_THROUGHPUT_CHROMA[k] = dml_min( mode_lib->vba.MaxDCHUBToPSCLThroughput, mode_lib->vba.MaxPSCLToLBThroughput); } mode_lib->vba.DPPCLKUsingSingleDPPChroma = mode_lib->vba.PixelClock[k] * dml_max( mode_lib->vba.VTAPsChroma[k] / 6.0 * dml_min( 1.0, mode_lib->vba.HRatio[k] / 2), dml_max( mode_lib->vba.HRatio[k] * mode_lib->vba.VRatio[k] / 4 / mode_lib->vba.PSCL_THROUGHPUT_CHROMA[k], 1.0)); if ((mode_lib->vba.HTAPsChroma[k] > 6 || mode_lib->vba.VTAPsChroma[k] > 6) && mode_lib->vba.DPPCLKUsingSingleDPPChroma < 2 * mode_lib->vba.PixelClock[k]) { mode_lib->vba.DPPCLKUsingSingleDPPChroma = 2 * mode_lib->vba.PixelClock[k]; } mode_lib->vba.DPPCLKUsingSingleDPP[k] = dml_max( mode_lib->vba.DPPCLKUsingSingleDPPLuma, mode_lib->vba.DPPCLKUsingSingleDPPChroma); } } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.BlendingAndTiming[k] != k) continue; if (mode_lib->vba.ODMCombineEnabled[k]) { mode_lib->vba.DISPCLKWithRamping = dml_max( mode_lib->vba.DISPCLKWithRamping, mode_lib->vba.PixelClock[k] / 2 * (1 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100) * (1 + mode_lib->vba.DISPCLKRampingMargin / 100)); mode_lib->vba.DISPCLKWithoutRamping = dml_max( mode_lib->vba.DISPCLKWithoutRamping, mode_lib->vba.PixelClock[k] / 2 * (1 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100)); } else if (!mode_lib->vba.ODMCombineEnabled[k]) { mode_lib->vba.DISPCLKWithRamping = dml_max( mode_lib->vba.DISPCLKWithRamping, mode_lib->vba.PixelClock[k] * (1 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100) * (1 + mode_lib->vba.DISPCLKRampingMargin / 100)); mode_lib->vba.DISPCLKWithoutRamping = dml_max( mode_lib->vba.DISPCLKWithoutRamping, mode_lib->vba.PixelClock[k] * (1 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100)); } } mode_lib->vba.DISPCLKWithRamping = dml_max( mode_lib->vba.DISPCLKWithRamping, mode_lib->vba.WritebackDISPCLK); mode_lib->vba.DISPCLKWithoutRamping = dml_max( mode_lib->vba.DISPCLKWithoutRamping, mode_lib->vba.WritebackDISPCLK); ASSERT(mode_lib->vba.DISPCLKDPPCLKVCOSpeed != 0); mode_lib->vba.DISPCLKWithRampingRoundedToDFSGranularity = RoundToDFSGranularityUp( mode_lib->vba.DISPCLKWithRamping, mode_lib->vba.DISPCLKDPPCLKVCOSpeed); mode_lib->vba.DISPCLKWithoutRampingRoundedToDFSGranularity = RoundToDFSGranularityUp( mode_lib->vba.DISPCLKWithoutRamping, mode_lib->vba.DISPCLKDPPCLKVCOSpeed); mode_lib->vba.MaxDispclkRoundedToDFSGranularity = RoundToDFSGranularityDown( mode_lib->vba.soc.clock_limits[mode_lib->vba.soc.num_states].dispclk_mhz, mode_lib->vba.DISPCLKDPPCLKVCOSpeed); if (mode_lib->vba.DISPCLKWithoutRampingRoundedToDFSGranularity > mode_lib->vba.MaxDispclkRoundedToDFSGranularity) { mode_lib->vba.DISPCLK_calculated = mode_lib->vba.DISPCLKWithoutRampingRoundedToDFSGranularity; } else if (mode_lib->vba.DISPCLKWithRampingRoundedToDFSGranularity > mode_lib->vba.MaxDispclkRoundedToDFSGranularity) { mode_lib->vba.DISPCLK_calculated = mode_lib->vba.MaxDispclkRoundedToDFSGranularity; } else { mode_lib->vba.DISPCLK_calculated = mode_lib->vba.DISPCLKWithRampingRoundedToDFSGranularity; } DTRACE(" dispclk_mhz (calculated) = %f", mode_lib->vba.DISPCLK_calculated); for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.DPPPerPlane[k] == 0) { mode_lib->vba.DPPCLK_calculated[k] = 0; } else { mode_lib->vba.DPPCLK_calculated[k] = mode_lib->vba.DPPCLKUsingSingleDPP[k] / mode_lib->vba.DPPPerPlane[k] * (1 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100); } mode_lib->vba.GlobalDPPCLK = dml_max( mode_lib->vba.GlobalDPPCLK, mode_lib->vba.DPPCLK_calculated[k]); } mode_lib->vba.GlobalDPPCLK = RoundToDFSGranularityUp( mode_lib->vba.GlobalDPPCLK, mode_lib->vba.DISPCLKDPPCLKVCOSpeed); for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { mode_lib->vba.DPPCLK_calculated[k] = mode_lib->vba.GlobalDPPCLK / 255 * dml_ceil( mode_lib->vba.DPPCLK_calculated[k] * 255 / mode_lib->vba.GlobalDPPCLK, 1); DTRACE(" dppclk_mhz[%i] (calculated) = %f", k, mode_lib->vba.DPPCLK_calculated[k]); } // Urgent Watermark mode_lib->vba.DCCEnabledAnyPlane = false; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) if (mode_lib->vba.DCCEnable[k]) mode_lib->vba.DCCEnabledAnyPlane = true; mode_lib->vba.ReturnBandwidthToDCN = dml_min( mode_lib->vba.ReturnBusWidth * mode_lib->vba.DCFCLK, mode_lib->vba.FabricAndDRAMBandwidth * 1000) * mode_lib->vba.PercentOfIdealDRAMFabricAndSDPPortBWReceivedAfterUrgLatencyPixelDataOnly / 100; mode_lib->vba.ReturnBW = mode_lib->vba.ReturnBandwidthToDCN; mode_lib->vba.ReturnBW = adjust_ReturnBW( mode_lib, mode_lib->vba.ReturnBW, mode_lib->vba.DCCEnabledAnyPlane, mode_lib->vba.ReturnBandwidthToDCN); // Let's do this calculation again?? mode_lib->vba.ReturnBandwidthToDCN = dml_min( mode_lib->vba.ReturnBusWidth * mode_lib->vba.DCFCLK, mode_lib->vba.FabricAndDRAMBandwidth * 1000); mode_lib->vba.ReturnBW = adjust_ReturnBW( mode_lib, mode_lib->vba.ReturnBW, mode_lib->vba.DCCEnabledAnyPlane, mode_lib->vba.ReturnBandwidthToDCN); DTRACE(" dcfclk_mhz = %f", mode_lib->vba.DCFCLK); DTRACE(" return_bw_to_dcn = %f", mode_lib->vba.ReturnBandwidthToDCN); DTRACE(" return_bus_bw = %f", mode_lib->vba.ReturnBW); for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { bool MainPlaneDoesODMCombine = false; if (mode_lib->vba.SourceScan[k] == dm_horz) mode_lib->vba.SwathWidthSingleDPPY[k] = mode_lib->vba.ViewportWidth[k]; else mode_lib->vba.SwathWidthSingleDPPY[k] = mode_lib->vba.ViewportHeight[k]; if (mode_lib->vba.ODMCombineEnabled[k] == true) MainPlaneDoesODMCombine = true; for (j = 0; j < mode_lib->vba.NumberOfActivePlanes; ++j) if (mode_lib->vba.BlendingAndTiming[k] == j && mode_lib->vba.ODMCombineEnabled[j] == true) MainPlaneDoesODMCombine = true; if (MainPlaneDoesODMCombine == true) mode_lib->vba.SwathWidthY[k] = dml_min( (double) mode_lib->vba.SwathWidthSingleDPPY[k], dml_round( mode_lib->vba.HActive[k] / 2.0 * mode_lib->vba.HRatio[k])); else { if (mode_lib->vba.DPPPerPlane[k] == 0) { mode_lib->vba.SwathWidthY[k] = 0; } else { mode_lib->vba.SwathWidthY[k] = mode_lib->vba.SwathWidthSingleDPPY[k] / mode_lib->vba.DPPPerPlane[k]; } } } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.SourcePixelFormat[k] == dm_444_64) { mode_lib->vba.BytePerPixelDETY[k] = 8; mode_lib->vba.BytePerPixelDETC[k] = 0; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_444_32) { mode_lib->vba.BytePerPixelDETY[k] = 4; mode_lib->vba.BytePerPixelDETC[k] = 0; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_444_16) { mode_lib->vba.BytePerPixelDETY[k] = 2; mode_lib->vba.BytePerPixelDETC[k] = 0; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_444_8) { mode_lib->vba.BytePerPixelDETY[k] = 1; mode_lib->vba.BytePerPixelDETC[k] = 0; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_420_8) { mode_lib->vba.BytePerPixelDETY[k] = 1; mode_lib->vba.BytePerPixelDETC[k] = 2; } else { // dm_420_10 mode_lib->vba.BytePerPixelDETY[k] = 4.0 / 3.0; mode_lib->vba.BytePerPixelDETC[k] = 8.0 / 3.0; } } mode_lib->vba.TotalDataReadBandwidth = 0.0; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { mode_lib->vba.ReadBandwidthPlaneLuma[k] = mode_lib->vba.SwathWidthSingleDPPY[k] * dml_ceil(mode_lib->vba.BytePerPixelDETY[k], 1) / (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) * mode_lib->vba.VRatio[k]; mode_lib->vba.ReadBandwidthPlaneChroma[k] = mode_lib->vba.SwathWidthSingleDPPY[k] / 2 * dml_ceil(mode_lib->vba.BytePerPixelDETC[k], 2) / (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) * mode_lib->vba.VRatio[k] / 2; DTRACE( " read_bw[%i] = %fBps", k, mode_lib->vba.ReadBandwidthPlaneLuma[k] + mode_lib->vba.ReadBandwidthPlaneChroma[k]); mode_lib->vba.TotalDataReadBandwidth += mode_lib->vba.ReadBandwidthPlaneLuma[k] + mode_lib->vba.ReadBandwidthPlaneChroma[k]; } mode_lib->vba.TotalDCCActiveDPP = 0; mode_lib->vba.TotalActiveDPP = 0; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { mode_lib->vba.TotalActiveDPP = mode_lib->vba.TotalActiveDPP + mode_lib->vba.DPPPerPlane[k]; if (mode_lib->vba.DCCEnable[k]) mode_lib->vba.TotalDCCActiveDPP = mode_lib->vba.TotalDCCActiveDPP + mode_lib->vba.DPPPerPlane[k]; } mode_lib->vba.UrgentRoundTripAndOutOfOrderLatency = (mode_lib->vba.RoundTripPingLatencyCycles + 32) / mode_lib->vba.DCFCLK + mode_lib->vba.UrgentOutOfOrderReturnPerChannelPixelDataOnly * mode_lib->vba.NumberOfChannels / mode_lib->vba.ReturnBW; mode_lib->vba.LastPixelOfLineExtraWatermark = 0; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.VRatio[k] <= 1.0) mode_lib->vba.DisplayPipeLineDeliveryTimeLuma[k] = (double) mode_lib->vba.SwathWidthY[k] * mode_lib->vba.DPPPerPlane[k] / mode_lib->vba.HRatio[k] / mode_lib->vba.PixelClock[k]; else mode_lib->vba.DisplayPipeLineDeliveryTimeLuma[k] = (double) mode_lib->vba.SwathWidthY[k] / mode_lib->vba.PSCL_THROUGHPUT_LUMA[k] / mode_lib->vba.DPPCLK[k]; if (mode_lib->vba.BytePerPixelDETC[k] == 0) mode_lib->vba.DisplayPipeLineDeliveryTimeChroma[k] = 0.0; else if (mode_lib->vba.VRatio[k] / 2.0 <= 1.0) mode_lib->vba.DisplayPipeLineDeliveryTimeChroma[k] = mode_lib->vba.SwathWidthY[k] / 2.0 * mode_lib->vba.DPPPerPlane[k] / (mode_lib->vba.HRatio[k] / 2.0) / mode_lib->vba.PixelClock[k]; else mode_lib->vba.DisplayPipeLineDeliveryTimeChroma[k] = mode_lib->vba.SwathWidthY[k] / 2.0 / mode_lib->vba.PSCL_THROUGHPUT_CHROMA[k] / mode_lib->vba.DPPCLK[k]; } mode_lib->vba.UrgentExtraLatency = mode_lib->vba.UrgentRoundTripAndOutOfOrderLatency + (mode_lib->vba.TotalActiveDPP * mode_lib->vba.PixelChunkSizeInKByte + mode_lib->vba.TotalDCCActiveDPP * mode_lib->vba.MetaChunkSize) * 1024.0 / mode_lib->vba.ReturnBW; if (mode_lib->vba.GPUVMEnable) mode_lib->vba.UrgentExtraLatency += mode_lib->vba.TotalActiveDPP * mode_lib->vba.PTEGroupSize / mode_lib->vba.ReturnBW; mode_lib->vba.UrgentWatermark = mode_lib->vba.UrgentLatencyPixelDataOnly + mode_lib->vba.LastPixelOfLineExtraWatermark + mode_lib->vba.UrgentExtraLatency; DTRACE(" urgent_extra_latency = %fus", mode_lib->vba.UrgentExtraLatency); DTRACE(" wm_urgent = %fus", mode_lib->vba.UrgentWatermark); mode_lib->vba.UrgentLatency = mode_lib->vba.UrgentLatencyPixelDataOnly; mode_lib->vba.TotalActiveWriteback = 0; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.WritebackEnable[k]) mode_lib->vba.TotalActiveWriteback = mode_lib->vba.TotalActiveWriteback + mode_lib->vba.ActiveWritebacksPerPlane[k]; } if (mode_lib->vba.TotalActiveWriteback <= 1) mode_lib->vba.WritebackUrgentWatermark = mode_lib->vba.WritebackLatency; else mode_lib->vba.WritebackUrgentWatermark = mode_lib->vba.WritebackLatency + mode_lib->vba.WritebackChunkSize * 1024.0 / 32 / mode_lib->vba.SOCCLK; DTRACE(" wm_wb_urgent = %fus", mode_lib->vba.WritebackUrgentWatermark); // NB P-State/DRAM Clock Change Watermark mode_lib->vba.DRAMClockChangeWatermark = mode_lib->vba.DRAMClockChangeLatency + mode_lib->vba.UrgentWatermark; DTRACE(" wm_pstate_change = %fus", mode_lib->vba.DRAMClockChangeWatermark); DTRACE(" calculating wb pstate watermark"); DTRACE(" total wb outputs %d", mode_lib->vba.TotalActiveWriteback); DTRACE(" socclk frequency %f Mhz", mode_lib->vba.SOCCLK); if (mode_lib->vba.TotalActiveWriteback <= 1) mode_lib->vba.WritebackDRAMClockChangeWatermark = mode_lib->vba.DRAMClockChangeLatency + mode_lib->vba.WritebackLatency; else mode_lib->vba.WritebackDRAMClockChangeWatermark = mode_lib->vba.DRAMClockChangeLatency + mode_lib->vba.WritebackLatency + mode_lib->vba.WritebackChunkSize * 1024.0 / 32 / mode_lib->vba.SOCCLK; DTRACE(" wm_wb_pstate %fus", mode_lib->vba.WritebackDRAMClockChangeWatermark); // Stutter Efficiency for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { mode_lib->vba.LinesInDETY[k] = mode_lib->vba.DETBufferSizeY[k] / mode_lib->vba.BytePerPixelDETY[k] / mode_lib->vba.SwathWidthY[k]; mode_lib->vba.LinesInDETYRoundedDownToSwath[k] = dml_floor( mode_lib->vba.LinesInDETY[k], mode_lib->vba.SwathHeightY[k]); mode_lib->vba.FullDETBufferingTimeY[k] = mode_lib->vba.LinesInDETYRoundedDownToSwath[k] * (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) / mode_lib->vba.VRatio[k]; if (mode_lib->vba.BytePerPixelDETC[k] > 0) { mode_lib->vba.LinesInDETC[k] = mode_lib->vba.DETBufferSizeC[k] / mode_lib->vba.BytePerPixelDETC[k] / (mode_lib->vba.SwathWidthY[k] / 2); mode_lib->vba.LinesInDETCRoundedDownToSwath[k] = dml_floor( mode_lib->vba.LinesInDETC[k], mode_lib->vba.SwathHeightC[k]); mode_lib->vba.FullDETBufferingTimeC[k] = mode_lib->vba.LinesInDETCRoundedDownToSwath[k] * (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) / (mode_lib->vba.VRatio[k] / 2); } else { mode_lib->vba.LinesInDETC[k] = 0; mode_lib->vba.LinesInDETCRoundedDownToSwath[k] = 0; mode_lib->vba.FullDETBufferingTimeC[k] = 999999; } } mode_lib->vba.MinFullDETBufferingTime = 999999.0; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.FullDETBufferingTimeY[k] < mode_lib->vba.MinFullDETBufferingTime) { mode_lib->vba.MinFullDETBufferingTime = mode_lib->vba.FullDETBufferingTimeY[k]; mode_lib->vba.FrameTimeForMinFullDETBufferingTime = (double) mode_lib->vba.VTotal[k] * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]; } if (mode_lib->vba.FullDETBufferingTimeC[k] < mode_lib->vba.MinFullDETBufferingTime) { mode_lib->vba.MinFullDETBufferingTime = mode_lib->vba.FullDETBufferingTimeC[k]; mode_lib->vba.FrameTimeForMinFullDETBufferingTime = (double) mode_lib->vba.VTotal[k] * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]; } } mode_lib->vba.AverageReadBandwidthGBytePerSecond = 0.0; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.DCCEnable[k]) { mode_lib->vba.AverageReadBandwidthGBytePerSecond = mode_lib->vba.AverageReadBandwidthGBytePerSecond + mode_lib->vba.ReadBandwidthPlaneLuma[k] / mode_lib->vba.DCCRate[k] / 1000 + mode_lib->vba.ReadBandwidthPlaneChroma[k] / mode_lib->vba.DCCRate[k] / 1000; } else { mode_lib->vba.AverageReadBandwidthGBytePerSecond = mode_lib->vba.AverageReadBandwidthGBytePerSecond + mode_lib->vba.ReadBandwidthPlaneLuma[k] / 1000 + mode_lib->vba.ReadBandwidthPlaneChroma[k] / 1000; } if (mode_lib->vba.DCCEnable[k]) { mode_lib->vba.AverageReadBandwidthGBytePerSecond = mode_lib->vba.AverageReadBandwidthGBytePerSecond + mode_lib->vba.ReadBandwidthPlaneLuma[k] / 1000 / 256 + mode_lib->vba.ReadBandwidthPlaneChroma[k] / 1000 / 256; } if (mode_lib->vba.GPUVMEnable) { mode_lib->vba.AverageReadBandwidthGBytePerSecond = mode_lib->vba.AverageReadBandwidthGBytePerSecond + mode_lib->vba.ReadBandwidthPlaneLuma[k] / 1000 / 512 + mode_lib->vba.ReadBandwidthPlaneChroma[k] / 1000 / 512; } } mode_lib->vba.PartOfBurstThatFitsInROB = dml_min( mode_lib->vba.MinFullDETBufferingTime * mode_lib->vba.TotalDataReadBandwidth, mode_lib->vba.ROBBufferSizeInKByte * 1024 * mode_lib->vba.TotalDataReadBandwidth / (mode_lib->vba.AverageReadBandwidthGBytePerSecond * 1000)); mode_lib->vba.StutterBurstTime = mode_lib->vba.PartOfBurstThatFitsInROB * (mode_lib->vba.AverageReadBandwidthGBytePerSecond * 1000) / mode_lib->vba.TotalDataReadBandwidth / mode_lib->vba.ReturnBW + (mode_lib->vba.MinFullDETBufferingTime * mode_lib->vba.TotalDataReadBandwidth - mode_lib->vba.PartOfBurstThatFitsInROB) / (mode_lib->vba.DCFCLK * 64); if (mode_lib->vba.TotalActiveWriteback == 0) { mode_lib->vba.StutterEfficiencyNotIncludingVBlank = (1 - (mode_lib->vba.SRExitTime + mode_lib->vba.StutterBurstTime) / mode_lib->vba.MinFullDETBufferingTime) * 100; } else { mode_lib->vba.StutterEfficiencyNotIncludingVBlank = 0; } mode_lib->vba.SmallestVBlank = 999999; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.SynchronizedVBlank || mode_lib->vba.NumberOfActivePlanes == 1) { mode_lib->vba.VBlankTime = (double) (mode_lib->vba.VTotal[k] - mode_lib->vba.VActive[k]) * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]; } else { mode_lib->vba.VBlankTime = 0; } mode_lib->vba.SmallestVBlank = dml_min( mode_lib->vba.SmallestVBlank, mode_lib->vba.VBlankTime); } mode_lib->vba.StutterEfficiency = (mode_lib->vba.StutterEfficiencyNotIncludingVBlank / 100 * (mode_lib->vba.FrameTimeForMinFullDETBufferingTime - mode_lib->vba.SmallestVBlank) + mode_lib->vba.SmallestVBlank) / mode_lib->vba.FrameTimeForMinFullDETBufferingTime * 100; // dml_ml->vba.DCFCLK Deep Sleep mode_lib->vba.DCFCLKDeepSleep = 8.0; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; k++) { if (mode_lib->vba.BytePerPixelDETC[k] > 0) { mode_lib->vba.DCFCLKDeepSleepPerPlane[k] = dml_max( 1.1 * mode_lib->vba.SwathWidthY[k] * dml_ceil( mode_lib->vba.BytePerPixelDETY[k], 1) / 32 / mode_lib->vba.DisplayPipeLineDeliveryTimeLuma[k], 1.1 * mode_lib->vba.SwathWidthY[k] / 2.0 * dml_ceil( mode_lib->vba.BytePerPixelDETC[k], 2) / 32 / mode_lib->vba.DisplayPipeLineDeliveryTimeChroma[k]); } else mode_lib->vba.DCFCLKDeepSleepPerPlane[k] = 1.1 * mode_lib->vba.SwathWidthY[k] * dml_ceil(mode_lib->vba.BytePerPixelDETY[k], 1) / 64.0 / mode_lib->vba.DisplayPipeLineDeliveryTimeLuma[k]; mode_lib->vba.DCFCLKDeepSleepPerPlane[k] = dml_max( mode_lib->vba.DCFCLKDeepSleepPerPlane[k], mode_lib->vba.PixelClock[k] / 16.0); mode_lib->vba.DCFCLKDeepSleep = dml_max( mode_lib->vba.DCFCLKDeepSleep, mode_lib->vba.DCFCLKDeepSleepPerPlane[k]); DTRACE( " dcfclk_deepsleep_per_plane[%i] = %fMHz", k, mode_lib->vba.DCFCLKDeepSleepPerPlane[k]); } DTRACE(" dcfclk_deepsleep_mhz = %fMHz", mode_lib->vba.DCFCLKDeepSleep); // Stutter Watermark mode_lib->vba.StutterExitWatermark = mode_lib->vba.SRExitTime + mode_lib->vba.LastPixelOfLineExtraWatermark + mode_lib->vba.UrgentExtraLatency + 10 / mode_lib->vba.DCFCLKDeepSleep; mode_lib->vba.StutterEnterPlusExitWatermark = mode_lib->vba.SREnterPlusExitTime + mode_lib->vba.LastPixelOfLineExtraWatermark + mode_lib->vba.UrgentExtraLatency; DTRACE(" wm_cstate_exit = %fus", mode_lib->vba.StutterExitWatermark); DTRACE(" wm_cstate_enter_exit = %fus", mode_lib->vba.StutterEnterPlusExitWatermark); // Urgent Latency Supported for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { mode_lib->vba.EffectiveDETPlusLBLinesLuma = dml_floor( mode_lib->vba.LinesInDETY[k] + dml_min( mode_lib->vba.LinesInDETY[k] * mode_lib->vba.DPPCLK[k] * mode_lib->vba.BytePerPixelDETY[k] * mode_lib->vba.PSCL_THROUGHPUT_LUMA[k] / (mode_lib->vba.ReturnBW / mode_lib->vba.DPPPerPlane[k]), (double) mode_lib->vba.EffectiveLBLatencyHidingSourceLinesLuma), mode_lib->vba.SwathHeightY[k]); mode_lib->vba.UrgentLatencySupportUsLuma = mode_lib->vba.EffectiveDETPlusLBLinesLuma * (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) / mode_lib->vba.VRatio[k] - mode_lib->vba.EffectiveDETPlusLBLinesLuma * mode_lib->vba.SwathWidthY[k] * mode_lib->vba.BytePerPixelDETY[k] / (mode_lib->vba.ReturnBW / mode_lib->vba.DPPPerPlane[k]); if (mode_lib->vba.BytePerPixelDETC[k] > 0) { mode_lib->vba.EffectiveDETPlusLBLinesChroma = dml_floor( mode_lib->vba.LinesInDETC[k] + dml_min( mode_lib->vba.LinesInDETC[k] * mode_lib->vba.DPPCLK[k] * mode_lib->vba.BytePerPixelDETC[k] * mode_lib->vba.PSCL_THROUGHPUT_CHROMA[k] / (mode_lib->vba.ReturnBW / mode_lib->vba.DPPPerPlane[k]), (double) mode_lib->vba.EffectiveLBLatencyHidingSourceLinesChroma), mode_lib->vba.SwathHeightC[k]); mode_lib->vba.UrgentLatencySupportUsChroma = mode_lib->vba.EffectiveDETPlusLBLinesChroma * (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) / (mode_lib->vba.VRatio[k] / 2) - mode_lib->vba.EffectiveDETPlusLBLinesChroma * (mode_lib->vba.SwathWidthY[k] / 2) * mode_lib->vba.BytePerPixelDETC[k] / (mode_lib->vba.ReturnBW / mode_lib->vba.DPPPerPlane[k]); mode_lib->vba.UrgentLatencySupportUs[k] = dml_min( mode_lib->vba.UrgentLatencySupportUsLuma, mode_lib->vba.UrgentLatencySupportUsChroma); } else { mode_lib->vba.UrgentLatencySupportUs[k] = mode_lib->vba.UrgentLatencySupportUsLuma; } } mode_lib->vba.MinUrgentLatencySupportUs = 999999; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { mode_lib->vba.MinUrgentLatencySupportUs = dml_min( mode_lib->vba.MinUrgentLatencySupportUs, mode_lib->vba.UrgentLatencySupportUs[k]); } // Non-Urgent Latency Tolerance mode_lib->vba.NonUrgentLatencyTolerance = mode_lib->vba.MinUrgentLatencySupportUs - mode_lib->vba.UrgentWatermark; // DSCCLK for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if ((mode_lib->vba.BlendingAndTiming[k] != k) || !mode_lib->vba.DSCEnabled[k]) { mode_lib->vba.DSCCLK_calculated[k] = 0.0; } else { if (mode_lib->vba.OutputFormat[k] == dm_420 || mode_lib->vba.OutputFormat[k] == dm_n422) mode_lib->vba.DSCFormatFactor = 2; else mode_lib->vba.DSCFormatFactor = 1; if (mode_lib->vba.ODMCombineEnabled[k]) mode_lib->vba.DSCCLK_calculated[k] = mode_lib->vba.PixelClockBackEnd[k] / 6 / mode_lib->vba.DSCFormatFactor / (1 - mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100); else mode_lib->vba.DSCCLK_calculated[k] = mode_lib->vba.PixelClockBackEnd[k] / 3 / mode_lib->vba.DSCFormatFactor / (1 - mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100); } } // DSC Delay // TODO for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { double bpp = mode_lib->vba.OutputBpp[k]; unsigned int slices = mode_lib->vba.NumberOfDSCSlices[k]; if (mode_lib->vba.DSCEnabled[k] && bpp != 0) { if (!mode_lib->vba.ODMCombineEnabled[k]) { mode_lib->vba.DSCDelay[k] = dscceComputeDelay( mode_lib->vba.DSCInputBitPerComponent[k], bpp, dml_ceil( (double) mode_lib->vba.HActive[k] / mode_lib->vba.NumberOfDSCSlices[k], 1), slices, mode_lib->vba.OutputFormat[k]) + dscComputeDelay( mode_lib->vba.OutputFormat[k]); } else { mode_lib->vba.DSCDelay[k] = 2 * (dscceComputeDelay( mode_lib->vba.DSCInputBitPerComponent[k], bpp, dml_ceil( (double) mode_lib->vba.HActive[k] / mode_lib->vba.NumberOfDSCSlices[k], 1), slices / 2.0, mode_lib->vba.OutputFormat[k]) + dscComputeDelay( mode_lib->vba.OutputFormat[k])); } mode_lib->vba.DSCDelay[k] = mode_lib->vba.DSCDelay[k] * mode_lib->vba.PixelClock[k] / mode_lib->vba.PixelClockBackEnd[k]; } else { mode_lib->vba.DSCDelay[k] = 0; } } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) for (j = 0; j < mode_lib->vba.NumberOfActivePlanes; ++j) // NumberOfPlanes if (j != k && mode_lib->vba.BlendingAndTiming[k] == j && mode_lib->vba.DSCEnabled[j]) mode_lib->vba.DSCDelay[k] = mode_lib->vba.DSCDelay[j]; // Prefetch for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { unsigned int PDEAndMetaPTEBytesFrameY; unsigned int PixelPTEBytesPerRowY; unsigned int MetaRowByteY; unsigned int MetaRowByteC; unsigned int PDEAndMetaPTEBytesFrameC; unsigned int PixelPTEBytesPerRowC; Calculate256BBlockSizes( mode_lib->vba.SourcePixelFormat[k], mode_lib->vba.SurfaceTiling[k], dml_ceil(mode_lib->vba.BytePerPixelDETY[k], 1), dml_ceil(mode_lib->vba.BytePerPixelDETC[k], 2), &mode_lib->vba.BlockHeight256BytesY[k], &mode_lib->vba.BlockHeight256BytesC[k], &mode_lib->vba.BlockWidth256BytesY[k], &mode_lib->vba.BlockWidth256BytesC[k]); PDEAndMetaPTEBytesFrameY = CalculateVMAndRowBytes( mode_lib, mode_lib->vba.DCCEnable[k], mode_lib->vba.BlockHeight256BytesY[k], mode_lib->vba.BlockWidth256BytesY[k], mode_lib->vba.SourcePixelFormat[k], mode_lib->vba.SurfaceTiling[k], dml_ceil(mode_lib->vba.BytePerPixelDETY[k], 1), mode_lib->vba.SourceScan[k], mode_lib->vba.ViewportWidth[k], mode_lib->vba.ViewportHeight[k], mode_lib->vba.SwathWidthY[k], mode_lib->vba.GPUVMEnable, mode_lib->vba.VMMPageSize, mode_lib->vba.PTEBufferSizeInRequestsLuma, mode_lib->vba.PDEProcessingBufIn64KBReqs, mode_lib->vba.PitchY[k], mode_lib->vba.DCCMetaPitchY[k], &mode_lib->vba.MacroTileWidthY[k], &MetaRowByteY, &PixelPTEBytesPerRowY, &mode_lib->vba.PTEBufferSizeNotExceeded[mode_lib->vba.VoltageLevel][0], &mode_lib->vba.dpte_row_height[k], &mode_lib->vba.meta_row_height[k]); mode_lib->vba.PrefetchSourceLinesY[k] = CalculatePrefetchSourceLines( mode_lib, mode_lib->vba.VRatio[k], mode_lib->vba.vtaps[k], mode_lib->vba.Interlace[k], mode_lib->vba.ProgressiveToInterlaceUnitInOPP, mode_lib->vba.SwathHeightY[k], mode_lib->vba.ViewportYStartY[k], &mode_lib->vba.VInitPreFillY[k], &mode_lib->vba.MaxNumSwathY[k]); if ((mode_lib->vba.SourcePixelFormat[k] != dm_444_64 && mode_lib->vba.SourcePixelFormat[k] != dm_444_32 && mode_lib->vba.SourcePixelFormat[k] != dm_444_16 && mode_lib->vba.SourcePixelFormat[k] != dm_444_8)) { PDEAndMetaPTEBytesFrameC = CalculateVMAndRowBytes( mode_lib, mode_lib->vba.DCCEnable[k], mode_lib->vba.BlockHeight256BytesC[k], mode_lib->vba.BlockWidth256BytesC[k], mode_lib->vba.SourcePixelFormat[k], mode_lib->vba.SurfaceTiling[k], dml_ceil( mode_lib->vba.BytePerPixelDETC[k], 2), mode_lib->vba.SourceScan[k], mode_lib->vba.ViewportWidth[k] / 2, mode_lib->vba.ViewportHeight[k] / 2, mode_lib->vba.SwathWidthY[k] / 2, mode_lib->vba.GPUVMEnable, mode_lib->vba.VMMPageSize, mode_lib->vba.PTEBufferSizeInRequestsLuma, mode_lib->vba.PDEProcessingBufIn64KBReqs, mode_lib->vba.PitchC[k], 0, &mode_lib->vba.MacroTileWidthC[k], &MetaRowByteC, &PixelPTEBytesPerRowC, &mode_lib->vba.PTEBufferSizeNotExceeded[mode_lib->vba.VoltageLevel][0], &mode_lib->vba.dpte_row_height_chroma[k], &mode_lib->vba.meta_row_height_chroma[k]); mode_lib->vba.PrefetchSourceLinesC[k] = CalculatePrefetchSourceLines( mode_lib, mode_lib->vba.VRatio[k] / 2, mode_lib->vba.VTAPsChroma[k], mode_lib->vba.Interlace[k], mode_lib->vba.ProgressiveToInterlaceUnitInOPP, mode_lib->vba.SwathHeightC[k], mode_lib->vba.ViewportYStartC[k], &mode_lib->vba.VInitPreFillC[k], &mode_lib->vba.MaxNumSwathC[k]); } else { PixelPTEBytesPerRowC = 0; PDEAndMetaPTEBytesFrameC = 0; MetaRowByteC = 0; mode_lib->vba.MaxNumSwathC[k] = 0; mode_lib->vba.PrefetchSourceLinesC[k] = 0; } mode_lib->vba.PixelPTEBytesPerRow[k] = PixelPTEBytesPerRowY + PixelPTEBytesPerRowC; mode_lib->vba.PDEAndMetaPTEBytesFrame[k] = PDEAndMetaPTEBytesFrameY + PDEAndMetaPTEBytesFrameC; mode_lib->vba.MetaRowByte[k] = MetaRowByteY + MetaRowByteC; CalculateActiveRowBandwidth( mode_lib->vba.GPUVMEnable, mode_lib->vba.SourcePixelFormat[k], mode_lib->vba.VRatio[k], mode_lib->vba.DCCEnable[k], mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k], MetaRowByteY, MetaRowByteC, mode_lib->vba.meta_row_height[k], mode_lib->vba.meta_row_height_chroma[k], PixelPTEBytesPerRowY, PixelPTEBytesPerRowC, mode_lib->vba.dpte_row_height[k], mode_lib->vba.dpte_row_height_chroma[k], &mode_lib->vba.meta_row_bw[k], &mode_lib->vba.dpte_row_bw[k], &mode_lib->vba.qual_row_bw[k]); } mode_lib->vba.TCalc = 24.0 / mode_lib->vba.DCFCLKDeepSleep; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.BlendingAndTiming[k] == k) { if (mode_lib->vba.WritebackEnable[k] == true) { mode_lib->vba.WritebackDelay[mode_lib->vba.VoltageLevel][k] = mode_lib->vba.WritebackLatency + CalculateWriteBackDelay( mode_lib->vba.WritebackPixelFormat[k], mode_lib->vba.WritebackHRatio[k], mode_lib->vba.WritebackVRatio[k], mode_lib->vba.WritebackLumaHTaps[k], mode_lib->vba.WritebackLumaVTaps[k], mode_lib->vba.WritebackChromaHTaps[k], mode_lib->vba.WritebackChromaVTaps[k], mode_lib->vba.WritebackDestinationWidth[k]) / mode_lib->vba.DISPCLK; } else mode_lib->vba.WritebackDelay[mode_lib->vba.VoltageLevel][k] = 0; for (j = 0; j < mode_lib->vba.NumberOfActivePlanes; ++j) { if (mode_lib->vba.BlendingAndTiming[j] == k && mode_lib->vba.WritebackEnable[j] == true) { mode_lib->vba.WritebackDelay[mode_lib->vba.VoltageLevel][k] = dml_max( mode_lib->vba.WritebackDelay[mode_lib->vba.VoltageLevel][k], mode_lib->vba.WritebackLatency + CalculateWriteBackDelay( mode_lib->vba.WritebackPixelFormat[j], mode_lib->vba.WritebackHRatio[j], mode_lib->vba.WritebackVRatio[j], mode_lib->vba.WritebackLumaHTaps[j], mode_lib->vba.WritebackLumaVTaps[j], mode_lib->vba.WritebackChromaHTaps[j], mode_lib->vba.WritebackChromaVTaps[j], mode_lib->vba.WritebackDestinationWidth[j]) / mode_lib->vba.DISPCLK); } } } } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) for (j = 0; j < mode_lib->vba.NumberOfActivePlanes; ++j) if (mode_lib->vba.BlendingAndTiming[k] == j) mode_lib->vba.WritebackDelay[mode_lib->vba.VoltageLevel][k] = mode_lib->vba.WritebackDelay[mode_lib->vba.VoltageLevel][j]; mode_lib->vba.VStartupLines = 13; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { mode_lib->vba.MaxVStartupLines[k] = mode_lib->vba.VTotal[k] - mode_lib->vba.VActive[k] - dml_max( 1.0, dml_ceil( mode_lib->vba.WritebackDelay[mode_lib->vba.VoltageLevel][k] / (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]), 1)); } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) mode_lib->vba.MaximumMaxVStartupLines = dml_max( mode_lib->vba.MaximumMaxVStartupLines, mode_lib->vba.MaxVStartupLines[k]); for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { mode_lib->vba.cursor_bw[k] = 0.0; for (j = 0; j < mode_lib->vba.NumberOfCursors[k]; ++j) mode_lib->vba.cursor_bw[k] += mode_lib->vba.CursorWidth[k][j] * mode_lib->vba.CursorBPP[k][j] / 8.0 / (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) * mode_lib->vba.VRatio[k]; } do { double MaxTotalRDBandwidth = 0; bool DestinationLineTimesForPrefetchLessThan2 = false; bool VRatioPrefetchMoreThan4 = false; bool prefetch_vm_bw_valid = true; bool prefetch_row_bw_valid = true; double TWait = CalculateTWait( mode_lib->vba.PrefetchMode[mode_lib->vba.VoltageLevel][mode_lib->vba.maxMpcComb], mode_lib->vba.DRAMClockChangeLatency, mode_lib->vba.UrgentLatencyPixelDataOnly, mode_lib->vba.SREnterPlusExitTime); for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.XFCEnabled[k] == true) { mode_lib->vba.XFCRemoteSurfaceFlipDelay = CalculateRemoteSurfaceFlipDelay( mode_lib, mode_lib->vba.VRatio[k], mode_lib->vba.SwathWidthY[k], dml_ceil( mode_lib->vba.BytePerPixelDETY[k], 1), mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k], mode_lib->vba.XFCTSlvVupdateOffset, mode_lib->vba.XFCTSlvVupdateWidth, mode_lib->vba.XFCTSlvVreadyOffset, mode_lib->vba.XFCXBUFLatencyTolerance, mode_lib->vba.XFCFillBWOverhead, mode_lib->vba.XFCSlvChunkSize, mode_lib->vba.XFCBusTransportTime, mode_lib->vba.TCalc, TWait, &mode_lib->vba.SrcActiveDrainRate, &mode_lib->vba.TInitXFill, &mode_lib->vba.TslvChk); } else { mode_lib->vba.XFCRemoteSurfaceFlipDelay = 0; } CalculateDelayAfterScaler(mode_lib, mode_lib->vba.ReturnBW, mode_lib->vba.ReadBandwidthPlaneLuma[k], mode_lib->vba.ReadBandwidthPlaneChroma[k], mode_lib->vba.TotalDataReadBandwidth, mode_lib->vba.DisplayPipeLineDeliveryTimeLuma[k], mode_lib->vba.DisplayPipeLineDeliveryTimeChroma[k], mode_lib->vba.DPPCLK[k], mode_lib->vba.DISPCLK, mode_lib->vba.PixelClock[k], mode_lib->vba.DSCDelay[k], mode_lib->vba.DPPPerPlane[k], mode_lib->vba.ScalerEnabled[k], mode_lib->vba.NumberOfCursors[k], mode_lib->vba.DPPCLKDelaySubtotal, mode_lib->vba.DPPCLKDelaySCL, mode_lib->vba.DPPCLKDelaySCLLBOnly, mode_lib->vba.DPPCLKDelayCNVCFormater, mode_lib->vba.DPPCLKDelayCNVCCursor, mode_lib->vba.DISPCLKDelaySubtotal, mode_lib->vba.SwathWidthY[k] / mode_lib->vba.HRatio[k], mode_lib->vba.OutputFormat[k], mode_lib->vba.HTotal[k], mode_lib->vba.SwathWidthSingleDPPY[k], mode_lib->vba.BytePerPixelDETY[k], mode_lib->vba.BytePerPixelDETC[k], mode_lib->vba.SwathHeightY[k], mode_lib->vba.SwathHeightC[k], mode_lib->vba.Interlace[k], mode_lib->vba.ProgressiveToInterlaceUnitInOPP, &mode_lib->vba.DSTXAfterScaler[k], &mode_lib->vba.DSTYAfterScaler[k]); mode_lib->vba.ErrorResult[k] = CalculatePrefetchSchedule( mode_lib, mode_lib->vba.DPPCLK[k], mode_lib->vba.DISPCLK, mode_lib->vba.PixelClock[k], mode_lib->vba.DCFCLKDeepSleep, mode_lib->vba.DPPPerPlane[k], mode_lib->vba.NumberOfCursors[k], mode_lib->vba.VTotal[k] - mode_lib->vba.VActive[k], mode_lib->vba.HTotal[k], mode_lib->vba.MaxInterDCNTileRepeaters, dml_min( mode_lib->vba.VStartupLines, mode_lib->vba.MaxVStartupLines[k]), mode_lib->vba.GPUVMMaxPageTableLevels, mode_lib->vba.GPUVMEnable, mode_lib->vba.DynamicMetadataEnable[k], mode_lib->vba.DynamicMetadataLinesBeforeActiveRequired[k], mode_lib->vba.DynamicMetadataTransmittedBytes[k], mode_lib->vba.DCCEnable[k], mode_lib->vba.UrgentLatencyPixelDataOnly, mode_lib->vba.UrgentExtraLatency, mode_lib->vba.TCalc, mode_lib->vba.PDEAndMetaPTEBytesFrame[k], mode_lib->vba.MetaRowByte[k], mode_lib->vba.PixelPTEBytesPerRow[k], mode_lib->vba.PrefetchSourceLinesY[k], mode_lib->vba.SwathWidthY[k], mode_lib->vba.BytePerPixelDETY[k], mode_lib->vba.VInitPreFillY[k], mode_lib->vba.MaxNumSwathY[k], mode_lib->vba.PrefetchSourceLinesC[k], mode_lib->vba.BytePerPixelDETC[k], mode_lib->vba.VInitPreFillC[k], mode_lib->vba.MaxNumSwathC[k], mode_lib->vba.SwathHeightY[k], mode_lib->vba.SwathHeightC[k], TWait, mode_lib->vba.XFCEnabled[k], mode_lib->vba.XFCRemoteSurfaceFlipDelay, mode_lib->vba.Interlace[k], mode_lib->vba.ProgressiveToInterlaceUnitInOPP, mode_lib->vba.DSTXAfterScaler[k], mode_lib->vba.DSTYAfterScaler[k], &mode_lib->vba.DestinationLinesForPrefetch[k], &mode_lib->vba.PrefetchBandwidth[k], &mode_lib->vba.DestinationLinesToRequestVMInVBlank[k], &mode_lib->vba.DestinationLinesToRequestRowInVBlank[k], &mode_lib->vba.VRatioPrefetchY[k], &mode_lib->vba.VRatioPrefetchC[k], &mode_lib->vba.RequiredPrefetchPixDataBWLuma[k], &mode_lib->vba.Tno_bw[k], &mode_lib->vba.VUpdateOffsetPix[k], &mode_lib->vba.VUpdateWidthPix[k], &mode_lib->vba.VReadyOffsetPix[k]); if (mode_lib->vba.BlendingAndTiming[k] == k) { mode_lib->vba.VStartup[k] = dml_min( mode_lib->vba.VStartupLines, mode_lib->vba.MaxVStartupLines[k]); if (mode_lib->vba.VStartupRequiredWhenNotEnoughTimeForDynamicMetadata != 0) { mode_lib->vba.VStartup[k] = mode_lib->vba.VStartupRequiredWhenNotEnoughTimeForDynamicMetadata; } } else { mode_lib->vba.VStartup[k] = dml_min( mode_lib->vba.VStartupLines, mode_lib->vba.MaxVStartupLines[mode_lib->vba.BlendingAndTiming[k]]); } } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.PDEAndMetaPTEBytesFrame[k] == 0) mode_lib->vba.prefetch_vm_bw[k] = 0; else if (mode_lib->vba.DestinationLinesToRequestVMInVBlank[k] > 0) { mode_lib->vba.prefetch_vm_bw[k] = (double) mode_lib->vba.PDEAndMetaPTEBytesFrame[k] / (mode_lib->vba.DestinationLinesToRequestVMInVBlank[k] * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]); } else { mode_lib->vba.prefetch_vm_bw[k] = 0; prefetch_vm_bw_valid = false; } if (mode_lib->vba.MetaRowByte[k] + mode_lib->vba.PixelPTEBytesPerRow[k] == 0) mode_lib->vba.prefetch_row_bw[k] = 0; else if (mode_lib->vba.DestinationLinesToRequestRowInVBlank[k] > 0) { mode_lib->vba.prefetch_row_bw[k] = (double) (mode_lib->vba.MetaRowByte[k] + mode_lib->vba.PixelPTEBytesPerRow[k]) / (mode_lib->vba.DestinationLinesToRequestRowInVBlank[k] * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]); } else { mode_lib->vba.prefetch_row_bw[k] = 0; prefetch_row_bw_valid = false; } MaxTotalRDBandwidth = MaxTotalRDBandwidth + mode_lib->vba.cursor_bw[k] + dml_max( mode_lib->vba.prefetch_vm_bw[k], dml_max( mode_lib->vba.prefetch_row_bw[k], dml_max( mode_lib->vba.ReadBandwidthPlaneLuma[k] + mode_lib->vba.ReadBandwidthPlaneChroma[k], mode_lib->vba.RequiredPrefetchPixDataBWLuma[k]) + mode_lib->vba.meta_row_bw[k] + mode_lib->vba.dpte_row_bw[k])); if (mode_lib->vba.DestinationLinesForPrefetch[k] < 2) DestinationLineTimesForPrefetchLessThan2 = true; if (mode_lib->vba.VRatioPrefetchY[k] > 4 || mode_lib->vba.VRatioPrefetchC[k] > 4) VRatioPrefetchMoreThan4 = true; } if (MaxTotalRDBandwidth <= mode_lib->vba.ReturnBW && prefetch_vm_bw_valid && prefetch_row_bw_valid && !VRatioPrefetchMoreThan4 && !DestinationLineTimesForPrefetchLessThan2) mode_lib->vba.PrefetchModeSupported = true; else { mode_lib->vba.PrefetchModeSupported = false; dml_print( "DML: CalculatePrefetchSchedule ***failed***. Bandwidth violation. Results are NOT valid\n"); } if (mode_lib->vba.PrefetchModeSupported == true) { double final_flip_bw[DC__NUM_DPP__MAX]; unsigned int ImmediateFlipBytes[DC__NUM_DPP__MAX]; double total_dcn_read_bw_with_flip = 0; mode_lib->vba.BandwidthAvailableForImmediateFlip = mode_lib->vba.ReturnBW; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { mode_lib->vba.BandwidthAvailableForImmediateFlip = mode_lib->vba.BandwidthAvailableForImmediateFlip - mode_lib->vba.cursor_bw[k] - dml_max( mode_lib->vba.ReadBandwidthPlaneLuma[k] + mode_lib->vba.ReadBandwidthPlaneChroma[k] + mode_lib->vba.qual_row_bw[k], mode_lib->vba.PrefetchBandwidth[k]); } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { ImmediateFlipBytes[k] = 0; if ((mode_lib->vba.SourcePixelFormat[k] != dm_420_8 && mode_lib->vba.SourcePixelFormat[k] != dm_420_10)) { ImmediateFlipBytes[k] = mode_lib->vba.PDEAndMetaPTEBytesFrame[k] + mode_lib->vba.MetaRowByte[k] + mode_lib->vba.PixelPTEBytesPerRow[k]; } } mode_lib->vba.TotImmediateFlipBytes = 0; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if ((mode_lib->vba.SourcePixelFormat[k] != dm_420_8 && mode_lib->vba.SourcePixelFormat[k] != dm_420_10)) { mode_lib->vba.TotImmediateFlipBytes = mode_lib->vba.TotImmediateFlipBytes + ImmediateFlipBytes[k]; } } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { CalculateFlipSchedule( mode_lib, mode_lib->vba.UrgentExtraLatency, mode_lib->vba.UrgentLatencyPixelDataOnly, mode_lib->vba.GPUVMMaxPageTableLevels, mode_lib->vba.GPUVMEnable, mode_lib->vba.BandwidthAvailableForImmediateFlip, mode_lib->vba.TotImmediateFlipBytes, mode_lib->vba.SourcePixelFormat[k], ImmediateFlipBytes[k], mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k], mode_lib->vba.VRatio[k], mode_lib->vba.Tno_bw[k], mode_lib->vba.PDEAndMetaPTEBytesFrame[k], mode_lib->vba.MetaRowByte[k], mode_lib->vba.PixelPTEBytesPerRow[k], mode_lib->vba.DCCEnable[k], mode_lib->vba.dpte_row_height[k], mode_lib->vba.meta_row_height[k], mode_lib->vba.qual_row_bw[k], &mode_lib->vba.DestinationLinesToRequestVMInImmediateFlip[k], &mode_lib->vba.DestinationLinesToRequestRowInImmediateFlip[k], &final_flip_bw[k], &mode_lib->vba.ImmediateFlipSupportedForPipe[k]); } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { total_dcn_read_bw_with_flip = total_dcn_read_bw_with_flip + mode_lib->vba.cursor_bw[k] + dml_max( mode_lib->vba.prefetch_vm_bw[k], dml_max( mode_lib->vba.prefetch_row_bw[k], final_flip_bw[k] + dml_max( mode_lib->vba.ReadBandwidthPlaneLuma[k] + mode_lib->vba.ReadBandwidthPlaneChroma[k], mode_lib->vba.RequiredPrefetchPixDataBWLuma[k]))); } mode_lib->vba.ImmediateFlipSupported = true; if (total_dcn_read_bw_with_flip > mode_lib->vba.ReturnBW) { mode_lib->vba.ImmediateFlipSupported = false; } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.ImmediateFlipSupportedForPipe[k] == false) { mode_lib->vba.ImmediateFlipSupported = false; } } } else { mode_lib->vba.ImmediateFlipSupported = false; } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.ErrorResult[k]) { mode_lib->vba.PrefetchModeSupported = false; dml_print( "DML: CalculatePrefetchSchedule ***failed***. Prefetch schedule violation. Results are NOT valid\n"); } } mode_lib->vba.VStartupLines = mode_lib->vba.VStartupLines + 1; } while (!((mode_lib->vba.PrefetchModeSupported && (!mode_lib->vba.ImmediateFlipSupport || mode_lib->vba.ImmediateFlipSupported)) || mode_lib->vba.MaximumMaxVStartupLines < mode_lib->vba.VStartupLines)); //Display Pipeline Delivery Time in Prefetch for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.VRatioPrefetchY[k] <= 1) { mode_lib->vba.DisplayPipeLineDeliveryTimeLumaPrefetch[k] = mode_lib->vba.SwathWidthY[k] * mode_lib->vba.DPPPerPlane[k] / mode_lib->vba.HRatio[k] / mode_lib->vba.PixelClock[k]; } else { mode_lib->vba.DisplayPipeLineDeliveryTimeLumaPrefetch[k] = mode_lib->vba.SwathWidthY[k] / mode_lib->vba.PSCL_THROUGHPUT_LUMA[k] / mode_lib->vba.DPPCLK[k]; } if (mode_lib->vba.BytePerPixelDETC[k] == 0) { mode_lib->vba.DisplayPipeLineDeliveryTimeChromaPrefetch[k] = 0; } else { if (mode_lib->vba.VRatioPrefetchC[k] <= 1) { mode_lib->vba.DisplayPipeLineDeliveryTimeChromaPrefetch[k] = mode_lib->vba.SwathWidthY[k] * mode_lib->vba.DPPPerPlane[k] / mode_lib->vba.HRatio[k] / mode_lib->vba.PixelClock[k]; } else { mode_lib->vba.DisplayPipeLineDeliveryTimeChromaPrefetch[k] = mode_lib->vba.SwathWidthY[k] / mode_lib->vba.PSCL_THROUGHPUT_LUMA[k] / mode_lib->vba.DPPCLK[k]; } } } // Min TTUVBlank for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.PrefetchMode[mode_lib->vba.VoltageLevel][mode_lib->vba.maxMpcComb] == 0) { mode_lib->vba.AllowDRAMClockChangeDuringVBlank[k] = true; mode_lib->vba.AllowDRAMSelfRefreshDuringVBlank[k] = true; mode_lib->vba.MinTTUVBlank[k] = dml_max( mode_lib->vba.DRAMClockChangeWatermark, dml_max( mode_lib->vba.StutterEnterPlusExitWatermark, mode_lib->vba.UrgentWatermark)); } else if (mode_lib->vba.PrefetchMode[mode_lib->vba.VoltageLevel][mode_lib->vba.maxMpcComb] == 1) { mode_lib->vba.AllowDRAMClockChangeDuringVBlank[k] = false; mode_lib->vba.AllowDRAMSelfRefreshDuringVBlank[k] = true; mode_lib->vba.MinTTUVBlank[k] = dml_max( mode_lib->vba.StutterEnterPlusExitWatermark, mode_lib->vba.UrgentWatermark); } else { mode_lib->vba.AllowDRAMClockChangeDuringVBlank[k] = false; mode_lib->vba.AllowDRAMSelfRefreshDuringVBlank[k] = false; mode_lib->vba.MinTTUVBlank[k] = mode_lib->vba.UrgentWatermark; } if (!mode_lib->vba.DynamicMetadataEnable[k]) mode_lib->vba.MinTTUVBlank[k] = mode_lib->vba.TCalc + mode_lib->vba.MinTTUVBlank[k]; } // DCC Configuration mode_lib->vba.ActiveDPPs = 0; // NB P-State/DRAM Clock Change Support for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { mode_lib->vba.ActiveDPPs = mode_lib->vba.ActiveDPPs + mode_lib->vba.DPPPerPlane[k]; } for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { double EffectiveLBLatencyHidingY; double EffectiveLBLatencyHidingC; double DPPOutputBufferLinesY; double DPPOutputBufferLinesC; double DPPOPPBufferingY; double MaxDETBufferingTimeY; double ActiveDRAMClockChangeLatencyMarginY; mode_lib->vba.LBLatencyHidingSourceLinesY = dml_min( mode_lib->vba.MaxLineBufferLines, (unsigned int) dml_floor( (double) mode_lib->vba.LineBufferSize / mode_lib->vba.LBBitPerPixel[k] / (mode_lib->vba.SwathWidthY[k] / dml_max( mode_lib->vba.HRatio[k], 1.0)), 1)) - (mode_lib->vba.vtaps[k] - 1); mode_lib->vba.LBLatencyHidingSourceLinesC = dml_min( mode_lib->vba.MaxLineBufferLines, (unsigned int) dml_floor( (double) mode_lib->vba.LineBufferSize / mode_lib->vba.LBBitPerPixel[k] / (mode_lib->vba.SwathWidthY[k] / 2.0 / dml_max( mode_lib->vba.HRatio[k] / 2, 1.0)), 1)) - (mode_lib->vba.VTAPsChroma[k] - 1); EffectiveLBLatencyHidingY = mode_lib->vba.LBLatencyHidingSourceLinesY / mode_lib->vba.VRatio[k] * (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]); EffectiveLBLatencyHidingC = mode_lib->vba.LBLatencyHidingSourceLinesC / (mode_lib->vba.VRatio[k] / 2) * (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]); if (mode_lib->vba.SwathWidthY[k] > 2 * mode_lib->vba.DPPOutputBufferPixels) { DPPOutputBufferLinesY = mode_lib->vba.DPPOutputBufferPixels / mode_lib->vba.SwathWidthY[k]; } else if (mode_lib->vba.SwathWidthY[k] > mode_lib->vba.DPPOutputBufferPixels) { DPPOutputBufferLinesY = 0.5; } else { DPPOutputBufferLinesY = 1; } if (mode_lib->vba.SwathWidthY[k] / 2 > 2 * mode_lib->vba.DPPOutputBufferPixels) { DPPOutputBufferLinesC = mode_lib->vba.DPPOutputBufferPixels / (mode_lib->vba.SwathWidthY[k] / 2); } else if (mode_lib->vba.SwathWidthY[k] / 2 > mode_lib->vba.DPPOutputBufferPixels) { DPPOutputBufferLinesC = 0.5; } else { DPPOutputBufferLinesC = 1; } DPPOPPBufferingY = (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) * (DPPOutputBufferLinesY + mode_lib->vba.OPPOutputBufferLines); MaxDETBufferingTimeY = mode_lib->vba.FullDETBufferingTimeY[k] + (mode_lib->vba.LinesInDETY[k] - mode_lib->vba.LinesInDETYRoundedDownToSwath[k]) / mode_lib->vba.SwathHeightY[k] * (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]); ActiveDRAMClockChangeLatencyMarginY = DPPOPPBufferingY + EffectiveLBLatencyHidingY + MaxDETBufferingTimeY - mode_lib->vba.DRAMClockChangeWatermark; if (mode_lib->vba.ActiveDPPs > 1) { ActiveDRAMClockChangeLatencyMarginY = ActiveDRAMClockChangeLatencyMarginY - (1 - 1 / (mode_lib->vba.ActiveDPPs - 1)) * mode_lib->vba.SwathHeightY[k] * (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]); } if (mode_lib->vba.BytePerPixelDETC[k] > 0) { double DPPOPPBufferingC = (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) * (DPPOutputBufferLinesC + mode_lib->vba.OPPOutputBufferLines); double MaxDETBufferingTimeC = mode_lib->vba.FullDETBufferingTimeC[k] + (mode_lib->vba.LinesInDETC[k] - mode_lib->vba.LinesInDETCRoundedDownToSwath[k]) / mode_lib->vba.SwathHeightC[k] * (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]); double ActiveDRAMClockChangeLatencyMarginC = DPPOPPBufferingC + EffectiveLBLatencyHidingC + MaxDETBufferingTimeC - mode_lib->vba.DRAMClockChangeWatermark; if (mode_lib->vba.ActiveDPPs > 1) { ActiveDRAMClockChangeLatencyMarginC = ActiveDRAMClockChangeLatencyMarginC - (1 - 1 / (mode_lib->vba.ActiveDPPs - 1)) * mode_lib->vba.SwathHeightC[k] * (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]); } mode_lib->vba.ActiveDRAMClockChangeLatencyMargin[k] = dml_min( ActiveDRAMClockChangeLatencyMarginY, ActiveDRAMClockChangeLatencyMarginC); } else { mode_lib->vba.ActiveDRAMClockChangeLatencyMargin[k] = ActiveDRAMClockChangeLatencyMarginY; } if (mode_lib->vba.WritebackEnable[k]) { double WritebackDRAMClockChangeLatencyMargin; if (mode_lib->vba.WritebackPixelFormat[k] == dm_444_32) { WritebackDRAMClockChangeLatencyMargin = (double) (mode_lib->vba.WritebackInterfaceLumaBufferSize + mode_lib->vba.WritebackInterfaceChromaBufferSize) / (mode_lib->vba.WritebackDestinationWidth[k] * mode_lib->vba.WritebackDestinationHeight[k] / (mode_lib->vba.WritebackSourceHeight[k] * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) * 4) - mode_lib->vba.WritebackDRAMClockChangeWatermark; } else if (mode_lib->vba.WritebackPixelFormat[k] == dm_420_10) { WritebackDRAMClockChangeLatencyMargin = dml_min( (double) mode_lib->vba.WritebackInterfaceLumaBufferSize * 8.0 / 10, 2.0 * mode_lib->vba.WritebackInterfaceChromaBufferSize * 8 / 10) / (mode_lib->vba.WritebackDestinationWidth[k] * mode_lib->vba.WritebackDestinationHeight[k] / (mode_lib->vba.WritebackSourceHeight[k] * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k])) - mode_lib->vba.WritebackDRAMClockChangeWatermark; } else { WritebackDRAMClockChangeLatencyMargin = dml_min( (double) mode_lib->vba.WritebackInterfaceLumaBufferSize, 2.0 * mode_lib->vba.WritebackInterfaceChromaBufferSize) / (mode_lib->vba.WritebackDestinationWidth[k] * mode_lib->vba.WritebackDestinationHeight[k] / (mode_lib->vba.WritebackSourceHeight[k] * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k])) - mode_lib->vba.WritebackDRAMClockChangeWatermark; } mode_lib->vba.ActiveDRAMClockChangeLatencyMargin[k] = dml_min( mode_lib->vba.ActiveDRAMClockChangeLatencyMargin[k], WritebackDRAMClockChangeLatencyMargin); } } mode_lib->vba.MinActiveDRAMClockChangeMargin = 999999; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.ActiveDRAMClockChangeLatencyMargin[k] < mode_lib->vba.MinActiveDRAMClockChangeMargin) { mode_lib->vba.MinActiveDRAMClockChangeMargin = mode_lib->vba.ActiveDRAMClockChangeLatencyMargin[k]; } } mode_lib->vba.MinActiveDRAMClockChangeLatencySupported = mode_lib->vba.MinActiveDRAMClockChangeMargin + mode_lib->vba.DRAMClockChangeLatency; if (mode_lib->vba.MinActiveDRAMClockChangeMargin > 0) { mode_lib->vba.DRAMClockChangeSupport[0][0] = dm_dram_clock_change_vactive; } else { if (mode_lib->vba.SynchronizedVBlank || mode_lib->vba.NumberOfActivePlanes == 1) { mode_lib->vba.DRAMClockChangeSupport[0][0] = dm_dram_clock_change_vblank; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (!mode_lib->vba.AllowDRAMClockChangeDuringVBlank[k]) { mode_lib->vba.DRAMClockChangeSupport[0][0] = dm_dram_clock_change_unsupported; } } } else { mode_lib->vba.DRAMClockChangeSupport[0][0] = dm_dram_clock_change_unsupported; } } for (k = 0; k <= mode_lib->vba.soc.num_states; k++) for (j = 0; j < 2; j++) mode_lib->vba.DRAMClockChangeSupport[k][j] = mode_lib->vba.DRAMClockChangeSupport[0][0]; //XFC Parameters: for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.XFCEnabled[k] == true) { double TWait; mode_lib->vba.XFCSlaveVUpdateOffset[k] = mode_lib->vba.XFCTSlvVupdateOffset; mode_lib->vba.XFCSlaveVupdateWidth[k] = mode_lib->vba.XFCTSlvVupdateWidth; mode_lib->vba.XFCSlaveVReadyOffset[k] = mode_lib->vba.XFCTSlvVreadyOffset; TWait = CalculateTWait( mode_lib->vba.PrefetchMode[mode_lib->vba.VoltageLevel][mode_lib->vba.maxMpcComb], mode_lib->vba.DRAMClockChangeLatency, mode_lib->vba.UrgentLatencyPixelDataOnly, mode_lib->vba.SREnterPlusExitTime); mode_lib->vba.XFCRemoteSurfaceFlipDelay = CalculateRemoteSurfaceFlipDelay( mode_lib, mode_lib->vba.VRatio[k], mode_lib->vba.SwathWidthY[k], dml_ceil(mode_lib->vba.BytePerPixelDETY[k], 1), mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k], mode_lib->vba.XFCTSlvVupdateOffset, mode_lib->vba.XFCTSlvVupdateWidth, mode_lib->vba.XFCTSlvVreadyOffset, mode_lib->vba.XFCXBUFLatencyTolerance, mode_lib->vba.XFCFillBWOverhead, mode_lib->vba.XFCSlvChunkSize, mode_lib->vba.XFCBusTransportTime, mode_lib->vba.TCalc, TWait, &mode_lib->vba.SrcActiveDrainRate, &mode_lib->vba.TInitXFill, &mode_lib->vba.TslvChk); mode_lib->vba.XFCRemoteSurfaceFlipLatency[k] = dml_floor( mode_lib->vba.XFCRemoteSurfaceFlipDelay / (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]), 1); mode_lib->vba.XFCTransferDelay[k] = dml_ceil( mode_lib->vba.XFCBusTransportTime / (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]), 1); mode_lib->vba.XFCPrechargeDelay[k] = dml_ceil( (mode_lib->vba.XFCBusTransportTime + mode_lib->vba.TInitXFill + mode_lib->vba.TslvChk) / (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]), 1); mode_lib->vba.InitFillLevel = mode_lib->vba.XFCXBUFLatencyTolerance * mode_lib->vba.SrcActiveDrainRate; mode_lib->vba.FinalFillMargin = (mode_lib->vba.DestinationLinesToRequestVMInVBlank[k] + mode_lib->vba.DestinationLinesToRequestRowInVBlank[k]) * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k] * mode_lib->vba.SrcActiveDrainRate + mode_lib->vba.XFCFillConstant; mode_lib->vba.FinalFillLevel = mode_lib->vba.XFCRemoteSurfaceFlipDelay * mode_lib->vba.SrcActiveDrainRate + mode_lib->vba.FinalFillMargin; mode_lib->vba.RemainingFillLevel = dml_max( 0.0, mode_lib->vba.FinalFillLevel - mode_lib->vba.InitFillLevel); mode_lib->vba.TFinalxFill = mode_lib->vba.RemainingFillLevel / (mode_lib->vba.SrcActiveDrainRate * mode_lib->vba.XFCFillBWOverhead / 100); mode_lib->vba.XFCPrefetchMargin[k] = mode_lib->vba.XFCRemoteSurfaceFlipDelay + mode_lib->vba.TFinalxFill + (mode_lib->vba.DestinationLinesToRequestVMInVBlank[k] + mode_lib->vba.DestinationLinesToRequestRowInVBlank[k]) * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]; } else { mode_lib->vba.XFCSlaveVUpdateOffset[k] = 0; mode_lib->vba.XFCSlaveVupdateWidth[k] = 0; mode_lib->vba.XFCSlaveVReadyOffset[k] = 0; mode_lib->vba.XFCRemoteSurfaceFlipLatency[k] = 0; mode_lib->vba.XFCPrechargeDelay[k] = 0; mode_lib->vba.XFCTransferDelay[k] = 0; mode_lib->vba.XFCPrefetchMargin[k] = 0; } } { unsigned int VStartupMargin = 0; bool FirstMainPlane = true; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (mode_lib->vba.BlendingAndTiming[k] == k) { unsigned int Margin = (mode_lib->vba.MaxVStartupLines[k] - mode_lib->vba.VStartup[k]) * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]; if (FirstMainPlane) { VStartupMargin = Margin; FirstMainPlane = false; } else VStartupMargin = dml_min(VStartupMargin, Margin); } if (mode_lib->vba.UseMaximumVStartup) { if (mode_lib->vba.VTotal_Max[k] == mode_lib->vba.VTotal[k]) { //only use max vstart if it is not drr or lateflip. mode_lib->vba.VStartup[k] = mode_lib->vba.MaxVStartupLines[mode_lib->vba.BlendingAndTiming[k]]; } } } } } static void dml20v2_DisplayPipeConfiguration(struct display_mode_lib *mode_lib) { double BytePerPixDETY; double BytePerPixDETC; double Read256BytesBlockHeightY; double Read256BytesBlockHeightC; double Read256BytesBlockWidthY; double Read256BytesBlockWidthC; double MaximumSwathHeightY; double MaximumSwathHeightC; double MinimumSwathHeightY; double MinimumSwathHeightC; double SwathWidth; double SwathWidthGranularityY; double SwathWidthGranularityC; double RoundedUpMaxSwathSizeBytesY; double RoundedUpMaxSwathSizeBytesC; unsigned int j, k; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { bool MainPlaneDoesODMCombine = false; if (mode_lib->vba.SourcePixelFormat[k] == dm_444_64) { BytePerPixDETY = 8; BytePerPixDETC = 0; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_444_32) { BytePerPixDETY = 4; BytePerPixDETC = 0; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_444_16) { BytePerPixDETY = 2; BytePerPixDETC = 0; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_444_8) { BytePerPixDETY = 1; BytePerPixDETC = 0; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_420_8) { BytePerPixDETY = 1; BytePerPixDETC = 2; } else { BytePerPixDETY = 4.0 / 3.0; BytePerPixDETC = 8.0 / 3.0; } if ((mode_lib->vba.SourcePixelFormat[k] == dm_444_64 || mode_lib->vba.SourcePixelFormat[k] == dm_444_32 || mode_lib->vba.SourcePixelFormat[k] == dm_444_16 || mode_lib->vba.SourcePixelFormat[k] == dm_444_8)) { if (mode_lib->vba.SurfaceTiling[k] == dm_sw_linear) { Read256BytesBlockHeightY = 1; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_444_64) { Read256BytesBlockHeightY = 4; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_444_32 || mode_lib->vba.SourcePixelFormat[k] == dm_444_16) { Read256BytesBlockHeightY = 8; } else { Read256BytesBlockHeightY = 16; } Read256BytesBlockWidthY = 256 / dml_ceil(BytePerPixDETY, 1) / Read256BytesBlockHeightY; Read256BytesBlockHeightC = 0; Read256BytesBlockWidthC = 0; } else { if (mode_lib->vba.SurfaceTiling[k] == dm_sw_linear) { Read256BytesBlockHeightY = 1; Read256BytesBlockHeightC = 1; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_420_8) { Read256BytesBlockHeightY = 16; Read256BytesBlockHeightC = 8; } else { Read256BytesBlockHeightY = 8; Read256BytesBlockHeightC = 8; } Read256BytesBlockWidthY = 256 / dml_ceil(BytePerPixDETY, 1) / Read256BytesBlockHeightY; Read256BytesBlockWidthC = 256 / dml_ceil(BytePerPixDETC, 2) / Read256BytesBlockHeightC; } if (mode_lib->vba.SourceScan[k] == dm_horz) { MaximumSwathHeightY = Read256BytesBlockHeightY; MaximumSwathHeightC = Read256BytesBlockHeightC; } else { MaximumSwathHeightY = Read256BytesBlockWidthY; MaximumSwathHeightC = Read256BytesBlockWidthC; } if ((mode_lib->vba.SourcePixelFormat[k] == dm_444_64 || mode_lib->vba.SourcePixelFormat[k] == dm_444_32 || mode_lib->vba.SourcePixelFormat[k] == dm_444_16 || mode_lib->vba.SourcePixelFormat[k] == dm_444_8)) { if (mode_lib->vba.SurfaceTiling[k] == dm_sw_linear || (mode_lib->vba.SourcePixelFormat[k] == dm_444_64 && (mode_lib->vba.SurfaceTiling[k] == dm_sw_4kb_s || mode_lib->vba.SurfaceTiling[k] == dm_sw_4kb_s_x || mode_lib->vba.SurfaceTiling[k] == dm_sw_64kb_s || mode_lib->vba.SurfaceTiling[k] == dm_sw_64kb_s_t || mode_lib->vba.SurfaceTiling[k] == dm_sw_64kb_s_x || mode_lib->vba.SurfaceTiling[k] == dm_sw_var_s || mode_lib->vba.SurfaceTiling[k] == dm_sw_var_s_x) && mode_lib->vba.SourceScan[k] == dm_horz)) { MinimumSwathHeightY = MaximumSwathHeightY; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_444_8 && mode_lib->vba.SourceScan[k] != dm_horz) { MinimumSwathHeightY = MaximumSwathHeightY; } else { MinimumSwathHeightY = MaximumSwathHeightY / 2.0; } MinimumSwathHeightC = MaximumSwathHeightC; } else { if (mode_lib->vba.SurfaceTiling[k] == dm_sw_linear) { MinimumSwathHeightY = MaximumSwathHeightY; MinimumSwathHeightC = MaximumSwathHeightC; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_420_8 && mode_lib->vba.SourceScan[k] == dm_horz) { MinimumSwathHeightY = MaximumSwathHeightY / 2.0; MinimumSwathHeightC = MaximumSwathHeightC; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_420_10 && mode_lib->vba.SourceScan[k] == dm_horz) { MinimumSwathHeightC = MaximumSwathHeightC / 2.0; MinimumSwathHeightY = MaximumSwathHeightY; } else { MinimumSwathHeightY = MaximumSwathHeightY; MinimumSwathHeightC = MaximumSwathHeightC; } } if (mode_lib->vba.SourceScan[k] == dm_horz) { SwathWidth = mode_lib->vba.ViewportWidth[k]; } else { SwathWidth = mode_lib->vba.ViewportHeight[k]; } if (mode_lib->vba.ODMCombineEnabled[k] == true) { MainPlaneDoesODMCombine = true; } for (j = 0; j < mode_lib->vba.NumberOfActivePlanes; ++j) { if (mode_lib->vba.BlendingAndTiming[k] == j && mode_lib->vba.ODMCombineEnabled[j] == true) { MainPlaneDoesODMCombine = true; } } if (MainPlaneDoesODMCombine == true) { SwathWidth = dml_min( SwathWidth, mode_lib->vba.HActive[k] / 2.0 * mode_lib->vba.HRatio[k]); } else { if (mode_lib->vba.DPPPerPlane[k] == 0) SwathWidth = 0; else SwathWidth = SwathWidth / mode_lib->vba.DPPPerPlane[k]; } SwathWidthGranularityY = 256 / dml_ceil(BytePerPixDETY, 1) / MaximumSwathHeightY; RoundedUpMaxSwathSizeBytesY = (dml_ceil( (double) (SwathWidth - 1), SwathWidthGranularityY) + SwathWidthGranularityY) * BytePerPixDETY * MaximumSwathHeightY; if (mode_lib->vba.SourcePixelFormat[k] == dm_420_10) { RoundedUpMaxSwathSizeBytesY = dml_ceil(RoundedUpMaxSwathSizeBytesY, 256) + 256; } if (MaximumSwathHeightC > 0) { SwathWidthGranularityC = 256.0 / dml_ceil(BytePerPixDETC, 2) / MaximumSwathHeightC; RoundedUpMaxSwathSizeBytesC = (dml_ceil( (double) (SwathWidth / 2.0 - 1), SwathWidthGranularityC) + SwathWidthGranularityC) * BytePerPixDETC * MaximumSwathHeightC; if (mode_lib->vba.SourcePixelFormat[k] == dm_420_10) { RoundedUpMaxSwathSizeBytesC = dml_ceil( RoundedUpMaxSwathSizeBytesC, 256) + 256; } } else RoundedUpMaxSwathSizeBytesC = 0.0; if (RoundedUpMaxSwathSizeBytesY + RoundedUpMaxSwathSizeBytesC <= mode_lib->vba.DETBufferSizeInKByte * 1024.0 / 2.0) { mode_lib->vba.SwathHeightY[k] = MaximumSwathHeightY; mode_lib->vba.SwathHeightC[k] = MaximumSwathHeightC; } else { mode_lib->vba.SwathHeightY[k] = MinimumSwathHeightY; mode_lib->vba.SwathHeightC[k] = MinimumSwathHeightC; } if (mode_lib->vba.SwathHeightC[k] == 0) { mode_lib->vba.DETBufferSizeY[k] = mode_lib->vba.DETBufferSizeInKByte * 1024; mode_lib->vba.DETBufferSizeC[k] = 0; } else if (mode_lib->vba.SwathHeightY[k] <= mode_lib->vba.SwathHeightC[k]) { mode_lib->vba.DETBufferSizeY[k] = mode_lib->vba.DETBufferSizeInKByte * 1024.0 / 2; mode_lib->vba.DETBufferSizeC[k] = mode_lib->vba.DETBufferSizeInKByte * 1024.0 / 2; } else { mode_lib->vba.DETBufferSizeY[k] = mode_lib->vba.DETBufferSizeInKByte * 1024.0 * 2 / 3; mode_lib->vba.DETBufferSizeC[k] = mode_lib->vba.DETBufferSizeInKByte * 1024.0 / 3; } } } static double CalculateTWait( unsigned int PrefetchMode, double DRAMClockChangeLatency, double UrgentLatencyPixelDataOnly, double SREnterPlusExitTime) { if (PrefetchMode == 0) { return dml_max( DRAMClockChangeLatency + UrgentLatencyPixelDataOnly, dml_max(SREnterPlusExitTime, UrgentLatencyPixelDataOnly)); } else if (PrefetchMode == 1) { return dml_max(SREnterPlusExitTime, UrgentLatencyPixelDataOnly); } else { return UrgentLatencyPixelDataOnly; } } static double CalculateRemoteSurfaceFlipDelay( struct display_mode_lib *mode_lib, double VRatio, double SwathWidth, double Bpp, double LineTime, double XFCTSlvVupdateOffset, double XFCTSlvVupdateWidth, double XFCTSlvVreadyOffset, double XFCXBUFLatencyTolerance, double XFCFillBWOverhead, double XFCSlvChunkSize, double XFCBusTransportTime, double TCalc, double TWait, double *SrcActiveDrainRate, double *TInitXFill, double *TslvChk) { double TSlvSetup, AvgfillRate, result; *SrcActiveDrainRate = VRatio * SwathWidth * Bpp / LineTime; TSlvSetup = XFCTSlvVupdateOffset + XFCTSlvVupdateWidth + XFCTSlvVreadyOffset; *TInitXFill = XFCXBUFLatencyTolerance / (1 + XFCFillBWOverhead / 100); AvgfillRate = *SrcActiveDrainRate * (1 + XFCFillBWOverhead / 100); *TslvChk = XFCSlvChunkSize / AvgfillRate; dml_print( "DML::CalculateRemoteSurfaceFlipDelay: SrcActiveDrainRate: %f\n", *SrcActiveDrainRate); dml_print("DML::CalculateRemoteSurfaceFlipDelay: TSlvSetup: %f\n", TSlvSetup); dml_print("DML::CalculateRemoteSurfaceFlipDelay: TInitXFill: %f\n", *TInitXFill); dml_print("DML::CalculateRemoteSurfaceFlipDelay: AvgfillRate: %f\n", AvgfillRate); dml_print("DML::CalculateRemoteSurfaceFlipDelay: TslvChk: %f\n", *TslvChk); result = 2 * XFCBusTransportTime + TSlvSetup + TCalc + TWait + *TslvChk + *TInitXFill; // TODO: This doesn't seem to match programming guide dml_print("DML::CalculateRemoteSurfaceFlipDelay: RemoteSurfaceFlipDelay: %f\n", result); return result; } static double CalculateWriteBackDelay( enum source_format_class WritebackPixelFormat, double WritebackHRatio, double WritebackVRatio, unsigned int WritebackLumaHTaps, unsigned int WritebackLumaVTaps, unsigned int WritebackChromaHTaps, unsigned int WritebackChromaVTaps, unsigned int WritebackDestinationWidth) { double CalculateWriteBackDelay = dml_max( dml_ceil(WritebackLumaHTaps / 4.0, 1) / WritebackHRatio, WritebackLumaVTaps * dml_ceil(1.0 / WritebackVRatio, 1) * dml_ceil( WritebackDestinationWidth / 4.0, 1) + dml_ceil(1.0 / WritebackVRatio, 1) * (dml_ceil( WritebackLumaVTaps / 4.0, 1) + 4)); if (WritebackPixelFormat != dm_444_32) { CalculateWriteBackDelay = dml_max( CalculateWriteBackDelay, dml_max( dml_ceil( WritebackChromaHTaps / 2.0, 1) / (2 * WritebackHRatio), WritebackChromaVTaps * dml_ceil( 1 / (2 * WritebackVRatio), 1) * dml_ceil( WritebackDestinationWidth / 2.0 / 2.0, 1) + dml_ceil( 1 / (2 * WritebackVRatio), 1) * (dml_ceil( WritebackChromaVTaps / 4.0, 1) + 4))); } return CalculateWriteBackDelay; } static void CalculateActiveRowBandwidth( bool GPUVMEnable, enum source_format_class SourcePixelFormat, double VRatio, bool DCCEnable, double LineTime, unsigned int MetaRowByteLuma, unsigned int MetaRowByteChroma, unsigned int meta_row_height_luma, unsigned int meta_row_height_chroma, unsigned int PixelPTEBytesPerRowLuma, unsigned int PixelPTEBytesPerRowChroma, unsigned int dpte_row_height_luma, unsigned int dpte_row_height_chroma, double *meta_row_bw, double *dpte_row_bw, double *qual_row_bw) { if (DCCEnable != true) { *meta_row_bw = 0; } else if (SourcePixelFormat == dm_420_8 || SourcePixelFormat == dm_420_10) { *meta_row_bw = VRatio * MetaRowByteLuma / (meta_row_height_luma * LineTime) + VRatio / 2 * MetaRowByteChroma / (meta_row_height_chroma * LineTime); } else { *meta_row_bw = VRatio * MetaRowByteLuma / (meta_row_height_luma * LineTime); } if (GPUVMEnable != true) { *dpte_row_bw = 0; } else if (SourcePixelFormat == dm_420_8 || SourcePixelFormat == dm_420_10) { *dpte_row_bw = VRatio * PixelPTEBytesPerRowLuma / (dpte_row_height_luma * LineTime) + VRatio / 2 * PixelPTEBytesPerRowChroma / (dpte_row_height_chroma * LineTime); } else { *dpte_row_bw = VRatio * PixelPTEBytesPerRowLuma / (dpte_row_height_luma * LineTime); } if ((SourcePixelFormat == dm_420_8 || SourcePixelFormat == dm_420_10)) { *qual_row_bw = *meta_row_bw + *dpte_row_bw; } else { *qual_row_bw = 0; } } static void CalculateFlipSchedule( struct display_mode_lib *mode_lib, double UrgentExtraLatency, double UrgentLatencyPixelDataOnly, unsigned int GPUVMMaxPageTableLevels, bool GPUVMEnable, double BandwidthAvailableForImmediateFlip, unsigned int TotImmediateFlipBytes, enum source_format_class SourcePixelFormat, unsigned int ImmediateFlipBytes, double LineTime, double VRatio, double Tno_bw, double PDEAndMetaPTEBytesFrame, unsigned int MetaRowByte, unsigned int PixelPTEBytesPerRow, bool DCCEnable, unsigned int dpte_row_height, unsigned int meta_row_height, double qual_row_bw, double *DestinationLinesToRequestVMInImmediateFlip, double *DestinationLinesToRequestRowInImmediateFlip, double *final_flip_bw, bool *ImmediateFlipSupportedForPipe) { double min_row_time = 0.0; if (SourcePixelFormat == dm_420_8 || SourcePixelFormat == dm_420_10) { *DestinationLinesToRequestVMInImmediateFlip = 0.0; *DestinationLinesToRequestRowInImmediateFlip = 0.0; *final_flip_bw = qual_row_bw; *ImmediateFlipSupportedForPipe = true; } else { double TimeForFetchingMetaPTEImmediateFlip; double TimeForFetchingRowInVBlankImmediateFlip; if (GPUVMEnable == true) { mode_lib->vba.ImmediateFlipBW[0] = BandwidthAvailableForImmediateFlip * ImmediateFlipBytes / TotImmediateFlipBytes; TimeForFetchingMetaPTEImmediateFlip = dml_max( Tno_bw + PDEAndMetaPTEBytesFrame / mode_lib->vba.ImmediateFlipBW[0], dml_max( UrgentExtraLatency + UrgentLatencyPixelDataOnly * (GPUVMMaxPageTableLevels - 1), LineTime / 4.0)); } else { TimeForFetchingMetaPTEImmediateFlip = 0; } *DestinationLinesToRequestVMInImmediateFlip = dml_floor( 4.0 * (TimeForFetchingMetaPTEImmediateFlip / LineTime + 0.125), 1) / 4.0; if ((GPUVMEnable == true || DCCEnable == true)) { mode_lib->vba.ImmediateFlipBW[0] = BandwidthAvailableForImmediateFlip * ImmediateFlipBytes / TotImmediateFlipBytes; TimeForFetchingRowInVBlankImmediateFlip = dml_max( (MetaRowByte + PixelPTEBytesPerRow) / mode_lib->vba.ImmediateFlipBW[0], dml_max(UrgentLatencyPixelDataOnly, LineTime / 4.0)); } else { TimeForFetchingRowInVBlankImmediateFlip = 0; } *DestinationLinesToRequestRowInImmediateFlip = dml_floor( 4.0 * (TimeForFetchingRowInVBlankImmediateFlip / LineTime + 0.125), 1) / 4.0; if (GPUVMEnable == true) { *final_flip_bw = dml_max( PDEAndMetaPTEBytesFrame / (*DestinationLinesToRequestVMInImmediateFlip * LineTime), (MetaRowByte + PixelPTEBytesPerRow) / (TimeForFetchingRowInVBlankImmediateFlip * LineTime)); } else if (MetaRowByte + PixelPTEBytesPerRow > 0) { *final_flip_bw = (MetaRowByte + PixelPTEBytesPerRow) / (TimeForFetchingRowInVBlankImmediateFlip * LineTime); } else { *final_flip_bw = 0; } if (GPUVMEnable && !DCCEnable) min_row_time = dpte_row_height * LineTime / VRatio; else if (!GPUVMEnable && DCCEnable) min_row_time = meta_row_height * LineTime / VRatio; else min_row_time = dml_min(dpte_row_height, meta_row_height) * LineTime / VRatio; if (*DestinationLinesToRequestVMInImmediateFlip >= 8 || *DestinationLinesToRequestRowInImmediateFlip >= 16 || TimeForFetchingMetaPTEImmediateFlip + 2 * TimeForFetchingRowInVBlankImmediateFlip > min_row_time) *ImmediateFlipSupportedForPipe = false; else *ImmediateFlipSupportedForPipe = true; } } static unsigned int TruncToValidBPP( double DecimalBPP, bool DSCEnabled, enum output_encoder_class Output, enum output_format_class Format, unsigned int DSCInputBitPerComponent) { if (Output == dm_hdmi) { if (Format == dm_420) { if (DecimalBPP >= 18) return 18; else if (DecimalBPP >= 15) return 15; else if (DecimalBPP >= 12) return 12; else return BPP_INVALID; } else if (Format == dm_444) { if (DecimalBPP >= 36) return 36; else if (DecimalBPP >= 30) return 30; else if (DecimalBPP >= 24) return 24; else if (DecimalBPP >= 18) return 18; else return BPP_INVALID; } else { if (DecimalBPP / 1.5 >= 24) return 24; else if (DecimalBPP / 1.5 >= 20) return 20; else if (DecimalBPP / 1.5 >= 16) return 16; else return BPP_INVALID; } } else { if (DSCEnabled) { if (Format == dm_420) { if (DecimalBPP < 6) return BPP_INVALID; else if (DecimalBPP >= 1.5 * DSCInputBitPerComponent - 1 / 16) return 1.5 * DSCInputBitPerComponent - 1 / 16; else return dml_floor(16 * DecimalBPP, 1) / 16; } else if (Format == dm_n422) { if (DecimalBPP < 7) return BPP_INVALID; else if (DecimalBPP >= 2 * DSCInputBitPerComponent - 1 / 16) return 2 * DSCInputBitPerComponent - 1 / 16; else return dml_floor(16 * DecimalBPP, 1) / 16; } else { if (DecimalBPP < 8) return BPP_INVALID; else if (DecimalBPP >= 3 * DSCInputBitPerComponent - 1 / 16) return 3 * DSCInputBitPerComponent - 1 / 16; else return dml_floor(16 * DecimalBPP, 1) / 16; } } else if (Format == dm_420) { if (DecimalBPP >= 18) return 18; else if (DecimalBPP >= 15) return 15; else if (DecimalBPP >= 12) return 12; else return BPP_INVALID; } else if (Format == dm_s422 || Format == dm_n422) { if (DecimalBPP >= 24) return 24; else if (DecimalBPP >= 20) return 20; else if (DecimalBPP >= 16) return 16; else return BPP_INVALID; } else { if (DecimalBPP >= 36) return 36; else if (DecimalBPP >= 30) return 30; else if (DecimalBPP >= 24) return 24; else if (DecimalBPP >= 18) return 18; else return BPP_INVALID; } } } void dml20v2_ModeSupportAndSystemConfigurationFull(struct display_mode_lib *mode_lib) { struct vba_vars_st *locals = &mode_lib->vba; int i; unsigned int j, k, m; /*MODE SUPPORT, VOLTAGE STATE AND SOC CONFIGURATION*/ /*Scale Ratio, taps Support Check*/ mode_lib->vba.ScaleRatioAndTapsSupport = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.ScalerEnabled[k] == false && ((mode_lib->vba.SourcePixelFormat[k] != dm_444_64 && mode_lib->vba.SourcePixelFormat[k] != dm_444_32 && mode_lib->vba.SourcePixelFormat[k] != dm_444_16 && mode_lib->vba.SourcePixelFormat[k] != dm_mono_16 && mode_lib->vba.SourcePixelFormat[k] != dm_mono_8) || mode_lib->vba.HRatio[k] != 1.0 || mode_lib->vba.htaps[k] != 1.0 || mode_lib->vba.VRatio[k] != 1.0 || mode_lib->vba.vtaps[k] != 1.0)) { mode_lib->vba.ScaleRatioAndTapsSupport = false; } else if (mode_lib->vba.vtaps[k] < 1.0 || mode_lib->vba.vtaps[k] > 8.0 || mode_lib->vba.htaps[k] < 1.0 || mode_lib->vba.htaps[k] > 8.0 || (mode_lib->vba.htaps[k] > 1.0 && (mode_lib->vba.htaps[k] % 2) == 1) || mode_lib->vba.HRatio[k] > mode_lib->vba.MaxHSCLRatio || mode_lib->vba.VRatio[k] > mode_lib->vba.MaxVSCLRatio || mode_lib->vba.HRatio[k] > mode_lib->vba.htaps[k] || mode_lib->vba.VRatio[k] > mode_lib->vba.vtaps[k] || (mode_lib->vba.SourcePixelFormat[k] != dm_444_64 && mode_lib->vba.SourcePixelFormat[k] != dm_444_32 && mode_lib->vba.SourcePixelFormat[k] != dm_444_16 && mode_lib->vba.SourcePixelFormat[k] != dm_mono_16 && mode_lib->vba.SourcePixelFormat[k] != dm_mono_8 && (mode_lib->vba.HRatio[k] / 2.0 > mode_lib->vba.HTAPsChroma[k] || mode_lib->vba.VRatio[k] / 2.0 > mode_lib->vba.VTAPsChroma[k]))) { mode_lib->vba.ScaleRatioAndTapsSupport = false; } } /*Source Format, Pixel Format and Scan Support Check*/ mode_lib->vba.SourceFormatPixelAndScanSupport = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if ((mode_lib->vba.SurfaceTiling[k] == dm_sw_linear && mode_lib->vba.SourceScan[k] != dm_horz) || ((mode_lib->vba.SurfaceTiling[k] == dm_sw_4kb_d || mode_lib->vba.SurfaceTiling[k] == dm_sw_4kb_d_x || mode_lib->vba.SurfaceTiling[k] == dm_sw_64kb_d || mode_lib->vba.SurfaceTiling[k] == dm_sw_64kb_d_t || mode_lib->vba.SurfaceTiling[k] == dm_sw_64kb_d_x || mode_lib->vba.SurfaceTiling[k] == dm_sw_var_d || mode_lib->vba.SurfaceTiling[k] == dm_sw_var_d_x) && mode_lib->vba.SourcePixelFormat[k] != dm_444_64) || (mode_lib->vba.SurfaceTiling[k] == dm_sw_64kb_r_x && (mode_lib->vba.SourcePixelFormat[k] == dm_mono_8 || mode_lib->vba.SourcePixelFormat[k] == dm_420_8 || mode_lib->vba.SourcePixelFormat[k] == dm_420_10)) || (((mode_lib->vba.SurfaceTiling[k] == dm_sw_gfx7_2d_thin_gl || mode_lib->vba.SurfaceTiling[k] == dm_sw_gfx7_2d_thin_lvp) && !((mode_lib->vba.SourcePixelFormat[k] == dm_444_64 || mode_lib->vba.SourcePixelFormat[k] == dm_444_32) && mode_lib->vba.SourceScan[k] == dm_horz && mode_lib->vba.SupportGFX7CompatibleTilingIn32bppAnd64bpp == true && mode_lib->vba.DCCEnable[k] == false)) || (mode_lib->vba.DCCEnable[k] == true && (mode_lib->vba.SurfaceTiling[k] == dm_sw_linear || mode_lib->vba.SourcePixelFormat[k] == dm_420_8 || mode_lib->vba.SourcePixelFormat[k] == dm_420_10)))) { mode_lib->vba.SourceFormatPixelAndScanSupport = false; } } /*Bandwidth Support Check*/ for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.SourcePixelFormat[k] == dm_444_64) { locals->BytePerPixelInDETY[k] = 8.0; locals->BytePerPixelInDETC[k] = 0.0; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_444_32) { locals->BytePerPixelInDETY[k] = 4.0; locals->BytePerPixelInDETC[k] = 0.0; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_444_16 || mode_lib->vba.SourcePixelFormat[k] == dm_mono_16) { locals->BytePerPixelInDETY[k] = 2.0; locals->BytePerPixelInDETC[k] = 0.0; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_mono_8) { locals->BytePerPixelInDETY[k] = 1.0; locals->BytePerPixelInDETC[k] = 0.0; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_420_8) { locals->BytePerPixelInDETY[k] = 1.0; locals->BytePerPixelInDETC[k] = 2.0; } else { locals->BytePerPixelInDETY[k] = 4.0 / 3; locals->BytePerPixelInDETC[k] = 8.0 / 3; } if (mode_lib->vba.SourceScan[k] == dm_horz) { locals->SwathWidthYSingleDPP[k] = mode_lib->vba.ViewportWidth[k]; } else { locals->SwathWidthYSingleDPP[k] = mode_lib->vba.ViewportHeight[k]; } } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { locals->ReadBandwidthLuma[k] = locals->SwathWidthYSingleDPP[k] * dml_ceil(locals->BytePerPixelInDETY[k], 1.0) / (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) * mode_lib->vba.VRatio[k]; locals->ReadBandwidthChroma[k] = locals->SwathWidthYSingleDPP[k] / 2 * dml_ceil(locals->BytePerPixelInDETC[k], 2.0) / (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) * mode_lib->vba.VRatio[k] / 2.0; locals->ReadBandwidth[k] = locals->ReadBandwidthLuma[k] + locals->ReadBandwidthChroma[k]; } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.WritebackEnable[k] == true && mode_lib->vba.WritebackPixelFormat[k] == dm_444_32) { locals->WriteBandwidth[k] = mode_lib->vba.WritebackDestinationWidth[k] * mode_lib->vba.WritebackDestinationHeight[k] / (mode_lib->vba.WritebackSourceHeight[k] * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) * 4.0; } else if (mode_lib->vba.WritebackEnable[k] == true && mode_lib->vba.WritebackPixelFormat[k] == dm_420_10) { locals->WriteBandwidth[k] = mode_lib->vba.WritebackDestinationWidth[k] * mode_lib->vba.WritebackDestinationHeight[k] / (mode_lib->vba.WritebackSourceHeight[k] * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) * 3.0; } else if (mode_lib->vba.WritebackEnable[k] == true) { locals->WriteBandwidth[k] = mode_lib->vba.WritebackDestinationWidth[k] * mode_lib->vba.WritebackDestinationHeight[k] / (mode_lib->vba.WritebackSourceHeight[k] * mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) * 1.5; } else { locals->WriteBandwidth[k] = 0.0; } } mode_lib->vba.DCCEnabledInAnyPlane = false; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.DCCEnable[k] == true) { mode_lib->vba.DCCEnabledInAnyPlane = true; } } mode_lib->vba.UrgentLatency = mode_lib->vba.UrgentLatencyPixelDataOnly; for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { locals->FabricAndDRAMBandwidthPerState[i] = dml_min( mode_lib->vba.DRAMSpeedPerState[i] * mode_lib->vba.NumberOfChannels * mode_lib->vba.DRAMChannelWidth, mode_lib->vba.FabricClockPerState[i] * mode_lib->vba.FabricDatapathToDCNDataReturn) / 1000; locals->ReturnBWToDCNPerState = dml_min(locals->ReturnBusWidth * locals->DCFCLKPerState[i], locals->FabricAndDRAMBandwidthPerState[i] * 1000) * locals->PercentOfIdealDRAMFabricAndSDPPortBWReceivedAfterUrgLatencyPixelDataOnly / 100; locals->ReturnBWPerState[i] = locals->ReturnBWToDCNPerState; if (locals->DCCEnabledInAnyPlane == true && locals->ReturnBWToDCNPerState > locals->DCFCLKPerState[i] * locals->ReturnBusWidth / 4) { locals->ReturnBWPerState[i] = dml_min(locals->ReturnBWPerState[i], locals->ReturnBWToDCNPerState * 4 * (1 - locals->UrgentLatency / ((locals->ROBBufferSizeInKByte - locals->PixelChunkSizeInKByte) * 1024 / (locals->ReturnBWToDCNPerState - locals->DCFCLKPerState[i] * locals->ReturnBusWidth / 4) + locals->UrgentLatency))); } locals->CriticalPoint = 2 * locals->ReturnBusWidth * locals->DCFCLKPerState[i] * locals->UrgentLatency / (locals->ReturnBWToDCNPerState * locals->UrgentLatency + (locals->ROBBufferSizeInKByte - locals->PixelChunkSizeInKByte) * 1024); if (locals->DCCEnabledInAnyPlane && locals->CriticalPoint > 1 && locals->CriticalPoint < 4) { locals->ReturnBWPerState[i] = dml_min(locals->ReturnBWPerState[i], 4 * locals->ReturnBWToDCNPerState * (locals->ROBBufferSizeInKByte - locals->PixelChunkSizeInKByte) * 1024 * locals->ReturnBusWidth * locals->DCFCLKPerState[i] * locals->UrgentLatency / dml_pow((locals->ReturnBWToDCNPerState * locals->UrgentLatency + (locals->ROBBufferSizeInKByte - locals->PixelChunkSizeInKByte) * 1024), 2)); } locals->ReturnBWToDCNPerState = dml_min(locals->ReturnBusWidth * locals->DCFCLKPerState[i], locals->FabricAndDRAMBandwidthPerState[i] * 1000); if (locals->DCCEnabledInAnyPlane == true && locals->ReturnBWToDCNPerState > locals->DCFCLKPerState[i] * locals->ReturnBusWidth / 4) { locals->ReturnBWPerState[i] = dml_min(locals->ReturnBWPerState[i], locals->ReturnBWToDCNPerState * 4 * (1 - locals->UrgentLatency / ((locals->ROBBufferSizeInKByte - locals->PixelChunkSizeInKByte) * 1024 / (locals->ReturnBWToDCNPerState - locals->DCFCLKPerState[i] * locals->ReturnBusWidth / 4) + locals->UrgentLatency))); } locals->CriticalPoint = 2 * locals->ReturnBusWidth * locals->DCFCLKPerState[i] * locals->UrgentLatency / (locals->ReturnBWToDCNPerState * locals->UrgentLatency + (locals->ROBBufferSizeInKByte - locals->PixelChunkSizeInKByte) * 1024); if (locals->DCCEnabledInAnyPlane && locals->CriticalPoint > 1 && locals->CriticalPoint < 4) { locals->ReturnBWPerState[i] = dml_min(locals->ReturnBWPerState[i], 4 * locals->ReturnBWToDCNPerState * (locals->ROBBufferSizeInKByte - locals->PixelChunkSizeInKByte) * 1024 * locals->ReturnBusWidth * locals->DCFCLKPerState[i] * locals->UrgentLatency / dml_pow((locals->ReturnBWToDCNPerState * locals->UrgentLatency + (locals->ROBBufferSizeInKByte - locals->PixelChunkSizeInKByte) * 1024), 2)); } } /*Writeback Latency support check*/ mode_lib->vba.WritebackLatencySupport = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.WritebackEnable[k] == true) { if (mode_lib->vba.WritebackPixelFormat[k] == dm_444_32) { if (locals->WriteBandwidth[k] > (mode_lib->vba.WritebackInterfaceLumaBufferSize + mode_lib->vba.WritebackInterfaceChromaBufferSize) / mode_lib->vba.WritebackLatency) { mode_lib->vba.WritebackLatencySupport = false; } } else { if (locals->WriteBandwidth[k] > 1.5 * dml_min( mode_lib->vba.WritebackInterfaceLumaBufferSize, 2.0 * mode_lib->vba.WritebackInterfaceChromaBufferSize) / mode_lib->vba.WritebackLatency) { mode_lib->vba.WritebackLatencySupport = false; } } } } /*Re-ordering Buffer Support Check*/ for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { locals->UrgentRoundTripAndOutOfOrderLatencyPerState[i] = (mode_lib->vba.RoundTripPingLatencyCycles + 32.0) / mode_lib->vba.DCFCLKPerState[i] + locals->UrgentOutOfOrderReturnPerChannel * mode_lib->vba.NumberOfChannels / locals->ReturnBWPerState[i]; if ((mode_lib->vba.ROBBufferSizeInKByte - mode_lib->vba.PixelChunkSizeInKByte) * 1024.0 / locals->ReturnBWPerState[i] > locals->UrgentRoundTripAndOutOfOrderLatencyPerState[i]) { locals->ROBSupport[i] = true; } else { locals->ROBSupport[i] = false; } } /*Writeback Mode Support Check*/ mode_lib->vba.TotalNumberOfActiveWriteback = 0; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.WritebackEnable[k] == true) { if (mode_lib->vba.ActiveWritebacksPerPlane[k] == 0) mode_lib->vba.ActiveWritebacksPerPlane[k] = 1; mode_lib->vba.TotalNumberOfActiveWriteback = mode_lib->vba.TotalNumberOfActiveWriteback + mode_lib->vba.ActiveWritebacksPerPlane[k]; } } mode_lib->vba.WritebackModeSupport = true; if (mode_lib->vba.TotalNumberOfActiveWriteback > mode_lib->vba.MaxNumWriteback) { mode_lib->vba.WritebackModeSupport = false; } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.WritebackEnable[k] == true && mode_lib->vba.Writeback10bpc420Supported != true && mode_lib->vba.WritebackPixelFormat[k] == dm_420_10) { mode_lib->vba.WritebackModeSupport = false; } } /*Writeback Scale Ratio and Taps Support Check*/ mode_lib->vba.WritebackScaleRatioAndTapsSupport = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.WritebackEnable[k] == true) { if (mode_lib->vba.WritebackLumaAndChromaScalingSupported == false && (mode_lib->vba.WritebackHRatio[k] != 1.0 || mode_lib->vba.WritebackVRatio[k] != 1.0)) { mode_lib->vba.WritebackScaleRatioAndTapsSupport = false; } if (mode_lib->vba.WritebackHRatio[k] > mode_lib->vba.WritebackMaxHSCLRatio || mode_lib->vba.WritebackVRatio[k] > mode_lib->vba.WritebackMaxVSCLRatio || mode_lib->vba.WritebackHRatio[k] < mode_lib->vba.WritebackMinHSCLRatio || mode_lib->vba.WritebackVRatio[k] < mode_lib->vba.WritebackMinVSCLRatio || mode_lib->vba.WritebackLumaHTaps[k] > mode_lib->vba.WritebackMaxHSCLTaps || mode_lib->vba.WritebackLumaVTaps[k] > mode_lib->vba.WritebackMaxVSCLTaps || mode_lib->vba.WritebackHRatio[k] > mode_lib->vba.WritebackLumaHTaps[k] || mode_lib->vba.WritebackVRatio[k] > mode_lib->vba.WritebackLumaVTaps[k] || (mode_lib->vba.WritebackLumaHTaps[k] > 2.0 && ((mode_lib->vba.WritebackLumaHTaps[k] % 2) == 1)) || (mode_lib->vba.WritebackPixelFormat[k] != dm_444_32 && (mode_lib->vba.WritebackChromaHTaps[k] > mode_lib->vba.WritebackMaxHSCLTaps || mode_lib->vba.WritebackChromaVTaps[k] > mode_lib->vba.WritebackMaxVSCLTaps || 2.0 * mode_lib->vba.WritebackHRatio[k] > mode_lib->vba.WritebackChromaHTaps[k] || 2.0 * mode_lib->vba.WritebackVRatio[k] > mode_lib->vba.WritebackChromaVTaps[k] || (mode_lib->vba.WritebackChromaHTaps[k] > 2.0 && ((mode_lib->vba.WritebackChromaHTaps[k] % 2) == 1))))) { mode_lib->vba.WritebackScaleRatioAndTapsSupport = false; } if (mode_lib->vba.WritebackVRatio[k] < 1.0) { mode_lib->vba.WritebackLumaVExtra = dml_max(1.0 - 2.0 / dml_ceil(1.0 / mode_lib->vba.WritebackVRatio[k], 1.0), 0.0); } else { mode_lib->vba.WritebackLumaVExtra = -1; } if ((mode_lib->vba.WritebackPixelFormat[k] == dm_444_32 && mode_lib->vba.WritebackLumaVTaps[k] > (mode_lib->vba.WritebackLineBufferLumaBufferSize + mode_lib->vba.WritebackLineBufferChromaBufferSize) / 3.0 / mode_lib->vba.WritebackDestinationWidth[k] - mode_lib->vba.WritebackLumaVExtra) || (mode_lib->vba.WritebackPixelFormat[k] == dm_420_8 && mode_lib->vba.WritebackLumaVTaps[k] > mode_lib->vba.WritebackLineBufferLumaBufferSize * 8.0 / 10.0 / mode_lib->vba.WritebackDestinationWidth[k] - mode_lib->vba.WritebackLumaVExtra) || (mode_lib->vba.WritebackPixelFormat[k] == dm_420_10 && mode_lib->vba.WritebackLumaVTaps[k] > mode_lib->vba.WritebackLineBufferLumaBufferSize * 8.0 / 10.0 / mode_lib->vba.WritebackDestinationWidth[k] - mode_lib->vba.WritebackLumaVExtra)) { mode_lib->vba.WritebackScaleRatioAndTapsSupport = false; } if (2.0 * mode_lib->vba.WritebackVRatio[k] < 1) { mode_lib->vba.WritebackChromaVExtra = 0.0; } else { mode_lib->vba.WritebackChromaVExtra = -1; } if ((mode_lib->vba.WritebackPixelFormat[k] == dm_420_8 && mode_lib->vba.WritebackChromaVTaps[k] > mode_lib->vba.WritebackLineBufferChromaBufferSize * 8.0 / 10.0 / mode_lib->vba.WritebackDestinationWidth[k] - mode_lib->vba.WritebackChromaVExtra) || (mode_lib->vba.WritebackPixelFormat[k] == dm_420_10 && mode_lib->vba.WritebackChromaVTaps[k] > mode_lib->vba.WritebackLineBufferChromaBufferSize * 8.0 / 10.0 / mode_lib->vba.WritebackDestinationWidth[k] - mode_lib->vba.WritebackChromaVExtra)) { mode_lib->vba.WritebackScaleRatioAndTapsSupport = false; } } } /*Maximum DISPCLK/DPPCLK Support check*/ mode_lib->vba.WritebackRequiredDISPCLK = 0.0; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.WritebackEnable[k] == true) { mode_lib->vba.WritebackRequiredDISPCLK = dml_max( mode_lib->vba.WritebackRequiredDISPCLK, CalculateWriteBackDISPCLK( mode_lib->vba.WritebackPixelFormat[k], mode_lib->vba.PixelClock[k], mode_lib->vba.WritebackHRatio[k], mode_lib->vba.WritebackVRatio[k], mode_lib->vba.WritebackLumaHTaps[k], mode_lib->vba.WritebackLumaVTaps[k], mode_lib->vba.WritebackChromaHTaps[k], mode_lib->vba.WritebackChromaVTaps[k], mode_lib->vba.WritebackDestinationWidth[k], mode_lib->vba.HTotal[k], mode_lib->vba.WritebackChromaLineBufferWidth)); } } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.HRatio[k] > 1.0) { locals->PSCL_FACTOR[k] = dml_min( mode_lib->vba.MaxDCHUBToPSCLThroughput, mode_lib->vba.MaxPSCLToLBThroughput * mode_lib->vba.HRatio[k] / dml_ceil( mode_lib->vba.htaps[k] / 6.0, 1.0)); } else { locals->PSCL_FACTOR[k] = dml_min( mode_lib->vba.MaxDCHUBToPSCLThroughput, mode_lib->vba.MaxPSCLToLBThroughput); } if (locals->BytePerPixelInDETC[k] == 0.0) { locals->PSCL_FACTOR_CHROMA[k] = 0.0; locals->MinDPPCLKUsingSingleDPP[k] = mode_lib->vba.PixelClock[k] * dml_max3( mode_lib->vba.vtaps[k] / 6.0 * dml_min( 1.0, mode_lib->vba.HRatio[k]), mode_lib->vba.HRatio[k] * mode_lib->vba.VRatio[k] / locals->PSCL_FACTOR[k], 1.0); if ((mode_lib->vba.htaps[k] > 6.0 || mode_lib->vba.vtaps[k] > 6.0) && locals->MinDPPCLKUsingSingleDPP[k] < 2.0 * mode_lib->vba.PixelClock[k]) { locals->MinDPPCLKUsingSingleDPP[k] = 2.0 * mode_lib->vba.PixelClock[k]; } } else { if (mode_lib->vba.HRatio[k] / 2.0 > 1.0) { locals->PSCL_FACTOR_CHROMA[k] = dml_min( mode_lib->vba.MaxDCHUBToPSCLThroughput, mode_lib->vba.MaxPSCLToLBThroughput * mode_lib->vba.HRatio[k] / 2.0 / dml_ceil( mode_lib->vba.HTAPsChroma[k] / 6.0, 1.0)); } else { locals->PSCL_FACTOR_CHROMA[k] = dml_min( mode_lib->vba.MaxDCHUBToPSCLThroughput, mode_lib->vba.MaxPSCLToLBThroughput); } locals->MinDPPCLKUsingSingleDPP[k] = mode_lib->vba.PixelClock[k] * dml_max5( mode_lib->vba.vtaps[k] / 6.0 * dml_min( 1.0, mode_lib->vba.HRatio[k]), mode_lib->vba.HRatio[k] * mode_lib->vba.VRatio[k] / locals->PSCL_FACTOR[k], mode_lib->vba.VTAPsChroma[k] / 6.0 * dml_min( 1.0, mode_lib->vba.HRatio[k] / 2.0), mode_lib->vba.HRatio[k] * mode_lib->vba.VRatio[k] / 4.0 / locals->PSCL_FACTOR_CHROMA[k], 1.0); if ((mode_lib->vba.htaps[k] > 6.0 || mode_lib->vba.vtaps[k] > 6.0 || mode_lib->vba.HTAPsChroma[k] > 6.0 || mode_lib->vba.VTAPsChroma[k] > 6.0) && locals->MinDPPCLKUsingSingleDPP[k] < 2.0 * mode_lib->vba.PixelClock[k]) { locals->MinDPPCLKUsingSingleDPP[k] = 2.0 * mode_lib->vba.PixelClock[k]; } } } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { Calculate256BBlockSizes( mode_lib->vba.SourcePixelFormat[k], mode_lib->vba.SurfaceTiling[k], dml_ceil(locals->BytePerPixelInDETY[k], 1.0), dml_ceil(locals->BytePerPixelInDETC[k], 2.0), &locals->Read256BlockHeightY[k], &locals->Read256BlockHeightC[k], &locals->Read256BlockWidthY[k], &locals->Read256BlockWidthC[k]); if (mode_lib->vba.SourceScan[k] == dm_horz) { locals->MaxSwathHeightY[k] = locals->Read256BlockHeightY[k]; locals->MaxSwathHeightC[k] = locals->Read256BlockHeightC[k]; } else { locals->MaxSwathHeightY[k] = locals->Read256BlockWidthY[k]; locals->MaxSwathHeightC[k] = locals->Read256BlockWidthC[k]; } if ((mode_lib->vba.SourcePixelFormat[k] == dm_444_64 || mode_lib->vba.SourcePixelFormat[k] == dm_444_32 || mode_lib->vba.SourcePixelFormat[k] == dm_444_16 || mode_lib->vba.SourcePixelFormat[k] == dm_mono_16 || mode_lib->vba.SourcePixelFormat[k] == dm_mono_8)) { if (mode_lib->vba.SurfaceTiling[k] == dm_sw_linear || (mode_lib->vba.SourcePixelFormat[k] == dm_444_64 && (mode_lib->vba.SurfaceTiling[k] == dm_sw_4kb_s || mode_lib->vba.SurfaceTiling[k] == dm_sw_4kb_s_x || mode_lib->vba.SurfaceTiling[k] == dm_sw_64kb_s || mode_lib->vba.SurfaceTiling[k] == dm_sw_64kb_s_t || mode_lib->vba.SurfaceTiling[k] == dm_sw_64kb_s_x || mode_lib->vba.SurfaceTiling[k] == dm_sw_var_s || mode_lib->vba.SurfaceTiling[k] == dm_sw_var_s_x) && mode_lib->vba.SourceScan[k] == dm_horz)) { locals->MinSwathHeightY[k] = locals->MaxSwathHeightY[k]; } else { locals->MinSwathHeightY[k] = locals->MaxSwathHeightY[k] / 2.0; } locals->MinSwathHeightC[k] = locals->MaxSwathHeightC[k]; } else { if (mode_lib->vba.SurfaceTiling[k] == dm_sw_linear) { locals->MinSwathHeightY[k] = locals->MaxSwathHeightY[k]; locals->MinSwathHeightC[k] = locals->MaxSwathHeightC[k]; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_420_8 && mode_lib->vba.SourceScan[k] == dm_horz) { locals->MinSwathHeightY[k] = locals->MaxSwathHeightY[k] / 2.0; locals->MinSwathHeightC[k] = locals->MaxSwathHeightC[k]; } else if (mode_lib->vba.SourcePixelFormat[k] == dm_420_10 && mode_lib->vba.SourceScan[k] == dm_horz) { locals->MinSwathHeightC[k] = locals->MaxSwathHeightC[k] / 2.0; locals->MinSwathHeightY[k] = locals->MaxSwathHeightY[k]; } else { locals->MinSwathHeightY[k] = locals->MaxSwathHeightY[k]; locals->MinSwathHeightC[k] = locals->MaxSwathHeightC[k]; } } if (mode_lib->vba.SurfaceTiling[k] == dm_sw_linear) { mode_lib->vba.MaximumSwathWidthSupport = 8192.0; } else { mode_lib->vba.MaximumSwathWidthSupport = 5120.0; } mode_lib->vba.MaximumSwathWidthInDETBuffer = dml_min( mode_lib->vba.MaximumSwathWidthSupport, mode_lib->vba.DETBufferSizeInKByte * 1024.0 / 2.0 / (locals->BytePerPixelInDETY[k] * locals->MinSwathHeightY[k] + locals->BytePerPixelInDETC[k] / 2.0 * locals->MinSwathHeightC[k])); if (locals->BytePerPixelInDETC[k] == 0.0) { mode_lib->vba.MaximumSwathWidthInLineBuffer = mode_lib->vba.LineBufferSize * dml_max(mode_lib->vba.HRatio[k], 1.0) / mode_lib->vba.LBBitPerPixel[k] / (mode_lib->vba.vtaps[k] + dml_max( dml_ceil( mode_lib->vba.VRatio[k], 1.0) - 2, 0.0)); } else { mode_lib->vba.MaximumSwathWidthInLineBuffer = dml_min( mode_lib->vba.LineBufferSize * dml_max( mode_lib->vba.HRatio[k], 1.0) / mode_lib->vba.LBBitPerPixel[k] / (mode_lib->vba.vtaps[k] + dml_max( dml_ceil( mode_lib->vba.VRatio[k], 1.0) - 2, 0.0)), 2.0 * mode_lib->vba.LineBufferSize * dml_max( mode_lib->vba.HRatio[k] / 2.0, 1.0) / mode_lib->vba.LBBitPerPixel[k] / (mode_lib->vba.VTAPsChroma[k] + dml_max( dml_ceil( mode_lib->vba.VRatio[k] / 2.0, 1.0) - 2, 0.0))); } locals->MaximumSwathWidth[k] = dml_min( mode_lib->vba.MaximumSwathWidthInDETBuffer, mode_lib->vba.MaximumSwathWidthInLineBuffer); } for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { for (j = 0; j < 2; j++) { mode_lib->vba.MaxDispclkRoundedDownToDFSGranularity = RoundToDFSGranularityDown( mode_lib->vba.MaxDispclk[i], mode_lib->vba.DISPCLKDPPCLKVCOSpeed); mode_lib->vba.MaxDppclkRoundedDownToDFSGranularity = RoundToDFSGranularityDown( mode_lib->vba.MaxDppclk[i], mode_lib->vba.DISPCLKDPPCLKVCOSpeed); locals->RequiredDISPCLK[i][j] = 0.0; locals->DISPCLK_DPPCLK_Support[i][j] = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { mode_lib->vba.PlaneRequiredDISPCLKWithoutODMCombine = mode_lib->vba.PixelClock[k] * (1.0 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0) * (1.0 + mode_lib->vba.DISPCLKRampingMargin / 100.0); if (mode_lib->vba.PlaneRequiredDISPCLKWithoutODMCombine >= mode_lib->vba.MaxDispclk[i] && i == mode_lib->vba.soc.num_states) mode_lib->vba.PlaneRequiredDISPCLKWithoutODMCombine = mode_lib->vba.PixelClock[k] * (1 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0); mode_lib->vba.PlaneRequiredDISPCLKWithODMCombine = mode_lib->vba.PixelClock[k] / 2 * (1 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0) * (1 + mode_lib->vba.DISPCLKRampingMargin / 100.0); if (mode_lib->vba.PlaneRequiredDISPCLKWithODMCombine >= mode_lib->vba.MaxDispclk[i] && i == mode_lib->vba.soc.num_states) mode_lib->vba.PlaneRequiredDISPCLKWithODMCombine = mode_lib->vba.PixelClock[k] / 2 * (1 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0); if (mode_lib->vba.ODMCapability == false || mode_lib->vba.PlaneRequiredDISPCLKWithoutODMCombine <= mode_lib->vba.MaxDispclkRoundedDownToDFSGranularity) { locals->ODMCombineEnablePerState[i][k] = false; mode_lib->vba.PlaneRequiredDISPCLK = mode_lib->vba.PlaneRequiredDISPCLKWithoutODMCombine; } else { locals->ODMCombineEnablePerState[i][k] = true; mode_lib->vba.PlaneRequiredDISPCLK = mode_lib->vba.PlaneRequiredDISPCLKWithODMCombine; } if (locals->MinDPPCLKUsingSingleDPP[k] * (1.0 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0) <= mode_lib->vba.MaxDppclkRoundedDownToDFSGranularity && locals->SwathWidthYSingleDPP[k] <= locals->MaximumSwathWidth[k] && locals->ODMCombineEnablePerState[i][k] == false) { locals->NoOfDPP[i][j][k] = 1; locals->RequiredDPPCLK[i][j][k] = locals->MinDPPCLKUsingSingleDPP[k] * (1.0 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0); } else { locals->NoOfDPP[i][j][k] = 2; locals->RequiredDPPCLK[i][j][k] = locals->MinDPPCLKUsingSingleDPP[k] * (1.0 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0) / 2.0; } locals->RequiredDISPCLK[i][j] = dml_max( locals->RequiredDISPCLK[i][j], mode_lib->vba.PlaneRequiredDISPCLK); if ((locals->MinDPPCLKUsingSingleDPP[k] / locals->NoOfDPP[i][j][k] * (1.0 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0) > mode_lib->vba.MaxDppclkRoundedDownToDFSGranularity) || (mode_lib->vba.PlaneRequiredDISPCLK > mode_lib->vba.MaxDispclkRoundedDownToDFSGranularity)) { locals->DISPCLK_DPPCLK_Support[i][j] = false; } } locals->TotalNumberOfActiveDPP[i][j] = 0.0; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) locals->TotalNumberOfActiveDPP[i][j] = locals->TotalNumberOfActiveDPP[i][j] + locals->NoOfDPP[i][j][k]; if (j == 1) { while (locals->TotalNumberOfActiveDPP[i][j] < mode_lib->vba.MaxNumDPP && locals->TotalNumberOfActiveDPP[i][j] < 2 * mode_lib->vba.NumberOfActivePlanes) { double BWOfNonSplitPlaneOfMaximumBandwidth; unsigned int NumberOfNonSplitPlaneOfMaximumBandwidth; BWOfNonSplitPlaneOfMaximumBandwidth = 0; NumberOfNonSplitPlaneOfMaximumBandwidth = 0; for (k = 0; k < mode_lib->vba.NumberOfActivePlanes; ++k) { if (locals->ReadBandwidth[k] > BWOfNonSplitPlaneOfMaximumBandwidth && locals->NoOfDPP[i][j][k] == 1) { BWOfNonSplitPlaneOfMaximumBandwidth = locals->ReadBandwidth[k]; NumberOfNonSplitPlaneOfMaximumBandwidth = k; } } locals->NoOfDPP[i][j][NumberOfNonSplitPlaneOfMaximumBandwidth] = 2; locals->RequiredDPPCLK[i][j][NumberOfNonSplitPlaneOfMaximumBandwidth] = locals->MinDPPCLKUsingSingleDPP[NumberOfNonSplitPlaneOfMaximumBandwidth] * (1 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100) / 2; locals->TotalNumberOfActiveDPP[i][j] = locals->TotalNumberOfActiveDPP[i][j] + 1; } } if (locals->TotalNumberOfActiveDPP[i][j] > mode_lib->vba.MaxNumDPP) { locals->RequiredDISPCLK[i][j] = 0.0; locals->DISPCLK_DPPCLK_Support[i][j] = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { locals->ODMCombineEnablePerState[i][k] = false; if (locals->SwathWidthYSingleDPP[k] <= locals->MaximumSwathWidth[k]) { locals->NoOfDPP[i][j][k] = 1; locals->RequiredDPPCLK[i][j][k] = locals->MinDPPCLKUsingSingleDPP[k] * (1.0 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0); } else { locals->NoOfDPP[i][j][k] = 2; locals->RequiredDPPCLK[i][j][k] = locals->MinDPPCLKUsingSingleDPP[k] * (1.0 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0) / 2.0; } if (i != mode_lib->vba.soc.num_states) { mode_lib->vba.PlaneRequiredDISPCLK = mode_lib->vba.PixelClock[k] * (1.0 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0) * (1.0 + mode_lib->vba.DISPCLKRampingMargin / 100.0); } else { mode_lib->vba.PlaneRequiredDISPCLK = mode_lib->vba.PixelClock[k] * (1.0 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0); } locals->RequiredDISPCLK[i][j] = dml_max( locals->RequiredDISPCLK[i][j], mode_lib->vba.PlaneRequiredDISPCLK); if (locals->MinDPPCLKUsingSingleDPP[k] / locals->NoOfDPP[i][j][k] * (1.0 + mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0) > mode_lib->vba.MaxDppclkRoundedDownToDFSGranularity || mode_lib->vba.PlaneRequiredDISPCLK > mode_lib->vba.MaxDispclkRoundedDownToDFSGranularity) locals->DISPCLK_DPPCLK_Support[i][j] = false; } locals->TotalNumberOfActiveDPP[i][j] = 0.0; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) locals->TotalNumberOfActiveDPP[i][j] = locals->TotalNumberOfActiveDPP[i][j] + locals->NoOfDPP[i][j][k]; } locals->RequiredDISPCLK[i][j] = dml_max( locals->RequiredDISPCLK[i][j], mode_lib->vba.WritebackRequiredDISPCLK); if (mode_lib->vba.MaxDispclkRoundedDownToDFSGranularity < mode_lib->vba.WritebackRequiredDISPCLK) { locals->DISPCLK_DPPCLK_Support[i][j] = false; } } } /*Viewport Size Check*/ for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { locals->ViewportSizeSupport[i] = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (locals->ODMCombineEnablePerState[i][k] == true) { if (dml_min(locals->SwathWidthYSingleDPP[k], dml_round(mode_lib->vba.HActive[k] / 2.0 * mode_lib->vba.HRatio[k])) > locals->MaximumSwathWidth[k]) { locals->ViewportSizeSupport[i] = false; } } else { if (locals->SwathWidthYSingleDPP[k] / 2.0 > locals->MaximumSwathWidth[k]) { locals->ViewportSizeSupport[i] = false; } } } } /*Total Available Pipes Support Check*/ for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { for (j = 0; j < 2; j++) { if (locals->TotalNumberOfActiveDPP[i][j] <= mode_lib->vba.MaxNumDPP) locals->TotalAvailablePipesSupport[i][j] = true; else locals->TotalAvailablePipesSupport[i][j] = false; } } /*Total Available OTG Support Check*/ mode_lib->vba.TotalNumberOfActiveOTG = 0.0; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.BlendingAndTiming[k] == k) { mode_lib->vba.TotalNumberOfActiveOTG = mode_lib->vba.TotalNumberOfActiveOTG + 1.0; } } if (mode_lib->vba.TotalNumberOfActiveOTG <= mode_lib->vba.MaxNumOTG) { mode_lib->vba.NumberOfOTGSupport = true; } else { mode_lib->vba.NumberOfOTGSupport = false; } /*Display IO and DSC Support Check*/ mode_lib->vba.NonsupportedDSCInputBPC = false; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (!(mode_lib->vba.DSCInputBitPerComponent[k] == 12.0 || mode_lib->vba.DSCInputBitPerComponent[k] == 10.0 || mode_lib->vba.DSCInputBitPerComponent[k] == 8.0)) { mode_lib->vba.NonsupportedDSCInputBPC = true; } } for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { locals->RequiresDSC[i][k] = 0; locals->RequiresFEC[i][k] = 0; if (mode_lib->vba.BlendingAndTiming[k] == k) { if (mode_lib->vba.Output[k] == dm_hdmi) { locals->RequiresDSC[i][k] = 0; locals->RequiresFEC[i][k] = 0; locals->OutputBppPerState[i][k] = TruncToValidBPP( dml_min(600.0, mode_lib->vba.PHYCLKPerState[i]) / mode_lib->vba.PixelClockBackEnd[k] * 24, false, mode_lib->vba.Output[k], mode_lib->vba.OutputFormat[k], mode_lib->vba.DSCInputBitPerComponent[k]); } else if (mode_lib->vba.Output[k] == dm_dp || mode_lib->vba.Output[k] == dm_edp) { if (mode_lib->vba.Output[k] == dm_edp) { mode_lib->vba.EffectiveFECOverhead = 0.0; } else { mode_lib->vba.EffectiveFECOverhead = mode_lib->vba.FECOverhead; } if (mode_lib->vba.PHYCLKPerState[i] >= 270.0) { mode_lib->vba.Outbpp = TruncToValidBPP( (1.0 - mode_lib->vba.Downspreading / 100.0) * 270.0 * mode_lib->vba.OutputLinkDPLanes[k] / mode_lib->vba.PixelClockBackEnd[k] * 8.0, false, mode_lib->vba.Output[k], mode_lib->vba.OutputFormat[k], mode_lib->vba.DSCInputBitPerComponent[k]); mode_lib->vba.OutbppDSC = TruncToValidBPP( (1.0 - mode_lib->vba.Downspreading / 100.0) * (1.0 - mode_lib->vba.EffectiveFECOverhead / 100.0) * 270.0 * mode_lib->vba.OutputLinkDPLanes[k] / mode_lib->vba.PixelClockBackEnd[k] * 8.0, true, mode_lib->vba.Output[k], mode_lib->vba.OutputFormat[k], mode_lib->vba.DSCInputBitPerComponent[k]); if (mode_lib->vba.DSCEnabled[k] == true) { locals->RequiresDSC[i][k] = true; if (mode_lib->vba.Output[k] == dm_dp) { locals->RequiresFEC[i][k] = true; } else { locals->RequiresFEC[i][k] = false; } mode_lib->vba.Outbpp = mode_lib->vba.OutbppDSC; } else { locals->RequiresDSC[i][k] = false; locals->RequiresFEC[i][k] = false; } locals->OutputBppPerState[i][k] = mode_lib->vba.Outbpp; } if (mode_lib->vba.Outbpp == BPP_INVALID && mode_lib->vba.PHYCLKPerState[i] >= 540.0) { mode_lib->vba.Outbpp = TruncToValidBPP( (1.0 - mode_lib->vba.Downspreading / 100.0) * 540.0 * mode_lib->vba.OutputLinkDPLanes[k] / mode_lib->vba.PixelClockBackEnd[k] * 8.0, false, mode_lib->vba.Output[k], mode_lib->vba.OutputFormat[k], mode_lib->vba.DSCInputBitPerComponent[k]); mode_lib->vba.OutbppDSC = TruncToValidBPP( (1.0 - mode_lib->vba.Downspreading / 100.0) * (1.0 - mode_lib->vba.EffectiveFECOverhead / 100.0) * 540.0 * mode_lib->vba.OutputLinkDPLanes[k] / mode_lib->vba.PixelClockBackEnd[k] * 8.0, true, mode_lib->vba.Output[k], mode_lib->vba.OutputFormat[k], mode_lib->vba.DSCInputBitPerComponent[k]); if (mode_lib->vba.DSCEnabled[k] == true) { locals->RequiresDSC[i][k] = true; if (mode_lib->vba.Output[k] == dm_dp) { locals->RequiresFEC[i][k] = true; } else { locals->RequiresFEC[i][k] = false; } mode_lib->vba.Outbpp = mode_lib->vba.OutbppDSC; } else { locals->RequiresDSC[i][k] = false; locals->RequiresFEC[i][k] = false; } locals->OutputBppPerState[i][k] = mode_lib->vba.Outbpp; } if (mode_lib->vba.Outbpp == BPP_INVALID && mode_lib->vba.PHYCLKPerState[i] >= 810.0) { mode_lib->vba.Outbpp = TruncToValidBPP( (1.0 - mode_lib->vba.Downspreading / 100.0) * 810.0 * mode_lib->vba.OutputLinkDPLanes[k] / mode_lib->vba.PixelClockBackEnd[k] * 8.0, false, mode_lib->vba.Output[k], mode_lib->vba.OutputFormat[k], mode_lib->vba.DSCInputBitPerComponent[k]); mode_lib->vba.OutbppDSC = TruncToValidBPP( (1.0 - mode_lib->vba.Downspreading / 100.0) * (1.0 - mode_lib->vba.EffectiveFECOverhead / 100.0) * 810.0 * mode_lib->vba.OutputLinkDPLanes[k] / mode_lib->vba.PixelClockBackEnd[k] * 8.0, true, mode_lib->vba.Output[k], mode_lib->vba.OutputFormat[k], mode_lib->vba.DSCInputBitPerComponent[k]); if (mode_lib->vba.DSCEnabled[k] == true || mode_lib->vba.Outbpp == BPP_INVALID) { locals->RequiresDSC[i][k] = true; if (mode_lib->vba.Output[k] == dm_dp) { locals->RequiresFEC[i][k] = true; } else { locals->RequiresFEC[i][k] = false; } mode_lib->vba.Outbpp = mode_lib->vba.OutbppDSC; } else { locals->RequiresDSC[i][k] = false; locals->RequiresFEC[i][k] = false; } locals->OutputBppPerState[i][k] = mode_lib->vba.Outbpp; } } } else { locals->OutputBppPerState[i][k] = BPP_BLENDED_PIPE; } } } for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { locals->DIOSupport[i] = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (locals->OutputBppPerState[i][k] == BPP_INVALID || (mode_lib->vba.OutputFormat[k] == dm_420 && mode_lib->vba.Interlace[k] == true && mode_lib->vba.ProgressiveToInterlaceUnitInOPP == true)) { locals->DIOSupport[i] = false; } } } for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { locals->DSCCLKRequiredMoreThanSupported[i] = false; if (mode_lib->vba.BlendingAndTiming[k] == k) { if ((mode_lib->vba.Output[k] == dm_dp || mode_lib->vba.Output[k] == dm_edp)) { if (mode_lib->vba.OutputFormat[k] == dm_420 || mode_lib->vba.OutputFormat[k] == dm_n422) { mode_lib->vba.DSCFormatFactor = 2; } else { mode_lib->vba.DSCFormatFactor = 1; } if (locals->RequiresDSC[i][k] == true) { if (locals->ODMCombineEnablePerState[i][k] == true) { if (mode_lib->vba.PixelClockBackEnd[k] / 6.0 / mode_lib->vba.DSCFormatFactor > (1.0 - mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0) * mode_lib->vba.MaxDSCCLK[i]) { locals->DSCCLKRequiredMoreThanSupported[i] = true; } } else { if (mode_lib->vba.PixelClockBackEnd[k] / 3.0 / mode_lib->vba.DSCFormatFactor > (1.0 - mode_lib->vba.DISPCLKDPPCLKDSCCLKDownSpreading / 100.0) * mode_lib->vba.MaxDSCCLK[i]) { locals->DSCCLKRequiredMoreThanSupported[i] = true; } } } } } } } for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { locals->NotEnoughDSCUnits[i] = false; mode_lib->vba.TotalDSCUnitsRequired = 0.0; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (locals->RequiresDSC[i][k] == true) { if (locals->ODMCombineEnablePerState[i][k] == true) { mode_lib->vba.TotalDSCUnitsRequired = mode_lib->vba.TotalDSCUnitsRequired + 2.0; } else { mode_lib->vba.TotalDSCUnitsRequired = mode_lib->vba.TotalDSCUnitsRequired + 1.0; } } } if (mode_lib->vba.TotalDSCUnitsRequired > mode_lib->vba.NumberOfDSC) { locals->NotEnoughDSCUnits[i] = true; } } /*DSC Delay per state*/ for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.BlendingAndTiming[k] != k) { mode_lib->vba.slices = 0; } else if (locals->RequiresDSC[i][k] == 0 || locals->RequiresDSC[i][k] == false) { mode_lib->vba.slices = 0; } else if (mode_lib->vba.PixelClockBackEnd[k] > 3200.0) { mode_lib->vba.slices = dml_ceil( mode_lib->vba.PixelClockBackEnd[k] / 400.0, 4.0); } else if (mode_lib->vba.PixelClockBackEnd[k] > 1360.0) { mode_lib->vba.slices = 8.0; } else if (mode_lib->vba.PixelClockBackEnd[k] > 680.0) { mode_lib->vba.slices = 4.0; } else if (mode_lib->vba.PixelClockBackEnd[k] > 340.0) { mode_lib->vba.slices = 2.0; } else { mode_lib->vba.slices = 1.0; } if (locals->OutputBppPerState[i][k] == BPP_BLENDED_PIPE || locals->OutputBppPerState[i][k] == BPP_INVALID) { mode_lib->vba.bpp = 0.0; } else { mode_lib->vba.bpp = locals->OutputBppPerState[i][k]; } if (locals->RequiresDSC[i][k] == true && mode_lib->vba.bpp != 0.0) { if (locals->ODMCombineEnablePerState[i][k] == false) { locals->DSCDelayPerState[i][k] = dscceComputeDelay( mode_lib->vba.DSCInputBitPerComponent[k], mode_lib->vba.bpp, dml_ceil( mode_lib->vba.HActive[k] / mode_lib->vba.slices, 1.0), mode_lib->vba.slices, mode_lib->vba.OutputFormat[k]) + dscComputeDelay( mode_lib->vba.OutputFormat[k]); } else { locals->DSCDelayPerState[i][k] = 2.0 * (dscceComputeDelay( mode_lib->vba.DSCInputBitPerComponent[k], mode_lib->vba.bpp, dml_ceil(mode_lib->vba.HActive[k] / mode_lib->vba.slices, 1.0), mode_lib->vba.slices / 2, mode_lib->vba.OutputFormat[k]) + dscComputeDelay(mode_lib->vba.OutputFormat[k])); } locals->DSCDelayPerState[i][k] = locals->DSCDelayPerState[i][k] * mode_lib->vba.PixelClock[k] / mode_lib->vba.PixelClockBackEnd[k]; } else { locals->DSCDelayPerState[i][k] = 0.0; } } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { for (m = 0; m <= mode_lib->vba.NumberOfActivePlanes - 1; m++) { for (j = 0; j <= mode_lib->vba.NumberOfActivePlanes - 1; j++) { if (mode_lib->vba.BlendingAndTiming[k] == m && locals->RequiresDSC[i][m] == true) locals->DSCDelayPerState[i][k] = locals->DSCDelayPerState[i][m]; } } } } //Prefetch Check for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { for (j = 0; j < 2; j++) { for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (locals->ODMCombineEnablePerState[i][k] == true) locals->SwathWidthYPerState[i][j][k] = dml_min(locals->SwathWidthYSingleDPP[k], dml_round(locals->HActive[k] / 2 * locals->HRatio[k])); else locals->SwathWidthYPerState[i][j][k] = locals->SwathWidthYSingleDPP[k] / locals->NoOfDPP[i][j][k]; locals->SwathWidthGranularityY = 256 / dml_ceil(locals->BytePerPixelInDETY[k], 1) / locals->MaxSwathHeightY[k]; locals->RoundedUpMaxSwathSizeBytesY = (dml_ceil(locals->SwathWidthYPerState[i][j][k] - 1, locals->SwathWidthGranularityY) + locals->SwathWidthGranularityY) * locals->BytePerPixelInDETY[k] * locals->MaxSwathHeightY[k]; if (locals->SourcePixelFormat[k] == dm_420_10) { locals->RoundedUpMaxSwathSizeBytesY = dml_ceil(locals->RoundedUpMaxSwathSizeBytesY, 256) + 256; } if (locals->MaxSwathHeightC[k] > 0) { locals->SwathWidthGranularityC = 256 / dml_ceil(locals->BytePerPixelInDETC[k], 2) / locals->MaxSwathHeightC[k]; locals->RoundedUpMaxSwathSizeBytesC = (dml_ceil(locals->SwathWidthYPerState[i][j][k] / 2 - 1, locals->SwathWidthGranularityC) + locals->SwathWidthGranularityC) * locals->BytePerPixelInDETC[k] * locals->MaxSwathHeightC[k]; } if (locals->SourcePixelFormat[k] == dm_420_10) { locals->RoundedUpMaxSwathSizeBytesC = dml_ceil(locals->RoundedUpMaxSwathSizeBytesC, 256) + 256; } else { locals->RoundedUpMaxSwathSizeBytesC = 0; } if (locals->RoundedUpMaxSwathSizeBytesY + locals->RoundedUpMaxSwathSizeBytesC <= locals->DETBufferSizeInKByte * 1024 / 2) { locals->SwathHeightYPerState[i][j][k] = locals->MaxSwathHeightY[k]; locals->SwathHeightCPerState[i][j][k] = locals->MaxSwathHeightC[k]; } else { locals->SwathHeightYPerState[i][j][k] = locals->MinSwathHeightY[k]; locals->SwathHeightCPerState[i][j][k] = locals->MinSwathHeightC[k]; } if (locals->BytePerPixelInDETC[k] == 0) { locals->LinesInDETLuma = locals->DETBufferSizeInKByte * 1024 / locals->BytePerPixelInDETY[k] / locals->SwathWidthYPerState[i][j][k]; locals->LinesInDETChroma = 0; } else if (locals->SwathHeightYPerState[i][j][k] <= locals->SwathHeightCPerState[i][j][k]) { locals->LinesInDETLuma = locals->DETBufferSizeInKByte * 1024 / 2 / locals->BytePerPixelInDETY[k] / locals->SwathWidthYPerState[i][j][k]; locals->LinesInDETChroma = locals->DETBufferSizeInKByte * 1024 / 2 / locals->BytePerPixelInDETC[k] / (locals->SwathWidthYPerState[i][j][k] / 2); } else { locals->LinesInDETLuma = locals->DETBufferSizeInKByte * 1024 * 2 / 3 / locals->BytePerPixelInDETY[k] / locals->SwathWidthYPerState[i][j][k]; locals->LinesInDETChroma = locals->DETBufferSizeInKByte * 1024 / 3 / locals->BytePerPixelInDETY[k] / (locals->SwathWidthYPerState[i][j][k] / 2); } locals->EffectiveLBLatencyHidingSourceLinesLuma = dml_min(locals->MaxLineBufferLines, dml_floor(locals->LineBufferSize / locals->LBBitPerPixel[k] / (locals->SwathWidthYPerState[i][j][k] / dml_max(locals->HRatio[k], 1)), 1)) - (locals->vtaps[k] - 1); locals->EffectiveLBLatencyHidingSourceLinesChroma = dml_min(locals->MaxLineBufferLines, dml_floor(locals->LineBufferSize / locals->LBBitPerPixel[k] / (locals->SwathWidthYPerState[i][j][k] / 2 / dml_max(locals->HRatio[k] / 2, 1)), 1)) - (locals->VTAPsChroma[k] - 1); locals->EffectiveDETLBLinesLuma = dml_floor(locals->LinesInDETLuma + dml_min( locals->LinesInDETLuma * locals->RequiredDISPCLK[i][j] * locals->BytePerPixelInDETY[k] * locals->PSCL_FACTOR[k] / locals->ReturnBWPerState[i], locals->EffectiveLBLatencyHidingSourceLinesLuma), locals->SwathHeightYPerState[i][j][k]); locals->EffectiveDETLBLinesChroma = dml_floor(locals->LinesInDETChroma + dml_min( locals->LinesInDETChroma * locals->RequiredDISPCLK[i][j] * locals->BytePerPixelInDETC[k] * locals->PSCL_FACTOR_CHROMA[k] / locals->ReturnBWPerState[i], locals->EffectiveLBLatencyHidingSourceLinesChroma), locals->SwathHeightCPerState[i][j][k]); if (locals->BytePerPixelInDETC[k] == 0) { locals->UrgentLatencySupportUsPerState[i][j][k] = locals->EffectiveDETLBLinesLuma * (locals->HTotal[k] / locals->PixelClock[k]) / locals->VRatio[k] - locals->EffectiveDETLBLinesLuma * locals->SwathWidthYPerState[i][j][k] * dml_ceil(locals->BytePerPixelInDETY[k], 1) / (locals->ReturnBWPerState[i] / locals->NoOfDPP[i][j][k]); } else { locals->UrgentLatencySupportUsPerState[i][j][k] = dml_min( locals->EffectiveDETLBLinesLuma * (locals->HTotal[k] / locals->PixelClock[k]) / locals->VRatio[k] - locals->EffectiveDETLBLinesLuma * locals->SwathWidthYPerState[i][j][k] * dml_ceil(locals->BytePerPixelInDETY[k], 1) / (locals->ReturnBWPerState[i] / locals->NoOfDPP[i][j][k]), locals->EffectiveDETLBLinesChroma * (locals->HTotal[k] / locals->PixelClock[k]) / (locals->VRatio[k] / 2) - locals->EffectiveDETLBLinesChroma * locals->SwathWidthYPerState[i][j][k] / 2 * dml_ceil(locals->BytePerPixelInDETC[k], 2) / (locals->ReturnBWPerState[i] / locals->NoOfDPP[i][j][k])); } } } } for (i = 0; i <= locals->soc.num_states; i++) { for (j = 0; j < 2; j++) { locals->UrgentLatencySupport[i][j] = true; for (k = 0; k < locals->NumberOfActivePlanes; k++) { if (locals->UrgentLatencySupportUsPerState[i][j][k] < locals->UrgentLatency) locals->UrgentLatencySupport[i][j] = false; } } } /*Prefetch Check*/ for (i = 0; i <= locals->soc.num_states; i++) { for (j = 0; j < 2; j++) { locals->TotalNumberOfDCCActiveDPP[i][j] = 0; for (k = 0; k < locals->NumberOfActivePlanes; k++) { if (locals->DCCEnable[k] == true) { locals->TotalNumberOfDCCActiveDPP[i][j] = locals->TotalNumberOfDCCActiveDPP[i][j] + locals->NoOfDPP[i][j][k]; } } } } CalculateMinAndMaxPrefetchMode(locals->AllowDRAMSelfRefreshOrDRAMClockChangeInVblank, &locals->MinPrefetchMode, &locals->MaxPrefetchMode); locals->MaxTotalVActiveRDBandwidth = 0; for (k = 0; k < locals->NumberOfActivePlanes; k++) { locals->MaxTotalVActiveRDBandwidth = locals->MaxTotalVActiveRDBandwidth + locals->ReadBandwidth[k]; } for (i = 0; i <= locals->soc.num_states; i++) { for (j = 0; j < 2; j++) { for (k = 0; k < locals->NumberOfActivePlanes; k++) { locals->NoOfDPPThisState[k] = locals->NoOfDPP[i][j][k]; locals->RequiredDPPCLKThisState[k] = locals->RequiredDPPCLK[i][j][k]; locals->SwathHeightYThisState[k] = locals->SwathHeightYPerState[i][j][k]; locals->SwathHeightCThisState[k] = locals->SwathHeightCPerState[i][j][k]; locals->SwathWidthYThisState[k] = locals->SwathWidthYPerState[i][j][k]; mode_lib->vba.ProjectedDCFCLKDeepSleep = dml_max( mode_lib->vba.ProjectedDCFCLKDeepSleep, mode_lib->vba.PixelClock[k] / 16.0); if (mode_lib->vba.BytePerPixelInDETC[k] == 0.0) { if (mode_lib->vba.VRatio[k] <= 1.0) { mode_lib->vba.ProjectedDCFCLKDeepSleep = dml_max( mode_lib->vba.ProjectedDCFCLKDeepSleep, 1.1 * dml_ceil( mode_lib->vba.BytePerPixelInDETY[k], 1.0) / 64.0 * mode_lib->vba.HRatio[k] * mode_lib->vba.PixelClock[k] / mode_lib->vba.NoOfDPP[i][j][k]); } else { mode_lib->vba.ProjectedDCFCLKDeepSleep = dml_max( mode_lib->vba.ProjectedDCFCLKDeepSleep, 1.1 * dml_ceil( mode_lib->vba.BytePerPixelInDETY[k], 1.0) / 64.0 * mode_lib->vba.PSCL_FACTOR[k] * mode_lib->vba.RequiredDPPCLK[i][j][k]); } } else { if (mode_lib->vba.VRatio[k] <= 1.0) { mode_lib->vba.ProjectedDCFCLKDeepSleep = dml_max( mode_lib->vba.ProjectedDCFCLKDeepSleep, 1.1 * dml_ceil( mode_lib->vba.BytePerPixelInDETY[k], 1.0) / 32.0 * mode_lib->vba.HRatio[k] * mode_lib->vba.PixelClock[k] / mode_lib->vba.NoOfDPP[i][j][k]); } else { mode_lib->vba.ProjectedDCFCLKDeepSleep = dml_max( mode_lib->vba.ProjectedDCFCLKDeepSleep, 1.1 * dml_ceil( mode_lib->vba.BytePerPixelInDETY[k], 1.0) / 32.0 * mode_lib->vba.PSCL_FACTOR[k] * mode_lib->vba.RequiredDPPCLK[i][j][k]); } if (mode_lib->vba.VRatio[k] / 2.0 <= 1.0) { mode_lib->vba.ProjectedDCFCLKDeepSleep = dml_max( mode_lib->vba.ProjectedDCFCLKDeepSleep, 1.1 * dml_ceil( mode_lib->vba.BytePerPixelInDETC[k], 2.0) / 32.0 * mode_lib->vba.HRatio[k] / 2.0 * mode_lib->vba.PixelClock[k] / mode_lib->vba.NoOfDPP[i][j][k]); } else { mode_lib->vba.ProjectedDCFCLKDeepSleep = dml_max( mode_lib->vba.ProjectedDCFCLKDeepSleep, 1.1 * dml_ceil( mode_lib->vba.BytePerPixelInDETC[k], 2.0) / 32.0 * mode_lib->vba.PSCL_FACTOR_CHROMA[k] * mode_lib->vba.RequiredDPPCLK[i][j][k]); } } } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { mode_lib->vba.PDEAndMetaPTEBytesPerFrameY = CalculateVMAndRowBytes( mode_lib, mode_lib->vba.DCCEnable[k], mode_lib->vba.Read256BlockHeightY[k], mode_lib->vba.Read256BlockWidthY[k], mode_lib->vba.SourcePixelFormat[k], mode_lib->vba.SurfaceTiling[k], dml_ceil(mode_lib->vba.BytePerPixelInDETY[k], 1.0), mode_lib->vba.SourceScan[k], mode_lib->vba.ViewportWidth[k], mode_lib->vba.ViewportHeight[k], mode_lib->vba.SwathWidthYPerState[i][j][k], mode_lib->vba.GPUVMEnable, mode_lib->vba.VMMPageSize, mode_lib->vba.PTEBufferSizeInRequestsLuma, mode_lib->vba.PDEProcessingBufIn64KBReqs, mode_lib->vba.PitchY[k], mode_lib->vba.DCCMetaPitchY[k], &mode_lib->vba.MacroTileWidthY[k], &mode_lib->vba.MetaRowBytesY, &mode_lib->vba.DPTEBytesPerRowY, &mode_lib->vba.PTEBufferSizeNotExceededY[i][j][k], &mode_lib->vba.dpte_row_height[k], &mode_lib->vba.meta_row_height[k]); mode_lib->vba.PrefetchLinesY[k] = CalculatePrefetchSourceLines( mode_lib, mode_lib->vba.VRatio[k], mode_lib->vba.vtaps[k], mode_lib->vba.Interlace[k], mode_lib->vba.ProgressiveToInterlaceUnitInOPP, mode_lib->vba.SwathHeightYPerState[i][j][k], mode_lib->vba.ViewportYStartY[k], &mode_lib->vba.PrefillY[k], &mode_lib->vba.MaxNumSwY[k]); if ((mode_lib->vba.SourcePixelFormat[k] != dm_444_64 && mode_lib->vba.SourcePixelFormat[k] != dm_444_32 && mode_lib->vba.SourcePixelFormat[k] != dm_444_16 && mode_lib->vba.SourcePixelFormat[k] != dm_mono_16 && mode_lib->vba.SourcePixelFormat[k] != dm_mono_8)) { mode_lib->vba.PDEAndMetaPTEBytesPerFrameC = CalculateVMAndRowBytes( mode_lib, mode_lib->vba.DCCEnable[k], mode_lib->vba.Read256BlockHeightY[k], mode_lib->vba.Read256BlockWidthY[k], mode_lib->vba.SourcePixelFormat[k], mode_lib->vba.SurfaceTiling[k], dml_ceil(mode_lib->vba.BytePerPixelInDETC[k], 2.0), mode_lib->vba.SourceScan[k], mode_lib->vba.ViewportWidth[k] / 2.0, mode_lib->vba.ViewportHeight[k] / 2.0, mode_lib->vba.SwathWidthYPerState[i][j][k] / 2.0, mode_lib->vba.GPUVMEnable, mode_lib->vba.VMMPageSize, mode_lib->vba.PTEBufferSizeInRequestsLuma, mode_lib->vba.PDEProcessingBufIn64KBReqs, mode_lib->vba.PitchC[k], 0.0, &mode_lib->vba.MacroTileWidthC[k], &mode_lib->vba.MetaRowBytesC, &mode_lib->vba.DPTEBytesPerRowC, &mode_lib->vba.PTEBufferSizeNotExceededC[i][j][k], &mode_lib->vba.dpte_row_height_chroma[k], &mode_lib->vba.meta_row_height_chroma[k]); mode_lib->vba.PrefetchLinesC[k] = CalculatePrefetchSourceLines( mode_lib, mode_lib->vba.VRatio[k] / 2.0, mode_lib->vba.VTAPsChroma[k], mode_lib->vba.Interlace[k], mode_lib->vba.ProgressiveToInterlaceUnitInOPP, mode_lib->vba.SwathHeightCPerState[i][j][k], mode_lib->vba.ViewportYStartC[k], &mode_lib->vba.PrefillC[k], &mode_lib->vba.MaxNumSwC[k]); } else { mode_lib->vba.PDEAndMetaPTEBytesPerFrameC = 0.0; mode_lib->vba.MetaRowBytesC = 0.0; mode_lib->vba.DPTEBytesPerRowC = 0.0; locals->PrefetchLinesC[k] = 0.0; locals->PTEBufferSizeNotExceededC[i][j][k] = true; locals->PTEBufferSizeInRequestsForLuma = mode_lib->vba.PTEBufferSizeInRequestsLuma + mode_lib->vba.PTEBufferSizeInRequestsChroma; } locals->PDEAndMetaPTEBytesPerFrame[k] = mode_lib->vba.PDEAndMetaPTEBytesPerFrameY + mode_lib->vba.PDEAndMetaPTEBytesPerFrameC; locals->MetaRowBytes[k] = mode_lib->vba.MetaRowBytesY + mode_lib->vba.MetaRowBytesC; locals->DPTEBytesPerRow[k] = mode_lib->vba.DPTEBytesPerRowY + mode_lib->vba.DPTEBytesPerRowC; CalculateActiveRowBandwidth( mode_lib->vba.GPUVMEnable, mode_lib->vba.SourcePixelFormat[k], mode_lib->vba.VRatio[k], mode_lib->vba.DCCEnable[k], mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k], mode_lib->vba.MetaRowBytesY, mode_lib->vba.MetaRowBytesC, mode_lib->vba.meta_row_height[k], mode_lib->vba.meta_row_height_chroma[k], mode_lib->vba.DPTEBytesPerRowY, mode_lib->vba.DPTEBytesPerRowC, mode_lib->vba.dpte_row_height[k], mode_lib->vba.dpte_row_height_chroma[k], &mode_lib->vba.meta_row_bw[k], &mode_lib->vba.dpte_row_bw[k], &mode_lib->vba.qual_row_bw[k]); } mode_lib->vba.ExtraLatency = mode_lib->vba.UrgentRoundTripAndOutOfOrderLatencyPerState[i] + (mode_lib->vba.TotalNumberOfActiveDPP[i][j] * mode_lib->vba.PixelChunkSizeInKByte + mode_lib->vba.TotalNumberOfDCCActiveDPP[i][j] * mode_lib->vba.MetaChunkSize) * 1024.0 / mode_lib->vba.ReturnBWPerState[i]; if (mode_lib->vba.GPUVMEnable == true) { mode_lib->vba.ExtraLatency = mode_lib->vba.ExtraLatency + mode_lib->vba.TotalNumberOfActiveDPP[i][j] * mode_lib->vba.PTEGroupSize / mode_lib->vba.ReturnBWPerState[i]; } mode_lib->vba.TimeCalc = 24.0 / mode_lib->vba.ProjectedDCFCLKDeepSleep; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.BlendingAndTiming[k] == k) { if (mode_lib->vba.WritebackEnable[k] == true) { locals->WritebackDelay[i][k] = mode_lib->vba.WritebackLatency + CalculateWriteBackDelay( mode_lib->vba.WritebackPixelFormat[k], mode_lib->vba.WritebackHRatio[k], mode_lib->vba.WritebackVRatio[k], mode_lib->vba.WritebackLumaHTaps[k], mode_lib->vba.WritebackLumaVTaps[k], mode_lib->vba.WritebackChromaHTaps[k], mode_lib->vba.WritebackChromaVTaps[k], mode_lib->vba.WritebackDestinationWidth[k]) / locals->RequiredDISPCLK[i][j]; } else { locals->WritebackDelay[i][k] = 0.0; } for (m = 0; m <= mode_lib->vba.NumberOfActivePlanes - 1; m++) { if (mode_lib->vba.BlendingAndTiming[m] == k && mode_lib->vba.WritebackEnable[m] == true) { locals->WritebackDelay[i][k] = dml_max(locals->WritebackDelay[i][k], mode_lib->vba.WritebackLatency + CalculateWriteBackDelay( mode_lib->vba.WritebackPixelFormat[m], mode_lib->vba.WritebackHRatio[m], mode_lib->vba.WritebackVRatio[m], mode_lib->vba.WritebackLumaHTaps[m], mode_lib->vba.WritebackLumaVTaps[m], mode_lib->vba.WritebackChromaHTaps[m], mode_lib->vba.WritebackChromaVTaps[m], mode_lib->vba.WritebackDestinationWidth[m]) / locals->RequiredDISPCLK[i][j]); } } } } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { for (m = 0; m <= mode_lib->vba.NumberOfActivePlanes - 1; m++) { if (mode_lib->vba.BlendingAndTiming[k] == m) { locals->WritebackDelay[i][k] = locals->WritebackDelay[i][m]; } } } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { for (m = 0; m < locals->NumberOfCursors[k]; m++) locals->cursor_bw[k] = locals->NumberOfCursors[k] * locals->CursorWidth[k][m] * locals->CursorBPP[k][m] / 8 / (locals->HTotal[k] / locals->PixelClock[k]) * locals->VRatio[k]; } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { locals->MaximumVStartup[k] = mode_lib->vba.VTotal[k] - mode_lib->vba.VActive[k] - dml_max(1.0, dml_ceil(locals->WritebackDelay[i][k] / (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]), 1.0)); } mode_lib->vba.NextPrefetchMode = mode_lib->vba.MinPrefetchMode; do { mode_lib->vba.PrefetchMode[i][j] = mode_lib->vba.NextPrefetchMode; mode_lib->vba.NextPrefetchMode = mode_lib->vba.NextPrefetchMode + 1; mode_lib->vba.TWait = CalculateTWait( mode_lib->vba.PrefetchMode[i][j], mode_lib->vba.DRAMClockChangeLatency, mode_lib->vba.UrgentLatency, mode_lib->vba.SREnterPlusExitTime); for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.XFCEnabled[k] == true) { mode_lib->vba.XFCRemoteSurfaceFlipDelay = CalculateRemoteSurfaceFlipDelay( mode_lib, mode_lib->vba.VRatio[k], locals->SwathWidthYPerState[i][j][k], dml_ceil(locals->BytePerPixelInDETY[k], 1.0), mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k], mode_lib->vba.XFCTSlvVupdateOffset, mode_lib->vba.XFCTSlvVupdateWidth, mode_lib->vba.XFCTSlvVreadyOffset, mode_lib->vba.XFCXBUFLatencyTolerance, mode_lib->vba.XFCFillBWOverhead, mode_lib->vba.XFCSlvChunkSize, mode_lib->vba.XFCBusTransportTime, mode_lib->vba.TimeCalc, mode_lib->vba.TWait, &mode_lib->vba.SrcActiveDrainRate, &mode_lib->vba.TInitXFill, &mode_lib->vba.TslvChk); } else { mode_lib->vba.XFCRemoteSurfaceFlipDelay = 0.0; } CalculateDelayAfterScaler(mode_lib, mode_lib->vba.ReturnBWPerState[i], mode_lib->vba.ReadBandwidthLuma[k], mode_lib->vba.ReadBandwidthChroma[k], mode_lib->vba.MaxTotalVActiveRDBandwidth, mode_lib->vba.DisplayPipeLineDeliveryTimeLuma[k], mode_lib->vba.DisplayPipeLineDeliveryTimeChroma[k], mode_lib->vba.RequiredDPPCLK[i][j][k], mode_lib->vba.RequiredDISPCLK[i][j], mode_lib->vba.PixelClock[k], mode_lib->vba.DSCDelayPerState[i][k], mode_lib->vba.NoOfDPP[i][j][k], mode_lib->vba.ScalerEnabled[k], mode_lib->vba.NumberOfCursors[k], mode_lib->vba.DPPCLKDelaySubtotal, mode_lib->vba.DPPCLKDelaySCL, mode_lib->vba.DPPCLKDelaySCLLBOnly, mode_lib->vba.DPPCLKDelayCNVCFormater, mode_lib->vba.DPPCLKDelayCNVCCursor, mode_lib->vba.DISPCLKDelaySubtotal, mode_lib->vba.SwathWidthYPerState[i][j][k] / mode_lib->vba.HRatio[k], mode_lib->vba.OutputFormat[k], mode_lib->vba.HTotal[k], mode_lib->vba.SwathWidthYSingleDPP[k], mode_lib->vba.BytePerPixelInDETY[k], mode_lib->vba.BytePerPixelInDETC[k], mode_lib->vba.SwathHeightYThisState[k], mode_lib->vba.SwathHeightCThisState[k], mode_lib->vba.Interlace[k], mode_lib->vba.ProgressiveToInterlaceUnitInOPP, &mode_lib->vba.DSTXAfterScaler[k], &mode_lib->vba.DSTYAfterScaler[k]); mode_lib->vba.IsErrorResult[i][j][k] = CalculatePrefetchSchedule( mode_lib, mode_lib->vba.RequiredDPPCLK[i][j][k], mode_lib->vba.RequiredDISPCLK[i][j], mode_lib->vba.PixelClock[k], mode_lib->vba.ProjectedDCFCLKDeepSleep, mode_lib->vba.NoOfDPP[i][j][k], mode_lib->vba.NumberOfCursors[k], mode_lib->vba.VTotal[k] - mode_lib->vba.VActive[k], mode_lib->vba.HTotal[k], mode_lib->vba.MaxInterDCNTileRepeaters, mode_lib->vba.MaximumVStartup[k], mode_lib->vba.GPUVMMaxPageTableLevels, mode_lib->vba.GPUVMEnable, mode_lib->vba.DynamicMetadataEnable[k], mode_lib->vba.DynamicMetadataLinesBeforeActiveRequired[k], mode_lib->vba.DynamicMetadataTransmittedBytes[k], mode_lib->vba.DCCEnable[k], mode_lib->vba.UrgentLatencyPixelDataOnly, mode_lib->vba.ExtraLatency, mode_lib->vba.TimeCalc, mode_lib->vba.PDEAndMetaPTEBytesPerFrame[k], mode_lib->vba.MetaRowBytes[k], mode_lib->vba.DPTEBytesPerRow[k], mode_lib->vba.PrefetchLinesY[k], mode_lib->vba.SwathWidthYPerState[i][j][k], mode_lib->vba.BytePerPixelInDETY[k], mode_lib->vba.PrefillY[k], mode_lib->vba.MaxNumSwY[k], mode_lib->vba.PrefetchLinesC[k], mode_lib->vba.BytePerPixelInDETC[k], mode_lib->vba.PrefillC[k], mode_lib->vba.MaxNumSwC[k], mode_lib->vba.SwathHeightYPerState[i][j][k], mode_lib->vba.SwathHeightCPerState[i][j][k], mode_lib->vba.TWait, mode_lib->vba.XFCEnabled[k], mode_lib->vba.XFCRemoteSurfaceFlipDelay, mode_lib->vba.Interlace[k], mode_lib->vba.ProgressiveToInterlaceUnitInOPP, mode_lib->vba.DSTXAfterScaler[k], mode_lib->vba.DSTYAfterScaler[k], &mode_lib->vba.LineTimesForPrefetch[k], &mode_lib->vba.PrefetchBW[k], &mode_lib->vba.LinesForMetaPTE[k], &mode_lib->vba.LinesForMetaAndDPTERow[k], &mode_lib->vba.VRatioPreY[i][j][k], &mode_lib->vba.VRatioPreC[i][j][k], &mode_lib->vba.RequiredPrefetchPixelDataBWLuma[i][j][k], &mode_lib->vba.Tno_bw[k], &mode_lib->vba.VUpdateOffsetPix[k], &mode_lib->vba.VUpdateWidthPix[k], &mode_lib->vba.VReadyOffsetPix[k]); } mode_lib->vba.MaximumReadBandwidthWithoutPrefetch = 0.0; mode_lib->vba.MaximumReadBandwidthWithPrefetch = 0.0; locals->prefetch_vm_bw_valid = true; locals->prefetch_row_bw_valid = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (locals->PDEAndMetaPTEBytesPerFrame[k] == 0) locals->prefetch_vm_bw[k] = 0; else if (locals->LinesForMetaPTE[k] > 0) locals->prefetch_vm_bw[k] = locals->PDEAndMetaPTEBytesPerFrame[k] / (locals->LinesForMetaPTE[k] * locals->HTotal[k] / locals->PixelClock[k]); else { locals->prefetch_vm_bw[k] = 0; locals->prefetch_vm_bw_valid = false; } if (locals->MetaRowBytes[k] + locals->DPTEBytesPerRow[k] == 0) locals->prefetch_row_bw[k] = 0; else if (locals->LinesForMetaAndDPTERow[k] > 0) locals->prefetch_row_bw[k] = (locals->MetaRowBytes[k] + locals->DPTEBytesPerRow[k]) / (locals->LinesForMetaAndDPTERow[k] * locals->HTotal[k] / locals->PixelClock[k]); else { locals->prefetch_row_bw[k] = 0; locals->prefetch_row_bw_valid = false; } mode_lib->vba.MaximumReadBandwidthWithoutPrefetch = mode_lib->vba.MaximumReadBandwidthWithPrefetch + mode_lib->vba.cursor_bw[k] + mode_lib->vba.ReadBandwidth[k] + mode_lib->vba.meta_row_bw[k] + mode_lib->vba.dpte_row_bw[k]; mode_lib->vba.MaximumReadBandwidthWithPrefetch = mode_lib->vba.MaximumReadBandwidthWithPrefetch + mode_lib->vba.cursor_bw[k] + dml_max3( mode_lib->vba.prefetch_vm_bw[k], mode_lib->vba.prefetch_row_bw[k], dml_max(mode_lib->vba.ReadBandwidth[k], mode_lib->vba.RequiredPrefetchPixelDataBWLuma[i][j][k]) + mode_lib->vba.meta_row_bw[k] + mode_lib->vba.dpte_row_bw[k]); } locals->BandwidthWithoutPrefetchSupported[i] = true; if (mode_lib->vba.MaximumReadBandwidthWithoutPrefetch > locals->ReturnBWPerState[i]) { locals->BandwidthWithoutPrefetchSupported[i] = false; } locals->PrefetchSupported[i][j] = true; if (mode_lib->vba.MaximumReadBandwidthWithPrefetch > locals->ReturnBWPerState[i]) { locals->PrefetchSupported[i][j] = false; } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (locals->LineTimesForPrefetch[k] < 2.0 || locals->LinesForMetaPTE[k] >= 8.0 || locals->LinesForMetaAndDPTERow[k] >= 16.0 || mode_lib->vba.IsErrorResult[i][j][k] == true) { locals->PrefetchSupported[i][j] = false; } } locals->VRatioInPrefetchSupported[i][j] = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (locals->VRatioPreY[i][j][k] > 4.0 || locals->VRatioPreC[i][j][k] > 4.0 || mode_lib->vba.IsErrorResult[i][j][k] == true) { locals->VRatioInPrefetchSupported[i][j] = false; } } } while ((locals->PrefetchSupported[i][j] != true || locals->VRatioInPrefetchSupported[i][j] != true) && mode_lib->vba.NextPrefetchMode < mode_lib->vba.MaxPrefetchMode); if (mode_lib->vba.PrefetchSupported[i][j] == true && mode_lib->vba.VRatioInPrefetchSupported[i][j] == true) { mode_lib->vba.BandwidthAvailableForImmediateFlip = mode_lib->vba.ReturnBWPerState[i]; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { mode_lib->vba.BandwidthAvailableForImmediateFlip = mode_lib->vba.BandwidthAvailableForImmediateFlip - mode_lib->vba.cursor_bw[k] - dml_max( mode_lib->vba.ReadBandwidth[k] + mode_lib->vba.qual_row_bw[k], mode_lib->vba.PrefetchBW[k]); } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { mode_lib->vba.ImmediateFlipBytes[k] = 0.0; if ((mode_lib->vba.SourcePixelFormat[k] != dm_420_8 && mode_lib->vba.SourcePixelFormat[k] != dm_420_10)) { mode_lib->vba.ImmediateFlipBytes[k] = mode_lib->vba.PDEAndMetaPTEBytesPerFrame[k] + mode_lib->vba.MetaRowBytes[k] + mode_lib->vba.DPTEBytesPerRow[k]; } } mode_lib->vba.TotImmediateFlipBytes = 0.0; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if ((mode_lib->vba.SourcePixelFormat[k] != dm_420_8 && mode_lib->vba.SourcePixelFormat[k] != dm_420_10)) { mode_lib->vba.TotImmediateFlipBytes = mode_lib->vba.TotImmediateFlipBytes + mode_lib->vba.ImmediateFlipBytes[k]; } } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { CalculateFlipSchedule( mode_lib, mode_lib->vba.ExtraLatency, mode_lib->vba.UrgentLatencyPixelDataOnly, mode_lib->vba.GPUVMMaxPageTableLevels, mode_lib->vba.GPUVMEnable, mode_lib->vba.BandwidthAvailableForImmediateFlip, mode_lib->vba.TotImmediateFlipBytes, mode_lib->vba.SourcePixelFormat[k], mode_lib->vba.ImmediateFlipBytes[k], mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k], mode_lib->vba.VRatio[k], mode_lib->vba.Tno_bw[k], mode_lib->vba.PDEAndMetaPTEBytesPerFrame[k], mode_lib->vba.MetaRowBytes[k], mode_lib->vba.DPTEBytesPerRow[k], mode_lib->vba.DCCEnable[k], mode_lib->vba.dpte_row_height[k], mode_lib->vba.meta_row_height[k], mode_lib->vba.qual_row_bw[k], &mode_lib->vba.DestinationLinesToRequestVMInImmediateFlip[k], &mode_lib->vba.DestinationLinesToRequestRowInImmediateFlip[k], &mode_lib->vba.final_flip_bw[k], &mode_lib->vba.ImmediateFlipSupportedForPipe[k]); } mode_lib->vba.total_dcn_read_bw_with_flip = 0.0; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { mode_lib->vba.total_dcn_read_bw_with_flip = mode_lib->vba.total_dcn_read_bw_with_flip + mode_lib->vba.cursor_bw[k] + dml_max3( mode_lib->vba.prefetch_vm_bw[k], mode_lib->vba.prefetch_row_bw[k], mode_lib->vba.final_flip_bw[k] + dml_max( mode_lib->vba.ReadBandwidth[k], mode_lib->vba.RequiredPrefetchPixelDataBWLuma[i][j][k])); } mode_lib->vba.ImmediateFlipSupportedForState[i][j] = true; if (mode_lib->vba.total_dcn_read_bw_with_flip > mode_lib->vba.ReturnBWPerState[i]) { mode_lib->vba.ImmediateFlipSupportedForState[i][j] = false; } for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.ImmediateFlipSupportedForPipe[k] == false) { mode_lib->vba.ImmediateFlipSupportedForState[i][j] = false; } } } else { mode_lib->vba.ImmediateFlipSupportedForState[i][j] = false; } } } /*Vertical Active BW support*/ for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { mode_lib->vba.MaxTotalVerticalActiveAvailableBandwidth[i] = dml_min(mode_lib->vba.ReturnBusWidth * mode_lib->vba.DCFCLKPerState[i], mode_lib->vba.FabricAndDRAMBandwidthPerState[i] * 1000) * mode_lib->vba.MaxAveragePercentOfIdealDRAMBWDisplayCanUseInNormalSystemOperation / 100; if (mode_lib->vba.MaxTotalVActiveRDBandwidth <= mode_lib->vba.MaxTotalVerticalActiveAvailableBandwidth[i]) mode_lib->vba.TotalVerticalActiveBandwidthSupport[i] = true; else mode_lib->vba.TotalVerticalActiveBandwidthSupport[i] = false; } /*PTE Buffer Size Check*/ for (i = 0; i <= mode_lib->vba.soc.num_states; i++) { for (j = 0; j < 2; j++) { locals->PTEBufferSizeNotExceeded[i][j] = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (locals->PTEBufferSizeNotExceededY[i][j][k] == false || locals->PTEBufferSizeNotExceededC[i][j][k] == false) { locals->PTEBufferSizeNotExceeded[i][j] = false; } } } } /*Cursor Support Check*/ mode_lib->vba.CursorSupport = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { for (j = 0; j < 2; j++) { if (mode_lib->vba.CursorWidth[k][j] > 0.0) { if (dml_floor( dml_floor( mode_lib->vba.CursorBufferSize - mode_lib->vba.CursorChunkSize, mode_lib->vba.CursorChunkSize) * 1024.0 / (mode_lib->vba.CursorWidth[k][j] * mode_lib->vba.CursorBPP[k][j] / 8.0), 1.0) * (mode_lib->vba.HTotal[k] / mode_lib->vba.PixelClock[k]) / mode_lib->vba.VRatio[k] < mode_lib->vba.UrgentLatencyPixelDataOnly || (mode_lib->vba.CursorBPP[k][j] == 64.0 && mode_lib->vba.Cursor64BppSupport == false)) { mode_lib->vba.CursorSupport = false; } } } } /*Valid Pitch Check*/ mode_lib->vba.PitchSupport = true; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { locals->AlignedYPitch[k] = dml_ceil( dml_max(mode_lib->vba.PitchY[k], mode_lib->vba.ViewportWidth[k]), locals->MacroTileWidthY[k]); if (locals->AlignedYPitch[k] > mode_lib->vba.PitchY[k]) { mode_lib->vba.PitchSupport = false; } if (mode_lib->vba.DCCEnable[k] == true) { locals->AlignedDCCMetaPitch[k] = dml_ceil( dml_max( mode_lib->vba.DCCMetaPitchY[k], mode_lib->vba.ViewportWidth[k]), 64.0 * locals->Read256BlockWidthY[k]); } else { locals->AlignedDCCMetaPitch[k] = mode_lib->vba.DCCMetaPitchY[k]; } if (locals->AlignedDCCMetaPitch[k] > mode_lib->vba.DCCMetaPitchY[k]) { mode_lib->vba.PitchSupport = false; } if (mode_lib->vba.SourcePixelFormat[k] != dm_444_64 && mode_lib->vba.SourcePixelFormat[k] != dm_444_32 && mode_lib->vba.SourcePixelFormat[k] != dm_444_16 && mode_lib->vba.SourcePixelFormat[k] != dm_mono_16 && mode_lib->vba.SourcePixelFormat[k] != dm_mono_8) { locals->AlignedCPitch[k] = dml_ceil( dml_max( mode_lib->vba.PitchC[k], mode_lib->vba.ViewportWidth[k] / 2.0), locals->MacroTileWidthC[k]); } else { locals->AlignedCPitch[k] = mode_lib->vba.PitchC[k]; } if (locals->AlignedCPitch[k] > mode_lib->vba.PitchC[k]) { mode_lib->vba.PitchSupport = false; } } /*Mode Support, Voltage State and SOC Configuration*/ for (i = mode_lib->vba.soc.num_states; i >= 0; i--) { for (j = 0; j < 2; j++) { enum dm_validation_status status = DML_VALIDATION_OK; if (mode_lib->vba.ScaleRatioAndTapsSupport != true) { status = DML_FAIL_SCALE_RATIO_TAP; } else if (mode_lib->vba.SourceFormatPixelAndScanSupport != true) { status = DML_FAIL_SOURCE_PIXEL_FORMAT; } else if (locals->ViewportSizeSupport[i] != true) { status = DML_FAIL_VIEWPORT_SIZE; } else if (locals->DIOSupport[i] != true) { status = DML_FAIL_DIO_SUPPORT; } else if (locals->NotEnoughDSCUnits[i] != false) { status = DML_FAIL_NOT_ENOUGH_DSC; } else if (locals->DSCCLKRequiredMoreThanSupported[i] != false) { status = DML_FAIL_DSC_CLK_REQUIRED; } else if (locals->UrgentLatencySupport[i][j] != true) { status = DML_FAIL_URGENT_LATENCY; } else if (locals->ROBSupport[i] != true) { status = DML_FAIL_REORDERING_BUFFER; } else if (locals->DISPCLK_DPPCLK_Support[i][j] != true) { status = DML_FAIL_DISPCLK_DPPCLK; } else if (locals->TotalAvailablePipesSupport[i][j] != true) { status = DML_FAIL_TOTAL_AVAILABLE_PIPES; } else if (mode_lib->vba.NumberOfOTGSupport != true) { status = DML_FAIL_NUM_OTG; } else if (mode_lib->vba.WritebackModeSupport != true) { status = DML_FAIL_WRITEBACK_MODE; } else if (mode_lib->vba.WritebackLatencySupport != true) { status = DML_FAIL_WRITEBACK_LATENCY; } else if (mode_lib->vba.WritebackScaleRatioAndTapsSupport != true) { status = DML_FAIL_WRITEBACK_SCALE_RATIO_TAP; } else if (mode_lib->vba.CursorSupport != true) { status = DML_FAIL_CURSOR_SUPPORT; } else if (mode_lib->vba.PitchSupport != true) { status = DML_FAIL_PITCH_SUPPORT; } else if (locals->PrefetchSupported[i][j] != true) { status = DML_FAIL_PREFETCH_SUPPORT; } else if (locals->TotalVerticalActiveBandwidthSupport[i] != true) { status = DML_FAIL_TOTAL_V_ACTIVE_BW; } else if (locals->VRatioInPrefetchSupported[i][j] != true) { status = DML_FAIL_V_RATIO_PREFETCH; } else if (locals->PTEBufferSizeNotExceeded[i][j] != true) { status = DML_FAIL_PTE_BUFFER_SIZE; } else if (mode_lib->vba.NonsupportedDSCInputBPC != false) { status = DML_FAIL_DSC_INPUT_BPC; } if (status == DML_VALIDATION_OK) { locals->ModeSupport[i][j] = true; } else { locals->ModeSupport[i][j] = false; } locals->ValidationStatus[i] = status; } } { unsigned int MaximumMPCCombine = 0; mode_lib->vba.VoltageLevel = mode_lib->vba.soc.num_states + 1; for (i = mode_lib->vba.VoltageOverrideLevel; i <= mode_lib->vba.soc.num_states; i++) { if (locals->ModeSupport[i][0] == true || locals->ModeSupport[i][1] == true) { mode_lib->vba.VoltageLevel = i; if (locals->ModeSupport[i][1] == true && (locals->ModeSupport[i][0] == false || mode_lib->vba.WhenToDoMPCCombine == dm_mpc_always_when_possible)) { MaximumMPCCombine = 1; } else { MaximumMPCCombine = 0; } break; } } mode_lib->vba.ImmediateFlipSupport = locals->ImmediateFlipSupportedForState[mode_lib->vba.VoltageLevel][MaximumMPCCombine]; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { mode_lib->vba.DPPPerPlane[k] = locals->NoOfDPP[mode_lib->vba.VoltageLevel][MaximumMPCCombine][k]; locals->DPPCLK[k] = locals->RequiredDPPCLK[mode_lib->vba.VoltageLevel][MaximumMPCCombine][k]; } mode_lib->vba.DISPCLK = locals->RequiredDISPCLK[mode_lib->vba.VoltageLevel][MaximumMPCCombine]; mode_lib->vba.maxMpcComb = MaximumMPCCombine; } mode_lib->vba.DCFCLK = mode_lib->vba.DCFCLKPerState[mode_lib->vba.VoltageLevel]; mode_lib->vba.DRAMSpeed = mode_lib->vba.DRAMSpeedPerState[mode_lib->vba.VoltageLevel]; mode_lib->vba.FabricClock = mode_lib->vba.FabricClockPerState[mode_lib->vba.VoltageLevel]; mode_lib->vba.SOCCLK = mode_lib->vba.SOCCLKPerState[mode_lib->vba.VoltageLevel]; mode_lib->vba.ReturnBW = locals->ReturnBWPerState[mode_lib->vba.VoltageLevel]; mode_lib->vba.FabricAndDRAMBandwidth = locals->FabricAndDRAMBandwidthPerState[mode_lib->vba.VoltageLevel]; for (k = 0; k <= mode_lib->vba.NumberOfActivePlanes - 1; k++) { if (mode_lib->vba.BlendingAndTiming[k] == k) { mode_lib->vba.ODMCombineEnabled[k] = locals->ODMCombineEnablePerState[mode_lib->vba.VoltageLevel][k]; } else { mode_lib->vba.ODMCombineEnabled[k] = 0; } mode_lib->vba.DSCEnabled[k] = locals->RequiresDSC[mode_lib->vba.VoltageLevel][k]; mode_lib->vba.OutputBpp[k] = locals->OutputBppPerState[mode_lib->vba.VoltageLevel][k]; } }