From: Dmytro Laktyushkin <[email protected]>

[Why & How]
Memory bandwidth calculations work differently than for ddr.
Add lpddr5 handling.

Reviewed-by: Charlene Liu <[email protected]>
Signed-off-by: Dmytro Laktyushkin <[email protected]>
Signed-off-by: Wayne Lin <[email protected]>
---
 .../dml21/inc/dml_top_soc_parameter_types.h   |  3 +
 .../src/dml2_core/dml2_core_dcn4_calcs.c      | 26 ++++++--
 .../dml21/src/dml2_dpmm/dml2_dpmm_dcn4.c      | 59 ++++++++++++-------
 .../src/inc/dml2_internal_shared_types.h      |  1 +
 4 files changed, 64 insertions(+), 25 deletions(-)

diff --git 
a/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/inc/dml_top_soc_parameter_types.h 
b/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/inc/dml_top_soc_parameter_types.h
index 1fbc520c2540..c4cce870877a 100644
--- 
a/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/inc/dml_top_soc_parameter_types.h
+++ 
b/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/inc/dml_top_soc_parameter_types.h
@@ -115,9 +115,12 @@ struct dml2_dram_params {
        unsigned int channel_width_bytes;
        unsigned int channel_count;
        unsigned int transactions_per_clock;
+       bool alt_clock_bw_conversion;
 };
 
+#define ENABLE_WCK
 struct dml2_soc_state_table {
+       struct dml2_clk_table wck_ratio;
        struct dml2_clk_table uclk;
        struct dml2_clk_table fclk;
        struct dml2_clk_table dcfclk;
diff --git 
a/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/src/dml2_core/dml2_core_dcn4_calcs.c
 
b/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/src/dml2_core/dml2_core_dcn4_calcs.c
index 01b87be24ce3..37699cc9e5c1 100644
--- 
a/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/src/dml2_core/dml2_core_dcn4_calcs.c
+++ 
b/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/src/dml2_core/dml2_core_dcn4_calcs.c
@@ -7077,10 +7077,21 @@ static void calculate_excess_vactive_bandwidth_required(
        }
 }
 
-static double uclk_khz_to_dram_bw_mbps(unsigned long uclk_khz, const struct 
dml2_dram_params *dram_config)
+static double uclk_khz_to_dram_bw_mbps(unsigned long uclk_khz, const struct 
dml2_dram_params *dram_config, const struct dml2_mcg_dram_bw_to_min_clk_table 
*dram_bw_table)
 {
        double bw_mbps = 0;
-       bw_mbps = ((double)uclk_khz * dram_config->channel_count * 
dram_config->channel_width_bytes * dram_config->transactions_per_clock) / 
1000.0;
+       int i;
+
+       if (!dram_config->alt_clock_bw_conversion)
+               bw_mbps = ((double)uclk_khz * dram_config->channel_count * 
dram_config->channel_width_bytes * dram_config->transactions_per_clock) / 
1000.0;
+       else
+               for (i = 0; i < dram_bw_table->num_entries; i++)
+                       if (dram_bw_table->entries[i].min_uclk_khz >= uclk_khz) 
{
+                               bw_mbps = 
(double)dram_bw_table->entries[i].pre_derate_dram_bw_kbps / 1000.0;
+                               break;
+                       }
+
+       ASSERT(bw_mbps > 0);
 
        return bw_mbps;
 }
@@ -7964,7 +7975,9 @@ static bool dml_core_mode_support(struct 
dml2_core_calcs_mode_support_ex *in_out
        mode_lib->ms.max_dispclk_freq_mhz = 
(double)min_clk_table->max_ss_clocks_khz.dispclk / 1000;
        mode_lib->ms.max_dscclk_freq_mhz = 
(double)min_clk_table->max_clocks_khz.dscclk / 1000;
        mode_lib->ms.max_dppclk_freq_mhz = 
(double)min_clk_table->max_ss_clocks_khz.dppclk / 1000;
-       mode_lib->ms.uclk_freq_mhz = 
dram_bw_kbps_to_uclk_mhz(min_clk_table->dram_bw_table.entries[in_out_params->min_clk_index].pre_derate_dram_bw_kbps,
 &mode_lib->soc.clk_table.dram_config);
+       mode_lib->ms.uclk_freq_mhz = 
(double)min_clk_table->dram_bw_table.entries[in_out_params->min_clk_index].min_uclk_khz
 / 1000.0;
+       if (!mode_lib->ms.uclk_freq_mhz)
+               mode_lib->ms.uclk_freq_mhz = 
dram_bw_kbps_to_uclk_mhz(min_clk_table->dram_bw_table.entries[in_out_params->min_clk_index].pre_derate_dram_bw_kbps,
 &mode_lib->soc.clk_table.dram_config);
        mode_lib->ms.dram_bw_mbps = 
((double)min_clk_table->dram_bw_table.entries[in_out_params->min_clk_index].pre_derate_dram_bw_kbps
 / 1000);
        mode_lib->ms.max_dram_bw_mbps = 
((double)min_clk_table->dram_bw_table.entries[min_clk_table->dram_bw_table.num_entries
 - 1].pre_derate_dram_bw_kbps / 1000);
        mode_lib->ms.qos_param_index = get_qos_param_index((unsigned int) 
(mode_lib->ms.uclk_freq_mhz * 1000.0), 
mode_lib->soc.qos_parameters.qos_params.dcn4x.per_uclk_dpm_params);
@@ -10407,7 +10420,7 @@ static bool dml_core_mode_programming(struct 
dml2_core_calcs_mode_programming_ex
 
        mode_lib->mp.Dcfclk = programming->min_clocks.dcn4x.active.dcfclk_khz / 
1000.0;
        mode_lib->mp.FabricClock = 
programming->min_clocks.dcn4x.active.fclk_khz / 1000.0;
-       mode_lib->mp.dram_bw_mbps = 
uclk_khz_to_dram_bw_mbps(programming->min_clocks.dcn4x.active.uclk_khz, 
&mode_lib->soc.clk_table.dram_config);
+       mode_lib->mp.dram_bw_mbps = 
uclk_khz_to_dram_bw_mbps(programming->min_clocks.dcn4x.active.uclk_khz, 
&mode_lib->soc.clk_table.dram_config, &min_clk_table->dram_bw_table);
        mode_lib->mp.uclk_freq_mhz = 
programming->min_clocks.dcn4x.active.uclk_khz / 1000.0;
        mode_lib->mp.GlobalDPPCLK = programming->min_clocks.dcn4x.dpprefclk_khz 
/ 1000.0;
        s->SOCCLK = (double)programming->min_clocks.dcn4x.socclk_khz / 1000;
@@ -10485,7 +10498,10 @@ static bool dml_core_mode_programming(struct 
dml2_core_calcs_mode_programming_ex
        DML_LOG_VERBOSE("DML::%s: SOCCLK = %f\n", __func__, s->SOCCLK);
        DML_LOG_VERBOSE("DML::%s: min_clk_index = %0d\n", __func__, 
in_out_params->min_clk_index);
        DML_LOG_VERBOSE("DML::%s: min_clk_table min_fclk_khz = %ld\n", 
__func__, 
min_clk_table->dram_bw_table.entries[in_out_params->min_clk_index].min_fclk_khz);
-       DML_LOG_VERBOSE("DML::%s: min_clk_table uclk_mhz = %f\n", __func__, 
dram_bw_kbps_to_uclk_mhz(min_clk_table->dram_bw_table.entries[in_out_params->min_clk_index].pre_derate_dram_bw_kbps,
 &mode_lib->soc.clk_table.dram_config));
+       if 
(min_clk_table->dram_bw_table.entries[in_out_params->min_clk_index].min_uclk_khz)
+               DML_LOG_VERBOSE("DML::%s: min_clk_table uclk_mhz = %f\n", 
__func__, 
min_clk_table->dram_bw_table.entries[in_out_params->min_clk_index].min_uclk_khz 
/ 1000.0);
+       else
+               DML_LOG_VERBOSE("DML::%s: min_clk_table uclk_mhz = %f\n", 
__func__, 
dram_bw_kbps_to_uclk_mhz(min_clk_table->dram_bw_table.entries[in_out_params->min_clk_index].pre_derate_dram_bw_kbps,
 &mode_lib->soc.clk_table.dram_config));
        for (k = 0; k < mode_lib->mp.num_active_pipes; ++k) {
                DML_LOG_VERBOSE("DML::%s: pipe=%d is in plane=%d\n", __func__, 
k, mode_lib->mp.pipe_plane[k]);
                DML_LOG_VERBOSE("DML::%s: Per-plane DPPPerSurface[%0d] = %d\n", 
__func__, k, mode_lib->mp.NoOfDPP[k]);
diff --git 
a/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/src/dml2_dpmm/dml2_dpmm_dcn4.c 
b/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/src/dml2_dpmm/dml2_dpmm_dcn4.c
index 22969a533a7b..5c713f2e6eca 100644
--- a/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/src/dml2_dpmm/dml2_dpmm_dcn4.c
+++ b/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/src/dml2_dpmm/dml2_dpmm_dcn4.c
@@ -7,14 +7,24 @@
 #include "dml_top_types.h"
 #include "lib_float_math.h"
 
-static double dram_bw_kbps_to_uclk_khz(unsigned long long bandwidth_kbps, 
const struct dml2_dram_params *dram_config)
+static double dram_bw_kbps_to_uclk_khz(unsigned long long bandwidth_kbps, 
const struct dml2_dram_params *dram_config, struct 
dml2_mcg_dram_bw_to_min_clk_table *dram_bw_table)
 {
        double uclk_khz = 0;
-       unsigned long uclk_mbytes_per_tick = 0;
 
-       uclk_mbytes_per_tick = dram_config->channel_count * 
dram_config->channel_width_bytes * dram_config->transactions_per_clock;
+       if (!dram_config->alt_clock_bw_conversion) {
+               unsigned long uclk_bytes_per_tick = 0;
 
-       uclk_khz = (double)bandwidth_kbps / uclk_mbytes_per_tick;
+               uclk_bytes_per_tick = dram_config->channel_count * 
dram_config->channel_width_bytes * dram_config->transactions_per_clock;
+               uclk_khz = (double)bandwidth_kbps / uclk_bytes_per_tick;
+       } else {
+               int i;
+               /* For lpddr5 bytes per tick changes with mpstate, use table to 
find uclk*/
+               for (i = 0; i < dram_bw_table->num_entries; i++)
+                       if (dram_bw_table->entries[i].pre_derate_dram_bw_kbps 
>= bandwidth_kbps) {
+                               uclk_khz = 
dram_bw_table->entries[i].min_uclk_khz;
+                               break;
+                       }
+       }
 
        return uclk_khz;
 }
@@ -34,7 +44,7 @@ static void get_minimum_clocks_for_latency(struct 
dml2_dpmm_map_mode_to_soc_dpm_
        *dcfclk = 
in_out->min_clk_table->dram_bw_table.entries[min_clock_index_for_latency].min_dcfclk_khz;
        *fclk = 
in_out->min_clk_table->dram_bw_table.entries[min_clock_index_for_latency].min_fclk_khz;
        *uclk = 
dram_bw_kbps_to_uclk_khz(in_out->min_clk_table->dram_bw_table.entries[min_clock_index_for_latency].pre_derate_dram_bw_kbps,
-               &in_out->soc_bb->clk_table.dram_config);
+               &in_out->soc_bb->clk_table.dram_config, 
&in_out->min_clk_table->dram_bw_table);
 }
 
 static unsigned long dml_round_up(double a)
@@ -53,14 +63,18 @@ static void calculate_system_active_minimums(struct 
dml2_dpmm_map_mode_to_soc_dp
        double min_uclk_latency, min_fclk_latency, min_dcfclk_latency;
        const struct dml2_core_mode_support_result *mode_support_result = 
&in_out->display_cfg->mode_support_result;
 
-       min_uclk_avg = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.active.average_bw_dram_kbps,
 &in_out->soc_bb->clk_table.dram_config);
-       min_uclk_avg = (double)min_uclk_avg / 
((double)in_out->soc_bb->qos_parameters.derate_table.system_active_average.dram_derate_percent_pixel
 / 100);
+       min_uclk_avg = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.active.average_bw_dram_kbps
+                                                                               
        / 
((double)in_out->soc_bb->qos_parameters.derate_table.system_active_average.dram_derate_percent_pixel
 / 100),
+                                                       
&in_out->soc_bb->clk_table.dram_config, &in_out->min_clk_table->dram_bw_table);
 
-       min_uclk_urgent = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.active.urgent_bw_dram_kbps,
 &in_out->soc_bb->clk_table.dram_config);
        if (in_out->display_cfg->display_config.hostvm_enable)
-               min_uclk_urgent = (double)min_uclk_urgent / 
((double)in_out->soc_bb->qos_parameters.derate_table.system_active_urgent.dram_derate_percent_pixel_and_vm
 / 100);
+               min_uclk_urgent = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.active.urgent_bw_dram_kbps
+                                                                               
/ 
((double)in_out->soc_bb->qos_parameters.derate_table.system_active_urgent.dram_derate_percent_pixel_and_vm
 / 100),
+                                                        
&in_out->soc_bb->clk_table.dram_config, &in_out->min_clk_table->dram_bw_table);
        else
-               min_uclk_urgent = (double)min_uclk_urgent / 
((double)in_out->soc_bb->qos_parameters.derate_table.system_active_urgent.dram_derate_percent_pixel
 / 100);
+               min_uclk_urgent = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.active.urgent_bw_dram_kbps
+                                                                               
/ 
((double)in_out->soc_bb->qos_parameters.derate_table.system_active_urgent.dram_derate_percent_pixel
 / 100),
+                                                        
&in_out->soc_bb->clk_table.dram_config, &in_out->min_clk_table->dram_bw_table);
 
        min_uclk_bw = min_uclk_urgent > min_uclk_avg ? min_uclk_urgent : 
min_uclk_avg;
 
@@ -97,11 +111,13 @@ static void calculate_svp_prefetch_minimums(struct 
dml2_dpmm_map_mode_to_soc_dpm
        const struct dml2_core_mode_support_result *mode_support_result = 
&in_out->display_cfg->mode_support_result;
 
        /* assumes DF throttling is enabled */
-       min_uclk_avg = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.svp_prefetch.average_bw_dram_kbps,
 &in_out->soc_bb->clk_table.dram_config);
-       min_uclk_avg = (double)min_uclk_avg / 
((double)in_out->soc_bb->qos_parameters.derate_table.dcn_mall_prefetch_average.dram_derate_percent_pixel
 / 100);
+       min_uclk_avg = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.svp_prefetch.average_bw_dram_kbps
+                                                               / 
((double)in_out->soc_bb->qos_parameters.derate_table.dcn_mall_prefetch_average.dram_derate_percent_pixel
 / 100),
+                                               
&in_out->soc_bb->clk_table.dram_config, &in_out->min_clk_table->dram_bw_table);
 
-       min_uclk_urgent = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.svp_prefetch.urgent_bw_dram_kbps,
 &in_out->soc_bb->clk_table.dram_config);
-       min_uclk_urgent = (double)min_uclk_urgent / 
((double)in_out->soc_bb->qos_parameters.derate_table.dcn_mall_prefetch_urgent.dram_derate_percent_pixel
 / 100);
+       min_uclk_urgent = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.svp_prefetch.urgent_bw_dram_kbps
+                                                               / 
((double)in_out->soc_bb->qos_parameters.derate_table.dcn_mall_prefetch_urgent.dram_derate_percent_pixel
 / 100),
+                                                
&in_out->soc_bb->clk_table.dram_config, &in_out->min_clk_table->dram_bw_table);
 
        min_uclk_bw = min_uclk_urgent > min_uclk_avg ? min_uclk_urgent : 
min_uclk_avg;
 
@@ -128,11 +144,13 @@ static void calculate_svp_prefetch_minimums(struct 
dml2_dpmm_map_mode_to_soc_dpm
        in_out->programming->min_clocks.dcn4x.svp_prefetch.dcfclk_khz = 
dml_round_up(min_dcfclk_bw > min_dcfclk_latency ? min_dcfclk_bw : 
min_dcfclk_latency);
 
        /* assumes DF throttling is disabled */
-       min_uclk_avg = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.svp_prefetch.average_bw_dram_kbps,
 &in_out->soc_bb->clk_table.dram_config);
-       min_uclk_avg = (double)min_uclk_avg / 
((double)in_out->soc_bb->qos_parameters.derate_table.system_active_average.dram_derate_percent_pixel
 / 100);
+       min_uclk_avg = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.svp_prefetch.average_bw_dram_kbps
+                                                                               
/ 
((double)in_out->soc_bb->qos_parameters.derate_table.system_active_average.dram_derate_percent_pixel
 / 100),
+                                                               
&in_out->soc_bb->clk_table.dram_config, &in_out->min_clk_table->dram_bw_table);
 
-       min_uclk_urgent = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.svp_prefetch.urgent_bw_dram_kbps,
 &in_out->soc_bb->clk_table.dram_config);
-       min_uclk_urgent = (double)min_uclk_urgent / 
((double)in_out->soc_bb->qos_parameters.derate_table.system_active_urgent.dram_derate_percent_pixel
 / 100);
+       min_uclk_urgent = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.svp_prefetch.urgent_bw_dram_kbps
+                                                                               
/ 
((double)in_out->soc_bb->qos_parameters.derate_table.system_active_urgent.dram_derate_percent_pixel
 / 100),
+                                                               
&in_out->soc_bb->clk_table.dram_config, &in_out->min_clk_table->dram_bw_table);
 
        min_uclk_bw = min_uclk_urgent > min_uclk_avg ? min_uclk_urgent : 
min_uclk_avg;
 
@@ -167,8 +185,9 @@ static void calculate_idle_minimums(struct 
dml2_dpmm_map_mode_to_soc_dpm_params_
        double min_uclk_latency, min_fclk_latency, min_dcfclk_latency;
        const struct dml2_core_mode_support_result *mode_support_result = 
&in_out->display_cfg->mode_support_result;
 
-       min_uclk_avg = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.active.average_bw_dram_kbps,
 &in_out->soc_bb->clk_table.dram_config);
-       min_uclk_avg = (double)min_uclk_avg / 
((double)in_out->soc_bb->qos_parameters.derate_table.system_idle_average.dram_derate_percent_pixel
 / 100);
+       min_uclk_avg = 
dram_bw_kbps_to_uclk_khz(mode_support_result->global.active.average_bw_dram_kbps
+                                                                               
/ 
((double)in_out->soc_bb->qos_parameters.derate_table.system_idle_average.dram_derate_percent_pixel
 / 100),
+                                                               
&in_out->soc_bb->clk_table.dram_config, &in_out->min_clk_table->dram_bw_table);
 
        min_fclk_avg = 
(double)mode_support_result->global.active.average_bw_sdp_kbps / 
in_out->soc_bb->fabric_datapath_to_dcn_data_return_bytes;
        min_fclk_avg = (double)min_fclk_avg / 
((double)in_out->soc_bb->qos_parameters.derate_table.system_idle_average.fclk_derate_percent
 / 100);
diff --git 
a/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/src/inc/dml2_internal_shared_types.h
 
b/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/src/inc/dml2_internal_shared_types.h
index 1a6c0727cd2a..a6bd75f30d20 100644
--- 
a/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/src/inc/dml2_internal_shared_types.h
+++ 
b/drivers/gpu/drm/amd/display/dc/dml2_0/dml21/src/inc/dml2_internal_shared_types.h
@@ -16,6 +16,7 @@
 
 struct dram_bw_to_min_clk_table_entry {
        unsigned long long pre_derate_dram_bw_kbps;
+       unsigned long min_uclk_khz;
        unsigned long min_fclk_khz;
        unsigned long min_dcfclk_khz;
 };
-- 
2.43.0

Reply via email to