|
@@ -1,367 +0,0 @@
|
|
|
-/*
|
|
|
- * Copyright 2017 Advanced Micro Devices, Inc.
|
|
|
- *
|
|
|
- * Permission is hereby granted, free of charge, to any person obtaining a
|
|
|
- * copy of this software and associated documentation files (the "Software"),
|
|
|
- * to deal in the Software without restriction, including without limitation
|
|
|
- * the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
|
- * and/or sell copies of the Software, and to permit persons to whom the
|
|
|
- * Software is furnished to do so, subject to the following conditions:
|
|
|
- *
|
|
|
- * The above copyright notice and this permission notice shall be included in
|
|
|
- * all copies or substantial portions of the Software.
|
|
|
- *
|
|
|
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
|
- * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
|
|
- * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
|
|
- * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
|
|
|
- * OTHER DEALINGS IN THE SOFTWARE.
|
|
|
- *
|
|
|
- * Authors: AMD
|
|
|
- *
|
|
|
- */
|
|
|
-
|
|
|
-#include "display_pipe_clocks.h"
|
|
|
-#include "display_mode_lib.h"
|
|
|
-#include "soc_bounding_box.h"
|
|
|
-
|
|
|
-static enum voltage_state power_state(
|
|
|
- struct display_mode_lib *mode_lib,
|
|
|
- double dispclk,
|
|
|
- double dppclk)
|
|
|
-{
|
|
|
- enum voltage_state state1;
|
|
|
- enum voltage_state state2;
|
|
|
-
|
|
|
- if (dispclk <= mode_lib->soc.vmin.dispclk_mhz)
|
|
|
- state1 = dm_vmin;
|
|
|
- else if (dispclk <= mode_lib->soc.vnom.dispclk_mhz)
|
|
|
- state1 = dm_vnom;
|
|
|
- else if (dispclk <= mode_lib->soc.vmax.dispclk_mhz)
|
|
|
- state1 = dm_vmax;
|
|
|
- else
|
|
|
- state1 = dm_vmax_exceeded;
|
|
|
-
|
|
|
- if (dppclk <= mode_lib->soc.vmin.dppclk_mhz)
|
|
|
- state2 = dm_vmin;
|
|
|
- else if (dppclk <= mode_lib->soc.vnom.dppclk_mhz)
|
|
|
- state2 = dm_vnom;
|
|
|
- else if (dppclk <= mode_lib->soc.vmax.dppclk_mhz)
|
|
|
- state2 = dm_vmax;
|
|
|
- else
|
|
|
- state2 = dm_vmax_exceeded;
|
|
|
-
|
|
|
- if (state1 > state2)
|
|
|
- return state1;
|
|
|
- else
|
|
|
- return state2;
|
|
|
-}
|
|
|
-
|
|
|
-static unsigned int dpp_in_grp(
|
|
|
- struct _vcs_dpi_display_e2e_pipe_params_st *e2e,
|
|
|
- unsigned int num_pipes,
|
|
|
- unsigned int hsplit_grp)
|
|
|
-{
|
|
|
- unsigned int num_dpp = 0;
|
|
|
- unsigned int i;
|
|
|
-
|
|
|
- for (i = 0; i < num_pipes; i++) {
|
|
|
- if (e2e[i].pipe.src.is_hsplit) {
|
|
|
- if (e2e[i].pipe.src.hsplit_grp == hsplit_grp) {
|
|
|
- num_dpp++;
|
|
|
- }
|
|
|
- }
|
|
|
- }
|
|
|
-
|
|
|
- if (0 == num_dpp)
|
|
|
- num_dpp = 1;
|
|
|
-
|
|
|
- return num_dpp;
|
|
|
-}
|
|
|
-
|
|
|
-static void calculate_pipe_clk_requirement(
|
|
|
- struct display_mode_lib *mode_lib,
|
|
|
- struct _vcs_dpi_display_e2e_pipe_params_st *e2e,
|
|
|
- unsigned int num_dpp_in_grp,
|
|
|
- double *dppclk,
|
|
|
- double *dispclk,
|
|
|
- bool *dppdiv)
|
|
|
-{
|
|
|
- double pscl_throughput = 0.0;
|
|
|
- double max_hratio = e2e->pipe.scale_ratio_depth.hscl_ratio;
|
|
|
- double max_vratio = e2e->pipe.scale_ratio_depth.vscl_ratio;
|
|
|
- double max_htaps = e2e->pipe.scale_taps.htaps;
|
|
|
- double max_vtaps = e2e->pipe.scale_taps.vtaps;
|
|
|
- double dpp_clock_divider = (double) num_dpp_in_grp;
|
|
|
- double dispclk_dppclk_ratio;
|
|
|
- double dispclk_ramp_margin_percent;
|
|
|
-
|
|
|
- if (max_hratio > 1.0) {
|
|
|
- double pscl_to_lb = ((double) mode_lib->ip.max_pscl_lb_bw_pix_per_clk * max_hratio)
|
|
|
- / dml_ceil(max_htaps / 6.0);
|
|
|
- pscl_throughput = dml_min(
|
|
|
- pscl_to_lb,
|
|
|
- (double) mode_lib->ip.max_dchub_pscl_bw_pix_per_clk);
|
|
|
- } else {
|
|
|
- pscl_throughput = dml_min(
|
|
|
- (double) mode_lib->ip.max_pscl_lb_bw_pix_per_clk,
|
|
|
- (double) mode_lib->ip.max_dchub_pscl_bw_pix_per_clk);
|
|
|
- }
|
|
|
-
|
|
|
- DTRACE("pscl_throughput: %f pix per clk", pscl_throughput);
|
|
|
- DTRACE("vtaps: %f hratio: %f vratio: %f", max_vtaps, max_hratio, max_vratio);
|
|
|
- *dppclk = dml_max(
|
|
|
- max_vtaps / 6.0 * dml_min(1.0, max_hratio),
|
|
|
- max_hratio * max_vratio / pscl_throughput);
|
|
|
- DTRACE("pixel rate multiplier: %f", *dppclk);
|
|
|
- *dppclk = dml_max(*dppclk, 1.0);
|
|
|
- DTRACE("pixel rate multiplier clamped: %f", *dppclk);
|
|
|
- *dppclk = *dppclk * e2e->pipe.dest.pixel_rate_mhz;
|
|
|
-
|
|
|
- *dppclk = *dppclk / dpp_clock_divider;
|
|
|
- DTRACE("dppclk after split: %f", *dppclk);
|
|
|
-
|
|
|
- if (dpp_clock_divider > 1.0 && (*dppclk < e2e->pipe.dest.pixel_rate_mhz)) {
|
|
|
- dispclk_dppclk_ratio = 2.0;
|
|
|
- *dppdiv = true;
|
|
|
- } else {
|
|
|
- dispclk_dppclk_ratio = 1.0;
|
|
|
- *dppdiv = false;
|
|
|
- }
|
|
|
-
|
|
|
- dispclk_ramp_margin_percent = mode_lib->ip.dispclk_ramp_margin_percent;
|
|
|
-
|
|
|
- /* Comment this out because of Gabes possible bug in spreadsheet,
|
|
|
- * just to make other cases evident during debug
|
|
|
- *
|
|
|
- *if(e2e->clks_cfg.voltage == dm_vmax)
|
|
|
- * dispclk_ramp_margin_percent = 0.0;
|
|
|
- */
|
|
|
-
|
|
|
- /* account for ramping margin and downspread */
|
|
|
- *dispclk = dml_max(*dppclk * dispclk_dppclk_ratio, e2e->pipe.dest.pixel_rate_mhz)
|
|
|
- * (1.0 + (double) mode_lib->soc.downspread_percent / 100.0)
|
|
|
- * (1.0 + (double) dispclk_ramp_margin_percent / 100.0);
|
|
|
-
|
|
|
- return;
|
|
|
-}
|
|
|
-
|
|
|
-bool dml_clks_pipe_clock_requirement_fit_power_constraint(
|
|
|
- struct display_mode_lib *mode_lib,
|
|
|
- struct _vcs_dpi_display_e2e_pipe_params_st *e2e,
|
|
|
- unsigned int num_dpp_in_grp)
|
|
|
-{
|
|
|
- double dppclk = 0;
|
|
|
- double dispclk = 0;
|
|
|
- bool dppdiv = 0;
|
|
|
-
|
|
|
- calculate_pipe_clk_requirement(mode_lib, e2e, num_dpp_in_grp, &dppclk, &dispclk, &dppdiv);
|
|
|
-
|
|
|
- if (power_state(mode_lib, dispclk, dppclk) > e2e->clks_cfg.voltage) {
|
|
|
- return false;
|
|
|
- }
|
|
|
-
|
|
|
- return true;
|
|
|
-}
|
|
|
-
|
|
|
-static void get_plane_clks(
|
|
|
- struct display_mode_lib *mode_lib,
|
|
|
- struct _vcs_dpi_display_e2e_pipe_params_st *e2e,
|
|
|
- unsigned int num_pipes,
|
|
|
- double *dppclks,
|
|
|
- double *dispclks,
|
|
|
- bool *dppdiv)
|
|
|
-{
|
|
|
- /* it is assumed that the scale ratios passed into the e2e pipe params have already been calculated
|
|
|
- * for any split pipe configurations, where extra pixels inthe overlap region do not contribute to
|
|
|
- * the scale ratio. This means that we can simply calculate the dppclk for each dpp independently
|
|
|
- * and we would expect the same result on any split pipes, which would be handled
|
|
|
- */
|
|
|
- unsigned int i;
|
|
|
-
|
|
|
- for (i = 0; i < num_pipes; i++) {
|
|
|
- double num_dpp_in_grp;
|
|
|
- double dispclk_ramp_margin_percent;
|
|
|
- double dispclk_margined;
|
|
|
-
|
|
|
- if (e2e[i].pipe.src.is_hsplit)
|
|
|
- num_dpp_in_grp = (double) dpp_in_grp(
|
|
|
- e2e,
|
|
|
- num_pipes,
|
|
|
- e2e[i].pipe.src.hsplit_grp);
|
|
|
- else
|
|
|
- num_dpp_in_grp = 1;
|
|
|
-
|
|
|
- calculate_pipe_clk_requirement(
|
|
|
- mode_lib,
|
|
|
- &e2e[i],
|
|
|
- num_dpp_in_grp,
|
|
|
- &dppclks[i],
|
|
|
- &dispclks[i],
|
|
|
- &dppdiv[i]);
|
|
|
-
|
|
|
- dispclk_ramp_margin_percent = mode_lib->ip.dispclk_ramp_margin_percent;
|
|
|
-
|
|
|
- dispclk_margined = e2e[i].pipe.dest.pixel_rate_mhz
|
|
|
- * (1.0 + (double) mode_lib->soc.downspread_percent / 100.0)
|
|
|
- * (1.0 + (double) dispclk_ramp_margin_percent / 100.0);
|
|
|
-
|
|
|
- DTRACE("p%d: requested power state: %d", i, (int) e2e[0].clks_cfg.voltage);
|
|
|
-
|
|
|
- if (power_state(mode_lib, dispclks[i], dppclks[i])
|
|
|
- > power_state(mode_lib, dispclk_margined, dispclk_margined)
|
|
|
- && dispclk_margined > dppclks[i]) {
|
|
|
- if (power_state(mode_lib, dispclks[i], dppclks[i])
|
|
|
- > e2e[0].clks_cfg.voltage) {
|
|
|
- dispclks[i] = dispclk_margined;
|
|
|
- dppclks[i] = dispclk_margined;
|
|
|
- dppdiv[i] = false;
|
|
|
- }
|
|
|
- }
|
|
|
-
|
|
|
- DTRACE("p%d: dispclk: %f", i, dispclks[i]);
|
|
|
- }
|
|
|
-}
|
|
|
-
|
|
|
-static void get_dcfclk(
|
|
|
- struct display_mode_lib *mode_lib,
|
|
|
- struct _vcs_dpi_display_e2e_pipe_params_st *e2e,
|
|
|
- unsigned int num_pipes,
|
|
|
- double *dcfclk_mhz)
|
|
|
-{
|
|
|
- double bytes_per_pixel_det_y[DC__NUM_PIPES__MAX];
|
|
|
- double bytes_per_pixel_det_c[DC__NUM_PIPES__MAX];
|
|
|
- double swath_width_y[DC__NUM_PIPES__MAX];
|
|
|
- unsigned int i;
|
|
|
- double total_read_bandwidth_gbps = 0.0;
|
|
|
-
|
|
|
- for (i = 0; i < num_pipes; i++) {
|
|
|
- if (e2e[i].pipe.src.source_scan == dm_horz) {
|
|
|
- swath_width_y[i] = e2e[i].pipe.src.viewport_width * 1.0;
|
|
|
- } else {
|
|
|
- swath_width_y[i] = e2e[i].pipe.src.viewport_height * 1.0;
|
|
|
- }
|
|
|
-
|
|
|
- switch (e2e[i].pipe.src.source_format) {
|
|
|
- case dm_444_64:
|
|
|
- bytes_per_pixel_det_y[i] = 8.0;
|
|
|
- bytes_per_pixel_det_c[i] = 0.0;
|
|
|
- break;
|
|
|
- case dm_444_32:
|
|
|
- bytes_per_pixel_det_y[i] = 4.0;
|
|
|
- bytes_per_pixel_det_c[i] = 0.0;
|
|
|
- break;
|
|
|
- case dm_444_16:
|
|
|
- bytes_per_pixel_det_y[i] = 2.0;
|
|
|
- bytes_per_pixel_det_c[i] = 0.0;
|
|
|
- break;
|
|
|
- case dm_422_8:
|
|
|
- bytes_per_pixel_det_y[i] = 2.0;
|
|
|
- bytes_per_pixel_det_c[i] = 0.0;
|
|
|
- break;
|
|
|
- case dm_422_10:
|
|
|
- bytes_per_pixel_det_y[i] = 4.0;
|
|
|
- bytes_per_pixel_det_c[i] = 0.0;
|
|
|
- break;
|
|
|
- case dm_420_8:
|
|
|
- bytes_per_pixel_det_y[i] = 1.0;
|
|
|
- bytes_per_pixel_det_c[i] = 2.0;
|
|
|
- break;
|
|
|
- case dm_420_10:
|
|
|
- bytes_per_pixel_det_y[i] = 4.0 / 3.0;
|
|
|
- bytes_per_pixel_det_c[i] = 8.0 / 3.0;
|
|
|
- break;
|
|
|
- default:
|
|
|
- BREAK_TO_DEBUGGER(); /* invalid src_format in get_dcfclk */
|
|
|
- }
|
|
|
- }
|
|
|
-
|
|
|
- for (i = 0; i < num_pipes; i++) {
|
|
|
- double read_bandwidth_plane_mbps = 0.0;
|
|
|
- read_bandwidth_plane_mbps = (double) swath_width_y[i]
|
|
|
- * ((double) bytes_per_pixel_det_y[i]
|
|
|
- + (double) bytes_per_pixel_det_c[i] / 2.0)
|
|
|
- / ((double) e2e[i].pipe.dest.htotal
|
|
|
- / (double) e2e[i].pipe.dest.pixel_rate_mhz)
|
|
|
- * e2e[i].pipe.scale_ratio_depth.vscl_ratio;
|
|
|
-
|
|
|
- if (e2e[i].pipe.src.dcc) {
|
|
|
- read_bandwidth_plane_mbps += (read_bandwidth_plane_mbps / 1000.0 / 256.0);
|
|
|
- }
|
|
|
-
|
|
|
- if (e2e[i].pipe.src.vm) {
|
|
|
- read_bandwidth_plane_mbps += (read_bandwidth_plane_mbps / 1000.0 / 512.0);
|
|
|
- }
|
|
|
-
|
|
|
- total_read_bandwidth_gbps = total_read_bandwidth_gbps
|
|
|
- + read_bandwidth_plane_mbps / 1000.0;
|
|
|
- }
|
|
|
-
|
|
|
- DTRACE("total bandwidth = %f gbps", total_read_bandwidth_gbps);
|
|
|
-
|
|
|
- (*dcfclk_mhz) = (total_read_bandwidth_gbps * 1000.0) / mode_lib->soc.return_bus_width_bytes;
|
|
|
-
|
|
|
- DTRACE(
|
|
|
- "minimum theoretical dcfclk without stutter and full utilization = %f MHz",
|
|
|
- (*dcfclk_mhz));
|
|
|
-
|
|
|
-}
|
|
|
-
|
|
|
-struct _vcs_dpi_display_pipe_clock_st dml_clks_get_pipe_clocks(
|
|
|
- struct display_mode_lib *mode_lib,
|
|
|
- struct _vcs_dpi_display_e2e_pipe_params_st *e2e,
|
|
|
- unsigned int num_pipes)
|
|
|
-{
|
|
|
- struct _vcs_dpi_display_pipe_clock_st clocks;
|
|
|
- double max_dispclk = 0.0;
|
|
|
- double dcfclk;
|
|
|
- double dispclks[DC__NUM_PIPES__MAX];
|
|
|
- double dppclks[DC__NUM_PIPES__MAX];
|
|
|
- bool dppdiv[DC__NUM_PIPES__MAX];
|
|
|
- unsigned int i;
|
|
|
-
|
|
|
- DTRACE("Calculating pipe clocks...");
|
|
|
-
|
|
|
- /* this is the theoretical minimum, have to adjust based on valid values for soc */
|
|
|
- get_dcfclk(mode_lib, e2e, num_pipes, &dcfclk);
|
|
|
-
|
|
|
- /* if(dcfclk > soc.vnom.dcfclk_mhz)
|
|
|
- * dcfclk = soc.vmax.dcfclk_mhz;
|
|
|
- * else if(dcfclk > soc.vmin.dcfclk_mhz)
|
|
|
- * dcfclk = soc.vnom.dcfclk_mhz;
|
|
|
- * else
|
|
|
- * dcfclk = soc.vmin.dcfclk_mhz;
|
|
|
- */
|
|
|
-
|
|
|
- dcfclk = dml_socbb_voltage_scaling(
|
|
|
- &mode_lib->soc,
|
|
|
- (enum voltage_state) e2e[0].clks_cfg.voltage).dcfclk_mhz;
|
|
|
- clocks.dcfclk_mhz = dcfclk;
|
|
|
-
|
|
|
- get_plane_clks(mode_lib, e2e, num_pipes, dppclks, dispclks, dppdiv);
|
|
|
-
|
|
|
- for (i = 0; i < num_pipes; i++) {
|
|
|
- max_dispclk = dml_max(max_dispclk, dispclks[i]);
|
|
|
- }
|
|
|
-
|
|
|
- clocks.dispclk_mhz = max_dispclk;
|
|
|
- DTRACE("dispclk: %f Mhz", clocks.dispclk_mhz);
|
|
|
- DTRACE("dcfclk: %f Mhz", clocks.dcfclk_mhz);
|
|
|
-
|
|
|
- for (i = 0; i < num_pipes; i++) {
|
|
|
- if (dppclks[i] * 2 < max_dispclk)
|
|
|
- dppdiv[i] = 1;
|
|
|
-
|
|
|
- if (dppdiv[i])
|
|
|
- clocks.dppclk_div[i] = 1;
|
|
|
- else
|
|
|
- clocks.dppclk_div[i] = 0;
|
|
|
-
|
|
|
- clocks.dppclk_mhz[i] = max_dispclk / ((dppdiv[i]) ? 2.0 : 1.0);
|
|
|
- DTRACE("dppclk%d: %f Mhz", i, clocks.dppclk_mhz[i]);
|
|
|
- }
|
|
|
-
|
|
|
- return clocks;
|
|
|
-}
|