/* * Copyright 2018 Advanced Micro Devices, Inc. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included in * all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR * OTHER DEALINGS IN THE SOFTWARE. * * Authors: AMD * */ #include #include "reg_helper.h" #include "core_types.h" #include "clk_mgr_internal.h" #include "rv1_clk_mgr.h" #include "dce100/dce_clk_mgr.h" #include "dce112/dce112_clk_mgr.h" #include "rv1_clk_mgr_vbios_smu.h" #include "rv1_clk_mgr_clk.h" void rv1_init_clocks(struct clk_mgr *clk_mgr) { memset(&(clk_mgr->clks), 0, sizeof(struct dc_clocks)); } static int rv1_determine_dppclk_threshold(struct clk_mgr_internal *clk_mgr, struct dc_clocks *new_clocks) { bool request_dpp_div = new_clocks->dispclk_khz > new_clocks->dppclk_khz; bool dispclk_increase = new_clocks->dispclk_khz > clk_mgr->base.clks.dispclk_khz; int disp_clk_threshold = new_clocks->max_supported_dppclk_khz; bool cur_dpp_div = clk_mgr->base.clks.dispclk_khz > clk_mgr->base.clks.dppclk_khz; /* increase clock, looking for div is 0 for current, request div is 1*/ if (dispclk_increase) { /* already divided by 2, no need to reach target clk with 2 steps*/ if (cur_dpp_div) return new_clocks->dispclk_khz; /* request disp clk is lower than maximum supported dpp clk, * no need to reach target clk with two steps. */ if (new_clocks->dispclk_khz <= disp_clk_threshold) return new_clocks->dispclk_khz; /* target dpp clk not request divided by 2, still within threshold */ if (!request_dpp_div) return new_clocks->dispclk_khz; } else { /* decrease clock, looking for current dppclk divided by 2, * request dppclk not divided by 2. */ /* current dpp clk not divided by 2, no need to ramp*/ if (!cur_dpp_div) return new_clocks->dispclk_khz; /* current disp clk is lower than current maximum dpp clk, * no need to ramp */ if (clk_mgr->base.clks.dispclk_khz <= disp_clk_threshold) return new_clocks->dispclk_khz; /* request dpp clk need to be divided by 2 */ if (request_dpp_div) return new_clocks->dispclk_khz; } return disp_clk_threshold; } static void ramp_up_dispclk_with_dpp( struct clk_mgr_internal *clk_mgr, struct dc *dc, struct dc_clocks *new_clocks, bool safe_to_lower) { int i; int dispclk_to_dpp_threshold = rv1_determine_dppclk_threshold(clk_mgr, new_clocks); bool request_dpp_div = new_clocks->dispclk_khz > new_clocks->dppclk_khz; /* this function is to change dispclk, dppclk and dprefclk according to * bandwidth requirement. Its call stack is rv1_update_clocks --> * update_clocks --> dcn10_prepare_bandwidth / dcn10_optimize_bandwidth * --> prepare_bandwidth / optimize_bandwidth. before change dcn hw, * prepare_bandwidth will be called first to allow enough clock, * watermark for change, after end of dcn hw change, optimize_bandwidth * is executed to lower clock to save power for new dcn hw settings. * * below is sequence of commit_planes_for_stream: * * step 1: prepare_bandwidth - raise clock to have enough bandwidth * step 2: lock_doublebuffer_enable * step 3: pipe_control_lock(true) - make dchubp register change will * not take effect right way * step 4: apply_ctx_for_surface - program dchubp * step 5: pipe_control_lock(false) - dchubp register change take effect * step 6: optimize_bandwidth --> dc_post_update_surfaces_to_stream * for full_date, optimize clock to save power * * at end of step 1, dcn clocks (dprefclk, dispclk, dppclk) may be * changed for new dchubp configuration. but real dcn hub dchubps are * still running with old configuration until end of step 5. this need * clocks settings at step 1 should not less than that before step 1. * this is checked by two conditions: 1. if (should_set_clock(safe_to_lower * , new_clocks->dispclk_khz, clk_mgr_base->clks.dispclk_khz) || * new_clocks->dispclk_khz == clk_mgr_base->clks.dispclk_khz) * 2. request_dpp_div = new_clocks->dispclk_khz > new_clocks->dppclk_khz * * the second condition is based on new dchubp configuration. dppclk * for new dchubp may be different from dppclk before step 1. * for example, before step 1, dchubps are as below: * pipe 0: recout=(0,40,1920,980) viewport=(0,0,1920,979) * pipe 1: recout=(0,0,1920,1080) viewport=(0,0,1920,1080) * for dppclk for pipe0 need dppclk = dispclk * * new dchubp pipe split configuration: * pipe 0: recout=(0,0,960,1080) viewport=(0,0,960,1080) * pipe 1: recout=(960,0,960,1080) viewport=(960,0,960,1080) * dppclk only needs dppclk = dispclk /2. * * dispclk, dppclk are not lock by otg master lock. they take effect * after step 1. during this transition, dispclk are the same, but * dppclk is changed to half of previous clock for old dchubp * configuration between step 1 and step 6. This may cause p-state * warning intermittently. * * for new_clocks->dispclk_khz == clk_mgr_base->clks.dispclk_khz, we * need make sure dppclk are not changed to less between step 1 and 6. * for new_clocks->dispclk_khz > clk_mgr_base->clks.dispclk_khz, * new display clock is raised, but we do not know ratio of * new_clocks->dispclk_khz and clk_mgr_base->clks.dispclk_khz, * new_clocks->dispclk_khz /2 does not guarantee equal or higher than * old dppclk. we could ignore power saving different between * dppclk = displck and dppclk = dispclk / 2 between step 1 and step 6. * as long as safe_to_lower = false, set dpclk = dispclk to simplify * condition check. * todo: review this change for other asic. **/ if (!safe_to_lower) request_dpp_div = false; /* set disp clk to dpp clk threshold */ clk_mgr->funcs->set_dispclk(clk_mgr, dispclk_to_dpp_threshold); clk_mgr->funcs->set_dprefclk(clk_mgr); /* update request dpp clk division option */ for (i = 0; i < dc->res_pool->pipe_count; i++) { struct pipe_ctx *pipe_ctx = &dc->current_state->res_ctx.pipe_ctx[i]; if (!pipe_ctx->plane_state) continue; pipe_ctx->plane_res.dpp->funcs->dpp_dppclk_control( pipe_ctx->plane_res.dpp, request_dpp_div, true); } /* If target clk not same as dppclk threshold, set to target clock */ if (dispclk_to_dpp_threshold != new_clocks->dispclk_khz) { clk_mgr->funcs->set_dispclk(clk_mgr, new_clocks->dispclk_khz); clk_mgr->funcs->set_dprefclk(clk_mgr); } clk_mgr->base.clks.dispclk_khz = new_clocks->dispclk_khz; clk_mgr->base.clks.dppclk_khz = new_clocks->dppclk_khz; clk_mgr->base.clks.max_supported_dppclk_khz = new_clocks->max_supported_dppclk_khz; } static void rv1_update_clocks(struct clk_mgr *clk_mgr_base, struct dc_state *context, bool safe_to_lower) { struct clk_mgr_internal *clk_mgr = TO_CLK_MGR_INTERNAL(clk_mgr_base); struct dc *dc = clk_mgr_base->ctx->dc; struct dc_debug_options *debug = &dc->debug; struct dc_clocks *new_clocks = &context->bw_ctx.bw.dcn.clk; struct pp_smu_funcs_rv *pp_smu = NULL; bool send_request_to_increase = false; bool send_request_to_lower = false; int display_count; bool enter_display_off = false; ASSERT(clk_mgr->pp_smu); pp_smu = &clk_mgr->pp_smu->rv_funcs; display_count = clk_mgr_helper_get_active_display_cnt(dc, context); if (display_count == 0) enter_display_off = true; if (enter_display_off == safe_to_lower) { /* * Notify SMU active displays * if function pointer not set up, this message is * sent as part of pplib_apply_display_requirements. */ if (pp_smu->set_display_count) pp_smu->set_display_count(&pp_smu->pp_smu, display_count); } if (new_clocks->dispclk_khz > clk_mgr_base->clks.dispclk_khz || new_clocks->phyclk_khz > clk_mgr_base->clks.phyclk_khz || new_clocks->fclk_khz > clk_mgr_base->clks.fclk_khz || new_clocks->dcfclk_khz > clk_mgr_base->clks.dcfclk_khz) send_request_to_increase = true; if (should_set_clock(safe_to_lower, new_clocks->phyclk_khz, clk_mgr_base->clks.phyclk_khz)) { clk_mgr_base->clks.phyclk_khz = new_clocks->phyclk_khz; send_request_to_lower = true; } // F Clock if (debug->force_fclk_khz != 0) new_clocks->fclk_khz = debug->force_fclk_khz; if (should_set_clock(safe_to_lower, new_clocks->fclk_khz, clk_mgr_base->clks.fclk_khz)) { clk_mgr_base->clks.fclk_khz = new_clocks->fclk_khz; send_request_to_lower = true; } //DCF Clock if (should_set_clock(safe_to_lower, new_clocks->dcfclk_khz, clk_mgr_base->clks.dcfclk_khz)) { clk_mgr_base->clks.dcfclk_khz = new_clocks->dcfclk_khz; send_request_to_lower = true; } if (should_set_clock(safe_to_lower, new_clocks->dcfclk_deep_sleep_khz, clk_mgr_base->clks.dcfclk_deep_sleep_khz)) { clk_mgr_base->clks.dcfclk_deep_sleep_khz = new_clocks->dcfclk_deep_sleep_khz; send_request_to_lower = true; } /* make sure dcf clk is before dpp clk to * make sure we have enough voltage to run dpp clk */ if (send_request_to_increase) { /*use dcfclk to request voltage*/ if (pp_smu->set_hard_min_fclk_by_freq && pp_smu->set_hard_min_dcfclk_by_freq && pp_smu->set_min_deep_sleep_dcfclk) { pp_smu->set_hard_min_fclk_by_freq(&pp_smu->pp_smu, new_clocks->fclk_khz / 1000); pp_smu->set_hard_min_dcfclk_by_freq(&pp_smu->pp_smu, new_clocks->dcfclk_khz / 1000); pp_smu->set_min_deep_sleep_dcfclk(&pp_smu->pp_smu, (new_clocks->dcfclk_deep_sleep_khz + 999) / 1000); } } /* dcn1 dppclk is tied to dispclk */ /* program dispclk on = as a w/a for sleep resume clock ramping issues */ if (should_set_clock(safe_to_lower, new_clocks->dispclk_khz, clk_mgr_base->clks.dispclk_khz) || new_clocks->dispclk_khz == clk_mgr_base->clks.dispclk_khz) { ramp_up_dispclk_with_dpp(clk_mgr, dc, new_clocks, safe_to_lower); clk_mgr_base->clks.dispclk_khz = new_clocks->dispclk_khz; send_request_to_lower = true; } if (!send_request_to_increase && send_request_to_lower) { /*use dcfclk to request voltage*/ if (pp_smu->set_hard_min_fclk_by_freq && pp_smu->set_hard_min_dcfclk_by_freq && pp_smu->set_min_deep_sleep_dcfclk) { pp_smu->set_hard_min_fclk_by_freq(&pp_smu->pp_smu, new_clocks->fclk_khz / 1000); pp_smu->set_hard_min_dcfclk_by_freq(&pp_smu->pp_smu, new_clocks->dcfclk_khz / 1000); pp_smu->set_min_deep_sleep_dcfclk(&pp_smu->pp_smu, (new_clocks->dcfclk_deep_sleep_khz + 999) / 1000); } } } static void rv1_enable_pme_wa(struct clk_mgr *clk_mgr_base) { struct clk_mgr_internal *clk_mgr = TO_CLK_MGR_INTERNAL(clk_mgr_base); struct pp_smu_funcs_rv *pp_smu = NULL; if (clk_mgr->pp_smu) { pp_smu = &clk_mgr->pp_smu->rv_funcs; if (pp_smu->set_pme_wa_enable) pp_smu->set_pme_wa_enable(&pp_smu->pp_smu); } } static struct clk_mgr_funcs rv1_clk_funcs = { .init_clocks = rv1_init_clocks, .get_dp_ref_clk_frequency = dce12_get_dp_ref_freq_khz, .update_clocks = rv1_update_clocks, .enable_pme_wa = rv1_enable_pme_wa, }; static struct clk_mgr_internal_funcs rv1_clk_internal_funcs = { .set_dispclk = rv1_vbios_smu_set_dispclk, .set_dprefclk = dce112_set_dprefclk }; void rv1_clk_mgr_construct(struct dc_context *ctx, struct clk_mgr_internal *clk_mgr, struct pp_smu_funcs *pp_smu) { struct dc_debug_options *debug = &ctx->dc->debug; struct dc_bios *bp = ctx->dc_bios; clk_mgr->base.ctx = ctx; clk_mgr->pp_smu = pp_smu; clk_mgr->base.funcs = &rv1_clk_funcs; clk_mgr->funcs = &rv1_clk_internal_funcs; clk_mgr->dfs_bypass_disp_clk = 0; clk_mgr->dprefclk_ss_percentage = 0; clk_mgr->dprefclk_ss_divider = 1000; clk_mgr->ss_on_dprefclk = false; clk_mgr->base.dprefclk_khz = 600000; if (bp->integrated_info) clk_mgr->dentist_vco_freq_khz = bp->integrated_info->dentist_vco_freq; if (bp->fw_info_valid && clk_mgr->dentist_vco_freq_khz == 0) { clk_mgr->dentist_vco_freq_khz = bp->fw_info.smu_gpu_pll_output_freq; if (clk_mgr->dentist_vco_freq_khz == 0) clk_mgr->dentist_vco_freq_khz = 3600000; } if (!debug->disable_dfs_bypass && bp->integrated_info) if (bp->integrated_info->gpu_cap_info & DFS_BYPASS_ENABLE) clk_mgr->dfs_bypass_enabled = true; dce_clock_read_ss_info(clk_mgr); }