dcn20_fpu.c (75606B)
1// SPDX-License-Identifier: MIT 2/* 3 * Copyright 2021 Advanced Micro Devices, Inc. 4 * 5 * Permission is hereby granted, free of charge, to any person obtaining a 6 * copy of this software and associated documentation files (the "Software"), 7 * to deal in the Software without restriction, including without limitation 8 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 9 * and/or sell copies of the Software, and to permit persons to whom the 10 * Software is furnished to do so, subject to the following conditions: 11 * 12 * The above copyright notice and this permission notice shall be included in 13 * all copies or substantial portions of the Software. 14 * 15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 18 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 19 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 20 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 21 * OTHER DEALINGS IN THE SOFTWARE. 22 * 23 * Authors: AMD 24 * 25 */ 26 27#include "resource.h" 28#include "clk_mgr.h" 29#include "dc_link_dp.h" 30#include "dchubbub.h" 31#include "dcn20/dcn20_resource.h" 32#include "dcn21/dcn21_resource.h" 33 34#include "dcn20_fpu.h" 35 36#define DC_LOGGER_INIT(logger) 37 38#ifndef MAX 39#define MAX(X, Y) ((X) > (Y) ? (X) : (Y)) 40#endif 41#ifndef MIN 42#define MIN(X, Y) ((X) < (Y) ? (X) : (Y)) 43#endif 44 45/** 46 * DOC: DCN2x FPU manipulation Overview 47 * 48 * The DCN architecture relies on FPU operations, which require special 49 * compilation flags and the use of kernel_fpu_begin/end functions; ideally, we 50 * want to avoid spreading FPU access across multiple files. With this idea in 51 * mind, this file aims to centralize all DCN20 and DCN2.1 (DCN2x) functions 52 * that require FPU access in a single place. Code in this file follows the 53 * following code pattern: 54 * 55 * 1. Functions that use FPU operations should be isolated in static functions. 56 * 2. The FPU functions should have the noinline attribute to ensure anything 57 * that deals with FP register is contained within this call. 58 * 3. All function that needs to be accessed outside this file requires a 59 * public interface that not uses any FPU reference. 60 * 4. Developers **must not** use DC_FP_START/END in this file, but they need 61 * to ensure that the caller invokes it before access any function available 62 * in this file. For this reason, public functions in this file must invoke 63 * dc_assert_fp_enabled(); 64 * 65 * Let's expand a little bit more the idea in the code pattern. To fully 66 * isolate FPU operations in a single place, we must avoid situations where 67 * compilers spill FP values to registers due to FP enable in a specific C 68 * file. Note that even if we isolate all FPU functions in a single file and 69 * call its interface from other files, the compiler might enable the use of 70 * FPU before we call DC_FP_START. Nevertheless, it is the programmer's 71 * responsibility to invoke DC_FP_START/END in the correct place. To highlight 72 * situations where developers forgot to use the FP protection before calling 73 * the DC FPU interface functions, we introduce a helper that checks if the 74 * function is invoked under FP protection. If not, it will trigger a kernel 75 * warning. 76 */ 77 78struct _vcs_dpi_ip_params_st dcn2_0_ip = { 79 .odm_capable = 1, 80 .gpuvm_enable = 0, 81 .hostvm_enable = 0, 82 .gpuvm_max_page_table_levels = 4, 83 .hostvm_max_page_table_levels = 4, 84 .hostvm_cached_page_table_levels = 0, 85 .pte_group_size_bytes = 2048, 86 .num_dsc = 6, 87 .rob_buffer_size_kbytes = 168, 88 .det_buffer_size_kbytes = 164, 89 .dpte_buffer_size_in_pte_reqs_luma = 84, 90 .pde_proc_buffer_size_64k_reqs = 48, 91 .dpp_output_buffer_pixels = 2560, 92 .opp_output_buffer_lines = 1, 93 .pixel_chunk_size_kbytes = 8, 94 .pte_chunk_size_kbytes = 2, 95 .meta_chunk_size_kbytes = 2, 96 .writeback_chunk_size_kbytes = 2, 97 .line_buffer_size_bits = 789504, 98 .is_line_buffer_bpp_fixed = 0, 99 .line_buffer_fixed_bpp = 0, 100 .dcc_supported = true, 101 .max_line_buffer_lines = 12, 102 .writeback_luma_buffer_size_kbytes = 12, 103 .writeback_chroma_buffer_size_kbytes = 8, 104 .writeback_chroma_line_buffer_width_pixels = 4, 105 .writeback_max_hscl_ratio = 1, 106 .writeback_max_vscl_ratio = 1, 107 .writeback_min_hscl_ratio = 1, 108 .writeback_min_vscl_ratio = 1, 109 .writeback_max_hscl_taps = 12, 110 .writeback_max_vscl_taps = 12, 111 .writeback_line_buffer_luma_buffer_size = 0, 112 .writeback_line_buffer_chroma_buffer_size = 14643, 113 .cursor_buffer_size = 8, 114 .cursor_chunk_size = 2, 115 .max_num_otg = 6, 116 .max_num_dpp = 6, 117 .max_num_wb = 1, 118 .max_dchub_pscl_bw_pix_per_clk = 4, 119 .max_pscl_lb_bw_pix_per_clk = 2, 120 .max_lb_vscl_bw_pix_per_clk = 4, 121 .max_vscl_hscl_bw_pix_per_clk = 4, 122 .max_hscl_ratio = 8, 123 .max_vscl_ratio = 8, 124 .hscl_mults = 4, 125 .vscl_mults = 4, 126 .max_hscl_taps = 8, 127 .max_vscl_taps = 8, 128 .dispclk_ramp_margin_percent = 1, 129 .underscan_factor = 1.10, 130 .min_vblank_lines = 32, // 131 .dppclk_delay_subtotal = 77, // 132 .dppclk_delay_scl_lb_only = 16, 133 .dppclk_delay_scl = 50, 134 .dppclk_delay_cnvc_formatter = 8, 135 .dppclk_delay_cnvc_cursor = 6, 136 .dispclk_delay_subtotal = 87, // 137 .dcfclk_cstate_latency = 10, // SRExitTime 138 .max_inter_dcn_tile_repeaters = 8, 139 .xfc_supported = true, 140 .xfc_fill_bw_overhead_percent = 10.0, 141 .xfc_fill_constant_bytes = 0, 142 .number_of_cursors = 1, 143}; 144 145struct _vcs_dpi_ip_params_st dcn2_0_nv14_ip = { 146 .odm_capable = 1, 147 .gpuvm_enable = 0, 148 .hostvm_enable = 0, 149 .gpuvm_max_page_table_levels = 4, 150 .hostvm_max_page_table_levels = 4, 151 .hostvm_cached_page_table_levels = 0, 152 .num_dsc = 5, 153 .rob_buffer_size_kbytes = 168, 154 .det_buffer_size_kbytes = 164, 155 .dpte_buffer_size_in_pte_reqs_luma = 84, 156 .dpte_buffer_size_in_pte_reqs_chroma = 42,//todo 157 .dpp_output_buffer_pixels = 2560, 158 .opp_output_buffer_lines = 1, 159 .pixel_chunk_size_kbytes = 8, 160 .pte_enable = 1, 161 .max_page_table_levels = 4, 162 .pte_chunk_size_kbytes = 2, 163 .meta_chunk_size_kbytes = 2, 164 .writeback_chunk_size_kbytes = 2, 165 .line_buffer_size_bits = 789504, 166 .is_line_buffer_bpp_fixed = 0, 167 .line_buffer_fixed_bpp = 0, 168 .dcc_supported = true, 169 .max_line_buffer_lines = 12, 170 .writeback_luma_buffer_size_kbytes = 12, 171 .writeback_chroma_buffer_size_kbytes = 8, 172 .writeback_chroma_line_buffer_width_pixels = 4, 173 .writeback_max_hscl_ratio = 1, 174 .writeback_max_vscl_ratio = 1, 175 .writeback_min_hscl_ratio = 1, 176 .writeback_min_vscl_ratio = 1, 177 .writeback_max_hscl_taps = 12, 178 .writeback_max_vscl_taps = 12, 179 .writeback_line_buffer_luma_buffer_size = 0, 180 .writeback_line_buffer_chroma_buffer_size = 14643, 181 .cursor_buffer_size = 8, 182 .cursor_chunk_size = 2, 183 .max_num_otg = 5, 184 .max_num_dpp = 5, 185 .max_num_wb = 1, 186 .max_dchub_pscl_bw_pix_per_clk = 4, 187 .max_pscl_lb_bw_pix_per_clk = 2, 188 .max_lb_vscl_bw_pix_per_clk = 4, 189 .max_vscl_hscl_bw_pix_per_clk = 4, 190 .max_hscl_ratio = 8, 191 .max_vscl_ratio = 8, 192 .hscl_mults = 4, 193 .vscl_mults = 4, 194 .max_hscl_taps = 8, 195 .max_vscl_taps = 8, 196 .dispclk_ramp_margin_percent = 1, 197 .underscan_factor = 1.10, 198 .min_vblank_lines = 32, // 199 .dppclk_delay_subtotal = 77, // 200 .dppclk_delay_scl_lb_only = 16, 201 .dppclk_delay_scl = 50, 202 .dppclk_delay_cnvc_formatter = 8, 203 .dppclk_delay_cnvc_cursor = 6, 204 .dispclk_delay_subtotal = 87, // 205 .dcfclk_cstate_latency = 10, // SRExitTime 206 .max_inter_dcn_tile_repeaters = 8, 207 .xfc_supported = true, 208 .xfc_fill_bw_overhead_percent = 10.0, 209 .xfc_fill_constant_bytes = 0, 210 .ptoi_supported = 0, 211 .number_of_cursors = 1, 212}; 213 214struct _vcs_dpi_soc_bounding_box_st dcn2_0_soc = { 215 /* Defaults that get patched on driver load from firmware. */ 216 .clock_limits = { 217 { 218 .state = 0, 219 .dcfclk_mhz = 560.0, 220 .fabricclk_mhz = 560.0, 221 .dispclk_mhz = 513.0, 222 .dppclk_mhz = 513.0, 223 .phyclk_mhz = 540.0, 224 .socclk_mhz = 560.0, 225 .dscclk_mhz = 171.0, 226 .dram_speed_mts = 8960.0, 227 }, 228 { 229 .state = 1, 230 .dcfclk_mhz = 694.0, 231 .fabricclk_mhz = 694.0, 232 .dispclk_mhz = 642.0, 233 .dppclk_mhz = 642.0, 234 .phyclk_mhz = 600.0, 235 .socclk_mhz = 694.0, 236 .dscclk_mhz = 214.0, 237 .dram_speed_mts = 11104.0, 238 }, 239 { 240 .state = 2, 241 .dcfclk_mhz = 875.0, 242 .fabricclk_mhz = 875.0, 243 .dispclk_mhz = 734.0, 244 .dppclk_mhz = 734.0, 245 .phyclk_mhz = 810.0, 246 .socclk_mhz = 875.0, 247 .dscclk_mhz = 245.0, 248 .dram_speed_mts = 14000.0, 249 }, 250 { 251 .state = 3, 252 .dcfclk_mhz = 1000.0, 253 .fabricclk_mhz = 1000.0, 254 .dispclk_mhz = 1100.0, 255 .dppclk_mhz = 1100.0, 256 .phyclk_mhz = 810.0, 257 .socclk_mhz = 1000.0, 258 .dscclk_mhz = 367.0, 259 .dram_speed_mts = 16000.0, 260 }, 261 { 262 .state = 4, 263 .dcfclk_mhz = 1200.0, 264 .fabricclk_mhz = 1200.0, 265 .dispclk_mhz = 1284.0, 266 .dppclk_mhz = 1284.0, 267 .phyclk_mhz = 810.0, 268 .socclk_mhz = 1200.0, 269 .dscclk_mhz = 428.0, 270 .dram_speed_mts = 16000.0, 271 }, 272 /*Extra state, no dispclk ramping*/ 273 { 274 .state = 5, 275 .dcfclk_mhz = 1200.0, 276 .fabricclk_mhz = 1200.0, 277 .dispclk_mhz = 1284.0, 278 .dppclk_mhz = 1284.0, 279 .phyclk_mhz = 810.0, 280 .socclk_mhz = 1200.0, 281 .dscclk_mhz = 428.0, 282 .dram_speed_mts = 16000.0, 283 }, 284 }, 285 .num_states = 5, 286 .sr_exit_time_us = 8.6, 287 .sr_enter_plus_exit_time_us = 10.9, 288 .urgent_latency_us = 4.0, 289 .urgent_latency_pixel_data_only_us = 4.0, 290 .urgent_latency_pixel_mixed_with_vm_data_us = 4.0, 291 .urgent_latency_vm_data_only_us = 4.0, 292 .urgent_out_of_order_return_per_channel_pixel_only_bytes = 4096, 293 .urgent_out_of_order_return_per_channel_pixel_and_vm_bytes = 4096, 294 .urgent_out_of_order_return_per_channel_vm_only_bytes = 4096, 295 .pct_ideal_dram_sdp_bw_after_urgent_pixel_only = 40.0, 296 .pct_ideal_dram_sdp_bw_after_urgent_pixel_and_vm = 40.0, 297 .pct_ideal_dram_sdp_bw_after_urgent_vm_only = 40.0, 298 .max_avg_sdp_bw_use_normal_percent = 40.0, 299 .max_avg_dram_bw_use_normal_percent = 40.0, 300 .writeback_latency_us = 12.0, 301 .ideal_dram_bw_after_urgent_percent = 40.0, 302 .max_request_size_bytes = 256, 303 .dram_channel_width_bytes = 2, 304 .fabric_datapath_to_dcn_data_return_bytes = 64, 305 .dcn_downspread_percent = 0.5, 306 .downspread_percent = 0.38, 307 .dram_page_open_time_ns = 50.0, 308 .dram_rw_turnaround_time_ns = 17.5, 309 .dram_return_buffer_per_channel_bytes = 8192, 310 .round_trip_ping_latency_dcfclk_cycles = 131, 311 .urgent_out_of_order_return_per_channel_bytes = 256, 312 .channel_interleave_bytes = 256, 313 .num_banks = 8, 314 .num_chans = 16, 315 .vmm_page_size_bytes = 4096, 316 .dram_clock_change_latency_us = 404.0, 317 .dummy_pstate_latency_us = 5.0, 318 .writeback_dram_clock_change_latency_us = 23.0, 319 .return_bus_width_bytes = 64, 320 .dispclk_dppclk_vco_speed_mhz = 3850, 321 .xfc_bus_transport_time_us = 20, 322 .xfc_xbuf_latency_tolerance_us = 4, 323 .use_urgent_burst_bw = 0 324}; 325 326struct _vcs_dpi_soc_bounding_box_st dcn2_0_nv14_soc = { 327 .clock_limits = { 328 { 329 .state = 0, 330 .dcfclk_mhz = 560.0, 331 .fabricclk_mhz = 560.0, 332 .dispclk_mhz = 513.0, 333 .dppclk_mhz = 513.0, 334 .phyclk_mhz = 540.0, 335 .socclk_mhz = 560.0, 336 .dscclk_mhz = 171.0, 337 .dram_speed_mts = 8960.0, 338 }, 339 { 340 .state = 1, 341 .dcfclk_mhz = 694.0, 342 .fabricclk_mhz = 694.0, 343 .dispclk_mhz = 642.0, 344 .dppclk_mhz = 642.0, 345 .phyclk_mhz = 600.0, 346 .socclk_mhz = 694.0, 347 .dscclk_mhz = 214.0, 348 .dram_speed_mts = 11104.0, 349 }, 350 { 351 .state = 2, 352 .dcfclk_mhz = 875.0, 353 .fabricclk_mhz = 875.0, 354 .dispclk_mhz = 734.0, 355 .dppclk_mhz = 734.0, 356 .phyclk_mhz = 810.0, 357 .socclk_mhz = 875.0, 358 .dscclk_mhz = 245.0, 359 .dram_speed_mts = 14000.0, 360 }, 361 { 362 .state = 3, 363 .dcfclk_mhz = 1000.0, 364 .fabricclk_mhz = 1000.0, 365 .dispclk_mhz = 1100.0, 366 .dppclk_mhz = 1100.0, 367 .phyclk_mhz = 810.0, 368 .socclk_mhz = 1000.0, 369 .dscclk_mhz = 367.0, 370 .dram_speed_mts = 16000.0, 371 }, 372 { 373 .state = 4, 374 .dcfclk_mhz = 1200.0, 375 .fabricclk_mhz = 1200.0, 376 .dispclk_mhz = 1284.0, 377 .dppclk_mhz = 1284.0, 378 .phyclk_mhz = 810.0, 379 .socclk_mhz = 1200.0, 380 .dscclk_mhz = 428.0, 381 .dram_speed_mts = 16000.0, 382 }, 383 /*Extra state, no dispclk ramping*/ 384 { 385 .state = 5, 386 .dcfclk_mhz = 1200.0, 387 .fabricclk_mhz = 1200.0, 388 .dispclk_mhz = 1284.0, 389 .dppclk_mhz = 1284.0, 390 .phyclk_mhz = 810.0, 391 .socclk_mhz = 1200.0, 392 .dscclk_mhz = 428.0, 393 .dram_speed_mts = 16000.0, 394 }, 395 }, 396 .num_states = 5, 397 .sr_exit_time_us = 11.6, 398 .sr_enter_plus_exit_time_us = 13.9, 399 .urgent_latency_us = 4.0, 400 .urgent_latency_pixel_data_only_us = 4.0, 401 .urgent_latency_pixel_mixed_with_vm_data_us = 4.0, 402 .urgent_latency_vm_data_only_us = 4.0, 403 .urgent_out_of_order_return_per_channel_pixel_only_bytes = 4096, 404 .urgent_out_of_order_return_per_channel_pixel_and_vm_bytes = 4096, 405 .urgent_out_of_order_return_per_channel_vm_only_bytes = 4096, 406 .pct_ideal_dram_sdp_bw_after_urgent_pixel_only = 40.0, 407 .pct_ideal_dram_sdp_bw_after_urgent_pixel_and_vm = 40.0, 408 .pct_ideal_dram_sdp_bw_after_urgent_vm_only = 40.0, 409 .max_avg_sdp_bw_use_normal_percent = 40.0, 410 .max_avg_dram_bw_use_normal_percent = 40.0, 411 .writeback_latency_us = 12.0, 412 .ideal_dram_bw_after_urgent_percent = 40.0, 413 .max_request_size_bytes = 256, 414 .dram_channel_width_bytes = 2, 415 .fabric_datapath_to_dcn_data_return_bytes = 64, 416 .dcn_downspread_percent = 0.5, 417 .downspread_percent = 0.38, 418 .dram_page_open_time_ns = 50.0, 419 .dram_rw_turnaround_time_ns = 17.5, 420 .dram_return_buffer_per_channel_bytes = 8192, 421 .round_trip_ping_latency_dcfclk_cycles = 131, 422 .urgent_out_of_order_return_per_channel_bytes = 256, 423 .channel_interleave_bytes = 256, 424 .num_banks = 8, 425 .num_chans = 8, 426 .vmm_page_size_bytes = 4096, 427 .dram_clock_change_latency_us = 404.0, 428 .dummy_pstate_latency_us = 5.0, 429 .writeback_dram_clock_change_latency_us = 23.0, 430 .return_bus_width_bytes = 64, 431 .dispclk_dppclk_vco_speed_mhz = 3850, 432 .xfc_bus_transport_time_us = 20, 433 .xfc_xbuf_latency_tolerance_us = 4, 434 .use_urgent_burst_bw = 0 435}; 436 437struct _vcs_dpi_soc_bounding_box_st dcn2_0_nv12_soc = { 0 }; 438 439struct _vcs_dpi_ip_params_st dcn2_1_ip = { 440 .odm_capable = 1, 441 .gpuvm_enable = 1, 442 .hostvm_enable = 1, 443 .gpuvm_max_page_table_levels = 1, 444 .hostvm_max_page_table_levels = 4, 445 .hostvm_cached_page_table_levels = 2, 446 .num_dsc = 3, 447 .rob_buffer_size_kbytes = 168, 448 .det_buffer_size_kbytes = 164, 449 .dpte_buffer_size_in_pte_reqs_luma = 44, 450 .dpte_buffer_size_in_pte_reqs_chroma = 42,//todo 451 .dpp_output_buffer_pixels = 2560, 452 .opp_output_buffer_lines = 1, 453 .pixel_chunk_size_kbytes = 8, 454 .pte_enable = 1, 455 .max_page_table_levels = 4, 456 .pte_chunk_size_kbytes = 2, 457 .meta_chunk_size_kbytes = 2, 458 .min_meta_chunk_size_bytes = 256, 459 .writeback_chunk_size_kbytes = 2, 460 .line_buffer_size_bits = 789504, 461 .is_line_buffer_bpp_fixed = 0, 462 .line_buffer_fixed_bpp = 0, 463 .dcc_supported = true, 464 .max_line_buffer_lines = 12, 465 .writeback_luma_buffer_size_kbytes = 12, 466 .writeback_chroma_buffer_size_kbytes = 8, 467 .writeback_chroma_line_buffer_width_pixels = 4, 468 .writeback_max_hscl_ratio = 1, 469 .writeback_max_vscl_ratio = 1, 470 .writeback_min_hscl_ratio = 1, 471 .writeback_min_vscl_ratio = 1, 472 .writeback_max_hscl_taps = 12, 473 .writeback_max_vscl_taps = 12, 474 .writeback_line_buffer_luma_buffer_size = 0, 475 .writeback_line_buffer_chroma_buffer_size = 14643, 476 .cursor_buffer_size = 8, 477 .cursor_chunk_size = 2, 478 .max_num_otg = 4, 479 .max_num_dpp = 4, 480 .max_num_wb = 1, 481 .max_dchub_pscl_bw_pix_per_clk = 4, 482 .max_pscl_lb_bw_pix_per_clk = 2, 483 .max_lb_vscl_bw_pix_per_clk = 4, 484 .max_vscl_hscl_bw_pix_per_clk = 4, 485 .max_hscl_ratio = 4, 486 .max_vscl_ratio = 4, 487 .hscl_mults = 4, 488 .vscl_mults = 4, 489 .max_hscl_taps = 8, 490 .max_vscl_taps = 8, 491 .dispclk_ramp_margin_percent = 1, 492 .underscan_factor = 1.10, 493 .min_vblank_lines = 32, // 494 .dppclk_delay_subtotal = 77, // 495 .dppclk_delay_scl_lb_only = 16, 496 .dppclk_delay_scl = 50, 497 .dppclk_delay_cnvc_formatter = 8, 498 .dppclk_delay_cnvc_cursor = 6, 499 .dispclk_delay_subtotal = 87, // 500 .dcfclk_cstate_latency = 10, // SRExitTime 501 .max_inter_dcn_tile_repeaters = 8, 502 503 .xfc_supported = false, 504 .xfc_fill_bw_overhead_percent = 10.0, 505 .xfc_fill_constant_bytes = 0, 506 .ptoi_supported = 0, 507 .number_of_cursors = 1, 508}; 509 510struct _vcs_dpi_soc_bounding_box_st dcn2_1_soc = { 511 .clock_limits = { 512 { 513 .state = 0, 514 .dcfclk_mhz = 400.0, 515 .fabricclk_mhz = 400.0, 516 .dispclk_mhz = 600.0, 517 .dppclk_mhz = 400.00, 518 .phyclk_mhz = 600.0, 519 .socclk_mhz = 278.0, 520 .dscclk_mhz = 205.67, 521 .dram_speed_mts = 1600.0, 522 }, 523 { 524 .state = 1, 525 .dcfclk_mhz = 464.52, 526 .fabricclk_mhz = 800.0, 527 .dispclk_mhz = 654.55, 528 .dppclk_mhz = 626.09, 529 .phyclk_mhz = 600.0, 530 .socclk_mhz = 278.0, 531 .dscclk_mhz = 205.67, 532 .dram_speed_mts = 1600.0, 533 }, 534 { 535 .state = 2, 536 .dcfclk_mhz = 514.29, 537 .fabricclk_mhz = 933.0, 538 .dispclk_mhz = 757.89, 539 .dppclk_mhz = 685.71, 540 .phyclk_mhz = 600.0, 541 .socclk_mhz = 278.0, 542 .dscclk_mhz = 287.67, 543 .dram_speed_mts = 1866.0, 544 }, 545 { 546 .state = 3, 547 .dcfclk_mhz = 576.00, 548 .fabricclk_mhz = 1067.0, 549 .dispclk_mhz = 847.06, 550 .dppclk_mhz = 757.89, 551 .phyclk_mhz = 600.0, 552 .socclk_mhz = 715.0, 553 .dscclk_mhz = 318.334, 554 .dram_speed_mts = 2134.0, 555 }, 556 { 557 .state = 4, 558 .dcfclk_mhz = 626.09, 559 .fabricclk_mhz = 1200.0, 560 .dispclk_mhz = 900.00, 561 .dppclk_mhz = 847.06, 562 .phyclk_mhz = 810.0, 563 .socclk_mhz = 953.0, 564 .dscclk_mhz = 489.0, 565 .dram_speed_mts = 2400.0, 566 }, 567 { 568 .state = 5, 569 .dcfclk_mhz = 685.71, 570 .fabricclk_mhz = 1333.0, 571 .dispclk_mhz = 1028.57, 572 .dppclk_mhz = 960.00, 573 .phyclk_mhz = 810.0, 574 .socclk_mhz = 278.0, 575 .dscclk_mhz = 287.67, 576 .dram_speed_mts = 2666.0, 577 }, 578 { 579 .state = 6, 580 .dcfclk_mhz = 757.89, 581 .fabricclk_mhz = 1467.0, 582 .dispclk_mhz = 1107.69, 583 .dppclk_mhz = 1028.57, 584 .phyclk_mhz = 810.0, 585 .socclk_mhz = 715.0, 586 .dscclk_mhz = 318.334, 587 .dram_speed_mts = 3200.0, 588 }, 589 { 590 .state = 7, 591 .dcfclk_mhz = 847.06, 592 .fabricclk_mhz = 1600.0, 593 .dispclk_mhz = 1395.0, 594 .dppclk_mhz = 1285.00, 595 .phyclk_mhz = 1325.0, 596 .socclk_mhz = 953.0, 597 .dscclk_mhz = 489.0, 598 .dram_speed_mts = 4266.0, 599 }, 600 /*Extra state, no dispclk ramping*/ 601 { 602 .state = 8, 603 .dcfclk_mhz = 847.06, 604 .fabricclk_mhz = 1600.0, 605 .dispclk_mhz = 1395.0, 606 .dppclk_mhz = 1285.0, 607 .phyclk_mhz = 1325.0, 608 .socclk_mhz = 953.0, 609 .dscclk_mhz = 489.0, 610 .dram_speed_mts = 4266.0, 611 }, 612 613 }, 614 615 .sr_exit_time_us = 12.5, 616 .sr_enter_plus_exit_time_us = 17.0, 617 .urgent_latency_us = 4.0, 618 .urgent_latency_pixel_data_only_us = 4.0, 619 .urgent_latency_pixel_mixed_with_vm_data_us = 4.0, 620 .urgent_latency_vm_data_only_us = 4.0, 621 .urgent_out_of_order_return_per_channel_pixel_only_bytes = 4096, 622 .urgent_out_of_order_return_per_channel_pixel_and_vm_bytes = 4096, 623 .urgent_out_of_order_return_per_channel_vm_only_bytes = 4096, 624 .pct_ideal_dram_sdp_bw_after_urgent_pixel_only = 80.0, 625 .pct_ideal_dram_sdp_bw_after_urgent_pixel_and_vm = 75.0, 626 .pct_ideal_dram_sdp_bw_after_urgent_vm_only = 40.0, 627 .max_avg_sdp_bw_use_normal_percent = 60.0, 628 .max_avg_dram_bw_use_normal_percent = 100.0, 629 .writeback_latency_us = 12.0, 630 .max_request_size_bytes = 256, 631 .dram_channel_width_bytes = 4, 632 .fabric_datapath_to_dcn_data_return_bytes = 32, 633 .dcn_downspread_percent = 0.5, 634 .downspread_percent = 0.38, 635 .dram_page_open_time_ns = 50.0, 636 .dram_rw_turnaround_time_ns = 17.5, 637 .dram_return_buffer_per_channel_bytes = 8192, 638 .round_trip_ping_latency_dcfclk_cycles = 128, 639 .urgent_out_of_order_return_per_channel_bytes = 4096, 640 .channel_interleave_bytes = 256, 641 .num_banks = 8, 642 .num_chans = 4, 643 .vmm_page_size_bytes = 4096, 644 .dram_clock_change_latency_us = 23.84, 645 .return_bus_width_bytes = 64, 646 .dispclk_dppclk_vco_speed_mhz = 3600, 647 .xfc_bus_transport_time_us = 4, 648 .xfc_xbuf_latency_tolerance_us = 4, 649 .use_urgent_burst_bw = 1, 650 .num_states = 8 651}; 652 653void dcn20_populate_dml_writeback_from_context(struct dc *dc, 654 struct resource_context *res_ctx, 655 display_e2e_pipe_params_st *pipes) 656{ 657 int pipe_cnt, i; 658 659 dc_assert_fp_enabled(); 660 661 for (i = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) { 662 struct dc_writeback_info *wb_info = &res_ctx->pipe_ctx[i].stream->writeback_info[0]; 663 664 if (!res_ctx->pipe_ctx[i].stream) 665 continue; 666 667 /* Set writeback information */ 668 pipes[pipe_cnt].dout.wb_enable = (wb_info->wb_enabled == true) ? 1 : 0; 669 pipes[pipe_cnt].dout.num_active_wb++; 670 pipes[pipe_cnt].dout.wb.wb_src_height = wb_info->dwb_params.cnv_params.crop_height; 671 pipes[pipe_cnt].dout.wb.wb_src_width = wb_info->dwb_params.cnv_params.crop_width; 672 pipes[pipe_cnt].dout.wb.wb_dst_width = wb_info->dwb_params.dest_width; 673 pipes[pipe_cnt].dout.wb.wb_dst_height = wb_info->dwb_params.dest_height; 674 pipes[pipe_cnt].dout.wb.wb_htaps_luma = 1; 675 pipes[pipe_cnt].dout.wb.wb_vtaps_luma = 1; 676 pipes[pipe_cnt].dout.wb.wb_htaps_chroma = wb_info->dwb_params.scaler_taps.h_taps_c; 677 pipes[pipe_cnt].dout.wb.wb_vtaps_chroma = wb_info->dwb_params.scaler_taps.v_taps_c; 678 pipes[pipe_cnt].dout.wb.wb_hratio = 1.0; 679 pipes[pipe_cnt].dout.wb.wb_vratio = 1.0; 680 if (wb_info->dwb_params.out_format == dwb_scaler_mode_yuv420) { 681 if (wb_info->dwb_params.output_depth == DWB_OUTPUT_PIXEL_DEPTH_8BPC) 682 pipes[pipe_cnt].dout.wb.wb_pixel_format = dm_420_8; 683 else 684 pipes[pipe_cnt].dout.wb.wb_pixel_format = dm_420_10; 685 } else { 686 pipes[pipe_cnt].dout.wb.wb_pixel_format = dm_444_32; 687 } 688 689 pipe_cnt++; 690 } 691} 692 693void dcn20_fpu_set_wb_arb_params(struct mcif_arb_params *wb_arb_params, 694 struct dc_state *context, 695 display_e2e_pipe_params_st *pipes, 696 int pipe_cnt, int i) 697{ 698 int k; 699 700 dc_assert_fp_enabled(); 701 702 for (k = 0; k < sizeof(wb_arb_params->cli_watermark)/sizeof(wb_arb_params->cli_watermark[0]); k++) { 703 wb_arb_params->cli_watermark[k] = get_wm_writeback_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 704 wb_arb_params->pstate_watermark[k] = get_wm_writeback_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 705 } 706 wb_arb_params->time_per_pixel = 16.0 * 1000 / (context->res_ctx.pipe_ctx[i].stream->phy_pix_clk / 1000); /* 4 bit fraction, ms */ 707} 708 709static bool is_dtbclk_required(struct dc *dc, struct dc_state *context) 710{ 711 int i; 712 for (i = 0; i < dc->res_pool->pipe_count; i++) { 713 if (!context->res_ctx.pipe_ctx[i].stream) 714 continue; 715 if (is_dp_128b_132b_signal(&context->res_ctx.pipe_ctx[i])) 716 return true; 717 } 718 return false; 719} 720 721static enum dcn_zstate_support_state decide_zstate_support(struct dc *dc, struct dc_state *context) 722{ 723 int plane_count; 724 int i; 725 unsigned int optimized_min_dst_y_next_start_us; 726 727 plane_count = 0; 728 optimized_min_dst_y_next_start_us = 0; 729 for (i = 0; i < dc->res_pool->pipe_count; i++) { 730 if (context->res_ctx.pipe_ctx[i].plane_state) 731 plane_count++; 732 } 733 734 /* 735 * Z9 and Z10 allowed cases: 736 * 1. 0 Planes enabled 737 * 2. single eDP, on link 0, 1 plane and stutter period > 5ms 738 * Z10 only cases: 739 * 1. single eDP, on link 0, 1 plane and stutter period >= 5ms 740 * Zstate not allowed cases: 741 * 1. Everything else 742 */ 743 if (plane_count == 0) 744 return DCN_ZSTATE_SUPPORT_ALLOW; 745 else if (context->stream_count == 1 && context->streams[0]->signal == SIGNAL_TYPE_EDP) { 746 struct dc_link *link = context->streams[0]->sink->link; 747 struct dc_stream_status *stream_status = &context->stream_status[0]; 748 749 if (dc_extended_blank_supported(dc)) { 750 for (i = 0; i < dc->res_pool->pipe_count; i++) { 751 if (context->res_ctx.pipe_ctx[i].stream == context->streams[0] 752 && context->res_ctx.pipe_ctx[i].stream->adjust.v_total_min == context->res_ctx.pipe_ctx[i].stream->adjust.v_total_max 753 && context->res_ctx.pipe_ctx[i].stream->adjust.v_total_min > context->res_ctx.pipe_ctx[i].stream->timing.v_total) { 754 optimized_min_dst_y_next_start_us = 755 context->res_ctx.pipe_ctx[i].dlg_regs.optimized_min_dst_y_next_start_us; 756 break; 757 } 758 } 759 } 760 /* zstate only supported on PWRSEQ0 and when there's <2 planes*/ 761 if (link->link_index != 0 || stream_status->plane_count > 1) 762 return DCN_ZSTATE_SUPPORT_DISALLOW; 763 764 if (context->bw_ctx.dml.vba.StutterPeriod > 5000.0 || optimized_min_dst_y_next_start_us > 5000) 765 return DCN_ZSTATE_SUPPORT_ALLOW; 766 else if (link->psr_settings.psr_version == DC_PSR_VERSION_1 && !dc->debug.disable_psr) 767 return DCN_ZSTATE_SUPPORT_ALLOW_Z10_ONLY; 768 else 769 return DCN_ZSTATE_SUPPORT_DISALLOW; 770 } else 771 return DCN_ZSTATE_SUPPORT_DISALLOW; 772} 773 774void dcn20_calculate_dlg_params( 775 struct dc *dc, struct dc_state *context, 776 display_e2e_pipe_params_st *pipes, 777 int pipe_cnt, 778 int vlevel) 779{ 780 int i, pipe_idx; 781 782 dc_assert_fp_enabled(); 783 784 /* Writeback MCIF_WB arbitration parameters */ 785 dc->res_pool->funcs->set_mcif_arb_params(dc, context, pipes, pipe_cnt); 786 787 context->bw_ctx.bw.dcn.clk.dispclk_khz = context->bw_ctx.dml.vba.DISPCLK * 1000; 788 context->bw_ctx.bw.dcn.clk.dcfclk_khz = context->bw_ctx.dml.vba.DCFCLK * 1000; 789 context->bw_ctx.bw.dcn.clk.socclk_khz = context->bw_ctx.dml.vba.SOCCLK * 1000; 790 context->bw_ctx.bw.dcn.clk.dramclk_khz = context->bw_ctx.dml.vba.DRAMSpeed * 1000 / 16; 791 792 if (dc->debug.min_dram_clk_khz > context->bw_ctx.bw.dcn.clk.dramclk_khz) 793 context->bw_ctx.bw.dcn.clk.dramclk_khz = dc->debug.min_dram_clk_khz; 794 795 context->bw_ctx.bw.dcn.clk.dcfclk_deep_sleep_khz = context->bw_ctx.dml.vba.DCFCLKDeepSleep * 1000; 796 context->bw_ctx.bw.dcn.clk.fclk_khz = context->bw_ctx.dml.vba.FabricClock * 1000; 797 context->bw_ctx.bw.dcn.clk.p_state_change_support = 798 context->bw_ctx.dml.vba.DRAMClockChangeSupport[vlevel][context->bw_ctx.dml.vba.maxMpcComb] 799 != dm_dram_clock_change_unsupported; 800 context->bw_ctx.bw.dcn.clk.dppclk_khz = 0; 801 802 context->bw_ctx.bw.dcn.clk.dtbclk_en = is_dtbclk_required(dc, context); 803 804 if (context->bw_ctx.bw.dcn.clk.dispclk_khz < dc->debug.min_disp_clk_khz) 805 context->bw_ctx.bw.dcn.clk.dispclk_khz = dc->debug.min_disp_clk_khz; 806 807 for (i = 0, pipe_idx = 0; i < dc->res_pool->pipe_count; i++) { 808 if (!context->res_ctx.pipe_ctx[i].stream) 809 continue; 810 pipes[pipe_idx].pipe.dest.vstartup_start = get_vstartup(&context->bw_ctx.dml, pipes, pipe_cnt, pipe_idx); 811 pipes[pipe_idx].pipe.dest.vupdate_offset = get_vupdate_offset(&context->bw_ctx.dml, pipes, pipe_cnt, pipe_idx); 812 pipes[pipe_idx].pipe.dest.vupdate_width = get_vupdate_width(&context->bw_ctx.dml, pipes, pipe_cnt, pipe_idx); 813 pipes[pipe_idx].pipe.dest.vready_offset = get_vready_offset(&context->bw_ctx.dml, pipes, pipe_cnt, pipe_idx); 814 context->res_ctx.pipe_ctx[i].det_buffer_size_kb = context->bw_ctx.dml.ip.det_buffer_size_kbytes; 815 context->res_ctx.pipe_ctx[i].unbounded_req = pipes[pipe_idx].pipe.src.unbounded_req_mode; 816 817 if (context->bw_ctx.bw.dcn.clk.dppclk_khz < pipes[pipe_idx].clks_cfg.dppclk_mhz * 1000) 818 context->bw_ctx.bw.dcn.clk.dppclk_khz = pipes[pipe_idx].clks_cfg.dppclk_mhz * 1000; 819 context->res_ctx.pipe_ctx[i].plane_res.bw.dppclk_khz = 820 pipes[pipe_idx].clks_cfg.dppclk_mhz * 1000; 821 context->res_ctx.pipe_ctx[i].pipe_dlg_param = pipes[pipe_idx].pipe.dest; 822 pipe_idx++; 823 } 824 /*save a original dppclock copy*/ 825 context->bw_ctx.bw.dcn.clk.bw_dppclk_khz = context->bw_ctx.bw.dcn.clk.dppclk_khz; 826 context->bw_ctx.bw.dcn.clk.bw_dispclk_khz = context->bw_ctx.bw.dcn.clk.dispclk_khz; 827 context->bw_ctx.bw.dcn.clk.max_supported_dppclk_khz = context->bw_ctx.dml.soc.clock_limits[vlevel].dppclk_mhz * 1000; 828 context->bw_ctx.bw.dcn.clk.max_supported_dispclk_khz = context->bw_ctx.dml.soc.clock_limits[vlevel].dispclk_mhz * 1000; 829 830 context->bw_ctx.bw.dcn.compbuf_size_kb = context->bw_ctx.dml.ip.config_return_buffer_size_in_kbytes 831 - context->bw_ctx.dml.ip.det_buffer_size_kbytes * pipe_idx; 832 833 for (i = 0, pipe_idx = 0; i < dc->res_pool->pipe_count; i++) { 834 bool cstate_en = context->bw_ctx.dml.vba.PrefetchMode[vlevel][context->bw_ctx.dml.vba.maxMpcComb] != 2; 835 836 if (!context->res_ctx.pipe_ctx[i].stream) 837 continue; 838 839 if (dc->ctx->dce_version == DCN_VERSION_2_01) 840 cstate_en = false; 841 842 context->bw_ctx.dml.funcs.rq_dlg_get_dlg_reg(&context->bw_ctx.dml, 843 &context->res_ctx.pipe_ctx[i].dlg_regs, 844 &context->res_ctx.pipe_ctx[i].ttu_regs, 845 pipes, 846 pipe_cnt, 847 pipe_idx, 848 cstate_en, 849 context->bw_ctx.bw.dcn.clk.p_state_change_support, 850 false, false, true); 851 852 context->bw_ctx.dml.funcs.rq_dlg_get_rq_reg(&context->bw_ctx.dml, 853 &context->res_ctx.pipe_ctx[i].rq_regs, 854 &pipes[pipe_idx].pipe); 855 pipe_idx++; 856 } 857 context->bw_ctx.bw.dcn.clk.zstate_support = decide_zstate_support(dc, context); 858} 859 860static void swizzle_to_dml_params( 861 enum swizzle_mode_values swizzle, 862 unsigned int *sw_mode) 863{ 864 switch (swizzle) { 865 case DC_SW_LINEAR: 866 *sw_mode = dm_sw_linear; 867 break; 868 case DC_SW_4KB_S: 869 *sw_mode = dm_sw_4kb_s; 870 break; 871 case DC_SW_4KB_S_X: 872 *sw_mode = dm_sw_4kb_s_x; 873 break; 874 case DC_SW_4KB_D: 875 *sw_mode = dm_sw_4kb_d; 876 break; 877 case DC_SW_4KB_D_X: 878 *sw_mode = dm_sw_4kb_d_x; 879 break; 880 case DC_SW_64KB_S: 881 *sw_mode = dm_sw_64kb_s; 882 break; 883 case DC_SW_64KB_S_X: 884 *sw_mode = dm_sw_64kb_s_x; 885 break; 886 case DC_SW_64KB_S_T: 887 *sw_mode = dm_sw_64kb_s_t; 888 break; 889 case DC_SW_64KB_D: 890 *sw_mode = dm_sw_64kb_d; 891 break; 892 case DC_SW_64KB_D_X: 893 *sw_mode = dm_sw_64kb_d_x; 894 break; 895 case DC_SW_64KB_D_T: 896 *sw_mode = dm_sw_64kb_d_t; 897 break; 898 case DC_SW_64KB_R_X: 899 *sw_mode = dm_sw_64kb_r_x; 900 break; 901 case DC_SW_VAR_S: 902 *sw_mode = dm_sw_var_s; 903 break; 904 case DC_SW_VAR_S_X: 905 *sw_mode = dm_sw_var_s_x; 906 break; 907 case DC_SW_VAR_D: 908 *sw_mode = dm_sw_var_d; 909 break; 910 case DC_SW_VAR_D_X: 911 *sw_mode = dm_sw_var_d_x; 912 break; 913 case DC_SW_VAR_R_X: 914 *sw_mode = dm_sw_var_r_x; 915 break; 916 default: 917 ASSERT(0); /* Not supported */ 918 break; 919 } 920} 921 922int dcn20_populate_dml_pipes_from_context( 923 struct dc *dc, 924 struct dc_state *context, 925 display_e2e_pipe_params_st *pipes, 926 bool fast_validate) 927{ 928 int pipe_cnt, i; 929 bool synchronized_vblank = true; 930 struct resource_context *res_ctx = &context->res_ctx; 931 932 dc_assert_fp_enabled(); 933 934 for (i = 0, pipe_cnt = -1; i < dc->res_pool->pipe_count; i++) { 935 if (!res_ctx->pipe_ctx[i].stream) 936 continue; 937 938 if (pipe_cnt < 0) { 939 pipe_cnt = i; 940 continue; 941 } 942 943 if (res_ctx->pipe_ctx[pipe_cnt].stream == res_ctx->pipe_ctx[i].stream) 944 continue; 945 946 if (dc->debug.disable_timing_sync || 947 (!resource_are_streams_timing_synchronizable( 948 res_ctx->pipe_ctx[pipe_cnt].stream, 949 res_ctx->pipe_ctx[i].stream) && 950 !resource_are_vblanks_synchronizable( 951 res_ctx->pipe_ctx[pipe_cnt].stream, 952 res_ctx->pipe_ctx[i].stream))) { 953 synchronized_vblank = false; 954 break; 955 } 956 } 957 958 for (i = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) { 959 struct dc_crtc_timing *timing = &res_ctx->pipe_ctx[i].stream->timing; 960 unsigned int v_total; 961 unsigned int front_porch; 962 int output_bpc; 963 struct audio_check aud_check = {0}; 964 965 if (!res_ctx->pipe_ctx[i].stream) 966 continue; 967 968 v_total = timing->v_total; 969 front_porch = timing->v_front_porch; 970 971 /* todo: 972 pipes[pipe_cnt].pipe.src.dynamic_metadata_enable = 0; 973 pipes[pipe_cnt].pipe.src.dcc = 0; 974 pipes[pipe_cnt].pipe.src.vm = 0;*/ 975 976 pipes[pipe_cnt].clks_cfg.refclk_mhz = dc->res_pool->ref_clocks.dchub_ref_clock_inKhz / 1000.0; 977 978 pipes[pipe_cnt].dout.dsc_enable = res_ctx->pipe_ctx[i].stream->timing.flags.DSC; 979 /* todo: rotation?*/ 980 pipes[pipe_cnt].dout.dsc_slices = res_ctx->pipe_ctx[i].stream->timing.dsc_cfg.num_slices_h; 981 if (res_ctx->pipe_ctx[i].stream->use_dynamic_meta) { 982 pipes[pipe_cnt].pipe.src.dynamic_metadata_enable = true; 983 /* 1/2 vblank */ 984 pipes[pipe_cnt].pipe.src.dynamic_metadata_lines_before_active = 985 (v_total - timing->v_addressable 986 - timing->v_border_top - timing->v_border_bottom) / 2; 987 /* 36 bytes dp, 32 hdmi */ 988 pipes[pipe_cnt].pipe.src.dynamic_metadata_xmit_bytes = 989 dc_is_dp_signal(res_ctx->pipe_ctx[i].stream->signal) ? 36 : 32; 990 } 991 pipes[pipe_cnt].pipe.src.dcc = false; 992 pipes[pipe_cnt].pipe.src.dcc_rate = 1; 993 pipes[pipe_cnt].pipe.dest.synchronized_vblank_all_planes = synchronized_vblank; 994 pipes[pipe_cnt].pipe.dest.hblank_start = timing->h_total - timing->h_front_porch; 995 pipes[pipe_cnt].pipe.dest.hblank_end = pipes[pipe_cnt].pipe.dest.hblank_start 996 - timing->h_addressable 997 - timing->h_border_left 998 - timing->h_border_right; 999 pipes[pipe_cnt].pipe.dest.vblank_start = v_total - front_porch; 1000 pipes[pipe_cnt].pipe.dest.vblank_end = pipes[pipe_cnt].pipe.dest.vblank_start 1001 - timing->v_addressable 1002 - timing->v_border_top 1003 - timing->v_border_bottom; 1004 pipes[pipe_cnt].pipe.dest.htotal = timing->h_total; 1005 pipes[pipe_cnt].pipe.dest.vtotal = v_total; 1006 pipes[pipe_cnt].pipe.dest.hactive = 1007 timing->h_addressable + timing->h_border_left + timing->h_border_right; 1008 pipes[pipe_cnt].pipe.dest.vactive = 1009 timing->v_addressable + timing->v_border_top + timing->v_border_bottom; 1010 pipes[pipe_cnt].pipe.dest.interlaced = timing->flags.INTERLACE; 1011 pipes[pipe_cnt].pipe.dest.pixel_rate_mhz = timing->pix_clk_100hz/10000.0; 1012 if (timing->timing_3d_format == TIMING_3D_FORMAT_HW_FRAME_PACKING) 1013 pipes[pipe_cnt].pipe.dest.pixel_rate_mhz *= 2; 1014 pipes[pipe_cnt].pipe.dest.otg_inst = res_ctx->pipe_ctx[i].stream_res.tg->inst; 1015 pipes[pipe_cnt].dout.dp_lanes = 4; 1016 pipes[pipe_cnt].dout.is_virtual = 0; 1017 pipes[pipe_cnt].pipe.dest.vtotal_min = res_ctx->pipe_ctx[i].stream->adjust.v_total_min; 1018 pipes[pipe_cnt].pipe.dest.vtotal_max = res_ctx->pipe_ctx[i].stream->adjust.v_total_max; 1019 switch (get_num_odm_splits(&res_ctx->pipe_ctx[i])) { 1020 case 1: 1021 pipes[pipe_cnt].pipe.dest.odm_combine = dm_odm_combine_mode_2to1; 1022 break; 1023 case 3: 1024 pipes[pipe_cnt].pipe.dest.odm_combine = dm_odm_combine_mode_4to1; 1025 break; 1026 default: 1027 pipes[pipe_cnt].pipe.dest.odm_combine = dm_odm_combine_mode_disabled; 1028 } 1029 pipes[pipe_cnt].pipe.src.hsplit_grp = res_ctx->pipe_ctx[i].pipe_idx; 1030 if (res_ctx->pipe_ctx[i].top_pipe && res_ctx->pipe_ctx[i].top_pipe->plane_state 1031 == res_ctx->pipe_ctx[i].plane_state) { 1032 struct pipe_ctx *first_pipe = res_ctx->pipe_ctx[i].top_pipe; 1033 int split_idx = 0; 1034 1035 while (first_pipe->top_pipe && first_pipe->top_pipe->plane_state 1036 == res_ctx->pipe_ctx[i].plane_state) { 1037 first_pipe = first_pipe->top_pipe; 1038 split_idx++; 1039 } 1040 /* Treat 4to1 mpc combine as an mpo of 2 2-to-1 combines */ 1041 if (split_idx == 0) 1042 pipes[pipe_cnt].pipe.src.hsplit_grp = first_pipe->pipe_idx; 1043 else if (split_idx == 1) 1044 pipes[pipe_cnt].pipe.src.hsplit_grp = res_ctx->pipe_ctx[i].pipe_idx; 1045 else if (split_idx == 2) 1046 pipes[pipe_cnt].pipe.src.hsplit_grp = res_ctx->pipe_ctx[i].top_pipe->pipe_idx; 1047 } else if (res_ctx->pipe_ctx[i].prev_odm_pipe) { 1048 struct pipe_ctx *first_pipe = res_ctx->pipe_ctx[i].prev_odm_pipe; 1049 1050 while (first_pipe->prev_odm_pipe) 1051 first_pipe = first_pipe->prev_odm_pipe; 1052 pipes[pipe_cnt].pipe.src.hsplit_grp = first_pipe->pipe_idx; 1053 } 1054 1055 switch (res_ctx->pipe_ctx[i].stream->signal) { 1056 case SIGNAL_TYPE_DISPLAY_PORT_MST: 1057 case SIGNAL_TYPE_DISPLAY_PORT: 1058 pipes[pipe_cnt].dout.output_type = dm_dp; 1059 break; 1060 case SIGNAL_TYPE_EDP: 1061 pipes[pipe_cnt].dout.output_type = dm_edp; 1062 break; 1063 case SIGNAL_TYPE_HDMI_TYPE_A: 1064 case SIGNAL_TYPE_DVI_SINGLE_LINK: 1065 case SIGNAL_TYPE_DVI_DUAL_LINK: 1066 pipes[pipe_cnt].dout.output_type = dm_hdmi; 1067 break; 1068 default: 1069 /* In case there is no signal, set dp with 4 lanes to allow max config */ 1070 pipes[pipe_cnt].dout.is_virtual = 1; 1071 pipes[pipe_cnt].dout.output_type = dm_dp; 1072 pipes[pipe_cnt].dout.dp_lanes = 4; 1073 } 1074 1075 switch (res_ctx->pipe_ctx[i].stream->timing.display_color_depth) { 1076 case COLOR_DEPTH_666: 1077 output_bpc = 6; 1078 break; 1079 case COLOR_DEPTH_888: 1080 output_bpc = 8; 1081 break; 1082 case COLOR_DEPTH_101010: 1083 output_bpc = 10; 1084 break; 1085 case COLOR_DEPTH_121212: 1086 output_bpc = 12; 1087 break; 1088 case COLOR_DEPTH_141414: 1089 output_bpc = 14; 1090 break; 1091 case COLOR_DEPTH_161616: 1092 output_bpc = 16; 1093 break; 1094 case COLOR_DEPTH_999: 1095 output_bpc = 9; 1096 break; 1097 case COLOR_DEPTH_111111: 1098 output_bpc = 11; 1099 break; 1100 default: 1101 output_bpc = 8; 1102 break; 1103 } 1104 1105 switch (res_ctx->pipe_ctx[i].stream->timing.pixel_encoding) { 1106 case PIXEL_ENCODING_RGB: 1107 case PIXEL_ENCODING_YCBCR444: 1108 pipes[pipe_cnt].dout.output_format = dm_444; 1109 pipes[pipe_cnt].dout.output_bpp = output_bpc * 3; 1110 break; 1111 case PIXEL_ENCODING_YCBCR420: 1112 pipes[pipe_cnt].dout.output_format = dm_420; 1113 pipes[pipe_cnt].dout.output_bpp = (output_bpc * 3.0) / 2; 1114 break; 1115 case PIXEL_ENCODING_YCBCR422: 1116 if (res_ctx->pipe_ctx[i].stream->timing.flags.DSC && 1117 !res_ctx->pipe_ctx[i].stream->timing.dsc_cfg.ycbcr422_simple) 1118 pipes[pipe_cnt].dout.output_format = dm_n422; 1119 else 1120 pipes[pipe_cnt].dout.output_format = dm_s422; 1121 pipes[pipe_cnt].dout.output_bpp = output_bpc * 2; 1122 break; 1123 default: 1124 pipes[pipe_cnt].dout.output_format = dm_444; 1125 pipes[pipe_cnt].dout.output_bpp = output_bpc * 3; 1126 } 1127 1128 if (res_ctx->pipe_ctx[i].stream->timing.flags.DSC) 1129 pipes[pipe_cnt].dout.output_bpp = res_ctx->pipe_ctx[i].stream->timing.dsc_cfg.bits_per_pixel / 16.0; 1130 1131 /* todo: default max for now, until there is logic reflecting this in dc*/ 1132 pipes[pipe_cnt].dout.dsc_input_bpc = 12; 1133 /*fill up the audio sample rate (unit in kHz)*/ 1134 get_audio_check(&res_ctx->pipe_ctx[i].stream->audio_info, &aud_check); 1135 pipes[pipe_cnt].dout.max_audio_sample_rate = aud_check.max_audiosample_rate / 1000; 1136 /* 1137 * For graphic plane, cursor number is 1, nv12 is 0 1138 * bw calculations due to cursor on/off 1139 */ 1140 if (res_ctx->pipe_ctx[i].plane_state && 1141 res_ctx->pipe_ctx[i].plane_state->address.type == PLN_ADDR_TYPE_VIDEO_PROGRESSIVE) 1142 pipes[pipe_cnt].pipe.src.num_cursors = 0; 1143 else 1144 pipes[pipe_cnt].pipe.src.num_cursors = dc->dml.ip.number_of_cursors; 1145 1146 pipes[pipe_cnt].pipe.src.cur0_src_width = 256; 1147 pipes[pipe_cnt].pipe.src.cur0_bpp = dm_cur_32bit; 1148 1149 if (!res_ctx->pipe_ctx[i].plane_state) { 1150 pipes[pipe_cnt].pipe.src.is_hsplit = pipes[pipe_cnt].pipe.dest.odm_combine != dm_odm_combine_mode_disabled; 1151 pipes[pipe_cnt].pipe.src.source_scan = dm_horz; 1152 pipes[pipe_cnt].pipe.src.sw_mode = dm_sw_4kb_s; 1153 pipes[pipe_cnt].pipe.src.macro_tile_size = dm_64k_tile; 1154 pipes[pipe_cnt].pipe.src.viewport_width = timing->h_addressable; 1155 if (pipes[pipe_cnt].pipe.src.viewport_width > 1920) 1156 pipes[pipe_cnt].pipe.src.viewport_width = 1920; 1157 pipes[pipe_cnt].pipe.src.viewport_height = timing->v_addressable; 1158 if (pipes[pipe_cnt].pipe.src.viewport_height > 1080) 1159 pipes[pipe_cnt].pipe.src.viewport_height = 1080; 1160 pipes[pipe_cnt].pipe.src.surface_height_y = pipes[pipe_cnt].pipe.src.viewport_height; 1161 pipes[pipe_cnt].pipe.src.surface_width_y = pipes[pipe_cnt].pipe.src.viewport_width; 1162 pipes[pipe_cnt].pipe.src.surface_height_c = pipes[pipe_cnt].pipe.src.viewport_height; 1163 pipes[pipe_cnt].pipe.src.surface_width_c = pipes[pipe_cnt].pipe.src.viewport_width; 1164 pipes[pipe_cnt].pipe.src.data_pitch = ((pipes[pipe_cnt].pipe.src.viewport_width + 255) / 256) * 256; 1165 pipes[pipe_cnt].pipe.src.source_format = dm_444_32; 1166 pipes[pipe_cnt].pipe.dest.recout_width = pipes[pipe_cnt].pipe.src.viewport_width; /*vp_width/hratio*/ 1167 pipes[pipe_cnt].pipe.dest.recout_height = pipes[pipe_cnt].pipe.src.viewport_height; /*vp_height/vratio*/ 1168 pipes[pipe_cnt].pipe.dest.full_recout_width = pipes[pipe_cnt].pipe.dest.recout_width; /*when is_hsplit != 1*/ 1169 pipes[pipe_cnt].pipe.dest.full_recout_height = pipes[pipe_cnt].pipe.dest.recout_height; /*when is_hsplit != 1*/ 1170 pipes[pipe_cnt].pipe.scale_ratio_depth.lb_depth = dm_lb_16; 1171 pipes[pipe_cnt].pipe.scale_ratio_depth.hscl_ratio = 1.0; 1172 pipes[pipe_cnt].pipe.scale_ratio_depth.vscl_ratio = 1.0; 1173 pipes[pipe_cnt].pipe.scale_ratio_depth.scl_enable = 0; /*Lb only or Full scl*/ 1174 pipes[pipe_cnt].pipe.scale_taps.htaps = 1; 1175 pipes[pipe_cnt].pipe.scale_taps.vtaps = 1; 1176 pipes[pipe_cnt].pipe.dest.vtotal_min = v_total; 1177 pipes[pipe_cnt].pipe.dest.vtotal_max = v_total; 1178 1179 if (pipes[pipe_cnt].pipe.dest.odm_combine == dm_odm_combine_mode_2to1) { 1180 pipes[pipe_cnt].pipe.src.viewport_width /= 2; 1181 pipes[pipe_cnt].pipe.dest.recout_width /= 2; 1182 } else if (pipes[pipe_cnt].pipe.dest.odm_combine == dm_odm_combine_mode_4to1) { 1183 pipes[pipe_cnt].pipe.src.viewport_width /= 4; 1184 pipes[pipe_cnt].pipe.dest.recout_width /= 4; 1185 } 1186 } else { 1187 struct dc_plane_state *pln = res_ctx->pipe_ctx[i].plane_state; 1188 struct scaler_data *scl = &res_ctx->pipe_ctx[i].plane_res.scl_data; 1189 1190 pipes[pipe_cnt].pipe.src.immediate_flip = pln->flip_immediate; 1191 pipes[pipe_cnt].pipe.src.is_hsplit = (res_ctx->pipe_ctx[i].bottom_pipe && res_ctx->pipe_ctx[i].bottom_pipe->plane_state == pln) 1192 || (res_ctx->pipe_ctx[i].top_pipe && res_ctx->pipe_ctx[i].top_pipe->plane_state == pln) 1193 || pipes[pipe_cnt].pipe.dest.odm_combine != dm_odm_combine_mode_disabled; 1194 1195 /* stereo is not split */ 1196 if (pln->stereo_format == PLANE_STEREO_FORMAT_SIDE_BY_SIDE || 1197 pln->stereo_format == PLANE_STEREO_FORMAT_TOP_AND_BOTTOM) { 1198 pipes[pipe_cnt].pipe.src.is_hsplit = false; 1199 pipes[pipe_cnt].pipe.src.hsplit_grp = res_ctx->pipe_ctx[i].pipe_idx; 1200 } 1201 1202 pipes[pipe_cnt].pipe.src.source_scan = pln->rotation == ROTATION_ANGLE_90 1203 || pln->rotation == ROTATION_ANGLE_270 ? dm_vert : dm_horz; 1204 pipes[pipe_cnt].pipe.src.viewport_y_y = scl->viewport.y; 1205 pipes[pipe_cnt].pipe.src.viewport_y_c = scl->viewport_c.y; 1206 pipes[pipe_cnt].pipe.src.viewport_width = scl->viewport.width; 1207 pipes[pipe_cnt].pipe.src.viewport_width_c = scl->viewport_c.width; 1208 pipes[pipe_cnt].pipe.src.viewport_height = scl->viewport.height; 1209 pipes[pipe_cnt].pipe.src.viewport_height_c = scl->viewport_c.height; 1210 pipes[pipe_cnt].pipe.src.viewport_width_max = pln->src_rect.width; 1211 pipes[pipe_cnt].pipe.src.viewport_height_max = pln->src_rect.height; 1212 pipes[pipe_cnt].pipe.src.surface_width_y = pln->plane_size.surface_size.width; 1213 pipes[pipe_cnt].pipe.src.surface_height_y = pln->plane_size.surface_size.height; 1214 pipes[pipe_cnt].pipe.src.surface_width_c = pln->plane_size.chroma_size.width; 1215 pipes[pipe_cnt].pipe.src.surface_height_c = pln->plane_size.chroma_size.height; 1216 if (pln->format == SURFACE_PIXEL_FORMAT_GRPH_RGBE_ALPHA 1217 || pln->format >= SURFACE_PIXEL_FORMAT_VIDEO_BEGIN) { 1218 pipes[pipe_cnt].pipe.src.data_pitch = pln->plane_size.surface_pitch; 1219 pipes[pipe_cnt].pipe.src.data_pitch_c = pln->plane_size.chroma_pitch; 1220 pipes[pipe_cnt].pipe.src.meta_pitch = pln->dcc.meta_pitch; 1221 pipes[pipe_cnt].pipe.src.meta_pitch_c = pln->dcc.meta_pitch_c; 1222 } else { 1223 pipes[pipe_cnt].pipe.src.data_pitch = pln->plane_size.surface_pitch; 1224 pipes[pipe_cnt].pipe.src.meta_pitch = pln->dcc.meta_pitch; 1225 } 1226 pipes[pipe_cnt].pipe.src.dcc = pln->dcc.enable; 1227 pipes[pipe_cnt].pipe.dest.recout_width = scl->recout.width; 1228 pipes[pipe_cnt].pipe.dest.recout_height = scl->recout.height; 1229 pipes[pipe_cnt].pipe.dest.full_recout_height = scl->recout.height; 1230 pipes[pipe_cnt].pipe.dest.full_recout_width = scl->recout.width; 1231 if (pipes[pipe_cnt].pipe.dest.odm_combine == dm_odm_combine_mode_2to1) 1232 pipes[pipe_cnt].pipe.dest.full_recout_width *= 2; 1233 else if (pipes[pipe_cnt].pipe.dest.odm_combine == dm_odm_combine_mode_4to1) 1234 pipes[pipe_cnt].pipe.dest.full_recout_width *= 4; 1235 else { 1236 struct pipe_ctx *split_pipe = res_ctx->pipe_ctx[i].bottom_pipe; 1237 1238 while (split_pipe && split_pipe->plane_state == pln) { 1239 pipes[pipe_cnt].pipe.dest.full_recout_width += split_pipe->plane_res.scl_data.recout.width; 1240 split_pipe = split_pipe->bottom_pipe; 1241 } 1242 split_pipe = res_ctx->pipe_ctx[i].top_pipe; 1243 while (split_pipe && split_pipe->plane_state == pln) { 1244 pipes[pipe_cnt].pipe.dest.full_recout_width += split_pipe->plane_res.scl_data.recout.width; 1245 split_pipe = split_pipe->top_pipe; 1246 } 1247 } 1248 1249 pipes[pipe_cnt].pipe.scale_ratio_depth.lb_depth = dm_lb_16; 1250 pipes[pipe_cnt].pipe.scale_ratio_depth.hscl_ratio = (double) scl->ratios.horz.value / (1ULL<<32); 1251 pipes[pipe_cnt].pipe.scale_ratio_depth.hscl_ratio_c = (double) scl->ratios.horz_c.value / (1ULL<<32); 1252 pipes[pipe_cnt].pipe.scale_ratio_depth.vscl_ratio = (double) scl->ratios.vert.value / (1ULL<<32); 1253 pipes[pipe_cnt].pipe.scale_ratio_depth.vscl_ratio_c = (double) scl->ratios.vert_c.value / (1ULL<<32); 1254 pipes[pipe_cnt].pipe.scale_ratio_depth.scl_enable = 1255 scl->ratios.vert.value != dc_fixpt_one.value 1256 || scl->ratios.horz.value != dc_fixpt_one.value 1257 || scl->ratios.vert_c.value != dc_fixpt_one.value 1258 || scl->ratios.horz_c.value != dc_fixpt_one.value /*Lb only or Full scl*/ 1259 || dc->debug.always_scale; /*support always scale*/ 1260 pipes[pipe_cnt].pipe.scale_taps.htaps = scl->taps.h_taps; 1261 pipes[pipe_cnt].pipe.scale_taps.htaps_c = scl->taps.h_taps_c; 1262 pipes[pipe_cnt].pipe.scale_taps.vtaps = scl->taps.v_taps; 1263 pipes[pipe_cnt].pipe.scale_taps.vtaps_c = scl->taps.v_taps_c; 1264 1265 pipes[pipe_cnt].pipe.src.macro_tile_size = 1266 swizzle_mode_to_macro_tile_size(pln->tiling_info.gfx9.swizzle); 1267 swizzle_to_dml_params(pln->tiling_info.gfx9.swizzle, 1268 &pipes[pipe_cnt].pipe.src.sw_mode); 1269 1270 switch (pln->format) { 1271 case SURFACE_PIXEL_FORMAT_VIDEO_420_YCbCr: 1272 case SURFACE_PIXEL_FORMAT_VIDEO_420_YCrCb: 1273 pipes[pipe_cnt].pipe.src.source_format = dm_420_8; 1274 break; 1275 case SURFACE_PIXEL_FORMAT_VIDEO_420_10bpc_YCbCr: 1276 case SURFACE_PIXEL_FORMAT_VIDEO_420_10bpc_YCrCb: 1277 pipes[pipe_cnt].pipe.src.source_format = dm_420_10; 1278 break; 1279 case SURFACE_PIXEL_FORMAT_GRPH_ARGB16161616: 1280 case SURFACE_PIXEL_FORMAT_GRPH_ABGR16161616: 1281 case SURFACE_PIXEL_FORMAT_GRPH_ARGB16161616F: 1282 case SURFACE_PIXEL_FORMAT_GRPH_ABGR16161616F: 1283 pipes[pipe_cnt].pipe.src.source_format = dm_444_64; 1284 break; 1285 case SURFACE_PIXEL_FORMAT_GRPH_ARGB1555: 1286 case SURFACE_PIXEL_FORMAT_GRPH_RGB565: 1287 pipes[pipe_cnt].pipe.src.source_format = dm_444_16; 1288 break; 1289 case SURFACE_PIXEL_FORMAT_GRPH_PALETA_256_COLORS: 1290 pipes[pipe_cnt].pipe.src.source_format = dm_444_8; 1291 break; 1292 case SURFACE_PIXEL_FORMAT_GRPH_RGBE_ALPHA: 1293 pipes[pipe_cnt].pipe.src.source_format = dm_rgbe_alpha; 1294 break; 1295 default: 1296 pipes[pipe_cnt].pipe.src.source_format = dm_444_32; 1297 break; 1298 } 1299 } 1300 1301 pipe_cnt++; 1302 } 1303 1304 /* populate writeback information */ 1305 dc->res_pool->funcs->populate_dml_writeback_from_context(dc, res_ctx, pipes); 1306 1307 return pipe_cnt; 1308} 1309 1310void dcn20_calculate_wm( 1311 struct dc *dc, struct dc_state *context, 1312 display_e2e_pipe_params_st *pipes, 1313 int *out_pipe_cnt, 1314 int *pipe_split_from, 1315 int vlevel, 1316 bool fast_validate) 1317{ 1318 int pipe_cnt, i, pipe_idx; 1319 1320 dc_assert_fp_enabled(); 1321 1322 for (i = 0, pipe_idx = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) { 1323 if (!context->res_ctx.pipe_ctx[i].stream) 1324 continue; 1325 1326 pipes[pipe_cnt].clks_cfg.refclk_mhz = dc->res_pool->ref_clocks.dchub_ref_clock_inKhz / 1000.0; 1327 pipes[pipe_cnt].clks_cfg.dispclk_mhz = context->bw_ctx.dml.vba.RequiredDISPCLK[vlevel][context->bw_ctx.dml.vba.maxMpcComb]; 1328 1329 if (pipe_split_from[i] < 0) { 1330 pipes[pipe_cnt].clks_cfg.dppclk_mhz = 1331 context->bw_ctx.dml.vba.RequiredDPPCLK[vlevel][context->bw_ctx.dml.vba.maxMpcComb][pipe_idx]; 1332 if (context->bw_ctx.dml.vba.BlendingAndTiming[pipe_idx] == pipe_idx) 1333 pipes[pipe_cnt].pipe.dest.odm_combine = 1334 context->bw_ctx.dml.vba.ODMCombineEnabled[pipe_idx]; 1335 else 1336 pipes[pipe_cnt].pipe.dest.odm_combine = 0; 1337 pipe_idx++; 1338 } else { 1339 pipes[pipe_cnt].clks_cfg.dppclk_mhz = 1340 context->bw_ctx.dml.vba.RequiredDPPCLK[vlevel][context->bw_ctx.dml.vba.maxMpcComb][pipe_split_from[i]]; 1341 if (context->bw_ctx.dml.vba.BlendingAndTiming[pipe_split_from[i]] == pipe_split_from[i]) 1342 pipes[pipe_cnt].pipe.dest.odm_combine = 1343 context->bw_ctx.dml.vba.ODMCombineEnabled[pipe_split_from[i]]; 1344 else 1345 pipes[pipe_cnt].pipe.dest.odm_combine = 0; 1346 } 1347 1348 if (dc->config.forced_clocks) { 1349 pipes[pipe_cnt].clks_cfg.dispclk_mhz = context->bw_ctx.dml.soc.clock_limits[0].dispclk_mhz; 1350 pipes[pipe_cnt].clks_cfg.dppclk_mhz = context->bw_ctx.dml.soc.clock_limits[0].dppclk_mhz; 1351 } 1352 if (dc->debug.min_disp_clk_khz > pipes[pipe_cnt].clks_cfg.dispclk_mhz * 1000) 1353 pipes[pipe_cnt].clks_cfg.dispclk_mhz = dc->debug.min_disp_clk_khz / 1000.0; 1354 if (dc->debug.min_dpp_clk_khz > pipes[pipe_cnt].clks_cfg.dppclk_mhz * 1000) 1355 pipes[pipe_cnt].clks_cfg.dppclk_mhz = dc->debug.min_dpp_clk_khz / 1000.0; 1356 1357 pipe_cnt++; 1358 } 1359 1360 if (pipe_cnt != pipe_idx) { 1361 if (dc->res_pool->funcs->populate_dml_pipes) 1362 pipe_cnt = dc->res_pool->funcs->populate_dml_pipes(dc, 1363 context, pipes, fast_validate); 1364 else 1365 pipe_cnt = dcn20_populate_dml_pipes_from_context(dc, 1366 context, pipes, fast_validate); 1367 } 1368 1369 *out_pipe_cnt = pipe_cnt; 1370 1371 pipes[0].clks_cfg.voltage = vlevel; 1372 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[vlevel].dcfclk_mhz; 1373 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[vlevel].socclk_mhz; 1374 1375 /* only pipe 0 is read for voltage and dcf/soc clocks */ 1376 if (vlevel < 1) { 1377 pipes[0].clks_cfg.voltage = 1; 1378 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[1].dcfclk_mhz; 1379 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[1].socclk_mhz; 1380 } 1381 context->bw_ctx.bw.dcn.watermarks.b.urgent_ns = get_wm_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1382 context->bw_ctx.bw.dcn.watermarks.b.cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1383 context->bw_ctx.bw.dcn.watermarks.b.cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1384 context->bw_ctx.bw.dcn.watermarks.b.cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1385 context->bw_ctx.bw.dcn.watermarks.b.pte_meta_urgent_ns = get_wm_memory_trip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1386 context->bw_ctx.bw.dcn.watermarks.b.frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1387 context->bw_ctx.bw.dcn.watermarks.b.frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1388 context->bw_ctx.bw.dcn.watermarks.b.urgent_latency_ns = get_urgent_latency(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1389 1390 if (vlevel < 2) { 1391 pipes[0].clks_cfg.voltage = 2; 1392 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[2].dcfclk_mhz; 1393 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[2].socclk_mhz; 1394 } 1395 context->bw_ctx.bw.dcn.watermarks.c.urgent_ns = get_wm_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1396 context->bw_ctx.bw.dcn.watermarks.c.cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1397 context->bw_ctx.bw.dcn.watermarks.c.cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1398 context->bw_ctx.bw.dcn.watermarks.c.cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1399 context->bw_ctx.bw.dcn.watermarks.c.pte_meta_urgent_ns = get_wm_memory_trip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1400 context->bw_ctx.bw.dcn.watermarks.c.frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1401 context->bw_ctx.bw.dcn.watermarks.c.frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1402 1403 if (vlevel < 3) { 1404 pipes[0].clks_cfg.voltage = 3; 1405 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[2].dcfclk_mhz; 1406 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[2].socclk_mhz; 1407 } 1408 context->bw_ctx.bw.dcn.watermarks.d.urgent_ns = get_wm_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1409 context->bw_ctx.bw.dcn.watermarks.d.cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1410 context->bw_ctx.bw.dcn.watermarks.d.cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1411 context->bw_ctx.bw.dcn.watermarks.d.cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1412 context->bw_ctx.bw.dcn.watermarks.d.pte_meta_urgent_ns = get_wm_memory_trip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1413 context->bw_ctx.bw.dcn.watermarks.d.frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1414 context->bw_ctx.bw.dcn.watermarks.d.frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1415 1416 pipes[0].clks_cfg.voltage = vlevel; 1417 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[vlevel].dcfclk_mhz; 1418 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[vlevel].socclk_mhz; 1419 context->bw_ctx.bw.dcn.watermarks.a.urgent_ns = get_wm_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1420 context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1421 context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1422 context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1423 context->bw_ctx.bw.dcn.watermarks.a.pte_meta_urgent_ns = get_wm_memory_trip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1424 context->bw_ctx.bw.dcn.watermarks.a.frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1425 context->bw_ctx.bw.dcn.watermarks.a.frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1426} 1427 1428void dcn20_update_bounding_box(struct dc *dc, struct _vcs_dpi_soc_bounding_box_st *bb, 1429 struct pp_smu_nv_clock_table *max_clocks, unsigned int *uclk_states, unsigned int num_states) 1430{ 1431 struct _vcs_dpi_voltage_scaling_st calculated_states[DC__VOLTAGE_STATES]; 1432 int i; 1433 int num_calculated_states = 0; 1434 int min_dcfclk = 0; 1435 1436 dc_assert_fp_enabled(); 1437 1438 if (num_states == 0) 1439 return; 1440 1441 memset(calculated_states, 0, sizeof(calculated_states)); 1442 1443 if (dc->bb_overrides.min_dcfclk_mhz > 0) 1444 min_dcfclk = dc->bb_overrides.min_dcfclk_mhz; 1445 else { 1446 if (ASICREV_IS_NAVI12_P(dc->ctx->asic_id.hw_internal_rev)) 1447 min_dcfclk = 310; 1448 else 1449 // Accounting for SOC/DCF relationship, we can go as high as 1450 // 506Mhz in Vmin. 1451 min_dcfclk = 506; 1452 } 1453 1454 for (i = 0; i < num_states; i++) { 1455 int min_fclk_required_by_uclk; 1456 calculated_states[i].state = i; 1457 calculated_states[i].dram_speed_mts = uclk_states[i] * 16 / 1000; 1458 1459 // FCLK:UCLK ratio is 1.08 1460 min_fclk_required_by_uclk = div_u64(((unsigned long long)uclk_states[i]) * 1080, 1461 1000000); 1462 1463 calculated_states[i].fabricclk_mhz = (min_fclk_required_by_uclk < min_dcfclk) ? 1464 min_dcfclk : min_fclk_required_by_uclk; 1465 1466 calculated_states[i].socclk_mhz = (calculated_states[i].fabricclk_mhz > max_clocks->socClockInKhz / 1000) ? 1467 max_clocks->socClockInKhz / 1000 : calculated_states[i].fabricclk_mhz; 1468 1469 calculated_states[i].dcfclk_mhz = (calculated_states[i].fabricclk_mhz > max_clocks->dcfClockInKhz / 1000) ? 1470 max_clocks->dcfClockInKhz / 1000 : calculated_states[i].fabricclk_mhz; 1471 1472 calculated_states[i].dispclk_mhz = max_clocks->displayClockInKhz / 1000; 1473 calculated_states[i].dppclk_mhz = max_clocks->displayClockInKhz / 1000; 1474 calculated_states[i].dscclk_mhz = max_clocks->displayClockInKhz / (1000 * 3); 1475 1476 calculated_states[i].phyclk_mhz = max_clocks->phyClockInKhz / 1000; 1477 1478 num_calculated_states++; 1479 } 1480 1481 calculated_states[num_calculated_states - 1].socclk_mhz = max_clocks->socClockInKhz / 1000; 1482 calculated_states[num_calculated_states - 1].fabricclk_mhz = max_clocks->socClockInKhz / 1000; 1483 calculated_states[num_calculated_states - 1].dcfclk_mhz = max_clocks->dcfClockInKhz / 1000; 1484 1485 memcpy(bb->clock_limits, calculated_states, sizeof(bb->clock_limits)); 1486 bb->num_states = num_calculated_states; 1487 1488 // Duplicate the last state, DML always an extra state identical to max state to work 1489 memcpy(&bb->clock_limits[num_calculated_states], &bb->clock_limits[num_calculated_states - 1], sizeof(struct _vcs_dpi_voltage_scaling_st)); 1490 bb->clock_limits[num_calculated_states].state = bb->num_states; 1491} 1492 1493void dcn20_cap_soc_clocks( 1494 struct _vcs_dpi_soc_bounding_box_st *bb, 1495 struct pp_smu_nv_clock_table max_clocks) 1496{ 1497 int i; 1498 1499 dc_assert_fp_enabled(); 1500 1501 // First pass - cap all clocks higher than the reported max 1502 for (i = 0; i < bb->num_states; i++) { 1503 if ((bb->clock_limits[i].dcfclk_mhz > (max_clocks.dcfClockInKhz / 1000)) 1504 && max_clocks.dcfClockInKhz != 0) 1505 bb->clock_limits[i].dcfclk_mhz = (max_clocks.dcfClockInKhz / 1000); 1506 1507 if ((bb->clock_limits[i].dram_speed_mts > (max_clocks.uClockInKhz / 1000) * 16) 1508 && max_clocks.uClockInKhz != 0) 1509 bb->clock_limits[i].dram_speed_mts = (max_clocks.uClockInKhz / 1000) * 16; 1510 1511 if ((bb->clock_limits[i].fabricclk_mhz > (max_clocks.fabricClockInKhz / 1000)) 1512 && max_clocks.fabricClockInKhz != 0) 1513 bb->clock_limits[i].fabricclk_mhz = (max_clocks.fabricClockInKhz / 1000); 1514 1515 if ((bb->clock_limits[i].dispclk_mhz > (max_clocks.displayClockInKhz / 1000)) 1516 && max_clocks.displayClockInKhz != 0) 1517 bb->clock_limits[i].dispclk_mhz = (max_clocks.displayClockInKhz / 1000); 1518 1519 if ((bb->clock_limits[i].dppclk_mhz > (max_clocks.dppClockInKhz / 1000)) 1520 && max_clocks.dppClockInKhz != 0) 1521 bb->clock_limits[i].dppclk_mhz = (max_clocks.dppClockInKhz / 1000); 1522 1523 if ((bb->clock_limits[i].phyclk_mhz > (max_clocks.phyClockInKhz / 1000)) 1524 && max_clocks.phyClockInKhz != 0) 1525 bb->clock_limits[i].phyclk_mhz = (max_clocks.phyClockInKhz / 1000); 1526 1527 if ((bb->clock_limits[i].socclk_mhz > (max_clocks.socClockInKhz / 1000)) 1528 && max_clocks.socClockInKhz != 0) 1529 bb->clock_limits[i].socclk_mhz = (max_clocks.socClockInKhz / 1000); 1530 1531 if ((bb->clock_limits[i].dscclk_mhz > (max_clocks.dscClockInKhz / 1000)) 1532 && max_clocks.dscClockInKhz != 0) 1533 bb->clock_limits[i].dscclk_mhz = (max_clocks.dscClockInKhz / 1000); 1534 } 1535 1536 // Second pass - remove all duplicate clock states 1537 for (i = bb->num_states - 1; i > 1; i--) { 1538 bool duplicate = true; 1539 1540 if (bb->clock_limits[i-1].dcfclk_mhz != bb->clock_limits[i].dcfclk_mhz) 1541 duplicate = false; 1542 if (bb->clock_limits[i-1].dispclk_mhz != bb->clock_limits[i].dispclk_mhz) 1543 duplicate = false; 1544 if (bb->clock_limits[i-1].dppclk_mhz != bb->clock_limits[i].dppclk_mhz) 1545 duplicate = false; 1546 if (bb->clock_limits[i-1].dram_speed_mts != bb->clock_limits[i].dram_speed_mts) 1547 duplicate = false; 1548 if (bb->clock_limits[i-1].dscclk_mhz != bb->clock_limits[i].dscclk_mhz) 1549 duplicate = false; 1550 if (bb->clock_limits[i-1].fabricclk_mhz != bb->clock_limits[i].fabricclk_mhz) 1551 duplicate = false; 1552 if (bb->clock_limits[i-1].phyclk_mhz != bb->clock_limits[i].phyclk_mhz) 1553 duplicate = false; 1554 if (bb->clock_limits[i-1].socclk_mhz != bb->clock_limits[i].socclk_mhz) 1555 duplicate = false; 1556 1557 if (duplicate) 1558 bb->num_states--; 1559 } 1560} 1561 1562void dcn20_patch_bounding_box(struct dc *dc, struct _vcs_dpi_soc_bounding_box_st *bb) 1563{ 1564 dc_assert_fp_enabled(); 1565 1566 if ((int)(bb->sr_exit_time_us * 1000) != dc->bb_overrides.sr_exit_time_ns 1567 && dc->bb_overrides.sr_exit_time_ns) { 1568 bb->sr_exit_time_us = dc->bb_overrides.sr_exit_time_ns / 1000.0; 1569 } 1570 1571 if ((int)(bb->sr_enter_plus_exit_time_us * 1000) 1572 != dc->bb_overrides.sr_enter_plus_exit_time_ns 1573 && dc->bb_overrides.sr_enter_plus_exit_time_ns) { 1574 bb->sr_enter_plus_exit_time_us = 1575 dc->bb_overrides.sr_enter_plus_exit_time_ns / 1000.0; 1576 } 1577 1578 if ((int)(bb->urgent_latency_us * 1000) != dc->bb_overrides.urgent_latency_ns 1579 && dc->bb_overrides.urgent_latency_ns) { 1580 bb->urgent_latency_us = dc->bb_overrides.urgent_latency_ns / 1000.0; 1581 } 1582 1583 if ((int)(bb->dram_clock_change_latency_us * 1000) 1584 != dc->bb_overrides.dram_clock_change_latency_ns 1585 && dc->bb_overrides.dram_clock_change_latency_ns) { 1586 bb->dram_clock_change_latency_us = 1587 dc->bb_overrides.dram_clock_change_latency_ns / 1000.0; 1588 } 1589 1590 if ((int)(bb->dummy_pstate_latency_us * 1000) 1591 != dc->bb_overrides.dummy_clock_change_latency_ns 1592 && dc->bb_overrides.dummy_clock_change_latency_ns) { 1593 bb->dummy_pstate_latency_us = 1594 dc->bb_overrides.dummy_clock_change_latency_ns / 1000.0; 1595 } 1596} 1597 1598static bool dcn20_validate_bandwidth_internal(struct dc *dc, struct dc_state *context, 1599 bool fast_validate) 1600{ 1601 bool out = false; 1602 1603 BW_VAL_TRACE_SETUP(); 1604 1605 int vlevel = 0; 1606 int pipe_split_from[MAX_PIPES]; 1607 int pipe_cnt = 0; 1608 display_e2e_pipe_params_st *pipes = kzalloc(dc->res_pool->pipe_count * sizeof(display_e2e_pipe_params_st), GFP_ATOMIC); 1609 DC_LOGGER_INIT(dc->ctx->logger); 1610 1611 BW_VAL_TRACE_COUNT(); 1612 1613 out = dcn20_fast_validate_bw(dc, context, pipes, &pipe_cnt, pipe_split_from, &vlevel, fast_validate); 1614 1615 if (pipe_cnt == 0) 1616 goto validate_out; 1617 1618 if (!out) 1619 goto validate_fail; 1620 1621 BW_VAL_TRACE_END_VOLTAGE_LEVEL(); 1622 1623 if (fast_validate) { 1624 BW_VAL_TRACE_SKIP(fast); 1625 goto validate_out; 1626 } 1627 1628 dcn20_calculate_wm(dc, context, pipes, &pipe_cnt, pipe_split_from, vlevel, fast_validate); 1629 dcn20_calculate_dlg_params(dc, context, pipes, pipe_cnt, vlevel); 1630 1631 BW_VAL_TRACE_END_WATERMARKS(); 1632 1633 goto validate_out; 1634 1635validate_fail: 1636 DC_LOG_WARNING("Mode Validation Warning: %s failed validation.\n", 1637 dml_get_status_message(context->bw_ctx.dml.vba.ValidationStatus[context->bw_ctx.dml.vba.soc.num_states])); 1638 1639 BW_VAL_TRACE_SKIP(fail); 1640 out = false; 1641 1642validate_out: 1643 kfree(pipes); 1644 1645 BW_VAL_TRACE_FINISH(); 1646 1647 return out; 1648} 1649 1650bool dcn20_validate_bandwidth_fp(struct dc *dc, 1651 struct dc_state *context, 1652 bool fast_validate) 1653{ 1654 bool voltage_supported = false; 1655 bool full_pstate_supported = false; 1656 bool dummy_pstate_supported = false; 1657 double p_state_latency_us; 1658 1659 dc_assert_fp_enabled(); 1660 1661 p_state_latency_us = context->bw_ctx.dml.soc.dram_clock_change_latency_us; 1662 context->bw_ctx.dml.soc.disable_dram_clock_change_vactive_support = 1663 dc->debug.disable_dram_clock_change_vactive_support; 1664 context->bw_ctx.dml.soc.allow_dram_clock_one_display_vactive = 1665 dc->debug.enable_dram_clock_change_one_display_vactive; 1666 1667 /*Unsafe due to current pipe merge and split logic*/ 1668 ASSERT(context != dc->current_state); 1669 1670 if (fast_validate) { 1671 return dcn20_validate_bandwidth_internal(dc, context, true); 1672 } 1673 1674 // Best case, we support full UCLK switch latency 1675 voltage_supported = dcn20_validate_bandwidth_internal(dc, context, false); 1676 full_pstate_supported = context->bw_ctx.bw.dcn.clk.p_state_change_support; 1677 1678 if (context->bw_ctx.dml.soc.dummy_pstate_latency_us == 0 || 1679 (voltage_supported && full_pstate_supported)) { 1680 context->bw_ctx.bw.dcn.clk.p_state_change_support = full_pstate_supported; 1681 goto restore_dml_state; 1682 } 1683 1684 // Fallback: Try to only support G6 temperature read latency 1685 context->bw_ctx.dml.soc.dram_clock_change_latency_us = context->bw_ctx.dml.soc.dummy_pstate_latency_us; 1686 1687 voltage_supported = dcn20_validate_bandwidth_internal(dc, context, false); 1688 dummy_pstate_supported = context->bw_ctx.bw.dcn.clk.p_state_change_support; 1689 1690 if (voltage_supported && (dummy_pstate_supported || !(context->stream_count))) { 1691 context->bw_ctx.bw.dcn.clk.p_state_change_support = false; 1692 goto restore_dml_state; 1693 } 1694 1695 // ERROR: fallback is supposed to always work. 1696 ASSERT(false); 1697 1698restore_dml_state: 1699 context->bw_ctx.dml.soc.dram_clock_change_latency_us = p_state_latency_us; 1700 return voltage_supported; 1701} 1702 1703void dcn20_fpu_set_wm_ranges(int i, 1704 struct pp_smu_wm_range_sets *ranges, 1705 struct _vcs_dpi_soc_bounding_box_st *loaded_bb) 1706{ 1707 dc_assert_fp_enabled(); 1708 1709 ranges->reader_wm_sets[i].min_fill_clk_mhz = (i > 0) ? (loaded_bb->clock_limits[i - 1].dram_speed_mts / 16) + 1 : 0; 1710 ranges->reader_wm_sets[i].max_fill_clk_mhz = loaded_bb->clock_limits[i].dram_speed_mts / 16; 1711} 1712 1713void dcn20_fpu_adjust_dppclk(struct vba_vars_st *v, 1714 int vlevel, 1715 int max_mpc_comb, 1716 int pipe_idx, 1717 bool is_validating_bw) 1718{ 1719 dc_assert_fp_enabled(); 1720 1721 if (is_validating_bw) 1722 v->RequiredDPPCLK[vlevel][max_mpc_comb][pipe_idx] *= 2; 1723 else 1724 v->RequiredDPPCLK[vlevel][max_mpc_comb][pipe_idx] /= 2; 1725} 1726 1727int dcn21_populate_dml_pipes_from_context(struct dc *dc, 1728 struct dc_state *context, 1729 display_e2e_pipe_params_st *pipes, 1730 bool fast_validate) 1731{ 1732 uint32_t pipe_cnt; 1733 int i; 1734 1735 dc_assert_fp_enabled(); 1736 1737 pipe_cnt = dcn20_populate_dml_pipes_from_context(dc, context, pipes, fast_validate); 1738 1739 for (i = 0; i < pipe_cnt; i++) { 1740 1741 pipes[i].pipe.src.hostvm = dc->res_pool->hubbub->riommu_active; 1742 pipes[i].pipe.src.gpuvm = 1; 1743 } 1744 1745 return pipe_cnt; 1746} 1747 1748static void patch_bounding_box(struct dc *dc, struct _vcs_dpi_soc_bounding_box_st *bb) 1749{ 1750 int i; 1751 1752 if (dc->bb_overrides.sr_exit_time_ns) { 1753 for (i = 0; i < WM_SET_COUNT; i++) { 1754 dc->clk_mgr->bw_params->wm_table.entries[i].sr_exit_time_us = 1755 dc->bb_overrides.sr_exit_time_ns / 1000.0; 1756 } 1757 } 1758 1759 if (dc->bb_overrides.sr_enter_plus_exit_time_ns) { 1760 for (i = 0; i < WM_SET_COUNT; i++) { 1761 dc->clk_mgr->bw_params->wm_table.entries[i].sr_enter_plus_exit_time_us = 1762 dc->bb_overrides.sr_enter_plus_exit_time_ns / 1000.0; 1763 } 1764 } 1765 1766 if (dc->bb_overrides.urgent_latency_ns) { 1767 bb->urgent_latency_us = dc->bb_overrides.urgent_latency_ns / 1000.0; 1768 } 1769 1770 if (dc->bb_overrides.dram_clock_change_latency_ns) { 1771 for (i = 0; i < WM_SET_COUNT; i++) { 1772 dc->clk_mgr->bw_params->wm_table.entries[i].pstate_latency_us = 1773 dc->bb_overrides.dram_clock_change_latency_ns / 1000.0; 1774 } 1775 } 1776} 1777 1778static void calculate_wm_set_for_vlevel(int vlevel, 1779 struct wm_range_table_entry *table_entry, 1780 struct dcn_watermarks *wm_set, 1781 struct display_mode_lib *dml, 1782 display_e2e_pipe_params_st *pipes, 1783 int pipe_cnt) 1784{ 1785 double dram_clock_change_latency_cached = dml->soc.dram_clock_change_latency_us; 1786 1787 ASSERT(vlevel < dml->soc.num_states); 1788 /* only pipe 0 is read for voltage and dcf/soc clocks */ 1789 pipes[0].clks_cfg.voltage = vlevel; 1790 pipes[0].clks_cfg.dcfclk_mhz = dml->soc.clock_limits[vlevel].dcfclk_mhz; 1791 pipes[0].clks_cfg.socclk_mhz = dml->soc.clock_limits[vlevel].socclk_mhz; 1792 1793 dml->soc.dram_clock_change_latency_us = table_entry->pstate_latency_us; 1794 dml->soc.sr_exit_time_us = table_entry->sr_exit_time_us; 1795 dml->soc.sr_enter_plus_exit_time_us = table_entry->sr_enter_plus_exit_time_us; 1796 1797 wm_set->urgent_ns = get_wm_urgent(dml, pipes, pipe_cnt) * 1000; 1798 wm_set->cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(dml, pipes, pipe_cnt) * 1000; 1799 wm_set->cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(dml, pipes, pipe_cnt) * 1000; 1800 wm_set->cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(dml, pipes, pipe_cnt) * 1000; 1801 wm_set->pte_meta_urgent_ns = get_wm_memory_trip(dml, pipes, pipe_cnt) * 1000; 1802 wm_set->frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(dml, pipes, pipe_cnt) * 1000; 1803 wm_set->frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(dml, pipes, pipe_cnt) * 1000; 1804 wm_set->urgent_latency_ns = get_urgent_latency(dml, pipes, pipe_cnt) * 1000; 1805 dml->soc.dram_clock_change_latency_us = dram_clock_change_latency_cached; 1806} 1807 1808static void dcn21_calculate_wm(struct dc *dc, struct dc_state *context, 1809 display_e2e_pipe_params_st *pipes, 1810 int *out_pipe_cnt, 1811 int *pipe_split_from, 1812 int vlevel_req, 1813 bool fast_validate) 1814{ 1815 int pipe_cnt, i, pipe_idx; 1816 int vlevel, vlevel_max; 1817 struct wm_range_table_entry *table_entry; 1818 struct clk_bw_params *bw_params = dc->clk_mgr->bw_params; 1819 1820 ASSERT(bw_params); 1821 1822 patch_bounding_box(dc, &context->bw_ctx.dml.soc); 1823 1824 for (i = 0, pipe_idx = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) { 1825 if (!context->res_ctx.pipe_ctx[i].stream) 1826 continue; 1827 1828 pipes[pipe_cnt].clks_cfg.refclk_mhz = dc->res_pool->ref_clocks.dchub_ref_clock_inKhz / 1000.0; 1829 pipes[pipe_cnt].clks_cfg.dispclk_mhz = context->bw_ctx.dml.vba.RequiredDISPCLK[vlevel_req][context->bw_ctx.dml.vba.maxMpcComb]; 1830 1831 if (pipe_split_from[i] < 0) { 1832 pipes[pipe_cnt].clks_cfg.dppclk_mhz = 1833 context->bw_ctx.dml.vba.RequiredDPPCLK[vlevel_req][context->bw_ctx.dml.vba.maxMpcComb][pipe_idx]; 1834 if (context->bw_ctx.dml.vba.BlendingAndTiming[pipe_idx] == pipe_idx) 1835 pipes[pipe_cnt].pipe.dest.odm_combine = 1836 context->bw_ctx.dml.vba.ODMCombineEnablePerState[vlevel_req][pipe_idx]; 1837 else 1838 pipes[pipe_cnt].pipe.dest.odm_combine = 0; 1839 pipe_idx++; 1840 } else { 1841 pipes[pipe_cnt].clks_cfg.dppclk_mhz = 1842 context->bw_ctx.dml.vba.RequiredDPPCLK[vlevel_req][context->bw_ctx.dml.vba.maxMpcComb][pipe_split_from[i]]; 1843 if (context->bw_ctx.dml.vba.BlendingAndTiming[pipe_split_from[i]] == pipe_split_from[i]) 1844 pipes[pipe_cnt].pipe.dest.odm_combine = 1845 context->bw_ctx.dml.vba.ODMCombineEnablePerState[vlevel_req][pipe_split_from[i]]; 1846 else 1847 pipes[pipe_cnt].pipe.dest.odm_combine = 0; 1848 } 1849 pipe_cnt++; 1850 } 1851 1852 if (pipe_cnt != pipe_idx) { 1853 if (dc->res_pool->funcs->populate_dml_pipes) 1854 pipe_cnt = dc->res_pool->funcs->populate_dml_pipes(dc, 1855 context, pipes, fast_validate); 1856 else 1857 pipe_cnt = dcn21_populate_dml_pipes_from_context(dc, 1858 context, pipes, fast_validate); 1859 } 1860 1861 *out_pipe_cnt = pipe_cnt; 1862 1863 vlevel_max = bw_params->clk_table.num_entries - 1; 1864 1865 1866 /* WM Set D */ 1867 table_entry = &bw_params->wm_table.entries[WM_D]; 1868 if (table_entry->wm_type == WM_TYPE_RETRAINING) 1869 vlevel = 0; 1870 else 1871 vlevel = vlevel_max; 1872 calculate_wm_set_for_vlevel(vlevel, table_entry, &context->bw_ctx.bw.dcn.watermarks.d, 1873 &context->bw_ctx.dml, pipes, pipe_cnt); 1874 /* WM Set C */ 1875 table_entry = &bw_params->wm_table.entries[WM_C]; 1876 vlevel = MIN(MAX(vlevel_req, 3), vlevel_max); 1877 calculate_wm_set_for_vlevel(vlevel, table_entry, &context->bw_ctx.bw.dcn.watermarks.c, 1878 &context->bw_ctx.dml, pipes, pipe_cnt); 1879 /* WM Set B */ 1880 table_entry = &bw_params->wm_table.entries[WM_B]; 1881 vlevel = MIN(MAX(vlevel_req, 2), vlevel_max); 1882 calculate_wm_set_for_vlevel(vlevel, table_entry, &context->bw_ctx.bw.dcn.watermarks.b, 1883 &context->bw_ctx.dml, pipes, pipe_cnt); 1884 1885 /* WM Set A */ 1886 table_entry = &bw_params->wm_table.entries[WM_A]; 1887 vlevel = MIN(vlevel_req, vlevel_max); 1888 calculate_wm_set_for_vlevel(vlevel, table_entry, &context->bw_ctx.bw.dcn.watermarks.a, 1889 &context->bw_ctx.dml, pipes, pipe_cnt); 1890} 1891 1892bool dcn21_validate_bandwidth_fp(struct dc *dc, 1893 struct dc_state *context, 1894 bool fast_validate) 1895{ 1896 bool out = false; 1897 1898 BW_VAL_TRACE_SETUP(); 1899 1900 int vlevel = 0; 1901 int pipe_split_from[MAX_PIPES]; 1902 int pipe_cnt = 0; 1903 display_e2e_pipe_params_st *pipes = kzalloc(dc->res_pool->pipe_count * sizeof(display_e2e_pipe_params_st), GFP_ATOMIC); 1904 DC_LOGGER_INIT(dc->ctx->logger); 1905 1906 BW_VAL_TRACE_COUNT(); 1907 1908 dc_assert_fp_enabled(); 1909 1910 /*Unsafe due to current pipe merge and split logic*/ 1911 ASSERT(context != dc->current_state); 1912 1913 out = dcn21_fast_validate_bw(dc, context, pipes, &pipe_cnt, pipe_split_from, &vlevel, fast_validate); 1914 1915 if (pipe_cnt == 0) 1916 goto validate_out; 1917 1918 if (!out) 1919 goto validate_fail; 1920 1921 BW_VAL_TRACE_END_VOLTAGE_LEVEL(); 1922 1923 if (fast_validate) { 1924 BW_VAL_TRACE_SKIP(fast); 1925 goto validate_out; 1926 } 1927 1928 dcn21_calculate_wm(dc, context, pipes, &pipe_cnt, pipe_split_from, vlevel, fast_validate); 1929 dcn20_calculate_dlg_params(dc, context, pipes, pipe_cnt, vlevel); 1930 1931 BW_VAL_TRACE_END_WATERMARKS(); 1932 1933 goto validate_out; 1934 1935validate_fail: 1936 DC_LOG_WARNING("Mode Validation Warning: %s failed validation.\n", 1937 dml_get_status_message(context->bw_ctx.dml.vba.ValidationStatus[context->bw_ctx.dml.vba.soc.num_states])); 1938 1939 BW_VAL_TRACE_SKIP(fail); 1940 out = false; 1941 1942validate_out: 1943 kfree(pipes); 1944 1945 BW_VAL_TRACE_FINISH(); 1946 1947 return out; 1948} 1949 1950static struct _vcs_dpi_voltage_scaling_st construct_low_pstate_lvl(struct clk_limit_table *clk_table, unsigned int high_voltage_lvl) 1951{ 1952 struct _vcs_dpi_voltage_scaling_st low_pstate_lvl; 1953 int i; 1954 1955 low_pstate_lvl.state = 1; 1956 low_pstate_lvl.dcfclk_mhz = clk_table->entries[0].dcfclk_mhz; 1957 low_pstate_lvl.fabricclk_mhz = clk_table->entries[0].fclk_mhz; 1958 low_pstate_lvl.socclk_mhz = clk_table->entries[0].socclk_mhz; 1959 low_pstate_lvl.dram_speed_mts = clk_table->entries[0].memclk_mhz * 2; 1960 1961 low_pstate_lvl.dispclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].dispclk_mhz; 1962 low_pstate_lvl.dppclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].dppclk_mhz; 1963 low_pstate_lvl.dram_bw_per_chan_gbps = dcn2_1_soc.clock_limits[high_voltage_lvl].dram_bw_per_chan_gbps; 1964 low_pstate_lvl.dscclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].dscclk_mhz; 1965 low_pstate_lvl.dtbclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].dtbclk_mhz; 1966 low_pstate_lvl.phyclk_d18_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].phyclk_d18_mhz; 1967 low_pstate_lvl.phyclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].phyclk_mhz; 1968 1969 for (i = clk_table->num_entries; i > 1; i--) 1970 clk_table->entries[i] = clk_table->entries[i-1]; 1971 clk_table->entries[1] = clk_table->entries[0]; 1972 clk_table->num_entries++; 1973 1974 return low_pstate_lvl; 1975} 1976 1977void dcn21_update_bw_bounding_box(struct dc *dc, struct clk_bw_params *bw_params) 1978{ 1979 struct dcn21_resource_pool *pool = TO_DCN21_RES_POOL(dc->res_pool); 1980 struct clk_limit_table *clk_table = &bw_params->clk_table; 1981 struct _vcs_dpi_voltage_scaling_st clock_limits[DC__VOLTAGE_STATES]; 1982 unsigned int i, closest_clk_lvl = 0, k = 0; 1983 int j; 1984 1985 dc_assert_fp_enabled(); 1986 1987 dcn2_1_ip.max_num_otg = pool->base.res_cap->num_timing_generator; 1988 dcn2_1_ip.max_num_dpp = pool->base.pipe_count; 1989 dcn2_1_soc.num_chans = bw_params->num_channels; 1990 1991 ASSERT(clk_table->num_entries); 1992 /* Copy dcn2_1_soc.clock_limits to clock_limits to avoid copying over null states later */ 1993 for (i = 0; i < dcn2_1_soc.num_states + 1; i++) { 1994 clock_limits[i] = dcn2_1_soc.clock_limits[i]; 1995 } 1996 1997 for (i = 0; i < clk_table->num_entries; i++) { 1998 /* loop backwards*/ 1999 for (closest_clk_lvl = 0, j = dcn2_1_soc.num_states - 1; j >= 0; j--) { 2000 if ((unsigned int) dcn2_1_soc.clock_limits[j].dcfclk_mhz <= clk_table->entries[i].dcfclk_mhz) { 2001 closest_clk_lvl = j; 2002 break; 2003 } 2004 } 2005 2006 /* clk_table[1] is reserved for min DF PState. skip here to fill in later. */ 2007 if (i == 1) 2008 k++; 2009 2010 clock_limits[k].state = k; 2011 clock_limits[k].dcfclk_mhz = clk_table->entries[i].dcfclk_mhz; 2012 clock_limits[k].fabricclk_mhz = clk_table->entries[i].fclk_mhz; 2013 clock_limits[k].socclk_mhz = clk_table->entries[i].socclk_mhz; 2014 clock_limits[k].dram_speed_mts = clk_table->entries[i].memclk_mhz * 2; 2015 2016 clock_limits[k].dispclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].dispclk_mhz; 2017 clock_limits[k].dppclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].dppclk_mhz; 2018 clock_limits[k].dram_bw_per_chan_gbps = dcn2_1_soc.clock_limits[closest_clk_lvl].dram_bw_per_chan_gbps; 2019 clock_limits[k].dscclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].dscclk_mhz; 2020 clock_limits[k].dtbclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].dtbclk_mhz; 2021 clock_limits[k].phyclk_d18_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].phyclk_d18_mhz; 2022 clock_limits[k].phyclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].phyclk_mhz; 2023 2024 k++; 2025 } 2026 for (i = 0; i < clk_table->num_entries + 1; i++) 2027 dcn2_1_soc.clock_limits[i] = clock_limits[i]; 2028 if (clk_table->num_entries) { 2029 dcn2_1_soc.num_states = clk_table->num_entries + 1; 2030 /* fill in min DF PState */ 2031 dcn2_1_soc.clock_limits[1] = construct_low_pstate_lvl(clk_table, closest_clk_lvl); 2032 /* duplicate last level */ 2033 dcn2_1_soc.clock_limits[dcn2_1_soc.num_states] = dcn2_1_soc.clock_limits[dcn2_1_soc.num_states - 1]; 2034 dcn2_1_soc.clock_limits[dcn2_1_soc.num_states].state = dcn2_1_soc.num_states; 2035 } 2036 2037 dml_init_instance(&dc->dml, &dcn2_1_soc, &dcn2_1_ip, DML_PROJECT_DCN21); 2038}