1 // SPDX-License-Identifier: MIT 2 /* 3 * Copyright 2021 Advanced Micro Devices, Inc. 4 * 5 * Permission is hereby granted, free of charge, to any person obtaining a 6 * copy of this software and associated documentation files (the "Software"), 7 * to deal in the Software without restriction, including without limitation 8 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 9 * and/or sell copies of the Software, and to permit persons to whom the 10 * Software is furnished to do so, subject to the following conditions: 11 * 12 * The above copyright notice and this permission notice shall be included in 13 * all copies or substantial portions of the Software. 14 * 15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 18 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 19 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 20 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 21 * OTHER DEALINGS IN THE SOFTWARE. 22 * 23 * Authors: AMD 24 * 25 */ 26 27 #include "resource.h" 28 #include "clk_mgr.h" 29 #include "dc_link_dp.h" 30 #include "dchubbub.h" 31 #include "dcn20/dcn20_resource.h" 32 #include "dcn21/dcn21_resource.h" 33 #include "clk_mgr/dcn21/rn_clk_mgr.h" 34 35 #include "dcn20_fpu.h" 36 37 #define DC_LOGGER_INIT(logger) 38 39 #ifndef MAX 40 #define MAX(X, Y) ((X) > (Y) ? (X) : (Y)) 41 #endif 42 #ifndef MIN 43 #define MIN(X, Y) ((X) < (Y) ? (X) : (Y)) 44 #endif 45 46 /* Constant */ 47 #define LPDDR_MEM_RETRAIN_LATENCY 4.977 /* Number obtained from LPDDR4 Training Counter Requirement doc */ 48 49 /** 50 * DOC: DCN2x FPU manipulation Overview 51 * 52 * The DCN architecture relies on FPU operations, which require special 53 * compilation flags and the use of kernel_fpu_begin/end functions; ideally, we 54 * want to avoid spreading FPU access across multiple files. With this idea in 55 * mind, this file aims to centralize all DCN20 and DCN2.1 (DCN2x) functions 56 * that require FPU access in a single place. Code in this file follows the 57 * following code pattern: 58 * 59 * 1. Functions that use FPU operations should be isolated in static functions. 60 * 2. The FPU functions should have the noinline attribute to ensure anything 61 * that deals with FP register is contained within this call. 62 * 3. All function that needs to be accessed outside this file requires a 63 * public interface that not uses any FPU reference. 64 * 4. Developers **must not** use DC_FP_START/END in this file, but they need 65 * to ensure that the caller invokes it before access any function available 66 * in this file. For this reason, public functions in this file must invoke 67 * dc_assert_fp_enabled(); 68 * 69 * Let's expand a little bit more the idea in the code pattern. To fully 70 * isolate FPU operations in a single place, we must avoid situations where 71 * compilers spill FP values to registers due to FP enable in a specific C 72 * file. Note that even if we isolate all FPU functions in a single file and 73 * call its interface from other files, the compiler might enable the use of 74 * FPU before we call DC_FP_START. Nevertheless, it is the programmer's 75 * responsibility to invoke DC_FP_START/END in the correct place. To highlight 76 * situations where developers forgot to use the FP protection before calling 77 * the DC FPU interface functions, we introduce a helper that checks if the 78 * function is invoked under FP protection. If not, it will trigger a kernel 79 * warning. 80 */ 81 82 struct _vcs_dpi_ip_params_st dcn2_0_ip = { 83 .odm_capable = 1, 84 .gpuvm_enable = 0, 85 .hostvm_enable = 0, 86 .gpuvm_max_page_table_levels = 4, 87 .hostvm_max_page_table_levels = 4, 88 .hostvm_cached_page_table_levels = 0, 89 .pte_group_size_bytes = 2048, 90 .num_dsc = 6, 91 .rob_buffer_size_kbytes = 168, 92 .det_buffer_size_kbytes = 164, 93 .dpte_buffer_size_in_pte_reqs_luma = 84, 94 .pde_proc_buffer_size_64k_reqs = 48, 95 .dpp_output_buffer_pixels = 2560, 96 .opp_output_buffer_lines = 1, 97 .pixel_chunk_size_kbytes = 8, 98 .pte_chunk_size_kbytes = 2, 99 .meta_chunk_size_kbytes = 2, 100 .writeback_chunk_size_kbytes = 2, 101 .line_buffer_size_bits = 789504, 102 .is_line_buffer_bpp_fixed = 0, 103 .line_buffer_fixed_bpp = 0, 104 .dcc_supported = true, 105 .max_line_buffer_lines = 12, 106 .writeback_luma_buffer_size_kbytes = 12, 107 .writeback_chroma_buffer_size_kbytes = 8, 108 .writeback_chroma_line_buffer_width_pixels = 4, 109 .writeback_max_hscl_ratio = 1, 110 .writeback_max_vscl_ratio = 1, 111 .writeback_min_hscl_ratio = 1, 112 .writeback_min_vscl_ratio = 1, 113 .writeback_max_hscl_taps = 12, 114 .writeback_max_vscl_taps = 12, 115 .writeback_line_buffer_luma_buffer_size = 0, 116 .writeback_line_buffer_chroma_buffer_size = 14643, 117 .cursor_buffer_size = 8, 118 .cursor_chunk_size = 2, 119 .max_num_otg = 6, 120 .max_num_dpp = 6, 121 .max_num_wb = 1, 122 .max_dchub_pscl_bw_pix_per_clk = 4, 123 .max_pscl_lb_bw_pix_per_clk = 2, 124 .max_lb_vscl_bw_pix_per_clk = 4, 125 .max_vscl_hscl_bw_pix_per_clk = 4, 126 .max_hscl_ratio = 8, 127 .max_vscl_ratio = 8, 128 .hscl_mults = 4, 129 .vscl_mults = 4, 130 .max_hscl_taps = 8, 131 .max_vscl_taps = 8, 132 .dispclk_ramp_margin_percent = 1, 133 .underscan_factor = 1.10, 134 .min_vblank_lines = 32, // 135 .dppclk_delay_subtotal = 77, // 136 .dppclk_delay_scl_lb_only = 16, 137 .dppclk_delay_scl = 50, 138 .dppclk_delay_cnvc_formatter = 8, 139 .dppclk_delay_cnvc_cursor = 6, 140 .dispclk_delay_subtotal = 87, // 141 .dcfclk_cstate_latency = 10, // SRExitTime 142 .max_inter_dcn_tile_repeaters = 8, 143 .xfc_supported = true, 144 .xfc_fill_bw_overhead_percent = 10.0, 145 .xfc_fill_constant_bytes = 0, 146 .number_of_cursors = 1, 147 }; 148 149 struct _vcs_dpi_ip_params_st dcn2_0_nv14_ip = { 150 .odm_capable = 1, 151 .gpuvm_enable = 0, 152 .hostvm_enable = 0, 153 .gpuvm_max_page_table_levels = 4, 154 .hostvm_max_page_table_levels = 4, 155 .hostvm_cached_page_table_levels = 0, 156 .num_dsc = 5, 157 .rob_buffer_size_kbytes = 168, 158 .det_buffer_size_kbytes = 164, 159 .dpte_buffer_size_in_pte_reqs_luma = 84, 160 .dpte_buffer_size_in_pte_reqs_chroma = 42,//todo 161 .dpp_output_buffer_pixels = 2560, 162 .opp_output_buffer_lines = 1, 163 .pixel_chunk_size_kbytes = 8, 164 .pte_enable = 1, 165 .max_page_table_levels = 4, 166 .pte_chunk_size_kbytes = 2, 167 .meta_chunk_size_kbytes = 2, 168 .writeback_chunk_size_kbytes = 2, 169 .line_buffer_size_bits = 789504, 170 .is_line_buffer_bpp_fixed = 0, 171 .line_buffer_fixed_bpp = 0, 172 .dcc_supported = true, 173 .max_line_buffer_lines = 12, 174 .writeback_luma_buffer_size_kbytes = 12, 175 .writeback_chroma_buffer_size_kbytes = 8, 176 .writeback_chroma_line_buffer_width_pixels = 4, 177 .writeback_max_hscl_ratio = 1, 178 .writeback_max_vscl_ratio = 1, 179 .writeback_min_hscl_ratio = 1, 180 .writeback_min_vscl_ratio = 1, 181 .writeback_max_hscl_taps = 12, 182 .writeback_max_vscl_taps = 12, 183 .writeback_line_buffer_luma_buffer_size = 0, 184 .writeback_line_buffer_chroma_buffer_size = 14643, 185 .cursor_buffer_size = 8, 186 .cursor_chunk_size = 2, 187 .max_num_otg = 5, 188 .max_num_dpp = 5, 189 .max_num_wb = 1, 190 .max_dchub_pscl_bw_pix_per_clk = 4, 191 .max_pscl_lb_bw_pix_per_clk = 2, 192 .max_lb_vscl_bw_pix_per_clk = 4, 193 .max_vscl_hscl_bw_pix_per_clk = 4, 194 .max_hscl_ratio = 8, 195 .max_vscl_ratio = 8, 196 .hscl_mults = 4, 197 .vscl_mults = 4, 198 .max_hscl_taps = 8, 199 .max_vscl_taps = 8, 200 .dispclk_ramp_margin_percent = 1, 201 .underscan_factor = 1.10, 202 .min_vblank_lines = 32, // 203 .dppclk_delay_subtotal = 77, // 204 .dppclk_delay_scl_lb_only = 16, 205 .dppclk_delay_scl = 50, 206 .dppclk_delay_cnvc_formatter = 8, 207 .dppclk_delay_cnvc_cursor = 6, 208 .dispclk_delay_subtotal = 87, // 209 .dcfclk_cstate_latency = 10, // SRExitTime 210 .max_inter_dcn_tile_repeaters = 8, 211 .xfc_supported = true, 212 .xfc_fill_bw_overhead_percent = 10.0, 213 .xfc_fill_constant_bytes = 0, 214 .ptoi_supported = 0, 215 .number_of_cursors = 1, 216 }; 217 218 struct _vcs_dpi_soc_bounding_box_st dcn2_0_soc = { 219 /* Defaults that get patched on driver load from firmware. */ 220 .clock_limits = { 221 { 222 .state = 0, 223 .dcfclk_mhz = 560.0, 224 .fabricclk_mhz = 560.0, 225 .dispclk_mhz = 513.0, 226 .dppclk_mhz = 513.0, 227 .phyclk_mhz = 540.0, 228 .socclk_mhz = 560.0, 229 .dscclk_mhz = 171.0, 230 .dram_speed_mts = 8960.0, 231 }, 232 { 233 .state = 1, 234 .dcfclk_mhz = 694.0, 235 .fabricclk_mhz = 694.0, 236 .dispclk_mhz = 642.0, 237 .dppclk_mhz = 642.0, 238 .phyclk_mhz = 600.0, 239 .socclk_mhz = 694.0, 240 .dscclk_mhz = 214.0, 241 .dram_speed_mts = 11104.0, 242 }, 243 { 244 .state = 2, 245 .dcfclk_mhz = 875.0, 246 .fabricclk_mhz = 875.0, 247 .dispclk_mhz = 734.0, 248 .dppclk_mhz = 734.0, 249 .phyclk_mhz = 810.0, 250 .socclk_mhz = 875.0, 251 .dscclk_mhz = 245.0, 252 .dram_speed_mts = 14000.0, 253 }, 254 { 255 .state = 3, 256 .dcfclk_mhz = 1000.0, 257 .fabricclk_mhz = 1000.0, 258 .dispclk_mhz = 1100.0, 259 .dppclk_mhz = 1100.0, 260 .phyclk_mhz = 810.0, 261 .socclk_mhz = 1000.0, 262 .dscclk_mhz = 367.0, 263 .dram_speed_mts = 16000.0, 264 }, 265 { 266 .state = 4, 267 .dcfclk_mhz = 1200.0, 268 .fabricclk_mhz = 1200.0, 269 .dispclk_mhz = 1284.0, 270 .dppclk_mhz = 1284.0, 271 .phyclk_mhz = 810.0, 272 .socclk_mhz = 1200.0, 273 .dscclk_mhz = 428.0, 274 .dram_speed_mts = 16000.0, 275 }, 276 /*Extra state, no dispclk ramping*/ 277 { 278 .state = 5, 279 .dcfclk_mhz = 1200.0, 280 .fabricclk_mhz = 1200.0, 281 .dispclk_mhz = 1284.0, 282 .dppclk_mhz = 1284.0, 283 .phyclk_mhz = 810.0, 284 .socclk_mhz = 1200.0, 285 .dscclk_mhz = 428.0, 286 .dram_speed_mts = 16000.0, 287 }, 288 }, 289 .num_states = 5, 290 .sr_exit_time_us = 8.6, 291 .sr_enter_plus_exit_time_us = 10.9, 292 .urgent_latency_us = 4.0, 293 .urgent_latency_pixel_data_only_us = 4.0, 294 .urgent_latency_pixel_mixed_with_vm_data_us = 4.0, 295 .urgent_latency_vm_data_only_us = 4.0, 296 .urgent_out_of_order_return_per_channel_pixel_only_bytes = 4096, 297 .urgent_out_of_order_return_per_channel_pixel_and_vm_bytes = 4096, 298 .urgent_out_of_order_return_per_channel_vm_only_bytes = 4096, 299 .pct_ideal_dram_sdp_bw_after_urgent_pixel_only = 40.0, 300 .pct_ideal_dram_sdp_bw_after_urgent_pixel_and_vm = 40.0, 301 .pct_ideal_dram_sdp_bw_after_urgent_vm_only = 40.0, 302 .max_avg_sdp_bw_use_normal_percent = 40.0, 303 .max_avg_dram_bw_use_normal_percent = 40.0, 304 .writeback_latency_us = 12.0, 305 .ideal_dram_bw_after_urgent_percent = 40.0, 306 .max_request_size_bytes = 256, 307 .dram_channel_width_bytes = 2, 308 .fabric_datapath_to_dcn_data_return_bytes = 64, 309 .dcn_downspread_percent = 0.5, 310 .downspread_percent = 0.38, 311 .dram_page_open_time_ns = 50.0, 312 .dram_rw_turnaround_time_ns = 17.5, 313 .dram_return_buffer_per_channel_bytes = 8192, 314 .round_trip_ping_latency_dcfclk_cycles = 131, 315 .urgent_out_of_order_return_per_channel_bytes = 256, 316 .channel_interleave_bytes = 256, 317 .num_banks = 8, 318 .num_chans = 16, 319 .vmm_page_size_bytes = 4096, 320 .dram_clock_change_latency_us = 404.0, 321 .dummy_pstate_latency_us = 5.0, 322 .writeback_dram_clock_change_latency_us = 23.0, 323 .return_bus_width_bytes = 64, 324 .dispclk_dppclk_vco_speed_mhz = 3850, 325 .xfc_bus_transport_time_us = 20, 326 .xfc_xbuf_latency_tolerance_us = 4, 327 .use_urgent_burst_bw = 0 328 }; 329 330 struct _vcs_dpi_soc_bounding_box_st dcn2_0_nv14_soc = { 331 .clock_limits = { 332 { 333 .state = 0, 334 .dcfclk_mhz = 560.0, 335 .fabricclk_mhz = 560.0, 336 .dispclk_mhz = 513.0, 337 .dppclk_mhz = 513.0, 338 .phyclk_mhz = 540.0, 339 .socclk_mhz = 560.0, 340 .dscclk_mhz = 171.0, 341 .dram_speed_mts = 8960.0, 342 }, 343 { 344 .state = 1, 345 .dcfclk_mhz = 694.0, 346 .fabricclk_mhz = 694.0, 347 .dispclk_mhz = 642.0, 348 .dppclk_mhz = 642.0, 349 .phyclk_mhz = 600.0, 350 .socclk_mhz = 694.0, 351 .dscclk_mhz = 214.0, 352 .dram_speed_mts = 11104.0, 353 }, 354 { 355 .state = 2, 356 .dcfclk_mhz = 875.0, 357 .fabricclk_mhz = 875.0, 358 .dispclk_mhz = 734.0, 359 .dppclk_mhz = 734.0, 360 .phyclk_mhz = 810.0, 361 .socclk_mhz = 875.0, 362 .dscclk_mhz = 245.0, 363 .dram_speed_mts = 14000.0, 364 }, 365 { 366 .state = 3, 367 .dcfclk_mhz = 1000.0, 368 .fabricclk_mhz = 1000.0, 369 .dispclk_mhz = 1100.0, 370 .dppclk_mhz = 1100.0, 371 .phyclk_mhz = 810.0, 372 .socclk_mhz = 1000.0, 373 .dscclk_mhz = 367.0, 374 .dram_speed_mts = 16000.0, 375 }, 376 { 377 .state = 4, 378 .dcfclk_mhz = 1200.0, 379 .fabricclk_mhz = 1200.0, 380 .dispclk_mhz = 1284.0, 381 .dppclk_mhz = 1284.0, 382 .phyclk_mhz = 810.0, 383 .socclk_mhz = 1200.0, 384 .dscclk_mhz = 428.0, 385 .dram_speed_mts = 16000.0, 386 }, 387 /*Extra state, no dispclk ramping*/ 388 { 389 .state = 5, 390 .dcfclk_mhz = 1200.0, 391 .fabricclk_mhz = 1200.0, 392 .dispclk_mhz = 1284.0, 393 .dppclk_mhz = 1284.0, 394 .phyclk_mhz = 810.0, 395 .socclk_mhz = 1200.0, 396 .dscclk_mhz = 428.0, 397 .dram_speed_mts = 16000.0, 398 }, 399 }, 400 .num_states = 5, 401 .sr_exit_time_us = 11.6, 402 .sr_enter_plus_exit_time_us = 13.9, 403 .urgent_latency_us = 4.0, 404 .urgent_latency_pixel_data_only_us = 4.0, 405 .urgent_latency_pixel_mixed_with_vm_data_us = 4.0, 406 .urgent_latency_vm_data_only_us = 4.0, 407 .urgent_out_of_order_return_per_channel_pixel_only_bytes = 4096, 408 .urgent_out_of_order_return_per_channel_pixel_and_vm_bytes = 4096, 409 .urgent_out_of_order_return_per_channel_vm_only_bytes = 4096, 410 .pct_ideal_dram_sdp_bw_after_urgent_pixel_only = 40.0, 411 .pct_ideal_dram_sdp_bw_after_urgent_pixel_and_vm = 40.0, 412 .pct_ideal_dram_sdp_bw_after_urgent_vm_only = 40.0, 413 .max_avg_sdp_bw_use_normal_percent = 40.0, 414 .max_avg_dram_bw_use_normal_percent = 40.0, 415 .writeback_latency_us = 12.0, 416 .ideal_dram_bw_after_urgent_percent = 40.0, 417 .max_request_size_bytes = 256, 418 .dram_channel_width_bytes = 2, 419 .fabric_datapath_to_dcn_data_return_bytes = 64, 420 .dcn_downspread_percent = 0.5, 421 .downspread_percent = 0.38, 422 .dram_page_open_time_ns = 50.0, 423 .dram_rw_turnaround_time_ns = 17.5, 424 .dram_return_buffer_per_channel_bytes = 8192, 425 .round_trip_ping_latency_dcfclk_cycles = 131, 426 .urgent_out_of_order_return_per_channel_bytes = 256, 427 .channel_interleave_bytes = 256, 428 .num_banks = 8, 429 .num_chans = 8, 430 .vmm_page_size_bytes = 4096, 431 .dram_clock_change_latency_us = 404.0, 432 .dummy_pstate_latency_us = 5.0, 433 .writeback_dram_clock_change_latency_us = 23.0, 434 .return_bus_width_bytes = 64, 435 .dispclk_dppclk_vco_speed_mhz = 3850, 436 .xfc_bus_transport_time_us = 20, 437 .xfc_xbuf_latency_tolerance_us = 4, 438 .use_urgent_burst_bw = 0 439 }; 440 441 struct _vcs_dpi_soc_bounding_box_st dcn2_0_nv12_soc = { 0 }; 442 443 struct _vcs_dpi_ip_params_st dcn2_1_ip = { 444 .odm_capable = 1, 445 .gpuvm_enable = 1, 446 .hostvm_enable = 1, 447 .gpuvm_max_page_table_levels = 1, 448 .hostvm_max_page_table_levels = 4, 449 .hostvm_cached_page_table_levels = 2, 450 .num_dsc = 3, 451 .rob_buffer_size_kbytes = 168, 452 .det_buffer_size_kbytes = 164, 453 .dpte_buffer_size_in_pte_reqs_luma = 44, 454 .dpte_buffer_size_in_pte_reqs_chroma = 42,//todo 455 .dpp_output_buffer_pixels = 2560, 456 .opp_output_buffer_lines = 1, 457 .pixel_chunk_size_kbytes = 8, 458 .pte_enable = 1, 459 .max_page_table_levels = 4, 460 .pte_chunk_size_kbytes = 2, 461 .meta_chunk_size_kbytes = 2, 462 .min_meta_chunk_size_bytes = 256, 463 .writeback_chunk_size_kbytes = 2, 464 .line_buffer_size_bits = 789504, 465 .is_line_buffer_bpp_fixed = 0, 466 .line_buffer_fixed_bpp = 0, 467 .dcc_supported = true, 468 .max_line_buffer_lines = 12, 469 .writeback_luma_buffer_size_kbytes = 12, 470 .writeback_chroma_buffer_size_kbytes = 8, 471 .writeback_chroma_line_buffer_width_pixels = 4, 472 .writeback_max_hscl_ratio = 1, 473 .writeback_max_vscl_ratio = 1, 474 .writeback_min_hscl_ratio = 1, 475 .writeback_min_vscl_ratio = 1, 476 .writeback_max_hscl_taps = 12, 477 .writeback_max_vscl_taps = 12, 478 .writeback_line_buffer_luma_buffer_size = 0, 479 .writeback_line_buffer_chroma_buffer_size = 14643, 480 .cursor_buffer_size = 8, 481 .cursor_chunk_size = 2, 482 .max_num_otg = 4, 483 .max_num_dpp = 4, 484 .max_num_wb = 1, 485 .max_dchub_pscl_bw_pix_per_clk = 4, 486 .max_pscl_lb_bw_pix_per_clk = 2, 487 .max_lb_vscl_bw_pix_per_clk = 4, 488 .max_vscl_hscl_bw_pix_per_clk = 4, 489 .max_hscl_ratio = 4, 490 .max_vscl_ratio = 4, 491 .hscl_mults = 4, 492 .vscl_mults = 4, 493 .max_hscl_taps = 8, 494 .max_vscl_taps = 8, 495 .dispclk_ramp_margin_percent = 1, 496 .underscan_factor = 1.10, 497 .min_vblank_lines = 32, // 498 .dppclk_delay_subtotal = 77, // 499 .dppclk_delay_scl_lb_only = 16, 500 .dppclk_delay_scl = 50, 501 .dppclk_delay_cnvc_formatter = 8, 502 .dppclk_delay_cnvc_cursor = 6, 503 .dispclk_delay_subtotal = 87, // 504 .dcfclk_cstate_latency = 10, // SRExitTime 505 .max_inter_dcn_tile_repeaters = 8, 506 507 .xfc_supported = false, 508 .xfc_fill_bw_overhead_percent = 10.0, 509 .xfc_fill_constant_bytes = 0, 510 .ptoi_supported = 0, 511 .number_of_cursors = 1, 512 }; 513 514 struct _vcs_dpi_soc_bounding_box_st dcn2_1_soc = { 515 .clock_limits = { 516 { 517 .state = 0, 518 .dcfclk_mhz = 400.0, 519 .fabricclk_mhz = 400.0, 520 .dispclk_mhz = 600.0, 521 .dppclk_mhz = 400.00, 522 .phyclk_mhz = 600.0, 523 .socclk_mhz = 278.0, 524 .dscclk_mhz = 205.67, 525 .dram_speed_mts = 1600.0, 526 }, 527 { 528 .state = 1, 529 .dcfclk_mhz = 464.52, 530 .fabricclk_mhz = 800.0, 531 .dispclk_mhz = 654.55, 532 .dppclk_mhz = 626.09, 533 .phyclk_mhz = 600.0, 534 .socclk_mhz = 278.0, 535 .dscclk_mhz = 205.67, 536 .dram_speed_mts = 1600.0, 537 }, 538 { 539 .state = 2, 540 .dcfclk_mhz = 514.29, 541 .fabricclk_mhz = 933.0, 542 .dispclk_mhz = 757.89, 543 .dppclk_mhz = 685.71, 544 .phyclk_mhz = 600.0, 545 .socclk_mhz = 278.0, 546 .dscclk_mhz = 287.67, 547 .dram_speed_mts = 1866.0, 548 }, 549 { 550 .state = 3, 551 .dcfclk_mhz = 576.00, 552 .fabricclk_mhz = 1067.0, 553 .dispclk_mhz = 847.06, 554 .dppclk_mhz = 757.89, 555 .phyclk_mhz = 600.0, 556 .socclk_mhz = 715.0, 557 .dscclk_mhz = 318.334, 558 .dram_speed_mts = 2134.0, 559 }, 560 { 561 .state = 4, 562 .dcfclk_mhz = 626.09, 563 .fabricclk_mhz = 1200.0, 564 .dispclk_mhz = 900.00, 565 .dppclk_mhz = 847.06, 566 .phyclk_mhz = 810.0, 567 .socclk_mhz = 953.0, 568 .dscclk_mhz = 300.0, 569 .dram_speed_mts = 2400.0, 570 }, 571 { 572 .state = 5, 573 .dcfclk_mhz = 685.71, 574 .fabricclk_mhz = 1333.0, 575 .dispclk_mhz = 1028.57, 576 .dppclk_mhz = 960.00, 577 .phyclk_mhz = 810.0, 578 .socclk_mhz = 278.0, 579 .dscclk_mhz = 342.86, 580 .dram_speed_mts = 2666.0, 581 }, 582 { 583 .state = 6, 584 .dcfclk_mhz = 757.89, 585 .fabricclk_mhz = 1467.0, 586 .dispclk_mhz = 1107.69, 587 .dppclk_mhz = 1028.57, 588 .phyclk_mhz = 810.0, 589 .socclk_mhz = 715.0, 590 .dscclk_mhz = 369.23, 591 .dram_speed_mts = 3200.0, 592 }, 593 { 594 .state = 7, 595 .dcfclk_mhz = 847.06, 596 .fabricclk_mhz = 1600.0, 597 .dispclk_mhz = 1395.0, 598 .dppclk_mhz = 1285.00, 599 .phyclk_mhz = 1325.0, 600 .socclk_mhz = 953.0, 601 .dscclk_mhz = 489.0, 602 .dram_speed_mts = 4266.0, 603 }, 604 /*Extra state, no dispclk ramping*/ 605 { 606 .state = 8, 607 .dcfclk_mhz = 847.06, 608 .fabricclk_mhz = 1600.0, 609 .dispclk_mhz = 1395.0, 610 .dppclk_mhz = 1285.0, 611 .phyclk_mhz = 1325.0, 612 .socclk_mhz = 953.0, 613 .dscclk_mhz = 489.0, 614 .dram_speed_mts = 4266.0, 615 }, 616 617 }, 618 619 .sr_exit_time_us = 12.5, 620 .sr_enter_plus_exit_time_us = 17.0, 621 .urgent_latency_us = 4.0, 622 .urgent_latency_pixel_data_only_us = 4.0, 623 .urgent_latency_pixel_mixed_with_vm_data_us = 4.0, 624 .urgent_latency_vm_data_only_us = 4.0, 625 .urgent_out_of_order_return_per_channel_pixel_only_bytes = 4096, 626 .urgent_out_of_order_return_per_channel_pixel_and_vm_bytes = 4096, 627 .urgent_out_of_order_return_per_channel_vm_only_bytes = 4096, 628 .pct_ideal_dram_sdp_bw_after_urgent_pixel_only = 80.0, 629 .pct_ideal_dram_sdp_bw_after_urgent_pixel_and_vm = 75.0, 630 .pct_ideal_dram_sdp_bw_after_urgent_vm_only = 40.0, 631 .max_avg_sdp_bw_use_normal_percent = 60.0, 632 .max_avg_dram_bw_use_normal_percent = 100.0, 633 .writeback_latency_us = 12.0, 634 .max_request_size_bytes = 256, 635 .dram_channel_width_bytes = 4, 636 .fabric_datapath_to_dcn_data_return_bytes = 32, 637 .dcn_downspread_percent = 0.5, 638 .downspread_percent = 0.38, 639 .dram_page_open_time_ns = 50.0, 640 .dram_rw_turnaround_time_ns = 17.5, 641 .dram_return_buffer_per_channel_bytes = 8192, 642 .round_trip_ping_latency_dcfclk_cycles = 128, 643 .urgent_out_of_order_return_per_channel_bytes = 4096, 644 .channel_interleave_bytes = 256, 645 .num_banks = 8, 646 .num_chans = 4, 647 .vmm_page_size_bytes = 4096, 648 .dram_clock_change_latency_us = 23.84, 649 .return_bus_width_bytes = 64, 650 .dispclk_dppclk_vco_speed_mhz = 3600, 651 .xfc_bus_transport_time_us = 4, 652 .xfc_xbuf_latency_tolerance_us = 4, 653 .use_urgent_burst_bw = 1, 654 .num_states = 8 655 }; 656 657 struct wm_table ddr4_wm_table_gs = { 658 .entries = { 659 { 660 .wm_inst = WM_A, 661 .wm_type = WM_TYPE_PSTATE_CHG, 662 .pstate_latency_us = 11.72, 663 .sr_exit_time_us = 7.09, 664 .sr_enter_plus_exit_time_us = 8.14, 665 .valid = true, 666 }, 667 { 668 .wm_inst = WM_B, 669 .wm_type = WM_TYPE_PSTATE_CHG, 670 .pstate_latency_us = 11.72, 671 .sr_exit_time_us = 10.12, 672 .sr_enter_plus_exit_time_us = 11.48, 673 .valid = true, 674 }, 675 { 676 .wm_inst = WM_C, 677 .wm_type = WM_TYPE_PSTATE_CHG, 678 .pstate_latency_us = 11.72, 679 .sr_exit_time_us = 10.12, 680 .sr_enter_plus_exit_time_us = 11.48, 681 .valid = true, 682 }, 683 { 684 .wm_inst = WM_D, 685 .wm_type = WM_TYPE_PSTATE_CHG, 686 .pstate_latency_us = 11.72, 687 .sr_exit_time_us = 10.12, 688 .sr_enter_plus_exit_time_us = 11.48, 689 .valid = true, 690 }, 691 } 692 }; 693 694 struct wm_table lpddr4_wm_table_gs = { 695 .entries = { 696 { 697 .wm_inst = WM_A, 698 .wm_type = WM_TYPE_PSTATE_CHG, 699 .pstate_latency_us = 11.65333, 700 .sr_exit_time_us = 5.32, 701 .sr_enter_plus_exit_time_us = 6.38, 702 .valid = true, 703 }, 704 { 705 .wm_inst = WM_B, 706 .wm_type = WM_TYPE_PSTATE_CHG, 707 .pstate_latency_us = 11.65333, 708 .sr_exit_time_us = 9.82, 709 .sr_enter_plus_exit_time_us = 11.196, 710 .valid = true, 711 }, 712 { 713 .wm_inst = WM_C, 714 .wm_type = WM_TYPE_PSTATE_CHG, 715 .pstate_latency_us = 11.65333, 716 .sr_exit_time_us = 9.89, 717 .sr_enter_plus_exit_time_us = 11.24, 718 .valid = true, 719 }, 720 { 721 .wm_inst = WM_D, 722 .wm_type = WM_TYPE_PSTATE_CHG, 723 .pstate_latency_us = 11.65333, 724 .sr_exit_time_us = 9.748, 725 .sr_enter_plus_exit_time_us = 11.102, 726 .valid = true, 727 }, 728 } 729 }; 730 731 struct wm_table lpddr4_wm_table_with_disabled_ppt = { 732 .entries = { 733 { 734 .wm_inst = WM_A, 735 .wm_type = WM_TYPE_PSTATE_CHG, 736 .pstate_latency_us = 11.65333, 737 .sr_exit_time_us = 8.32, 738 .sr_enter_plus_exit_time_us = 9.38, 739 .valid = true, 740 }, 741 { 742 .wm_inst = WM_B, 743 .wm_type = WM_TYPE_PSTATE_CHG, 744 .pstate_latency_us = 11.65333, 745 .sr_exit_time_us = 9.82, 746 .sr_enter_plus_exit_time_us = 11.196, 747 .valid = true, 748 }, 749 { 750 .wm_inst = WM_C, 751 .wm_type = WM_TYPE_PSTATE_CHG, 752 .pstate_latency_us = 11.65333, 753 .sr_exit_time_us = 9.89, 754 .sr_enter_plus_exit_time_us = 11.24, 755 .valid = true, 756 }, 757 { 758 .wm_inst = WM_D, 759 .wm_type = WM_TYPE_PSTATE_CHG, 760 .pstate_latency_us = 11.65333, 761 .sr_exit_time_us = 9.748, 762 .sr_enter_plus_exit_time_us = 11.102, 763 .valid = true, 764 }, 765 } 766 }; 767 768 struct wm_table ddr4_wm_table_rn = { 769 .entries = { 770 { 771 .wm_inst = WM_A, 772 .wm_type = WM_TYPE_PSTATE_CHG, 773 .pstate_latency_us = 11.72, 774 .sr_exit_time_us = 11.90, 775 .sr_enter_plus_exit_time_us = 12.80, 776 .valid = true, 777 }, 778 { 779 .wm_inst = WM_B, 780 .wm_type = WM_TYPE_PSTATE_CHG, 781 .pstate_latency_us = 11.72, 782 .sr_exit_time_us = 13.18, 783 .sr_enter_plus_exit_time_us = 14.30, 784 .valid = true, 785 }, 786 { 787 .wm_inst = WM_C, 788 .wm_type = WM_TYPE_PSTATE_CHG, 789 .pstate_latency_us = 11.72, 790 .sr_exit_time_us = 13.18, 791 .sr_enter_plus_exit_time_us = 14.30, 792 .valid = true, 793 }, 794 { 795 .wm_inst = WM_D, 796 .wm_type = WM_TYPE_PSTATE_CHG, 797 .pstate_latency_us = 11.72, 798 .sr_exit_time_us = 13.18, 799 .sr_enter_plus_exit_time_us = 14.30, 800 .valid = true, 801 }, 802 } 803 }; 804 805 struct wm_table ddr4_1R_wm_table_rn = { 806 .entries = { 807 { 808 .wm_inst = WM_A, 809 .wm_type = WM_TYPE_PSTATE_CHG, 810 .pstate_latency_us = 11.72, 811 .sr_exit_time_us = 13.90, 812 .sr_enter_plus_exit_time_us = 14.80, 813 .valid = true, 814 }, 815 { 816 .wm_inst = WM_B, 817 .wm_type = WM_TYPE_PSTATE_CHG, 818 .pstate_latency_us = 11.72, 819 .sr_exit_time_us = 13.90, 820 .sr_enter_plus_exit_time_us = 14.80, 821 .valid = true, 822 }, 823 { 824 .wm_inst = WM_C, 825 .wm_type = WM_TYPE_PSTATE_CHG, 826 .pstate_latency_us = 11.72, 827 .sr_exit_time_us = 13.90, 828 .sr_enter_plus_exit_time_us = 14.80, 829 .valid = true, 830 }, 831 { 832 .wm_inst = WM_D, 833 .wm_type = WM_TYPE_PSTATE_CHG, 834 .pstate_latency_us = 11.72, 835 .sr_exit_time_us = 13.90, 836 .sr_enter_plus_exit_time_us = 14.80, 837 .valid = true, 838 }, 839 } 840 }; 841 842 struct wm_table lpddr4_wm_table_rn = { 843 .entries = { 844 { 845 .wm_inst = WM_A, 846 .wm_type = WM_TYPE_PSTATE_CHG, 847 .pstate_latency_us = 11.65333, 848 .sr_exit_time_us = 7.32, 849 .sr_enter_plus_exit_time_us = 8.38, 850 .valid = true, 851 }, 852 { 853 .wm_inst = WM_B, 854 .wm_type = WM_TYPE_PSTATE_CHG, 855 .pstate_latency_us = 11.65333, 856 .sr_exit_time_us = 9.82, 857 .sr_enter_plus_exit_time_us = 11.196, 858 .valid = true, 859 }, 860 { 861 .wm_inst = WM_C, 862 .wm_type = WM_TYPE_PSTATE_CHG, 863 .pstate_latency_us = 11.65333, 864 .sr_exit_time_us = 9.89, 865 .sr_enter_plus_exit_time_us = 11.24, 866 .valid = true, 867 }, 868 { 869 .wm_inst = WM_D, 870 .wm_type = WM_TYPE_PSTATE_CHG, 871 .pstate_latency_us = 11.65333, 872 .sr_exit_time_us = 9.748, 873 .sr_enter_plus_exit_time_us = 11.102, 874 .valid = true, 875 }, 876 } 877 }; 878 879 void dcn20_populate_dml_writeback_from_context(struct dc *dc, 880 struct resource_context *res_ctx, 881 display_e2e_pipe_params_st *pipes) 882 { 883 int pipe_cnt, i; 884 885 dc_assert_fp_enabled(); 886 887 for (i = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) { 888 struct dc_writeback_info *wb_info = &res_ctx->pipe_ctx[i].stream->writeback_info[0]; 889 890 if (!res_ctx->pipe_ctx[i].stream) 891 continue; 892 893 /* Set writeback information */ 894 pipes[pipe_cnt].dout.wb_enable = (wb_info->wb_enabled == true) ? 1 : 0; 895 pipes[pipe_cnt].dout.num_active_wb++; 896 pipes[pipe_cnt].dout.wb.wb_src_height = wb_info->dwb_params.cnv_params.crop_height; 897 pipes[pipe_cnt].dout.wb.wb_src_width = wb_info->dwb_params.cnv_params.crop_width; 898 pipes[pipe_cnt].dout.wb.wb_dst_width = wb_info->dwb_params.dest_width; 899 pipes[pipe_cnt].dout.wb.wb_dst_height = wb_info->dwb_params.dest_height; 900 pipes[pipe_cnt].dout.wb.wb_htaps_luma = 1; 901 pipes[pipe_cnt].dout.wb.wb_vtaps_luma = 1; 902 pipes[pipe_cnt].dout.wb.wb_htaps_chroma = wb_info->dwb_params.scaler_taps.h_taps_c; 903 pipes[pipe_cnt].dout.wb.wb_vtaps_chroma = wb_info->dwb_params.scaler_taps.v_taps_c; 904 pipes[pipe_cnt].dout.wb.wb_hratio = 1.0; 905 pipes[pipe_cnt].dout.wb.wb_vratio = 1.0; 906 if (wb_info->dwb_params.out_format == dwb_scaler_mode_yuv420) { 907 if (wb_info->dwb_params.output_depth == DWB_OUTPUT_PIXEL_DEPTH_8BPC) 908 pipes[pipe_cnt].dout.wb.wb_pixel_format = dm_420_8; 909 else 910 pipes[pipe_cnt].dout.wb.wb_pixel_format = dm_420_10; 911 } else { 912 pipes[pipe_cnt].dout.wb.wb_pixel_format = dm_444_32; 913 } 914 915 pipe_cnt++; 916 } 917 } 918 919 void dcn20_fpu_set_wb_arb_params(struct mcif_arb_params *wb_arb_params, 920 struct dc_state *context, 921 display_e2e_pipe_params_st *pipes, 922 int pipe_cnt, int i) 923 { 924 int k; 925 926 dc_assert_fp_enabled(); 927 928 for (k = 0; k < sizeof(wb_arb_params->cli_watermark)/sizeof(wb_arb_params->cli_watermark[0]); k++) { 929 wb_arb_params->cli_watermark[k] = get_wm_writeback_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 930 wb_arb_params->pstate_watermark[k] = get_wm_writeback_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 931 } 932 wb_arb_params->time_per_pixel = 16.0 * 1000 / (context->res_ctx.pipe_ctx[i].stream->phy_pix_clk / 1000); /* 4 bit fraction, ms */ 933 } 934 935 static bool is_dtbclk_required(struct dc *dc, struct dc_state *context) 936 { 937 int i; 938 for (i = 0; i < dc->res_pool->pipe_count; i++) { 939 if (!context->res_ctx.pipe_ctx[i].stream) 940 continue; 941 if (is_dp_128b_132b_signal(&context->res_ctx.pipe_ctx[i])) 942 return true; 943 } 944 return false; 945 } 946 947 static enum dcn_zstate_support_state decide_zstate_support(struct dc *dc, struct dc_state *context) 948 { 949 int plane_count; 950 int i; 951 unsigned int optimized_min_dst_y_next_start_us; 952 bool allow_z8 = context->bw_ctx.dml.vba.StutterPeriod > 1000.0; 953 954 plane_count = 0; 955 optimized_min_dst_y_next_start_us = 0; 956 for (i = 0; i < dc->res_pool->pipe_count; i++) { 957 if (context->res_ctx.pipe_ctx[i].plane_state) 958 plane_count++; 959 } 960 961 /* 962 * Z9 and Z10 allowed cases: 963 * 1. 0 Planes enabled 964 * 2. single eDP, on link 0, 1 plane and stutter period > 5ms 965 * Z10 only cases: 966 * 1. single eDP, on link 0, 1 plane and stutter period >= 5ms 967 * Z8 cases: 968 * 1. stutter period sufficient 969 * Zstate not allowed cases: 970 * 1. Everything else 971 */ 972 if (plane_count == 0) 973 return DCN_ZSTATE_SUPPORT_ALLOW; 974 else if (context->stream_count == 1 && context->streams[0]->signal == SIGNAL_TYPE_EDP) { 975 struct dc_link *link = context->streams[0]->sink->link; 976 struct dc_stream_status *stream_status = &context->stream_status[0]; 977 978 if (dc_extended_blank_supported(dc)) { 979 for (i = 0; i < dc->res_pool->pipe_count; i++) { 980 if (context->res_ctx.pipe_ctx[i].stream == context->streams[0] 981 && context->res_ctx.pipe_ctx[i].stream->adjust.v_total_min == context->res_ctx.pipe_ctx[i].stream->adjust.v_total_max 982 && context->res_ctx.pipe_ctx[i].stream->adjust.v_total_min > context->res_ctx.pipe_ctx[i].stream->timing.v_total) { 983 optimized_min_dst_y_next_start_us = 984 context->res_ctx.pipe_ctx[i].dlg_regs.optimized_min_dst_y_next_start_us; 985 break; 986 } 987 } 988 } 989 /* zstate only supported on PWRSEQ0 and when there's <2 planes*/ 990 if (link->link_index != 0 || stream_status->plane_count > 1) 991 return DCN_ZSTATE_SUPPORT_DISALLOW; 992 993 if (context->bw_ctx.dml.vba.StutterPeriod > 5000.0 || optimized_min_dst_y_next_start_us > 5000) 994 return DCN_ZSTATE_SUPPORT_ALLOW; 995 else if (link->psr_settings.psr_version == DC_PSR_VERSION_1 && !link->panel_config.psr.disable_psr) 996 return allow_z8 ? DCN_ZSTATE_SUPPORT_ALLOW_Z8_Z10_ONLY : DCN_ZSTATE_SUPPORT_ALLOW_Z10_ONLY; 997 else 998 return allow_z8 ? DCN_ZSTATE_SUPPORT_ALLOW_Z8_ONLY : DCN_ZSTATE_SUPPORT_DISALLOW; 999 } else if (allow_z8) { 1000 return DCN_ZSTATE_SUPPORT_ALLOW_Z8_ONLY; 1001 } else { 1002 return DCN_ZSTATE_SUPPORT_DISALLOW; 1003 } 1004 } 1005 1006 void dcn20_calculate_dlg_params( 1007 struct dc *dc, struct dc_state *context, 1008 display_e2e_pipe_params_st *pipes, 1009 int pipe_cnt, 1010 int vlevel) 1011 { 1012 int i, pipe_idx; 1013 1014 dc_assert_fp_enabled(); 1015 1016 /* Writeback MCIF_WB arbitration parameters */ 1017 dc->res_pool->funcs->set_mcif_arb_params(dc, context, pipes, pipe_cnt); 1018 1019 context->bw_ctx.bw.dcn.clk.dispclk_khz = context->bw_ctx.dml.vba.DISPCLK * 1000; 1020 context->bw_ctx.bw.dcn.clk.dcfclk_khz = context->bw_ctx.dml.vba.DCFCLK * 1000; 1021 context->bw_ctx.bw.dcn.clk.socclk_khz = context->bw_ctx.dml.vba.SOCCLK * 1000; 1022 context->bw_ctx.bw.dcn.clk.dramclk_khz = context->bw_ctx.dml.vba.DRAMSpeed * 1000 / 16; 1023 1024 if (dc->debug.min_dram_clk_khz > context->bw_ctx.bw.dcn.clk.dramclk_khz) 1025 context->bw_ctx.bw.dcn.clk.dramclk_khz = dc->debug.min_dram_clk_khz; 1026 1027 context->bw_ctx.bw.dcn.clk.dcfclk_deep_sleep_khz = context->bw_ctx.dml.vba.DCFCLKDeepSleep * 1000; 1028 context->bw_ctx.bw.dcn.clk.fclk_khz = context->bw_ctx.dml.vba.FabricClock * 1000; 1029 context->bw_ctx.bw.dcn.clk.p_state_change_support = 1030 context->bw_ctx.dml.vba.DRAMClockChangeSupport[vlevel][context->bw_ctx.dml.vba.maxMpcComb] 1031 != dm_dram_clock_change_unsupported; 1032 1033 /* Pstate change might not be supported by hardware, but it might be 1034 * possible with firmware driven vertical blank stretching. 1035 */ 1036 context->bw_ctx.bw.dcn.clk.p_state_change_support |= context->bw_ctx.bw.dcn.clk.fw_based_mclk_switching; 1037 1038 context->bw_ctx.bw.dcn.clk.dppclk_khz = 0; 1039 1040 context->bw_ctx.bw.dcn.clk.dtbclk_en = is_dtbclk_required(dc, context); 1041 1042 if (context->bw_ctx.bw.dcn.clk.dispclk_khz < dc->debug.min_disp_clk_khz) 1043 context->bw_ctx.bw.dcn.clk.dispclk_khz = dc->debug.min_disp_clk_khz; 1044 1045 for (i = 0, pipe_idx = 0; i < dc->res_pool->pipe_count; i++) { 1046 if (!context->res_ctx.pipe_ctx[i].stream) 1047 continue; 1048 pipes[pipe_idx].pipe.dest.vstartup_start = get_vstartup(&context->bw_ctx.dml, pipes, pipe_cnt, pipe_idx); 1049 pipes[pipe_idx].pipe.dest.vupdate_offset = get_vupdate_offset(&context->bw_ctx.dml, pipes, pipe_cnt, pipe_idx); 1050 pipes[pipe_idx].pipe.dest.vupdate_width = get_vupdate_width(&context->bw_ctx.dml, pipes, pipe_cnt, pipe_idx); 1051 pipes[pipe_idx].pipe.dest.vready_offset = get_vready_offset(&context->bw_ctx.dml, pipes, pipe_cnt, pipe_idx); 1052 if (context->res_ctx.pipe_ctx[i].stream->mall_stream_config.type == SUBVP_PHANTOM) { 1053 // Phantom pipe requires that DET_SIZE = 0 and no unbounded requests 1054 context->res_ctx.pipe_ctx[i].det_buffer_size_kb = 0; 1055 context->res_ctx.pipe_ctx[i].unbounded_req = false; 1056 } else { 1057 context->res_ctx.pipe_ctx[i].det_buffer_size_kb = context->bw_ctx.dml.ip.det_buffer_size_kbytes; 1058 context->res_ctx.pipe_ctx[i].unbounded_req = pipes[pipe_idx].pipe.src.unbounded_req_mode; 1059 } 1060 if (context->bw_ctx.bw.dcn.clk.dppclk_khz < pipes[pipe_idx].clks_cfg.dppclk_mhz * 1000) 1061 context->bw_ctx.bw.dcn.clk.dppclk_khz = pipes[pipe_idx].clks_cfg.dppclk_mhz * 1000; 1062 context->res_ctx.pipe_ctx[i].plane_res.bw.dppclk_khz = 1063 pipes[pipe_idx].clks_cfg.dppclk_mhz * 1000; 1064 context->res_ctx.pipe_ctx[i].pipe_dlg_param = pipes[pipe_idx].pipe.dest; 1065 pipe_idx++; 1066 } 1067 /*save a original dppclock copy*/ 1068 context->bw_ctx.bw.dcn.clk.bw_dppclk_khz = context->bw_ctx.bw.dcn.clk.dppclk_khz; 1069 context->bw_ctx.bw.dcn.clk.bw_dispclk_khz = context->bw_ctx.bw.dcn.clk.dispclk_khz; 1070 context->bw_ctx.bw.dcn.clk.max_supported_dppclk_khz = context->bw_ctx.dml.soc.clock_limits[vlevel].dppclk_mhz * 1000; 1071 context->bw_ctx.bw.dcn.clk.max_supported_dispclk_khz = context->bw_ctx.dml.soc.clock_limits[vlevel].dispclk_mhz * 1000; 1072 1073 context->bw_ctx.bw.dcn.compbuf_size_kb = context->bw_ctx.dml.ip.config_return_buffer_size_in_kbytes 1074 - context->bw_ctx.dml.ip.det_buffer_size_kbytes * pipe_idx; 1075 1076 for (i = 0, pipe_idx = 0; i < dc->res_pool->pipe_count; i++) { 1077 bool cstate_en = context->bw_ctx.dml.vba.PrefetchMode[vlevel][context->bw_ctx.dml.vba.maxMpcComb] != 2; 1078 1079 if (!context->res_ctx.pipe_ctx[i].stream) 1080 continue; 1081 1082 if (dc->ctx->dce_version == DCN_VERSION_2_01) 1083 cstate_en = false; 1084 1085 context->bw_ctx.dml.funcs.rq_dlg_get_dlg_reg(&context->bw_ctx.dml, 1086 &context->res_ctx.pipe_ctx[i].dlg_regs, 1087 &context->res_ctx.pipe_ctx[i].ttu_regs, 1088 pipes, 1089 pipe_cnt, 1090 pipe_idx, 1091 cstate_en, 1092 context->bw_ctx.bw.dcn.clk.p_state_change_support, 1093 false, false, true); 1094 1095 context->bw_ctx.dml.funcs.rq_dlg_get_rq_reg(&context->bw_ctx.dml, 1096 &context->res_ctx.pipe_ctx[i].rq_regs, 1097 &pipes[pipe_idx].pipe); 1098 pipe_idx++; 1099 } 1100 context->bw_ctx.bw.dcn.clk.zstate_support = decide_zstate_support(dc, context); 1101 } 1102 1103 static void swizzle_to_dml_params( 1104 enum swizzle_mode_values swizzle, 1105 unsigned int *sw_mode) 1106 { 1107 switch (swizzle) { 1108 case DC_SW_LINEAR: 1109 *sw_mode = dm_sw_linear; 1110 break; 1111 case DC_SW_4KB_S: 1112 *sw_mode = dm_sw_4kb_s; 1113 break; 1114 case DC_SW_4KB_S_X: 1115 *sw_mode = dm_sw_4kb_s_x; 1116 break; 1117 case DC_SW_4KB_D: 1118 *sw_mode = dm_sw_4kb_d; 1119 break; 1120 case DC_SW_4KB_D_X: 1121 *sw_mode = dm_sw_4kb_d_x; 1122 break; 1123 case DC_SW_64KB_S: 1124 *sw_mode = dm_sw_64kb_s; 1125 break; 1126 case DC_SW_64KB_S_X: 1127 *sw_mode = dm_sw_64kb_s_x; 1128 break; 1129 case DC_SW_64KB_S_T: 1130 *sw_mode = dm_sw_64kb_s_t; 1131 break; 1132 case DC_SW_64KB_D: 1133 *sw_mode = dm_sw_64kb_d; 1134 break; 1135 case DC_SW_64KB_D_X: 1136 *sw_mode = dm_sw_64kb_d_x; 1137 break; 1138 case DC_SW_64KB_D_T: 1139 *sw_mode = dm_sw_64kb_d_t; 1140 break; 1141 case DC_SW_64KB_R_X: 1142 *sw_mode = dm_sw_64kb_r_x; 1143 break; 1144 case DC_SW_VAR_S: 1145 *sw_mode = dm_sw_var_s; 1146 break; 1147 case DC_SW_VAR_S_X: 1148 *sw_mode = dm_sw_var_s_x; 1149 break; 1150 case DC_SW_VAR_D: 1151 *sw_mode = dm_sw_var_d; 1152 break; 1153 case DC_SW_VAR_D_X: 1154 *sw_mode = dm_sw_var_d_x; 1155 break; 1156 case DC_SW_VAR_R_X: 1157 *sw_mode = dm_sw_var_r_x; 1158 break; 1159 default: 1160 ASSERT(0); /* Not supported */ 1161 break; 1162 } 1163 } 1164 1165 int dcn20_populate_dml_pipes_from_context( 1166 struct dc *dc, 1167 struct dc_state *context, 1168 display_e2e_pipe_params_st *pipes, 1169 bool fast_validate) 1170 { 1171 int pipe_cnt, i; 1172 bool synchronized_vblank = true; 1173 struct resource_context *res_ctx = &context->res_ctx; 1174 1175 dc_assert_fp_enabled(); 1176 1177 for (i = 0, pipe_cnt = -1; i < dc->res_pool->pipe_count; i++) { 1178 if (!res_ctx->pipe_ctx[i].stream) 1179 continue; 1180 1181 if (pipe_cnt < 0) { 1182 pipe_cnt = i; 1183 continue; 1184 } 1185 1186 if (res_ctx->pipe_ctx[pipe_cnt].stream == res_ctx->pipe_ctx[i].stream) 1187 continue; 1188 1189 if (dc->debug.disable_timing_sync || 1190 (!resource_are_streams_timing_synchronizable( 1191 res_ctx->pipe_ctx[pipe_cnt].stream, 1192 res_ctx->pipe_ctx[i].stream) && 1193 !resource_are_vblanks_synchronizable( 1194 res_ctx->pipe_ctx[pipe_cnt].stream, 1195 res_ctx->pipe_ctx[i].stream))) { 1196 synchronized_vblank = false; 1197 break; 1198 } 1199 } 1200 1201 for (i = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) { 1202 struct dc_crtc_timing *timing = &res_ctx->pipe_ctx[i].stream->timing; 1203 unsigned int v_total; 1204 unsigned int front_porch; 1205 int output_bpc; 1206 struct audio_check aud_check = {0}; 1207 1208 if (!res_ctx->pipe_ctx[i].stream) 1209 continue; 1210 1211 v_total = timing->v_total; 1212 front_porch = timing->v_front_porch; 1213 1214 /* todo: 1215 pipes[pipe_cnt].pipe.src.dynamic_metadata_enable = 0; 1216 pipes[pipe_cnt].pipe.src.dcc = 0; 1217 pipes[pipe_cnt].pipe.src.vm = 0;*/ 1218 1219 pipes[pipe_cnt].clks_cfg.refclk_mhz = dc->res_pool->ref_clocks.dchub_ref_clock_inKhz / 1000.0; 1220 1221 pipes[pipe_cnt].dout.dsc_enable = res_ctx->pipe_ctx[i].stream->timing.flags.DSC; 1222 /* todo: rotation?*/ 1223 pipes[pipe_cnt].dout.dsc_slices = res_ctx->pipe_ctx[i].stream->timing.dsc_cfg.num_slices_h; 1224 if (res_ctx->pipe_ctx[i].stream->use_dynamic_meta) { 1225 pipes[pipe_cnt].pipe.src.dynamic_metadata_enable = true; 1226 /* 1/2 vblank */ 1227 pipes[pipe_cnt].pipe.src.dynamic_metadata_lines_before_active = 1228 (v_total - timing->v_addressable 1229 - timing->v_border_top - timing->v_border_bottom) / 2; 1230 /* 36 bytes dp, 32 hdmi */ 1231 pipes[pipe_cnt].pipe.src.dynamic_metadata_xmit_bytes = 1232 dc_is_dp_signal(res_ctx->pipe_ctx[i].stream->signal) ? 36 : 32; 1233 } 1234 pipes[pipe_cnt].pipe.src.dcc = false; 1235 pipes[pipe_cnt].pipe.src.dcc_rate = 1; 1236 pipes[pipe_cnt].pipe.dest.synchronized_vblank_all_planes = synchronized_vblank; 1237 pipes[pipe_cnt].pipe.dest.synchronize_timings = synchronized_vblank; 1238 pipes[pipe_cnt].pipe.dest.hblank_start = timing->h_total - timing->h_front_porch; 1239 pipes[pipe_cnt].pipe.dest.hblank_end = pipes[pipe_cnt].pipe.dest.hblank_start 1240 - timing->h_addressable 1241 - timing->h_border_left 1242 - timing->h_border_right; 1243 pipes[pipe_cnt].pipe.dest.vblank_start = v_total - front_porch; 1244 pipes[pipe_cnt].pipe.dest.vblank_end = pipes[pipe_cnt].pipe.dest.vblank_start 1245 - timing->v_addressable 1246 - timing->v_border_top 1247 - timing->v_border_bottom; 1248 pipes[pipe_cnt].pipe.dest.htotal = timing->h_total; 1249 pipes[pipe_cnt].pipe.dest.vtotal = v_total; 1250 pipes[pipe_cnt].pipe.dest.hactive = 1251 timing->h_addressable + timing->h_border_left + timing->h_border_right; 1252 pipes[pipe_cnt].pipe.dest.vactive = 1253 timing->v_addressable + timing->v_border_top + timing->v_border_bottom; 1254 pipes[pipe_cnt].pipe.dest.interlaced = timing->flags.INTERLACE; 1255 pipes[pipe_cnt].pipe.dest.pixel_rate_mhz = timing->pix_clk_100hz/10000.0; 1256 if (timing->timing_3d_format == TIMING_3D_FORMAT_HW_FRAME_PACKING) 1257 pipes[pipe_cnt].pipe.dest.pixel_rate_mhz *= 2; 1258 pipes[pipe_cnt].pipe.dest.otg_inst = res_ctx->pipe_ctx[i].stream_res.tg->inst; 1259 pipes[pipe_cnt].dout.dp_lanes = 4; 1260 if (res_ctx->pipe_ctx[i].stream->link) 1261 pipes[pipe_cnt].dout.dp_rate = dm_dp_rate_na; 1262 pipes[pipe_cnt].dout.is_virtual = 0; 1263 pipes[pipe_cnt].pipe.dest.vtotal_min = res_ctx->pipe_ctx[i].stream->adjust.v_total_min; 1264 pipes[pipe_cnt].pipe.dest.vtotal_max = res_ctx->pipe_ctx[i].stream->adjust.v_total_max; 1265 switch (get_num_odm_splits(&res_ctx->pipe_ctx[i])) { 1266 case 1: 1267 pipes[pipe_cnt].pipe.dest.odm_combine = dm_odm_combine_mode_2to1; 1268 break; 1269 case 3: 1270 pipes[pipe_cnt].pipe.dest.odm_combine = dm_odm_combine_mode_4to1; 1271 break; 1272 default: 1273 pipes[pipe_cnt].pipe.dest.odm_combine = dm_odm_combine_mode_disabled; 1274 } 1275 pipes[pipe_cnt].pipe.src.hsplit_grp = res_ctx->pipe_ctx[i].pipe_idx; 1276 if (res_ctx->pipe_ctx[i].top_pipe && res_ctx->pipe_ctx[i].top_pipe->plane_state 1277 == res_ctx->pipe_ctx[i].plane_state) { 1278 struct pipe_ctx *first_pipe = res_ctx->pipe_ctx[i].top_pipe; 1279 int split_idx = 0; 1280 1281 while (first_pipe->top_pipe && first_pipe->top_pipe->plane_state 1282 == res_ctx->pipe_ctx[i].plane_state) { 1283 first_pipe = first_pipe->top_pipe; 1284 split_idx++; 1285 } 1286 /* Treat 4to1 mpc combine as an mpo of 2 2-to-1 combines */ 1287 if (split_idx == 0) 1288 pipes[pipe_cnt].pipe.src.hsplit_grp = first_pipe->pipe_idx; 1289 else if (split_idx == 1) 1290 pipes[pipe_cnt].pipe.src.hsplit_grp = res_ctx->pipe_ctx[i].pipe_idx; 1291 else if (split_idx == 2) 1292 pipes[pipe_cnt].pipe.src.hsplit_grp = res_ctx->pipe_ctx[i].top_pipe->pipe_idx; 1293 } else if (res_ctx->pipe_ctx[i].prev_odm_pipe) { 1294 struct pipe_ctx *first_pipe = res_ctx->pipe_ctx[i].prev_odm_pipe; 1295 1296 while (first_pipe->prev_odm_pipe) 1297 first_pipe = first_pipe->prev_odm_pipe; 1298 pipes[pipe_cnt].pipe.src.hsplit_grp = first_pipe->pipe_idx; 1299 } 1300 1301 switch (res_ctx->pipe_ctx[i].stream->signal) { 1302 case SIGNAL_TYPE_DISPLAY_PORT_MST: 1303 case SIGNAL_TYPE_DISPLAY_PORT: 1304 pipes[pipe_cnt].dout.output_type = dm_dp; 1305 if (is_dp_128b_132b_signal(&res_ctx->pipe_ctx[i])) 1306 pipes[pipe_cnt].dout.output_type = dm_dp2p0; 1307 break; 1308 case SIGNAL_TYPE_EDP: 1309 pipes[pipe_cnt].dout.output_type = dm_edp; 1310 break; 1311 case SIGNAL_TYPE_HDMI_TYPE_A: 1312 case SIGNAL_TYPE_DVI_SINGLE_LINK: 1313 case SIGNAL_TYPE_DVI_DUAL_LINK: 1314 pipes[pipe_cnt].dout.output_type = dm_hdmi; 1315 break; 1316 default: 1317 /* In case there is no signal, set dp with 4 lanes to allow max config */ 1318 pipes[pipe_cnt].dout.is_virtual = 1; 1319 pipes[pipe_cnt].dout.output_type = dm_dp; 1320 pipes[pipe_cnt].dout.dp_lanes = 4; 1321 pipes[pipe_cnt].dout.dp_rate = dm_dp_rate_hbr2; 1322 } 1323 1324 switch (res_ctx->pipe_ctx[i].stream->timing.display_color_depth) { 1325 case COLOR_DEPTH_666: 1326 output_bpc = 6; 1327 break; 1328 case COLOR_DEPTH_888: 1329 output_bpc = 8; 1330 break; 1331 case COLOR_DEPTH_101010: 1332 output_bpc = 10; 1333 break; 1334 case COLOR_DEPTH_121212: 1335 output_bpc = 12; 1336 break; 1337 case COLOR_DEPTH_141414: 1338 output_bpc = 14; 1339 break; 1340 case COLOR_DEPTH_161616: 1341 output_bpc = 16; 1342 break; 1343 case COLOR_DEPTH_999: 1344 output_bpc = 9; 1345 break; 1346 case COLOR_DEPTH_111111: 1347 output_bpc = 11; 1348 break; 1349 default: 1350 output_bpc = 8; 1351 break; 1352 } 1353 1354 switch (res_ctx->pipe_ctx[i].stream->timing.pixel_encoding) { 1355 case PIXEL_ENCODING_RGB: 1356 case PIXEL_ENCODING_YCBCR444: 1357 pipes[pipe_cnt].dout.output_format = dm_444; 1358 pipes[pipe_cnt].dout.output_bpp = output_bpc * 3; 1359 break; 1360 case PIXEL_ENCODING_YCBCR420: 1361 pipes[pipe_cnt].dout.output_format = dm_420; 1362 pipes[pipe_cnt].dout.output_bpp = (output_bpc * 3.0) / 2; 1363 break; 1364 case PIXEL_ENCODING_YCBCR422: 1365 if (res_ctx->pipe_ctx[i].stream->timing.flags.DSC && 1366 !res_ctx->pipe_ctx[i].stream->timing.dsc_cfg.ycbcr422_simple) 1367 pipes[pipe_cnt].dout.output_format = dm_n422; 1368 else 1369 pipes[pipe_cnt].dout.output_format = dm_s422; 1370 pipes[pipe_cnt].dout.output_bpp = output_bpc * 2; 1371 break; 1372 default: 1373 pipes[pipe_cnt].dout.output_format = dm_444; 1374 pipes[pipe_cnt].dout.output_bpp = output_bpc * 3; 1375 } 1376 1377 if (res_ctx->pipe_ctx[i].stream->timing.flags.DSC) 1378 pipes[pipe_cnt].dout.output_bpp = res_ctx->pipe_ctx[i].stream->timing.dsc_cfg.bits_per_pixel / 16.0; 1379 1380 /* todo: default max for now, until there is logic reflecting this in dc*/ 1381 pipes[pipe_cnt].dout.dsc_input_bpc = 12; 1382 /*fill up the audio sample rate (unit in kHz)*/ 1383 get_audio_check(&res_ctx->pipe_ctx[i].stream->audio_info, &aud_check); 1384 pipes[pipe_cnt].dout.max_audio_sample_rate = aud_check.max_audiosample_rate / 1000; 1385 /* 1386 * For graphic plane, cursor number is 1, nv12 is 0 1387 * bw calculations due to cursor on/off 1388 */ 1389 if (res_ctx->pipe_ctx[i].plane_state && 1390 (res_ctx->pipe_ctx[i].plane_state->address.type == PLN_ADDR_TYPE_VIDEO_PROGRESSIVE || 1391 res_ctx->pipe_ctx[i].stream->mall_stream_config.type == SUBVP_PHANTOM)) 1392 pipes[pipe_cnt].pipe.src.num_cursors = 0; 1393 else 1394 pipes[pipe_cnt].pipe.src.num_cursors = dc->dml.ip.number_of_cursors; 1395 1396 pipes[pipe_cnt].pipe.src.cur0_src_width = 256; 1397 pipes[pipe_cnt].pipe.src.cur0_bpp = dm_cur_32bit; 1398 1399 if (!res_ctx->pipe_ctx[i].plane_state) { 1400 pipes[pipe_cnt].pipe.src.is_hsplit = pipes[pipe_cnt].pipe.dest.odm_combine != dm_odm_combine_mode_disabled; 1401 pipes[pipe_cnt].pipe.src.source_scan = dm_horz; 1402 pipes[pipe_cnt].pipe.src.source_rotation = dm_rotation_0; 1403 pipes[pipe_cnt].pipe.src.sw_mode = dm_sw_4kb_s; 1404 pipes[pipe_cnt].pipe.src.macro_tile_size = dm_64k_tile; 1405 pipes[pipe_cnt].pipe.src.viewport_width = timing->h_addressable; 1406 if (pipes[pipe_cnt].pipe.src.viewport_width > 1920) 1407 pipes[pipe_cnt].pipe.src.viewport_width = 1920; 1408 pipes[pipe_cnt].pipe.src.viewport_height = timing->v_addressable; 1409 if (pipes[pipe_cnt].pipe.src.viewport_height > 1080) 1410 pipes[pipe_cnt].pipe.src.viewport_height = 1080; 1411 pipes[pipe_cnt].pipe.src.surface_height_y = pipes[pipe_cnt].pipe.src.viewport_height; 1412 pipes[pipe_cnt].pipe.src.surface_width_y = pipes[pipe_cnt].pipe.src.viewport_width; 1413 pipes[pipe_cnt].pipe.src.surface_height_c = pipes[pipe_cnt].pipe.src.viewport_height; 1414 pipes[pipe_cnt].pipe.src.surface_width_c = pipes[pipe_cnt].pipe.src.viewport_width; 1415 pipes[pipe_cnt].pipe.src.data_pitch = ((pipes[pipe_cnt].pipe.src.viewport_width + 255) / 256) * 256; 1416 pipes[pipe_cnt].pipe.src.source_format = dm_444_32; 1417 pipes[pipe_cnt].pipe.dest.recout_width = pipes[pipe_cnt].pipe.src.viewport_width; /*vp_width/hratio*/ 1418 pipes[pipe_cnt].pipe.dest.recout_height = pipes[pipe_cnt].pipe.src.viewport_height; /*vp_height/vratio*/ 1419 pipes[pipe_cnt].pipe.dest.full_recout_width = pipes[pipe_cnt].pipe.dest.recout_width; /*when is_hsplit != 1*/ 1420 pipes[pipe_cnt].pipe.dest.full_recout_height = pipes[pipe_cnt].pipe.dest.recout_height; /*when is_hsplit != 1*/ 1421 pipes[pipe_cnt].pipe.scale_ratio_depth.lb_depth = dm_lb_16; 1422 pipes[pipe_cnt].pipe.scale_ratio_depth.hscl_ratio = 1.0; 1423 pipes[pipe_cnt].pipe.scale_ratio_depth.vscl_ratio = 1.0; 1424 pipes[pipe_cnt].pipe.scale_ratio_depth.scl_enable = 0; /*Lb only or Full scl*/ 1425 pipes[pipe_cnt].pipe.scale_taps.htaps = 1; 1426 pipes[pipe_cnt].pipe.scale_taps.vtaps = 1; 1427 pipes[pipe_cnt].pipe.dest.vtotal_min = v_total; 1428 pipes[pipe_cnt].pipe.dest.vtotal_max = v_total; 1429 1430 if (pipes[pipe_cnt].pipe.dest.odm_combine == dm_odm_combine_mode_2to1) { 1431 pipes[pipe_cnt].pipe.src.viewport_width /= 2; 1432 pipes[pipe_cnt].pipe.dest.recout_width /= 2; 1433 } else if (pipes[pipe_cnt].pipe.dest.odm_combine == dm_odm_combine_mode_4to1) { 1434 pipes[pipe_cnt].pipe.src.viewport_width /= 4; 1435 pipes[pipe_cnt].pipe.dest.recout_width /= 4; 1436 } 1437 } else { 1438 struct dc_plane_state *pln = res_ctx->pipe_ctx[i].plane_state; 1439 struct scaler_data *scl = &res_ctx->pipe_ctx[i].plane_res.scl_data; 1440 1441 pipes[pipe_cnt].pipe.src.immediate_flip = pln->flip_immediate; 1442 pipes[pipe_cnt].pipe.src.is_hsplit = (res_ctx->pipe_ctx[i].bottom_pipe && res_ctx->pipe_ctx[i].bottom_pipe->plane_state == pln) 1443 || (res_ctx->pipe_ctx[i].top_pipe && res_ctx->pipe_ctx[i].top_pipe->plane_state == pln) 1444 || pipes[pipe_cnt].pipe.dest.odm_combine != dm_odm_combine_mode_disabled; 1445 1446 /* stereo is not split */ 1447 if (pln->stereo_format == PLANE_STEREO_FORMAT_SIDE_BY_SIDE || 1448 pln->stereo_format == PLANE_STEREO_FORMAT_TOP_AND_BOTTOM) { 1449 pipes[pipe_cnt].pipe.src.is_hsplit = false; 1450 pipes[pipe_cnt].pipe.src.hsplit_grp = res_ctx->pipe_ctx[i].pipe_idx; 1451 } 1452 1453 pipes[pipe_cnt].pipe.src.source_scan = pln->rotation == ROTATION_ANGLE_90 1454 || pln->rotation == ROTATION_ANGLE_270 ? dm_vert : dm_horz; 1455 switch (pln->rotation) { 1456 case ROTATION_ANGLE_0: 1457 pipes[pipe_cnt].pipe.src.source_rotation = dm_rotation_0; 1458 break; 1459 case ROTATION_ANGLE_90: 1460 pipes[pipe_cnt].pipe.src.source_rotation = dm_rotation_90; 1461 break; 1462 case ROTATION_ANGLE_180: 1463 pipes[pipe_cnt].pipe.src.source_rotation = dm_rotation_180; 1464 break; 1465 case ROTATION_ANGLE_270: 1466 pipes[pipe_cnt].pipe.src.source_rotation = dm_rotation_270; 1467 break; 1468 default: 1469 break; 1470 } 1471 pipes[pipe_cnt].pipe.src.viewport_y_y = scl->viewport.y; 1472 pipes[pipe_cnt].pipe.src.viewport_y_c = scl->viewport_c.y; 1473 pipes[pipe_cnt].pipe.src.viewport_x_y = scl->viewport.x; 1474 pipes[pipe_cnt].pipe.src.viewport_x_c = scl->viewport_c.x; 1475 pipes[pipe_cnt].pipe.src.viewport_width = scl->viewport.width; 1476 pipes[pipe_cnt].pipe.src.viewport_width_c = scl->viewport_c.width; 1477 pipes[pipe_cnt].pipe.src.viewport_height = scl->viewport.height; 1478 pipes[pipe_cnt].pipe.src.viewport_height_c = scl->viewport_c.height; 1479 pipes[pipe_cnt].pipe.src.viewport_width_max = pln->src_rect.width; 1480 pipes[pipe_cnt].pipe.src.viewport_height_max = pln->src_rect.height; 1481 pipes[pipe_cnt].pipe.src.surface_width_y = pln->plane_size.surface_size.width; 1482 pipes[pipe_cnt].pipe.src.surface_height_y = pln->plane_size.surface_size.height; 1483 pipes[pipe_cnt].pipe.src.surface_width_c = pln->plane_size.chroma_size.width; 1484 pipes[pipe_cnt].pipe.src.surface_height_c = pln->plane_size.chroma_size.height; 1485 if (pln->format == SURFACE_PIXEL_FORMAT_GRPH_RGBE_ALPHA 1486 || pln->format >= SURFACE_PIXEL_FORMAT_VIDEO_BEGIN) { 1487 pipes[pipe_cnt].pipe.src.data_pitch = pln->plane_size.surface_pitch; 1488 pipes[pipe_cnt].pipe.src.data_pitch_c = pln->plane_size.chroma_pitch; 1489 pipes[pipe_cnt].pipe.src.meta_pitch = pln->dcc.meta_pitch; 1490 pipes[pipe_cnt].pipe.src.meta_pitch_c = pln->dcc.meta_pitch_c; 1491 } else { 1492 pipes[pipe_cnt].pipe.src.data_pitch = pln->plane_size.surface_pitch; 1493 pipes[pipe_cnt].pipe.src.meta_pitch = pln->dcc.meta_pitch; 1494 } 1495 pipes[pipe_cnt].pipe.src.dcc = pln->dcc.enable; 1496 pipes[pipe_cnt].pipe.dest.recout_width = scl->recout.width; 1497 pipes[pipe_cnt].pipe.dest.recout_height = scl->recout.height; 1498 pipes[pipe_cnt].pipe.dest.full_recout_height = scl->recout.height; 1499 pipes[pipe_cnt].pipe.dest.full_recout_width = scl->recout.width; 1500 if (pipes[pipe_cnt].pipe.dest.odm_combine == dm_odm_combine_mode_2to1) 1501 pipes[pipe_cnt].pipe.dest.full_recout_width *= 2; 1502 else if (pipes[pipe_cnt].pipe.dest.odm_combine == dm_odm_combine_mode_4to1) 1503 pipes[pipe_cnt].pipe.dest.full_recout_width *= 4; 1504 else { 1505 struct pipe_ctx *split_pipe = res_ctx->pipe_ctx[i].bottom_pipe; 1506 1507 while (split_pipe && split_pipe->plane_state == pln) { 1508 pipes[pipe_cnt].pipe.dest.full_recout_width += split_pipe->plane_res.scl_data.recout.width; 1509 split_pipe = split_pipe->bottom_pipe; 1510 } 1511 split_pipe = res_ctx->pipe_ctx[i].top_pipe; 1512 while (split_pipe && split_pipe->plane_state == pln) { 1513 pipes[pipe_cnt].pipe.dest.full_recout_width += split_pipe->plane_res.scl_data.recout.width; 1514 split_pipe = split_pipe->top_pipe; 1515 } 1516 } 1517 1518 pipes[pipe_cnt].pipe.scale_ratio_depth.lb_depth = dm_lb_16; 1519 pipes[pipe_cnt].pipe.scale_ratio_depth.hscl_ratio = (double) scl->ratios.horz.value / (1ULL<<32); 1520 pipes[pipe_cnt].pipe.scale_ratio_depth.hscl_ratio_c = (double) scl->ratios.horz_c.value / (1ULL<<32); 1521 pipes[pipe_cnt].pipe.scale_ratio_depth.vscl_ratio = (double) scl->ratios.vert.value / (1ULL<<32); 1522 pipes[pipe_cnt].pipe.scale_ratio_depth.vscl_ratio_c = (double) scl->ratios.vert_c.value / (1ULL<<32); 1523 pipes[pipe_cnt].pipe.scale_ratio_depth.scl_enable = 1524 scl->ratios.vert.value != dc_fixpt_one.value 1525 || scl->ratios.horz.value != dc_fixpt_one.value 1526 || scl->ratios.vert_c.value != dc_fixpt_one.value 1527 || scl->ratios.horz_c.value != dc_fixpt_one.value /*Lb only or Full scl*/ 1528 || dc->debug.always_scale; /*support always scale*/ 1529 pipes[pipe_cnt].pipe.scale_taps.htaps = scl->taps.h_taps; 1530 pipes[pipe_cnt].pipe.scale_taps.htaps_c = scl->taps.h_taps_c; 1531 pipes[pipe_cnt].pipe.scale_taps.vtaps = scl->taps.v_taps; 1532 pipes[pipe_cnt].pipe.scale_taps.vtaps_c = scl->taps.v_taps_c; 1533 1534 pipes[pipe_cnt].pipe.src.macro_tile_size = 1535 swizzle_mode_to_macro_tile_size(pln->tiling_info.gfx9.swizzle); 1536 swizzle_to_dml_params(pln->tiling_info.gfx9.swizzle, 1537 &pipes[pipe_cnt].pipe.src.sw_mode); 1538 1539 switch (pln->format) { 1540 case SURFACE_PIXEL_FORMAT_VIDEO_420_YCbCr: 1541 case SURFACE_PIXEL_FORMAT_VIDEO_420_YCrCb: 1542 pipes[pipe_cnt].pipe.src.source_format = dm_420_8; 1543 break; 1544 case SURFACE_PIXEL_FORMAT_VIDEO_420_10bpc_YCbCr: 1545 case SURFACE_PIXEL_FORMAT_VIDEO_420_10bpc_YCrCb: 1546 pipes[pipe_cnt].pipe.src.source_format = dm_420_10; 1547 break; 1548 case SURFACE_PIXEL_FORMAT_GRPH_ARGB16161616: 1549 case SURFACE_PIXEL_FORMAT_GRPH_ABGR16161616: 1550 case SURFACE_PIXEL_FORMAT_GRPH_ARGB16161616F: 1551 case SURFACE_PIXEL_FORMAT_GRPH_ABGR16161616F: 1552 pipes[pipe_cnt].pipe.src.source_format = dm_444_64; 1553 break; 1554 case SURFACE_PIXEL_FORMAT_GRPH_ARGB1555: 1555 case SURFACE_PIXEL_FORMAT_GRPH_RGB565: 1556 pipes[pipe_cnt].pipe.src.source_format = dm_444_16; 1557 break; 1558 case SURFACE_PIXEL_FORMAT_GRPH_PALETA_256_COLORS: 1559 pipes[pipe_cnt].pipe.src.source_format = dm_444_8; 1560 break; 1561 case SURFACE_PIXEL_FORMAT_GRPH_RGBE_ALPHA: 1562 pipes[pipe_cnt].pipe.src.source_format = dm_rgbe_alpha; 1563 break; 1564 default: 1565 pipes[pipe_cnt].pipe.src.source_format = dm_444_32; 1566 break; 1567 } 1568 } 1569 1570 pipe_cnt++; 1571 } 1572 1573 /* populate writeback information */ 1574 dc->res_pool->funcs->populate_dml_writeback_from_context(dc, res_ctx, pipes); 1575 1576 return pipe_cnt; 1577 } 1578 1579 void dcn20_calculate_wm( 1580 struct dc *dc, struct dc_state *context, 1581 display_e2e_pipe_params_st *pipes, 1582 int *out_pipe_cnt, 1583 int *pipe_split_from, 1584 int vlevel, 1585 bool fast_validate) 1586 { 1587 int pipe_cnt, i, pipe_idx; 1588 1589 dc_assert_fp_enabled(); 1590 1591 for (i = 0, pipe_idx = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) { 1592 if (!context->res_ctx.pipe_ctx[i].stream) 1593 continue; 1594 1595 pipes[pipe_cnt].clks_cfg.refclk_mhz = dc->res_pool->ref_clocks.dchub_ref_clock_inKhz / 1000.0; 1596 pipes[pipe_cnt].clks_cfg.dispclk_mhz = context->bw_ctx.dml.vba.RequiredDISPCLK[vlevel][context->bw_ctx.dml.vba.maxMpcComb]; 1597 1598 if (pipe_split_from[i] < 0) { 1599 pipes[pipe_cnt].clks_cfg.dppclk_mhz = 1600 context->bw_ctx.dml.vba.RequiredDPPCLK[vlevel][context->bw_ctx.dml.vba.maxMpcComb][pipe_idx]; 1601 if (context->bw_ctx.dml.vba.BlendingAndTiming[pipe_idx] == pipe_idx) 1602 pipes[pipe_cnt].pipe.dest.odm_combine = 1603 context->bw_ctx.dml.vba.ODMCombineEnabled[pipe_idx]; 1604 else 1605 pipes[pipe_cnt].pipe.dest.odm_combine = 0; 1606 pipe_idx++; 1607 } else { 1608 pipes[pipe_cnt].clks_cfg.dppclk_mhz = 1609 context->bw_ctx.dml.vba.RequiredDPPCLK[vlevel][context->bw_ctx.dml.vba.maxMpcComb][pipe_split_from[i]]; 1610 if (context->bw_ctx.dml.vba.BlendingAndTiming[pipe_split_from[i]] == pipe_split_from[i]) 1611 pipes[pipe_cnt].pipe.dest.odm_combine = 1612 context->bw_ctx.dml.vba.ODMCombineEnabled[pipe_split_from[i]]; 1613 else 1614 pipes[pipe_cnt].pipe.dest.odm_combine = 0; 1615 } 1616 1617 if (dc->config.forced_clocks) { 1618 pipes[pipe_cnt].clks_cfg.dispclk_mhz = context->bw_ctx.dml.soc.clock_limits[0].dispclk_mhz; 1619 pipes[pipe_cnt].clks_cfg.dppclk_mhz = context->bw_ctx.dml.soc.clock_limits[0].dppclk_mhz; 1620 } 1621 if (dc->debug.min_disp_clk_khz > pipes[pipe_cnt].clks_cfg.dispclk_mhz * 1000) 1622 pipes[pipe_cnt].clks_cfg.dispclk_mhz = dc->debug.min_disp_clk_khz / 1000.0; 1623 if (dc->debug.min_dpp_clk_khz > pipes[pipe_cnt].clks_cfg.dppclk_mhz * 1000) 1624 pipes[pipe_cnt].clks_cfg.dppclk_mhz = dc->debug.min_dpp_clk_khz / 1000.0; 1625 1626 pipe_cnt++; 1627 } 1628 1629 if (pipe_cnt != pipe_idx) { 1630 if (dc->res_pool->funcs->populate_dml_pipes) 1631 pipe_cnt = dc->res_pool->funcs->populate_dml_pipes(dc, 1632 context, pipes, fast_validate); 1633 else 1634 pipe_cnt = dcn20_populate_dml_pipes_from_context(dc, 1635 context, pipes, fast_validate); 1636 } 1637 1638 *out_pipe_cnt = pipe_cnt; 1639 1640 pipes[0].clks_cfg.voltage = vlevel; 1641 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[vlevel].dcfclk_mhz; 1642 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[vlevel].socclk_mhz; 1643 1644 /* only pipe 0 is read for voltage and dcf/soc clocks */ 1645 if (vlevel < 1) { 1646 pipes[0].clks_cfg.voltage = 1; 1647 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[1].dcfclk_mhz; 1648 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[1].socclk_mhz; 1649 } 1650 context->bw_ctx.bw.dcn.watermarks.b.urgent_ns = get_wm_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1651 context->bw_ctx.bw.dcn.watermarks.b.cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1652 context->bw_ctx.bw.dcn.watermarks.b.cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1653 context->bw_ctx.bw.dcn.watermarks.b.cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1654 context->bw_ctx.bw.dcn.watermarks.b.pte_meta_urgent_ns = get_wm_memory_trip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1655 context->bw_ctx.bw.dcn.watermarks.b.frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1656 context->bw_ctx.bw.dcn.watermarks.b.frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1657 context->bw_ctx.bw.dcn.watermarks.b.urgent_latency_ns = get_urgent_latency(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1658 1659 if (vlevel < 2) { 1660 pipes[0].clks_cfg.voltage = 2; 1661 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[2].dcfclk_mhz; 1662 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[2].socclk_mhz; 1663 } 1664 context->bw_ctx.bw.dcn.watermarks.c.urgent_ns = get_wm_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1665 context->bw_ctx.bw.dcn.watermarks.c.cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1666 context->bw_ctx.bw.dcn.watermarks.c.cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1667 context->bw_ctx.bw.dcn.watermarks.c.cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1668 context->bw_ctx.bw.dcn.watermarks.c.pte_meta_urgent_ns = get_wm_memory_trip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1669 context->bw_ctx.bw.dcn.watermarks.c.frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1670 context->bw_ctx.bw.dcn.watermarks.c.frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1671 1672 if (vlevel < 3) { 1673 pipes[0].clks_cfg.voltage = 3; 1674 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[2].dcfclk_mhz; 1675 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[2].socclk_mhz; 1676 } 1677 context->bw_ctx.bw.dcn.watermarks.d.urgent_ns = get_wm_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1678 context->bw_ctx.bw.dcn.watermarks.d.cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1679 context->bw_ctx.bw.dcn.watermarks.d.cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1680 context->bw_ctx.bw.dcn.watermarks.d.cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1681 context->bw_ctx.bw.dcn.watermarks.d.pte_meta_urgent_ns = get_wm_memory_trip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1682 context->bw_ctx.bw.dcn.watermarks.d.frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1683 context->bw_ctx.bw.dcn.watermarks.d.frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1684 1685 pipes[0].clks_cfg.voltage = vlevel; 1686 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[vlevel].dcfclk_mhz; 1687 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[vlevel].socclk_mhz; 1688 context->bw_ctx.bw.dcn.watermarks.a.urgent_ns = get_wm_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1689 context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1690 context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1691 context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1692 context->bw_ctx.bw.dcn.watermarks.a.pte_meta_urgent_ns = get_wm_memory_trip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1693 context->bw_ctx.bw.dcn.watermarks.a.frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1694 context->bw_ctx.bw.dcn.watermarks.a.frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000; 1695 } 1696 1697 void dcn20_update_bounding_box(struct dc *dc, struct _vcs_dpi_soc_bounding_box_st *bb, 1698 struct pp_smu_nv_clock_table *max_clocks, unsigned int *uclk_states, unsigned int num_states) 1699 { 1700 int num_calculated_states = 0; 1701 int min_dcfclk = 0; 1702 int i; 1703 1704 dc_assert_fp_enabled(); 1705 1706 if (num_states == 0) 1707 return; 1708 1709 memset(bb->clock_limits, 0, sizeof(bb->clock_limits)); 1710 1711 if (dc->bb_overrides.min_dcfclk_mhz > 0) { 1712 min_dcfclk = dc->bb_overrides.min_dcfclk_mhz; 1713 } else { 1714 if (ASICREV_IS_NAVI12_P(dc->ctx->asic_id.hw_internal_rev)) 1715 min_dcfclk = 310; 1716 else 1717 // Accounting for SOC/DCF relationship, we can go as high as 1718 // 506Mhz in Vmin. 1719 min_dcfclk = 506; 1720 } 1721 1722 for (i = 0; i < num_states; i++) { 1723 int min_fclk_required_by_uclk; 1724 bb->clock_limits[i].state = i; 1725 bb->clock_limits[i].dram_speed_mts = uclk_states[i] * 16 / 1000; 1726 1727 // FCLK:UCLK ratio is 1.08 1728 min_fclk_required_by_uclk = div_u64(((unsigned long long)uclk_states[i]) * 1080, 1729 1000000); 1730 1731 bb->clock_limits[i].fabricclk_mhz = (min_fclk_required_by_uclk < min_dcfclk) ? 1732 min_dcfclk : min_fclk_required_by_uclk; 1733 1734 bb->clock_limits[i].socclk_mhz = (bb->clock_limits[i].fabricclk_mhz > max_clocks->socClockInKhz / 1000) ? 1735 max_clocks->socClockInKhz / 1000 : bb->clock_limits[i].fabricclk_mhz; 1736 1737 bb->clock_limits[i].dcfclk_mhz = (bb->clock_limits[i].fabricclk_mhz > max_clocks->dcfClockInKhz / 1000) ? 1738 max_clocks->dcfClockInKhz / 1000 : bb->clock_limits[i].fabricclk_mhz; 1739 1740 bb->clock_limits[i].dispclk_mhz = max_clocks->displayClockInKhz / 1000; 1741 bb->clock_limits[i].dppclk_mhz = max_clocks->displayClockInKhz / 1000; 1742 bb->clock_limits[i].dscclk_mhz = max_clocks->displayClockInKhz / (1000 * 3); 1743 1744 bb->clock_limits[i].phyclk_mhz = max_clocks->phyClockInKhz / 1000; 1745 1746 num_calculated_states++; 1747 } 1748 1749 bb->clock_limits[num_calculated_states - 1].socclk_mhz = max_clocks->socClockInKhz / 1000; 1750 bb->clock_limits[num_calculated_states - 1].fabricclk_mhz = max_clocks->socClockInKhz / 1000; 1751 bb->clock_limits[num_calculated_states - 1].dcfclk_mhz = max_clocks->dcfClockInKhz / 1000; 1752 1753 bb->num_states = num_calculated_states; 1754 1755 // Duplicate the last state, DML always an extra state identical to max state to work 1756 memcpy(&bb->clock_limits[num_calculated_states], &bb->clock_limits[num_calculated_states - 1], sizeof(struct _vcs_dpi_voltage_scaling_st)); 1757 bb->clock_limits[num_calculated_states].state = bb->num_states; 1758 } 1759 1760 void dcn20_cap_soc_clocks( 1761 struct _vcs_dpi_soc_bounding_box_st *bb, 1762 struct pp_smu_nv_clock_table max_clocks) 1763 { 1764 int i; 1765 1766 dc_assert_fp_enabled(); 1767 1768 // First pass - cap all clocks higher than the reported max 1769 for (i = 0; i < bb->num_states; i++) { 1770 if ((bb->clock_limits[i].dcfclk_mhz > (max_clocks.dcfClockInKhz / 1000)) 1771 && max_clocks.dcfClockInKhz != 0) 1772 bb->clock_limits[i].dcfclk_mhz = (max_clocks.dcfClockInKhz / 1000); 1773 1774 if ((bb->clock_limits[i].dram_speed_mts > (max_clocks.uClockInKhz / 1000) * 16) 1775 && max_clocks.uClockInKhz != 0) 1776 bb->clock_limits[i].dram_speed_mts = (max_clocks.uClockInKhz / 1000) * 16; 1777 1778 if ((bb->clock_limits[i].fabricclk_mhz > (max_clocks.fabricClockInKhz / 1000)) 1779 && max_clocks.fabricClockInKhz != 0) 1780 bb->clock_limits[i].fabricclk_mhz = (max_clocks.fabricClockInKhz / 1000); 1781 1782 if ((bb->clock_limits[i].dispclk_mhz > (max_clocks.displayClockInKhz / 1000)) 1783 && max_clocks.displayClockInKhz != 0) 1784 bb->clock_limits[i].dispclk_mhz = (max_clocks.displayClockInKhz / 1000); 1785 1786 if ((bb->clock_limits[i].dppclk_mhz > (max_clocks.dppClockInKhz / 1000)) 1787 && max_clocks.dppClockInKhz != 0) 1788 bb->clock_limits[i].dppclk_mhz = (max_clocks.dppClockInKhz / 1000); 1789 1790 if ((bb->clock_limits[i].phyclk_mhz > (max_clocks.phyClockInKhz / 1000)) 1791 && max_clocks.phyClockInKhz != 0) 1792 bb->clock_limits[i].phyclk_mhz = (max_clocks.phyClockInKhz / 1000); 1793 1794 if ((bb->clock_limits[i].socclk_mhz > (max_clocks.socClockInKhz / 1000)) 1795 && max_clocks.socClockInKhz != 0) 1796 bb->clock_limits[i].socclk_mhz = (max_clocks.socClockInKhz / 1000); 1797 1798 if ((bb->clock_limits[i].dscclk_mhz > (max_clocks.dscClockInKhz / 1000)) 1799 && max_clocks.dscClockInKhz != 0) 1800 bb->clock_limits[i].dscclk_mhz = (max_clocks.dscClockInKhz / 1000); 1801 } 1802 1803 // Second pass - remove all duplicate clock states 1804 for (i = bb->num_states - 1; i > 1; i--) { 1805 bool duplicate = true; 1806 1807 if (bb->clock_limits[i-1].dcfclk_mhz != bb->clock_limits[i].dcfclk_mhz) 1808 duplicate = false; 1809 if (bb->clock_limits[i-1].dispclk_mhz != bb->clock_limits[i].dispclk_mhz) 1810 duplicate = false; 1811 if (bb->clock_limits[i-1].dppclk_mhz != bb->clock_limits[i].dppclk_mhz) 1812 duplicate = false; 1813 if (bb->clock_limits[i-1].dram_speed_mts != bb->clock_limits[i].dram_speed_mts) 1814 duplicate = false; 1815 if (bb->clock_limits[i-1].dscclk_mhz != bb->clock_limits[i].dscclk_mhz) 1816 duplicate = false; 1817 if (bb->clock_limits[i-1].fabricclk_mhz != bb->clock_limits[i].fabricclk_mhz) 1818 duplicate = false; 1819 if (bb->clock_limits[i-1].phyclk_mhz != bb->clock_limits[i].phyclk_mhz) 1820 duplicate = false; 1821 if (bb->clock_limits[i-1].socclk_mhz != bb->clock_limits[i].socclk_mhz) 1822 duplicate = false; 1823 1824 if (duplicate) 1825 bb->num_states--; 1826 } 1827 } 1828 1829 void dcn20_patch_bounding_box(struct dc *dc, struct _vcs_dpi_soc_bounding_box_st *bb) 1830 { 1831 dc_assert_fp_enabled(); 1832 1833 if ((int)(bb->sr_exit_time_us * 1000) != dc->bb_overrides.sr_exit_time_ns 1834 && dc->bb_overrides.sr_exit_time_ns) { 1835 bb->sr_exit_time_us = dc->bb_overrides.sr_exit_time_ns / 1000.0; 1836 } 1837 1838 if ((int)(bb->sr_enter_plus_exit_time_us * 1000) 1839 != dc->bb_overrides.sr_enter_plus_exit_time_ns 1840 && dc->bb_overrides.sr_enter_plus_exit_time_ns) { 1841 bb->sr_enter_plus_exit_time_us = 1842 dc->bb_overrides.sr_enter_plus_exit_time_ns / 1000.0; 1843 } 1844 1845 if ((int)(bb->urgent_latency_us * 1000) != dc->bb_overrides.urgent_latency_ns 1846 && dc->bb_overrides.urgent_latency_ns) { 1847 bb->urgent_latency_us = dc->bb_overrides.urgent_latency_ns / 1000.0; 1848 } 1849 1850 if ((int)(bb->dram_clock_change_latency_us * 1000) 1851 != dc->bb_overrides.dram_clock_change_latency_ns 1852 && dc->bb_overrides.dram_clock_change_latency_ns) { 1853 bb->dram_clock_change_latency_us = 1854 dc->bb_overrides.dram_clock_change_latency_ns / 1000.0; 1855 } 1856 1857 if ((int)(bb->dummy_pstate_latency_us * 1000) 1858 != dc->bb_overrides.dummy_clock_change_latency_ns 1859 && dc->bb_overrides.dummy_clock_change_latency_ns) { 1860 bb->dummy_pstate_latency_us = 1861 dc->bb_overrides.dummy_clock_change_latency_ns / 1000.0; 1862 } 1863 } 1864 1865 static bool dcn20_validate_bandwidth_internal(struct dc *dc, struct dc_state *context, 1866 bool fast_validate) 1867 { 1868 bool out = false; 1869 1870 BW_VAL_TRACE_SETUP(); 1871 1872 int vlevel = 0; 1873 int pipe_split_from[MAX_PIPES]; 1874 int pipe_cnt = 0; 1875 display_e2e_pipe_params_st *pipes = kzalloc(dc->res_pool->pipe_count * sizeof(display_e2e_pipe_params_st), GFP_ATOMIC); 1876 DC_LOGGER_INIT(dc->ctx->logger); 1877 1878 BW_VAL_TRACE_COUNT(); 1879 1880 out = dcn20_fast_validate_bw(dc, context, pipes, &pipe_cnt, pipe_split_from, &vlevel, fast_validate); 1881 1882 if (pipe_cnt == 0) 1883 goto validate_out; 1884 1885 if (!out) 1886 goto validate_fail; 1887 1888 BW_VAL_TRACE_END_VOLTAGE_LEVEL(); 1889 1890 if (fast_validate) { 1891 BW_VAL_TRACE_SKIP(fast); 1892 goto validate_out; 1893 } 1894 1895 dcn20_calculate_wm(dc, context, pipes, &pipe_cnt, pipe_split_from, vlevel, fast_validate); 1896 dcn20_calculate_dlg_params(dc, context, pipes, pipe_cnt, vlevel); 1897 1898 BW_VAL_TRACE_END_WATERMARKS(); 1899 1900 goto validate_out; 1901 1902 validate_fail: 1903 DC_LOG_WARNING("Mode Validation Warning: %s failed validation.\n", 1904 dml_get_status_message(context->bw_ctx.dml.vba.ValidationStatus[context->bw_ctx.dml.vba.soc.num_states])); 1905 1906 BW_VAL_TRACE_SKIP(fail); 1907 out = false; 1908 1909 validate_out: 1910 kfree(pipes); 1911 1912 BW_VAL_TRACE_FINISH(); 1913 1914 return out; 1915 } 1916 1917 bool dcn20_validate_bandwidth_fp(struct dc *dc, 1918 struct dc_state *context, 1919 bool fast_validate) 1920 { 1921 bool voltage_supported = false; 1922 bool full_pstate_supported = false; 1923 bool dummy_pstate_supported = false; 1924 double p_state_latency_us; 1925 1926 dc_assert_fp_enabled(); 1927 1928 p_state_latency_us = context->bw_ctx.dml.soc.dram_clock_change_latency_us; 1929 context->bw_ctx.dml.soc.disable_dram_clock_change_vactive_support = 1930 dc->debug.disable_dram_clock_change_vactive_support; 1931 context->bw_ctx.dml.soc.allow_dram_clock_one_display_vactive = 1932 dc->debug.enable_dram_clock_change_one_display_vactive; 1933 1934 /*Unsafe due to current pipe merge and split logic*/ 1935 ASSERT(context != dc->current_state); 1936 1937 if (fast_validate) { 1938 return dcn20_validate_bandwidth_internal(dc, context, true); 1939 } 1940 1941 // Best case, we support full UCLK switch latency 1942 voltage_supported = dcn20_validate_bandwidth_internal(dc, context, false); 1943 full_pstate_supported = context->bw_ctx.bw.dcn.clk.p_state_change_support; 1944 1945 if (context->bw_ctx.dml.soc.dummy_pstate_latency_us == 0 || 1946 (voltage_supported && full_pstate_supported)) { 1947 context->bw_ctx.bw.dcn.clk.p_state_change_support = full_pstate_supported; 1948 goto restore_dml_state; 1949 } 1950 1951 // Fallback: Try to only support G6 temperature read latency 1952 context->bw_ctx.dml.soc.dram_clock_change_latency_us = context->bw_ctx.dml.soc.dummy_pstate_latency_us; 1953 1954 voltage_supported = dcn20_validate_bandwidth_internal(dc, context, false); 1955 dummy_pstate_supported = context->bw_ctx.bw.dcn.clk.p_state_change_support; 1956 1957 if (voltage_supported && (dummy_pstate_supported || !(context->stream_count))) { 1958 context->bw_ctx.bw.dcn.clk.p_state_change_support = false; 1959 goto restore_dml_state; 1960 } 1961 1962 // ERROR: fallback is supposed to always work. 1963 ASSERT(false); 1964 1965 restore_dml_state: 1966 context->bw_ctx.dml.soc.dram_clock_change_latency_us = p_state_latency_us; 1967 return voltage_supported; 1968 } 1969 1970 void dcn20_fpu_set_wm_ranges(int i, 1971 struct pp_smu_wm_range_sets *ranges, 1972 struct _vcs_dpi_soc_bounding_box_st *loaded_bb) 1973 { 1974 dc_assert_fp_enabled(); 1975 1976 ranges->reader_wm_sets[i].min_fill_clk_mhz = (i > 0) ? (loaded_bb->clock_limits[i - 1].dram_speed_mts / 16) + 1 : 0; 1977 ranges->reader_wm_sets[i].max_fill_clk_mhz = loaded_bb->clock_limits[i].dram_speed_mts / 16; 1978 } 1979 1980 void dcn20_fpu_adjust_dppclk(struct vba_vars_st *v, 1981 int vlevel, 1982 int max_mpc_comb, 1983 int pipe_idx, 1984 bool is_validating_bw) 1985 { 1986 dc_assert_fp_enabled(); 1987 1988 if (is_validating_bw) 1989 v->RequiredDPPCLK[vlevel][max_mpc_comb][pipe_idx] *= 2; 1990 else 1991 v->RequiredDPPCLK[vlevel][max_mpc_comb][pipe_idx] /= 2; 1992 } 1993 1994 int dcn21_populate_dml_pipes_from_context(struct dc *dc, 1995 struct dc_state *context, 1996 display_e2e_pipe_params_st *pipes, 1997 bool fast_validate) 1998 { 1999 uint32_t pipe_cnt; 2000 int i; 2001 2002 dc_assert_fp_enabled(); 2003 2004 pipe_cnt = dcn20_populate_dml_pipes_from_context(dc, context, pipes, fast_validate); 2005 2006 for (i = 0; i < pipe_cnt; i++) { 2007 2008 pipes[i].pipe.src.hostvm = dc->res_pool->hubbub->riommu_active; 2009 pipes[i].pipe.src.gpuvm = 1; 2010 } 2011 2012 return pipe_cnt; 2013 } 2014 2015 static void patch_bounding_box(struct dc *dc, struct _vcs_dpi_soc_bounding_box_st *bb) 2016 { 2017 int i; 2018 2019 if (dc->bb_overrides.sr_exit_time_ns) { 2020 for (i = 0; i < WM_SET_COUNT; i++) { 2021 dc->clk_mgr->bw_params->wm_table.entries[i].sr_exit_time_us = 2022 dc->bb_overrides.sr_exit_time_ns / 1000.0; 2023 } 2024 } 2025 2026 if (dc->bb_overrides.sr_enter_plus_exit_time_ns) { 2027 for (i = 0; i < WM_SET_COUNT; i++) { 2028 dc->clk_mgr->bw_params->wm_table.entries[i].sr_enter_plus_exit_time_us = 2029 dc->bb_overrides.sr_enter_plus_exit_time_ns / 1000.0; 2030 } 2031 } 2032 2033 if (dc->bb_overrides.urgent_latency_ns) { 2034 bb->urgent_latency_us = dc->bb_overrides.urgent_latency_ns / 1000.0; 2035 } 2036 2037 if (dc->bb_overrides.dram_clock_change_latency_ns) { 2038 for (i = 0; i < WM_SET_COUNT; i++) { 2039 dc->clk_mgr->bw_params->wm_table.entries[i].pstate_latency_us = 2040 dc->bb_overrides.dram_clock_change_latency_ns / 1000.0; 2041 } 2042 } 2043 } 2044 2045 static void calculate_wm_set_for_vlevel(int vlevel, 2046 struct wm_range_table_entry *table_entry, 2047 struct dcn_watermarks *wm_set, 2048 struct display_mode_lib *dml, 2049 display_e2e_pipe_params_st *pipes, 2050 int pipe_cnt) 2051 { 2052 double dram_clock_change_latency_cached = dml->soc.dram_clock_change_latency_us; 2053 2054 ASSERT(vlevel < dml->soc.num_states); 2055 /* only pipe 0 is read for voltage and dcf/soc clocks */ 2056 pipes[0].clks_cfg.voltage = vlevel; 2057 pipes[0].clks_cfg.dcfclk_mhz = dml->soc.clock_limits[vlevel].dcfclk_mhz; 2058 pipes[0].clks_cfg.socclk_mhz = dml->soc.clock_limits[vlevel].socclk_mhz; 2059 2060 dml->soc.dram_clock_change_latency_us = table_entry->pstate_latency_us; 2061 dml->soc.sr_exit_time_us = table_entry->sr_exit_time_us; 2062 dml->soc.sr_enter_plus_exit_time_us = table_entry->sr_enter_plus_exit_time_us; 2063 2064 wm_set->urgent_ns = get_wm_urgent(dml, pipes, pipe_cnt) * 1000; 2065 wm_set->cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(dml, pipes, pipe_cnt) * 1000; 2066 wm_set->cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(dml, pipes, pipe_cnt) * 1000; 2067 wm_set->cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(dml, pipes, pipe_cnt) * 1000; 2068 wm_set->pte_meta_urgent_ns = get_wm_memory_trip(dml, pipes, pipe_cnt) * 1000; 2069 wm_set->frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(dml, pipes, pipe_cnt) * 1000; 2070 wm_set->frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(dml, pipes, pipe_cnt) * 1000; 2071 wm_set->urgent_latency_ns = get_urgent_latency(dml, pipes, pipe_cnt) * 1000; 2072 dml->soc.dram_clock_change_latency_us = dram_clock_change_latency_cached; 2073 } 2074 2075 static void dcn21_calculate_wm(struct dc *dc, struct dc_state *context, 2076 display_e2e_pipe_params_st *pipes, 2077 int *out_pipe_cnt, 2078 int *pipe_split_from, 2079 int vlevel_req, 2080 bool fast_validate) 2081 { 2082 int pipe_cnt, i, pipe_idx; 2083 int vlevel, vlevel_max; 2084 struct wm_range_table_entry *table_entry; 2085 struct clk_bw_params *bw_params = dc->clk_mgr->bw_params; 2086 2087 ASSERT(bw_params); 2088 2089 patch_bounding_box(dc, &context->bw_ctx.dml.soc); 2090 2091 for (i = 0, pipe_idx = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) { 2092 if (!context->res_ctx.pipe_ctx[i].stream) 2093 continue; 2094 2095 pipes[pipe_cnt].clks_cfg.refclk_mhz = dc->res_pool->ref_clocks.dchub_ref_clock_inKhz / 1000.0; 2096 pipes[pipe_cnt].clks_cfg.dispclk_mhz = context->bw_ctx.dml.vba.RequiredDISPCLK[vlevel_req][context->bw_ctx.dml.vba.maxMpcComb]; 2097 2098 if (pipe_split_from[i] < 0) { 2099 pipes[pipe_cnt].clks_cfg.dppclk_mhz = 2100 context->bw_ctx.dml.vba.RequiredDPPCLK[vlevel_req][context->bw_ctx.dml.vba.maxMpcComb][pipe_idx]; 2101 if (context->bw_ctx.dml.vba.BlendingAndTiming[pipe_idx] == pipe_idx) 2102 pipes[pipe_cnt].pipe.dest.odm_combine = 2103 context->bw_ctx.dml.vba.ODMCombineEnablePerState[vlevel_req][pipe_idx]; 2104 else 2105 pipes[pipe_cnt].pipe.dest.odm_combine = 0; 2106 pipe_idx++; 2107 } else { 2108 pipes[pipe_cnt].clks_cfg.dppclk_mhz = 2109 context->bw_ctx.dml.vba.RequiredDPPCLK[vlevel_req][context->bw_ctx.dml.vba.maxMpcComb][pipe_split_from[i]]; 2110 if (context->bw_ctx.dml.vba.BlendingAndTiming[pipe_split_from[i]] == pipe_split_from[i]) 2111 pipes[pipe_cnt].pipe.dest.odm_combine = 2112 context->bw_ctx.dml.vba.ODMCombineEnablePerState[vlevel_req][pipe_split_from[i]]; 2113 else 2114 pipes[pipe_cnt].pipe.dest.odm_combine = 0; 2115 } 2116 pipe_cnt++; 2117 } 2118 2119 if (pipe_cnt != pipe_idx) { 2120 if (dc->res_pool->funcs->populate_dml_pipes) 2121 pipe_cnt = dc->res_pool->funcs->populate_dml_pipes(dc, 2122 context, pipes, fast_validate); 2123 else 2124 pipe_cnt = dcn21_populate_dml_pipes_from_context(dc, 2125 context, pipes, fast_validate); 2126 } 2127 2128 *out_pipe_cnt = pipe_cnt; 2129 2130 vlevel_max = bw_params->clk_table.num_entries - 1; 2131 2132 2133 /* WM Set D */ 2134 table_entry = &bw_params->wm_table.entries[WM_D]; 2135 if (table_entry->wm_type == WM_TYPE_RETRAINING) 2136 vlevel = 0; 2137 else 2138 vlevel = vlevel_max; 2139 calculate_wm_set_for_vlevel(vlevel, table_entry, &context->bw_ctx.bw.dcn.watermarks.d, 2140 &context->bw_ctx.dml, pipes, pipe_cnt); 2141 /* WM Set C */ 2142 table_entry = &bw_params->wm_table.entries[WM_C]; 2143 vlevel = MIN(MAX(vlevel_req, 3), vlevel_max); 2144 calculate_wm_set_for_vlevel(vlevel, table_entry, &context->bw_ctx.bw.dcn.watermarks.c, 2145 &context->bw_ctx.dml, pipes, pipe_cnt); 2146 /* WM Set B */ 2147 table_entry = &bw_params->wm_table.entries[WM_B]; 2148 vlevel = MIN(MAX(vlevel_req, 2), vlevel_max); 2149 calculate_wm_set_for_vlevel(vlevel, table_entry, &context->bw_ctx.bw.dcn.watermarks.b, 2150 &context->bw_ctx.dml, pipes, pipe_cnt); 2151 2152 /* WM Set A */ 2153 table_entry = &bw_params->wm_table.entries[WM_A]; 2154 vlevel = MIN(vlevel_req, vlevel_max); 2155 calculate_wm_set_for_vlevel(vlevel, table_entry, &context->bw_ctx.bw.dcn.watermarks.a, 2156 &context->bw_ctx.dml, pipes, pipe_cnt); 2157 } 2158 2159 bool dcn21_validate_bandwidth_fp(struct dc *dc, 2160 struct dc_state *context, 2161 bool fast_validate) 2162 { 2163 bool out = false; 2164 2165 BW_VAL_TRACE_SETUP(); 2166 2167 int vlevel = 0; 2168 int pipe_split_from[MAX_PIPES]; 2169 int pipe_cnt = 0; 2170 display_e2e_pipe_params_st *pipes = kzalloc(dc->res_pool->pipe_count * sizeof(display_e2e_pipe_params_st), GFP_ATOMIC); 2171 DC_LOGGER_INIT(dc->ctx->logger); 2172 2173 BW_VAL_TRACE_COUNT(); 2174 2175 dc_assert_fp_enabled(); 2176 2177 /*Unsafe due to current pipe merge and split logic*/ 2178 ASSERT(context != dc->current_state); 2179 2180 out = dcn21_fast_validate_bw(dc, context, pipes, &pipe_cnt, pipe_split_from, &vlevel, fast_validate); 2181 2182 if (pipe_cnt == 0) 2183 goto validate_out; 2184 2185 if (!out) 2186 goto validate_fail; 2187 2188 BW_VAL_TRACE_END_VOLTAGE_LEVEL(); 2189 2190 if (fast_validate) { 2191 BW_VAL_TRACE_SKIP(fast); 2192 goto validate_out; 2193 } 2194 2195 dcn21_calculate_wm(dc, context, pipes, &pipe_cnt, pipe_split_from, vlevel, fast_validate); 2196 dcn20_calculate_dlg_params(dc, context, pipes, pipe_cnt, vlevel); 2197 2198 BW_VAL_TRACE_END_WATERMARKS(); 2199 2200 goto validate_out; 2201 2202 validate_fail: 2203 DC_LOG_WARNING("Mode Validation Warning: %s failed validation.\n", 2204 dml_get_status_message(context->bw_ctx.dml.vba.ValidationStatus[context->bw_ctx.dml.vba.soc.num_states])); 2205 2206 BW_VAL_TRACE_SKIP(fail); 2207 out = false; 2208 2209 validate_out: 2210 kfree(pipes); 2211 2212 BW_VAL_TRACE_FINISH(); 2213 2214 return out; 2215 } 2216 2217 static struct _vcs_dpi_voltage_scaling_st construct_low_pstate_lvl(struct clk_limit_table *clk_table, unsigned int high_voltage_lvl) 2218 { 2219 struct _vcs_dpi_voltage_scaling_st low_pstate_lvl; 2220 int i; 2221 2222 low_pstate_lvl.state = 1; 2223 low_pstate_lvl.dcfclk_mhz = clk_table->entries[0].dcfclk_mhz; 2224 low_pstate_lvl.fabricclk_mhz = clk_table->entries[0].fclk_mhz; 2225 low_pstate_lvl.socclk_mhz = clk_table->entries[0].socclk_mhz; 2226 low_pstate_lvl.dram_speed_mts = clk_table->entries[0].memclk_mhz * 2; 2227 2228 low_pstate_lvl.dispclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].dispclk_mhz; 2229 low_pstate_lvl.dppclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].dppclk_mhz; 2230 low_pstate_lvl.dram_bw_per_chan_gbps = dcn2_1_soc.clock_limits[high_voltage_lvl].dram_bw_per_chan_gbps; 2231 low_pstate_lvl.dscclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].dscclk_mhz; 2232 low_pstate_lvl.dtbclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].dtbclk_mhz; 2233 low_pstate_lvl.phyclk_d18_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].phyclk_d18_mhz; 2234 low_pstate_lvl.phyclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].phyclk_mhz; 2235 2236 for (i = clk_table->num_entries; i > 1; i--) 2237 clk_table->entries[i] = clk_table->entries[i-1]; 2238 clk_table->entries[1] = clk_table->entries[0]; 2239 clk_table->num_entries++; 2240 2241 return low_pstate_lvl; 2242 } 2243 2244 void dcn21_update_bw_bounding_box(struct dc *dc, struct clk_bw_params *bw_params) 2245 { 2246 struct _vcs_dpi_voltage_scaling_st *s = dc->scratch.update_bw_bounding_box.clock_limits; 2247 struct dcn21_resource_pool *pool = TO_DCN21_RES_POOL(dc->res_pool); 2248 struct clk_limit_table *clk_table = &bw_params->clk_table; 2249 unsigned int i, closest_clk_lvl = 0, k = 0; 2250 int j; 2251 2252 dc_assert_fp_enabled(); 2253 2254 dcn2_1_ip.max_num_otg = pool->base.res_cap->num_timing_generator; 2255 dcn2_1_ip.max_num_dpp = pool->base.pipe_count; 2256 dcn2_1_soc.num_chans = bw_params->num_channels; 2257 2258 ASSERT(clk_table->num_entries); 2259 /* Copy dcn2_1_soc.clock_limits to clock_limits to avoid copying over null states later */ 2260 memcpy(s, dcn2_1_soc.clock_limits, sizeof(dcn2_1_soc.clock_limits)); 2261 2262 for (i = 0; i < clk_table->num_entries; i++) { 2263 /* loop backwards*/ 2264 for (closest_clk_lvl = 0, j = dcn2_1_soc.num_states - 1; j >= 0; j--) { 2265 if ((unsigned int) dcn2_1_soc.clock_limits[j].dcfclk_mhz <= clk_table->entries[i].dcfclk_mhz) { 2266 closest_clk_lvl = j; 2267 break; 2268 } 2269 } 2270 2271 /* clk_table[1] is reserved for min DF PState. skip here to fill in later. */ 2272 if (i == 1) 2273 k++; 2274 2275 s[k].state = k; 2276 s[k].dcfclk_mhz = clk_table->entries[i].dcfclk_mhz; 2277 s[k].fabricclk_mhz = clk_table->entries[i].fclk_mhz; 2278 s[k].socclk_mhz = clk_table->entries[i].socclk_mhz; 2279 s[k].dram_speed_mts = clk_table->entries[i].memclk_mhz * 2; 2280 2281 s[k].dispclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].dispclk_mhz; 2282 s[k].dppclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].dppclk_mhz; 2283 s[k].dram_bw_per_chan_gbps = 2284 dcn2_1_soc.clock_limits[closest_clk_lvl].dram_bw_per_chan_gbps; 2285 s[k].dscclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].dscclk_mhz; 2286 s[k].dtbclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].dtbclk_mhz; 2287 s[k].phyclk_d18_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].phyclk_d18_mhz; 2288 s[k].phyclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].phyclk_mhz; 2289 2290 k++; 2291 } 2292 2293 memcpy(dcn2_1_soc.clock_limits, s, sizeof(dcn2_1_soc.clock_limits)); 2294 2295 if (clk_table->num_entries) { 2296 dcn2_1_soc.num_states = clk_table->num_entries + 1; 2297 /* fill in min DF PState */ 2298 dcn2_1_soc.clock_limits[1] = construct_low_pstate_lvl(clk_table, closest_clk_lvl); 2299 /* duplicate last level */ 2300 dcn2_1_soc.clock_limits[dcn2_1_soc.num_states] = dcn2_1_soc.clock_limits[dcn2_1_soc.num_states - 1]; 2301 dcn2_1_soc.clock_limits[dcn2_1_soc.num_states].state = dcn2_1_soc.num_states; 2302 } 2303 2304 dml_init_instance(&dc->dml, &dcn2_1_soc, &dcn2_1_ip, DML_PROJECT_DCN21); 2305 } 2306 2307 void dcn21_clk_mgr_set_bw_params_wm_table(struct clk_bw_params *bw_params) 2308 { 2309 dc_assert_fp_enabled(); 2310 2311 bw_params->wm_table.entries[WM_D].pstate_latency_us = LPDDR_MEM_RETRAIN_LATENCY; 2312 bw_params->wm_table.entries[WM_D].wm_inst = WM_D; 2313 bw_params->wm_table.entries[WM_D].wm_type = WM_TYPE_RETRAINING; 2314 bw_params->wm_table.entries[WM_D].valid = true; 2315 } 2316 2317 void dcn201_populate_dml_writeback_from_context_fpu(struct dc *dc, 2318 struct resource_context *res_ctx, 2319 display_e2e_pipe_params_st *pipes) 2320 { 2321 int pipe_cnt, i, j; 2322 double max_calc_writeback_dispclk; 2323 double writeback_dispclk; 2324 struct writeback_st dout_wb; 2325 2326 dc_assert_fp_enabled(); 2327 2328 for (i = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) { 2329 struct dc_stream_state *stream = res_ctx->pipe_ctx[i].stream; 2330 2331 if (!stream) 2332 continue; 2333 max_calc_writeback_dispclk = 0; 2334 2335 /* Set writeback information */ 2336 pipes[pipe_cnt].dout.wb_enable = 0; 2337 pipes[pipe_cnt].dout.num_active_wb = 0; 2338 for (j = 0; j < stream->num_wb_info; j++) { 2339 struct dc_writeback_info *wb_info = &stream->writeback_info[j]; 2340 2341 if (wb_info->wb_enabled && wb_info->writeback_source_plane && 2342 (wb_info->writeback_source_plane == res_ctx->pipe_ctx[i].plane_state)) { 2343 pipes[pipe_cnt].dout.wb_enable = 1; 2344 pipes[pipe_cnt].dout.num_active_wb++; 2345 dout_wb.wb_src_height = wb_info->dwb_params.cnv_params.crop_en ? 2346 wb_info->dwb_params.cnv_params.crop_height : 2347 wb_info->dwb_params.cnv_params.src_height; 2348 dout_wb.wb_src_width = wb_info->dwb_params.cnv_params.crop_en ? 2349 wb_info->dwb_params.cnv_params.crop_width : 2350 wb_info->dwb_params.cnv_params.src_width; 2351 dout_wb.wb_dst_width = wb_info->dwb_params.dest_width; 2352 dout_wb.wb_dst_height = wb_info->dwb_params.dest_height; 2353 dout_wb.wb_htaps_luma = wb_info->dwb_params.scaler_taps.h_taps; 2354 dout_wb.wb_vtaps_luma = wb_info->dwb_params.scaler_taps.v_taps; 2355 dout_wb.wb_htaps_chroma = wb_info->dwb_params.scaler_taps.h_taps_c; 2356 dout_wb.wb_vtaps_chroma = wb_info->dwb_params.scaler_taps.v_taps_c; 2357 dout_wb.wb_hratio = wb_info->dwb_params.cnv_params.crop_en ? 2358 (double)wb_info->dwb_params.cnv_params.crop_width / 2359 (double)wb_info->dwb_params.dest_width : 2360 (double)wb_info->dwb_params.cnv_params.src_width / 2361 (double)wb_info->dwb_params.dest_width; 2362 dout_wb.wb_vratio = wb_info->dwb_params.cnv_params.crop_en ? 2363 (double)wb_info->dwb_params.cnv_params.crop_height / 2364 (double)wb_info->dwb_params.dest_height : 2365 (double)wb_info->dwb_params.cnv_params.src_height / 2366 (double)wb_info->dwb_params.dest_height; 2367 if (wb_info->dwb_params.out_format == dwb_scaler_mode_yuv420) { 2368 if (wb_info->dwb_params.output_depth == DWB_OUTPUT_PIXEL_DEPTH_8BPC) 2369 dout_wb.wb_pixel_format = dm_420_8; 2370 else 2371 dout_wb.wb_pixel_format = dm_420_10; 2372 } else 2373 dout_wb.wb_pixel_format = dm_444_32; 2374 2375 /* Workaround for cases where multiple writebacks are connected to same plane 2376 * In which case, need to compute worst case and set the associated writeback parameters 2377 * This workaround is necessary due to DML computation assuming only 1 set of writeback 2378 * parameters per pipe */ 2379 writeback_dispclk = CalculateWriteBackDISPCLK( 2380 dout_wb.wb_pixel_format, 2381 pipes[pipe_cnt].pipe.dest.pixel_rate_mhz, 2382 dout_wb.wb_hratio, 2383 dout_wb.wb_vratio, 2384 dout_wb.wb_htaps_luma, 2385 dout_wb.wb_vtaps_luma, 2386 dout_wb.wb_htaps_chroma, 2387 dout_wb.wb_vtaps_chroma, 2388 dout_wb.wb_dst_width, 2389 pipes[pipe_cnt].pipe.dest.htotal, 2390 2); 2391 2392 if (writeback_dispclk > max_calc_writeback_dispclk) { 2393 max_calc_writeback_dispclk = writeback_dispclk; 2394 pipes[pipe_cnt].dout.wb = dout_wb; 2395 } 2396 } 2397 } 2398 2399 pipe_cnt++; 2400 } 2401 2402 } 2403