Merge tag 'asoc-v5.19' of https://git.kernel.org/pub/scm/linux/kernel/git/broonie...
[linux-2.6-microblaze.git] / drivers / gpu / drm / amd / display / dc / dml / dcn20 / dcn20_fpu.c
1 // SPDX-License-Identifier: MIT
2 /*
3  * Copyright 2021 Advanced Micro Devices, Inc.
4  *
5  * Permission is hereby granted, free of charge, to any person obtaining a
6  * copy of this software and associated documentation files (the "Software"),
7  * to deal in the Software without restriction, including without limitation
8  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9  * and/or sell copies of the Software, and to permit persons to whom the
10  * Software is furnished to do so, subject to the following conditions:
11  *
12  * The above copyright notice and this permission notice shall be included in
13  * all copies or substantial portions of the Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
19  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
20  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
21  * OTHER DEALINGS IN THE SOFTWARE.
22  *
23  * Authors: AMD
24  *
25  */
26
27 #include "resource.h"
28 #include "clk_mgr.h"
29 #include "dc_link_dp.h"
30 #include "dchubbub.h"
31 #include "dcn20/dcn20_resource.h"
32 #include "dcn21/dcn21_resource.h"
33
34 #include "dcn20_fpu.h"
35
36 #define DC_LOGGER_INIT(logger)
37
38 #ifndef MAX
39 #define MAX(X, Y) ((X) > (Y) ? (X) : (Y))
40 #endif
41 #ifndef MIN
42 #define MIN(X, Y) ((X) < (Y) ? (X) : (Y))
43 #endif
44
45 /**
46  * DOC: DCN2x FPU manipulation Overview
47  *
48  * The DCN architecture relies on FPU operations, which require special
49  * compilation flags and the use of kernel_fpu_begin/end functions; ideally, we
50  * want to avoid spreading FPU access across multiple files. With this idea in
51  * mind, this file aims to centralize all DCN20 and DCN2.1 (DCN2x) functions
52  * that require FPU access in a single place. Code in this file follows the
53  * following code pattern:
54  *
55  * 1. Functions that use FPU operations should be isolated in static functions.
56  * 2. The FPU functions should have the noinline attribute to ensure anything
57  *    that deals with FP register is contained within this call.
58  * 3. All function that needs to be accessed outside this file requires a
59  *    public interface that not uses any FPU reference.
60  * 4. Developers **must not** use DC_FP_START/END in this file, but they need
61  *    to ensure that the caller invokes it before access any function available
62  *    in this file. For this reason, public functions in this file must invoke
63  *    dc_assert_fp_enabled();
64  *
65  * Let's expand a little bit more the idea in the code pattern. To fully
66  * isolate FPU operations in a single place, we must avoid situations where
67  * compilers spill FP values to registers due to FP enable in a specific C
68  * file. Note that even if we isolate all FPU functions in a single file and
69  * call its interface from other files, the compiler might enable the use of
70  * FPU before we call DC_FP_START. Nevertheless, it is the programmer's
71  * responsibility to invoke DC_FP_START/END in the correct place. To highlight
72  * situations where developers forgot to use the FP protection before calling
73  * the DC FPU interface functions, we introduce a helper that checks if the
74  * function is invoked under FP protection. If not, it will trigger a kernel
75  * warning.
76  */
77
78 struct _vcs_dpi_ip_params_st dcn2_0_ip = {
79         .odm_capable = 1,
80         .gpuvm_enable = 0,
81         .hostvm_enable = 0,
82         .gpuvm_max_page_table_levels = 4,
83         .hostvm_max_page_table_levels = 4,
84         .hostvm_cached_page_table_levels = 0,
85         .pte_group_size_bytes = 2048,
86         .num_dsc = 6,
87         .rob_buffer_size_kbytes = 168,
88         .det_buffer_size_kbytes = 164,
89         .dpte_buffer_size_in_pte_reqs_luma = 84,
90         .pde_proc_buffer_size_64k_reqs = 48,
91         .dpp_output_buffer_pixels = 2560,
92         .opp_output_buffer_lines = 1,
93         .pixel_chunk_size_kbytes = 8,
94         .pte_chunk_size_kbytes = 2,
95         .meta_chunk_size_kbytes = 2,
96         .writeback_chunk_size_kbytes = 2,
97         .line_buffer_size_bits = 789504,
98         .is_line_buffer_bpp_fixed = 0,
99         .line_buffer_fixed_bpp = 0,
100         .dcc_supported = true,
101         .max_line_buffer_lines = 12,
102         .writeback_luma_buffer_size_kbytes = 12,
103         .writeback_chroma_buffer_size_kbytes = 8,
104         .writeback_chroma_line_buffer_width_pixels = 4,
105         .writeback_max_hscl_ratio = 1,
106         .writeback_max_vscl_ratio = 1,
107         .writeback_min_hscl_ratio = 1,
108         .writeback_min_vscl_ratio = 1,
109         .writeback_max_hscl_taps = 12,
110         .writeback_max_vscl_taps = 12,
111         .writeback_line_buffer_luma_buffer_size = 0,
112         .writeback_line_buffer_chroma_buffer_size = 14643,
113         .cursor_buffer_size = 8,
114         .cursor_chunk_size = 2,
115         .max_num_otg = 6,
116         .max_num_dpp = 6,
117         .max_num_wb = 1,
118         .max_dchub_pscl_bw_pix_per_clk = 4,
119         .max_pscl_lb_bw_pix_per_clk = 2,
120         .max_lb_vscl_bw_pix_per_clk = 4,
121         .max_vscl_hscl_bw_pix_per_clk = 4,
122         .max_hscl_ratio = 8,
123         .max_vscl_ratio = 8,
124         .hscl_mults = 4,
125         .vscl_mults = 4,
126         .max_hscl_taps = 8,
127         .max_vscl_taps = 8,
128         .dispclk_ramp_margin_percent = 1,
129         .underscan_factor = 1.10,
130         .min_vblank_lines = 32, //
131         .dppclk_delay_subtotal = 77, //
132         .dppclk_delay_scl_lb_only = 16,
133         .dppclk_delay_scl = 50,
134         .dppclk_delay_cnvc_formatter = 8,
135         .dppclk_delay_cnvc_cursor = 6,
136         .dispclk_delay_subtotal = 87, //
137         .dcfclk_cstate_latency = 10, // SRExitTime
138         .max_inter_dcn_tile_repeaters = 8,
139         .xfc_supported = true,
140         .xfc_fill_bw_overhead_percent = 10.0,
141         .xfc_fill_constant_bytes = 0,
142         .number_of_cursors = 1,
143 };
144
145 struct _vcs_dpi_ip_params_st dcn2_0_nv14_ip = {
146         .odm_capable = 1,
147         .gpuvm_enable = 0,
148         .hostvm_enable = 0,
149         .gpuvm_max_page_table_levels = 4,
150         .hostvm_max_page_table_levels = 4,
151         .hostvm_cached_page_table_levels = 0,
152         .num_dsc = 5,
153         .rob_buffer_size_kbytes = 168,
154         .det_buffer_size_kbytes = 164,
155         .dpte_buffer_size_in_pte_reqs_luma = 84,
156         .dpte_buffer_size_in_pte_reqs_chroma = 42,//todo
157         .dpp_output_buffer_pixels = 2560,
158         .opp_output_buffer_lines = 1,
159         .pixel_chunk_size_kbytes = 8,
160         .pte_enable = 1,
161         .max_page_table_levels = 4,
162         .pte_chunk_size_kbytes = 2,
163         .meta_chunk_size_kbytes = 2,
164         .writeback_chunk_size_kbytes = 2,
165         .line_buffer_size_bits = 789504,
166         .is_line_buffer_bpp_fixed = 0,
167         .line_buffer_fixed_bpp = 0,
168         .dcc_supported = true,
169         .max_line_buffer_lines = 12,
170         .writeback_luma_buffer_size_kbytes = 12,
171         .writeback_chroma_buffer_size_kbytes = 8,
172         .writeback_chroma_line_buffer_width_pixels = 4,
173         .writeback_max_hscl_ratio = 1,
174         .writeback_max_vscl_ratio = 1,
175         .writeback_min_hscl_ratio = 1,
176         .writeback_min_vscl_ratio = 1,
177         .writeback_max_hscl_taps = 12,
178         .writeback_max_vscl_taps = 12,
179         .writeback_line_buffer_luma_buffer_size = 0,
180         .writeback_line_buffer_chroma_buffer_size = 14643,
181         .cursor_buffer_size = 8,
182         .cursor_chunk_size = 2,
183         .max_num_otg = 5,
184         .max_num_dpp = 5,
185         .max_num_wb = 1,
186         .max_dchub_pscl_bw_pix_per_clk = 4,
187         .max_pscl_lb_bw_pix_per_clk = 2,
188         .max_lb_vscl_bw_pix_per_clk = 4,
189         .max_vscl_hscl_bw_pix_per_clk = 4,
190         .max_hscl_ratio = 8,
191         .max_vscl_ratio = 8,
192         .hscl_mults = 4,
193         .vscl_mults = 4,
194         .max_hscl_taps = 8,
195         .max_vscl_taps = 8,
196         .dispclk_ramp_margin_percent = 1,
197         .underscan_factor = 1.10,
198         .min_vblank_lines = 32, //
199         .dppclk_delay_subtotal = 77, //
200         .dppclk_delay_scl_lb_only = 16,
201         .dppclk_delay_scl = 50,
202         .dppclk_delay_cnvc_formatter = 8,
203         .dppclk_delay_cnvc_cursor = 6,
204         .dispclk_delay_subtotal = 87, //
205         .dcfclk_cstate_latency = 10, // SRExitTime
206         .max_inter_dcn_tile_repeaters = 8,
207         .xfc_supported = true,
208         .xfc_fill_bw_overhead_percent = 10.0,
209         .xfc_fill_constant_bytes = 0,
210         .ptoi_supported = 0,
211         .number_of_cursors = 1,
212 };
213
214 struct _vcs_dpi_soc_bounding_box_st dcn2_0_soc = {
215         /* Defaults that get patched on driver load from firmware. */
216         .clock_limits = {
217                         {
218                                 .state = 0,
219                                 .dcfclk_mhz = 560.0,
220                                 .fabricclk_mhz = 560.0,
221                                 .dispclk_mhz = 513.0,
222                                 .dppclk_mhz = 513.0,
223                                 .phyclk_mhz = 540.0,
224                                 .socclk_mhz = 560.0,
225                                 .dscclk_mhz = 171.0,
226                                 .dram_speed_mts = 8960.0,
227                         },
228                         {
229                                 .state = 1,
230                                 .dcfclk_mhz = 694.0,
231                                 .fabricclk_mhz = 694.0,
232                                 .dispclk_mhz = 642.0,
233                                 .dppclk_mhz = 642.0,
234                                 .phyclk_mhz = 600.0,
235                                 .socclk_mhz = 694.0,
236                                 .dscclk_mhz = 214.0,
237                                 .dram_speed_mts = 11104.0,
238                         },
239                         {
240                                 .state = 2,
241                                 .dcfclk_mhz = 875.0,
242                                 .fabricclk_mhz = 875.0,
243                                 .dispclk_mhz = 734.0,
244                                 .dppclk_mhz = 734.0,
245                                 .phyclk_mhz = 810.0,
246                                 .socclk_mhz = 875.0,
247                                 .dscclk_mhz = 245.0,
248                                 .dram_speed_mts = 14000.0,
249                         },
250                         {
251                                 .state = 3,
252                                 .dcfclk_mhz = 1000.0,
253                                 .fabricclk_mhz = 1000.0,
254                                 .dispclk_mhz = 1100.0,
255                                 .dppclk_mhz = 1100.0,
256                                 .phyclk_mhz = 810.0,
257                                 .socclk_mhz = 1000.0,
258                                 .dscclk_mhz = 367.0,
259                                 .dram_speed_mts = 16000.0,
260                         },
261                         {
262                                 .state = 4,
263                                 .dcfclk_mhz = 1200.0,
264                                 .fabricclk_mhz = 1200.0,
265                                 .dispclk_mhz = 1284.0,
266                                 .dppclk_mhz = 1284.0,
267                                 .phyclk_mhz = 810.0,
268                                 .socclk_mhz = 1200.0,
269                                 .dscclk_mhz = 428.0,
270                                 .dram_speed_mts = 16000.0,
271                         },
272                         /*Extra state, no dispclk ramping*/
273                         {
274                                 .state = 5,
275                                 .dcfclk_mhz = 1200.0,
276                                 .fabricclk_mhz = 1200.0,
277                                 .dispclk_mhz = 1284.0,
278                                 .dppclk_mhz = 1284.0,
279                                 .phyclk_mhz = 810.0,
280                                 .socclk_mhz = 1200.0,
281                                 .dscclk_mhz = 428.0,
282                                 .dram_speed_mts = 16000.0,
283                         },
284                 },
285         .num_states = 5,
286         .sr_exit_time_us = 8.6,
287         .sr_enter_plus_exit_time_us = 10.9,
288         .urgent_latency_us = 4.0,
289         .urgent_latency_pixel_data_only_us = 4.0,
290         .urgent_latency_pixel_mixed_with_vm_data_us = 4.0,
291         .urgent_latency_vm_data_only_us = 4.0,
292         .urgent_out_of_order_return_per_channel_pixel_only_bytes = 4096,
293         .urgent_out_of_order_return_per_channel_pixel_and_vm_bytes = 4096,
294         .urgent_out_of_order_return_per_channel_vm_only_bytes = 4096,
295         .pct_ideal_dram_sdp_bw_after_urgent_pixel_only = 40.0,
296         .pct_ideal_dram_sdp_bw_after_urgent_pixel_and_vm = 40.0,
297         .pct_ideal_dram_sdp_bw_after_urgent_vm_only = 40.0,
298         .max_avg_sdp_bw_use_normal_percent = 40.0,
299         .max_avg_dram_bw_use_normal_percent = 40.0,
300         .writeback_latency_us = 12.0,
301         .ideal_dram_bw_after_urgent_percent = 40.0,
302         .max_request_size_bytes = 256,
303         .dram_channel_width_bytes = 2,
304         .fabric_datapath_to_dcn_data_return_bytes = 64,
305         .dcn_downspread_percent = 0.5,
306         .downspread_percent = 0.38,
307         .dram_page_open_time_ns = 50.0,
308         .dram_rw_turnaround_time_ns = 17.5,
309         .dram_return_buffer_per_channel_bytes = 8192,
310         .round_trip_ping_latency_dcfclk_cycles = 131,
311         .urgent_out_of_order_return_per_channel_bytes = 256,
312         .channel_interleave_bytes = 256,
313         .num_banks = 8,
314         .num_chans = 16,
315         .vmm_page_size_bytes = 4096,
316         .dram_clock_change_latency_us = 404.0,
317         .dummy_pstate_latency_us = 5.0,
318         .writeback_dram_clock_change_latency_us = 23.0,
319         .return_bus_width_bytes = 64,
320         .dispclk_dppclk_vco_speed_mhz = 3850,
321         .xfc_bus_transport_time_us = 20,
322         .xfc_xbuf_latency_tolerance_us = 4,
323         .use_urgent_burst_bw = 0
324 };
325
326 struct _vcs_dpi_soc_bounding_box_st dcn2_0_nv14_soc = {
327         .clock_limits = {
328                         {
329                                 .state = 0,
330                                 .dcfclk_mhz = 560.0,
331                                 .fabricclk_mhz = 560.0,
332                                 .dispclk_mhz = 513.0,
333                                 .dppclk_mhz = 513.0,
334                                 .phyclk_mhz = 540.0,
335                                 .socclk_mhz = 560.0,
336                                 .dscclk_mhz = 171.0,
337                                 .dram_speed_mts = 8960.0,
338                         },
339                         {
340                                 .state = 1,
341                                 .dcfclk_mhz = 694.0,
342                                 .fabricclk_mhz = 694.0,
343                                 .dispclk_mhz = 642.0,
344                                 .dppclk_mhz = 642.0,
345                                 .phyclk_mhz = 600.0,
346                                 .socclk_mhz = 694.0,
347                                 .dscclk_mhz = 214.0,
348                                 .dram_speed_mts = 11104.0,
349                         },
350                         {
351                                 .state = 2,
352                                 .dcfclk_mhz = 875.0,
353                                 .fabricclk_mhz = 875.0,
354                                 .dispclk_mhz = 734.0,
355                                 .dppclk_mhz = 734.0,
356                                 .phyclk_mhz = 810.0,
357                                 .socclk_mhz = 875.0,
358                                 .dscclk_mhz = 245.0,
359                                 .dram_speed_mts = 14000.0,
360                         },
361                         {
362                                 .state = 3,
363                                 .dcfclk_mhz = 1000.0,
364                                 .fabricclk_mhz = 1000.0,
365                                 .dispclk_mhz = 1100.0,
366                                 .dppclk_mhz = 1100.0,
367                                 .phyclk_mhz = 810.0,
368                                 .socclk_mhz = 1000.0,
369                                 .dscclk_mhz = 367.0,
370                                 .dram_speed_mts = 16000.0,
371                         },
372                         {
373                                 .state = 4,
374                                 .dcfclk_mhz = 1200.0,
375                                 .fabricclk_mhz = 1200.0,
376                                 .dispclk_mhz = 1284.0,
377                                 .dppclk_mhz = 1284.0,
378                                 .phyclk_mhz = 810.0,
379                                 .socclk_mhz = 1200.0,
380                                 .dscclk_mhz = 428.0,
381                                 .dram_speed_mts = 16000.0,
382                         },
383                         /*Extra state, no dispclk ramping*/
384                         {
385                                 .state = 5,
386                                 .dcfclk_mhz = 1200.0,
387                                 .fabricclk_mhz = 1200.0,
388                                 .dispclk_mhz = 1284.0,
389                                 .dppclk_mhz = 1284.0,
390                                 .phyclk_mhz = 810.0,
391                                 .socclk_mhz = 1200.0,
392                                 .dscclk_mhz = 428.0,
393                                 .dram_speed_mts = 16000.0,
394                         },
395                 },
396         .num_states = 5,
397         .sr_exit_time_us = 11.6,
398         .sr_enter_plus_exit_time_us = 13.9,
399         .urgent_latency_us = 4.0,
400         .urgent_latency_pixel_data_only_us = 4.0,
401         .urgent_latency_pixel_mixed_with_vm_data_us = 4.0,
402         .urgent_latency_vm_data_only_us = 4.0,
403         .urgent_out_of_order_return_per_channel_pixel_only_bytes = 4096,
404         .urgent_out_of_order_return_per_channel_pixel_and_vm_bytes = 4096,
405         .urgent_out_of_order_return_per_channel_vm_only_bytes = 4096,
406         .pct_ideal_dram_sdp_bw_after_urgent_pixel_only = 40.0,
407         .pct_ideal_dram_sdp_bw_after_urgent_pixel_and_vm = 40.0,
408         .pct_ideal_dram_sdp_bw_after_urgent_vm_only = 40.0,
409         .max_avg_sdp_bw_use_normal_percent = 40.0,
410         .max_avg_dram_bw_use_normal_percent = 40.0,
411         .writeback_latency_us = 12.0,
412         .ideal_dram_bw_after_urgent_percent = 40.0,
413         .max_request_size_bytes = 256,
414         .dram_channel_width_bytes = 2,
415         .fabric_datapath_to_dcn_data_return_bytes = 64,
416         .dcn_downspread_percent = 0.5,
417         .downspread_percent = 0.38,
418         .dram_page_open_time_ns = 50.0,
419         .dram_rw_turnaround_time_ns = 17.5,
420         .dram_return_buffer_per_channel_bytes = 8192,
421         .round_trip_ping_latency_dcfclk_cycles = 131,
422         .urgent_out_of_order_return_per_channel_bytes = 256,
423         .channel_interleave_bytes = 256,
424         .num_banks = 8,
425         .num_chans = 8,
426         .vmm_page_size_bytes = 4096,
427         .dram_clock_change_latency_us = 404.0,
428         .dummy_pstate_latency_us = 5.0,
429         .writeback_dram_clock_change_latency_us = 23.0,
430         .return_bus_width_bytes = 64,
431         .dispclk_dppclk_vco_speed_mhz = 3850,
432         .xfc_bus_transport_time_us = 20,
433         .xfc_xbuf_latency_tolerance_us = 4,
434         .use_urgent_burst_bw = 0
435 };
436
437 struct _vcs_dpi_soc_bounding_box_st dcn2_0_nv12_soc = { 0 };
438
439 struct _vcs_dpi_ip_params_st dcn2_1_ip = {
440         .odm_capable = 1,
441         .gpuvm_enable = 1,
442         .hostvm_enable = 1,
443         .gpuvm_max_page_table_levels = 1,
444         .hostvm_max_page_table_levels = 4,
445         .hostvm_cached_page_table_levels = 2,
446         .num_dsc = 3,
447         .rob_buffer_size_kbytes = 168,
448         .det_buffer_size_kbytes = 164,
449         .dpte_buffer_size_in_pte_reqs_luma = 44,
450         .dpte_buffer_size_in_pte_reqs_chroma = 42,//todo
451         .dpp_output_buffer_pixels = 2560,
452         .opp_output_buffer_lines = 1,
453         .pixel_chunk_size_kbytes = 8,
454         .pte_enable = 1,
455         .max_page_table_levels = 4,
456         .pte_chunk_size_kbytes = 2,
457         .meta_chunk_size_kbytes = 2,
458         .min_meta_chunk_size_bytes = 256,
459         .writeback_chunk_size_kbytes = 2,
460         .line_buffer_size_bits = 789504,
461         .is_line_buffer_bpp_fixed = 0,
462         .line_buffer_fixed_bpp = 0,
463         .dcc_supported = true,
464         .max_line_buffer_lines = 12,
465         .writeback_luma_buffer_size_kbytes = 12,
466         .writeback_chroma_buffer_size_kbytes = 8,
467         .writeback_chroma_line_buffer_width_pixels = 4,
468         .writeback_max_hscl_ratio = 1,
469         .writeback_max_vscl_ratio = 1,
470         .writeback_min_hscl_ratio = 1,
471         .writeback_min_vscl_ratio = 1,
472         .writeback_max_hscl_taps = 12,
473         .writeback_max_vscl_taps = 12,
474         .writeback_line_buffer_luma_buffer_size = 0,
475         .writeback_line_buffer_chroma_buffer_size = 14643,
476         .cursor_buffer_size = 8,
477         .cursor_chunk_size = 2,
478         .max_num_otg = 4,
479         .max_num_dpp = 4,
480         .max_num_wb = 1,
481         .max_dchub_pscl_bw_pix_per_clk = 4,
482         .max_pscl_lb_bw_pix_per_clk = 2,
483         .max_lb_vscl_bw_pix_per_clk = 4,
484         .max_vscl_hscl_bw_pix_per_clk = 4,
485         .max_hscl_ratio = 4,
486         .max_vscl_ratio = 4,
487         .hscl_mults = 4,
488         .vscl_mults = 4,
489         .max_hscl_taps = 8,
490         .max_vscl_taps = 8,
491         .dispclk_ramp_margin_percent = 1,
492         .underscan_factor = 1.10,
493         .min_vblank_lines = 32, //
494         .dppclk_delay_subtotal = 77, //
495         .dppclk_delay_scl_lb_only = 16,
496         .dppclk_delay_scl = 50,
497         .dppclk_delay_cnvc_formatter = 8,
498         .dppclk_delay_cnvc_cursor = 6,
499         .dispclk_delay_subtotal = 87, //
500         .dcfclk_cstate_latency = 10, // SRExitTime
501         .max_inter_dcn_tile_repeaters = 8,
502
503         .xfc_supported = false,
504         .xfc_fill_bw_overhead_percent = 10.0,
505         .xfc_fill_constant_bytes = 0,
506         .ptoi_supported = 0,
507         .number_of_cursors = 1,
508 };
509
510 struct _vcs_dpi_soc_bounding_box_st dcn2_1_soc = {
511         .clock_limits = {
512                         {
513                                 .state = 0,
514                                 .dcfclk_mhz = 400.0,
515                                 .fabricclk_mhz = 400.0,
516                                 .dispclk_mhz = 600.0,
517                                 .dppclk_mhz = 400.00,
518                                 .phyclk_mhz = 600.0,
519                                 .socclk_mhz = 278.0,
520                                 .dscclk_mhz = 205.67,
521                                 .dram_speed_mts = 1600.0,
522                         },
523                         {
524                                 .state = 1,
525                                 .dcfclk_mhz = 464.52,
526                                 .fabricclk_mhz = 800.0,
527                                 .dispclk_mhz = 654.55,
528                                 .dppclk_mhz = 626.09,
529                                 .phyclk_mhz = 600.0,
530                                 .socclk_mhz = 278.0,
531                                 .dscclk_mhz = 205.67,
532                                 .dram_speed_mts = 1600.0,
533                         },
534                         {
535                                 .state = 2,
536                                 .dcfclk_mhz = 514.29,
537                                 .fabricclk_mhz = 933.0,
538                                 .dispclk_mhz = 757.89,
539                                 .dppclk_mhz = 685.71,
540                                 .phyclk_mhz = 600.0,
541                                 .socclk_mhz = 278.0,
542                                 .dscclk_mhz = 287.67,
543                                 .dram_speed_mts = 1866.0,
544                         },
545                         {
546                                 .state = 3,
547                                 .dcfclk_mhz = 576.00,
548                                 .fabricclk_mhz = 1067.0,
549                                 .dispclk_mhz = 847.06,
550                                 .dppclk_mhz = 757.89,
551                                 .phyclk_mhz = 600.0,
552                                 .socclk_mhz = 715.0,
553                                 .dscclk_mhz = 318.334,
554                                 .dram_speed_mts = 2134.0,
555                         },
556                         {
557                                 .state = 4,
558                                 .dcfclk_mhz = 626.09,
559                                 .fabricclk_mhz = 1200.0,
560                                 .dispclk_mhz = 900.00,
561                                 .dppclk_mhz = 847.06,
562                                 .phyclk_mhz = 810.0,
563                                 .socclk_mhz = 953.0,
564                                 .dscclk_mhz = 489.0,
565                                 .dram_speed_mts = 2400.0,
566                         },
567                         {
568                                 .state = 5,
569                                 .dcfclk_mhz = 685.71,
570                                 .fabricclk_mhz = 1333.0,
571                                 .dispclk_mhz = 1028.57,
572                                 .dppclk_mhz = 960.00,
573                                 .phyclk_mhz = 810.0,
574                                 .socclk_mhz = 278.0,
575                                 .dscclk_mhz = 287.67,
576                                 .dram_speed_mts = 2666.0,
577                         },
578                         {
579                                 .state = 6,
580                                 .dcfclk_mhz = 757.89,
581                                 .fabricclk_mhz = 1467.0,
582                                 .dispclk_mhz = 1107.69,
583                                 .dppclk_mhz = 1028.57,
584                                 .phyclk_mhz = 810.0,
585                                 .socclk_mhz = 715.0,
586                                 .dscclk_mhz = 318.334,
587                                 .dram_speed_mts = 3200.0,
588                         },
589                         {
590                                 .state = 7,
591                                 .dcfclk_mhz = 847.06,
592                                 .fabricclk_mhz = 1600.0,
593                                 .dispclk_mhz = 1395.0,
594                                 .dppclk_mhz = 1285.00,
595                                 .phyclk_mhz = 1325.0,
596                                 .socclk_mhz = 953.0,
597                                 .dscclk_mhz = 489.0,
598                                 .dram_speed_mts = 4266.0,
599                         },
600                         /*Extra state, no dispclk ramping*/
601                         {
602                                 .state = 8,
603                                 .dcfclk_mhz = 847.06,
604                                 .fabricclk_mhz = 1600.0,
605                                 .dispclk_mhz = 1395.0,
606                                 .dppclk_mhz = 1285.0,
607                                 .phyclk_mhz = 1325.0,
608                                 .socclk_mhz = 953.0,
609                                 .dscclk_mhz = 489.0,
610                                 .dram_speed_mts = 4266.0,
611                         },
612
613                 },
614
615         .sr_exit_time_us = 12.5,
616         .sr_enter_plus_exit_time_us = 17.0,
617         .urgent_latency_us = 4.0,
618         .urgent_latency_pixel_data_only_us = 4.0,
619         .urgent_latency_pixel_mixed_with_vm_data_us = 4.0,
620         .urgent_latency_vm_data_only_us = 4.0,
621         .urgent_out_of_order_return_per_channel_pixel_only_bytes = 4096,
622         .urgent_out_of_order_return_per_channel_pixel_and_vm_bytes = 4096,
623         .urgent_out_of_order_return_per_channel_vm_only_bytes = 4096,
624         .pct_ideal_dram_sdp_bw_after_urgent_pixel_only = 80.0,
625         .pct_ideal_dram_sdp_bw_after_urgent_pixel_and_vm = 75.0,
626         .pct_ideal_dram_sdp_bw_after_urgent_vm_only = 40.0,
627         .max_avg_sdp_bw_use_normal_percent = 60.0,
628         .max_avg_dram_bw_use_normal_percent = 100.0,
629         .writeback_latency_us = 12.0,
630         .max_request_size_bytes = 256,
631         .dram_channel_width_bytes = 4,
632         .fabric_datapath_to_dcn_data_return_bytes = 32,
633         .dcn_downspread_percent = 0.5,
634         .downspread_percent = 0.38,
635         .dram_page_open_time_ns = 50.0,
636         .dram_rw_turnaround_time_ns = 17.5,
637         .dram_return_buffer_per_channel_bytes = 8192,
638         .round_trip_ping_latency_dcfclk_cycles = 128,
639         .urgent_out_of_order_return_per_channel_bytes = 4096,
640         .channel_interleave_bytes = 256,
641         .num_banks = 8,
642         .num_chans = 4,
643         .vmm_page_size_bytes = 4096,
644         .dram_clock_change_latency_us = 23.84,
645         .return_bus_width_bytes = 64,
646         .dispclk_dppclk_vco_speed_mhz = 3600,
647         .xfc_bus_transport_time_us = 4,
648         .xfc_xbuf_latency_tolerance_us = 4,
649         .use_urgent_burst_bw = 1,
650         .num_states = 8
651 };
652
653 void dcn20_populate_dml_writeback_from_context(struct dc *dc,
654                                                struct resource_context *res_ctx,
655                                                display_e2e_pipe_params_st *pipes)
656 {
657         int pipe_cnt, i;
658
659         dc_assert_fp_enabled();
660
661         for (i = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) {
662                 struct dc_writeback_info *wb_info = &res_ctx->pipe_ctx[i].stream->writeback_info[0];
663
664                 if (!res_ctx->pipe_ctx[i].stream)
665                         continue;
666
667                 /* Set writeback information */
668                 pipes[pipe_cnt].dout.wb_enable = (wb_info->wb_enabled == true) ? 1 : 0;
669                 pipes[pipe_cnt].dout.num_active_wb++;
670                 pipes[pipe_cnt].dout.wb.wb_src_height = wb_info->dwb_params.cnv_params.crop_height;
671                 pipes[pipe_cnt].dout.wb.wb_src_width = wb_info->dwb_params.cnv_params.crop_width;
672                 pipes[pipe_cnt].dout.wb.wb_dst_width = wb_info->dwb_params.dest_width;
673                 pipes[pipe_cnt].dout.wb.wb_dst_height = wb_info->dwb_params.dest_height;
674                 pipes[pipe_cnt].dout.wb.wb_htaps_luma = 1;
675                 pipes[pipe_cnt].dout.wb.wb_vtaps_luma = 1;
676                 pipes[pipe_cnt].dout.wb.wb_htaps_chroma = wb_info->dwb_params.scaler_taps.h_taps_c;
677                 pipes[pipe_cnt].dout.wb.wb_vtaps_chroma = wb_info->dwb_params.scaler_taps.v_taps_c;
678                 pipes[pipe_cnt].dout.wb.wb_hratio = 1.0;
679                 pipes[pipe_cnt].dout.wb.wb_vratio = 1.0;
680                 if (wb_info->dwb_params.out_format == dwb_scaler_mode_yuv420) {
681                         if (wb_info->dwb_params.output_depth == DWB_OUTPUT_PIXEL_DEPTH_8BPC)
682                                 pipes[pipe_cnt].dout.wb.wb_pixel_format = dm_420_8;
683                         else
684                                 pipes[pipe_cnt].dout.wb.wb_pixel_format = dm_420_10;
685                 } else {
686                         pipes[pipe_cnt].dout.wb.wb_pixel_format = dm_444_32;
687                 }
688
689                 pipe_cnt++;
690         }
691 }
692
693 void dcn20_fpu_set_wb_arb_params(struct mcif_arb_params *wb_arb_params,
694                                 struct dc_state *context,
695                                 display_e2e_pipe_params_st *pipes,
696                                 int pipe_cnt, int i)
697 {
698        int k;
699
700        dc_assert_fp_enabled();
701
702        for (k = 0; k < sizeof(wb_arb_params->cli_watermark)/sizeof(wb_arb_params->cli_watermark[0]); k++) {
703                wb_arb_params->cli_watermark[k] = get_wm_writeback_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
704                wb_arb_params->pstate_watermark[k] = get_wm_writeback_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
705        }
706        wb_arb_params->time_per_pixel = 16.0 * 1000 / (context->res_ctx.pipe_ctx[i].stream->phy_pix_clk / 1000); /* 4 bit fraction, ms */
707 }
708
709 static bool is_dtbclk_required(struct dc *dc, struct dc_state *context)
710 {
711         int i;
712         for (i = 0; i < dc->res_pool->pipe_count; i++) {
713                 if (!context->res_ctx.pipe_ctx[i].stream)
714                         continue;
715                 if (is_dp_128b_132b_signal(&context->res_ctx.pipe_ctx[i]))
716                         return true;
717         }
718         return false;
719 }
720
721 static enum dcn_zstate_support_state  decide_zstate_support(struct dc *dc, struct dc_state *context)
722 {
723         int plane_count;
724         int i;
725         unsigned int optimized_min_dst_y_next_start_us;
726
727         plane_count = 0;
728         optimized_min_dst_y_next_start_us = 0;
729         for (i = 0; i < dc->res_pool->pipe_count; i++) {
730                 if (context->res_ctx.pipe_ctx[i].plane_state)
731                         plane_count++;
732         }
733
734         /*
735          * Z9 and Z10 allowed cases:
736          *      1. 0 Planes enabled
737          *      2. single eDP, on link 0, 1 plane and stutter period > 5ms
738          * Z10 only cases:
739          *      1. single eDP, on link 0, 1 plane and stutter period >= 5ms
740          * Zstate not allowed cases:
741          *      1. Everything else
742          */
743         if (plane_count == 0)
744                 return DCN_ZSTATE_SUPPORT_ALLOW;
745         else if (context->stream_count == 1 &&  context->streams[0]->signal == SIGNAL_TYPE_EDP) {
746                 struct dc_link *link = context->streams[0]->sink->link;
747                 struct dc_stream_status *stream_status = &context->stream_status[0];
748
749                 if (dc_extended_blank_supported(dc)) {
750                         for (i = 0; i < dc->res_pool->pipe_count; i++) {
751                                 if (context->res_ctx.pipe_ctx[i].stream == context->streams[0]
752                                         && context->res_ctx.pipe_ctx[i].stream->adjust.v_total_min == context->res_ctx.pipe_ctx[i].stream->adjust.v_total_max
753                                         && context->res_ctx.pipe_ctx[i].stream->adjust.v_total_min > context->res_ctx.pipe_ctx[i].stream->timing.v_total) {
754                                                 optimized_min_dst_y_next_start_us =
755                                                         context->res_ctx.pipe_ctx[i].dlg_regs.optimized_min_dst_y_next_start_us;
756                                                 break;
757                                 }
758                         }
759                 }
760                 /* zstate only supported on PWRSEQ0  and when there's <2 planes*/
761                 if (link->link_index != 0 || stream_status->plane_count > 1)
762                         return DCN_ZSTATE_SUPPORT_DISALLOW;
763
764                 if (context->bw_ctx.dml.vba.StutterPeriod > 5000.0 || optimized_min_dst_y_next_start_us > 5000)
765                         return DCN_ZSTATE_SUPPORT_ALLOW;
766                 else if (link->psr_settings.psr_version == DC_PSR_VERSION_1 && !dc->debug.disable_psr)
767                         return DCN_ZSTATE_SUPPORT_ALLOW_Z10_ONLY;
768                 else
769                         return DCN_ZSTATE_SUPPORT_DISALLOW;
770         } else
771                 return DCN_ZSTATE_SUPPORT_DISALLOW;
772 }
773
774 void dcn20_calculate_dlg_params(
775                 struct dc *dc, struct dc_state *context,
776                 display_e2e_pipe_params_st *pipes,
777                 int pipe_cnt,
778                 int vlevel)
779 {
780         int i, pipe_idx;
781
782         dc_assert_fp_enabled();
783
784         /* Writeback MCIF_WB arbitration parameters */
785         dc->res_pool->funcs->set_mcif_arb_params(dc, context, pipes, pipe_cnt);
786
787         context->bw_ctx.bw.dcn.clk.dispclk_khz = context->bw_ctx.dml.vba.DISPCLK * 1000;
788         context->bw_ctx.bw.dcn.clk.dcfclk_khz = context->bw_ctx.dml.vba.DCFCLK * 1000;
789         context->bw_ctx.bw.dcn.clk.socclk_khz = context->bw_ctx.dml.vba.SOCCLK * 1000;
790         context->bw_ctx.bw.dcn.clk.dramclk_khz = context->bw_ctx.dml.vba.DRAMSpeed * 1000 / 16;
791
792         if (dc->debug.min_dram_clk_khz > context->bw_ctx.bw.dcn.clk.dramclk_khz)
793                 context->bw_ctx.bw.dcn.clk.dramclk_khz = dc->debug.min_dram_clk_khz;
794
795         context->bw_ctx.bw.dcn.clk.dcfclk_deep_sleep_khz = context->bw_ctx.dml.vba.DCFCLKDeepSleep * 1000;
796         context->bw_ctx.bw.dcn.clk.fclk_khz = context->bw_ctx.dml.vba.FabricClock * 1000;
797         context->bw_ctx.bw.dcn.clk.p_state_change_support =
798                 context->bw_ctx.dml.vba.DRAMClockChangeSupport[vlevel][context->bw_ctx.dml.vba.maxMpcComb]
799                                                         != dm_dram_clock_change_unsupported;
800         context->bw_ctx.bw.dcn.clk.dppclk_khz = 0;
801
802         context->bw_ctx.bw.dcn.clk.dtbclk_en = is_dtbclk_required(dc, context);
803
804         if (context->bw_ctx.bw.dcn.clk.dispclk_khz < dc->debug.min_disp_clk_khz)
805                 context->bw_ctx.bw.dcn.clk.dispclk_khz = dc->debug.min_disp_clk_khz;
806
807         for (i = 0, pipe_idx = 0; i < dc->res_pool->pipe_count; i++) {
808                 if (!context->res_ctx.pipe_ctx[i].stream)
809                         continue;
810                 pipes[pipe_idx].pipe.dest.vstartup_start = get_vstartup(&context->bw_ctx.dml, pipes, pipe_cnt, pipe_idx);
811                 pipes[pipe_idx].pipe.dest.vupdate_offset = get_vupdate_offset(&context->bw_ctx.dml, pipes, pipe_cnt, pipe_idx);
812                 pipes[pipe_idx].pipe.dest.vupdate_width = get_vupdate_width(&context->bw_ctx.dml, pipes, pipe_cnt, pipe_idx);
813                 pipes[pipe_idx].pipe.dest.vready_offset = get_vready_offset(&context->bw_ctx.dml, pipes, pipe_cnt, pipe_idx);
814                 context->res_ctx.pipe_ctx[i].det_buffer_size_kb = context->bw_ctx.dml.ip.det_buffer_size_kbytes;
815                 context->res_ctx.pipe_ctx[i].unbounded_req = pipes[pipe_idx].pipe.src.unbounded_req_mode;
816
817                 if (context->bw_ctx.bw.dcn.clk.dppclk_khz < pipes[pipe_idx].clks_cfg.dppclk_mhz * 1000)
818                         context->bw_ctx.bw.dcn.clk.dppclk_khz = pipes[pipe_idx].clks_cfg.dppclk_mhz * 1000;
819                 context->res_ctx.pipe_ctx[i].plane_res.bw.dppclk_khz =
820                                                 pipes[pipe_idx].clks_cfg.dppclk_mhz * 1000;
821                 context->res_ctx.pipe_ctx[i].pipe_dlg_param = pipes[pipe_idx].pipe.dest;
822                 pipe_idx++;
823         }
824         /*save a original dppclock copy*/
825         context->bw_ctx.bw.dcn.clk.bw_dppclk_khz = context->bw_ctx.bw.dcn.clk.dppclk_khz;
826         context->bw_ctx.bw.dcn.clk.bw_dispclk_khz = context->bw_ctx.bw.dcn.clk.dispclk_khz;
827         context->bw_ctx.bw.dcn.clk.max_supported_dppclk_khz = context->bw_ctx.dml.soc.clock_limits[vlevel].dppclk_mhz * 1000;
828         context->bw_ctx.bw.dcn.clk.max_supported_dispclk_khz = context->bw_ctx.dml.soc.clock_limits[vlevel].dispclk_mhz * 1000;
829
830         context->bw_ctx.bw.dcn.compbuf_size_kb = context->bw_ctx.dml.ip.config_return_buffer_size_in_kbytes
831                                                 - context->bw_ctx.dml.ip.det_buffer_size_kbytes * pipe_idx;
832
833         for (i = 0, pipe_idx = 0; i < dc->res_pool->pipe_count; i++) {
834                 bool cstate_en = context->bw_ctx.dml.vba.PrefetchMode[vlevel][context->bw_ctx.dml.vba.maxMpcComb] != 2;
835
836                 if (!context->res_ctx.pipe_ctx[i].stream)
837                         continue;
838
839                 if (dc->ctx->dce_version == DCN_VERSION_2_01)
840                         cstate_en = false;
841
842                 context->bw_ctx.dml.funcs.rq_dlg_get_dlg_reg(&context->bw_ctx.dml,
843                                 &context->res_ctx.pipe_ctx[i].dlg_regs,
844                                 &context->res_ctx.pipe_ctx[i].ttu_regs,
845                                 pipes,
846                                 pipe_cnt,
847                                 pipe_idx,
848                                 cstate_en,
849                                 context->bw_ctx.bw.dcn.clk.p_state_change_support,
850                                 false, false, true);
851
852                 context->bw_ctx.dml.funcs.rq_dlg_get_rq_reg(&context->bw_ctx.dml,
853                                 &context->res_ctx.pipe_ctx[i].rq_regs,
854                                 &pipes[pipe_idx].pipe);
855                 pipe_idx++;
856         }
857         context->bw_ctx.bw.dcn.clk.zstate_support = decide_zstate_support(dc, context);
858 }
859
860 static void swizzle_to_dml_params(
861                 enum swizzle_mode_values swizzle,
862                 unsigned int *sw_mode)
863 {
864         switch (swizzle) {
865         case DC_SW_LINEAR:
866                 *sw_mode = dm_sw_linear;
867                 break;
868         case DC_SW_4KB_S:
869                 *sw_mode = dm_sw_4kb_s;
870                 break;
871         case DC_SW_4KB_S_X:
872                 *sw_mode = dm_sw_4kb_s_x;
873                 break;
874         case DC_SW_4KB_D:
875                 *sw_mode = dm_sw_4kb_d;
876                 break;
877         case DC_SW_4KB_D_X:
878                 *sw_mode = dm_sw_4kb_d_x;
879                 break;
880         case DC_SW_64KB_S:
881                 *sw_mode = dm_sw_64kb_s;
882                 break;
883         case DC_SW_64KB_S_X:
884                 *sw_mode = dm_sw_64kb_s_x;
885                 break;
886         case DC_SW_64KB_S_T:
887                 *sw_mode = dm_sw_64kb_s_t;
888                 break;
889         case DC_SW_64KB_D:
890                 *sw_mode = dm_sw_64kb_d;
891                 break;
892         case DC_SW_64KB_D_X:
893                 *sw_mode = dm_sw_64kb_d_x;
894                 break;
895         case DC_SW_64KB_D_T:
896                 *sw_mode = dm_sw_64kb_d_t;
897                 break;
898         case DC_SW_64KB_R_X:
899                 *sw_mode = dm_sw_64kb_r_x;
900                 break;
901         case DC_SW_VAR_S:
902                 *sw_mode = dm_sw_var_s;
903                 break;
904         case DC_SW_VAR_S_X:
905                 *sw_mode = dm_sw_var_s_x;
906                 break;
907         case DC_SW_VAR_D:
908                 *sw_mode = dm_sw_var_d;
909                 break;
910         case DC_SW_VAR_D_X:
911                 *sw_mode = dm_sw_var_d_x;
912                 break;
913         case DC_SW_VAR_R_X:
914                 *sw_mode = dm_sw_var_r_x;
915                 break;
916         default:
917                 ASSERT(0); /* Not supported */
918                 break;
919         }
920 }
921
922 int dcn20_populate_dml_pipes_from_context(
923                 struct dc *dc,
924                 struct dc_state *context,
925                 display_e2e_pipe_params_st *pipes,
926                 bool fast_validate)
927 {
928         int pipe_cnt, i;
929         bool synchronized_vblank = true;
930         struct resource_context *res_ctx = &context->res_ctx;
931
932         dc_assert_fp_enabled();
933
934         for (i = 0, pipe_cnt = -1; i < dc->res_pool->pipe_count; i++) {
935                 if (!res_ctx->pipe_ctx[i].stream)
936                         continue;
937
938                 if (pipe_cnt < 0) {
939                         pipe_cnt = i;
940                         continue;
941                 }
942
943                 if (res_ctx->pipe_ctx[pipe_cnt].stream == res_ctx->pipe_ctx[i].stream)
944                         continue;
945
946                 if (dc->debug.disable_timing_sync ||
947                         (!resource_are_streams_timing_synchronizable(
948                                 res_ctx->pipe_ctx[pipe_cnt].stream,
949                                 res_ctx->pipe_ctx[i].stream) &&
950                         !resource_are_vblanks_synchronizable(
951                                 res_ctx->pipe_ctx[pipe_cnt].stream,
952                                 res_ctx->pipe_ctx[i].stream))) {
953                         synchronized_vblank = false;
954                         break;
955                 }
956         }
957
958         for (i = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) {
959                 struct dc_crtc_timing *timing = &res_ctx->pipe_ctx[i].stream->timing;
960                 unsigned int v_total;
961                 unsigned int front_porch;
962                 int output_bpc;
963                 struct audio_check aud_check = {0};
964
965                 if (!res_ctx->pipe_ctx[i].stream)
966                         continue;
967
968                 v_total = timing->v_total;
969                 front_porch = timing->v_front_porch;
970
971                 /* todo:
972                 pipes[pipe_cnt].pipe.src.dynamic_metadata_enable = 0;
973                 pipes[pipe_cnt].pipe.src.dcc = 0;
974                 pipes[pipe_cnt].pipe.src.vm = 0;*/
975
976                 pipes[pipe_cnt].clks_cfg.refclk_mhz = dc->res_pool->ref_clocks.dchub_ref_clock_inKhz / 1000.0;
977
978                 pipes[pipe_cnt].dout.dsc_enable = res_ctx->pipe_ctx[i].stream->timing.flags.DSC;
979                 /* todo: rotation?*/
980                 pipes[pipe_cnt].dout.dsc_slices = res_ctx->pipe_ctx[i].stream->timing.dsc_cfg.num_slices_h;
981                 if (res_ctx->pipe_ctx[i].stream->use_dynamic_meta) {
982                         pipes[pipe_cnt].pipe.src.dynamic_metadata_enable = true;
983                         /* 1/2 vblank */
984                         pipes[pipe_cnt].pipe.src.dynamic_metadata_lines_before_active =
985                                 (v_total - timing->v_addressable
986                                         - timing->v_border_top - timing->v_border_bottom) / 2;
987                         /* 36 bytes dp, 32 hdmi */
988                         pipes[pipe_cnt].pipe.src.dynamic_metadata_xmit_bytes =
989                                 dc_is_dp_signal(res_ctx->pipe_ctx[i].stream->signal) ? 36 : 32;
990                 }
991                 pipes[pipe_cnt].pipe.src.dcc = false;
992                 pipes[pipe_cnt].pipe.src.dcc_rate = 1;
993                 pipes[pipe_cnt].pipe.dest.synchronized_vblank_all_planes = synchronized_vblank;
994                 pipes[pipe_cnt].pipe.dest.hblank_start = timing->h_total - timing->h_front_porch;
995                 pipes[pipe_cnt].pipe.dest.hblank_end = pipes[pipe_cnt].pipe.dest.hblank_start
996                                 - timing->h_addressable
997                                 - timing->h_border_left
998                                 - timing->h_border_right;
999                 pipes[pipe_cnt].pipe.dest.vblank_start = v_total - front_porch;
1000                 pipes[pipe_cnt].pipe.dest.vblank_end = pipes[pipe_cnt].pipe.dest.vblank_start
1001                                 - timing->v_addressable
1002                                 - timing->v_border_top
1003                                 - timing->v_border_bottom;
1004                 pipes[pipe_cnt].pipe.dest.htotal = timing->h_total;
1005                 pipes[pipe_cnt].pipe.dest.vtotal = v_total;
1006                 pipes[pipe_cnt].pipe.dest.hactive =
1007                         timing->h_addressable + timing->h_border_left + timing->h_border_right;
1008                 pipes[pipe_cnt].pipe.dest.vactive =
1009                         timing->v_addressable + timing->v_border_top + timing->v_border_bottom;
1010                 pipes[pipe_cnt].pipe.dest.interlaced = timing->flags.INTERLACE;
1011                 pipes[pipe_cnt].pipe.dest.pixel_rate_mhz = timing->pix_clk_100hz/10000.0;
1012                 if (timing->timing_3d_format == TIMING_3D_FORMAT_HW_FRAME_PACKING)
1013                         pipes[pipe_cnt].pipe.dest.pixel_rate_mhz *= 2;
1014                 pipes[pipe_cnt].pipe.dest.otg_inst = res_ctx->pipe_ctx[i].stream_res.tg->inst;
1015                 pipes[pipe_cnt].dout.dp_lanes = 4;
1016                 pipes[pipe_cnt].dout.is_virtual = 0;
1017                 pipes[pipe_cnt].pipe.dest.vtotal_min = res_ctx->pipe_ctx[i].stream->adjust.v_total_min;
1018                 pipes[pipe_cnt].pipe.dest.vtotal_max = res_ctx->pipe_ctx[i].stream->adjust.v_total_max;
1019                 switch (get_num_odm_splits(&res_ctx->pipe_ctx[i])) {
1020                 case 1:
1021                         pipes[pipe_cnt].pipe.dest.odm_combine = dm_odm_combine_mode_2to1;
1022                         break;
1023                 case 3:
1024                         pipes[pipe_cnt].pipe.dest.odm_combine = dm_odm_combine_mode_4to1;
1025                         break;
1026                 default:
1027                         pipes[pipe_cnt].pipe.dest.odm_combine = dm_odm_combine_mode_disabled;
1028                 }
1029                 pipes[pipe_cnt].pipe.src.hsplit_grp = res_ctx->pipe_ctx[i].pipe_idx;
1030                 if (res_ctx->pipe_ctx[i].top_pipe && res_ctx->pipe_ctx[i].top_pipe->plane_state
1031                                 == res_ctx->pipe_ctx[i].plane_state) {
1032                         struct pipe_ctx *first_pipe = res_ctx->pipe_ctx[i].top_pipe;
1033                         int split_idx = 0;
1034
1035                         while (first_pipe->top_pipe && first_pipe->top_pipe->plane_state
1036                                         == res_ctx->pipe_ctx[i].plane_state) {
1037                                 first_pipe = first_pipe->top_pipe;
1038                                 split_idx++;
1039                         }
1040                         /* Treat 4to1 mpc combine as an mpo of 2 2-to-1 combines */
1041                         if (split_idx == 0)
1042                                 pipes[pipe_cnt].pipe.src.hsplit_grp = first_pipe->pipe_idx;
1043                         else if (split_idx == 1)
1044                                 pipes[pipe_cnt].pipe.src.hsplit_grp = res_ctx->pipe_ctx[i].pipe_idx;
1045                         else if (split_idx == 2)
1046                                 pipes[pipe_cnt].pipe.src.hsplit_grp = res_ctx->pipe_ctx[i].top_pipe->pipe_idx;
1047                 } else if (res_ctx->pipe_ctx[i].prev_odm_pipe) {
1048                         struct pipe_ctx *first_pipe = res_ctx->pipe_ctx[i].prev_odm_pipe;
1049
1050                         while (first_pipe->prev_odm_pipe)
1051                                 first_pipe = first_pipe->prev_odm_pipe;
1052                         pipes[pipe_cnt].pipe.src.hsplit_grp = first_pipe->pipe_idx;
1053                 }
1054
1055                 switch (res_ctx->pipe_ctx[i].stream->signal) {
1056                 case SIGNAL_TYPE_DISPLAY_PORT_MST:
1057                 case SIGNAL_TYPE_DISPLAY_PORT:
1058                         pipes[pipe_cnt].dout.output_type = dm_dp;
1059                         break;
1060                 case SIGNAL_TYPE_EDP:
1061                         pipes[pipe_cnt].dout.output_type = dm_edp;
1062                         break;
1063                 case SIGNAL_TYPE_HDMI_TYPE_A:
1064                 case SIGNAL_TYPE_DVI_SINGLE_LINK:
1065                 case SIGNAL_TYPE_DVI_DUAL_LINK:
1066                         pipes[pipe_cnt].dout.output_type = dm_hdmi;
1067                         break;
1068                 default:
1069                         /* In case there is no signal, set dp with 4 lanes to allow max config */
1070                         pipes[pipe_cnt].dout.is_virtual = 1;
1071                         pipes[pipe_cnt].dout.output_type = dm_dp;
1072                         pipes[pipe_cnt].dout.dp_lanes = 4;
1073                 }
1074
1075                 switch (res_ctx->pipe_ctx[i].stream->timing.display_color_depth) {
1076                 case COLOR_DEPTH_666:
1077                         output_bpc = 6;
1078                         break;
1079                 case COLOR_DEPTH_888:
1080                         output_bpc = 8;
1081                         break;
1082                 case COLOR_DEPTH_101010:
1083                         output_bpc = 10;
1084                         break;
1085                 case COLOR_DEPTH_121212:
1086                         output_bpc = 12;
1087                         break;
1088                 case COLOR_DEPTH_141414:
1089                         output_bpc = 14;
1090                         break;
1091                 case COLOR_DEPTH_161616:
1092                         output_bpc = 16;
1093                         break;
1094                 case COLOR_DEPTH_999:
1095                         output_bpc = 9;
1096                         break;
1097                 case COLOR_DEPTH_111111:
1098                         output_bpc = 11;
1099                         break;
1100                 default:
1101                         output_bpc = 8;
1102                         break;
1103                 }
1104
1105                 switch (res_ctx->pipe_ctx[i].stream->timing.pixel_encoding) {
1106                 case PIXEL_ENCODING_RGB:
1107                 case PIXEL_ENCODING_YCBCR444:
1108                         pipes[pipe_cnt].dout.output_format = dm_444;
1109                         pipes[pipe_cnt].dout.output_bpp = output_bpc * 3;
1110                         break;
1111                 case PIXEL_ENCODING_YCBCR420:
1112                         pipes[pipe_cnt].dout.output_format = dm_420;
1113                         pipes[pipe_cnt].dout.output_bpp = (output_bpc * 3.0) / 2;
1114                         break;
1115                 case PIXEL_ENCODING_YCBCR422:
1116                         if (res_ctx->pipe_ctx[i].stream->timing.flags.DSC &&
1117                             !res_ctx->pipe_ctx[i].stream->timing.dsc_cfg.ycbcr422_simple)
1118                                 pipes[pipe_cnt].dout.output_format = dm_n422;
1119                         else
1120                                 pipes[pipe_cnt].dout.output_format = dm_s422;
1121                         pipes[pipe_cnt].dout.output_bpp = output_bpc * 2;
1122                         break;
1123                 default:
1124                         pipes[pipe_cnt].dout.output_format = dm_444;
1125                         pipes[pipe_cnt].dout.output_bpp = output_bpc * 3;
1126                 }
1127
1128                 if (res_ctx->pipe_ctx[i].stream->timing.flags.DSC)
1129                         pipes[pipe_cnt].dout.output_bpp = res_ctx->pipe_ctx[i].stream->timing.dsc_cfg.bits_per_pixel / 16.0;
1130
1131                 /* todo: default max for now, until there is logic reflecting this in dc*/
1132                 pipes[pipe_cnt].dout.dsc_input_bpc = 12;
1133                 /*fill up the audio sample rate (unit in kHz)*/
1134                 get_audio_check(&res_ctx->pipe_ctx[i].stream->audio_info, &aud_check);
1135                 pipes[pipe_cnt].dout.max_audio_sample_rate = aud_check.max_audiosample_rate / 1000;
1136                 /*
1137                  * For graphic plane, cursor number is 1, nv12 is 0
1138                  * bw calculations due to cursor on/off
1139                  */
1140                 if (res_ctx->pipe_ctx[i].plane_state &&
1141                                 res_ctx->pipe_ctx[i].plane_state->address.type == PLN_ADDR_TYPE_VIDEO_PROGRESSIVE)
1142                         pipes[pipe_cnt].pipe.src.num_cursors = 0;
1143                 else
1144                         pipes[pipe_cnt].pipe.src.num_cursors = dc->dml.ip.number_of_cursors;
1145
1146                 pipes[pipe_cnt].pipe.src.cur0_src_width = 256;
1147                 pipes[pipe_cnt].pipe.src.cur0_bpp = dm_cur_32bit;
1148
1149                 if (!res_ctx->pipe_ctx[i].plane_state) {
1150                         pipes[pipe_cnt].pipe.src.is_hsplit = pipes[pipe_cnt].pipe.dest.odm_combine != dm_odm_combine_mode_disabled;
1151                         pipes[pipe_cnt].pipe.src.source_scan = dm_horz;
1152                         pipes[pipe_cnt].pipe.src.sw_mode = dm_sw_4kb_s;
1153                         pipes[pipe_cnt].pipe.src.macro_tile_size = dm_64k_tile;
1154                         pipes[pipe_cnt].pipe.src.viewport_width = timing->h_addressable;
1155                         if (pipes[pipe_cnt].pipe.src.viewport_width > 1920)
1156                                 pipes[pipe_cnt].pipe.src.viewport_width = 1920;
1157                         pipes[pipe_cnt].pipe.src.viewport_height = timing->v_addressable;
1158                         if (pipes[pipe_cnt].pipe.src.viewport_height > 1080)
1159                                 pipes[pipe_cnt].pipe.src.viewport_height = 1080;
1160                         pipes[pipe_cnt].pipe.src.surface_height_y = pipes[pipe_cnt].pipe.src.viewport_height;
1161                         pipes[pipe_cnt].pipe.src.surface_width_y = pipes[pipe_cnt].pipe.src.viewport_width;
1162                         pipes[pipe_cnt].pipe.src.surface_height_c = pipes[pipe_cnt].pipe.src.viewport_height;
1163                         pipes[pipe_cnt].pipe.src.surface_width_c = pipes[pipe_cnt].pipe.src.viewport_width;
1164                         pipes[pipe_cnt].pipe.src.data_pitch = ((pipes[pipe_cnt].pipe.src.viewport_width + 255) / 256) * 256;
1165                         pipes[pipe_cnt].pipe.src.source_format = dm_444_32;
1166                         pipes[pipe_cnt].pipe.dest.recout_width = pipes[pipe_cnt].pipe.src.viewport_width; /*vp_width/hratio*/
1167                         pipes[pipe_cnt].pipe.dest.recout_height = pipes[pipe_cnt].pipe.src.viewport_height; /*vp_height/vratio*/
1168                         pipes[pipe_cnt].pipe.dest.full_recout_width = pipes[pipe_cnt].pipe.dest.recout_width;  /*when is_hsplit != 1*/
1169                         pipes[pipe_cnt].pipe.dest.full_recout_height = pipes[pipe_cnt].pipe.dest.recout_height; /*when is_hsplit != 1*/
1170                         pipes[pipe_cnt].pipe.scale_ratio_depth.lb_depth = dm_lb_16;
1171                         pipes[pipe_cnt].pipe.scale_ratio_depth.hscl_ratio = 1.0;
1172                         pipes[pipe_cnt].pipe.scale_ratio_depth.vscl_ratio = 1.0;
1173                         pipes[pipe_cnt].pipe.scale_ratio_depth.scl_enable = 0; /*Lb only or Full scl*/
1174                         pipes[pipe_cnt].pipe.scale_taps.htaps = 1;
1175                         pipes[pipe_cnt].pipe.scale_taps.vtaps = 1;
1176                         pipes[pipe_cnt].pipe.dest.vtotal_min = v_total;
1177                         pipes[pipe_cnt].pipe.dest.vtotal_max = v_total;
1178
1179                         if (pipes[pipe_cnt].pipe.dest.odm_combine == dm_odm_combine_mode_2to1) {
1180                                 pipes[pipe_cnt].pipe.src.viewport_width /= 2;
1181                                 pipes[pipe_cnt].pipe.dest.recout_width /= 2;
1182                         } else if (pipes[pipe_cnt].pipe.dest.odm_combine == dm_odm_combine_mode_4to1) {
1183                                 pipes[pipe_cnt].pipe.src.viewport_width /= 4;
1184                                 pipes[pipe_cnt].pipe.dest.recout_width /= 4;
1185                         }
1186                 } else {
1187                         struct dc_plane_state *pln = res_ctx->pipe_ctx[i].plane_state;
1188                         struct scaler_data *scl = &res_ctx->pipe_ctx[i].plane_res.scl_data;
1189
1190                         pipes[pipe_cnt].pipe.src.immediate_flip = pln->flip_immediate;
1191                         pipes[pipe_cnt].pipe.src.is_hsplit = (res_ctx->pipe_ctx[i].bottom_pipe && res_ctx->pipe_ctx[i].bottom_pipe->plane_state == pln)
1192                                         || (res_ctx->pipe_ctx[i].top_pipe && res_ctx->pipe_ctx[i].top_pipe->plane_state == pln)
1193                                         || pipes[pipe_cnt].pipe.dest.odm_combine != dm_odm_combine_mode_disabled;
1194
1195                         /* stereo is not split */
1196                         if (pln->stereo_format == PLANE_STEREO_FORMAT_SIDE_BY_SIDE ||
1197                             pln->stereo_format == PLANE_STEREO_FORMAT_TOP_AND_BOTTOM) {
1198                                 pipes[pipe_cnt].pipe.src.is_hsplit = false;
1199                                 pipes[pipe_cnt].pipe.src.hsplit_grp = res_ctx->pipe_ctx[i].pipe_idx;
1200                         }
1201
1202                         pipes[pipe_cnt].pipe.src.source_scan = pln->rotation == ROTATION_ANGLE_90
1203                                         || pln->rotation == ROTATION_ANGLE_270 ? dm_vert : dm_horz;
1204                         pipes[pipe_cnt].pipe.src.viewport_y_y = scl->viewport.y;
1205                         pipes[pipe_cnt].pipe.src.viewport_y_c = scl->viewport_c.y;
1206                         pipes[pipe_cnt].pipe.src.viewport_width = scl->viewport.width;
1207                         pipes[pipe_cnt].pipe.src.viewport_width_c = scl->viewport_c.width;
1208                         pipes[pipe_cnt].pipe.src.viewport_height = scl->viewport.height;
1209                         pipes[pipe_cnt].pipe.src.viewport_height_c = scl->viewport_c.height;
1210                         pipes[pipe_cnt].pipe.src.viewport_width_max = pln->src_rect.width;
1211                         pipes[pipe_cnt].pipe.src.viewport_height_max = pln->src_rect.height;
1212                         pipes[pipe_cnt].pipe.src.surface_width_y = pln->plane_size.surface_size.width;
1213                         pipes[pipe_cnt].pipe.src.surface_height_y = pln->plane_size.surface_size.height;
1214                         pipes[pipe_cnt].pipe.src.surface_width_c = pln->plane_size.chroma_size.width;
1215                         pipes[pipe_cnt].pipe.src.surface_height_c = pln->plane_size.chroma_size.height;
1216                         if (pln->format == SURFACE_PIXEL_FORMAT_GRPH_RGBE_ALPHA
1217                                         || pln->format >= SURFACE_PIXEL_FORMAT_VIDEO_BEGIN) {
1218                                 pipes[pipe_cnt].pipe.src.data_pitch = pln->plane_size.surface_pitch;
1219                                 pipes[pipe_cnt].pipe.src.data_pitch_c = pln->plane_size.chroma_pitch;
1220                                 pipes[pipe_cnt].pipe.src.meta_pitch = pln->dcc.meta_pitch;
1221                                 pipes[pipe_cnt].pipe.src.meta_pitch_c = pln->dcc.meta_pitch_c;
1222                         } else {
1223                                 pipes[pipe_cnt].pipe.src.data_pitch = pln->plane_size.surface_pitch;
1224                                 pipes[pipe_cnt].pipe.src.meta_pitch = pln->dcc.meta_pitch;
1225                         }
1226                         pipes[pipe_cnt].pipe.src.dcc = pln->dcc.enable;
1227                         pipes[pipe_cnt].pipe.dest.recout_width = scl->recout.width;
1228                         pipes[pipe_cnt].pipe.dest.recout_height = scl->recout.height;
1229                         pipes[pipe_cnt].pipe.dest.full_recout_height = scl->recout.height;
1230                         pipes[pipe_cnt].pipe.dest.full_recout_width = scl->recout.width;
1231                         if (pipes[pipe_cnt].pipe.dest.odm_combine == dm_odm_combine_mode_2to1)
1232                                 pipes[pipe_cnt].pipe.dest.full_recout_width *= 2;
1233                         else if (pipes[pipe_cnt].pipe.dest.odm_combine == dm_odm_combine_mode_4to1)
1234                                 pipes[pipe_cnt].pipe.dest.full_recout_width *= 4;
1235                         else {
1236                                 struct pipe_ctx *split_pipe = res_ctx->pipe_ctx[i].bottom_pipe;
1237
1238                                 while (split_pipe && split_pipe->plane_state == pln) {
1239                                         pipes[pipe_cnt].pipe.dest.full_recout_width += split_pipe->plane_res.scl_data.recout.width;
1240                                         split_pipe = split_pipe->bottom_pipe;
1241                                 }
1242                                 split_pipe = res_ctx->pipe_ctx[i].top_pipe;
1243                                 while (split_pipe && split_pipe->plane_state == pln) {
1244                                         pipes[pipe_cnt].pipe.dest.full_recout_width += split_pipe->plane_res.scl_data.recout.width;
1245                                         split_pipe = split_pipe->top_pipe;
1246                                 }
1247                         }
1248
1249                         pipes[pipe_cnt].pipe.scale_ratio_depth.lb_depth = dm_lb_16;
1250                         pipes[pipe_cnt].pipe.scale_ratio_depth.hscl_ratio = (double) scl->ratios.horz.value / (1ULL<<32);
1251                         pipes[pipe_cnt].pipe.scale_ratio_depth.hscl_ratio_c = (double) scl->ratios.horz_c.value / (1ULL<<32);
1252                         pipes[pipe_cnt].pipe.scale_ratio_depth.vscl_ratio = (double) scl->ratios.vert.value / (1ULL<<32);
1253                         pipes[pipe_cnt].pipe.scale_ratio_depth.vscl_ratio_c = (double) scl->ratios.vert_c.value / (1ULL<<32);
1254                         pipes[pipe_cnt].pipe.scale_ratio_depth.scl_enable =
1255                                         scl->ratios.vert.value != dc_fixpt_one.value
1256                                         || scl->ratios.horz.value != dc_fixpt_one.value
1257                                         || scl->ratios.vert_c.value != dc_fixpt_one.value
1258                                         || scl->ratios.horz_c.value != dc_fixpt_one.value /*Lb only or Full scl*/
1259                                         || dc->debug.always_scale; /*support always scale*/
1260                         pipes[pipe_cnt].pipe.scale_taps.htaps = scl->taps.h_taps;
1261                         pipes[pipe_cnt].pipe.scale_taps.htaps_c = scl->taps.h_taps_c;
1262                         pipes[pipe_cnt].pipe.scale_taps.vtaps = scl->taps.v_taps;
1263                         pipes[pipe_cnt].pipe.scale_taps.vtaps_c = scl->taps.v_taps_c;
1264
1265                         pipes[pipe_cnt].pipe.src.macro_tile_size =
1266                                         swizzle_mode_to_macro_tile_size(pln->tiling_info.gfx9.swizzle);
1267                         swizzle_to_dml_params(pln->tiling_info.gfx9.swizzle,
1268                                         &pipes[pipe_cnt].pipe.src.sw_mode);
1269
1270                         switch (pln->format) {
1271                         case SURFACE_PIXEL_FORMAT_VIDEO_420_YCbCr:
1272                         case SURFACE_PIXEL_FORMAT_VIDEO_420_YCrCb:
1273                                 pipes[pipe_cnt].pipe.src.source_format = dm_420_8;
1274                                 break;
1275                         case SURFACE_PIXEL_FORMAT_VIDEO_420_10bpc_YCbCr:
1276                         case SURFACE_PIXEL_FORMAT_VIDEO_420_10bpc_YCrCb:
1277                                 pipes[pipe_cnt].pipe.src.source_format = dm_420_10;
1278                                 break;
1279                         case SURFACE_PIXEL_FORMAT_GRPH_ARGB16161616:
1280                         case SURFACE_PIXEL_FORMAT_GRPH_ABGR16161616:
1281                         case SURFACE_PIXEL_FORMAT_GRPH_ARGB16161616F:
1282                         case SURFACE_PIXEL_FORMAT_GRPH_ABGR16161616F:
1283                                 pipes[pipe_cnt].pipe.src.source_format = dm_444_64;
1284                                 break;
1285                         case SURFACE_PIXEL_FORMAT_GRPH_ARGB1555:
1286                         case SURFACE_PIXEL_FORMAT_GRPH_RGB565:
1287                                 pipes[pipe_cnt].pipe.src.source_format = dm_444_16;
1288                                 break;
1289                         case SURFACE_PIXEL_FORMAT_GRPH_PALETA_256_COLORS:
1290                                 pipes[pipe_cnt].pipe.src.source_format = dm_444_8;
1291                                 break;
1292                         case SURFACE_PIXEL_FORMAT_GRPH_RGBE_ALPHA:
1293                                 pipes[pipe_cnt].pipe.src.source_format = dm_rgbe_alpha;
1294                                 break;
1295                         default:
1296                                 pipes[pipe_cnt].pipe.src.source_format = dm_444_32;
1297                                 break;
1298                         }
1299                 }
1300
1301                 pipe_cnt++;
1302         }
1303
1304         /* populate writeback information */
1305         DC_FP_START();
1306         dc->res_pool->funcs->populate_dml_writeback_from_context(dc, res_ctx, pipes);
1307         DC_FP_END();
1308
1309         return pipe_cnt;
1310 }
1311
1312 void dcn20_calculate_wm(
1313                 struct dc *dc, struct dc_state *context,
1314                 display_e2e_pipe_params_st *pipes,
1315                 int *out_pipe_cnt,
1316                 int *pipe_split_from,
1317                 int vlevel,
1318                 bool fast_validate)
1319 {
1320         int pipe_cnt, i, pipe_idx;
1321
1322         dc_assert_fp_enabled();
1323
1324         for (i = 0, pipe_idx = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) {
1325                 if (!context->res_ctx.pipe_ctx[i].stream)
1326                         continue;
1327
1328                 pipes[pipe_cnt].clks_cfg.refclk_mhz = dc->res_pool->ref_clocks.dchub_ref_clock_inKhz / 1000.0;
1329                 pipes[pipe_cnt].clks_cfg.dispclk_mhz = context->bw_ctx.dml.vba.RequiredDISPCLK[vlevel][context->bw_ctx.dml.vba.maxMpcComb];
1330
1331                 if (pipe_split_from[i] < 0) {
1332                         pipes[pipe_cnt].clks_cfg.dppclk_mhz =
1333                                         context->bw_ctx.dml.vba.RequiredDPPCLK[vlevel][context->bw_ctx.dml.vba.maxMpcComb][pipe_idx];
1334                         if (context->bw_ctx.dml.vba.BlendingAndTiming[pipe_idx] == pipe_idx)
1335                                 pipes[pipe_cnt].pipe.dest.odm_combine =
1336                                                 context->bw_ctx.dml.vba.ODMCombineEnabled[pipe_idx];
1337                         else
1338                                 pipes[pipe_cnt].pipe.dest.odm_combine = 0;
1339                         pipe_idx++;
1340                 } else {
1341                         pipes[pipe_cnt].clks_cfg.dppclk_mhz =
1342                                         context->bw_ctx.dml.vba.RequiredDPPCLK[vlevel][context->bw_ctx.dml.vba.maxMpcComb][pipe_split_from[i]];
1343                         if (context->bw_ctx.dml.vba.BlendingAndTiming[pipe_split_from[i]] == pipe_split_from[i])
1344                                 pipes[pipe_cnt].pipe.dest.odm_combine =
1345                                                 context->bw_ctx.dml.vba.ODMCombineEnabled[pipe_split_from[i]];
1346                         else
1347                                 pipes[pipe_cnt].pipe.dest.odm_combine = 0;
1348                 }
1349
1350                 if (dc->config.forced_clocks) {
1351                         pipes[pipe_cnt].clks_cfg.dispclk_mhz = context->bw_ctx.dml.soc.clock_limits[0].dispclk_mhz;
1352                         pipes[pipe_cnt].clks_cfg.dppclk_mhz = context->bw_ctx.dml.soc.clock_limits[0].dppclk_mhz;
1353                 }
1354                 if (dc->debug.min_disp_clk_khz > pipes[pipe_cnt].clks_cfg.dispclk_mhz * 1000)
1355                         pipes[pipe_cnt].clks_cfg.dispclk_mhz = dc->debug.min_disp_clk_khz / 1000.0;
1356                 if (dc->debug.min_dpp_clk_khz > pipes[pipe_cnt].clks_cfg.dppclk_mhz * 1000)
1357                         pipes[pipe_cnt].clks_cfg.dppclk_mhz = dc->debug.min_dpp_clk_khz / 1000.0;
1358
1359                 pipe_cnt++;
1360         }
1361
1362         if (pipe_cnt != pipe_idx) {
1363                 if (dc->res_pool->funcs->populate_dml_pipes)
1364                         pipe_cnt = dc->res_pool->funcs->populate_dml_pipes(dc,
1365                                 context, pipes, fast_validate);
1366                 else
1367                         pipe_cnt = dcn20_populate_dml_pipes_from_context(dc,
1368                                 context, pipes, fast_validate);
1369         }
1370
1371         *out_pipe_cnt = pipe_cnt;
1372
1373         pipes[0].clks_cfg.voltage = vlevel;
1374         pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[vlevel].dcfclk_mhz;
1375         pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[vlevel].socclk_mhz;
1376
1377         /* only pipe 0 is read for voltage and dcf/soc clocks */
1378         if (vlevel < 1) {
1379                 pipes[0].clks_cfg.voltage = 1;
1380                 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[1].dcfclk_mhz;
1381                 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[1].socclk_mhz;
1382         }
1383         context->bw_ctx.bw.dcn.watermarks.b.urgent_ns = get_wm_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1384         context->bw_ctx.bw.dcn.watermarks.b.cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1385         context->bw_ctx.bw.dcn.watermarks.b.cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1386         context->bw_ctx.bw.dcn.watermarks.b.cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1387         context->bw_ctx.bw.dcn.watermarks.b.pte_meta_urgent_ns = get_wm_memory_trip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1388         context->bw_ctx.bw.dcn.watermarks.b.frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1389         context->bw_ctx.bw.dcn.watermarks.b.frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1390         context->bw_ctx.bw.dcn.watermarks.b.urgent_latency_ns = get_urgent_latency(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1391
1392         if (vlevel < 2) {
1393                 pipes[0].clks_cfg.voltage = 2;
1394                 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[2].dcfclk_mhz;
1395                 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[2].socclk_mhz;
1396         }
1397         context->bw_ctx.bw.dcn.watermarks.c.urgent_ns = get_wm_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1398         context->bw_ctx.bw.dcn.watermarks.c.cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1399         context->bw_ctx.bw.dcn.watermarks.c.cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1400         context->bw_ctx.bw.dcn.watermarks.c.cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1401         context->bw_ctx.bw.dcn.watermarks.c.pte_meta_urgent_ns = get_wm_memory_trip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1402         context->bw_ctx.bw.dcn.watermarks.c.frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1403         context->bw_ctx.bw.dcn.watermarks.c.frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1404
1405         if (vlevel < 3) {
1406                 pipes[0].clks_cfg.voltage = 3;
1407                 pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[2].dcfclk_mhz;
1408                 pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[2].socclk_mhz;
1409         }
1410         context->bw_ctx.bw.dcn.watermarks.d.urgent_ns = get_wm_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1411         context->bw_ctx.bw.dcn.watermarks.d.cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1412         context->bw_ctx.bw.dcn.watermarks.d.cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1413         context->bw_ctx.bw.dcn.watermarks.d.cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1414         context->bw_ctx.bw.dcn.watermarks.d.pte_meta_urgent_ns = get_wm_memory_trip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1415         context->bw_ctx.bw.dcn.watermarks.d.frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1416         context->bw_ctx.bw.dcn.watermarks.d.frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1417
1418         pipes[0].clks_cfg.voltage = vlevel;
1419         pipes[0].clks_cfg.dcfclk_mhz = context->bw_ctx.dml.soc.clock_limits[vlevel].dcfclk_mhz;
1420         pipes[0].clks_cfg.socclk_mhz = context->bw_ctx.dml.soc.clock_limits[vlevel].socclk_mhz;
1421         context->bw_ctx.bw.dcn.watermarks.a.urgent_ns = get_wm_urgent(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1422         context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1423         context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1424         context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1425         context->bw_ctx.bw.dcn.watermarks.a.pte_meta_urgent_ns = get_wm_memory_trip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1426         context->bw_ctx.bw.dcn.watermarks.a.frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1427         context->bw_ctx.bw.dcn.watermarks.a.frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(&context->bw_ctx.dml, pipes, pipe_cnt) * 1000;
1428 }
1429
1430 void dcn20_update_bounding_box(struct dc *dc, struct _vcs_dpi_soc_bounding_box_st *bb,
1431                 struct pp_smu_nv_clock_table *max_clocks, unsigned int *uclk_states, unsigned int num_states)
1432 {
1433         struct _vcs_dpi_voltage_scaling_st calculated_states[DC__VOLTAGE_STATES];
1434         int i;
1435         int num_calculated_states = 0;
1436         int min_dcfclk = 0;
1437
1438         dc_assert_fp_enabled();
1439
1440         if (num_states == 0)
1441                 return;
1442
1443         memset(calculated_states, 0, sizeof(calculated_states));
1444
1445         if (dc->bb_overrides.min_dcfclk_mhz > 0)
1446                 min_dcfclk = dc->bb_overrides.min_dcfclk_mhz;
1447         else {
1448                 if (ASICREV_IS_NAVI12_P(dc->ctx->asic_id.hw_internal_rev))
1449                         min_dcfclk = 310;
1450                 else
1451                         // Accounting for SOC/DCF relationship, we can go as high as
1452                         // 506Mhz in Vmin.
1453                         min_dcfclk = 506;
1454         }
1455
1456         for (i = 0; i < num_states; i++) {
1457                 int min_fclk_required_by_uclk;
1458                 calculated_states[i].state = i;
1459                 calculated_states[i].dram_speed_mts = uclk_states[i] * 16 / 1000;
1460
1461                 // FCLK:UCLK ratio is 1.08
1462                 min_fclk_required_by_uclk = div_u64(((unsigned long long)uclk_states[i]) * 1080,
1463                         1000000);
1464
1465                 calculated_states[i].fabricclk_mhz = (min_fclk_required_by_uclk < min_dcfclk) ?
1466                                 min_dcfclk : min_fclk_required_by_uclk;
1467
1468                 calculated_states[i].socclk_mhz = (calculated_states[i].fabricclk_mhz > max_clocks->socClockInKhz / 1000) ?
1469                                 max_clocks->socClockInKhz / 1000 : calculated_states[i].fabricclk_mhz;
1470
1471                 calculated_states[i].dcfclk_mhz = (calculated_states[i].fabricclk_mhz > max_clocks->dcfClockInKhz / 1000) ?
1472                                 max_clocks->dcfClockInKhz / 1000 : calculated_states[i].fabricclk_mhz;
1473
1474                 calculated_states[i].dispclk_mhz = max_clocks->displayClockInKhz / 1000;
1475                 calculated_states[i].dppclk_mhz = max_clocks->displayClockInKhz / 1000;
1476                 calculated_states[i].dscclk_mhz = max_clocks->displayClockInKhz / (1000 * 3);
1477
1478                 calculated_states[i].phyclk_mhz = max_clocks->phyClockInKhz / 1000;
1479
1480                 num_calculated_states++;
1481         }
1482
1483         calculated_states[num_calculated_states - 1].socclk_mhz = max_clocks->socClockInKhz / 1000;
1484         calculated_states[num_calculated_states - 1].fabricclk_mhz = max_clocks->socClockInKhz / 1000;
1485         calculated_states[num_calculated_states - 1].dcfclk_mhz = max_clocks->dcfClockInKhz / 1000;
1486
1487         memcpy(bb->clock_limits, calculated_states, sizeof(bb->clock_limits));
1488         bb->num_states = num_calculated_states;
1489
1490         // Duplicate the last state, DML always an extra state identical to max state to work
1491         memcpy(&bb->clock_limits[num_calculated_states], &bb->clock_limits[num_calculated_states - 1], sizeof(struct _vcs_dpi_voltage_scaling_st));
1492         bb->clock_limits[num_calculated_states].state = bb->num_states;
1493 }
1494
1495 void dcn20_cap_soc_clocks(
1496                 struct _vcs_dpi_soc_bounding_box_st *bb,
1497                 struct pp_smu_nv_clock_table max_clocks)
1498 {
1499         int i;
1500
1501         dc_assert_fp_enabled();
1502
1503         // First pass - cap all clocks higher than the reported max
1504         for (i = 0; i < bb->num_states; i++) {
1505                 if ((bb->clock_limits[i].dcfclk_mhz > (max_clocks.dcfClockInKhz / 1000))
1506                                 && max_clocks.dcfClockInKhz != 0)
1507                         bb->clock_limits[i].dcfclk_mhz = (max_clocks.dcfClockInKhz / 1000);
1508
1509                 if ((bb->clock_limits[i].dram_speed_mts > (max_clocks.uClockInKhz / 1000) * 16)
1510                                                 && max_clocks.uClockInKhz != 0)
1511                         bb->clock_limits[i].dram_speed_mts = (max_clocks.uClockInKhz / 1000) * 16;
1512
1513                 if ((bb->clock_limits[i].fabricclk_mhz > (max_clocks.fabricClockInKhz / 1000))
1514                                                 && max_clocks.fabricClockInKhz != 0)
1515                         bb->clock_limits[i].fabricclk_mhz = (max_clocks.fabricClockInKhz / 1000);
1516
1517                 if ((bb->clock_limits[i].dispclk_mhz > (max_clocks.displayClockInKhz / 1000))
1518                                                 && max_clocks.displayClockInKhz != 0)
1519                         bb->clock_limits[i].dispclk_mhz = (max_clocks.displayClockInKhz / 1000);
1520
1521                 if ((bb->clock_limits[i].dppclk_mhz > (max_clocks.dppClockInKhz / 1000))
1522                                                 && max_clocks.dppClockInKhz != 0)
1523                         bb->clock_limits[i].dppclk_mhz = (max_clocks.dppClockInKhz / 1000);
1524
1525                 if ((bb->clock_limits[i].phyclk_mhz > (max_clocks.phyClockInKhz / 1000))
1526                                                 && max_clocks.phyClockInKhz != 0)
1527                         bb->clock_limits[i].phyclk_mhz = (max_clocks.phyClockInKhz / 1000);
1528
1529                 if ((bb->clock_limits[i].socclk_mhz > (max_clocks.socClockInKhz / 1000))
1530                                                 && max_clocks.socClockInKhz != 0)
1531                         bb->clock_limits[i].socclk_mhz = (max_clocks.socClockInKhz / 1000);
1532
1533                 if ((bb->clock_limits[i].dscclk_mhz > (max_clocks.dscClockInKhz / 1000))
1534                                                 && max_clocks.dscClockInKhz != 0)
1535                         bb->clock_limits[i].dscclk_mhz = (max_clocks.dscClockInKhz / 1000);
1536         }
1537
1538         // Second pass - remove all duplicate clock states
1539         for (i = bb->num_states - 1; i > 1; i--) {
1540                 bool duplicate = true;
1541
1542                 if (bb->clock_limits[i-1].dcfclk_mhz != bb->clock_limits[i].dcfclk_mhz)
1543                         duplicate = false;
1544                 if (bb->clock_limits[i-1].dispclk_mhz != bb->clock_limits[i].dispclk_mhz)
1545                         duplicate = false;
1546                 if (bb->clock_limits[i-1].dppclk_mhz != bb->clock_limits[i].dppclk_mhz)
1547                         duplicate = false;
1548                 if (bb->clock_limits[i-1].dram_speed_mts != bb->clock_limits[i].dram_speed_mts)
1549                         duplicate = false;
1550                 if (bb->clock_limits[i-1].dscclk_mhz != bb->clock_limits[i].dscclk_mhz)
1551                         duplicate = false;
1552                 if (bb->clock_limits[i-1].fabricclk_mhz != bb->clock_limits[i].fabricclk_mhz)
1553                         duplicate = false;
1554                 if (bb->clock_limits[i-1].phyclk_mhz != bb->clock_limits[i].phyclk_mhz)
1555                         duplicate = false;
1556                 if (bb->clock_limits[i-1].socclk_mhz != bb->clock_limits[i].socclk_mhz)
1557                         duplicate = false;
1558
1559                 if (duplicate)
1560                         bb->num_states--;
1561         }
1562 }
1563
1564 void dcn20_patch_bounding_box(struct dc *dc, struct _vcs_dpi_soc_bounding_box_st *bb)
1565 {
1566         dc_assert_fp_enabled();
1567
1568         if ((int)(bb->sr_exit_time_us * 1000) != dc->bb_overrides.sr_exit_time_ns
1569                         && dc->bb_overrides.sr_exit_time_ns) {
1570                 bb->sr_exit_time_us = dc->bb_overrides.sr_exit_time_ns / 1000.0;
1571         }
1572
1573         if ((int)(bb->sr_enter_plus_exit_time_us * 1000)
1574                                 != dc->bb_overrides.sr_enter_plus_exit_time_ns
1575                         && dc->bb_overrides.sr_enter_plus_exit_time_ns) {
1576                 bb->sr_enter_plus_exit_time_us =
1577                                 dc->bb_overrides.sr_enter_plus_exit_time_ns / 1000.0;
1578         }
1579
1580         if ((int)(bb->urgent_latency_us * 1000) != dc->bb_overrides.urgent_latency_ns
1581                         && dc->bb_overrides.urgent_latency_ns) {
1582                 bb->urgent_latency_us = dc->bb_overrides.urgent_latency_ns / 1000.0;
1583         }
1584
1585         if ((int)(bb->dram_clock_change_latency_us * 1000)
1586                                 != dc->bb_overrides.dram_clock_change_latency_ns
1587                         && dc->bb_overrides.dram_clock_change_latency_ns) {
1588                 bb->dram_clock_change_latency_us =
1589                                 dc->bb_overrides.dram_clock_change_latency_ns / 1000.0;
1590         }
1591
1592         if ((int)(bb->dummy_pstate_latency_us * 1000)
1593                                 != dc->bb_overrides.dummy_clock_change_latency_ns
1594                         && dc->bb_overrides.dummy_clock_change_latency_ns) {
1595                 bb->dummy_pstate_latency_us =
1596                                 dc->bb_overrides.dummy_clock_change_latency_ns / 1000.0;
1597         }
1598 }
1599
1600 static bool dcn20_validate_bandwidth_internal(struct dc *dc, struct dc_state *context,
1601                 bool fast_validate)
1602 {
1603         bool out = false;
1604
1605         BW_VAL_TRACE_SETUP();
1606
1607         int vlevel = 0;
1608         int pipe_split_from[MAX_PIPES];
1609         int pipe_cnt = 0;
1610         display_e2e_pipe_params_st *pipes = kzalloc(dc->res_pool->pipe_count * sizeof(display_e2e_pipe_params_st), GFP_ATOMIC);
1611         DC_LOGGER_INIT(dc->ctx->logger);
1612
1613         BW_VAL_TRACE_COUNT();
1614
1615         out = dcn20_fast_validate_bw(dc, context, pipes, &pipe_cnt, pipe_split_from, &vlevel, fast_validate);
1616
1617         if (pipe_cnt == 0)
1618                 goto validate_out;
1619
1620         if (!out)
1621                 goto validate_fail;
1622
1623         BW_VAL_TRACE_END_VOLTAGE_LEVEL();
1624
1625         if (fast_validate) {
1626                 BW_VAL_TRACE_SKIP(fast);
1627                 goto validate_out;
1628         }
1629
1630         dcn20_calculate_wm(dc, context, pipes, &pipe_cnt, pipe_split_from, vlevel, fast_validate);
1631         dcn20_calculate_dlg_params(dc, context, pipes, pipe_cnt, vlevel);
1632
1633         BW_VAL_TRACE_END_WATERMARKS();
1634
1635         goto validate_out;
1636
1637 validate_fail:
1638         DC_LOG_WARNING("Mode Validation Warning: %s failed validation.\n",
1639                 dml_get_status_message(context->bw_ctx.dml.vba.ValidationStatus[context->bw_ctx.dml.vba.soc.num_states]));
1640
1641         BW_VAL_TRACE_SKIP(fail);
1642         out = false;
1643
1644 validate_out:
1645         kfree(pipes);
1646
1647         BW_VAL_TRACE_FINISH();
1648
1649         return out;
1650 }
1651
1652 bool dcn20_validate_bandwidth_fp(struct dc *dc,
1653                                 struct dc_state *context,
1654                                 bool fast_validate)
1655 {
1656        bool voltage_supported = false;
1657        bool full_pstate_supported = false;
1658        bool dummy_pstate_supported = false;
1659        double p_state_latency_us;
1660
1661        dc_assert_fp_enabled();
1662
1663        p_state_latency_us = context->bw_ctx.dml.soc.dram_clock_change_latency_us;
1664        context->bw_ctx.dml.soc.disable_dram_clock_change_vactive_support =
1665                dc->debug.disable_dram_clock_change_vactive_support;
1666        context->bw_ctx.dml.soc.allow_dram_clock_one_display_vactive =
1667                dc->debug.enable_dram_clock_change_one_display_vactive;
1668
1669        /*Unsafe due to current pipe merge and split logic*/
1670        ASSERT(context != dc->current_state);
1671
1672        if (fast_validate) {
1673                return dcn20_validate_bandwidth_internal(dc, context, true);
1674        }
1675
1676        // Best case, we support full UCLK switch latency
1677        voltage_supported = dcn20_validate_bandwidth_internal(dc, context, false);
1678        full_pstate_supported = context->bw_ctx.bw.dcn.clk.p_state_change_support;
1679
1680        if (context->bw_ctx.dml.soc.dummy_pstate_latency_us == 0 ||
1681                (voltage_supported && full_pstate_supported)) {
1682                context->bw_ctx.bw.dcn.clk.p_state_change_support = full_pstate_supported;
1683                goto restore_dml_state;
1684        }
1685
1686        // Fallback: Try to only support G6 temperature read latency
1687        context->bw_ctx.dml.soc.dram_clock_change_latency_us = context->bw_ctx.dml.soc.dummy_pstate_latency_us;
1688
1689        voltage_supported = dcn20_validate_bandwidth_internal(dc, context, false);
1690        dummy_pstate_supported = context->bw_ctx.bw.dcn.clk.p_state_change_support;
1691
1692        if (voltage_supported && (dummy_pstate_supported || !(context->stream_count))) {
1693                context->bw_ctx.bw.dcn.clk.p_state_change_support = false;
1694                goto restore_dml_state;
1695        }
1696
1697        // ERROR: fallback is supposed to always work.
1698        ASSERT(false);
1699
1700 restore_dml_state:
1701        context->bw_ctx.dml.soc.dram_clock_change_latency_us = p_state_latency_us;
1702        return voltage_supported;
1703 }
1704
1705 void dcn20_fpu_set_wm_ranges(int i,
1706                             struct pp_smu_wm_range_sets *ranges,
1707                             struct _vcs_dpi_soc_bounding_box_st *loaded_bb)
1708 {
1709        dc_assert_fp_enabled();
1710
1711        ranges->reader_wm_sets[i].min_fill_clk_mhz = (i > 0) ? (loaded_bb->clock_limits[i - 1].dram_speed_mts / 16) + 1 : 0;
1712        ranges->reader_wm_sets[i].max_fill_clk_mhz = loaded_bb->clock_limits[i].dram_speed_mts / 16;
1713 }
1714
1715 void dcn20_fpu_adjust_dppclk(struct vba_vars_st *v,
1716                             int vlevel,
1717                             int max_mpc_comb,
1718                             int pipe_idx,
1719                             bool is_validating_bw)
1720 {
1721        dc_assert_fp_enabled();
1722
1723        if (is_validating_bw)
1724                v->RequiredDPPCLK[vlevel][max_mpc_comb][pipe_idx] *= 2;
1725        else
1726                v->RequiredDPPCLK[vlevel][max_mpc_comb][pipe_idx] /= 2;
1727 }
1728
1729 int dcn21_populate_dml_pipes_from_context(struct dc *dc,
1730                                           struct dc_state *context,
1731                                           display_e2e_pipe_params_st *pipes,
1732                                           bool fast_validate)
1733 {
1734         uint32_t pipe_cnt;
1735         int i;
1736
1737         dc_assert_fp_enabled();
1738
1739         pipe_cnt = dcn20_populate_dml_pipes_from_context(dc, context, pipes, fast_validate);
1740
1741         for (i = 0; i < pipe_cnt; i++) {
1742
1743                 pipes[i].pipe.src.hostvm = dc->res_pool->hubbub->riommu_active;
1744                 pipes[i].pipe.src.gpuvm = 1;
1745         }
1746
1747         return pipe_cnt;
1748 }
1749
1750 static void patch_bounding_box(struct dc *dc, struct _vcs_dpi_soc_bounding_box_st *bb)
1751 {
1752         int i;
1753
1754         if (dc->bb_overrides.sr_exit_time_ns) {
1755                 for (i = 0; i < WM_SET_COUNT; i++) {
1756                           dc->clk_mgr->bw_params->wm_table.entries[i].sr_exit_time_us =
1757                                           dc->bb_overrides.sr_exit_time_ns / 1000.0;
1758                 }
1759         }
1760
1761         if (dc->bb_overrides.sr_enter_plus_exit_time_ns) {
1762                 for (i = 0; i < WM_SET_COUNT; i++) {
1763                           dc->clk_mgr->bw_params->wm_table.entries[i].sr_enter_plus_exit_time_us =
1764                                           dc->bb_overrides.sr_enter_plus_exit_time_ns / 1000.0;
1765                 }
1766         }
1767
1768         if (dc->bb_overrides.urgent_latency_ns) {
1769                 bb->urgent_latency_us = dc->bb_overrides.urgent_latency_ns / 1000.0;
1770         }
1771
1772         if (dc->bb_overrides.dram_clock_change_latency_ns) {
1773                 for (i = 0; i < WM_SET_COUNT; i++) {
1774                         dc->clk_mgr->bw_params->wm_table.entries[i].pstate_latency_us =
1775                                 dc->bb_overrides.dram_clock_change_latency_ns / 1000.0;
1776                 }
1777         }
1778 }
1779
1780 static void calculate_wm_set_for_vlevel(int vlevel,
1781                                         struct wm_range_table_entry *table_entry,
1782                                         struct dcn_watermarks *wm_set,
1783                                         struct display_mode_lib *dml,
1784                                         display_e2e_pipe_params_st *pipes,
1785                                         int pipe_cnt)
1786 {
1787         double dram_clock_change_latency_cached = dml->soc.dram_clock_change_latency_us;
1788
1789         ASSERT(vlevel < dml->soc.num_states);
1790         /* only pipe 0 is read for voltage and dcf/soc clocks */
1791         pipes[0].clks_cfg.voltage = vlevel;
1792         pipes[0].clks_cfg.dcfclk_mhz = dml->soc.clock_limits[vlevel].dcfclk_mhz;
1793         pipes[0].clks_cfg.socclk_mhz = dml->soc.clock_limits[vlevel].socclk_mhz;
1794
1795         dml->soc.dram_clock_change_latency_us = table_entry->pstate_latency_us;
1796         dml->soc.sr_exit_time_us = table_entry->sr_exit_time_us;
1797         dml->soc.sr_enter_plus_exit_time_us = table_entry->sr_enter_plus_exit_time_us;
1798
1799         wm_set->urgent_ns = get_wm_urgent(dml, pipes, pipe_cnt) * 1000;
1800         wm_set->cstate_pstate.cstate_enter_plus_exit_ns = get_wm_stutter_enter_exit(dml, pipes, pipe_cnt) * 1000;
1801         wm_set->cstate_pstate.cstate_exit_ns = get_wm_stutter_exit(dml, pipes, pipe_cnt) * 1000;
1802         wm_set->cstate_pstate.pstate_change_ns = get_wm_dram_clock_change(dml, pipes, pipe_cnt) * 1000;
1803         wm_set->pte_meta_urgent_ns = get_wm_memory_trip(dml, pipes, pipe_cnt) * 1000;
1804         wm_set->frac_urg_bw_nom = get_fraction_of_urgent_bandwidth(dml, pipes, pipe_cnt) * 1000;
1805         wm_set->frac_urg_bw_flip = get_fraction_of_urgent_bandwidth_imm_flip(dml, pipes, pipe_cnt) * 1000;
1806         wm_set->urgent_latency_ns = get_urgent_latency(dml, pipes, pipe_cnt) * 1000;
1807         dml->soc.dram_clock_change_latency_us = dram_clock_change_latency_cached;
1808 }
1809
1810 static void dcn21_calculate_wm(struct dc *dc, struct dc_state *context,
1811                         display_e2e_pipe_params_st *pipes,
1812                         int *out_pipe_cnt,
1813                         int *pipe_split_from,
1814                         int vlevel_req,
1815                         bool fast_validate)
1816 {
1817         int pipe_cnt, i, pipe_idx;
1818         int vlevel, vlevel_max;
1819         struct wm_range_table_entry *table_entry;
1820         struct clk_bw_params *bw_params = dc->clk_mgr->bw_params;
1821
1822         ASSERT(bw_params);
1823
1824         patch_bounding_box(dc, &context->bw_ctx.dml.soc);
1825
1826         for (i = 0, pipe_idx = 0, pipe_cnt = 0; i < dc->res_pool->pipe_count; i++) {
1827                         if (!context->res_ctx.pipe_ctx[i].stream)
1828                                 continue;
1829
1830                         pipes[pipe_cnt].clks_cfg.refclk_mhz = dc->res_pool->ref_clocks.dchub_ref_clock_inKhz / 1000.0;
1831                         pipes[pipe_cnt].clks_cfg.dispclk_mhz = context->bw_ctx.dml.vba.RequiredDISPCLK[vlevel_req][context->bw_ctx.dml.vba.maxMpcComb];
1832
1833                         if (pipe_split_from[i] < 0) {
1834                                 pipes[pipe_cnt].clks_cfg.dppclk_mhz =
1835                                                 context->bw_ctx.dml.vba.RequiredDPPCLK[vlevel_req][context->bw_ctx.dml.vba.maxMpcComb][pipe_idx];
1836                                 if (context->bw_ctx.dml.vba.BlendingAndTiming[pipe_idx] == pipe_idx)
1837                                         pipes[pipe_cnt].pipe.dest.odm_combine =
1838                                                         context->bw_ctx.dml.vba.ODMCombineEnablePerState[vlevel_req][pipe_idx];
1839                                 else
1840                                         pipes[pipe_cnt].pipe.dest.odm_combine = 0;
1841                                 pipe_idx++;
1842                         } else {
1843                                 pipes[pipe_cnt].clks_cfg.dppclk_mhz =
1844                                                 context->bw_ctx.dml.vba.RequiredDPPCLK[vlevel_req][context->bw_ctx.dml.vba.maxMpcComb][pipe_split_from[i]];
1845                                 if (context->bw_ctx.dml.vba.BlendingAndTiming[pipe_split_from[i]] == pipe_split_from[i])
1846                                         pipes[pipe_cnt].pipe.dest.odm_combine =
1847                                                         context->bw_ctx.dml.vba.ODMCombineEnablePerState[vlevel_req][pipe_split_from[i]];
1848                                 else
1849                                         pipes[pipe_cnt].pipe.dest.odm_combine = 0;
1850                         }
1851                         pipe_cnt++;
1852         }
1853
1854         if (pipe_cnt != pipe_idx) {
1855                 if (dc->res_pool->funcs->populate_dml_pipes)
1856                         pipe_cnt = dc->res_pool->funcs->populate_dml_pipes(dc,
1857                                 context, pipes, fast_validate);
1858                 else
1859                         pipe_cnt = dcn21_populate_dml_pipes_from_context(dc,
1860                                 context, pipes, fast_validate);
1861         }
1862
1863         *out_pipe_cnt = pipe_cnt;
1864
1865         vlevel_max = bw_params->clk_table.num_entries - 1;
1866
1867
1868         /* WM Set D */
1869         table_entry = &bw_params->wm_table.entries[WM_D];
1870         if (table_entry->wm_type == WM_TYPE_RETRAINING)
1871                 vlevel = 0;
1872         else
1873                 vlevel = vlevel_max;
1874         calculate_wm_set_for_vlevel(vlevel, table_entry, &context->bw_ctx.bw.dcn.watermarks.d,
1875                                                 &context->bw_ctx.dml, pipes, pipe_cnt);
1876         /* WM Set C */
1877         table_entry = &bw_params->wm_table.entries[WM_C];
1878         vlevel = MIN(MAX(vlevel_req, 3), vlevel_max);
1879         calculate_wm_set_for_vlevel(vlevel, table_entry, &context->bw_ctx.bw.dcn.watermarks.c,
1880                                                 &context->bw_ctx.dml, pipes, pipe_cnt);
1881         /* WM Set B */
1882         table_entry = &bw_params->wm_table.entries[WM_B];
1883         vlevel = MIN(MAX(vlevel_req, 2), vlevel_max);
1884         calculate_wm_set_for_vlevel(vlevel, table_entry, &context->bw_ctx.bw.dcn.watermarks.b,
1885                                                 &context->bw_ctx.dml, pipes, pipe_cnt);
1886
1887         /* WM Set A */
1888         table_entry = &bw_params->wm_table.entries[WM_A];
1889         vlevel = MIN(vlevel_req, vlevel_max);
1890         calculate_wm_set_for_vlevel(vlevel, table_entry, &context->bw_ctx.bw.dcn.watermarks.a,
1891                                                 &context->bw_ctx.dml, pipes, pipe_cnt);
1892 }
1893
1894 bool dcn21_validate_bandwidth_fp(struct dc *dc,
1895                                  struct dc_state *context,
1896                                  bool fast_validate)
1897 {
1898         bool out = false;
1899
1900         BW_VAL_TRACE_SETUP();
1901
1902         int vlevel = 0;
1903         int pipe_split_from[MAX_PIPES];
1904         int pipe_cnt = 0;
1905         display_e2e_pipe_params_st *pipes = kzalloc(dc->res_pool->pipe_count * sizeof(display_e2e_pipe_params_st), GFP_ATOMIC);
1906         DC_LOGGER_INIT(dc->ctx->logger);
1907
1908         BW_VAL_TRACE_COUNT();
1909
1910         dc_assert_fp_enabled();
1911
1912         /*Unsafe due to current pipe merge and split logic*/
1913         ASSERT(context != dc->current_state);
1914
1915         out = dcn21_fast_validate_bw(dc, context, pipes, &pipe_cnt, pipe_split_from, &vlevel, fast_validate);
1916
1917         if (pipe_cnt == 0)
1918                 goto validate_out;
1919
1920         if (!out)
1921                 goto validate_fail;
1922
1923         BW_VAL_TRACE_END_VOLTAGE_LEVEL();
1924
1925         if (fast_validate) {
1926                 BW_VAL_TRACE_SKIP(fast);
1927                 goto validate_out;
1928         }
1929
1930         dcn21_calculate_wm(dc, context, pipes, &pipe_cnt, pipe_split_from, vlevel, fast_validate);
1931         dcn20_calculate_dlg_params(dc, context, pipes, pipe_cnt, vlevel);
1932
1933         BW_VAL_TRACE_END_WATERMARKS();
1934
1935         goto validate_out;
1936
1937 validate_fail:
1938         DC_LOG_WARNING("Mode Validation Warning: %s failed validation.\n",
1939                         dml_get_status_message(context->bw_ctx.dml.vba.ValidationStatus[context->bw_ctx.dml.vba.soc.num_states]));
1940
1941         BW_VAL_TRACE_SKIP(fail);
1942         out = false;
1943
1944 validate_out:
1945         kfree(pipes);
1946
1947         BW_VAL_TRACE_FINISH();
1948
1949         return out;
1950 }
1951
1952 static struct _vcs_dpi_voltage_scaling_st construct_low_pstate_lvl(struct clk_limit_table *clk_table, unsigned int high_voltage_lvl)
1953 {
1954         struct _vcs_dpi_voltage_scaling_st low_pstate_lvl;
1955         int i;
1956
1957         low_pstate_lvl.state = 1;
1958         low_pstate_lvl.dcfclk_mhz = clk_table->entries[0].dcfclk_mhz;
1959         low_pstate_lvl.fabricclk_mhz = clk_table->entries[0].fclk_mhz;
1960         low_pstate_lvl.socclk_mhz = clk_table->entries[0].socclk_mhz;
1961         low_pstate_lvl.dram_speed_mts = clk_table->entries[0].memclk_mhz * 2;
1962
1963         low_pstate_lvl.dispclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].dispclk_mhz;
1964         low_pstate_lvl.dppclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].dppclk_mhz;
1965         low_pstate_lvl.dram_bw_per_chan_gbps = dcn2_1_soc.clock_limits[high_voltage_lvl].dram_bw_per_chan_gbps;
1966         low_pstate_lvl.dscclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].dscclk_mhz;
1967         low_pstate_lvl.dtbclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].dtbclk_mhz;
1968         low_pstate_lvl.phyclk_d18_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].phyclk_d18_mhz;
1969         low_pstate_lvl.phyclk_mhz = dcn2_1_soc.clock_limits[high_voltage_lvl].phyclk_mhz;
1970
1971         for (i = clk_table->num_entries; i > 1; i--)
1972                 clk_table->entries[i] = clk_table->entries[i-1];
1973         clk_table->entries[1] = clk_table->entries[0];
1974         clk_table->num_entries++;
1975
1976         return low_pstate_lvl;
1977 }
1978
1979 void dcn21_update_bw_bounding_box(struct dc *dc, struct clk_bw_params *bw_params)
1980 {
1981         struct dcn21_resource_pool *pool = TO_DCN21_RES_POOL(dc->res_pool);
1982         struct clk_limit_table *clk_table = &bw_params->clk_table;
1983         struct _vcs_dpi_voltage_scaling_st clock_limits[DC__VOLTAGE_STATES];
1984         unsigned int i, closest_clk_lvl = 0, k = 0;
1985         int j;
1986
1987         dc_assert_fp_enabled();
1988
1989         dcn2_1_ip.max_num_otg = pool->base.res_cap->num_timing_generator;
1990         dcn2_1_ip.max_num_dpp = pool->base.pipe_count;
1991         dcn2_1_soc.num_chans = bw_params->num_channels;
1992
1993         ASSERT(clk_table->num_entries);
1994         /* Copy dcn2_1_soc.clock_limits to clock_limits to avoid copying over null states later */
1995         for (i = 0; i < dcn2_1_soc.num_states + 1; i++) {
1996                 clock_limits[i] = dcn2_1_soc.clock_limits[i];
1997         }
1998
1999         for (i = 0; i < clk_table->num_entries; i++) {
2000                 /* loop backwards*/
2001                 for (closest_clk_lvl = 0, j = dcn2_1_soc.num_states - 1; j >= 0; j--) {
2002                         if ((unsigned int) dcn2_1_soc.clock_limits[j].dcfclk_mhz <= clk_table->entries[i].dcfclk_mhz) {
2003                                 closest_clk_lvl = j;
2004                                 break;
2005                         }
2006                 }
2007
2008                 /* clk_table[1] is reserved for min DF PState.  skip here to fill in later. */
2009                 if (i == 1)
2010                         k++;
2011
2012                 clock_limits[k].state = k;
2013                 clock_limits[k].dcfclk_mhz = clk_table->entries[i].dcfclk_mhz;
2014                 clock_limits[k].fabricclk_mhz = clk_table->entries[i].fclk_mhz;
2015                 clock_limits[k].socclk_mhz = clk_table->entries[i].socclk_mhz;
2016                 clock_limits[k].dram_speed_mts = clk_table->entries[i].memclk_mhz * 2;
2017
2018                 clock_limits[k].dispclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].dispclk_mhz;
2019                 clock_limits[k].dppclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].dppclk_mhz;
2020                 clock_limits[k].dram_bw_per_chan_gbps = dcn2_1_soc.clock_limits[closest_clk_lvl].dram_bw_per_chan_gbps;
2021                 clock_limits[k].dscclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].dscclk_mhz;
2022                 clock_limits[k].dtbclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].dtbclk_mhz;
2023                 clock_limits[k].phyclk_d18_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].phyclk_d18_mhz;
2024                 clock_limits[k].phyclk_mhz = dcn2_1_soc.clock_limits[closest_clk_lvl].phyclk_mhz;
2025
2026                 k++;
2027         }
2028         for (i = 0; i < clk_table->num_entries + 1; i++)
2029                 dcn2_1_soc.clock_limits[i] = clock_limits[i];
2030         if (clk_table->num_entries) {
2031                 dcn2_1_soc.num_states = clk_table->num_entries + 1;
2032                 /* fill in min DF PState */
2033                 dcn2_1_soc.clock_limits[1] = construct_low_pstate_lvl(clk_table, closest_clk_lvl);
2034                 /* duplicate last level */
2035                 dcn2_1_soc.clock_limits[dcn2_1_soc.num_states] = dcn2_1_soc.clock_limits[dcn2_1_soc.num_states - 1];
2036                 dcn2_1_soc.clock_limits[dcn2_1_soc.num_states].state = dcn2_1_soc.num_states;
2037         }
2038
2039         dml_init_instance(&dc->dml, &dcn2_1_soc, &dcn2_1_ip, DML_PROJECT_DCN21);
2040 }