1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27#include "dm_services.h"
28#include "dc.h"
29#include "dcn_calcs.h"
30#include "dcn_calc_auto.h"
31#include "dal_asic_id.h"
32#include "resource.h"
33#include "dcn10/dcn10_resource.h"
34#include "dcn10/dcn10_hubbub.h"
35#include "dml/dml1_display_rq_dlg_calc.h"
36
37#include "dcn_calc_math.h"
38
39#define DC_LOGGER \
40 dc->ctx->logger
41
42#define WM_SET_COUNT 4
43#define WM_A 0
44#define WM_B 1
45#define WM_C 2
46#define WM_D 3
47
48
49
50
51
52
53
54
55
56
57
58
59
60const struct dcn_soc_bounding_box dcn10_soc_defaults = {
61
62 .sr_exit_time = 17,
63 .sr_enter_plus_exit_time = 19,
64 .urgent_latency = 4,
65 .dram_clock_change_latency = 17,
66 .write_back_latency = 12,
67 .percent_of_ideal_drambw_received_after_urg_latency = 80,
68
69
70
71
72
73
74
75 .dcfclkv_max0p9 = 655,
76 .dcfclkv_nom0p8 = 626,
77 .dcfclkv_mid0p72 = 600,
78 .dcfclkv_min0p65 = 300,
79
80
81 .max_dispclk_vmax0p9 = 1108,
82 .max_dispclk_vnom0p8 = 1029,
83 .max_dispclk_vmid0p72 = 960,
84 .max_dispclk_vmin0p65 = 626,
85
86
87 .max_dppclk_vmax0p9 = 720,
88 .max_dppclk_vnom0p8 = 686,
89 .max_dppclk_vmid0p72 = 626,
90 .max_dppclk_vmin0p65 = 400,
91
92
93 .phyclkv_max0p9 = 900,
94 .phyclkv_nom0p8 = 847,
95 .phyclkv_mid0p72 = 800,
96 .phyclkv_min0p65 = 600,
97
98
99
100 .fabric_and_dram_bandwidth_vmax0p9 = 38.4f,
101 .fabric_and_dram_bandwidth_vnom0p8 = 34.133f,
102 .fabric_and_dram_bandwidth_vmid0p72 = 29.866f,
103 .fabric_and_dram_bandwidth_vmin0p65 = 12.8f,
104
105
106
107
108
109
110
111 .number_of_channels = 2,
112
113 .socclk = 208,
114 .downspreading = 0.5f,
115 .round_trip_ping_latency_cycles = 128,
116 .urgent_out_of_order_return_per_channel = 256,
117 .vmm_page_size = 4096,
118 .return_bus_width = 64,
119 .max_request_size = 256,
120
121
122 .percent_disp_bw_limit = 0.3f
123};
124
125const struct dcn_ip_params dcn10_ip_defaults = {
126 .rob_buffer_size_in_kbyte = 64,
127 .det_buffer_size_in_kbyte = 164,
128 .dpp_output_buffer_pixels = 2560,
129 .opp_output_buffer_lines = 1,
130 .pixel_chunk_size_in_kbyte = 8,
131 .pte_enable = dcn_bw_yes,
132 .pte_chunk_size = 2,
133 .meta_chunk_size = 2,
134 .writeback_chunk_size = 2,
135 .odm_capability = dcn_bw_no,
136 .dsc_capability = dcn_bw_no,
137 .line_buffer_size = 589824,
138 .max_line_buffer_lines = 12,
139 .is_line_buffer_bpp_fixed = dcn_bw_no,
140 .line_buffer_fixed_bpp = dcn_bw_na,
141 .writeback_luma_buffer_size = 12,
142 .writeback_chroma_buffer_size = 8,
143 .max_num_dpp = 4,
144 .max_num_writeback = 2,
145 .max_dchub_topscl_throughput = 4,
146 .max_pscl_tolb_throughput = 2,
147 .max_lb_tovscl_throughput = 4,
148 .max_vscl_tohscl_throughput = 4,
149 .max_hscl_ratio = 4,
150 .max_vscl_ratio = 4,
151 .max_hscl_taps = 8,
152 .max_vscl_taps = 8,
153 .pte_buffer_size_in_requests = 42,
154 .dispclk_ramping_margin = 1,
155 .under_scan_factor = 1.11f,
156 .max_inter_dcn_tile_repeaters = 8,
157 .can_vstartup_lines_exceed_vsync_plus_back_porch_lines_minus_one = dcn_bw_no,
158 .bug_forcing_luma_and_chroma_request_to_same_size_fixed = dcn_bw_no,
159 .dcfclk_cstate_latency = 10
160};
161
162static enum dcn_bw_defs tl_sw_mode_to_bw_defs(enum swizzle_mode_values sw_mode)
163{
164 switch (sw_mode) {
165 case DC_SW_LINEAR:
166 return dcn_bw_sw_linear;
167 case DC_SW_4KB_S:
168 return dcn_bw_sw_4_kb_s;
169 case DC_SW_4KB_D:
170 return dcn_bw_sw_4_kb_d;
171 case DC_SW_64KB_S:
172 return dcn_bw_sw_64_kb_s;
173 case DC_SW_64KB_D:
174 return dcn_bw_sw_64_kb_d;
175 case DC_SW_VAR_S:
176 return dcn_bw_sw_var_s;
177 case DC_SW_VAR_D:
178 return dcn_bw_sw_var_d;
179 case DC_SW_64KB_S_T:
180 return dcn_bw_sw_64_kb_s_t;
181 case DC_SW_64KB_D_T:
182 return dcn_bw_sw_64_kb_d_t;
183 case DC_SW_4KB_S_X:
184 return dcn_bw_sw_4_kb_s_x;
185 case DC_SW_4KB_D_X:
186 return dcn_bw_sw_4_kb_d_x;
187 case DC_SW_64KB_S_X:
188 return dcn_bw_sw_64_kb_s_x;
189 case DC_SW_64KB_D_X:
190 return dcn_bw_sw_64_kb_d_x;
191 case DC_SW_VAR_S_X:
192 return dcn_bw_sw_var_s_x;
193 case DC_SW_VAR_D_X:
194 return dcn_bw_sw_var_d_x;
195 case DC_SW_256B_S:
196 case DC_SW_256_D:
197 case DC_SW_256_R:
198 case DC_SW_4KB_R:
199 case DC_SW_64KB_R:
200 case DC_SW_VAR_R:
201 case DC_SW_4KB_R_X:
202 case DC_SW_64KB_R_X:
203 case DC_SW_VAR_R_X:
204 default:
205 BREAK_TO_DEBUGGER();
206 return dcn_bw_sw_4_kb_s;
207 }
208}
209
210static int tl_lb_bpp_to_int(enum lb_pixel_depth depth)
211{
212 switch (depth) {
213 case LB_PIXEL_DEPTH_18BPP:
214 return 18;
215 case LB_PIXEL_DEPTH_24BPP:
216 return 24;
217 case LB_PIXEL_DEPTH_30BPP:
218 return 30;
219 case LB_PIXEL_DEPTH_36BPP:
220 return 36;
221 default:
222 return 30;
223 }
224}
225
226static enum dcn_bw_defs tl_pixel_format_to_bw_defs(enum surface_pixel_format format)
227{
228 switch (format) {
229 case SURFACE_PIXEL_FORMAT_GRPH_ARGB1555:
230 case SURFACE_PIXEL_FORMAT_GRPH_RGB565:
231 return dcn_bw_rgb_sub_16;
232 case SURFACE_PIXEL_FORMAT_GRPH_ARGB8888:
233 case SURFACE_PIXEL_FORMAT_GRPH_ABGR8888:
234 case SURFACE_PIXEL_FORMAT_GRPH_ARGB2101010:
235 case SURFACE_PIXEL_FORMAT_GRPH_ABGR2101010:
236 case SURFACE_PIXEL_FORMAT_GRPH_ABGR2101010_XR_BIAS:
237 return dcn_bw_rgb_sub_32;
238 case SURFACE_PIXEL_FORMAT_GRPH_ARGB16161616:
239 case SURFACE_PIXEL_FORMAT_GRPH_ABGR16161616:
240 case SURFACE_PIXEL_FORMAT_GRPH_ARGB16161616F:
241 case SURFACE_PIXEL_FORMAT_GRPH_ABGR16161616F:
242 return dcn_bw_rgb_sub_64;
243 case SURFACE_PIXEL_FORMAT_VIDEO_420_YCbCr:
244 case SURFACE_PIXEL_FORMAT_VIDEO_420_YCrCb:
245 return dcn_bw_yuv420_sub_8;
246 case SURFACE_PIXEL_FORMAT_VIDEO_420_10bpc_YCbCr:
247 case SURFACE_PIXEL_FORMAT_VIDEO_420_10bpc_YCrCb:
248 return dcn_bw_yuv420_sub_10;
249 default:
250 return dcn_bw_rgb_sub_32;
251 }
252}
253
254enum source_macro_tile_size swizzle_mode_to_macro_tile_size(enum swizzle_mode_values sw_mode)
255{
256 switch (sw_mode) {
257
258 case DC_SW_LINEAR:
259 return dm_4k_tile;
260 case DC_SW_4KB_S:
261 case DC_SW_4KB_S_X:
262 return dm_4k_tile;
263 case DC_SW_64KB_S:
264 case DC_SW_64KB_S_X:
265 case DC_SW_64KB_S_T:
266 return dm_64k_tile;
267 case DC_SW_VAR_S:
268 case DC_SW_VAR_S_X:
269 return dm_256k_tile;
270
271
272 case DC_SW_4KB_D:
273 case DC_SW_4KB_D_X:
274 return dm_4k_tile;
275 case DC_SW_64KB_D:
276 case DC_SW_64KB_D_X:
277 case DC_SW_64KB_D_T:
278 return dm_64k_tile;
279 case DC_SW_VAR_D:
280 case DC_SW_VAR_D_X:
281 return dm_256k_tile;
282
283 case DC_SW_4KB_R:
284 case DC_SW_4KB_R_X:
285 return dm_4k_tile;
286 case DC_SW_64KB_R:
287 case DC_SW_64KB_R_X:
288 return dm_64k_tile;
289 case DC_SW_VAR_R:
290 case DC_SW_VAR_R_X:
291 return dm_256k_tile;
292
293
294 case DC_SW_256B_S:
295 default:
296 ASSERT(0);
297 return 0;
298 }
299}
300
301static void pipe_ctx_to_e2e_pipe_params (
302 const struct pipe_ctx *pipe,
303 struct _vcs_dpi_display_pipe_params_st *input)
304{
305 input->src.is_hsplit = false;
306
307
308 if (pipe->plane_state->stereo_format == PLANE_STEREO_FORMAT_SIDE_BY_SIDE ||
309 pipe->plane_state->stereo_format == PLANE_STEREO_FORMAT_TOP_AND_BOTTOM) {
310
311 input->src.hsplit_grp = pipe->pipe_idx;
312 } else if (pipe->top_pipe != NULL && pipe->top_pipe->plane_state == pipe->plane_state) {
313 input->src.is_hsplit = true;
314 } else if (pipe->bottom_pipe != NULL && pipe->bottom_pipe->plane_state == pipe->plane_state) {
315 input->src.is_hsplit = true;
316 }
317
318 if (pipe->plane_res.dpp->ctx->dc->debug.optimized_watermark) {
319
320
321
322
323 input->src.dcc = pipe->plane_state->dcc.enable ? 1 : 0;
324 } else {
325
326
327
328
329
330
331 unsigned int bpe;
332
333 input->src.dcc = pipe->plane_res.dpp->ctx->dc->res_pool->hubbub->funcs->
334 dcc_support_pixel_format(pipe->plane_state->format, &bpe) ? 1 : 0;
335 }
336 input->src.dcc_rate = 1;
337 input->src.meta_pitch = pipe->plane_state->dcc.meta_pitch;
338 input->src.source_scan = dm_horz;
339 input->src.sw_mode = pipe->plane_state->tiling_info.gfx9.swizzle;
340
341 input->src.viewport_width = pipe->plane_res.scl_data.viewport.width;
342 input->src.viewport_height = pipe->plane_res.scl_data.viewport.height;
343 input->src.data_pitch = pipe->plane_res.scl_data.viewport.width;
344 input->src.data_pitch_c = pipe->plane_res.scl_data.viewport.width;
345 input->src.cur0_src_width = 128;
346 input->src.cur0_bpp = 32;
347
348 input->src.macro_tile_size = swizzle_mode_to_macro_tile_size(pipe->plane_state->tiling_info.gfx9.swizzle);
349
350 switch (pipe->plane_state->rotation) {
351 case ROTATION_ANGLE_0:
352 case ROTATION_ANGLE_180:
353 input->src.source_scan = dm_horz;
354 break;
355 case ROTATION_ANGLE_90:
356 case ROTATION_ANGLE_270:
357 input->src.source_scan = dm_vert;
358 break;
359 default:
360 ASSERT(0);
361 break;
362 }
363
364
365 switch (pipe->plane_state->format) {
366 case SURFACE_PIXEL_FORMAT_VIDEO_420_YCbCr:
367 case SURFACE_PIXEL_FORMAT_VIDEO_420_YCrCb:
368 input->src.source_format = dm_420_8;
369 input->src.viewport_width_c = input->src.viewport_width / 2;
370 input->src.viewport_height_c = input->src.viewport_height / 2;
371 break;
372 case SURFACE_PIXEL_FORMAT_VIDEO_420_10bpc_YCbCr:
373 case SURFACE_PIXEL_FORMAT_VIDEO_420_10bpc_YCrCb:
374 input->src.source_format = dm_420_10;
375 input->src.viewport_width_c = input->src.viewport_width / 2;
376 input->src.viewport_height_c = input->src.viewport_height / 2;
377 break;
378 case SURFACE_PIXEL_FORMAT_GRPH_ARGB16161616:
379 case SURFACE_PIXEL_FORMAT_GRPH_ABGR16161616:
380 case SURFACE_PIXEL_FORMAT_GRPH_ARGB16161616F:
381 case SURFACE_PIXEL_FORMAT_GRPH_ABGR16161616F:
382 input->src.source_format = dm_444_64;
383 input->src.viewport_width_c = input->src.viewport_width;
384 input->src.viewport_height_c = input->src.viewport_height;
385 break;
386 case SURFACE_PIXEL_FORMAT_GRPH_RGBE_ALPHA:
387 input->src.source_format = dm_rgbe_alpha;
388 input->src.viewport_width_c = input->src.viewport_width;
389 input->src.viewport_height_c = input->src.viewport_height;
390 break;
391 default:
392 input->src.source_format = dm_444_32;
393 input->src.viewport_width_c = input->src.viewport_width;
394 input->src.viewport_height_c = input->src.viewport_height;
395 break;
396 }
397
398 input->scale_taps.htaps = pipe->plane_res.scl_data.taps.h_taps;
399 input->scale_ratio_depth.hscl_ratio = pipe->plane_res.scl_data.ratios.horz.value/4294967296.0;
400 input->scale_ratio_depth.vscl_ratio = pipe->plane_res.scl_data.ratios.vert.value/4294967296.0;
401 input->scale_ratio_depth.vinit = pipe->plane_res.scl_data.inits.v.value/4294967296.0;
402 if (input->scale_ratio_depth.vinit < 1.0)
403 input->scale_ratio_depth.vinit = 1;
404 input->scale_taps.vtaps = pipe->plane_res.scl_data.taps.v_taps;
405 input->scale_taps.vtaps_c = pipe->plane_res.scl_data.taps.v_taps_c;
406 input->scale_taps.htaps_c = pipe->plane_res.scl_data.taps.h_taps_c;
407 input->scale_ratio_depth.hscl_ratio_c = pipe->plane_res.scl_data.ratios.horz_c.value/4294967296.0;
408 input->scale_ratio_depth.vscl_ratio_c = pipe->plane_res.scl_data.ratios.vert_c.value/4294967296.0;
409 input->scale_ratio_depth.vinit_c = pipe->plane_res.scl_data.inits.v_c.value/4294967296.0;
410 if (input->scale_ratio_depth.vinit_c < 1.0)
411 input->scale_ratio_depth.vinit_c = 1;
412 switch (pipe->plane_res.scl_data.lb_params.depth) {
413 case LB_PIXEL_DEPTH_30BPP:
414 input->scale_ratio_depth.lb_depth = 30; break;
415 case LB_PIXEL_DEPTH_36BPP:
416 input->scale_ratio_depth.lb_depth = 36; break;
417 default:
418 input->scale_ratio_depth.lb_depth = 24; break;
419 }
420
421
422 input->dest.vactive = pipe->stream->timing.v_addressable + pipe->stream->timing.v_border_top
423 + pipe->stream->timing.v_border_bottom;
424
425 input->dest.recout_width = pipe->plane_res.scl_data.recout.width;
426 input->dest.recout_height = pipe->plane_res.scl_data.recout.height;
427
428 input->dest.full_recout_width = pipe->plane_res.scl_data.recout.width;
429 input->dest.full_recout_height = pipe->plane_res.scl_data.recout.height;
430
431 input->dest.htotal = pipe->stream->timing.h_total;
432 input->dest.hblank_start = input->dest.htotal - pipe->stream->timing.h_front_porch;
433 input->dest.hblank_end = input->dest.hblank_start
434 - pipe->stream->timing.h_addressable
435 - pipe->stream->timing.h_border_left
436 - pipe->stream->timing.h_border_right;
437
438 input->dest.vtotal = pipe->stream->timing.v_total;
439 input->dest.vblank_start = input->dest.vtotal - pipe->stream->timing.v_front_porch;
440 input->dest.vblank_end = input->dest.vblank_start
441 - pipe->stream->timing.v_addressable
442 - pipe->stream->timing.v_border_bottom
443 - pipe->stream->timing.v_border_top;
444 input->dest.pixel_rate_mhz = pipe->stream->timing.pix_clk_100hz/10000.0;
445 input->dest.vstartup_start = pipe->pipe_dlg_param.vstartup_start;
446 input->dest.vupdate_offset = pipe->pipe_dlg_param.vupdate_offset;
447 input->dest.vupdate_offset = pipe->pipe_dlg_param.vupdate_offset;
448 input->dest.vupdate_width = pipe->pipe_dlg_param.vupdate_width;
449
450}
451
452static void dcn_bw_calc_rq_dlg_ttu(
453 const struct dc *dc,
454 const struct dcn_bw_internal_vars *v,
455 struct pipe_ctx *pipe,
456 int in_idx)
457{
458 struct display_mode_lib *dml = (struct display_mode_lib *)(&dc->dml);
459 struct _vcs_dpi_display_dlg_regs_st *dlg_regs = &pipe->dlg_regs;
460 struct _vcs_dpi_display_ttu_regs_st *ttu_regs = &pipe->ttu_regs;
461 struct _vcs_dpi_display_rq_regs_st *rq_regs = &pipe->rq_regs;
462 struct _vcs_dpi_display_rq_params_st *rq_param = &pipe->dml_rq_param;
463 struct _vcs_dpi_display_dlg_sys_params_st *dlg_sys_param = &pipe->dml_dlg_sys_param;
464 struct _vcs_dpi_display_e2e_pipe_params_st *input = &pipe->dml_input;
465 float total_active_bw = 0;
466 float total_prefetch_bw = 0;
467 int total_flip_bytes = 0;
468 int i;
469
470 memset(dlg_regs, 0, sizeof(*dlg_regs));
471 memset(ttu_regs, 0, sizeof(*ttu_regs));
472 memset(rq_regs, 0, sizeof(*rq_regs));
473 memset(rq_param, 0, sizeof(*rq_param));
474 memset(dlg_sys_param, 0, sizeof(*dlg_sys_param));
475 memset(input, 0, sizeof(*input));
476
477 for (i = 0; i < number_of_planes; i++) {
478 total_active_bw += v->read_bandwidth[i];
479 total_prefetch_bw += v->prefetch_bandwidth[i];
480 total_flip_bytes += v->total_immediate_flip_bytes[i];
481 }
482 dlg_sys_param->total_flip_bw = v->return_bw - dcn_bw_max2(total_active_bw, total_prefetch_bw);
483 if (dlg_sys_param->total_flip_bw < 0.0)
484 dlg_sys_param->total_flip_bw = 0;
485
486 dlg_sys_param->t_mclk_wm_us = v->dram_clock_change_watermark;
487 dlg_sys_param->t_sr_wm_us = v->stutter_enter_plus_exit_watermark;
488 dlg_sys_param->t_urg_wm_us = v->urgent_watermark;
489 dlg_sys_param->t_extra_us = v->urgent_extra_latency;
490 dlg_sys_param->deepsleep_dcfclk_mhz = v->dcf_clk_deep_sleep;
491 dlg_sys_param->total_flip_bytes = total_flip_bytes;
492
493 pipe_ctx_to_e2e_pipe_params(pipe, &input->pipe);
494 input->clks_cfg.dcfclk_mhz = v->dcfclk;
495 input->clks_cfg.dispclk_mhz = v->dispclk;
496 input->clks_cfg.dppclk_mhz = v->dppclk;
497 input->clks_cfg.refclk_mhz = dc->res_pool->ref_clocks.dchub_ref_clock_inKhz / 1000.0;
498 input->clks_cfg.socclk_mhz = v->socclk;
499 input->clks_cfg.voltage = v->voltage_level;
500
501 input->dout.output_format = (v->output_format[in_idx] == dcn_bw_420) ? dm_420 : dm_444;
502 input->dout.output_type = (v->output[in_idx] == dcn_bw_hdmi) ? dm_hdmi : dm_dp;
503
504
505
506 dlg_sys_param->t_srx_delay_us = dc->dcn_ip->dcfclk_cstate_latency / v->dcf_clk_deep_sleep;
507
508 dml1_rq_dlg_get_rq_params(dml, rq_param, &input->pipe.src);
509 dml1_extract_rq_regs(dml, rq_regs, rq_param);
510 dml1_rq_dlg_get_dlg_params(
511 dml,
512 dlg_regs,
513 ttu_regs,
514 &rq_param->dlg,
515 dlg_sys_param,
516 input,
517 true,
518 true,
519 v->pte_enable == dcn_bw_yes,
520 pipe->plane_state->flip_immediate);
521}
522
523static void split_stream_across_pipes(
524 struct resource_context *res_ctx,
525 const struct resource_pool *pool,
526 struct pipe_ctx *primary_pipe,
527 struct pipe_ctx *secondary_pipe)
528{
529 int pipe_idx = secondary_pipe->pipe_idx;
530
531 if (!primary_pipe->plane_state)
532 return;
533
534 *secondary_pipe = *primary_pipe;
535
536 secondary_pipe->pipe_idx = pipe_idx;
537 secondary_pipe->plane_res.mi = pool->mis[secondary_pipe->pipe_idx];
538 secondary_pipe->plane_res.hubp = pool->hubps[secondary_pipe->pipe_idx];
539 secondary_pipe->plane_res.ipp = pool->ipps[secondary_pipe->pipe_idx];
540 secondary_pipe->plane_res.xfm = pool->transforms[secondary_pipe->pipe_idx];
541 secondary_pipe->plane_res.dpp = pool->dpps[secondary_pipe->pipe_idx];
542 secondary_pipe->plane_res.mpcc_inst = pool->dpps[secondary_pipe->pipe_idx]->inst;
543 if (primary_pipe->bottom_pipe) {
544 ASSERT(primary_pipe->bottom_pipe != secondary_pipe);
545 secondary_pipe->bottom_pipe = primary_pipe->bottom_pipe;
546 secondary_pipe->bottom_pipe->top_pipe = secondary_pipe;
547 }
548 primary_pipe->bottom_pipe = secondary_pipe;
549 secondary_pipe->top_pipe = primary_pipe;
550
551 resource_build_scaling_params(primary_pipe);
552 resource_build_scaling_params(secondary_pipe);
553}
554
555#if 0
556static void calc_wm_sets_and_perf_params(
557 struct dc_state *context,
558 struct dcn_bw_internal_vars *v)
559{
560
561 if (v->voltage_level < 2) {
562 v->fabric_and_dram_bandwidth_per_state[1] = v->fabric_and_dram_bandwidth_vnom0p8;
563 v->fabric_and_dram_bandwidth_per_state[0] = v->fabric_and_dram_bandwidth_vnom0p8;
564 v->fabric_and_dram_bandwidth = v->fabric_and_dram_bandwidth_vnom0p8;
565 dispclkdppclkdcfclk_deep_sleep_prefetch_parameters_watermarks_and_performance_calculation(v);
566
567 context->bw_ctx.bw.dcn.watermarks.b.cstate_pstate.cstate_exit_ns =
568 v->stutter_exit_watermark * 1000;
569 context->bw_ctx.bw.dcn.watermarks.b.cstate_pstate.cstate_enter_plus_exit_ns =
570 v->stutter_enter_plus_exit_watermark * 1000;
571 context->bw_ctx.bw.dcn.watermarks.b.cstate_pstate.pstate_change_ns =
572 v->dram_clock_change_watermark * 1000;
573 context->bw_ctx.bw.dcn.watermarks.b.pte_meta_urgent_ns = v->ptemeta_urgent_watermark * 1000;
574 context->bw_ctx.bw.dcn.watermarks.b.urgent_ns = v->urgent_watermark * 1000;
575
576 v->dcfclk_per_state[1] = v->dcfclkv_nom0p8;
577 v->dcfclk_per_state[0] = v->dcfclkv_nom0p8;
578 v->dcfclk = v->dcfclkv_nom0p8;
579 dispclkdppclkdcfclk_deep_sleep_prefetch_parameters_watermarks_and_performance_calculation(v);
580
581 context->bw_ctx.bw.dcn.watermarks.c.cstate_pstate.cstate_exit_ns =
582 v->stutter_exit_watermark * 1000;
583 context->bw_ctx.bw.dcn.watermarks.c.cstate_pstate.cstate_enter_plus_exit_ns =
584 v->stutter_enter_plus_exit_watermark * 1000;
585 context->bw_ctx.bw.dcn.watermarks.c.cstate_pstate.pstate_change_ns =
586 v->dram_clock_change_watermark * 1000;
587 context->bw_ctx.bw.dcn.watermarks.c.pte_meta_urgent_ns = v->ptemeta_urgent_watermark * 1000;
588 context->bw_ctx.bw.dcn.watermarks.c.urgent_ns = v->urgent_watermark * 1000;
589 }
590
591 if (v->voltage_level < 3) {
592 v->fabric_and_dram_bandwidth_per_state[2] = v->fabric_and_dram_bandwidth_vmax0p9;
593 v->fabric_and_dram_bandwidth_per_state[1] = v->fabric_and_dram_bandwidth_vmax0p9;
594 v->fabric_and_dram_bandwidth_per_state[0] = v->fabric_and_dram_bandwidth_vmax0p9;
595 v->fabric_and_dram_bandwidth = v->fabric_and_dram_bandwidth_vmax0p9;
596 v->dcfclk_per_state[2] = v->dcfclkv_max0p9;
597 v->dcfclk_per_state[1] = v->dcfclkv_max0p9;
598 v->dcfclk_per_state[0] = v->dcfclkv_max0p9;
599 v->dcfclk = v->dcfclkv_max0p9;
600 dispclkdppclkdcfclk_deep_sleep_prefetch_parameters_watermarks_and_performance_calculation(v);
601
602 context->bw_ctx.bw.dcn.watermarks.d.cstate_pstate.cstate_exit_ns =
603 v->stutter_exit_watermark * 1000;
604 context->bw_ctx.bw.dcn.watermarks.d.cstate_pstate.cstate_enter_plus_exit_ns =
605 v->stutter_enter_plus_exit_watermark * 1000;
606 context->bw_ctx.bw.dcn.watermarks.d.cstate_pstate.pstate_change_ns =
607 v->dram_clock_change_watermark * 1000;
608 context->bw_ctx.bw.dcn.watermarks.d.pte_meta_urgent_ns = v->ptemeta_urgent_watermark * 1000;
609 context->bw_ctx.bw.dcn.watermarks.d.urgent_ns = v->urgent_watermark * 1000;
610 }
611
612 v->fabric_and_dram_bandwidth_per_state[2] = v->fabric_and_dram_bandwidth_vnom0p8;
613 v->fabric_and_dram_bandwidth_per_state[1] = v->fabric_and_dram_bandwidth_vmid0p72;
614 v->fabric_and_dram_bandwidth_per_state[0] = v->fabric_and_dram_bandwidth_vmin0p65;
615 v->fabric_and_dram_bandwidth = v->fabric_and_dram_bandwidth_per_state[v->voltage_level];
616 v->dcfclk_per_state[2] = v->dcfclkv_nom0p8;
617 v->dcfclk_per_state[1] = v->dcfclkv_mid0p72;
618 v->dcfclk_per_state[0] = v->dcfclkv_min0p65;
619 v->dcfclk = v->dcfclk_per_state[v->voltage_level];
620 dispclkdppclkdcfclk_deep_sleep_prefetch_parameters_watermarks_and_performance_calculation(v);
621
622 context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.cstate_exit_ns =
623 v->stutter_exit_watermark * 1000;
624 context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.cstate_enter_plus_exit_ns =
625 v->stutter_enter_plus_exit_watermark * 1000;
626 context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.pstate_change_ns =
627 v->dram_clock_change_watermark * 1000;
628 context->bw_ctx.bw.dcn.watermarks.a.pte_meta_urgent_ns = v->ptemeta_urgent_watermark * 1000;
629 context->bw_ctx.bw.dcn.watermarks.a.urgent_ns = v->urgent_watermark * 1000;
630 if (v->voltage_level >= 2) {
631 context->bw_ctx.bw.dcn.watermarks.b = context->bw_ctx.bw.dcn.watermarks.a;
632 context->bw_ctx.bw.dcn.watermarks.c = context->bw_ctx.bw.dcn.watermarks.a;
633 }
634 if (v->voltage_level >= 3)
635 context->bw_ctx.bw.dcn.watermarks.d = context->bw_ctx.bw.dcn.watermarks.a;
636}
637#endif
638
639static bool dcn_bw_apply_registry_override(struct dc *dc)
640{
641 bool updated = false;
642
643 DC_FP_START();
644 if ((int)(dc->dcn_soc->sr_exit_time * 1000) != dc->debug.sr_exit_time_ns
645 && dc->debug.sr_exit_time_ns) {
646 updated = true;
647 dc->dcn_soc->sr_exit_time = dc->debug.sr_exit_time_ns / 1000.0;
648 }
649
650 if ((int)(dc->dcn_soc->sr_enter_plus_exit_time * 1000)
651 != dc->debug.sr_enter_plus_exit_time_ns
652 && dc->debug.sr_enter_plus_exit_time_ns) {
653 updated = true;
654 dc->dcn_soc->sr_enter_plus_exit_time =
655 dc->debug.sr_enter_plus_exit_time_ns / 1000.0;
656 }
657
658 if ((int)(dc->dcn_soc->urgent_latency * 1000) != dc->debug.urgent_latency_ns
659 && dc->debug.urgent_latency_ns) {
660 updated = true;
661 dc->dcn_soc->urgent_latency = dc->debug.urgent_latency_ns / 1000.0;
662 }
663
664 if ((int)(dc->dcn_soc->percent_of_ideal_drambw_received_after_urg_latency * 1000)
665 != dc->debug.percent_of_ideal_drambw
666 && dc->debug.percent_of_ideal_drambw) {
667 updated = true;
668 dc->dcn_soc->percent_of_ideal_drambw_received_after_urg_latency =
669 dc->debug.percent_of_ideal_drambw;
670 }
671
672 if ((int)(dc->dcn_soc->dram_clock_change_latency * 1000)
673 != dc->debug.dram_clock_change_latency_ns
674 && dc->debug.dram_clock_change_latency_ns) {
675 updated = true;
676 dc->dcn_soc->dram_clock_change_latency =
677 dc->debug.dram_clock_change_latency_ns / 1000.0;
678 }
679 DC_FP_END();
680
681 return updated;
682}
683
684static void hack_disable_optional_pipe_split(struct dcn_bw_internal_vars *v)
685{
686
687
688
689
690 v->max_dispclk[0] = v->max_dppclk_vmin0p65;
691}
692
693static void hack_force_pipe_split(struct dcn_bw_internal_vars *v,
694 unsigned int pixel_rate_100hz)
695{
696 float pixel_rate_mhz = pixel_rate_100hz / 10000;
697
698
699
700
701
702 if (pixel_rate_mhz < v->max_dppclk[0])
703 v->max_dppclk[0] = pixel_rate_mhz;
704}
705
706static void hack_bounding_box(struct dcn_bw_internal_vars *v,
707 struct dc_debug_options *dbg,
708 struct dc_state *context)
709{
710 int i;
711
712 for (i = 0; i < MAX_PIPES; i++) {
713 struct pipe_ctx *pipe = &context->res_ctx.pipe_ctx[i];
714
715
716
717
718
719
720 if (pipe->plane_state &&
721 (pipe->plane_state->dst_rect.width <= 16 ||
722 pipe->plane_state->dst_rect.height <= 16 ||
723 pipe->plane_state->src_rect.width <= 16 ||
724 pipe->plane_state->src_rect.height <= 16)) {
725 hack_disable_optional_pipe_split(v);
726 return;
727 }
728 }
729
730 if (dbg->pipe_split_policy == MPC_SPLIT_AVOID)
731 hack_disable_optional_pipe_split(v);
732
733 if (dbg->pipe_split_policy == MPC_SPLIT_AVOID_MULT_DISP &&
734 context->stream_count >= 2)
735 hack_disable_optional_pipe_split(v);
736
737 if (context->stream_count == 1 &&
738 dbg->force_single_disp_pipe_split)
739 hack_force_pipe_split(v, context->streams[0]->timing.pix_clk_100hz);
740}
741
742unsigned int get_highest_allowed_voltage_level(uint32_t chip_family, uint32_t hw_internal_rev, uint32_t pci_revision_id)
743{
744
745 if ((chip_family == FAMILY_RV) &&
746 ASICREV_IS_RAVEN2(hw_internal_rev))
747 switch (pci_revision_id) {
748 case PRID_DALI_DE:
749 case PRID_DALI_DF:
750 case PRID_DALI_E3:
751 case PRID_DALI_E4:
752 case PRID_POLLOCK_94:
753 case PRID_POLLOCK_95:
754 case PRID_POLLOCK_E9:
755 case PRID_POLLOCK_EA:
756 case PRID_POLLOCK_EB:
757 return 0;
758 default:
759 break;
760 }
761
762
763 return 4;
764}
765
766bool dcn_validate_bandwidth(
767 struct dc *dc,
768 struct dc_state *context,
769 bool fast_validate)
770{
771
772
773
774
775 BW_VAL_TRACE_SETUP();
776
777 const struct resource_pool *pool = dc->res_pool;
778 struct dcn_bw_internal_vars *v = &context->dcn_bw_vars;
779 int i, input_idx, k;
780 int vesa_sync_start, asic_blank_end, asic_blank_start;
781 bool bw_limit_pass;
782 float bw_limit;
783
784 PERFORMANCE_TRACE_START();
785
786 BW_VAL_TRACE_COUNT();
787
788 if (dcn_bw_apply_registry_override(dc))
789 dcn_bw_sync_calcs_and_dml(dc);
790
791 memset(v, 0, sizeof(*v));
792 DC_FP_START();
793
794 v->sr_exit_time = dc->dcn_soc->sr_exit_time;
795 v->sr_enter_plus_exit_time = dc->dcn_soc->sr_enter_plus_exit_time;
796 v->urgent_latency = dc->dcn_soc->urgent_latency;
797 v->write_back_latency = dc->dcn_soc->write_back_latency;
798 v->percent_of_ideal_drambw_received_after_urg_latency =
799 dc->dcn_soc->percent_of_ideal_drambw_received_after_urg_latency;
800
801 v->dcfclkv_min0p65 = dc->dcn_soc->dcfclkv_min0p65;
802 v->dcfclkv_mid0p72 = dc->dcn_soc->dcfclkv_mid0p72;
803 v->dcfclkv_nom0p8 = dc->dcn_soc->dcfclkv_nom0p8;
804 v->dcfclkv_max0p9 = dc->dcn_soc->dcfclkv_max0p9;
805
806 v->max_dispclk_vmin0p65 = dc->dcn_soc->max_dispclk_vmin0p65;
807 v->max_dispclk_vmid0p72 = dc->dcn_soc->max_dispclk_vmid0p72;
808 v->max_dispclk_vnom0p8 = dc->dcn_soc->max_dispclk_vnom0p8;
809 v->max_dispclk_vmax0p9 = dc->dcn_soc->max_dispclk_vmax0p9;
810
811 v->max_dppclk_vmin0p65 = dc->dcn_soc->max_dppclk_vmin0p65;
812 v->max_dppclk_vmid0p72 = dc->dcn_soc->max_dppclk_vmid0p72;
813 v->max_dppclk_vnom0p8 = dc->dcn_soc->max_dppclk_vnom0p8;
814 v->max_dppclk_vmax0p9 = dc->dcn_soc->max_dppclk_vmax0p9;
815
816 v->socclk = dc->dcn_soc->socclk;
817
818 v->fabric_and_dram_bandwidth_vmin0p65 = dc->dcn_soc->fabric_and_dram_bandwidth_vmin0p65;
819 v->fabric_and_dram_bandwidth_vmid0p72 = dc->dcn_soc->fabric_and_dram_bandwidth_vmid0p72;
820 v->fabric_and_dram_bandwidth_vnom0p8 = dc->dcn_soc->fabric_and_dram_bandwidth_vnom0p8;
821 v->fabric_and_dram_bandwidth_vmax0p9 = dc->dcn_soc->fabric_and_dram_bandwidth_vmax0p9;
822
823 v->phyclkv_min0p65 = dc->dcn_soc->phyclkv_min0p65;
824 v->phyclkv_mid0p72 = dc->dcn_soc->phyclkv_mid0p72;
825 v->phyclkv_nom0p8 = dc->dcn_soc->phyclkv_nom0p8;
826 v->phyclkv_max0p9 = dc->dcn_soc->phyclkv_max0p9;
827
828 v->downspreading = dc->dcn_soc->downspreading;
829 v->round_trip_ping_latency_cycles = dc->dcn_soc->round_trip_ping_latency_cycles;
830 v->urgent_out_of_order_return_per_channel = dc->dcn_soc->urgent_out_of_order_return_per_channel;
831 v->number_of_channels = dc->dcn_soc->number_of_channels;
832 v->vmm_page_size = dc->dcn_soc->vmm_page_size;
833 v->dram_clock_change_latency = dc->dcn_soc->dram_clock_change_latency;
834 v->return_bus_width = dc->dcn_soc->return_bus_width;
835
836 v->rob_buffer_size_in_kbyte = dc->dcn_ip->rob_buffer_size_in_kbyte;
837 v->det_buffer_size_in_kbyte = dc->dcn_ip->det_buffer_size_in_kbyte;
838 v->dpp_output_buffer_pixels = dc->dcn_ip->dpp_output_buffer_pixels;
839 v->opp_output_buffer_lines = dc->dcn_ip->opp_output_buffer_lines;
840 v->pixel_chunk_size_in_kbyte = dc->dcn_ip->pixel_chunk_size_in_kbyte;
841 v->pte_enable = dc->dcn_ip->pte_enable;
842 v->pte_chunk_size = dc->dcn_ip->pte_chunk_size;
843 v->meta_chunk_size = dc->dcn_ip->meta_chunk_size;
844 v->writeback_chunk_size = dc->dcn_ip->writeback_chunk_size;
845 v->odm_capability = dc->dcn_ip->odm_capability;
846 v->dsc_capability = dc->dcn_ip->dsc_capability;
847 v->line_buffer_size = dc->dcn_ip->line_buffer_size;
848 v->is_line_buffer_bpp_fixed = dc->dcn_ip->is_line_buffer_bpp_fixed;
849 v->line_buffer_fixed_bpp = dc->dcn_ip->line_buffer_fixed_bpp;
850 v->max_line_buffer_lines = dc->dcn_ip->max_line_buffer_lines;
851 v->writeback_luma_buffer_size = dc->dcn_ip->writeback_luma_buffer_size;
852 v->writeback_chroma_buffer_size = dc->dcn_ip->writeback_chroma_buffer_size;
853 v->max_num_dpp = dc->dcn_ip->max_num_dpp;
854 v->max_num_writeback = dc->dcn_ip->max_num_writeback;
855 v->max_dchub_topscl_throughput = dc->dcn_ip->max_dchub_topscl_throughput;
856 v->max_pscl_tolb_throughput = dc->dcn_ip->max_pscl_tolb_throughput;
857 v->max_lb_tovscl_throughput = dc->dcn_ip->max_lb_tovscl_throughput;
858 v->max_vscl_tohscl_throughput = dc->dcn_ip->max_vscl_tohscl_throughput;
859 v->max_hscl_ratio = dc->dcn_ip->max_hscl_ratio;
860 v->max_vscl_ratio = dc->dcn_ip->max_vscl_ratio;
861 v->max_hscl_taps = dc->dcn_ip->max_hscl_taps;
862 v->max_vscl_taps = dc->dcn_ip->max_vscl_taps;
863 v->under_scan_factor = dc->dcn_ip->under_scan_factor;
864 v->pte_buffer_size_in_requests = dc->dcn_ip->pte_buffer_size_in_requests;
865 v->dispclk_ramping_margin = dc->dcn_ip->dispclk_ramping_margin;
866 v->max_inter_dcn_tile_repeaters = dc->dcn_ip->max_inter_dcn_tile_repeaters;
867 v->can_vstartup_lines_exceed_vsync_plus_back_porch_lines_minus_one =
868 dc->dcn_ip->can_vstartup_lines_exceed_vsync_plus_back_porch_lines_minus_one;
869 v->bug_forcing_luma_and_chroma_request_to_same_size_fixed =
870 dc->dcn_ip->bug_forcing_luma_and_chroma_request_to_same_size_fixed;
871
872 v->voltage[5] = dcn_bw_no_support;
873 v->voltage[4] = dcn_bw_v_max0p9;
874 v->voltage[3] = dcn_bw_v_max0p9;
875 v->voltage[2] = dcn_bw_v_nom0p8;
876 v->voltage[1] = dcn_bw_v_mid0p72;
877 v->voltage[0] = dcn_bw_v_min0p65;
878 v->fabric_and_dram_bandwidth_per_state[5] = v->fabric_and_dram_bandwidth_vmax0p9;
879 v->fabric_and_dram_bandwidth_per_state[4] = v->fabric_and_dram_bandwidth_vmax0p9;
880 v->fabric_and_dram_bandwidth_per_state[3] = v->fabric_and_dram_bandwidth_vmax0p9;
881 v->fabric_and_dram_bandwidth_per_state[2] = v->fabric_and_dram_bandwidth_vnom0p8;
882 v->fabric_and_dram_bandwidth_per_state[1] = v->fabric_and_dram_bandwidth_vmid0p72;
883 v->fabric_and_dram_bandwidth_per_state[0] = v->fabric_and_dram_bandwidth_vmin0p65;
884 v->dcfclk_per_state[5] = v->dcfclkv_max0p9;
885 v->dcfclk_per_state[4] = v->dcfclkv_max0p9;
886 v->dcfclk_per_state[3] = v->dcfclkv_max0p9;
887 v->dcfclk_per_state[2] = v->dcfclkv_nom0p8;
888 v->dcfclk_per_state[1] = v->dcfclkv_mid0p72;
889 v->dcfclk_per_state[0] = v->dcfclkv_min0p65;
890 v->max_dispclk[5] = v->max_dispclk_vmax0p9;
891 v->max_dispclk[4] = v->max_dispclk_vmax0p9;
892 v->max_dispclk[3] = v->max_dispclk_vmax0p9;
893 v->max_dispclk[2] = v->max_dispclk_vnom0p8;
894 v->max_dispclk[1] = v->max_dispclk_vmid0p72;
895 v->max_dispclk[0] = v->max_dispclk_vmin0p65;
896 v->max_dppclk[5] = v->max_dppclk_vmax0p9;
897 v->max_dppclk[4] = v->max_dppclk_vmax0p9;
898 v->max_dppclk[3] = v->max_dppclk_vmax0p9;
899 v->max_dppclk[2] = v->max_dppclk_vnom0p8;
900 v->max_dppclk[1] = v->max_dppclk_vmid0p72;
901 v->max_dppclk[0] = v->max_dppclk_vmin0p65;
902 v->phyclk_per_state[5] = v->phyclkv_max0p9;
903 v->phyclk_per_state[4] = v->phyclkv_max0p9;
904 v->phyclk_per_state[3] = v->phyclkv_max0p9;
905 v->phyclk_per_state[2] = v->phyclkv_nom0p8;
906 v->phyclk_per_state[1] = v->phyclkv_mid0p72;
907 v->phyclk_per_state[0] = v->phyclkv_min0p65;
908 v->synchronized_vblank = dcn_bw_no;
909 v->ta_pscalculation = dcn_bw_override;
910 v->allow_different_hratio_vratio = dcn_bw_yes;
911
912 for (i = 0, input_idx = 0; i < pool->pipe_count; i++) {
913 struct pipe_ctx *pipe = &context->res_ctx.pipe_ctx[i];
914
915 if (!pipe->stream)
916 continue;
917
918 if (pipe->top_pipe && pipe->top_pipe->plane_state == pipe->plane_state)
919 continue;
920
921 v->underscan_output[input_idx] = false;
922 v->interlace_output[input_idx] = false;
923
924 v->htotal[input_idx] = pipe->stream->timing.h_total;
925 v->vtotal[input_idx] = pipe->stream->timing.v_total;
926 v->vactive[input_idx] = pipe->stream->timing.v_addressable +
927 pipe->stream->timing.v_border_top + pipe->stream->timing.v_border_bottom;
928 v->v_sync_plus_back_porch[input_idx] = pipe->stream->timing.v_total
929 - v->vactive[input_idx]
930 - pipe->stream->timing.v_front_porch;
931 v->pixel_clock[input_idx] = pipe->stream->timing.pix_clk_100hz/10000.0;
932 if (pipe->stream->timing.timing_3d_format == TIMING_3D_FORMAT_HW_FRAME_PACKING)
933 v->pixel_clock[input_idx] *= 2;
934 if (!pipe->plane_state) {
935 v->dcc_enable[input_idx] = dcn_bw_yes;
936 v->source_pixel_format[input_idx] = dcn_bw_rgb_sub_32;
937 v->source_surface_mode[input_idx] = dcn_bw_sw_4_kb_s;
938 v->lb_bit_per_pixel[input_idx] = 30;
939 v->viewport_width[input_idx] = pipe->stream->timing.h_addressable;
940 v->viewport_height[input_idx] = pipe->stream->timing.v_addressable;
941
942
943
944
945
946
947
948 if (v->viewport_width[input_idx] > 1920)
949 v->viewport_width[input_idx] = 1920;
950 if (v->viewport_height[input_idx] > 1080)
951 v->viewport_height[input_idx] = 1080;
952 v->scaler_rec_out_width[input_idx] = v->viewport_width[input_idx];
953 v->scaler_recout_height[input_idx] = v->viewport_height[input_idx];
954 v->override_hta_ps[input_idx] = 1;
955 v->override_vta_ps[input_idx] = 1;
956 v->override_hta_pschroma[input_idx] = 1;
957 v->override_vta_pschroma[input_idx] = 1;
958 v->source_scan[input_idx] = dcn_bw_hor;
959
960 } else {
961 v->viewport_height[input_idx] = pipe->plane_res.scl_data.viewport.height;
962 v->viewport_width[input_idx] = pipe->plane_res.scl_data.viewport.width;
963 v->scaler_rec_out_width[input_idx] = pipe->plane_res.scl_data.recout.width;
964 v->scaler_recout_height[input_idx] = pipe->plane_res.scl_data.recout.height;
965 if (pipe->bottom_pipe && pipe->bottom_pipe->plane_state == pipe->plane_state) {
966 if (pipe->plane_state->rotation % 2 == 0) {
967 int viewport_end = pipe->plane_res.scl_data.viewport.width
968 + pipe->plane_res.scl_data.viewport.x;
969 int viewport_b_end = pipe->bottom_pipe->plane_res.scl_data.viewport.width
970 + pipe->bottom_pipe->plane_res.scl_data.viewport.x;
971
972 if (viewport_end > viewport_b_end)
973 v->viewport_width[input_idx] = viewport_end
974 - pipe->bottom_pipe->plane_res.scl_data.viewport.x;
975 else
976 v->viewport_width[input_idx] = viewport_b_end
977 - pipe->plane_res.scl_data.viewport.x;
978 } else {
979 int viewport_end = pipe->plane_res.scl_data.viewport.height
980 + pipe->plane_res.scl_data.viewport.y;
981 int viewport_b_end = pipe->bottom_pipe->plane_res.scl_data.viewport.height
982 + pipe->bottom_pipe->plane_res.scl_data.viewport.y;
983
984 if (viewport_end > viewport_b_end)
985 v->viewport_height[input_idx] = viewport_end
986 - pipe->bottom_pipe->plane_res.scl_data.viewport.y;
987 else
988 v->viewport_height[input_idx] = viewport_b_end
989 - pipe->plane_res.scl_data.viewport.y;
990 }
991 v->scaler_rec_out_width[input_idx] = pipe->plane_res.scl_data.recout.width
992 + pipe->bottom_pipe->plane_res.scl_data.recout.width;
993 }
994
995 if (pipe->plane_state->rotation % 2 == 0) {
996 ASSERT(pipe->plane_res.scl_data.ratios.horz.value != dc_fixpt_one.value
997 || v->scaler_rec_out_width[input_idx] == v->viewport_width[input_idx]);
998 ASSERT(pipe->plane_res.scl_data.ratios.vert.value != dc_fixpt_one.value
999 || v->scaler_recout_height[input_idx] == v->viewport_height[input_idx]);
1000 } else {
1001 ASSERT(pipe->plane_res.scl_data.ratios.horz.value != dc_fixpt_one.value
1002 || v->scaler_recout_height[input_idx] == v->viewport_width[input_idx]);
1003 ASSERT(pipe->plane_res.scl_data.ratios.vert.value != dc_fixpt_one.value
1004 || v->scaler_rec_out_width[input_idx] == v->viewport_height[input_idx]);
1005 }
1006
1007 if (dc->debug.optimized_watermark) {
1008
1009
1010
1011
1012 v->dcc_enable[input_idx] = pipe->plane_state->dcc.enable ? dcn_bw_yes : dcn_bw_no;
1013 } else {
1014
1015
1016
1017
1018
1019
1020 unsigned int bpe;
1021
1022 v->dcc_enable[input_idx] = dc->res_pool->hubbub->funcs->dcc_support_pixel_format(
1023 pipe->plane_state->format, &bpe) ? dcn_bw_yes : dcn_bw_no;
1024 }
1025
1026 v->source_pixel_format[input_idx] = tl_pixel_format_to_bw_defs(
1027 pipe->plane_state->format);
1028 v->source_surface_mode[input_idx] = tl_sw_mode_to_bw_defs(
1029 pipe->plane_state->tiling_info.gfx9.swizzle);
1030 v->lb_bit_per_pixel[input_idx] = tl_lb_bpp_to_int(pipe->plane_res.scl_data.lb_params.depth);
1031 v->override_hta_ps[input_idx] = pipe->plane_res.scl_data.taps.h_taps;
1032 v->override_vta_ps[input_idx] = pipe->plane_res.scl_data.taps.v_taps;
1033 v->override_hta_pschroma[input_idx] = pipe->plane_res.scl_data.taps.h_taps_c;
1034 v->override_vta_pschroma[input_idx] = pipe->plane_res.scl_data.taps.v_taps_c;
1035
1036
1037
1038
1039
1040 if (v->override_hta_pschroma[input_idx] == 1)
1041 v->override_hta_pschroma[input_idx] = 2;
1042 if (v->override_vta_pschroma[input_idx] == 1)
1043 v->override_vta_pschroma[input_idx] = 2;
1044 v->source_scan[input_idx] = (pipe->plane_state->rotation % 2) ? dcn_bw_vert : dcn_bw_hor;
1045 }
1046 if (v->is_line_buffer_bpp_fixed == dcn_bw_yes)
1047 v->lb_bit_per_pixel[input_idx] = v->line_buffer_fixed_bpp;
1048 v->dcc_rate[input_idx] = 1;
1049 v->output_format[input_idx] = pipe->stream->timing.pixel_encoding ==
1050 PIXEL_ENCODING_YCBCR420 ? dcn_bw_420 : dcn_bw_444;
1051 v->output[input_idx] = pipe->stream->signal ==
1052 SIGNAL_TYPE_HDMI_TYPE_A ? dcn_bw_hdmi : dcn_bw_dp;
1053 v->output_deep_color[input_idx] = dcn_bw_encoder_8bpc;
1054 if (v->output[input_idx] == dcn_bw_hdmi) {
1055 switch (pipe->stream->timing.display_color_depth) {
1056 case COLOR_DEPTH_101010:
1057 v->output_deep_color[input_idx] = dcn_bw_encoder_10bpc;
1058 break;
1059 case COLOR_DEPTH_121212:
1060 v->output_deep_color[input_idx] = dcn_bw_encoder_12bpc;
1061 break;
1062 case COLOR_DEPTH_161616:
1063 v->output_deep_color[input_idx] = dcn_bw_encoder_16bpc;
1064 break;
1065 default:
1066 break;
1067 }
1068 }
1069
1070 input_idx++;
1071 }
1072 v->number_of_active_planes = input_idx;
1073
1074 scaler_settings_calculation(v);
1075
1076 hack_bounding_box(v, &dc->debug, context);
1077
1078 mode_support_and_system_configuration(v);
1079
1080
1081 if (v->voltage_level != 0
1082 && context->stream_count == 1
1083 && dc->debug.force_single_disp_pipe_split) {
1084 v->max_dppclk[0] = v->max_dppclk_vmin0p65;
1085 mode_support_and_system_configuration(v);
1086 }
1087
1088 if (v->voltage_level == 0 &&
1089 (dc->debug.sr_exit_time_dpm0_ns
1090 || dc->debug.sr_enter_plus_exit_time_dpm0_ns)) {
1091
1092 if (dc->debug.sr_enter_plus_exit_time_dpm0_ns)
1093 v->sr_enter_plus_exit_time =
1094 dc->debug.sr_enter_plus_exit_time_dpm0_ns / 1000.0f;
1095 if (dc->debug.sr_exit_time_dpm0_ns)
1096 v->sr_exit_time = dc->debug.sr_exit_time_dpm0_ns / 1000.0f;
1097 context->bw_ctx.dml.soc.sr_enter_plus_exit_time_us = v->sr_enter_plus_exit_time;
1098 context->bw_ctx.dml.soc.sr_exit_time_us = v->sr_exit_time;
1099 mode_support_and_system_configuration(v);
1100 }
1101
1102 display_pipe_configuration(v);
1103
1104 for (k = 0; k <= v->number_of_active_planes - 1; k++) {
1105 if (v->source_scan[k] == dcn_bw_hor)
1106 v->swath_width_y[k] = v->viewport_width[k] / v->dpp_per_plane[k];
1107 else
1108 v->swath_width_y[k] = v->viewport_height[k] / v->dpp_per_plane[k];
1109 }
1110 for (k = 0; k <= v->number_of_active_planes - 1; k++) {
1111 if (v->source_pixel_format[k] == dcn_bw_rgb_sub_64) {
1112 v->byte_per_pixel_dety[k] = 8.0;
1113 v->byte_per_pixel_detc[k] = 0.0;
1114 } else if (v->source_pixel_format[k] == dcn_bw_rgb_sub_32) {
1115 v->byte_per_pixel_dety[k] = 4.0;
1116 v->byte_per_pixel_detc[k] = 0.0;
1117 } else if (v->source_pixel_format[k] == dcn_bw_rgb_sub_16) {
1118 v->byte_per_pixel_dety[k] = 2.0;
1119 v->byte_per_pixel_detc[k] = 0.0;
1120 } else if (v->source_pixel_format[k] == dcn_bw_yuv420_sub_8) {
1121 v->byte_per_pixel_dety[k] = 1.0;
1122 v->byte_per_pixel_detc[k] = 2.0;
1123 } else {
1124 v->byte_per_pixel_dety[k] = 4.0f / 3.0f;
1125 v->byte_per_pixel_detc[k] = 8.0f / 3.0f;
1126 }
1127 }
1128
1129 v->total_data_read_bandwidth = 0.0;
1130 for (k = 0; k <= v->number_of_active_planes - 1; k++) {
1131 v->read_bandwidth_plane_luma[k] = v->swath_width_y[k] * v->dpp_per_plane[k] *
1132 dcn_bw_ceil2(v->byte_per_pixel_dety[k], 1.0) / (v->htotal[k] / v->pixel_clock[k]) * v->v_ratio[k];
1133 v->read_bandwidth_plane_chroma[k] = v->swath_width_y[k] / 2.0 * v->dpp_per_plane[k] *
1134 dcn_bw_ceil2(v->byte_per_pixel_detc[k], 2.0) / (v->htotal[k] / v->pixel_clock[k]) * v->v_ratio[k] / 2.0;
1135 v->total_data_read_bandwidth = v->total_data_read_bandwidth +
1136 v->read_bandwidth_plane_luma[k] + v->read_bandwidth_plane_chroma[k];
1137 }
1138
1139 BW_VAL_TRACE_END_VOLTAGE_LEVEL();
1140
1141 if (v->voltage_level != number_of_states_plus_one && !fast_validate) {
1142 float bw_consumed = v->total_bandwidth_consumed_gbyte_per_second;
1143
1144 if (bw_consumed < v->fabric_and_dram_bandwidth_vmin0p65)
1145 bw_consumed = v->fabric_and_dram_bandwidth_vmin0p65;
1146 else if (bw_consumed < v->fabric_and_dram_bandwidth_vmid0p72)
1147 bw_consumed = v->fabric_and_dram_bandwidth_vmid0p72;
1148 else if (bw_consumed < v->fabric_and_dram_bandwidth_vnom0p8)
1149 bw_consumed = v->fabric_and_dram_bandwidth_vnom0p8;
1150 else
1151 bw_consumed = v->fabric_and_dram_bandwidth_vmax0p9;
1152
1153 if (bw_consumed < v->fabric_and_dram_bandwidth)
1154 if (dc->debug.voltage_align_fclk)
1155 bw_consumed = v->fabric_and_dram_bandwidth;
1156
1157 display_pipe_configuration(v);
1158
1159
1160
1161
1162 dispclkdppclkdcfclk_deep_sleep_prefetch_parameters_watermarks_and_performance_calculation(v);
1163
1164 context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.cstate_exit_ns =
1165 v->stutter_exit_watermark * 1000;
1166 context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.cstate_enter_plus_exit_ns =
1167 v->stutter_enter_plus_exit_watermark * 1000;
1168 context->bw_ctx.bw.dcn.watermarks.a.cstate_pstate.pstate_change_ns =
1169 v->dram_clock_change_watermark * 1000;
1170 context->bw_ctx.bw.dcn.watermarks.a.pte_meta_urgent_ns = v->ptemeta_urgent_watermark * 1000;
1171 context->bw_ctx.bw.dcn.watermarks.a.urgent_ns = v->urgent_watermark * 1000;
1172 context->bw_ctx.bw.dcn.watermarks.b = context->bw_ctx.bw.dcn.watermarks.a;
1173 context->bw_ctx.bw.dcn.watermarks.c = context->bw_ctx.bw.dcn.watermarks.a;
1174 context->bw_ctx.bw.dcn.watermarks.d = context->bw_ctx.bw.dcn.watermarks.a;
1175
1176 context->bw_ctx.bw.dcn.clk.fclk_khz = (int)(bw_consumed * 1000000 /
1177 (ddr4_dram_factor_single_Channel * v->number_of_channels));
1178 if (bw_consumed == v->fabric_and_dram_bandwidth_vmin0p65)
1179 context->bw_ctx.bw.dcn.clk.fclk_khz = (int)(bw_consumed * 1000000 / 32);
1180
1181 context->bw_ctx.bw.dcn.clk.dcfclk_deep_sleep_khz = (int)(v->dcf_clk_deep_sleep * 1000);
1182 context->bw_ctx.bw.dcn.clk.dcfclk_khz = (int)(v->dcfclk * 1000);
1183
1184 context->bw_ctx.bw.dcn.clk.dispclk_khz = (int)(v->dispclk * 1000);
1185 if (dc->debug.max_disp_clk == true)
1186 context->bw_ctx.bw.dcn.clk.dispclk_khz = (int)(dc->dcn_soc->max_dispclk_vmax0p9 * 1000);
1187
1188 if (context->bw_ctx.bw.dcn.clk.dispclk_khz <
1189 dc->debug.min_disp_clk_khz) {
1190 context->bw_ctx.bw.dcn.clk.dispclk_khz =
1191 dc->debug.min_disp_clk_khz;
1192 }
1193
1194 context->bw_ctx.bw.dcn.clk.dppclk_khz = context->bw_ctx.bw.dcn.clk.dispclk_khz /
1195 v->dispclk_dppclk_ratio;
1196 context->bw_ctx.bw.dcn.clk.phyclk_khz = v->phyclk_per_state[v->voltage_level];
1197 switch (v->voltage_level) {
1198 case 0:
1199 context->bw_ctx.bw.dcn.clk.max_supported_dppclk_khz =
1200 (int)(dc->dcn_soc->max_dppclk_vmin0p65 * 1000);
1201 break;
1202 case 1:
1203 context->bw_ctx.bw.dcn.clk.max_supported_dppclk_khz =
1204 (int)(dc->dcn_soc->max_dppclk_vmid0p72 * 1000);
1205 break;
1206 case 2:
1207 context->bw_ctx.bw.dcn.clk.max_supported_dppclk_khz =
1208 (int)(dc->dcn_soc->max_dppclk_vnom0p8 * 1000);
1209 break;
1210 default:
1211 context->bw_ctx.bw.dcn.clk.max_supported_dppclk_khz =
1212 (int)(dc->dcn_soc->max_dppclk_vmax0p9 * 1000);
1213 break;
1214 }
1215
1216 BW_VAL_TRACE_END_WATERMARKS();
1217
1218 for (i = 0, input_idx = 0; i < pool->pipe_count; i++) {
1219 struct pipe_ctx *pipe = &context->res_ctx.pipe_ctx[i];
1220
1221
1222 if (!pipe->stream)
1223 continue;
1224
1225 if (pipe->top_pipe && pipe->top_pipe->plane_state == pipe->plane_state)
1226 continue;
1227
1228 pipe->pipe_dlg_param.vupdate_width = v->v_update_width_pix[input_idx];
1229 pipe->pipe_dlg_param.vupdate_offset = v->v_update_offset_pix[input_idx];
1230 pipe->pipe_dlg_param.vready_offset = v->v_ready_offset_pix[input_idx];
1231 pipe->pipe_dlg_param.vstartup_start = v->v_startup[input_idx];
1232
1233 pipe->pipe_dlg_param.htotal = pipe->stream->timing.h_total;
1234 pipe->pipe_dlg_param.vtotal = pipe->stream->timing.v_total;
1235 vesa_sync_start = pipe->stream->timing.v_addressable +
1236 pipe->stream->timing.v_border_bottom +
1237 pipe->stream->timing.v_front_porch;
1238
1239 asic_blank_end = (pipe->stream->timing.v_total -
1240 vesa_sync_start -
1241 pipe->stream->timing.v_border_top)
1242 * (pipe->stream->timing.flags.INTERLACE ? 1 : 0);
1243
1244 asic_blank_start = asic_blank_end +
1245 (pipe->stream->timing.v_border_top +
1246 pipe->stream->timing.v_addressable +
1247 pipe->stream->timing.v_border_bottom)
1248 * (pipe->stream->timing.flags.INTERLACE ? 1 : 0);
1249
1250 pipe->pipe_dlg_param.vblank_start = asic_blank_start;
1251 pipe->pipe_dlg_param.vblank_end = asic_blank_end;
1252
1253 if (pipe->plane_state) {
1254 struct pipe_ctx *hsplit_pipe = pipe->bottom_pipe;
1255
1256 pipe->plane_state->update_flags.bits.full_update = 1;
1257
1258 if (v->dpp_per_plane[input_idx] == 2 ||
1259 ((pipe->stream->view_format ==
1260 VIEW_3D_FORMAT_SIDE_BY_SIDE ||
1261 pipe->stream->view_format ==
1262 VIEW_3D_FORMAT_TOP_AND_BOTTOM) &&
1263 (pipe->stream->timing.timing_3d_format ==
1264 TIMING_3D_FORMAT_TOP_AND_BOTTOM ||
1265 pipe->stream->timing.timing_3d_format ==
1266 TIMING_3D_FORMAT_SIDE_BY_SIDE))) {
1267 if (hsplit_pipe && hsplit_pipe->plane_state == pipe->plane_state) {
1268
1269 hsplit_pipe->pipe_dlg_param.vupdate_width = v->v_update_width_pix[input_idx];
1270 hsplit_pipe->pipe_dlg_param.vupdate_offset = v->v_update_offset_pix[input_idx];
1271 hsplit_pipe->pipe_dlg_param.vready_offset = v->v_ready_offset_pix[input_idx];
1272 hsplit_pipe->pipe_dlg_param.vstartup_start = v->v_startup[input_idx];
1273
1274 hsplit_pipe->pipe_dlg_param.htotal = pipe->stream->timing.h_total;
1275 hsplit_pipe->pipe_dlg_param.vtotal = pipe->stream->timing.v_total;
1276 hsplit_pipe->pipe_dlg_param.vblank_start = pipe->pipe_dlg_param.vblank_start;
1277 hsplit_pipe->pipe_dlg_param.vblank_end = pipe->pipe_dlg_param.vblank_end;
1278 } else {
1279
1280 hsplit_pipe = find_idle_secondary_pipe(&context->res_ctx, pool, pipe);
1281 ASSERT(hsplit_pipe);
1282 split_stream_across_pipes(&context->res_ctx, pool, pipe, hsplit_pipe);
1283 }
1284
1285 dcn_bw_calc_rq_dlg_ttu(dc, v, hsplit_pipe, input_idx);
1286 } else if (hsplit_pipe && hsplit_pipe->plane_state == pipe->plane_state) {
1287
1288 pipe->bottom_pipe = hsplit_pipe->bottom_pipe;
1289 if (hsplit_pipe->bottom_pipe)
1290 hsplit_pipe->bottom_pipe->top_pipe = pipe;
1291 hsplit_pipe->plane_state = NULL;
1292 hsplit_pipe->stream = NULL;
1293 hsplit_pipe->top_pipe = NULL;
1294 hsplit_pipe->bottom_pipe = NULL;
1295
1296 memset(&hsplit_pipe->plane_res, 0, sizeof(hsplit_pipe->plane_res));
1297 memset(&hsplit_pipe->stream_res, 0, sizeof(hsplit_pipe->stream_res));
1298 resource_build_scaling_params(pipe);
1299 }
1300
1301 dcn_bw_calc_rq_dlg_ttu(dc, v, pipe, input_idx);
1302 }
1303
1304 input_idx++;
1305 }
1306 } else if (v->voltage_level == number_of_states_plus_one) {
1307 BW_VAL_TRACE_SKIP(fail);
1308 } else if (fast_validate) {
1309 BW_VAL_TRACE_SKIP(fast);
1310 }
1311
1312 if (v->voltage_level == 0) {
1313 context->bw_ctx.dml.soc.sr_enter_plus_exit_time_us =
1314 dc->dcn_soc->sr_enter_plus_exit_time;
1315 context->bw_ctx.dml.soc.sr_exit_time_us = dc->dcn_soc->sr_exit_time;
1316 }
1317
1318
1319
1320
1321
1322 bw_limit = dc->dcn_soc->percent_disp_bw_limit * v->fabric_and_dram_bandwidth_vmax0p9;
1323 bw_limit_pass = (v->total_data_read_bandwidth / 1000.0) < bw_limit;
1324
1325 DC_FP_END();
1326
1327 PERFORMANCE_TRACE_END();
1328 BW_VAL_TRACE_FINISH();
1329
1330 if (bw_limit_pass && v->voltage_level <= get_highest_allowed_voltage_level(
1331 dc->ctx->asic_id.chip_family,
1332 dc->ctx->asic_id.hw_internal_rev,
1333 dc->ctx->asic_id.pci_revision_id))
1334 return true;
1335 else
1336 return false;
1337}
1338
1339static unsigned int dcn_find_normalized_clock_vdd_Level(
1340 const struct dc *dc,
1341 enum dm_pp_clock_type clocks_type,
1342 int clocks_in_khz)
1343{
1344 int vdd_level = dcn_bw_v_min0p65;
1345
1346 if (clocks_in_khz == 0)
1347 return vdd_level;
1348
1349 switch (clocks_type) {
1350 case DM_PP_CLOCK_TYPE_DISPLAY_CLK:
1351 if (clocks_in_khz > dc->dcn_soc->max_dispclk_vmax0p9*1000) {
1352 vdd_level = dcn_bw_v_max0p91;
1353 BREAK_TO_DEBUGGER();
1354 } else if (clocks_in_khz > dc->dcn_soc->max_dispclk_vnom0p8*1000) {
1355 vdd_level = dcn_bw_v_max0p9;
1356 } else if (clocks_in_khz > dc->dcn_soc->max_dispclk_vmid0p72*1000) {
1357 vdd_level = dcn_bw_v_nom0p8;
1358 } else if (clocks_in_khz > dc->dcn_soc->max_dispclk_vmin0p65*1000) {
1359 vdd_level = dcn_bw_v_mid0p72;
1360 } else
1361 vdd_level = dcn_bw_v_min0p65;
1362 break;
1363 case DM_PP_CLOCK_TYPE_DISPLAYPHYCLK:
1364 if (clocks_in_khz > dc->dcn_soc->phyclkv_max0p9*1000) {
1365 vdd_level = dcn_bw_v_max0p91;
1366 BREAK_TO_DEBUGGER();
1367 } else if (clocks_in_khz > dc->dcn_soc->phyclkv_nom0p8*1000) {
1368 vdd_level = dcn_bw_v_max0p9;
1369 } else if (clocks_in_khz > dc->dcn_soc->phyclkv_mid0p72*1000) {
1370 vdd_level = dcn_bw_v_nom0p8;
1371 } else if (clocks_in_khz > dc->dcn_soc->phyclkv_min0p65*1000) {
1372 vdd_level = dcn_bw_v_mid0p72;
1373 } else
1374 vdd_level = dcn_bw_v_min0p65;
1375 break;
1376
1377 case DM_PP_CLOCK_TYPE_DPPCLK:
1378 if (clocks_in_khz > dc->dcn_soc->max_dppclk_vmax0p9*1000) {
1379 vdd_level = dcn_bw_v_max0p91;
1380 BREAK_TO_DEBUGGER();
1381 } else if (clocks_in_khz > dc->dcn_soc->max_dppclk_vnom0p8*1000) {
1382 vdd_level = dcn_bw_v_max0p9;
1383 } else if (clocks_in_khz > dc->dcn_soc->max_dppclk_vmid0p72*1000) {
1384 vdd_level = dcn_bw_v_nom0p8;
1385 } else if (clocks_in_khz > dc->dcn_soc->max_dppclk_vmin0p65*1000) {
1386 vdd_level = dcn_bw_v_mid0p72;
1387 } else
1388 vdd_level = dcn_bw_v_min0p65;
1389 break;
1390
1391 case DM_PP_CLOCK_TYPE_MEMORY_CLK:
1392 {
1393 unsigned factor = (ddr4_dram_factor_single_Channel * dc->dcn_soc->number_of_channels);
1394
1395 if (clocks_in_khz > dc->dcn_soc->fabric_and_dram_bandwidth_vmax0p9*1000000/factor) {
1396 vdd_level = dcn_bw_v_max0p91;
1397 BREAK_TO_DEBUGGER();
1398 } else if (clocks_in_khz > dc->dcn_soc->fabric_and_dram_bandwidth_vnom0p8*1000000/factor) {
1399 vdd_level = dcn_bw_v_max0p9;
1400 } else if (clocks_in_khz > dc->dcn_soc->fabric_and_dram_bandwidth_vmid0p72*1000000/factor) {
1401 vdd_level = dcn_bw_v_nom0p8;
1402 } else if (clocks_in_khz > dc->dcn_soc->fabric_and_dram_bandwidth_vmin0p65*1000000/factor) {
1403 vdd_level = dcn_bw_v_mid0p72;
1404 } else
1405 vdd_level = dcn_bw_v_min0p65;
1406 }
1407 break;
1408
1409 case DM_PP_CLOCK_TYPE_DCFCLK:
1410 if (clocks_in_khz > dc->dcn_soc->dcfclkv_max0p9*1000) {
1411 vdd_level = dcn_bw_v_max0p91;
1412 BREAK_TO_DEBUGGER();
1413 } else if (clocks_in_khz > dc->dcn_soc->dcfclkv_nom0p8*1000) {
1414 vdd_level = dcn_bw_v_max0p9;
1415 } else if (clocks_in_khz > dc->dcn_soc->dcfclkv_mid0p72*1000) {
1416 vdd_level = dcn_bw_v_nom0p8;
1417 } else if (clocks_in_khz > dc->dcn_soc->dcfclkv_min0p65*1000) {
1418 vdd_level = dcn_bw_v_mid0p72;
1419 } else
1420 vdd_level = dcn_bw_v_min0p65;
1421 break;
1422
1423 default:
1424 break;
1425 }
1426 return vdd_level;
1427}
1428
1429unsigned int dcn_find_dcfclk_suits_all(
1430 const struct dc *dc,
1431 struct dc_clocks *clocks)
1432{
1433 unsigned vdd_level, vdd_level_temp;
1434 unsigned dcf_clk;
1435
1436
1437 vdd_level = dcn_find_normalized_clock_vdd_Level(
1438 dc, DM_PP_CLOCK_TYPE_DISPLAY_CLK, clocks->dispclk_khz);
1439 vdd_level_temp = dcn_find_normalized_clock_vdd_Level(
1440 dc, DM_PP_CLOCK_TYPE_DISPLAYPHYCLK, clocks->phyclk_khz);
1441
1442 vdd_level = dcn_bw_max(vdd_level, vdd_level_temp);
1443 vdd_level_temp = dcn_find_normalized_clock_vdd_Level(
1444 dc, DM_PP_CLOCK_TYPE_DPPCLK, clocks->dppclk_khz);
1445 vdd_level = dcn_bw_max(vdd_level, vdd_level_temp);
1446
1447 vdd_level_temp = dcn_find_normalized_clock_vdd_Level(
1448 dc, DM_PP_CLOCK_TYPE_MEMORY_CLK, clocks->fclk_khz);
1449 vdd_level = dcn_bw_max(vdd_level, vdd_level_temp);
1450 vdd_level_temp = dcn_find_normalized_clock_vdd_Level(
1451 dc, DM_PP_CLOCK_TYPE_DCFCLK, clocks->dcfclk_khz);
1452
1453
1454 vdd_level = dcn_bw_max(vdd_level, vdd_level_temp);
1455 if (vdd_level == dcn_bw_v_max0p91) {
1456 BREAK_TO_DEBUGGER();
1457 dcf_clk = dc->dcn_soc->dcfclkv_max0p9*1000;
1458 } else if (vdd_level == dcn_bw_v_max0p9)
1459 dcf_clk = dc->dcn_soc->dcfclkv_max0p9*1000;
1460 else if (vdd_level == dcn_bw_v_nom0p8)
1461 dcf_clk = dc->dcn_soc->dcfclkv_nom0p8*1000;
1462 else if (vdd_level == dcn_bw_v_mid0p72)
1463 dcf_clk = dc->dcn_soc->dcfclkv_mid0p72*1000;
1464 else
1465 dcf_clk = dc->dcn_soc->dcfclkv_min0p65*1000;
1466
1467 DC_LOG_BANDWIDTH_CALCS("\tdcf_clk for voltage = %d\n", dcf_clk);
1468 return dcf_clk;
1469}
1470
1471static bool verify_clock_values(struct dm_pp_clock_levels_with_voltage *clks)
1472{
1473 int i;
1474
1475 if (clks->num_levels == 0)
1476 return false;
1477
1478 for (i = 0; i < clks->num_levels; i++)
1479
1480 if (clks->data[i].clocks_in_khz == 0)
1481 return false;
1482
1483 return true;
1484}
1485
1486void dcn_bw_update_from_pplib(struct dc *dc)
1487{
1488 struct dc_context *ctx = dc->ctx;
1489 struct dm_pp_clock_levels_with_voltage fclks = {0}, dcfclks = {0};
1490 bool res;
1491 unsigned vmin0p65_idx, vmid0p72_idx, vnom0p8_idx, vmax0p9_idx;
1492
1493
1494 res = dm_pp_get_clock_levels_by_type_with_voltage(
1495 ctx, DM_PP_CLOCK_TYPE_FCLK, &fclks);
1496
1497 DC_FP_START();
1498
1499 if (res)
1500 res = verify_clock_values(&fclks);
1501
1502 if (res) {
1503 ASSERT(fclks.num_levels);
1504
1505 vmin0p65_idx = 0;
1506 vmid0p72_idx = fclks.num_levels -
1507 (fclks.num_levels > 2 ? 3 : (fclks.num_levels > 1 ? 2 : 1));
1508 vnom0p8_idx = fclks.num_levels - (fclks.num_levels > 1 ? 2 : 1);
1509 vmax0p9_idx = fclks.num_levels - 1;
1510
1511 dc->dcn_soc->fabric_and_dram_bandwidth_vmin0p65 =
1512 32 * (fclks.data[vmin0p65_idx].clocks_in_khz / 1000.0) / 1000.0;
1513 dc->dcn_soc->fabric_and_dram_bandwidth_vmid0p72 =
1514 dc->dcn_soc->number_of_channels *
1515 (fclks.data[vmid0p72_idx].clocks_in_khz / 1000.0)
1516 * ddr4_dram_factor_single_Channel / 1000.0;
1517 dc->dcn_soc->fabric_and_dram_bandwidth_vnom0p8 =
1518 dc->dcn_soc->number_of_channels *
1519 (fclks.data[vnom0p8_idx].clocks_in_khz / 1000.0)
1520 * ddr4_dram_factor_single_Channel / 1000.0;
1521 dc->dcn_soc->fabric_and_dram_bandwidth_vmax0p9 =
1522 dc->dcn_soc->number_of_channels *
1523 (fclks.data[vmax0p9_idx].clocks_in_khz / 1000.0)
1524 * ddr4_dram_factor_single_Channel / 1000.0;
1525 } else
1526 BREAK_TO_DEBUGGER();
1527
1528 DC_FP_END();
1529
1530 res = dm_pp_get_clock_levels_by_type_with_voltage(
1531 ctx, DM_PP_CLOCK_TYPE_DCFCLK, &dcfclks);
1532
1533 DC_FP_START();
1534
1535 if (res)
1536 res = verify_clock_values(&dcfclks);
1537
1538 if (res && dcfclks.num_levels >= 3) {
1539 dc->dcn_soc->dcfclkv_min0p65 = dcfclks.data[0].clocks_in_khz / 1000.0;
1540 dc->dcn_soc->dcfclkv_mid0p72 = dcfclks.data[dcfclks.num_levels - 3].clocks_in_khz / 1000.0;
1541 dc->dcn_soc->dcfclkv_nom0p8 = dcfclks.data[dcfclks.num_levels - 2].clocks_in_khz / 1000.0;
1542 dc->dcn_soc->dcfclkv_max0p9 = dcfclks.data[dcfclks.num_levels - 1].clocks_in_khz / 1000.0;
1543 } else
1544 BREAK_TO_DEBUGGER();
1545
1546 DC_FP_END();
1547}
1548
1549void dcn_bw_notify_pplib_of_wm_ranges(struct dc *dc)
1550{
1551 struct pp_smu_funcs_rv *pp = NULL;
1552 struct pp_smu_wm_range_sets ranges = {0};
1553 int min_fclk_khz, min_dcfclk_khz, socclk_khz;
1554 const int overdrive = 5000000;
1555
1556 if (dc->res_pool->pp_smu)
1557 pp = &dc->res_pool->pp_smu->rv_funcs;
1558 if (!pp || !pp->set_wm_ranges)
1559 return;
1560
1561 DC_FP_START();
1562 min_fclk_khz = dc->dcn_soc->fabric_and_dram_bandwidth_vmin0p65 * 1000000 / 32;
1563 min_dcfclk_khz = dc->dcn_soc->dcfclkv_min0p65 * 1000;
1564 socclk_khz = dc->dcn_soc->socclk * 1000;
1565 DC_FP_END();
1566
1567
1568
1569
1570
1571
1572
1573
1574
1575 ranges.num_reader_wm_sets = WM_SET_COUNT;
1576 ranges.num_writer_wm_sets = WM_SET_COUNT;
1577 ranges.reader_wm_sets[0].wm_inst = WM_A;
1578 ranges.reader_wm_sets[0].min_drain_clk_mhz = min_dcfclk_khz / 1000;
1579 ranges.reader_wm_sets[0].max_drain_clk_mhz = overdrive / 1000;
1580 ranges.reader_wm_sets[0].min_fill_clk_mhz = min_fclk_khz / 1000;
1581 ranges.reader_wm_sets[0].max_fill_clk_mhz = overdrive / 1000;
1582 ranges.writer_wm_sets[0].wm_inst = WM_A;
1583 ranges.writer_wm_sets[0].min_fill_clk_mhz = socclk_khz / 1000;
1584 ranges.writer_wm_sets[0].max_fill_clk_mhz = overdrive / 1000;
1585 ranges.writer_wm_sets[0].min_drain_clk_mhz = min_fclk_khz / 1000;
1586 ranges.writer_wm_sets[0].max_drain_clk_mhz = overdrive / 1000;
1587
1588 if (dc->debug.pplib_wm_report_mode == WM_REPORT_OVERRIDE) {
1589 ranges.reader_wm_sets[0].wm_inst = WM_A;
1590 ranges.reader_wm_sets[0].min_drain_clk_mhz = 300;
1591 ranges.reader_wm_sets[0].max_drain_clk_mhz = 5000;
1592 ranges.reader_wm_sets[0].min_fill_clk_mhz = 800;
1593 ranges.reader_wm_sets[0].max_fill_clk_mhz = 5000;
1594 ranges.writer_wm_sets[0].wm_inst = WM_A;
1595 ranges.writer_wm_sets[0].min_fill_clk_mhz = 200;
1596 ranges.writer_wm_sets[0].max_fill_clk_mhz = 5000;
1597 ranges.writer_wm_sets[0].min_drain_clk_mhz = 800;
1598 ranges.writer_wm_sets[0].max_drain_clk_mhz = 5000;
1599 }
1600
1601 ranges.reader_wm_sets[1] = ranges.writer_wm_sets[0];
1602 ranges.reader_wm_sets[1].wm_inst = WM_B;
1603
1604 ranges.reader_wm_sets[2] = ranges.writer_wm_sets[0];
1605 ranges.reader_wm_sets[2].wm_inst = WM_C;
1606
1607 ranges.reader_wm_sets[3] = ranges.writer_wm_sets[0];
1608 ranges.reader_wm_sets[3].wm_inst = WM_D;
1609
1610
1611 pp->set_wm_ranges(&pp->pp_smu, &ranges);
1612}
1613
1614void dcn_bw_sync_calcs_and_dml(struct dc *dc)
1615{
1616 DC_FP_START();
1617 DC_LOG_BANDWIDTH_CALCS("sr_exit_time: %f ns\n"
1618 "sr_enter_plus_exit_time: %f ns\n"
1619 "urgent_latency: %f ns\n"
1620 "write_back_latency: %f ns\n"
1621 "percent_of_ideal_drambw_received_after_urg_latency: %f %%\n"
1622 "max_request_size: %d bytes\n"
1623 "dcfclkv_max0p9: %f kHz\n"
1624 "dcfclkv_nom0p8: %f kHz\n"
1625 "dcfclkv_mid0p72: %f kHz\n"
1626 "dcfclkv_min0p65: %f kHz\n"
1627 "max_dispclk_vmax0p9: %f kHz\n"
1628 "max_dispclk_vnom0p8: %f kHz\n"
1629 "max_dispclk_vmid0p72: %f kHz\n"
1630 "max_dispclk_vmin0p65: %f kHz\n"
1631 "max_dppclk_vmax0p9: %f kHz\n"
1632 "max_dppclk_vnom0p8: %f kHz\n"
1633 "max_dppclk_vmid0p72: %f kHz\n"
1634 "max_dppclk_vmin0p65: %f kHz\n"
1635 "socclk: %f kHz\n"
1636 "fabric_and_dram_bandwidth_vmax0p9: %f MB/s\n"
1637 "fabric_and_dram_bandwidth_vnom0p8: %f MB/s\n"
1638 "fabric_and_dram_bandwidth_vmid0p72: %f MB/s\n"
1639 "fabric_and_dram_bandwidth_vmin0p65: %f MB/s\n"
1640 "phyclkv_max0p9: %f kHz\n"
1641 "phyclkv_nom0p8: %f kHz\n"
1642 "phyclkv_mid0p72: %f kHz\n"
1643 "phyclkv_min0p65: %f kHz\n"
1644 "downspreading: %f %%\n"
1645 "round_trip_ping_latency_cycles: %d DCFCLK Cycles\n"
1646 "urgent_out_of_order_return_per_channel: %d Bytes\n"
1647 "number_of_channels: %d\n"
1648 "vmm_page_size: %d Bytes\n"
1649 "dram_clock_change_latency: %f ns\n"
1650 "return_bus_width: %d Bytes\n",
1651 dc->dcn_soc->sr_exit_time * 1000,
1652 dc->dcn_soc->sr_enter_plus_exit_time * 1000,
1653 dc->dcn_soc->urgent_latency * 1000,
1654 dc->dcn_soc->write_back_latency * 1000,
1655 dc->dcn_soc->percent_of_ideal_drambw_received_after_urg_latency,
1656 dc->dcn_soc->max_request_size,
1657 dc->dcn_soc->dcfclkv_max0p9 * 1000,
1658 dc->dcn_soc->dcfclkv_nom0p8 * 1000,
1659 dc->dcn_soc->dcfclkv_mid0p72 * 1000,
1660 dc->dcn_soc->dcfclkv_min0p65 * 1000,
1661 dc->dcn_soc->max_dispclk_vmax0p9 * 1000,
1662 dc->dcn_soc->max_dispclk_vnom0p8 * 1000,
1663 dc->dcn_soc->max_dispclk_vmid0p72 * 1000,
1664 dc->dcn_soc->max_dispclk_vmin0p65 * 1000,
1665 dc->dcn_soc->max_dppclk_vmax0p9 * 1000,
1666 dc->dcn_soc->max_dppclk_vnom0p8 * 1000,
1667 dc->dcn_soc->max_dppclk_vmid0p72 * 1000,
1668 dc->dcn_soc->max_dppclk_vmin0p65 * 1000,
1669 dc->dcn_soc->socclk * 1000,
1670 dc->dcn_soc->fabric_and_dram_bandwidth_vmax0p9 * 1000,
1671 dc->dcn_soc->fabric_and_dram_bandwidth_vnom0p8 * 1000,
1672 dc->dcn_soc->fabric_and_dram_bandwidth_vmid0p72 * 1000,
1673 dc->dcn_soc->fabric_and_dram_bandwidth_vmin0p65 * 1000,
1674 dc->dcn_soc->phyclkv_max0p9 * 1000,
1675 dc->dcn_soc->phyclkv_nom0p8 * 1000,
1676 dc->dcn_soc->phyclkv_mid0p72 * 1000,
1677 dc->dcn_soc->phyclkv_min0p65 * 1000,
1678 dc->dcn_soc->downspreading * 100,
1679 dc->dcn_soc->round_trip_ping_latency_cycles,
1680 dc->dcn_soc->urgent_out_of_order_return_per_channel,
1681 dc->dcn_soc->number_of_channels,
1682 dc->dcn_soc->vmm_page_size,
1683 dc->dcn_soc->dram_clock_change_latency * 1000,
1684 dc->dcn_soc->return_bus_width);
1685 DC_LOG_BANDWIDTH_CALCS("rob_buffer_size_in_kbyte: %f\n"
1686 "det_buffer_size_in_kbyte: %f\n"
1687 "dpp_output_buffer_pixels: %f\n"
1688 "opp_output_buffer_lines: %f\n"
1689 "pixel_chunk_size_in_kbyte: %f\n"
1690 "pte_enable: %d\n"
1691 "pte_chunk_size: %d kbytes\n"
1692 "meta_chunk_size: %d kbytes\n"
1693 "writeback_chunk_size: %d kbytes\n"
1694 "odm_capability: %d\n"
1695 "dsc_capability: %d\n"
1696 "line_buffer_size: %d bits\n"
1697 "max_line_buffer_lines: %d\n"
1698 "is_line_buffer_bpp_fixed: %d\n"
1699 "line_buffer_fixed_bpp: %d\n"
1700 "writeback_luma_buffer_size: %d kbytes\n"
1701 "writeback_chroma_buffer_size: %d kbytes\n"
1702 "max_num_dpp: %d\n"
1703 "max_num_writeback: %d\n"
1704 "max_dchub_topscl_throughput: %d pixels/dppclk\n"
1705 "max_pscl_tolb_throughput: %d pixels/dppclk\n"
1706 "max_lb_tovscl_throughput: %d pixels/dppclk\n"
1707 "max_vscl_tohscl_throughput: %d pixels/dppclk\n"
1708 "max_hscl_ratio: %f\n"
1709 "max_vscl_ratio: %f\n"
1710 "max_hscl_taps: %d\n"
1711 "max_vscl_taps: %d\n"
1712 "pte_buffer_size_in_requests: %d\n"
1713 "dispclk_ramping_margin: %f %%\n"
1714 "under_scan_factor: %f %%\n"
1715 "max_inter_dcn_tile_repeaters: %d\n"
1716 "can_vstartup_lines_exceed_vsync_plus_back_porch_lines_minus_one: %d\n"
1717 "bug_forcing_luma_and_chroma_request_to_same_size_fixed: %d\n"
1718 "dcfclk_cstate_latency: %d\n",
1719 dc->dcn_ip->rob_buffer_size_in_kbyte,
1720 dc->dcn_ip->det_buffer_size_in_kbyte,
1721 dc->dcn_ip->dpp_output_buffer_pixels,
1722 dc->dcn_ip->opp_output_buffer_lines,
1723 dc->dcn_ip->pixel_chunk_size_in_kbyte,
1724 dc->dcn_ip->pte_enable,
1725 dc->dcn_ip->pte_chunk_size,
1726 dc->dcn_ip->meta_chunk_size,
1727 dc->dcn_ip->writeback_chunk_size,
1728 dc->dcn_ip->odm_capability,
1729 dc->dcn_ip->dsc_capability,
1730 dc->dcn_ip->line_buffer_size,
1731 dc->dcn_ip->max_line_buffer_lines,
1732 dc->dcn_ip->is_line_buffer_bpp_fixed,
1733 dc->dcn_ip->line_buffer_fixed_bpp,
1734 dc->dcn_ip->writeback_luma_buffer_size,
1735 dc->dcn_ip->writeback_chroma_buffer_size,
1736 dc->dcn_ip->max_num_dpp,
1737 dc->dcn_ip->max_num_writeback,
1738 dc->dcn_ip->max_dchub_topscl_throughput,
1739 dc->dcn_ip->max_pscl_tolb_throughput,
1740 dc->dcn_ip->max_lb_tovscl_throughput,
1741 dc->dcn_ip->max_vscl_tohscl_throughput,
1742 dc->dcn_ip->max_hscl_ratio,
1743 dc->dcn_ip->max_vscl_ratio,
1744 dc->dcn_ip->max_hscl_taps,
1745 dc->dcn_ip->max_vscl_taps,
1746 dc->dcn_ip->pte_buffer_size_in_requests,
1747 dc->dcn_ip->dispclk_ramping_margin,
1748 dc->dcn_ip->under_scan_factor * 100,
1749 dc->dcn_ip->max_inter_dcn_tile_repeaters,
1750 dc->dcn_ip->can_vstartup_lines_exceed_vsync_plus_back_porch_lines_minus_one,
1751 dc->dcn_ip->bug_forcing_luma_and_chroma_request_to_same_size_fixed,
1752 dc->dcn_ip->dcfclk_cstate_latency);
1753
1754 dc->dml.soc.sr_exit_time_us = dc->dcn_soc->sr_exit_time;
1755 dc->dml.soc.sr_enter_plus_exit_time_us = dc->dcn_soc->sr_enter_plus_exit_time;
1756 dc->dml.soc.urgent_latency_us = dc->dcn_soc->urgent_latency;
1757 dc->dml.soc.writeback_latency_us = dc->dcn_soc->write_back_latency;
1758 dc->dml.soc.ideal_dram_bw_after_urgent_percent =
1759 dc->dcn_soc->percent_of_ideal_drambw_received_after_urg_latency;
1760 dc->dml.soc.max_request_size_bytes = dc->dcn_soc->max_request_size;
1761 dc->dml.soc.downspread_percent = dc->dcn_soc->downspreading;
1762 dc->dml.soc.round_trip_ping_latency_dcfclk_cycles =
1763 dc->dcn_soc->round_trip_ping_latency_cycles;
1764 dc->dml.soc.urgent_out_of_order_return_per_channel_bytes =
1765 dc->dcn_soc->urgent_out_of_order_return_per_channel;
1766 dc->dml.soc.num_chans = dc->dcn_soc->number_of_channels;
1767 dc->dml.soc.vmm_page_size_bytes = dc->dcn_soc->vmm_page_size;
1768 dc->dml.soc.dram_clock_change_latency_us = dc->dcn_soc->dram_clock_change_latency;
1769 dc->dml.soc.return_bus_width_bytes = dc->dcn_soc->return_bus_width;
1770
1771 dc->dml.ip.rob_buffer_size_kbytes = dc->dcn_ip->rob_buffer_size_in_kbyte;
1772 dc->dml.ip.det_buffer_size_kbytes = dc->dcn_ip->det_buffer_size_in_kbyte;
1773 dc->dml.ip.dpp_output_buffer_pixels = dc->dcn_ip->dpp_output_buffer_pixels;
1774 dc->dml.ip.opp_output_buffer_lines = dc->dcn_ip->opp_output_buffer_lines;
1775 dc->dml.ip.pixel_chunk_size_kbytes = dc->dcn_ip->pixel_chunk_size_in_kbyte;
1776 dc->dml.ip.pte_enable = dc->dcn_ip->pte_enable == dcn_bw_yes;
1777 dc->dml.ip.pte_chunk_size_kbytes = dc->dcn_ip->pte_chunk_size;
1778 dc->dml.ip.meta_chunk_size_kbytes = dc->dcn_ip->meta_chunk_size;
1779 dc->dml.ip.writeback_chunk_size_kbytes = dc->dcn_ip->writeback_chunk_size;
1780 dc->dml.ip.line_buffer_size_bits = dc->dcn_ip->line_buffer_size;
1781 dc->dml.ip.max_line_buffer_lines = dc->dcn_ip->max_line_buffer_lines;
1782 dc->dml.ip.IsLineBufferBppFixed = dc->dcn_ip->is_line_buffer_bpp_fixed == dcn_bw_yes;
1783 dc->dml.ip.LineBufferFixedBpp = dc->dcn_ip->line_buffer_fixed_bpp;
1784 dc->dml.ip.writeback_luma_buffer_size_kbytes = dc->dcn_ip->writeback_luma_buffer_size;
1785 dc->dml.ip.writeback_chroma_buffer_size_kbytes = dc->dcn_ip->writeback_chroma_buffer_size;
1786 dc->dml.ip.max_num_dpp = dc->dcn_ip->max_num_dpp;
1787 dc->dml.ip.max_num_wb = dc->dcn_ip->max_num_writeback;
1788 dc->dml.ip.max_dchub_pscl_bw_pix_per_clk = dc->dcn_ip->max_dchub_topscl_throughput;
1789 dc->dml.ip.max_pscl_lb_bw_pix_per_clk = dc->dcn_ip->max_pscl_tolb_throughput;
1790 dc->dml.ip.max_lb_vscl_bw_pix_per_clk = dc->dcn_ip->max_lb_tovscl_throughput;
1791 dc->dml.ip.max_vscl_hscl_bw_pix_per_clk = dc->dcn_ip->max_vscl_tohscl_throughput;
1792 dc->dml.ip.max_hscl_ratio = dc->dcn_ip->max_hscl_ratio;
1793 dc->dml.ip.max_vscl_ratio = dc->dcn_ip->max_vscl_ratio;
1794 dc->dml.ip.max_hscl_taps = dc->dcn_ip->max_hscl_taps;
1795 dc->dml.ip.max_vscl_taps = dc->dcn_ip->max_vscl_taps;
1796
1797 dc->dml.ip.dispclk_ramp_margin_percent = dc->dcn_ip->dispclk_ramping_margin;
1798 dc->dml.ip.underscan_factor = dc->dcn_ip->under_scan_factor;
1799 dc->dml.ip.max_inter_dcn_tile_repeaters = dc->dcn_ip->max_inter_dcn_tile_repeaters;
1800 dc->dml.ip.can_vstartup_lines_exceed_vsync_plus_back_porch_lines_minus_one =
1801 dc->dcn_ip->can_vstartup_lines_exceed_vsync_plus_back_porch_lines_minus_one == dcn_bw_yes;
1802 dc->dml.ip.bug_forcing_LC_req_same_size_fixed =
1803 dc->dcn_ip->bug_forcing_luma_and_chroma_request_to_same_size_fixed == dcn_bw_yes;
1804 dc->dml.ip.dcfclk_cstate_latency = dc->dcn_ip->dcfclk_cstate_latency;
1805 DC_FP_END();
1806}
1807