xref: /linux/drivers/gpu/drm/amd/display/dc/dsc/dc_dsc.c (revision 15a1fbdcfb519c2bd291ed01c6c94e0b89537a77)
1 /*
2  * Copyright 2019 Advanced Micro Devices, Inc.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice shall be included in
12  * all copies or substantial portions of the Software.
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20  * OTHER DEALINGS IN THE SOFTWARE.
21  *
22  * Author: AMD
23  */
24 
25 #include "dc_hw_types.h"
26 #include "dsc.h"
27 #include <drm/drm_dp_helper.h>
28 #include "dc.h"
29 
30 /* This module's internal functions */
31 
32 /* default DSC policy target bitrate limit is 16bpp */
33 static uint32_t dsc_policy_max_target_bpp_limit = 16;
34 
35 static uint32_t dc_dsc_bandwidth_in_kbps_from_timing(
36 	const struct dc_crtc_timing *timing)
37 {
38 	uint32_t bits_per_channel = 0;
39 	uint32_t kbps;
40 
41 	if (timing->flags.DSC) {
42 		kbps = (timing->pix_clk_100hz * timing->dsc_cfg.bits_per_pixel);
43 		kbps = kbps / 160 + ((kbps % 160) ? 1 : 0);
44 		return kbps;
45 	}
46 
47 	switch (timing->display_color_depth) {
48 	case COLOR_DEPTH_666:
49 		bits_per_channel = 6;
50 		break;
51 	case COLOR_DEPTH_888:
52 		bits_per_channel = 8;
53 		break;
54 	case COLOR_DEPTH_101010:
55 		bits_per_channel = 10;
56 		break;
57 	case COLOR_DEPTH_121212:
58 		bits_per_channel = 12;
59 		break;
60 	case COLOR_DEPTH_141414:
61 		bits_per_channel = 14;
62 		break;
63 	case COLOR_DEPTH_161616:
64 		bits_per_channel = 16;
65 		break;
66 	default:
67 		break;
68 	}
69 
70 	ASSERT(bits_per_channel != 0);
71 
72 	kbps = timing->pix_clk_100hz / 10;
73 	kbps *= bits_per_channel;
74 
75 	if (timing->flags.Y_ONLY != 1) {
76 		/*Only YOnly make reduce bandwidth by 1/3 compares to RGB*/
77 		kbps *= 3;
78 		if (timing->pixel_encoding == PIXEL_ENCODING_YCBCR420)
79 			kbps /= 2;
80 		else if (timing->pixel_encoding == PIXEL_ENCODING_YCBCR422)
81 			kbps = kbps * 2 / 3;
82 	}
83 
84 	return kbps;
85 
86 }
87 
88 static bool dsc_buff_block_size_from_dpcd(int dpcd_buff_block_size, int *buff_block_size)
89 {
90 
91 	switch (dpcd_buff_block_size) {
92 	case DP_DSC_RC_BUF_BLK_SIZE_1:
93 		*buff_block_size = 1024;
94 		break;
95 	case DP_DSC_RC_BUF_BLK_SIZE_4:
96 		*buff_block_size = 4 * 1024;
97 		break;
98 	case DP_DSC_RC_BUF_BLK_SIZE_16:
99 		*buff_block_size = 16 * 1024;
100 		break;
101 	case DP_DSC_RC_BUF_BLK_SIZE_64:
102 		*buff_block_size = 64 * 1024;
103 		break;
104 	default: {
105 			dm_error("%s: DPCD DSC buffer size not recognized.\n", __func__);
106 			return false;
107 		}
108 	}
109 
110 	return true;
111 }
112 
113 
114 static bool dsc_line_buff_depth_from_dpcd(int dpcd_line_buff_bit_depth, int *line_buff_bit_depth)
115 {
116 	if (0 <= dpcd_line_buff_bit_depth && dpcd_line_buff_bit_depth <= 7)
117 		*line_buff_bit_depth = dpcd_line_buff_bit_depth + 9;
118 	else if (dpcd_line_buff_bit_depth == 8)
119 		*line_buff_bit_depth = 8;
120 	else {
121 		dm_error("%s: DPCD DSC buffer depth not recognized.\n", __func__);
122 		return false;
123 	}
124 
125 	return true;
126 }
127 
128 
129 static bool dsc_throughput_from_dpcd(int dpcd_throughput, int *throughput)
130 {
131 	switch (dpcd_throughput) {
132 	case DP_DSC_THROUGHPUT_MODE_0_UPSUPPORTED:
133 		*throughput = 0;
134 		break;
135 	case DP_DSC_THROUGHPUT_MODE_0_170:
136 		*throughput = 170;
137 		break;
138 	case DP_DSC_THROUGHPUT_MODE_0_340:
139 		*throughput = 340;
140 		break;
141 	case DP_DSC_THROUGHPUT_MODE_0_400:
142 		*throughput = 400;
143 		break;
144 	case DP_DSC_THROUGHPUT_MODE_0_450:
145 		*throughput = 450;
146 		break;
147 	case DP_DSC_THROUGHPUT_MODE_0_500:
148 		*throughput = 500;
149 		break;
150 	case DP_DSC_THROUGHPUT_MODE_0_550:
151 		*throughput = 550;
152 		break;
153 	case DP_DSC_THROUGHPUT_MODE_0_600:
154 		*throughput = 600;
155 		break;
156 	case DP_DSC_THROUGHPUT_MODE_0_650:
157 		*throughput = 650;
158 		break;
159 	case DP_DSC_THROUGHPUT_MODE_0_700:
160 		*throughput = 700;
161 		break;
162 	case DP_DSC_THROUGHPUT_MODE_0_750:
163 		*throughput = 750;
164 		break;
165 	case DP_DSC_THROUGHPUT_MODE_0_800:
166 		*throughput = 800;
167 		break;
168 	case DP_DSC_THROUGHPUT_MODE_0_850:
169 		*throughput = 850;
170 		break;
171 	case DP_DSC_THROUGHPUT_MODE_0_900:
172 		*throughput = 900;
173 		break;
174 	case DP_DSC_THROUGHPUT_MODE_0_950:
175 		*throughput = 950;
176 		break;
177 	case DP_DSC_THROUGHPUT_MODE_0_1000:
178 		*throughput = 1000;
179 		break;
180 	default: {
181 			dm_error("%s: DPCD DSC throughput mode not recognized.\n", __func__);
182 			return false;
183 		}
184 	}
185 
186 	return true;
187 }
188 
189 
190 static bool dsc_bpp_increment_div_from_dpcd(int bpp_increment_dpcd, uint32_t *bpp_increment_div)
191 {
192 
193 	switch (bpp_increment_dpcd) {
194 	case 0:
195 		*bpp_increment_div = 16;
196 		break;
197 	case 1:
198 		*bpp_increment_div = 8;
199 		break;
200 	case 2:
201 		*bpp_increment_div = 4;
202 		break;
203 	case 3:
204 		*bpp_increment_div = 2;
205 		break;
206 	case 4:
207 		*bpp_increment_div = 1;
208 		break;
209 	default: {
210 		dm_error("%s: DPCD DSC bits-per-pixel increment not recognized.\n", __func__);
211 		return false;
212 	}
213 	}
214 
215 	return true;
216 }
217 
218 static void get_dsc_enc_caps(
219 	const struct display_stream_compressor *dsc,
220 	struct dsc_enc_caps *dsc_enc_caps,
221 	int pixel_clock_100Hz)
222 {
223 	// This is a static HW query, so we can use any DSC
224 
225 	memset(dsc_enc_caps, 0, sizeof(struct dsc_enc_caps));
226 	if (dsc) {
227 		if (!dsc->ctx->dc->debug.disable_dsc)
228 			dsc->funcs->dsc_get_enc_caps(dsc_enc_caps, pixel_clock_100Hz);
229 		if (dsc->ctx->dc->debug.native422_support)
230 			dsc_enc_caps->color_formats.bits.YCBCR_NATIVE_422 = 1;
231 	}
232 }
233 
234 /* Returns 'false' if no intersection was found for at least one capablity.
235  * It also implicitly validates some sink caps against invalid value of zero.
236  */
237 static bool intersect_dsc_caps(
238 	const struct dsc_dec_dpcd_caps *dsc_sink_caps,
239 	const struct dsc_enc_caps *dsc_enc_caps,
240 	enum dc_pixel_encoding pixel_encoding,
241 	struct dsc_enc_caps *dsc_common_caps)
242 {
243 	int32_t max_slices;
244 	int32_t total_sink_throughput;
245 
246 	memset(dsc_common_caps, 0, sizeof(struct dsc_enc_caps));
247 
248 	dsc_common_caps->dsc_version = min(dsc_sink_caps->dsc_version, dsc_enc_caps->dsc_version);
249 	if (!dsc_common_caps->dsc_version)
250 		return false;
251 
252 	dsc_common_caps->slice_caps.bits.NUM_SLICES_1 = dsc_sink_caps->slice_caps1.bits.NUM_SLICES_1 && dsc_enc_caps->slice_caps.bits.NUM_SLICES_1;
253 	dsc_common_caps->slice_caps.bits.NUM_SLICES_2 = dsc_sink_caps->slice_caps1.bits.NUM_SLICES_2 && dsc_enc_caps->slice_caps.bits.NUM_SLICES_2;
254 	dsc_common_caps->slice_caps.bits.NUM_SLICES_4 = dsc_sink_caps->slice_caps1.bits.NUM_SLICES_4 && dsc_enc_caps->slice_caps.bits.NUM_SLICES_4;
255 	dsc_common_caps->slice_caps.bits.NUM_SLICES_8 = dsc_sink_caps->slice_caps1.bits.NUM_SLICES_8 && dsc_enc_caps->slice_caps.bits.NUM_SLICES_8;
256 	if (!dsc_common_caps->slice_caps.raw)
257 		return false;
258 
259 	dsc_common_caps->lb_bit_depth = min(dsc_sink_caps->lb_bit_depth, dsc_enc_caps->lb_bit_depth);
260 	if (!dsc_common_caps->lb_bit_depth)
261 		return false;
262 
263 	dsc_common_caps->is_block_pred_supported = dsc_sink_caps->is_block_pred_supported && dsc_enc_caps->is_block_pred_supported;
264 
265 	dsc_common_caps->color_formats.raw = dsc_sink_caps->color_formats.raw & dsc_enc_caps->color_formats.raw;
266 	if (!dsc_common_caps->color_formats.raw)
267 		return false;
268 
269 	dsc_common_caps->color_depth.raw = dsc_sink_caps->color_depth.raw & dsc_enc_caps->color_depth.raw;
270 	if (!dsc_common_caps->color_depth.raw)
271 		return false;
272 
273 	max_slices = 0;
274 	if (dsc_common_caps->slice_caps.bits.NUM_SLICES_1)
275 		max_slices = 1;
276 
277 	if (dsc_common_caps->slice_caps.bits.NUM_SLICES_2)
278 		max_slices = 2;
279 
280 	if (dsc_common_caps->slice_caps.bits.NUM_SLICES_4)
281 		max_slices = 4;
282 
283 	total_sink_throughput = max_slices * dsc_sink_caps->throughput_mode_0_mps;
284 	if (pixel_encoding == PIXEL_ENCODING_YCBCR422 || pixel_encoding == PIXEL_ENCODING_YCBCR420)
285 		total_sink_throughput = max_slices * dsc_sink_caps->throughput_mode_1_mps;
286 
287 	dsc_common_caps->max_total_throughput_mps = min(total_sink_throughput, dsc_enc_caps->max_total_throughput_mps);
288 
289 	dsc_common_caps->max_slice_width = min(dsc_sink_caps->max_slice_width, dsc_enc_caps->max_slice_width);
290 	if (!dsc_common_caps->max_slice_width)
291 		return false;
292 
293 	dsc_common_caps->bpp_increment_div = min(dsc_sink_caps->bpp_increment_div, dsc_enc_caps->bpp_increment_div);
294 
295 	// TODO DSC: Remove this workaround for N422 and 420 once it's fixed, or move it to get_dsc_encoder_caps()
296 	if (pixel_encoding == PIXEL_ENCODING_YCBCR422 || pixel_encoding == PIXEL_ENCODING_YCBCR420)
297 		dsc_common_caps->bpp_increment_div = min(dsc_common_caps->bpp_increment_div, (uint32_t)8);
298 
299 	return true;
300 }
301 
302 static inline uint32_t dsc_div_by_10_round_up(uint32_t value)
303 {
304 	return (value + 9) / 10;
305 }
306 
307 static inline uint32_t calc_dsc_bpp_x16(uint32_t stream_bandwidth_kbps, uint32_t pix_clk_100hz, uint32_t bpp_increment_div)
308 {
309 	uint32_t dsc_target_bpp_x16;
310 	float f_dsc_target_bpp;
311 	float f_stream_bandwidth_100bps = stream_bandwidth_kbps * 10.0f;
312 	uint32_t precision = bpp_increment_div; // bpp_increment_div is actually precision
313 
314 	f_dsc_target_bpp = f_stream_bandwidth_100bps / pix_clk_100hz;
315 
316 	// Round down to the nearest precision stop to bring it into DSC spec range
317 	dsc_target_bpp_x16 = (uint32_t)(f_dsc_target_bpp * precision);
318 	dsc_target_bpp_x16 = (dsc_target_bpp_x16 * 16) / precision;
319 
320 	return dsc_target_bpp_x16;
321 }
322 
323 /* Get DSC bandwidth range based on [min_bpp, max_bpp] target bitrate range, and timing's pixel clock
324  * and uncompressed bandwidth.
325  */
326 static void get_dsc_bandwidth_range(
327 		const uint32_t min_bpp,
328 		const uint32_t max_bpp,
329 		const struct dsc_enc_caps *dsc_caps,
330 		const struct dc_crtc_timing *timing,
331 		struct dc_dsc_bw_range *range)
332 {
333 	/* native stream bandwidth */
334 	range->stream_kbps = dc_dsc_bandwidth_in_kbps_from_timing(timing);
335 
336 	/* max dsc target bpp */
337 	range->max_kbps = dsc_div_by_10_round_up(max_bpp * timing->pix_clk_100hz);
338 	range->max_target_bpp_x16 = max_bpp * 16;
339 	if (range->max_kbps > range->stream_kbps) {
340 		/* max dsc target bpp is capped to native bandwidth */
341 		range->max_kbps = range->stream_kbps;
342 		range->max_target_bpp_x16 = calc_dsc_bpp_x16(range->stream_kbps, timing->pix_clk_100hz, dsc_caps->bpp_increment_div);
343 	}
344 
345 	/* min dsc target bpp */
346 	range->min_kbps = dsc_div_by_10_round_up(min_bpp * timing->pix_clk_100hz);
347 	range->min_target_bpp_x16 = min_bpp * 16;
348 	if (range->min_kbps > range->max_kbps) {
349 		/* min dsc target bpp is capped to max dsc bandwidth*/
350 		range->min_kbps = range->max_kbps;
351 		range->min_target_bpp_x16 = range->max_target_bpp_x16;
352 	}
353 }
354 
355 
356 /* Decides if DSC should be used and calculates target bpp if it should, applying DSC policy.
357  *
358  * Returns:
359  *     - 'true' if DSC was required by policy and was successfully applied
360  *     - 'false' if DSC was not necessary (e.g. if uncompressed stream fits 'target_bandwidth_kbps'),
361  *        or if it couldn't be applied based on DSC policy.
362  */
363 static bool decide_dsc_target_bpp_x16(
364 		const struct dc_dsc_policy *policy,
365 		const struct dsc_enc_caps *dsc_common_caps,
366 		const int target_bandwidth_kbps,
367 		const struct dc_crtc_timing *timing,
368 		int *target_bpp_x16)
369 {
370 	bool should_use_dsc = false;
371 	struct dc_dsc_bw_range range;
372 
373 	memset(&range, 0, sizeof(range));
374 
375 	get_dsc_bandwidth_range(policy->min_target_bpp, policy->max_target_bpp,
376 			dsc_common_caps, timing, &range);
377 	if (target_bandwidth_kbps >= range.stream_kbps) {
378 		/* enough bandwidth without dsc */
379 		*target_bpp_x16 = 0;
380 		should_use_dsc = false;
381 	} else if (target_bandwidth_kbps >= range.max_kbps) {
382 		/* use max target bpp allowed */
383 		*target_bpp_x16 = range.max_target_bpp_x16;
384 		should_use_dsc = true;
385 	} else if (target_bandwidth_kbps >= range.min_kbps) {
386 		/* use target bpp that can take entire target bandwidth */
387 		*target_bpp_x16 = calc_dsc_bpp_x16(target_bandwidth_kbps, timing->pix_clk_100hz, dsc_common_caps->bpp_increment_div);
388 		should_use_dsc = true;
389 	} else {
390 		/* not enough bandwidth to fulfill minimum requirement */
391 		*target_bpp_x16 = 0;
392 		should_use_dsc = false;
393 	}
394 
395 	return should_use_dsc;
396 }
397 
398 #define MIN_AVAILABLE_SLICES_SIZE  4
399 
400 static int get_available_dsc_slices(union dsc_enc_slice_caps slice_caps, int *available_slices)
401 {
402 	int idx = 0;
403 
404 	memset(available_slices, -1, MIN_AVAILABLE_SLICES_SIZE);
405 
406 	if (slice_caps.bits.NUM_SLICES_1)
407 		available_slices[idx++] = 1;
408 
409 	if (slice_caps.bits.NUM_SLICES_2)
410 		available_slices[idx++] = 2;
411 
412 	if (slice_caps.bits.NUM_SLICES_4)
413 		available_slices[idx++] = 4;
414 
415 	if (slice_caps.bits.NUM_SLICES_8)
416 		available_slices[idx++] = 8;
417 
418 	return idx;
419 }
420 
421 
422 static int get_max_dsc_slices(union dsc_enc_slice_caps slice_caps)
423 {
424 	int max_slices = 0;
425 	int available_slices[MIN_AVAILABLE_SLICES_SIZE];
426 	int end_idx = get_available_dsc_slices(slice_caps, &available_slices[0]);
427 
428 	if (end_idx > 0)
429 		max_slices = available_slices[end_idx - 1];
430 
431 	return max_slices;
432 }
433 
434 
435 // Increment sice number in available sice numbers stops if possible, or just increment if not
436 static int inc_num_slices(union dsc_enc_slice_caps slice_caps, int num_slices)
437 {
438 	// Get next bigger num slices available in common caps
439 	int available_slices[MIN_AVAILABLE_SLICES_SIZE];
440 	int end_idx;
441 	int i;
442 	int new_num_slices = num_slices;
443 
444 	end_idx = get_available_dsc_slices(slice_caps, &available_slices[0]);
445 	if (end_idx == 0) {
446 		// No available slices found
447 		new_num_slices++;
448 		return new_num_slices;
449 	}
450 
451 	// Numbers of slices found - get the next bigger number
452 	for (i = 0; i < end_idx; i++) {
453 		if (new_num_slices < available_slices[i]) {
454 			new_num_slices = available_slices[i];
455 			break;
456 		}
457 	}
458 
459 	if (new_num_slices == num_slices) // No biger number of slices found
460 		new_num_slices++;
461 
462 	return new_num_slices;
463 }
464 
465 
466 // Decrement sice number in available sice numbers stops if possible, or just decrement if not. Stop at zero.
467 static int dec_num_slices(union dsc_enc_slice_caps slice_caps, int num_slices)
468 {
469 	// Get next bigger num slices available in common caps
470 	int available_slices[MIN_AVAILABLE_SLICES_SIZE];
471 	int end_idx;
472 	int i;
473 	int new_num_slices = num_slices;
474 
475 	end_idx = get_available_dsc_slices(slice_caps, &available_slices[0]);
476 	if (end_idx == 0 && new_num_slices > 0) {
477 		// No numbers of slices found
478 		new_num_slices++;
479 		return new_num_slices;
480 	}
481 
482 	// Numbers of slices found - get the next smaller number
483 	for (i = end_idx - 1; i >= 0; i--) {
484 		if (new_num_slices > available_slices[i]) {
485 			new_num_slices = available_slices[i];
486 			break;
487 		}
488 	}
489 
490 	if (new_num_slices == num_slices) {
491 		// No smaller number of slices found
492 		new_num_slices--;
493 		if (new_num_slices < 0)
494 			new_num_slices = 0;
495 	}
496 
497 	return new_num_slices;
498 }
499 
500 
501 // Choose next bigger number of slices if the requested number of slices is not available
502 static int fit_num_slices_up(union dsc_enc_slice_caps slice_caps, int num_slices)
503 {
504 	// Get next bigger num slices available in common caps
505 	int available_slices[MIN_AVAILABLE_SLICES_SIZE];
506 	int end_idx;
507 	int i;
508 	int new_num_slices = num_slices;
509 
510 	end_idx = get_available_dsc_slices(slice_caps, &available_slices[0]);
511 	if (end_idx == 0) {
512 		// No available slices found
513 		new_num_slices++;
514 		return new_num_slices;
515 	}
516 
517 	// Numbers of slices found - get the equal or next bigger number
518 	for (i = 0; i < end_idx; i++) {
519 		if (new_num_slices <= available_slices[i]) {
520 			new_num_slices = available_slices[i];
521 			break;
522 		}
523 	}
524 
525 	return new_num_slices;
526 }
527 
528 
529 /* Attempts to set DSC configuration for the stream, applying DSC policy.
530  * Returns 'true' if successful or 'false' if not.
531  *
532  * Parameters:
533  *
534  * dsc_sink_caps       - DSC sink decoder capabilities (from DPCD)
535  *
536  * dsc_enc_caps        - DSC encoder capabilities
537  *
538  * target_bandwidth_kbps  - Target bandwidth to fit the stream into.
539  *                          If 0, do not calculate target bpp.
540  *
541  * timing              - The stream timing to fit into 'target_bandwidth_kbps' or apply
542  *                       maximum compression to, if 'target_badwidth == 0'
543  *
544  * dsc_cfg             - DSC configuration to use if it was possible to come up with
545  *                       one for the given inputs.
546  *                       The target bitrate after DSC can be calculated by multiplying
547  *                       dsc_cfg.bits_per_pixel (in U6.4 format) by pixel rate, e.g.
548  *
549  *                       dsc_stream_bitrate_kbps = (int)ceil(timing->pix_clk_khz * dsc_cfg.bits_per_pixel / 16.0);
550  */
551 static bool setup_dsc_config(
552 		const struct dsc_dec_dpcd_caps *dsc_sink_caps,
553 		const struct dsc_enc_caps *dsc_enc_caps,
554 		int target_bandwidth_kbps,
555 		const struct dc_crtc_timing *timing,
556 		int min_slice_height_override,
557 		struct dc_dsc_config *dsc_cfg)
558 {
559 	struct dsc_enc_caps dsc_common_caps;
560 	int max_slices_h;
561 	int min_slices_h;
562 	int num_slices_h;
563 	int pic_width;
564 	int slice_width;
565 	int target_bpp;
566 	int sink_per_slice_throughput_mps;
567 	int branch_max_throughput_mps = 0;
568 	bool is_dsc_possible = false;
569 	int pic_height;
570 	int slice_height;
571 	struct dc_dsc_policy policy;
572 
573 	memset(dsc_cfg, 0, sizeof(struct dc_dsc_config));
574 
575 	dc_dsc_get_policy_for_timing(timing, &policy);
576 	pic_width = timing->h_addressable + timing->h_border_left + timing->h_border_right;
577 	pic_height = timing->v_addressable + timing->v_border_top + timing->v_border_bottom;
578 
579 	if (!dsc_sink_caps->is_dsc_supported)
580 		goto done;
581 
582 	if (dsc_sink_caps->branch_max_line_width && dsc_sink_caps->branch_max_line_width < pic_width)
583 		goto done;
584 
585 	// Intersect decoder with encoder DSC caps and validate DSC settings
586 	is_dsc_possible = intersect_dsc_caps(dsc_sink_caps, dsc_enc_caps, timing->pixel_encoding, &dsc_common_caps);
587 	if (!is_dsc_possible)
588 		goto done;
589 
590 	if (target_bandwidth_kbps > 0) {
591 		is_dsc_possible = decide_dsc_target_bpp_x16(
592 				&policy,
593 				&dsc_common_caps,
594 				target_bandwidth_kbps,
595 				timing,
596 				&target_bpp);
597 		dsc_cfg->bits_per_pixel = target_bpp;
598 	}
599 	if (!is_dsc_possible)
600 		goto done;
601 
602 	sink_per_slice_throughput_mps = 0;
603 
604 	// Validate available DSC settings against the mode timing
605 
606 	// Validate color format (and pick up the throughput values)
607 	dsc_cfg->ycbcr422_simple = false;
608 	switch (timing->pixel_encoding)	{
609 	case PIXEL_ENCODING_RGB:
610 		is_dsc_possible = (bool)dsc_common_caps.color_formats.bits.RGB;
611 		sink_per_slice_throughput_mps = dsc_sink_caps->throughput_mode_0_mps;
612 		branch_max_throughput_mps = dsc_sink_caps->branch_overall_throughput_0_mps;
613 		break;
614 	case PIXEL_ENCODING_YCBCR444:
615 		is_dsc_possible = (bool)dsc_common_caps.color_formats.bits.YCBCR_444;
616 		sink_per_slice_throughput_mps = dsc_sink_caps->throughput_mode_0_mps;
617 		branch_max_throughput_mps = dsc_sink_caps->branch_overall_throughput_0_mps;
618 		break;
619 	case PIXEL_ENCODING_YCBCR422:
620 		is_dsc_possible = (bool)dsc_common_caps.color_formats.bits.YCBCR_NATIVE_422;
621 		sink_per_slice_throughput_mps = dsc_sink_caps->throughput_mode_1_mps;
622 		branch_max_throughput_mps = dsc_sink_caps->branch_overall_throughput_1_mps;
623 		if (!is_dsc_possible) {
624 			is_dsc_possible = (bool)dsc_common_caps.color_formats.bits.YCBCR_SIMPLE_422;
625 			dsc_cfg->ycbcr422_simple = is_dsc_possible;
626 			sink_per_slice_throughput_mps = dsc_sink_caps->throughput_mode_0_mps;
627 		}
628 		break;
629 	case PIXEL_ENCODING_YCBCR420:
630 		is_dsc_possible = (bool)dsc_common_caps.color_formats.bits.YCBCR_NATIVE_420;
631 		sink_per_slice_throughput_mps = dsc_sink_caps->throughput_mode_1_mps;
632 		branch_max_throughput_mps = dsc_sink_caps->branch_overall_throughput_1_mps;
633 		break;
634 	default:
635 		is_dsc_possible = false;
636 	}
637 
638 	// Validate branch's maximum throughput
639 	if (branch_max_throughput_mps && dsc_div_by_10_round_up(timing->pix_clk_100hz) > branch_max_throughput_mps * 1000)
640 		is_dsc_possible = false;
641 
642 	if (!is_dsc_possible)
643 		goto done;
644 
645 	// Color depth
646 	switch (timing->display_color_depth) {
647 	case COLOR_DEPTH_888:
648 		is_dsc_possible = (bool)dsc_common_caps.color_depth.bits.COLOR_DEPTH_8_BPC;
649 		break;
650 	case COLOR_DEPTH_101010:
651 		is_dsc_possible = (bool)dsc_common_caps.color_depth.bits.COLOR_DEPTH_10_BPC;
652 		break;
653 	case COLOR_DEPTH_121212:
654 		is_dsc_possible = (bool)dsc_common_caps.color_depth.bits.COLOR_DEPTH_12_BPC;
655 		break;
656 	default:
657 		is_dsc_possible = false;
658 	}
659 
660 	if (!is_dsc_possible)
661 		goto done;
662 
663 	// Slice width (i.e. number of slices per line)
664 	max_slices_h = get_max_dsc_slices(dsc_common_caps.slice_caps);
665 
666 	while (max_slices_h > 0) {
667 		if (pic_width % max_slices_h == 0)
668 			break;
669 
670 		max_slices_h = dec_num_slices(dsc_common_caps.slice_caps, max_slices_h);
671 	}
672 
673 	is_dsc_possible = (dsc_common_caps.max_slice_width > 0);
674 	if (!is_dsc_possible)
675 		goto done;
676 
677 	min_slices_h = pic_width / dsc_common_caps.max_slice_width;
678 	if (pic_width % dsc_common_caps.max_slice_width)
679 		min_slices_h++;
680 
681 	min_slices_h = fit_num_slices_up(dsc_common_caps.slice_caps, min_slices_h);
682 
683 	while (min_slices_h <= max_slices_h) {
684 		int pix_clk_per_slice_khz = dsc_div_by_10_round_up(timing->pix_clk_100hz) / min_slices_h;
685 		if (pix_clk_per_slice_khz <= sink_per_slice_throughput_mps * 1000)
686 			break;
687 
688 		min_slices_h = inc_num_slices(dsc_common_caps.slice_caps, min_slices_h);
689 	}
690 
691 	if (pic_width % min_slices_h != 0)
692 		min_slices_h = 0; // DSC TODO: Maybe try increasing the number of slices first?
693 
694 	is_dsc_possible = (min_slices_h <= max_slices_h);
695 	if (!is_dsc_possible)
696 		goto done;
697 
698 	if (policy.use_min_slices_h) {
699 		if (min_slices_h > 0)
700 			num_slices_h = min_slices_h;
701 		else if (max_slices_h > 0) { // Fall back to max slices if min slices is not working out
702 			if (policy.max_slices_h)
703 				num_slices_h = min(policy.max_slices_h, max_slices_h);
704 			else
705 				num_slices_h = max_slices_h;
706 		} else
707 			is_dsc_possible = false;
708 	} else {
709 		if (max_slices_h > 0) {
710 			if (policy.max_slices_h)
711 				num_slices_h = min(policy.max_slices_h, max_slices_h);
712 			else
713 				num_slices_h = max_slices_h;
714 		} else if (min_slices_h > 0) // Fall back to min slices if max slices is not possible
715 			num_slices_h = min_slices_h;
716 		else
717 			is_dsc_possible = false;
718 	}
719 
720 	if (!is_dsc_possible)
721 		goto done;
722 
723 	dsc_cfg->num_slices_h = num_slices_h;
724 	slice_width = pic_width / num_slices_h;
725 
726 	is_dsc_possible = slice_width <= dsc_common_caps.max_slice_width;
727 	if (!is_dsc_possible)
728 		goto done;
729 
730 	// Slice height (i.e. number of slices per column): start with policy and pick the first one that height is divisible by.
731 	// For 4:2:0 make sure the slice height is divisible by 2 as well.
732 	if (min_slice_height_override == 0)
733 		slice_height = min(policy.min_slice_height, pic_height);
734 	else
735 		slice_height = min(min_slice_height_override, pic_height);
736 
737 	while (slice_height < pic_height && (pic_height % slice_height != 0 ||
738 		(timing->pixel_encoding == PIXEL_ENCODING_YCBCR420 && slice_height % 2 != 0)))
739 		slice_height++;
740 
741 	if (timing->pixel_encoding == PIXEL_ENCODING_YCBCR420) // For the case when pic_height < dsc_policy.min_sice_height
742 		is_dsc_possible = (slice_height % 2 == 0);
743 
744 	if (!is_dsc_possible)
745 		goto done;
746 
747 	dsc_cfg->num_slices_v = pic_height/slice_height;
748 
749 	// Final decission: can we do DSC or not?
750 	if (is_dsc_possible) {
751 		// Fill out the rest of DSC settings
752 		dsc_cfg->block_pred_enable = dsc_common_caps.is_block_pred_supported;
753 		dsc_cfg->linebuf_depth = dsc_common_caps.lb_bit_depth;
754 		dsc_cfg->version_minor = (dsc_common_caps.dsc_version & 0xf0) >> 4;
755 	}
756 
757 done:
758 	if (!is_dsc_possible)
759 		memset(dsc_cfg, 0, sizeof(struct dc_dsc_config));
760 
761 	return is_dsc_possible;
762 }
763 
764 bool dc_dsc_parse_dsc_dpcd(const struct dc *dc, const uint8_t *dpcd_dsc_basic_data, const uint8_t *dpcd_dsc_ext_data, struct dsc_dec_dpcd_caps *dsc_sink_caps)
765 {
766 	if (!dpcd_dsc_basic_data)
767 		return false;
768 
769 	dsc_sink_caps->is_dsc_supported = (dpcd_dsc_basic_data[DP_DSC_SUPPORT - DP_DSC_SUPPORT] & DP_DSC_DECOMPRESSION_IS_SUPPORTED) != 0;
770 	if (!dsc_sink_caps->is_dsc_supported)
771 		return false;
772 
773 	dsc_sink_caps->dsc_version = dpcd_dsc_basic_data[DP_DSC_REV - DP_DSC_SUPPORT];
774 
775 	{
776 		int buff_block_size;
777 		int buff_size;
778 
779 		if (!dsc_buff_block_size_from_dpcd(dpcd_dsc_basic_data[DP_DSC_RC_BUF_BLK_SIZE - DP_DSC_SUPPORT], &buff_block_size))
780 			return false;
781 
782 		buff_size = dpcd_dsc_basic_data[DP_DSC_RC_BUF_SIZE - DP_DSC_SUPPORT] + 1;
783 		dsc_sink_caps->rc_buffer_size = buff_size * buff_block_size;
784 	}
785 
786 	dsc_sink_caps->slice_caps1.raw = dpcd_dsc_basic_data[DP_DSC_SLICE_CAP_1 - DP_DSC_SUPPORT];
787 	if (!dsc_line_buff_depth_from_dpcd(dpcd_dsc_basic_data[DP_DSC_LINE_BUF_BIT_DEPTH - DP_DSC_SUPPORT], &dsc_sink_caps->lb_bit_depth))
788 		return false;
789 
790 	dsc_sink_caps->is_block_pred_supported =
791 		(dpcd_dsc_basic_data[DP_DSC_BLK_PREDICTION_SUPPORT - DP_DSC_SUPPORT] & DP_DSC_BLK_PREDICTION_IS_SUPPORTED) != 0;
792 
793 	dsc_sink_caps->edp_max_bits_per_pixel =
794 		dpcd_dsc_basic_data[DP_DSC_MAX_BITS_PER_PIXEL_LOW - DP_DSC_SUPPORT] |
795 		dpcd_dsc_basic_data[DP_DSC_MAX_BITS_PER_PIXEL_HI - DP_DSC_SUPPORT] << 8;
796 
797 	dsc_sink_caps->color_formats.raw = dpcd_dsc_basic_data[DP_DSC_DEC_COLOR_FORMAT_CAP - DP_DSC_SUPPORT];
798 	dsc_sink_caps->color_depth.raw = dpcd_dsc_basic_data[DP_DSC_DEC_COLOR_DEPTH_CAP - DP_DSC_SUPPORT];
799 
800 	{
801 		int dpcd_throughput = dpcd_dsc_basic_data[DP_DSC_PEAK_THROUGHPUT - DP_DSC_SUPPORT];
802 
803 		if (!dsc_throughput_from_dpcd(dpcd_throughput & DP_DSC_THROUGHPUT_MODE_0_MASK, &dsc_sink_caps->throughput_mode_0_mps))
804 			return false;
805 
806 		dpcd_throughput = (dpcd_throughput & DP_DSC_THROUGHPUT_MODE_1_MASK) >> DP_DSC_THROUGHPUT_MODE_1_SHIFT;
807 		if (!dsc_throughput_from_dpcd(dpcd_throughput, &dsc_sink_caps->throughput_mode_1_mps))
808 			return false;
809 	}
810 
811 	dsc_sink_caps->max_slice_width = dpcd_dsc_basic_data[DP_DSC_MAX_SLICE_WIDTH - DP_DSC_SUPPORT] * 320;
812 	dsc_sink_caps->slice_caps2.raw = dpcd_dsc_basic_data[DP_DSC_SLICE_CAP_2 - DP_DSC_SUPPORT];
813 
814 	if (!dsc_bpp_increment_div_from_dpcd(dpcd_dsc_basic_data[DP_DSC_BITS_PER_PIXEL_INC - DP_DSC_SUPPORT], &dsc_sink_caps->bpp_increment_div))
815 		return false;
816 
817 	if (dc->debug.dsc_bpp_increment_div) {
818 		/* dsc_bpp_increment_div should onl be 1, 2, 4, 8 or 16, but rather than rejecting invalid values,
819 		 * we'll accept all and get it into range. This also makes the above check against 0 redundant,
820 		 * but that one stresses out the override will be only used if it's not 0.
821 		 */
822 		if (dc->debug.dsc_bpp_increment_div >= 1)
823 			dsc_sink_caps->bpp_increment_div = 1;
824 		if (dc->debug.dsc_bpp_increment_div >= 2)
825 			dsc_sink_caps->bpp_increment_div = 2;
826 		if (dc->debug.dsc_bpp_increment_div >= 4)
827 			dsc_sink_caps->bpp_increment_div = 4;
828 		if (dc->debug.dsc_bpp_increment_div >= 8)
829 			dsc_sink_caps->bpp_increment_div = 8;
830 		if (dc->debug.dsc_bpp_increment_div >= 16)
831 			dsc_sink_caps->bpp_increment_div = 16;
832 	}
833 
834 	/* Extended caps */
835 	if (dpcd_dsc_ext_data == NULL) { // Extended DPCD DSC data can be null, e.g. because it doesn't apply to SST
836 		dsc_sink_caps->branch_overall_throughput_0_mps = 0;
837 		dsc_sink_caps->branch_overall_throughput_1_mps = 0;
838 		dsc_sink_caps->branch_max_line_width = 0;
839 		return true;
840 	}
841 
842 	dsc_sink_caps->branch_overall_throughput_0_mps = dpcd_dsc_ext_data[DP_DSC_BRANCH_OVERALL_THROUGHPUT_0 - DP_DSC_BRANCH_OVERALL_THROUGHPUT_0];
843 	if (dsc_sink_caps->branch_overall_throughput_0_mps == 0)
844 		dsc_sink_caps->branch_overall_throughput_0_mps = 0;
845 	else if (dsc_sink_caps->branch_overall_throughput_0_mps == 1)
846 		dsc_sink_caps->branch_overall_throughput_0_mps = 680;
847 	else {
848 		dsc_sink_caps->branch_overall_throughput_0_mps *= 50;
849 		dsc_sink_caps->branch_overall_throughput_0_mps += 600;
850 	}
851 
852 	dsc_sink_caps->branch_overall_throughput_1_mps = dpcd_dsc_ext_data[DP_DSC_BRANCH_OVERALL_THROUGHPUT_1 - DP_DSC_BRANCH_OVERALL_THROUGHPUT_0];
853 	if (dsc_sink_caps->branch_overall_throughput_1_mps == 0)
854 		dsc_sink_caps->branch_overall_throughput_1_mps = 0;
855 	else if (dsc_sink_caps->branch_overall_throughput_1_mps == 1)
856 		dsc_sink_caps->branch_overall_throughput_1_mps = 680;
857 	else {
858 		dsc_sink_caps->branch_overall_throughput_1_mps *= 50;
859 		dsc_sink_caps->branch_overall_throughput_1_mps += 600;
860 	}
861 
862 	dsc_sink_caps->branch_max_line_width = dpcd_dsc_ext_data[DP_DSC_BRANCH_MAX_LINE_WIDTH - DP_DSC_BRANCH_OVERALL_THROUGHPUT_0] * 320;
863 	ASSERT(dsc_sink_caps->branch_max_line_width == 0 || dsc_sink_caps->branch_max_line_width >= 5120);
864 
865 	return true;
866 }
867 
868 
869 /* If DSC is possbile, get DSC bandwidth range based on [min_bpp, max_bpp] target bitrate range and
870  * timing's pixel clock and uncompressed bandwidth.
871  * If DSC is not possible, leave '*range' untouched.
872  */
873 bool dc_dsc_compute_bandwidth_range(
874 		const struct display_stream_compressor *dsc,
875 		const uint32_t dsc_min_slice_height_override,
876 		const uint32_t min_bpp,
877 		const uint32_t max_bpp,
878 		const struct dsc_dec_dpcd_caps *dsc_sink_caps,
879 		const struct dc_crtc_timing *timing,
880 		struct dc_dsc_bw_range *range)
881 {
882 	bool is_dsc_possible = false;
883 	struct dsc_enc_caps dsc_enc_caps;
884 	struct dsc_enc_caps dsc_common_caps;
885 	struct dc_dsc_config config;
886 
887 	get_dsc_enc_caps(dsc, &dsc_enc_caps, timing->pix_clk_100hz);
888 
889 	is_dsc_possible = intersect_dsc_caps(dsc_sink_caps, &dsc_enc_caps,
890 			timing->pixel_encoding, &dsc_common_caps);
891 
892 	if (is_dsc_possible)
893 		is_dsc_possible = setup_dsc_config(dsc_sink_caps, &dsc_enc_caps, 0, timing,
894 				dsc_min_slice_height_override, &config);
895 
896 	if (is_dsc_possible)
897 		get_dsc_bandwidth_range(min_bpp, max_bpp, &dsc_common_caps, timing, range);
898 
899 	return is_dsc_possible;
900 }
901 
902 bool dc_dsc_compute_config(
903 		const struct display_stream_compressor *dsc,
904 		const struct dsc_dec_dpcd_caps *dsc_sink_caps,
905 		const uint32_t dsc_min_slice_height_override,
906 		uint32_t target_bandwidth_kbps,
907 		const struct dc_crtc_timing *timing,
908 		struct dc_dsc_config *dsc_cfg)
909 {
910 	bool is_dsc_possible = false;
911 	struct dsc_enc_caps dsc_enc_caps;
912 
913 	get_dsc_enc_caps(dsc, &dsc_enc_caps, timing->pix_clk_100hz);
914 	is_dsc_possible = setup_dsc_config(dsc_sink_caps,
915 			&dsc_enc_caps,
916 			target_bandwidth_kbps,
917 			timing, dsc_min_slice_height_override, dsc_cfg);
918 	return is_dsc_possible;
919 }
920 
921 void dc_dsc_get_policy_for_timing(const struct dc_crtc_timing *timing, struct dc_dsc_policy *policy)
922 {
923 	uint32_t bpc = 0;
924 
925 	policy->min_target_bpp = 0;
926 	policy->max_target_bpp = 0;
927 
928 	/* DSC Policy: Use minimum number of slices that fits the pixel clock */
929 	policy->use_min_slices_h = true;
930 
931 	/* DSC Policy: Use max available slices
932 	 * (in our case 4 for or 8, depending on the mode)
933 	 */
934 	policy->max_slices_h = 0;
935 
936 	/* DSC Policy: Use slice height recommended
937 	 * by VESA DSC Spreadsheet user guide
938 	 */
939 	policy->min_slice_height = 108;
940 
941 	/* DSC Policy: follow DP specs with an internal upper limit to 16 bpp
942 	 * for better interoperability
943 	 */
944 	switch (timing->display_color_depth) {
945 	case COLOR_DEPTH_888:
946 		bpc = 8;
947 		break;
948 	case COLOR_DEPTH_101010:
949 		bpc = 10;
950 		break;
951 	case COLOR_DEPTH_121212:
952 		bpc = 12;
953 		break;
954 	default:
955 		return;
956 	}
957 	switch (timing->pixel_encoding) {
958 	case PIXEL_ENCODING_RGB:
959 	case PIXEL_ENCODING_YCBCR444:
960 	case PIXEL_ENCODING_YCBCR422: /* assume no YCbCr422 native support */
961 		/* DP specs limits to 8 */
962 		policy->min_target_bpp = 8;
963 		/* DP specs limits to 3 x bpc */
964 		policy->max_target_bpp = 3 * bpc;
965 		break;
966 	case PIXEL_ENCODING_YCBCR420:
967 		/* DP specs limits to 6 */
968 		policy->min_target_bpp = 6;
969 		/* DP specs limits to 1.5 x bpc assume bpc is an even number */
970 		policy->max_target_bpp = bpc * 3 / 2;
971 		break;
972 	default:
973 		return;
974 	}
975 	/* internal upper limit, default 16 bpp */
976 	if (policy->max_target_bpp > dsc_policy_max_target_bpp_limit)
977 		policy->max_target_bpp = dsc_policy_max_target_bpp_limit;
978 }
979 
980 void dc_dsc_policy_set_max_target_bpp_limit(uint32_t limit)
981 {
982 	dsc_policy_max_target_bpp_limit = limit;
983 }
984