xref: /linux/drivers/gpu/drm/amd/display/dc/dcn30/dcn30_cm_common.c (revision 3fd6c59042dbba50391e30862beac979491145fe)
1 /*
2  * Copyright 2020 Advanced Micro Devices, Inc.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice shall be included in
12  * all copies or substantial portions of the Software.
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20  * OTHER DEALINGS IN THE SOFTWARE.
21  *
22  * Authors: AMD
23  *
24  */
25 
26 #include "dm_services.h"
27 #include "core_types.h"
28 #include "reg_helper.h"
29 #include "dcn30/dcn30_dpp.h"
30 #include "basics/conversion.h"
31 #include "dcn30/dcn30_cm_common.h"
32 #include "custom_float.h"
33 
/* Register identifiers are used verbatim: REG() adds no prefix or lookup. */
#define REG(reg) reg

/*
 * Context expression for the register helper macros (presumably consumed by
 * the REG_SET* helpers declared elsewhere -- confirm in reg_helper.h).
 * Here it resolves to a local variable/parameter named `ctx`.
 */
#define CTX \
	ctx //dpp->base.ctx

/*
 * Expand a field name into its "shift, mask" argument pair, both read from a
 * local descriptor that must be named `reg`. The reg_name argument is ignored.
 */
#undef FN
#define FN(reg_name, field_name) \
	reg->shifts.field_name, reg->masks.field_name
42 
cm_helper_program_gamcor_xfer_func(struct dc_context * ctx,const struct pwl_params * params,const struct dcn3_xfer_func_reg * reg)43 void cm_helper_program_gamcor_xfer_func(
44 		struct dc_context *ctx,
45 		const struct pwl_params *params,
46 		const struct dcn3_xfer_func_reg *reg)
47 {
48 	uint32_t reg_region_cur;
49 	unsigned int i = 0;
50 
51 	REG_SET_2(reg->start_cntl_b, 0,
52 		exp_region_start, params->corner_points[0].blue.custom_float_x,
53 		exp_resion_start_segment, 0);
54 	REG_SET_2(reg->start_cntl_g, 0,
55 		exp_region_start, params->corner_points[0].green.custom_float_x,
56 		exp_resion_start_segment, 0);
57 	REG_SET_2(reg->start_cntl_r, 0,
58 		exp_region_start, params->corner_points[0].red.custom_float_x,
59 		exp_resion_start_segment, 0);
60 
61 	REG_SET(reg->start_slope_cntl_b, 0, //linear slope at start of curve
62 		field_region_linear_slope, params->corner_points[0].blue.custom_float_slope);
63 	REG_SET(reg->start_slope_cntl_g, 0,
64 		field_region_linear_slope, params->corner_points[0].green.custom_float_slope);
65 	REG_SET(reg->start_slope_cntl_r, 0,
66 		field_region_linear_slope, params->corner_points[0].red.custom_float_slope);
67 
68 	REG_SET(reg->start_end_cntl1_b, 0,
69 		field_region_end_base, params->corner_points[1].blue.custom_float_y);
70 	REG_SET(reg->start_end_cntl1_g, 0,
71 		field_region_end_base, params->corner_points[1].green.custom_float_y);
72 	REG_SET(reg->start_end_cntl1_r, 0,
73 		field_region_end_base, params->corner_points[1].red.custom_float_y);
74 
75 	REG_SET_2(reg->start_end_cntl2_b, 0,
76 		field_region_end_slope, params->corner_points[1].blue.custom_float_slope,
77 		field_region_end, params->corner_points[1].blue.custom_float_x);
78 	REG_SET_2(reg->start_end_cntl2_g, 0,
79 		field_region_end_slope, params->corner_points[1].green.custom_float_slope,
80 		field_region_end, params->corner_points[1].green.custom_float_x);
81 	REG_SET_2(reg->start_end_cntl2_r, 0,
82 		field_region_end_slope, params->corner_points[1].red.custom_float_slope,
83 		field_region_end, params->corner_points[1].red.custom_float_x);
84 
85 	for (reg_region_cur = reg->region_start;
86 		reg_region_cur <= reg->region_end;
87 		reg_region_cur++) {
88 
89 		const struct gamma_curve *curve0 = &(params->arr_curve_points[2 * i]);
90 		const struct gamma_curve *curve1 = &(params->arr_curve_points[(2 * i) + 1]);
91 
92 		REG_SET_4(reg_region_cur, 0,
93 			exp_region0_lut_offset, curve0->offset,
94 			exp_region0_num_segments, curve0->segments_num,
95 			exp_region1_lut_offset, curve1->offset,
96 			exp_region1_num_segments, curve1->segments_num);
97 
98 		i++;
99 	}
100 }
101 
102 /* driver uses 32 regions or less, but DCN HW has 34, extra 2 are set to 0 */
103 #define MAX_REGIONS_NUMBER 34
104 #define MAX_LOW_POINT      25
105 #define NUMBER_REGIONS     32
106 #define NUMBER_SW_SEGMENTS 16
107 
cm3_helper_translate_curve_to_hw_format(const struct dc_transfer_func * output_tf,struct pwl_params * lut_params,bool fixpoint)108 bool cm3_helper_translate_curve_to_hw_format(
109 				const struct dc_transfer_func *output_tf,
110 				struct pwl_params *lut_params, bool fixpoint)
111 {
112 	struct curve_points3 *corner_points;
113 	struct pwl_result_data *rgb_resulted;
114 	struct pwl_result_data *rgb;
115 	struct pwl_result_data *rgb_plus_1;
116 	struct pwl_result_data *rgb_minus_1;
117 
118 	int32_t region_start, region_end;
119 	int32_t i;
120 	uint32_t j, k, seg_distr[MAX_REGIONS_NUMBER], increment, start_index, hw_points;
121 
122 	if (output_tf == NULL || lut_params == NULL || output_tf->type == TF_TYPE_BYPASS)
123 		return false;
124 
125 	corner_points = lut_params->corner_points;
126 	rgb_resulted = lut_params->rgb_resulted;
127 	hw_points = 0;
128 
129 	memset(lut_params, 0, sizeof(struct pwl_params));
130 	memset(seg_distr, 0, sizeof(seg_distr));
131 
132 	if (output_tf->tf == TRANSFER_FUNCTION_PQ || output_tf->tf == TRANSFER_FUNCTION_GAMMA22 ||
133 		output_tf->tf == TRANSFER_FUNCTION_HLG) {
134 		/* 32 segments
135 		 * segments are from 2^-25 to 2^7
136 		 */
137 		for (i = 0; i < NUMBER_REGIONS ; i++)
138 			seg_distr[i] = 3;
139 
140 		region_start = -MAX_LOW_POINT;
141 		region_end   = NUMBER_REGIONS - MAX_LOW_POINT;
142 	} else {
143 		/* 13 segments
144 		 * segment is from 2^-12 to 2^0
145 		 * There are less than 256 points, for optimization
146 		 */
147 		const uint8_t SEG_COUNT = 12;
148 
149 		for (i = 0; i < SEG_COUNT; i++)
150 			seg_distr[i] = 4;
151 
152 		seg_distr[SEG_COUNT] = 1;
153 
154 		region_start = -SEG_COUNT;
155 		region_end = 1;
156 	}
157 
158 	for (i = region_end - region_start; i < MAX_REGIONS_NUMBER ; i++)
159 		seg_distr[i] = -1;
160 
161 	for (k = 0; k < MAX_REGIONS_NUMBER; k++) {
162 		if (seg_distr[k] != -1)
163 			hw_points += (1 << seg_distr[k]);
164 	}
165 
166 	j = 0;
167 	for (k = 0; k < (region_end - region_start); k++) {
168 		increment = NUMBER_SW_SEGMENTS / (1 << seg_distr[k]);
169 		start_index = (region_start + k + MAX_LOW_POINT) *
170 				NUMBER_SW_SEGMENTS;
171 		for (i = start_index; i < start_index + NUMBER_SW_SEGMENTS;
172 				i += increment) {
173 			if (j == hw_points)
174 				break;
175 			if (i >= TRANSFER_FUNC_POINTS)
176 				return false;
177 			rgb_resulted[j].red = output_tf->tf_pts.red[i];
178 			rgb_resulted[j].green = output_tf->tf_pts.green[i];
179 			rgb_resulted[j].blue = output_tf->tf_pts.blue[i];
180 			j++;
181 		}
182 	}
183 
184 	/* last point */
185 	start_index = (region_end + MAX_LOW_POINT) * NUMBER_SW_SEGMENTS;
186 	rgb_resulted[hw_points].red = output_tf->tf_pts.red[start_index];
187 	rgb_resulted[hw_points].green = output_tf->tf_pts.green[start_index];
188 	rgb_resulted[hw_points].blue = output_tf->tf_pts.blue[start_index];
189 
190 	rgb_resulted[hw_points+1].red = rgb_resulted[hw_points].red;
191 	rgb_resulted[hw_points+1].green = rgb_resulted[hw_points].green;
192 	rgb_resulted[hw_points+1].blue = rgb_resulted[hw_points].blue;
193 
194 	// All 3 color channels have same x
195 	corner_points[0].red.x = dc_fixpt_pow(dc_fixpt_from_int(2),
196 					     dc_fixpt_from_int(region_start));
197 	corner_points[0].green.x = corner_points[0].red.x;
198 	corner_points[0].blue.x = corner_points[0].red.x;
199 
200 	corner_points[1].red.x = dc_fixpt_pow(dc_fixpt_from_int(2),
201 					     dc_fixpt_from_int(region_end));
202 	corner_points[1].green.x = corner_points[1].red.x;
203 	corner_points[1].blue.x = corner_points[1].red.x;
204 
205 	corner_points[0].red.y = rgb_resulted[0].red;
206 	corner_points[0].green.y = rgb_resulted[0].green;
207 	corner_points[0].blue.y = rgb_resulted[0].blue;
208 
209 	corner_points[0].red.slope = dc_fixpt_div(corner_points[0].red.y,
210 			corner_points[0].red.x);
211 	corner_points[0].green.slope = dc_fixpt_div(corner_points[0].green.y,
212 			corner_points[0].green.x);
213 	corner_points[0].blue.slope = dc_fixpt_div(corner_points[0].blue.y,
214 			corner_points[0].blue.x);
215 
216 	/* see comment above, m_arrPoints[1].y should be the Y value for the
217 	 * region end (m_numOfHwPoints), not last HW point(m_numOfHwPoints - 1)
218 	 */
219 	corner_points[1].red.y = rgb_resulted[hw_points].red;
220 	corner_points[1].green.y = rgb_resulted[hw_points].green;
221 	corner_points[1].blue.y = rgb_resulted[hw_points].blue;
222 	corner_points[1].red.slope = dc_fixpt_zero;
223 	corner_points[1].green.slope = dc_fixpt_zero;
224 	corner_points[1].blue.slope = dc_fixpt_zero;
225 
226 	// DCN3+ have 257 pts in lieu of no separate slope registers
227 	// Prior HW had 256 base+slope pairs
228 	lut_params->hw_points_num = hw_points + 1;
229 
230 	k = 0;
231 	for (i = 1; i < MAX_REGIONS_NUMBER; i++) {
232 		if (seg_distr[k] != -1) {
233 			lut_params->arr_curve_points[k].segments_num =
234 					seg_distr[k];
235 			lut_params->arr_curve_points[i].offset =
236 					lut_params->arr_curve_points[k].offset + (1 << seg_distr[k]);
237 		}
238 		k++;
239 	}
240 
241 	if (seg_distr[k] != -1)
242 		lut_params->arr_curve_points[k].segments_num = seg_distr[k];
243 
244 	rgb = rgb_resulted;
245 	rgb_plus_1 = rgb_resulted + 1;
246 	rgb_minus_1 = rgb;
247 
248 	if (fixpoint == true) {
249 		i = 1;
250 		while (i != hw_points + 2) {
251 			if (i >= hw_points) {
252 				if (dc_fixpt_lt(rgb_plus_1->red, rgb->red))
253 					rgb_plus_1->red = dc_fixpt_add(rgb->red,
254 							rgb_minus_1->delta_red);
255 				if (dc_fixpt_lt(rgb_plus_1->green, rgb->green))
256 					rgb_plus_1->green = dc_fixpt_add(rgb->green,
257 							rgb_minus_1->delta_green);
258 				if (dc_fixpt_lt(rgb_plus_1->blue, rgb->blue))
259 					rgb_plus_1->blue = dc_fixpt_add(rgb->blue,
260 							rgb_minus_1->delta_blue);
261 			}
262 
263 			rgb->delta_red_reg   = dc_fixpt_clamp_u0d10(rgb->delta_red);
264 			rgb->delta_green_reg = dc_fixpt_clamp_u0d10(rgb->delta_green);
265 			rgb->delta_blue_reg  = dc_fixpt_clamp_u0d10(rgb->delta_blue);
266 			rgb->red_reg         = dc_fixpt_clamp_u0d14(rgb->red);
267 			rgb->green_reg       = dc_fixpt_clamp_u0d14(rgb->green);
268 			rgb->blue_reg        = dc_fixpt_clamp_u0d14(rgb->blue);
269 
270 			++rgb_plus_1;
271 			rgb_minus_1 = rgb;
272 			++rgb;
273 			++i;
274 		}
275 	}
276 	cm3_helper_convert_to_custom_float(rgb_resulted,
277 						lut_params->corner_points,
278 						hw_points+1, fixpoint);
279 
280 	return true;
281 }
282 
cm3_helper_convert_to_custom_float(struct pwl_result_data * rgb_resulted,struct curve_points3 * corner_points,uint32_t hw_points_num,bool fixpoint)283 bool cm3_helper_convert_to_custom_float(
284 		struct pwl_result_data *rgb_resulted,
285 		struct curve_points3 *corner_points,
286 		uint32_t hw_points_num,
287 		bool fixpoint)
288 {
289 	struct custom_float_format fmt;
290 
291 	struct pwl_result_data *rgb = rgb_resulted;
292 
293 	uint32_t i = 0;
294 
295 	fmt.exponenta_bits = 6;
296 	fmt.mantissa_bits = 12;
297 	fmt.sign = false;
298 
299 	/* corner_points[0] - beginning base, slope offset for R,G,B
300 	 * corner_points[1] - end base, slope offset for R,G,B
301 	 */
302 	if (!convert_to_custom_float_format(corner_points[0].red.x, &fmt,
303 				&corner_points[0].red.custom_float_x)) {
304 		BREAK_TO_DEBUGGER();
305 		return false;
306 	}
307 	if (!convert_to_custom_float_format(corner_points[0].green.x, &fmt,
308 				&corner_points[0].green.custom_float_x)) {
309 		BREAK_TO_DEBUGGER();
310 		return false;
311 	}
312 	if (!convert_to_custom_float_format(corner_points[0].blue.x, &fmt,
313 				&corner_points[0].blue.custom_float_x)) {
314 		BREAK_TO_DEBUGGER();
315 		return false;
316 	}
317 
318 	if (!convert_to_custom_float_format(corner_points[0].red.offset, &fmt,
319 				&corner_points[0].red.custom_float_offset)) {
320 		BREAK_TO_DEBUGGER();
321 		return false;
322 	}
323 	if (!convert_to_custom_float_format(corner_points[0].green.offset, &fmt,
324 				&corner_points[0].green.custom_float_offset)) {
325 		BREAK_TO_DEBUGGER();
326 		return false;
327 	}
328 	if (!convert_to_custom_float_format(corner_points[0].blue.offset, &fmt,
329 				&corner_points[0].blue.custom_float_offset)) {
330 		BREAK_TO_DEBUGGER();
331 		return false;
332 	}
333 
334 	if (!convert_to_custom_float_format(corner_points[0].red.slope, &fmt,
335 				&corner_points[0].red.custom_float_slope)) {
336 		BREAK_TO_DEBUGGER();
337 		return false;
338 	}
339 	if (!convert_to_custom_float_format(corner_points[0].green.slope, &fmt,
340 				&corner_points[0].green.custom_float_slope)) {
341 		BREAK_TO_DEBUGGER();
342 		return false;
343 	}
344 	if (!convert_to_custom_float_format(corner_points[0].blue.slope, &fmt,
345 				&corner_points[0].blue.custom_float_slope)) {
346 		BREAK_TO_DEBUGGER();
347 		return false;
348 	}
349 
350 	if (fixpoint == true) {
351 		corner_points[1].red.custom_float_y =
352 				dc_fixpt_clamp_u0d14(corner_points[1].red.y);
353 		corner_points[1].green.custom_float_y =
354 				dc_fixpt_clamp_u0d14(corner_points[1].green.y);
355 		corner_points[1].blue.custom_float_y =
356 				dc_fixpt_clamp_u0d14(corner_points[1].blue.y);
357 	} else {
358 		if (!convert_to_custom_float_format(corner_points[1].red.y,
359 				&fmt, &corner_points[1].red.custom_float_y)) {
360 			BREAK_TO_DEBUGGER();
361 			return false;
362 		}
363 		if (!convert_to_custom_float_format(corner_points[1].green.y,
364 				&fmt, &corner_points[1].green.custom_float_y)) {
365 			BREAK_TO_DEBUGGER();
366 			return false;
367 		}
368 		if (!convert_to_custom_float_format(corner_points[1].blue.y,
369 				&fmt, &corner_points[1].blue.custom_float_y)) {
370 			BREAK_TO_DEBUGGER();
371 			return false;
372 		}
373 	}
374 
375 	fmt.mantissa_bits = 10;
376 	fmt.sign = false;
377 
378 	if (!convert_to_custom_float_format(corner_points[1].red.x, &fmt,
379 				&corner_points[1].red.custom_float_x)) {
380 		BREAK_TO_DEBUGGER();
381 		return false;
382 	}
383 	if (!convert_to_custom_float_format(corner_points[1].green.x, &fmt,
384 				&corner_points[1].green.custom_float_x)) {
385 		BREAK_TO_DEBUGGER();
386 		return false;
387 	}
388 	if (!convert_to_custom_float_format(corner_points[1].blue.x, &fmt,
389 				&corner_points[1].blue.custom_float_x)) {
390 		BREAK_TO_DEBUGGER();
391 		return false;
392 	}
393 
394 	if (!convert_to_custom_float_format(corner_points[1].red.slope, &fmt,
395 				&corner_points[1].red.custom_float_slope)) {
396 		BREAK_TO_DEBUGGER();
397 		return false;
398 	}
399 	if (!convert_to_custom_float_format(corner_points[1].green.slope, &fmt,
400 				&corner_points[1].green.custom_float_slope)) {
401 		BREAK_TO_DEBUGGER();
402 		return false;
403 	}
404 	if (!convert_to_custom_float_format(corner_points[1].blue.slope, &fmt,
405 				&corner_points[1].blue.custom_float_slope)) {
406 		BREAK_TO_DEBUGGER();
407 		return false;
408 	}
409 
410 	if (hw_points_num == 0 || rgb_resulted == NULL || fixpoint == true)
411 		return true;
412 
413 	fmt.mantissa_bits = 12;
414 
415 	while (i != hw_points_num) {
416 		if (!convert_to_custom_float_format(rgb->red, &fmt,
417 						    &rgb->red_reg)) {
418 			BREAK_TO_DEBUGGER();
419 			return false;
420 		}
421 
422 		if (!convert_to_custom_float_format(rgb->green, &fmt,
423 						    &rgb->green_reg)) {
424 			BREAK_TO_DEBUGGER();
425 			return false;
426 		}
427 
428 		if (!convert_to_custom_float_format(rgb->blue, &fmt,
429 						    &rgb->blue_reg)) {
430 			BREAK_TO_DEBUGGER();
431 			return false;
432 		}
433 
434 		++rgb;
435 		++i;
436 	}
437 
438 	return true;
439 }
440 
is_rgb_equal(const struct pwl_result_data * rgb,uint32_t num)441 bool is_rgb_equal(const struct pwl_result_data *rgb, uint32_t num)
442 {
443 	uint32_t i;
444 	bool ret = true;
445 
446 	for (i = 0 ; i < num; i++) {
447 		if (rgb[i].red_reg != rgb[i].green_reg ||
448 		rgb[i].blue_reg != rgb[i].red_reg  ||
449 		rgb[i].blue_reg != rgb[i].green_reg) {
450 			ret = false;
451 			break;
452 		}
453 	}
454 	return ret;
455 }
456 
457