1 /*
2 * Copyright 2020 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 *
22 * Authors: AMD
23 *
24 */
25
26 #include "dm_services.h"
27 #include "core_types.h"
28 #include "reg_helper.h"
29 #include "dcn30/dcn30_dpp.h"
30 #include "basics/conversion.h"
31 #include "dcn30/dcn30_cm_common.h"
32 #include "custom_float.h"
33
/*
 * Glue macros, presumably consumed by the REG_SET* helpers pulled in from
 * reg_helper.h (confirm against that header).
 */

/* Register addresses are passed in directly, so REG() is the identity. */
#define REG(reg_addr) reg_addr

/* The DC context is the local variable/parameter named "ctx". */
#define CTX ctx

/*
 * Expand a field name into its "shift, mask" argument pair, both read from
 * the variable named "reg" that is in scope at the point of use. The first
 * macro argument is not used.
 */
#undef FN
#define FN(reg_unused, field) \
	reg->shifts.field, reg->masks.field
42
cm_helper_program_gamcor_xfer_func(struct dc_context * ctx,const struct pwl_params * params,const struct dcn3_xfer_func_reg * reg)43 void cm_helper_program_gamcor_xfer_func(
44 struct dc_context *ctx,
45 const struct pwl_params *params,
46 const struct dcn3_xfer_func_reg *reg)
47 {
48 uint32_t reg_region_cur;
49 unsigned int i = 0;
50
51 REG_SET_2(reg->start_cntl_b, 0,
52 exp_region_start, params->corner_points[0].blue.custom_float_x,
53 exp_resion_start_segment, 0);
54 REG_SET_2(reg->start_cntl_g, 0,
55 exp_region_start, params->corner_points[0].green.custom_float_x,
56 exp_resion_start_segment, 0);
57 REG_SET_2(reg->start_cntl_r, 0,
58 exp_region_start, params->corner_points[0].red.custom_float_x,
59 exp_resion_start_segment, 0);
60
61 REG_SET(reg->start_slope_cntl_b, 0, //linear slope at start of curve
62 field_region_linear_slope, params->corner_points[0].blue.custom_float_slope);
63 REG_SET(reg->start_slope_cntl_g, 0,
64 field_region_linear_slope, params->corner_points[0].green.custom_float_slope);
65 REG_SET(reg->start_slope_cntl_r, 0,
66 field_region_linear_slope, params->corner_points[0].red.custom_float_slope);
67
68 REG_SET(reg->start_end_cntl1_b, 0,
69 field_region_end_base, params->corner_points[1].blue.custom_float_y);
70 REG_SET(reg->start_end_cntl1_g, 0,
71 field_region_end_base, params->corner_points[1].green.custom_float_y);
72 REG_SET(reg->start_end_cntl1_r, 0,
73 field_region_end_base, params->corner_points[1].red.custom_float_y);
74
75 REG_SET_2(reg->start_end_cntl2_b, 0,
76 field_region_end_slope, params->corner_points[1].blue.custom_float_slope,
77 field_region_end, params->corner_points[1].blue.custom_float_x);
78 REG_SET_2(reg->start_end_cntl2_g, 0,
79 field_region_end_slope, params->corner_points[1].green.custom_float_slope,
80 field_region_end, params->corner_points[1].green.custom_float_x);
81 REG_SET_2(reg->start_end_cntl2_r, 0,
82 field_region_end_slope, params->corner_points[1].red.custom_float_slope,
83 field_region_end, params->corner_points[1].red.custom_float_x);
84
85 for (reg_region_cur = reg->region_start;
86 reg_region_cur <= reg->region_end;
87 reg_region_cur++) {
88
89 const struct gamma_curve *curve0 = &(params->arr_curve_points[2 * i]);
90 const struct gamma_curve *curve1 = &(params->arr_curve_points[(2 * i) + 1]);
91
92 REG_SET_4(reg_region_cur, 0,
93 exp_region0_lut_offset, curve0->offset,
94 exp_region0_num_segments, curve0->segments_num,
95 exp_region1_lut_offset, curve1->offset,
96 exp_region1_num_segments, curve1->segments_num);
97
98 i++;
99 }
100 }
101
/*
 * Region bookkeeping for the curve translation below.
 * The driver uses 32 regions or less, but DCN HW has 34; the extra 2 are
 * set to 0.
 */

/* Number of region slots the hardware exposes. */
#define MAX_REGIONS_NUMBER	34
/* Magnitude of the lowest region exponent: the widest curve starts at 2^-25. */
#define MAX_LOW_POINT		25
/* Number of regions the driver fills for the widest curve. */
#define NUMBER_REGIONS		32
/* Number of source transfer-function samples per region. */
#define NUMBER_SW_SEGMENTS	16
107
cm3_helper_translate_curve_to_hw_format(const struct dc_transfer_func * output_tf,struct pwl_params * lut_params,bool fixpoint)108 bool cm3_helper_translate_curve_to_hw_format(
109 const struct dc_transfer_func *output_tf,
110 struct pwl_params *lut_params, bool fixpoint)
111 {
112 struct curve_points3 *corner_points;
113 struct pwl_result_data *rgb_resulted;
114 struct pwl_result_data *rgb;
115 struct pwl_result_data *rgb_plus_1;
116 struct pwl_result_data *rgb_minus_1;
117
118 int32_t region_start, region_end;
119 int32_t i;
120 uint32_t j, k, seg_distr[MAX_REGIONS_NUMBER], increment, start_index, hw_points;
121
122 if (output_tf == NULL || lut_params == NULL || output_tf->type == TF_TYPE_BYPASS)
123 return false;
124
125 corner_points = lut_params->corner_points;
126 rgb_resulted = lut_params->rgb_resulted;
127 hw_points = 0;
128
129 memset(lut_params, 0, sizeof(struct pwl_params));
130 memset(seg_distr, 0, sizeof(seg_distr));
131
132 if (output_tf->tf == TRANSFER_FUNCTION_PQ || output_tf->tf == TRANSFER_FUNCTION_GAMMA22 ||
133 output_tf->tf == TRANSFER_FUNCTION_HLG) {
134 /* 32 segments
135 * segments are from 2^-25 to 2^7
136 */
137 for (i = 0; i < NUMBER_REGIONS ; i++)
138 seg_distr[i] = 3;
139
140 region_start = -MAX_LOW_POINT;
141 region_end = NUMBER_REGIONS - MAX_LOW_POINT;
142 } else {
143 /* 13 segments
144 * segment is from 2^-12 to 2^0
145 * There are less than 256 points, for optimization
146 */
147 const uint8_t SEG_COUNT = 12;
148
149 for (i = 0; i < SEG_COUNT; i++)
150 seg_distr[i] = 4;
151
152 seg_distr[SEG_COUNT] = 1;
153
154 region_start = -SEG_COUNT;
155 region_end = 1;
156 }
157
158 for (i = region_end - region_start; i < MAX_REGIONS_NUMBER ; i++)
159 seg_distr[i] = -1;
160
161 for (k = 0; k < MAX_REGIONS_NUMBER; k++) {
162 if (seg_distr[k] != -1)
163 hw_points += (1 << seg_distr[k]);
164 }
165
166 j = 0;
167 for (k = 0; k < (region_end - region_start); k++) {
168 increment = NUMBER_SW_SEGMENTS / (1 << seg_distr[k]);
169 start_index = (region_start + k + MAX_LOW_POINT) *
170 NUMBER_SW_SEGMENTS;
171 for (i = start_index; i < start_index + NUMBER_SW_SEGMENTS;
172 i += increment) {
173 if (j == hw_points)
174 break;
175 if (i >= TRANSFER_FUNC_POINTS)
176 return false;
177 rgb_resulted[j].red = output_tf->tf_pts.red[i];
178 rgb_resulted[j].green = output_tf->tf_pts.green[i];
179 rgb_resulted[j].blue = output_tf->tf_pts.blue[i];
180 j++;
181 }
182 }
183
184 /* last point */
185 start_index = (region_end + MAX_LOW_POINT) * NUMBER_SW_SEGMENTS;
186 rgb_resulted[hw_points].red = output_tf->tf_pts.red[start_index];
187 rgb_resulted[hw_points].green = output_tf->tf_pts.green[start_index];
188 rgb_resulted[hw_points].blue = output_tf->tf_pts.blue[start_index];
189
190 rgb_resulted[hw_points+1].red = rgb_resulted[hw_points].red;
191 rgb_resulted[hw_points+1].green = rgb_resulted[hw_points].green;
192 rgb_resulted[hw_points+1].blue = rgb_resulted[hw_points].blue;
193
194 // All 3 color channels have same x
195 corner_points[0].red.x = dc_fixpt_pow(dc_fixpt_from_int(2),
196 dc_fixpt_from_int(region_start));
197 corner_points[0].green.x = corner_points[0].red.x;
198 corner_points[0].blue.x = corner_points[0].red.x;
199
200 corner_points[1].red.x = dc_fixpt_pow(dc_fixpt_from_int(2),
201 dc_fixpt_from_int(region_end));
202 corner_points[1].green.x = corner_points[1].red.x;
203 corner_points[1].blue.x = corner_points[1].red.x;
204
205 corner_points[0].red.y = rgb_resulted[0].red;
206 corner_points[0].green.y = rgb_resulted[0].green;
207 corner_points[0].blue.y = rgb_resulted[0].blue;
208
209 corner_points[0].red.slope = dc_fixpt_div(corner_points[0].red.y,
210 corner_points[0].red.x);
211 corner_points[0].green.slope = dc_fixpt_div(corner_points[0].green.y,
212 corner_points[0].green.x);
213 corner_points[0].blue.slope = dc_fixpt_div(corner_points[0].blue.y,
214 corner_points[0].blue.x);
215
216 /* see comment above, m_arrPoints[1].y should be the Y value for the
217 * region end (m_numOfHwPoints), not last HW point(m_numOfHwPoints - 1)
218 */
219 corner_points[1].red.y = rgb_resulted[hw_points].red;
220 corner_points[1].green.y = rgb_resulted[hw_points].green;
221 corner_points[1].blue.y = rgb_resulted[hw_points].blue;
222 corner_points[1].red.slope = dc_fixpt_zero;
223 corner_points[1].green.slope = dc_fixpt_zero;
224 corner_points[1].blue.slope = dc_fixpt_zero;
225
226 // DCN3+ have 257 pts in lieu of no separate slope registers
227 // Prior HW had 256 base+slope pairs
228 lut_params->hw_points_num = hw_points + 1;
229
230 k = 0;
231 for (i = 1; i < MAX_REGIONS_NUMBER; i++) {
232 if (seg_distr[k] != -1) {
233 lut_params->arr_curve_points[k].segments_num =
234 seg_distr[k];
235 lut_params->arr_curve_points[i].offset =
236 lut_params->arr_curve_points[k].offset + (1 << seg_distr[k]);
237 }
238 k++;
239 }
240
241 if (seg_distr[k] != -1)
242 lut_params->arr_curve_points[k].segments_num = seg_distr[k];
243
244 rgb = rgb_resulted;
245 rgb_plus_1 = rgb_resulted + 1;
246 rgb_minus_1 = rgb;
247
248 if (fixpoint == true) {
249 i = 1;
250 while (i != hw_points + 2) {
251 if (i >= hw_points) {
252 if (dc_fixpt_lt(rgb_plus_1->red, rgb->red))
253 rgb_plus_1->red = dc_fixpt_add(rgb->red,
254 rgb_minus_1->delta_red);
255 if (dc_fixpt_lt(rgb_plus_1->green, rgb->green))
256 rgb_plus_1->green = dc_fixpt_add(rgb->green,
257 rgb_minus_1->delta_green);
258 if (dc_fixpt_lt(rgb_plus_1->blue, rgb->blue))
259 rgb_plus_1->blue = dc_fixpt_add(rgb->blue,
260 rgb_minus_1->delta_blue);
261 }
262
263 rgb->delta_red_reg = dc_fixpt_clamp_u0d10(rgb->delta_red);
264 rgb->delta_green_reg = dc_fixpt_clamp_u0d10(rgb->delta_green);
265 rgb->delta_blue_reg = dc_fixpt_clamp_u0d10(rgb->delta_blue);
266 rgb->red_reg = dc_fixpt_clamp_u0d14(rgb->red);
267 rgb->green_reg = dc_fixpt_clamp_u0d14(rgb->green);
268 rgb->blue_reg = dc_fixpt_clamp_u0d14(rgb->blue);
269
270 ++rgb_plus_1;
271 rgb_minus_1 = rgb;
272 ++rgb;
273 ++i;
274 }
275 }
276 cm3_helper_convert_to_custom_float(rgb_resulted,
277 lut_params->corner_points,
278 hw_points+1, fixpoint);
279
280 return true;
281 }
282
cm3_helper_convert_to_custom_float(struct pwl_result_data * rgb_resulted,struct curve_points3 * corner_points,uint32_t hw_points_num,bool fixpoint)283 bool cm3_helper_convert_to_custom_float(
284 struct pwl_result_data *rgb_resulted,
285 struct curve_points3 *corner_points,
286 uint32_t hw_points_num,
287 bool fixpoint)
288 {
289 struct custom_float_format fmt;
290
291 struct pwl_result_data *rgb = rgb_resulted;
292
293 uint32_t i = 0;
294
295 fmt.exponenta_bits = 6;
296 fmt.mantissa_bits = 12;
297 fmt.sign = false;
298
299 /* corner_points[0] - beginning base, slope offset for R,G,B
300 * corner_points[1] - end base, slope offset for R,G,B
301 */
302 if (!convert_to_custom_float_format(corner_points[0].red.x, &fmt,
303 &corner_points[0].red.custom_float_x)) {
304 BREAK_TO_DEBUGGER();
305 return false;
306 }
307 if (!convert_to_custom_float_format(corner_points[0].green.x, &fmt,
308 &corner_points[0].green.custom_float_x)) {
309 BREAK_TO_DEBUGGER();
310 return false;
311 }
312 if (!convert_to_custom_float_format(corner_points[0].blue.x, &fmt,
313 &corner_points[0].blue.custom_float_x)) {
314 BREAK_TO_DEBUGGER();
315 return false;
316 }
317
318 if (!convert_to_custom_float_format(corner_points[0].red.offset, &fmt,
319 &corner_points[0].red.custom_float_offset)) {
320 BREAK_TO_DEBUGGER();
321 return false;
322 }
323 if (!convert_to_custom_float_format(corner_points[0].green.offset, &fmt,
324 &corner_points[0].green.custom_float_offset)) {
325 BREAK_TO_DEBUGGER();
326 return false;
327 }
328 if (!convert_to_custom_float_format(corner_points[0].blue.offset, &fmt,
329 &corner_points[0].blue.custom_float_offset)) {
330 BREAK_TO_DEBUGGER();
331 return false;
332 }
333
334 if (!convert_to_custom_float_format(corner_points[0].red.slope, &fmt,
335 &corner_points[0].red.custom_float_slope)) {
336 BREAK_TO_DEBUGGER();
337 return false;
338 }
339 if (!convert_to_custom_float_format(corner_points[0].green.slope, &fmt,
340 &corner_points[0].green.custom_float_slope)) {
341 BREAK_TO_DEBUGGER();
342 return false;
343 }
344 if (!convert_to_custom_float_format(corner_points[0].blue.slope, &fmt,
345 &corner_points[0].blue.custom_float_slope)) {
346 BREAK_TO_DEBUGGER();
347 return false;
348 }
349
350 if (fixpoint == true) {
351 corner_points[1].red.custom_float_y =
352 dc_fixpt_clamp_u0d14(corner_points[1].red.y);
353 corner_points[1].green.custom_float_y =
354 dc_fixpt_clamp_u0d14(corner_points[1].green.y);
355 corner_points[1].blue.custom_float_y =
356 dc_fixpt_clamp_u0d14(corner_points[1].blue.y);
357 } else {
358 if (!convert_to_custom_float_format(corner_points[1].red.y,
359 &fmt, &corner_points[1].red.custom_float_y)) {
360 BREAK_TO_DEBUGGER();
361 return false;
362 }
363 if (!convert_to_custom_float_format(corner_points[1].green.y,
364 &fmt, &corner_points[1].green.custom_float_y)) {
365 BREAK_TO_DEBUGGER();
366 return false;
367 }
368 if (!convert_to_custom_float_format(corner_points[1].blue.y,
369 &fmt, &corner_points[1].blue.custom_float_y)) {
370 BREAK_TO_DEBUGGER();
371 return false;
372 }
373 }
374
375 fmt.mantissa_bits = 10;
376 fmt.sign = false;
377
378 if (!convert_to_custom_float_format(corner_points[1].red.x, &fmt,
379 &corner_points[1].red.custom_float_x)) {
380 BREAK_TO_DEBUGGER();
381 return false;
382 }
383 if (!convert_to_custom_float_format(corner_points[1].green.x, &fmt,
384 &corner_points[1].green.custom_float_x)) {
385 BREAK_TO_DEBUGGER();
386 return false;
387 }
388 if (!convert_to_custom_float_format(corner_points[1].blue.x, &fmt,
389 &corner_points[1].blue.custom_float_x)) {
390 BREAK_TO_DEBUGGER();
391 return false;
392 }
393
394 if (!convert_to_custom_float_format(corner_points[1].red.slope, &fmt,
395 &corner_points[1].red.custom_float_slope)) {
396 BREAK_TO_DEBUGGER();
397 return false;
398 }
399 if (!convert_to_custom_float_format(corner_points[1].green.slope, &fmt,
400 &corner_points[1].green.custom_float_slope)) {
401 BREAK_TO_DEBUGGER();
402 return false;
403 }
404 if (!convert_to_custom_float_format(corner_points[1].blue.slope, &fmt,
405 &corner_points[1].blue.custom_float_slope)) {
406 BREAK_TO_DEBUGGER();
407 return false;
408 }
409
410 if (hw_points_num == 0 || rgb_resulted == NULL || fixpoint == true)
411 return true;
412
413 fmt.mantissa_bits = 12;
414
415 while (i != hw_points_num) {
416 if (!convert_to_custom_float_format(rgb->red, &fmt,
417 &rgb->red_reg)) {
418 BREAK_TO_DEBUGGER();
419 return false;
420 }
421
422 if (!convert_to_custom_float_format(rgb->green, &fmt,
423 &rgb->green_reg)) {
424 BREAK_TO_DEBUGGER();
425 return false;
426 }
427
428 if (!convert_to_custom_float_format(rgb->blue, &fmt,
429 &rgb->blue_reg)) {
430 BREAK_TO_DEBUGGER();
431 return false;
432 }
433
434 ++rgb;
435 ++i;
436 }
437
438 return true;
439 }
440
is_rgb_equal(const struct pwl_result_data * rgb,uint32_t num)441 bool is_rgb_equal(const struct pwl_result_data *rgb, uint32_t num)
442 {
443 uint32_t i;
444 bool ret = true;
445
446 for (i = 0 ; i < num; i++) {
447 if (rgb[i].red_reg != rgb[i].green_reg ||
448 rgb[i].blue_reg != rgb[i].red_reg ||
449 rgb[i].blue_reg != rgb[i].green_reg) {
450 ret = false;
451 break;
452 }
453 }
454 return ret;
455 }
456
457