2 * Copyright 2020 Advanced Micro Devices, Inc.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
26 #include "dm_services.h"
27 #include "core_types.h"
28 #include "reg_helper.h"
29 #include "dcn30_dpp.h"
30 #include "basics/conversion.h"
31 #include "dcn30_cm_common.h"
32 #include "custom_float.h"
40 #define FN(reg_name, field_name) \
41 reg->shifts.field_name, reg->masks.field_name
43 void cm_helper_program_gamcor_xfer_func(
44 struct dc_context *ctx,
45 const struct pwl_params *params,
46 const struct dcn3_xfer_func_reg *reg)
48 uint32_t reg_region_cur;
51 REG_SET_2(reg->start_cntl_b, 0,
52 exp_region_start, params->corner_points[0].blue.custom_float_x,
53 exp_resion_start_segment, 0);
54 REG_SET_2(reg->start_cntl_g, 0,
55 exp_region_start, params->corner_points[0].green.custom_float_x,
56 exp_resion_start_segment, 0);
57 REG_SET_2(reg->start_cntl_r, 0,
58 exp_region_start, params->corner_points[0].red.custom_float_x,
59 exp_resion_start_segment, 0);
61 REG_SET(reg->start_slope_cntl_b, 0, //linear slope at start of curve
62 field_region_linear_slope, params->corner_points[0].blue.custom_float_slope);
63 REG_SET(reg->start_slope_cntl_g, 0,
64 field_region_linear_slope, params->corner_points[0].green.custom_float_slope);
65 REG_SET(reg->start_slope_cntl_r, 0,
66 field_region_linear_slope, params->corner_points[0].red.custom_float_slope);
68 REG_SET(reg->start_end_cntl1_b, 0,
69 field_region_end_base, params->corner_points[1].blue.custom_float_y);
70 REG_SET(reg->start_end_cntl1_g, 0,
71 field_region_end_base, params->corner_points[1].green.custom_float_y);
72 REG_SET(reg->start_end_cntl1_r, 0,
73 field_region_end_base, params->corner_points[1].red.custom_float_y);
75 REG_SET_2(reg->start_end_cntl2_b, 0,
76 field_region_end_slope, params->corner_points[1].blue.custom_float_slope,
77 field_region_end, params->corner_points[1].blue.custom_float_x);
78 REG_SET_2(reg->start_end_cntl2_g, 0,
79 field_region_end_slope, params->corner_points[1].green.custom_float_slope,
80 field_region_end, params->corner_points[1].green.custom_float_x);
81 REG_SET_2(reg->start_end_cntl2_r, 0,
82 field_region_end_slope, params->corner_points[1].red.custom_float_slope,
83 field_region_end, params->corner_points[1].red.custom_float_x);
85 for (reg_region_cur = reg->region_start;
86 reg_region_cur <= reg->region_end;
89 const struct gamma_curve *curve0 = &(params->arr_curve_points[2 * i]);
90 const struct gamma_curve *curve1 = &(params->arr_curve_points[(2 * i) + 1]);
92 REG_SET_4(reg_region_cur, 0,
93 exp_region0_lut_offset, curve0->offset,
94 exp_region0_num_segments, curve0->segments_num,
95 exp_region1_lut_offset, curve1->offset,
96 exp_region1_num_segments, curve1->segments_num);
102 /* driver uses 32 regions or less, but DCN HW has 34, extra 2 are set to 0 */
103 #define MAX_REGIONS_NUMBER 34
104 #define MAX_LOW_POINT 25
105 #define NUMBER_REGIONS 32
106 #define NUMBER_SW_SEGMENTS 16
108 bool cm3_helper_translate_curve_to_hw_format(
109 const struct dc_transfer_func *output_tf,
110 struct pwl_params *lut_params, bool fixpoint)
112 struct curve_points3 *corner_points;
113 struct pwl_result_data *rgb_resulted;
114 struct pwl_result_data *rgb;
115 struct pwl_result_data *rgb_plus_1;
116 struct pwl_result_data *rgb_minus_1;
117 struct fixed31_32 end_value;
119 int32_t region_start, region_end;
121 uint32_t j, k, seg_distr[MAX_REGIONS_NUMBER], increment, start_index, hw_points;
123 if (output_tf == NULL || lut_params == NULL || output_tf->type == TF_TYPE_BYPASS)
126 corner_points = lut_params->corner_points;
127 rgb_resulted = lut_params->rgb_resulted;
130 memset(lut_params, 0, sizeof(struct pwl_params));
131 memset(seg_distr, 0, sizeof(seg_distr));
133 if (output_tf->tf == TRANSFER_FUNCTION_PQ || output_tf->tf == TRANSFER_FUNCTION_GAMMA22 ||
134 output_tf->tf == TRANSFER_FUNCTION_HLG) {
136 * segments are from 2^-25 to 2^7
138 for (i = 0; i < NUMBER_REGIONS ; i++)
141 region_start = -MAX_LOW_POINT;
142 region_end = NUMBER_REGIONS - MAX_LOW_POINT;
145 * segment is from 2^-10 to 2^0
146 * There are less than 256 points, for optimization
164 for (i = region_end - region_start; i < MAX_REGIONS_NUMBER ; i++)
167 for (k = 0; k < MAX_REGIONS_NUMBER; k++) {
168 if (seg_distr[k] != -1)
169 hw_points += (1 << seg_distr[k]);
173 for (k = 0; k < (region_end - region_start); k++) {
174 increment = NUMBER_SW_SEGMENTS / (1 << seg_distr[k]);
175 start_index = (region_start + k + MAX_LOW_POINT) *
177 for (i = start_index; i < start_index + NUMBER_SW_SEGMENTS;
179 if (j == hw_points - 1)
181 rgb_resulted[j].red = output_tf->tf_pts.red[i];
182 rgb_resulted[j].green = output_tf->tf_pts.green[i];
183 rgb_resulted[j].blue = output_tf->tf_pts.blue[i];
189 start_index = (region_end + MAX_LOW_POINT) * NUMBER_SW_SEGMENTS;
190 rgb_resulted[hw_points - 1].red = output_tf->tf_pts.red[start_index];
191 rgb_resulted[hw_points - 1].green = output_tf->tf_pts.green[start_index];
192 rgb_resulted[hw_points - 1].blue = output_tf->tf_pts.blue[start_index];
194 rgb_resulted[hw_points].red = rgb_resulted[hw_points - 1].red;
195 rgb_resulted[hw_points].green = rgb_resulted[hw_points - 1].green;
196 rgb_resulted[hw_points].blue = rgb_resulted[hw_points - 1].blue;
198 // All 3 color channels have same x
199 corner_points[0].red.x = dc_fixpt_pow(dc_fixpt_from_int(2),
200 dc_fixpt_from_int(region_start));
201 corner_points[0].green.x = corner_points[0].red.x;
202 corner_points[0].blue.x = corner_points[0].red.x;
204 corner_points[1].red.x = dc_fixpt_pow(dc_fixpt_from_int(2),
205 dc_fixpt_from_int(region_end));
206 corner_points[1].green.x = corner_points[1].red.x;
207 corner_points[1].blue.x = corner_points[1].red.x;
209 corner_points[0].red.y = rgb_resulted[0].red;
210 corner_points[0].green.y = rgb_resulted[0].green;
211 corner_points[0].blue.y = rgb_resulted[0].blue;
213 corner_points[0].red.slope = dc_fixpt_div(corner_points[0].red.y,
214 corner_points[0].red.x);
215 corner_points[0].green.slope = dc_fixpt_div(corner_points[0].green.y,
216 corner_points[0].green.x);
217 corner_points[0].blue.slope = dc_fixpt_div(corner_points[0].blue.y,
218 corner_points[0].blue.x);
220 /* see comment above, m_arrPoints[1].y should be the Y value for the
221 * region end (m_numOfHwPoints), not last HW point(m_numOfHwPoints - 1)
223 corner_points[1].red.y = rgb_resulted[hw_points - 1].red;
224 corner_points[1].green.y = rgb_resulted[hw_points - 1].green;
225 corner_points[1].blue.y = rgb_resulted[hw_points - 1].blue;
226 corner_points[1].red.slope = dc_fixpt_zero;
227 corner_points[1].green.slope = dc_fixpt_zero;
228 corner_points[1].blue.slope = dc_fixpt_zero;
230 if (output_tf->tf == TRANSFER_FUNCTION_PQ || output_tf->tf == TRANSFER_FUNCTION_HLG) {
231 /* for PQ/HLG, we want to have a straight line from last HW X point,
232 * and the slope to be such that we hit 1.0 at 10000/1000 nits.
235 if (output_tf->tf == TRANSFER_FUNCTION_PQ)
236 end_value = dc_fixpt_from_int(125);
238 end_value = dc_fixpt_from_fraction(125, 10);
240 corner_points[1].red.slope = dc_fixpt_div(
241 dc_fixpt_sub(dc_fixpt_one, corner_points[1].red.y),
242 dc_fixpt_sub(end_value, corner_points[1].red.x));
243 corner_points[1].green.slope = dc_fixpt_div(
244 dc_fixpt_sub(dc_fixpt_one, corner_points[1].green.y),
245 dc_fixpt_sub(end_value, corner_points[1].green.x));
246 corner_points[1].blue.slope = dc_fixpt_div(
247 dc_fixpt_sub(dc_fixpt_one, corner_points[1].blue.y),
248 dc_fixpt_sub(end_value, corner_points[1].blue.x));
250 lut_params->hw_points_num = hw_points;
253 for (i = 1; i < MAX_REGIONS_NUMBER; i++) {
254 if (seg_distr[k] != -1) {
255 lut_params->arr_curve_points[k].segments_num =
257 lut_params->arr_curve_points[i].offset =
258 lut_params->arr_curve_points[k].offset + (1 << seg_distr[k]);
263 if (seg_distr[k] != -1)
264 lut_params->arr_curve_points[k].segments_num = seg_distr[k];
267 rgb_plus_1 = rgb_resulted + 1;
271 while (i != hw_points + 1) {
272 if (i >= hw_points - 1) {
273 if (dc_fixpt_lt(rgb_plus_1->red, rgb->red))
274 rgb_plus_1->red = dc_fixpt_add(rgb->red, rgb_minus_1->delta_red);
275 if (dc_fixpt_lt(rgb_plus_1->green, rgb->green))
276 rgb_plus_1->green = dc_fixpt_add(rgb->green, rgb_minus_1->delta_green);
277 if (dc_fixpt_lt(rgb_plus_1->blue, rgb->blue))
278 rgb_plus_1->blue = dc_fixpt_add(rgb->blue, rgb_minus_1->delta_blue);
281 rgb->delta_red = dc_fixpt_sub(rgb_plus_1->red, rgb->red);
282 rgb->delta_green = dc_fixpt_sub(rgb_plus_1->green, rgb->green);
283 rgb->delta_blue = dc_fixpt_sub(rgb_plus_1->blue, rgb->blue);
285 if (fixpoint == true) {
286 rgb->delta_red_reg = dc_fixpt_clamp_u0d10(rgb->delta_red);
287 rgb->delta_green_reg = dc_fixpt_clamp_u0d10(rgb->delta_green);
288 rgb->delta_blue_reg = dc_fixpt_clamp_u0d10(rgb->delta_blue);
289 rgb->red_reg = dc_fixpt_clamp_u0d14(rgb->red);
290 rgb->green_reg = dc_fixpt_clamp_u0d14(rgb->green);
291 rgb->blue_reg = dc_fixpt_clamp_u0d14(rgb->blue);
299 cm3_helper_convert_to_custom_float(rgb_resulted,
300 lut_params->corner_points,
301 hw_points, fixpoint);
306 #define NUM_DEGAMMA_REGIONS 12
309 bool cm3_helper_translate_curve_to_degamma_hw_format(
310 const struct dc_transfer_func *output_tf,
311 struct pwl_params *lut_params)
313 struct curve_points3 *corner_points;
314 struct pwl_result_data *rgb_resulted;
315 struct pwl_result_data *rgb;
316 struct pwl_result_data *rgb_plus_1;
318 int32_t region_start, region_end;
320 uint32_t j, k, seg_distr[MAX_REGIONS_NUMBER], increment, start_index, hw_points;
322 if (output_tf == NULL || lut_params == NULL || output_tf->type == TF_TYPE_BYPASS)
325 corner_points = lut_params->corner_points;
326 rgb_resulted = lut_params->rgb_resulted;
329 memset(lut_params, 0, sizeof(struct pwl_params));
330 memset(seg_distr, 0, sizeof(seg_distr));
332 region_start = -NUM_DEGAMMA_REGIONS;
336 for (i = region_end - region_start; i < MAX_REGIONS_NUMBER ; i++)
339 * segments are from 2^-12 to 0
341 for (i = 0; i < NUM_DEGAMMA_REGIONS ; i++)
344 for (k = 0; k < MAX_REGIONS_NUMBER; k++) {
345 if (seg_distr[k] != -1)
346 hw_points += (1 << seg_distr[k]);
350 for (k = 0; k < (region_end - region_start); k++) {
351 increment = NUMBER_SW_SEGMENTS / (1 << seg_distr[k]);
352 start_index = (region_start + k + MAX_LOW_POINT) *
354 for (i = start_index; i < start_index + NUMBER_SW_SEGMENTS;
356 if (j == hw_points - 1)
358 rgb_resulted[j].red = output_tf->tf_pts.red[i];
359 rgb_resulted[j].green = output_tf->tf_pts.green[i];
360 rgb_resulted[j].blue = output_tf->tf_pts.blue[i];
366 start_index = (region_end + MAX_LOW_POINT) * NUMBER_SW_SEGMENTS;
367 rgb_resulted[hw_points - 1].red = output_tf->tf_pts.red[start_index];
368 rgb_resulted[hw_points - 1].green = output_tf->tf_pts.green[start_index];
369 rgb_resulted[hw_points - 1].blue = output_tf->tf_pts.blue[start_index];
371 corner_points[0].red.x = dc_fixpt_pow(dc_fixpt_from_int(2),
372 dc_fixpt_from_int(region_start));
373 corner_points[0].green.x = corner_points[0].red.x;
374 corner_points[0].blue.x = corner_points[0].red.x;
375 corner_points[1].red.x = dc_fixpt_pow(dc_fixpt_from_int(2),
376 dc_fixpt_from_int(region_end));
377 corner_points[1].green.x = corner_points[1].red.x;
378 corner_points[1].blue.x = corner_points[1].red.x;
380 corner_points[0].red.y = rgb_resulted[0].red;
381 corner_points[0].green.y = rgb_resulted[0].green;
382 corner_points[0].blue.y = rgb_resulted[0].blue;
384 /* see comment above, m_arrPoints[1].y should be the Y value for the
385 * region end (m_numOfHwPoints), not last HW point(m_numOfHwPoints - 1)
387 corner_points[1].red.y = rgb_resulted[hw_points - 1].red;
388 corner_points[1].green.y = rgb_resulted[hw_points - 1].green;
389 corner_points[1].blue.y = rgb_resulted[hw_points - 1].blue;
390 corner_points[1].red.slope = dc_fixpt_zero;
391 corner_points[1].green.slope = dc_fixpt_zero;
392 corner_points[1].blue.slope = dc_fixpt_zero;
394 if (output_tf->tf == TRANSFER_FUNCTION_PQ) {
395 /* for PQ, we want to have a straight line from last HW X point,
396 * and the slope to be such that we hit 1.0 at 10000 nits.
398 const struct fixed31_32 end_value =
399 dc_fixpt_from_int(125);
401 corner_points[1].red.slope = dc_fixpt_div(
402 dc_fixpt_sub(dc_fixpt_one, corner_points[1].red.y),
403 dc_fixpt_sub(end_value, corner_points[1].red.x));
404 corner_points[1].green.slope = dc_fixpt_div(
405 dc_fixpt_sub(dc_fixpt_one, corner_points[1].green.y),
406 dc_fixpt_sub(end_value, corner_points[1].green.x));
407 corner_points[1].blue.slope = dc_fixpt_div(
408 dc_fixpt_sub(dc_fixpt_one, corner_points[1].blue.y),
409 dc_fixpt_sub(end_value, corner_points[1].blue.x));
412 lut_params->hw_points_num = hw_points;
415 for (i = 1; i < MAX_REGIONS_NUMBER; i++) {
416 if (seg_distr[k] != -1) {
417 lut_params->arr_curve_points[k].segments_num =
419 lut_params->arr_curve_points[i].offset =
420 lut_params->arr_curve_points[k].offset + (1 << seg_distr[k]);
425 if (seg_distr[k] != -1)
426 lut_params->arr_curve_points[k].segments_num = seg_distr[k];
429 rgb_plus_1 = rgb_resulted + 1;
432 while (i != hw_points + 1) {
433 if (dc_fixpt_lt(rgb_plus_1->red, rgb->red))
434 rgb_plus_1->red = rgb->red;
435 if (dc_fixpt_lt(rgb_plus_1->green, rgb->green))
436 rgb_plus_1->green = rgb->green;
437 if (dc_fixpt_lt(rgb_plus_1->blue, rgb->blue))
438 rgb_plus_1->blue = rgb->blue;
440 rgb->delta_red = dc_fixpt_sub(rgb_plus_1->red, rgb->red);
441 rgb->delta_green = dc_fixpt_sub(rgb_plus_1->green, rgb->green);
442 rgb->delta_blue = dc_fixpt_sub(rgb_plus_1->blue, rgb->blue);
448 cm3_helper_convert_to_custom_float(rgb_resulted,
449 lut_params->corner_points,
455 bool cm3_helper_convert_to_custom_float(
456 struct pwl_result_data *rgb_resulted,
457 struct curve_points3 *corner_points,
458 uint32_t hw_points_num,
461 struct custom_float_format fmt;
463 struct pwl_result_data *rgb = rgb_resulted;
467 fmt.exponenta_bits = 6;
468 fmt.mantissa_bits = 12;
471 /* corner_points[0] - beginning base, slope offset for R,G,B
472 * corner_points[1] - end base, slope offset for R,G,B
474 if (!convert_to_custom_float_format(corner_points[0].red.x, &fmt,
475 &corner_points[0].red.custom_float_x)) {
479 if (!convert_to_custom_float_format(corner_points[0].green.x, &fmt,
480 &corner_points[0].green.custom_float_x)) {
484 if (!convert_to_custom_float_format(corner_points[0].blue.x, &fmt,
485 &corner_points[0].blue.custom_float_x)) {
490 if (!convert_to_custom_float_format(corner_points[0].red.offset, &fmt,
491 &corner_points[0].red.custom_float_offset)) {
495 if (!convert_to_custom_float_format(corner_points[0].green.offset, &fmt,
496 &corner_points[0].green.custom_float_offset)) {
500 if (!convert_to_custom_float_format(corner_points[0].blue.offset, &fmt,
501 &corner_points[0].blue.custom_float_offset)) {
506 if (!convert_to_custom_float_format(corner_points[0].red.slope, &fmt,
507 &corner_points[0].red.custom_float_slope)) {
511 if (!convert_to_custom_float_format(corner_points[0].green.slope, &fmt,
512 &corner_points[0].green.custom_float_slope)) {
516 if (!convert_to_custom_float_format(corner_points[0].blue.slope, &fmt,
517 &corner_points[0].blue.custom_float_slope)) {
522 if (fixpoint == true) {
523 corner_points[1].red.custom_float_y =
524 dc_fixpt_clamp_u0d14(corner_points[1].red.y);
525 corner_points[1].green.custom_float_y =
526 dc_fixpt_clamp_u0d14(corner_points[1].green.y);
527 corner_points[1].blue.custom_float_y =
528 dc_fixpt_clamp_u0d14(corner_points[1].blue.y);
530 if (!convert_to_custom_float_format(corner_points[1].red.y,
531 &fmt, &corner_points[1].red.custom_float_y)) {
535 if (!convert_to_custom_float_format(corner_points[1].green.y,
536 &fmt, &corner_points[1].green.custom_float_y)) {
540 if (!convert_to_custom_float_format(corner_points[1].blue.y,
541 &fmt, &corner_points[1].blue.custom_float_y)) {
547 fmt.mantissa_bits = 10;
550 if (!convert_to_custom_float_format(corner_points[1].red.x, &fmt,
551 &corner_points[1].red.custom_float_x)) {
555 if (!convert_to_custom_float_format(corner_points[1].green.x, &fmt,
556 &corner_points[1].green.custom_float_x)) {
560 if (!convert_to_custom_float_format(corner_points[1].blue.x, &fmt,
561 &corner_points[1].blue.custom_float_x)) {
566 if (!convert_to_custom_float_format(corner_points[1].red.slope, &fmt,
567 &corner_points[1].red.custom_float_slope)) {
571 if (!convert_to_custom_float_format(corner_points[1].green.slope, &fmt,
572 &corner_points[1].green.custom_float_slope)) {
576 if (!convert_to_custom_float_format(corner_points[1].blue.slope, &fmt,
577 &corner_points[1].blue.custom_float_slope)) {
582 if (hw_points_num == 0 || rgb_resulted == NULL || fixpoint == true)
585 fmt.mantissa_bits = 12;
587 while (i != hw_points_num) {
588 if (!convert_to_custom_float_format(rgb->red, &fmt,
594 if (!convert_to_custom_float_format(rgb->green, &fmt,
600 if (!convert_to_custom_float_format(rgb->blue, &fmt,
606 if (!convert_to_custom_float_format(rgb->delta_red, &fmt,
607 &rgb->delta_red_reg)) {
612 if (!convert_to_custom_float_format(rgb->delta_green, &fmt,
613 &rgb->delta_green_reg)) {
618 if (!convert_to_custom_float_format(rgb->delta_blue, &fmt,
619 &rgb->delta_blue_reg)) {
631 bool is_rgb_equal(const struct pwl_result_data *rgb, uint32_t num)
636 for (i = 0 ; i < num; i++) {
637 if (rgb[i].red_reg != rgb[i].green_reg ||
638 rgb[i].blue_reg != rgb[i].red_reg ||
639 rgb[i].blue_reg != rgb[i].green_reg) {