2 * Copyright 2016 Advanced Micro Devices, Inc.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
26 #include "reg_helper.h"
27 #include "dcn10/dcn10_dpp.h"
29 #include "dcn10_cm_common.h"
30 #include "custom_float.h"
38 #define FN(reg_name, field_name) \
39 reg->shifts.field_name, reg->masks.field_name
41 void cm_helper_program_color_matrices(
42 struct dc_context *ctx,
43 const uint16_t *regval,
44 const struct color_matrices_reg *reg)
49 for (cur_csc_reg = reg->csc_c11_c12;
50 cur_csc_reg <= reg->csc_c33_c34;
53 const uint16_t *regval0 = &(regval[2 * i]);
54 const uint16_t *regval1 = &(regval[(2 * i) + 1]);
56 REG_SET_2(cur_csc_reg, 0,
65 void cm_helper_read_color_matrices(struct dc_context *ctx,
67 const struct color_matrices_reg *reg)
69 uint32_t cur_csc_reg, regval0, regval1;
72 for (cur_csc_reg = reg->csc_c11_c12;
73 cur_csc_reg <= reg->csc_c33_c34; cur_csc_reg++) {
74 REG_GET_2(cur_csc_reg,
78 regval[2 * i] = regval0;
79 regval[(2 * i) + 1] = regval1;
85 void cm_helper_program_xfer_func(
86 struct dc_context *ctx,
87 const struct pwl_params *params,
88 const struct xfer_func_reg *reg)
90 uint32_t reg_region_cur;
93 REG_SET_2(reg->start_cntl_b, 0,
94 exp_region_start, params->corner_points[0].blue.custom_float_x,
95 exp_resion_start_segment, 0);
96 REG_SET_2(reg->start_cntl_g, 0,
97 exp_region_start, params->corner_points[0].green.custom_float_x,
98 exp_resion_start_segment, 0);
99 REG_SET_2(reg->start_cntl_r, 0,
100 exp_region_start, params->corner_points[0].red.custom_float_x,
101 exp_resion_start_segment, 0);
103 REG_SET(reg->start_slope_cntl_b, 0,
104 field_region_linear_slope, params->corner_points[0].blue.custom_float_slope);
105 REG_SET(reg->start_slope_cntl_g, 0,
106 field_region_linear_slope, params->corner_points[0].green.custom_float_slope);
107 REG_SET(reg->start_slope_cntl_r, 0,
108 field_region_linear_slope, params->corner_points[0].red.custom_float_slope);
110 REG_SET(reg->start_end_cntl1_b, 0,
111 field_region_end, params->corner_points[1].blue.custom_float_x);
112 REG_SET_2(reg->start_end_cntl2_b, 0,
113 field_region_end_slope, params->corner_points[1].blue.custom_float_slope,
114 field_region_end_base, params->corner_points[1].blue.custom_float_y);
116 REG_SET(reg->start_end_cntl1_g, 0,
117 field_region_end, params->corner_points[1].green.custom_float_x);
118 REG_SET_2(reg->start_end_cntl2_g, 0,
119 field_region_end_slope, params->corner_points[1].green.custom_float_slope,
120 field_region_end_base, params->corner_points[1].green.custom_float_y);
122 REG_SET(reg->start_end_cntl1_r, 0,
123 field_region_end, params->corner_points[1].red.custom_float_x);
124 REG_SET_2(reg->start_end_cntl2_r, 0,
125 field_region_end_slope, params->corner_points[1].red.custom_float_slope,
126 field_region_end_base, params->corner_points[1].red.custom_float_y);
128 for (reg_region_cur = reg->region_start;
129 reg_region_cur <= reg->region_end;
132 const struct gamma_curve *curve0 = &(params->arr_curve_points[2 * i]);
133 const struct gamma_curve *curve1 = &(params->arr_curve_points[(2 * i) + 1]);
135 REG_SET_4(reg_region_cur, 0,
136 exp_region0_lut_offset, curve0->offset,
137 exp_region0_num_segments, curve0->segments_num,
138 exp_region1_lut_offset, curve1->offset,
139 exp_region1_num_segments, curve1->segments_num);
148 bool cm_helper_convert_to_custom_float(
149 struct pwl_result_data *rgb_resulted,
150 struct curve_points3 *corner_points,
151 uint32_t hw_points_num,
154 struct custom_float_format fmt;
156 struct pwl_result_data *rgb = rgb_resulted;
160 fmt.exponenta_bits = 6;
161 fmt.mantissa_bits = 12;
164 /* corner_points[0] - beginning base, slope offset for R,G,B
165 * corner_points[1] - end base, slope offset for R,G,B
167 if (!convert_to_custom_float_format(corner_points[0].red.x, &fmt,
168 &corner_points[0].red.custom_float_x)) {
172 if (!convert_to_custom_float_format(corner_points[0].green.x, &fmt,
173 &corner_points[0].green.custom_float_x)) {
177 if (!convert_to_custom_float_format(corner_points[0].blue.x, &fmt,
178 &corner_points[0].blue.custom_float_x)) {
183 if (!convert_to_custom_float_format(corner_points[0].red.offset, &fmt,
184 &corner_points[0].red.custom_float_offset)) {
188 if (!convert_to_custom_float_format(corner_points[0].green.offset, &fmt,
189 &corner_points[0].green.custom_float_offset)) {
193 if (!convert_to_custom_float_format(corner_points[0].blue.offset, &fmt,
194 &corner_points[0].blue.custom_float_offset)) {
199 if (!convert_to_custom_float_format(corner_points[0].red.slope, &fmt,
200 &corner_points[0].red.custom_float_slope)) {
204 if (!convert_to_custom_float_format(corner_points[0].green.slope, &fmt,
205 &corner_points[0].green.custom_float_slope)) {
209 if (!convert_to_custom_float_format(corner_points[0].blue.slope, &fmt,
210 &corner_points[0].blue.custom_float_slope)) {
215 fmt.mantissa_bits = 10;
218 if (!convert_to_custom_float_format(corner_points[1].red.x, &fmt,
219 &corner_points[1].red.custom_float_x)) {
223 if (!convert_to_custom_float_format(corner_points[1].green.x, &fmt,
224 &corner_points[1].green.custom_float_x)) {
228 if (!convert_to_custom_float_format(corner_points[1].blue.x, &fmt,
229 &corner_points[1].blue.custom_float_x)) {
234 if (fixpoint == true) {
235 corner_points[1].red.custom_float_y =
236 dc_fixpt_clamp_u0d14(corner_points[1].red.y);
237 corner_points[1].green.custom_float_y =
238 dc_fixpt_clamp_u0d14(corner_points[1].green.y);
239 corner_points[1].blue.custom_float_y =
240 dc_fixpt_clamp_u0d14(corner_points[1].blue.y);
242 if (!convert_to_custom_float_format(corner_points[1].red.y,
243 &fmt, &corner_points[1].red.custom_float_y)) {
247 if (!convert_to_custom_float_format(corner_points[1].green.y,
248 &fmt, &corner_points[1].green.custom_float_y)) {
252 if (!convert_to_custom_float_format(corner_points[1].blue.y,
253 &fmt, &corner_points[1].blue.custom_float_y)) {
259 if (!convert_to_custom_float_format(corner_points[1].red.slope, &fmt,
260 &corner_points[1].red.custom_float_slope)) {
264 if (!convert_to_custom_float_format(corner_points[1].green.slope, &fmt,
265 &corner_points[1].green.custom_float_slope)) {
269 if (!convert_to_custom_float_format(corner_points[1].blue.slope, &fmt,
270 &corner_points[1].blue.custom_float_slope)) {
275 if (hw_points_num == 0 || rgb_resulted == NULL || fixpoint == true)
278 fmt.mantissa_bits = 12;
281 while (i != hw_points_num) {
282 if (!convert_to_custom_float_format(rgb->red, &fmt,
288 if (!convert_to_custom_float_format(rgb->green, &fmt,
294 if (!convert_to_custom_float_format(rgb->blue, &fmt,
300 if (!convert_to_custom_float_format(rgb->delta_red, &fmt,
301 &rgb->delta_red_reg)) {
306 if (!convert_to_custom_float_format(rgb->delta_green, &fmt,
307 &rgb->delta_green_reg)) {
312 if (!convert_to_custom_float_format(rgb->delta_blue, &fmt,
313 &rgb->delta_blue_reg)) {
325 /* driver uses 32 regions or less, but DCN HW has 34, extra 2 are set to 0 */
326 #define MAX_REGIONS_NUMBER 34
327 #define MAX_LOW_POINT 25
328 #define NUMBER_REGIONS 32
329 #define NUMBER_SW_SEGMENTS 16
334 bool cm_helper_translate_curve_to_hw_format(struct dc_context *ctx,
335 const struct dc_transfer_func *output_tf,
336 struct pwl_params *lut_params, bool fixpoint)
338 struct curve_points3 *corner_points;
339 struct pwl_result_data *rgb_resulted;
340 struct pwl_result_data *rgb;
341 struct pwl_result_data *rgb_plus_1;
342 struct pwl_result_data *rgb_minus_1;
344 int32_t region_start, region_end;
346 uint32_t j, k, seg_distr[MAX_REGIONS_NUMBER], increment, start_index, hw_points;
348 if (output_tf == NULL || lut_params == NULL || output_tf->type == TF_TYPE_BYPASS)
351 corner_points = lut_params->corner_points;
352 rgb_resulted = lut_params->rgb_resulted;
355 memset(lut_params, 0, sizeof(struct pwl_params));
356 memset(seg_distr, 0, sizeof(seg_distr));
358 if (output_tf->tf == TRANSFER_FUNCTION_PQ || output_tf->tf == TRANSFER_FUNCTION_GAMMA22) {
360 * segments are from 2^-25 to 2^7
362 for (i = 0; i < NUMBER_REGIONS ; i++)
365 region_start = -MAX_LOW_POINT;
366 region_end = NUMBER_REGIONS - MAX_LOW_POINT;
369 * segment is from 2^-12 to 2^0
370 * There are less than 256 points, for optimization
372 const uint8_t SEG_COUNT = 12;
374 for (i = 0; i < SEG_COUNT; i++)
377 seg_distr[SEG_COUNT] = 1;
379 region_start = -SEG_COUNT;
383 for (i = region_end - region_start; i < MAX_REGIONS_NUMBER ; i++)
386 for (k = 0; k < MAX_REGIONS_NUMBER; k++) {
387 if (seg_distr[k] != -1)
388 hw_points += (1 << seg_distr[k]);
392 for (k = 0; k < (region_end - region_start); k++) {
393 increment = NUMBER_SW_SEGMENTS / (1 << seg_distr[k]);
394 start_index = (region_start + k + MAX_LOW_POINT) *
396 for (i = start_index; i < start_index + NUMBER_SW_SEGMENTS;
398 if (j == hw_points - 1)
400 if (i >= TRANSFER_FUNC_POINTS) {
401 DC_LOG_ERROR("Index out of bounds: i=%d, TRANSFER_FUNC_POINTS=%d\n",
402 i, TRANSFER_FUNC_POINTS);
405 rgb_resulted[j].red = output_tf->tf_pts.red[i];
406 rgb_resulted[j].green = output_tf->tf_pts.green[i];
407 rgb_resulted[j].blue = output_tf->tf_pts.blue[i];
413 start_index = (region_end + MAX_LOW_POINT) * NUMBER_SW_SEGMENTS;
414 rgb_resulted[hw_points - 1].red = output_tf->tf_pts.red[start_index];
415 rgb_resulted[hw_points - 1].green = output_tf->tf_pts.green[start_index];
416 rgb_resulted[hw_points - 1].blue = output_tf->tf_pts.blue[start_index];
418 rgb_resulted[hw_points].red = rgb_resulted[hw_points - 1].red;
419 rgb_resulted[hw_points].green = rgb_resulted[hw_points - 1].green;
420 rgb_resulted[hw_points].blue = rgb_resulted[hw_points - 1].blue;
422 // All 3 color channels have same x
423 corner_points[0].red.x = dc_fixpt_pow(dc_fixpt_from_int(2),
424 dc_fixpt_from_int(region_start));
425 corner_points[0].green.x = corner_points[0].red.x;
426 corner_points[0].blue.x = corner_points[0].red.x;
428 corner_points[1].red.x = dc_fixpt_pow(dc_fixpt_from_int(2),
429 dc_fixpt_from_int(region_end));
430 corner_points[1].green.x = corner_points[1].red.x;
431 corner_points[1].blue.x = corner_points[1].red.x;
433 corner_points[0].red.y = rgb_resulted[0].red;
434 corner_points[0].green.y = rgb_resulted[0].green;
435 corner_points[0].blue.y = rgb_resulted[0].blue;
437 corner_points[0].red.slope = dc_fixpt_div(corner_points[0].red.y,
438 corner_points[0].red.x);
439 corner_points[0].green.slope = dc_fixpt_div(corner_points[0].green.y,
440 corner_points[0].green.x);
441 corner_points[0].blue.slope = dc_fixpt_div(corner_points[0].blue.y,
442 corner_points[0].blue.x);
444 /* see comment above, m_arrPoints[1].y should be the Y value for the
445 * region end (m_numOfHwPoints), not last HW point(m_numOfHwPoints - 1)
447 corner_points[1].red.y = rgb_resulted[hw_points - 1].red;
448 corner_points[1].green.y = rgb_resulted[hw_points - 1].green;
449 corner_points[1].blue.y = rgb_resulted[hw_points - 1].blue;
450 corner_points[1].red.slope = dc_fixpt_zero;
451 corner_points[1].green.slope = dc_fixpt_zero;
452 corner_points[1].blue.slope = dc_fixpt_zero;
454 if (output_tf->tf == TRANSFER_FUNCTION_PQ) {
455 /* for PQ, we want to have a straight line from last HW X point,
456 * and the slope to be such that we hit 1.0 at 10000 nits.
458 const struct fixed31_32 end_value =
459 dc_fixpt_from_int(125);
461 corner_points[1].red.slope = dc_fixpt_div(
462 dc_fixpt_sub(dc_fixpt_one, corner_points[1].red.y),
463 dc_fixpt_sub(end_value, corner_points[1].red.x));
464 corner_points[1].green.slope = dc_fixpt_div(
465 dc_fixpt_sub(dc_fixpt_one, corner_points[1].green.y),
466 dc_fixpt_sub(end_value, corner_points[1].green.x));
467 corner_points[1].blue.slope = dc_fixpt_div(
468 dc_fixpt_sub(dc_fixpt_one, corner_points[1].blue.y),
469 dc_fixpt_sub(end_value, corner_points[1].blue.x));
472 lut_params->hw_points_num = hw_points;
475 for (i = 1; i < MAX_REGIONS_NUMBER; i++) {
476 if (seg_distr[k] != -1) {
477 lut_params->arr_curve_points[k].segments_num =
479 lut_params->arr_curve_points[i].offset =
480 lut_params->arr_curve_points[k].offset + (1 << seg_distr[k]);
485 if (seg_distr[k] != -1)
486 lut_params->arr_curve_points[k].segments_num = seg_distr[k];
489 rgb_plus_1 = rgb_resulted + 1;
493 while (i != hw_points + 1) {
495 if (i >= hw_points - 1) {
496 if (dc_fixpt_lt(rgb_plus_1->red, rgb->red))
497 rgb_plus_1->red = dc_fixpt_add(rgb->red, rgb_minus_1->delta_red);
498 if (dc_fixpt_lt(rgb_plus_1->green, rgb->green))
499 rgb_plus_1->green = dc_fixpt_add(rgb->green, rgb_minus_1->delta_green);
500 if (dc_fixpt_lt(rgb_plus_1->blue, rgb->blue))
501 rgb_plus_1->blue = dc_fixpt_add(rgb->blue, rgb_minus_1->delta_blue);
504 rgb->delta_red = dc_fixpt_sub(rgb_plus_1->red, rgb->red);
505 rgb->delta_green = dc_fixpt_sub(rgb_plus_1->green, rgb->green);
506 rgb->delta_blue = dc_fixpt_sub(rgb_plus_1->blue, rgb->blue);
509 if (fixpoint == true) {
510 uint32_t red_clamp = dc_fixpt_clamp_u0d14(rgb->delta_red);
511 uint32_t green_clamp = dc_fixpt_clamp_u0d14(rgb->delta_green);
512 uint32_t blue_clamp = dc_fixpt_clamp_u0d14(rgb->delta_blue);
514 if (red_clamp >> 10 || green_clamp >> 10 || blue_clamp >> 10)
515 DC_LOG_WARNING("Losing delta precision while programming shaper LUT.");
517 rgb->delta_red_reg = red_clamp & 0x3ff;
518 rgb->delta_green_reg = green_clamp & 0x3ff;
519 rgb->delta_blue_reg = blue_clamp & 0x3ff;
520 rgb->red_reg = dc_fixpt_clamp_u0d14(rgb->red);
521 rgb->green_reg = dc_fixpt_clamp_u0d14(rgb->green);
522 rgb->blue_reg = dc_fixpt_clamp_u0d14(rgb->blue);
530 cm_helper_convert_to_custom_float(rgb_resulted,
531 lut_params->corner_points,
532 hw_points, fixpoint);
537 #define NUM_DEGAMMA_REGIONS 12
540 bool cm_helper_translate_curve_to_degamma_hw_format(
541 const struct dc_transfer_func *output_tf,
542 struct pwl_params *lut_params)
544 struct curve_points3 *corner_points;
545 struct pwl_result_data *rgb_resulted;
546 struct pwl_result_data *rgb;
547 struct pwl_result_data *rgb_plus_1;
549 int32_t region_start, region_end;
551 uint32_t j, k, seg_distr[MAX_REGIONS_NUMBER], increment, start_index, hw_points;
553 if (output_tf == NULL || lut_params == NULL || output_tf->type == TF_TYPE_BYPASS)
556 corner_points = lut_params->corner_points;
557 rgb_resulted = lut_params->rgb_resulted;
560 memset(lut_params, 0, sizeof(struct pwl_params));
561 memset(seg_distr, 0, sizeof(seg_distr));
563 region_start = -NUM_DEGAMMA_REGIONS;
567 for (i = region_end - region_start; i < MAX_REGIONS_NUMBER ; i++)
570 * segments are from 2^-12 to 0
572 for (i = 0; i < NUM_DEGAMMA_REGIONS ; i++)
575 for (k = 0; k < MAX_REGIONS_NUMBER; k++) {
576 if (seg_distr[k] != -1)
577 hw_points += (1 << seg_distr[k]);
581 for (k = 0; k < (region_end - region_start); k++) {
582 increment = NUMBER_SW_SEGMENTS / (1 << seg_distr[k]);
583 start_index = (region_start + k + MAX_LOW_POINT) *
585 for (i = start_index; i < start_index + NUMBER_SW_SEGMENTS;
587 if (j == hw_points - 1)
589 if (i >= TRANSFER_FUNC_POINTS)
591 rgb_resulted[j].red = output_tf->tf_pts.red[i];
592 rgb_resulted[j].green = output_tf->tf_pts.green[i];
593 rgb_resulted[j].blue = output_tf->tf_pts.blue[i];
599 start_index = (region_end + MAX_LOW_POINT) * NUMBER_SW_SEGMENTS;
600 rgb_resulted[hw_points - 1].red = output_tf->tf_pts.red[start_index];
601 rgb_resulted[hw_points - 1].green = output_tf->tf_pts.green[start_index];
602 rgb_resulted[hw_points - 1].blue = output_tf->tf_pts.blue[start_index];
604 rgb_resulted[hw_points].red = rgb_resulted[hw_points - 1].red;
605 rgb_resulted[hw_points].green = rgb_resulted[hw_points - 1].green;
606 rgb_resulted[hw_points].blue = rgb_resulted[hw_points - 1].blue;
608 corner_points[0].red.x = dc_fixpt_pow(dc_fixpt_from_int(2),
609 dc_fixpt_from_int(region_start));
610 corner_points[0].green.x = corner_points[0].red.x;
611 corner_points[0].blue.x = corner_points[0].red.x;
612 corner_points[1].red.x = dc_fixpt_pow(dc_fixpt_from_int(2),
613 dc_fixpt_from_int(region_end));
614 corner_points[1].green.x = corner_points[1].red.x;
615 corner_points[1].blue.x = corner_points[1].red.x;
617 corner_points[0].red.y = rgb_resulted[0].red;
618 corner_points[0].green.y = rgb_resulted[0].green;
619 corner_points[0].blue.y = rgb_resulted[0].blue;
621 /* see comment above, m_arrPoints[1].y should be the Y value for the
622 * region end (m_numOfHwPoints), not last HW point(m_numOfHwPoints - 1)
624 corner_points[1].red.y = rgb_resulted[hw_points - 1].red;
625 corner_points[1].green.y = rgb_resulted[hw_points - 1].green;
626 corner_points[1].blue.y = rgb_resulted[hw_points - 1].blue;
627 corner_points[1].red.slope = dc_fixpt_zero;
628 corner_points[1].green.slope = dc_fixpt_zero;
629 corner_points[1].blue.slope = dc_fixpt_zero;
631 if (output_tf->tf == TRANSFER_FUNCTION_PQ) {
632 /* for PQ, we want to have a straight line from last HW X point,
633 * and the slope to be such that we hit 1.0 at 10000 nits.
635 const struct fixed31_32 end_value =
636 dc_fixpt_from_int(125);
638 corner_points[1].red.slope = dc_fixpt_div(
639 dc_fixpt_sub(dc_fixpt_one, corner_points[1].red.y),
640 dc_fixpt_sub(end_value, corner_points[1].red.x));
641 corner_points[1].green.slope = dc_fixpt_div(
642 dc_fixpt_sub(dc_fixpt_one, corner_points[1].green.y),
643 dc_fixpt_sub(end_value, corner_points[1].green.x));
644 corner_points[1].blue.slope = dc_fixpt_div(
645 dc_fixpt_sub(dc_fixpt_one, corner_points[1].blue.y),
646 dc_fixpt_sub(end_value, corner_points[1].blue.x));
649 lut_params->hw_points_num = hw_points;
652 for (i = 1; i < MAX_REGIONS_NUMBER; i++) {
653 if (seg_distr[k] != -1) {
654 lut_params->arr_curve_points[k].segments_num =
656 lut_params->arr_curve_points[i].offset =
657 lut_params->arr_curve_points[k].offset + (1 << seg_distr[k]);
662 if (seg_distr[k] != -1)
663 lut_params->arr_curve_points[k].segments_num = seg_distr[k];
666 rgb_plus_1 = rgb_resulted + 1;
669 while (i != hw_points + 1) {
670 rgb->delta_red = dc_fixpt_sub(rgb_plus_1->red, rgb->red);
671 rgb->delta_green = dc_fixpt_sub(rgb_plus_1->green, rgb->green);
672 rgb->delta_blue = dc_fixpt_sub(rgb_plus_1->blue, rgb->blue);
678 cm_helper_convert_to_custom_float(rgb_resulted,
679 lut_params->corner_points,