1 /*
2 * Copyright 2018 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 *
22 * Authors: AMD
23 *
24 */
25 #include "amdgpu.h"
26 #include "amdgpu_mode.h"
27 #include "amdgpu_dm.h"
28 #include "dc.h"
29 #include "modules/color/color_gamma.h"
30 #include "basics/conversion.h"
31
32 /*
33 * The DC interface to HW gives us the following color management blocks
34 * per pipe (surface):
35 *
36 * - Input gamma LUT (de-normalized)
37 * - Input CSC (normalized)
38 * - Surface degamma LUT (normalized)
39 * - Surface CSC (normalized)
40 * - Surface regamma LUT (normalized)
41 * - Output CSC (normalized)
42 *
43 * But these aren't a direct mapping to DRM color properties. The current DRM
44 * interface exposes CRTC degamma, CRTC CTM and CRTC regamma while our hardware
45 * is essentially giving:
46 *
47 * Plane CTM -> Plane degamma -> Plane CTM -> Plane regamma -> Plane CTM
48 *
49 * The input gamma LUT block isn't really applicable here since it operates
50 * on the actual input data itself rather than the HW fp representation. The
51 * input and output CSC blocks are technically available to use as part of
52 * the DC interface but are typically used internally by DC for conversions
53 * between color spaces. These could be blended together with user
54 * adjustments in the future but for now these should remain untouched.
55 *
56 * The pipe blending also happens after these blocks so we don't actually
57 * support any CRTC props with correct blending with multiple planes - but we
58 * can still support CRTC color management properties in DM in most single
59 * plane cases correctly with clever management of the DC interface in DM.
60 *
61 * As per DRM documentation, blocks should be in hardware bypass when their
62 * respective property is set to NULL. A linear DGM/RGM LUT should also
63 * considered as putting the respective block into bypass mode.
64 *
65 * This means that the following
66 * configuration is assumed to be the default:
67 *
68 * Plane DGM Bypass -> Plane CTM Bypass -> Plane RGM Bypass -> ...
69 * CRTC DGM Bypass -> CRTC CTM Bypass -> CRTC RGM Bypass
70 */
71
72 #define MAX_DRM_LUT_VALUE 0xFFFF
73
74 /*
75 * Initialize the color module.
76 *
77 * We're not using the full color module, only certain components.
78 * Only call setup functions for components that we need.
79 */
amdgpu_dm_init_color_mod(void)80 void amdgpu_dm_init_color_mod(void)
81 {
82 setup_x_points_distribution();
83 }
84
85 /* Extracts the DRM lut and lut size from a blob. */
86 static const struct drm_color_lut *
__extract_blob_lut(const struct drm_property_blob * blob,uint32_t * size)87 __extract_blob_lut(const struct drm_property_blob *blob, uint32_t *size)
88 {
89 *size = blob ? drm_color_lut_size(blob) : 0;
90 return blob ? (struct drm_color_lut *)blob->data : NULL;
91 }
92
93 /*
94 * Return true if the given lut is a linear mapping of values, i.e. it acts
95 * like a bypass LUT.
96 *
97 * It is considered linear if the lut represents:
98 * f(a) = (0xFF00/MAX_COLOR_LUT_ENTRIES-1)a; for integer a in
99 * [0, MAX_COLOR_LUT_ENTRIES)
100 */
__is_lut_linear(const struct drm_color_lut * lut,uint32_t size)101 static bool __is_lut_linear(const struct drm_color_lut *lut, uint32_t size)
102 {
103 int i;
104 uint32_t expected;
105 int delta;
106
107 for (i = 0; i < size; i++) {
108 /* All color values should equal */
109 if ((lut[i].red != lut[i].green) || (lut[i].green != lut[i].blue))
110 return false;
111
112 expected = i * MAX_DRM_LUT_VALUE / (size-1);
113
114 /* Allow a +/-1 error. */
115 delta = lut[i].red - expected;
116 if (delta < -1 || 1 < delta)
117 return false;
118 }
119 return true;
120 }
121
122 /*
123 * Convert the drm_color_lut to dc_gamma. The conversion depends on the size
124 * of the lut - whether or not it's legacy.
125 */
__drm_lut_to_dc_gamma(const struct drm_color_lut * lut,struct dc_gamma * gamma,bool is_legacy)126 static void __drm_lut_to_dc_gamma(const struct drm_color_lut *lut,
127 struct dc_gamma *gamma, bool is_legacy)
128 {
129 uint32_t r, g, b;
130 int i;
131
132 if (is_legacy) {
133 for (i = 0; i < MAX_COLOR_LEGACY_LUT_ENTRIES; i++) {
134 r = drm_color_lut_extract(lut[i].red, 16);
135 g = drm_color_lut_extract(lut[i].green, 16);
136 b = drm_color_lut_extract(lut[i].blue, 16);
137
138 gamma->entries.red[i] = dc_fixpt_from_int(r);
139 gamma->entries.green[i] = dc_fixpt_from_int(g);
140 gamma->entries.blue[i] = dc_fixpt_from_int(b);
141 }
142 return;
143 }
144
145 /* else */
146 for (i = 0; i < MAX_COLOR_LUT_ENTRIES; i++) {
147 r = drm_color_lut_extract(lut[i].red, 16);
148 g = drm_color_lut_extract(lut[i].green, 16);
149 b = drm_color_lut_extract(lut[i].blue, 16);
150
151 gamma->entries.red[i] = dc_fixpt_from_fraction(r, MAX_DRM_LUT_VALUE);
152 gamma->entries.green[i] = dc_fixpt_from_fraction(g, MAX_DRM_LUT_VALUE);
153 gamma->entries.blue[i] = dc_fixpt_from_fraction(b, MAX_DRM_LUT_VALUE);
154 }
155 }
156
157 /*
158 * Converts a DRM CTM to a DC CSC float matrix.
159 * The matrix needs to be a 3x4 (12 entry) matrix.
160 */
__drm_ctm_to_dc_matrix(const struct drm_color_ctm * ctm,struct fixed31_32 * matrix)161 static void __drm_ctm_to_dc_matrix(const struct drm_color_ctm *ctm,
162 struct fixed31_32 *matrix)
163 {
164 int64_t val;
165 int i;
166
167 /*
168 * DRM gives a 3x3 matrix, but DC wants 3x4. Assuming we're operating
169 * with homogeneous coordinates, augment the matrix with 0's.
170 *
171 * The format provided is S31.32, using signed-magnitude representation.
172 * Our fixed31_32 is also S31.32, but is using 2's complement. We have
173 * to convert from signed-magnitude to 2's complement.
174 */
175 for (i = 0; i < 12; i++) {
176 /* Skip 4th element */
177 if (i % 4 == 3) {
178 matrix[i] = dc_fixpt_zero;
179 continue;
180 }
181
182 /* gamut_remap_matrix[i] = ctm[i - floor(i/4)] */
183 val = ctm->matrix[i - (i / 4)];
184 /* If negative, convert to 2's complement. */
185 if (val & (1ULL << 63))
186 val = -(val & ~(1ULL << 63));
187
188 matrix[i].value = val;
189 }
190 }
191
192 /* Calculates the legacy transfer function - only for sRGB input space. */
__set_legacy_tf(struct dc_transfer_func * func,const struct drm_color_lut * lut,uint32_t lut_size,bool has_rom)193 static int __set_legacy_tf(struct dc_transfer_func *func,
194 const struct drm_color_lut *lut, uint32_t lut_size,
195 bool has_rom)
196 {
197 struct dc_gamma *gamma = NULL;
198 struct calculate_buffer cal_buffer = {0};
199 bool res;
200
201 ASSERT(lut && lut_size == MAX_COLOR_LEGACY_LUT_ENTRIES);
202
203 cal_buffer.buffer_index = -1;
204
205 gamma = dc_create_gamma();
206 if (!gamma)
207 return -ENOMEM;
208
209 gamma->type = GAMMA_RGB_256;
210 gamma->num_entries = lut_size;
211 __drm_lut_to_dc_gamma(lut, gamma, true);
212
213 res = mod_color_calculate_regamma_params(func, gamma, true, has_rom,
214 NULL, &cal_buffer);
215
216 dc_gamma_release(&gamma);
217
218 return res ? 0 : -ENOMEM;
219 }
220
221 /* Calculates the output transfer function based on expected input space. */
__set_output_tf(struct dc_transfer_func * func,const struct drm_color_lut * lut,uint32_t lut_size,bool has_rom)222 static int __set_output_tf(struct dc_transfer_func *func,
223 const struct drm_color_lut *lut, uint32_t lut_size,
224 bool has_rom)
225 {
226 struct dc_gamma *gamma = NULL;
227 struct calculate_buffer cal_buffer = {0};
228 bool res;
229
230 ASSERT(lut && lut_size == MAX_COLOR_LUT_ENTRIES);
231
232 cal_buffer.buffer_index = -1;
233
234 gamma = dc_create_gamma();
235 if (!gamma)
236 return -ENOMEM;
237
238 gamma->num_entries = lut_size;
239 __drm_lut_to_dc_gamma(lut, gamma, false);
240
241 if (func->tf == TRANSFER_FUNCTION_LINEAR) {
242 /*
243 * Color module doesn't like calculating regamma params
244 * on top of a linear input. But degamma params can be used
245 * instead to simulate this.
246 */
247 gamma->type = GAMMA_CUSTOM;
248 res = mod_color_calculate_degamma_params(NULL, func,
249 gamma, true);
250 } else {
251 /*
252 * Assume sRGB. The actual mapping will depend on whether the
253 * input was legacy or not.
254 */
255 gamma->type = GAMMA_CS_TFM_1D;
256 res = mod_color_calculate_regamma_params(func, gamma, false,
257 has_rom, NULL, &cal_buffer);
258 }
259
260 dc_gamma_release(&gamma);
261
262 return res ? 0 : -ENOMEM;
263 }
264
265 /* Caculates the input transfer function based on expected input space. */
__set_input_tf(struct dc_transfer_func * func,const struct drm_color_lut * lut,uint32_t lut_size)266 static int __set_input_tf(struct dc_transfer_func *func,
267 const struct drm_color_lut *lut, uint32_t lut_size)
268 {
269 struct dc_gamma *gamma = NULL;
270 bool res;
271
272 gamma = dc_create_gamma();
273 if (!gamma)
274 return -ENOMEM;
275
276 gamma->type = GAMMA_CUSTOM;
277 gamma->num_entries = lut_size;
278
279 __drm_lut_to_dc_gamma(lut, gamma, false);
280
281 res = mod_color_calculate_degamma_params(NULL, func, gamma, true);
282 dc_gamma_release(&gamma);
283
284 return res ? 0 : -ENOMEM;
285 }
286
287 /**
288 * Verifies that the Degamma and Gamma LUTs attached to the |crtc_state| are of
289 * the expected size.
290 * Returns 0 on success.
291 */
amdgpu_dm_verify_lut_sizes(const struct drm_crtc_state * crtc_state)292 int amdgpu_dm_verify_lut_sizes(const struct drm_crtc_state *crtc_state)
293 {
294 const struct drm_color_lut *lut = NULL;
295 uint32_t size = 0;
296
297 lut = __extract_blob_lut(crtc_state->degamma_lut, &size);
298 if (lut && size != MAX_COLOR_LUT_ENTRIES) {
299 DRM_DEBUG_DRIVER(
300 "Invalid Degamma LUT size. Should be %u but got %u.\n",
301 MAX_COLOR_LUT_ENTRIES, size);
302 return -EINVAL;
303 }
304
305 lut = __extract_blob_lut(crtc_state->gamma_lut, &size);
306 if (lut && size != MAX_COLOR_LUT_ENTRIES &&
307 size != MAX_COLOR_LEGACY_LUT_ENTRIES) {
308 DRM_DEBUG_DRIVER(
309 "Invalid Gamma LUT size. Should be %u (or %u for legacy) but got %u.\n",
310 MAX_COLOR_LUT_ENTRIES, MAX_COLOR_LEGACY_LUT_ENTRIES,
311 size);
312 return -EINVAL;
313 }
314
315 return 0;
316 }
317
318 /**
319 * amdgpu_dm_update_crtc_color_mgmt: Maps DRM color management to DC stream.
320 * @crtc: amdgpu_dm crtc state
321 *
322 * With no plane level color management properties we're free to use any
323 * of the HW blocks as long as the CRTC CTM always comes before the
324 * CRTC RGM and after the CRTC DGM.
325 *
326 * The CRTC RGM block will be placed in the RGM LUT block if it is non-linear.
327 * The CRTC DGM block will be placed in the DGM LUT block if it is non-linear.
328 * The CRTC CTM will be placed in the gamut remap block if it is non-linear.
329 *
330 * The RGM block is typically more fully featured and accurate across
331 * all ASICs - DCE can't support a custom non-linear CRTC DGM.
332 *
333 * For supporting both plane level color management and CRTC level color
334 * management at once we have to either restrict the usage of CRTC properties
335 * or blend adjustments together.
336 *
337 * Returns 0 on success.
338 */
amdgpu_dm_update_crtc_color_mgmt(struct dm_crtc_state * crtc)339 int amdgpu_dm_update_crtc_color_mgmt(struct dm_crtc_state *crtc)
340 {
341 struct dc_stream_state *stream = crtc->stream;
342 struct amdgpu_device *adev = drm_to_adev(crtc->base.state->dev);
343 bool has_rom = adev->asic_type <= CHIP_RAVEN;
344 struct drm_color_ctm *ctm = NULL;
345 const struct drm_color_lut *degamma_lut, *regamma_lut;
346 uint32_t degamma_size, regamma_size;
347 bool has_regamma, has_degamma;
348 bool is_legacy;
349 int r;
350
351 r = amdgpu_dm_verify_lut_sizes(&crtc->base);
352 if (r)
353 return r;
354
355 degamma_lut = __extract_blob_lut(crtc->base.degamma_lut, °amma_size);
356 regamma_lut = __extract_blob_lut(crtc->base.gamma_lut, ®amma_size);
357
358 has_degamma =
359 degamma_lut && !__is_lut_linear(degamma_lut, degamma_size);
360
361 has_regamma =
362 regamma_lut && !__is_lut_linear(regamma_lut, regamma_size);
363
364 is_legacy = regamma_size == MAX_COLOR_LEGACY_LUT_ENTRIES;
365
366 /* Reset all adjustments. */
367 crtc->cm_has_degamma = false;
368 crtc->cm_is_degamma_srgb = false;
369
370 /* Setup regamma and degamma. */
371 if (is_legacy) {
372 /*
373 * Legacy regamma forces us to use the sRGB RGM as a base.
374 * This also means we can't use linear DGM since DGM needs
375 * to use sRGB as a base as well, resulting in incorrect CRTC
376 * DGM and CRTC CTM.
377 *
378 * TODO: Just map this to the standard regamma interface
379 * instead since this isn't really right. One of the cases
380 * where this setup currently fails is trying to do an
381 * inverse color ramp in legacy userspace.
382 */
383 crtc->cm_is_degamma_srgb = true;
384 stream->out_transfer_func->type = TF_TYPE_DISTRIBUTED_POINTS;
385 stream->out_transfer_func->tf = TRANSFER_FUNCTION_SRGB;
386
387 r = __set_legacy_tf(stream->out_transfer_func, regamma_lut,
388 regamma_size, has_rom);
389 if (r)
390 return r;
391 } else if (has_regamma) {
392 /* CRTC RGM goes into RGM LUT. */
393 stream->out_transfer_func->type = TF_TYPE_DISTRIBUTED_POINTS;
394 stream->out_transfer_func->tf = TRANSFER_FUNCTION_LINEAR;
395
396 r = __set_output_tf(stream->out_transfer_func, regamma_lut,
397 regamma_size, has_rom);
398 if (r)
399 return r;
400 } else {
401 /*
402 * No CRTC RGM means we can just put the block into bypass
403 * since we don't have any plane level adjustments using it.
404 */
405 stream->out_transfer_func->type = TF_TYPE_BYPASS;
406 stream->out_transfer_func->tf = TRANSFER_FUNCTION_LINEAR;
407 }
408
409 /*
410 * CRTC DGM goes into DGM LUT. It would be nice to place it
411 * into the RGM since it's a more featured block but we'd
412 * have to place the CTM in the OCSC in that case.
413 */
414 crtc->cm_has_degamma = has_degamma;
415
416 /* Setup CRTC CTM. */
417 if (crtc->base.ctm) {
418 ctm = (struct drm_color_ctm *)crtc->base.ctm->data;
419
420 /*
421 * Gamut remapping must be used for gamma correction
422 * since it comes before the regamma correction.
423 *
424 * OCSC could be used for gamma correction, but we'd need to
425 * blend the adjustments together with the required output
426 * conversion matrix - so just use the gamut remap block
427 * for now.
428 */
429 __drm_ctm_to_dc_matrix(ctm, stream->gamut_remap_matrix.matrix);
430
431 stream->gamut_remap_matrix.enable_remap = true;
432 stream->csc_color_matrix.enable_adjustment = false;
433 } else {
434 /* Bypass CTM. */
435 stream->gamut_remap_matrix.enable_remap = false;
436 stream->csc_color_matrix.enable_adjustment = false;
437 }
438
439 return 0;
440 }
441
442 /**
443 * amdgpu_dm_update_plane_color_mgmt: Maps DRM color management to DC plane.
444 * @crtc: amdgpu_dm crtc state
445 * @dc_plane_state: target DC surface
446 *
447 * Update the underlying dc_stream_state's input transfer function (ITF) in
448 * preparation for hardware commit. The transfer function used depends on
449 * the prepartion done on the stream for color management.
450 *
451 * Returns 0 on success.
452 */
amdgpu_dm_update_plane_color_mgmt(struct dm_crtc_state * crtc,struct dc_plane_state * dc_plane_state)453 int amdgpu_dm_update_plane_color_mgmt(struct dm_crtc_state *crtc,
454 struct dc_plane_state *dc_plane_state)
455 {
456 const struct drm_color_lut *degamma_lut;
457 enum dc_transfer_func_predefined tf = TRANSFER_FUNCTION_SRGB;
458 uint32_t degamma_size;
459 int r;
460
461 /* Get the correct base transfer function for implicit degamma. */
462 switch (dc_plane_state->format) {
463 case SURFACE_PIXEL_FORMAT_VIDEO_420_YCbCr:
464 case SURFACE_PIXEL_FORMAT_VIDEO_420_YCrCb:
465 /* DC doesn't have a transfer function for BT601 specifically. */
466 tf = TRANSFER_FUNCTION_BT709;
467 break;
468 default:
469 break;
470 }
471
472 if (crtc->cm_has_degamma) {
473 degamma_lut = __extract_blob_lut(crtc->base.degamma_lut,
474 °amma_size);
475 ASSERT(degamma_size == MAX_COLOR_LUT_ENTRIES);
476
477 dc_plane_state->in_transfer_func->type =
478 TF_TYPE_DISTRIBUTED_POINTS;
479
480 /*
481 * This case isn't fully correct, but also fairly
482 * uncommon. This is userspace trying to use a
483 * legacy gamma LUT + atomic degamma LUT
484 * at the same time.
485 *
486 * Legacy gamma requires the input to be in linear
487 * space, so that means we need to apply an sRGB
488 * degamma. But color module also doesn't support
489 * a user ramp in this case so the degamma will
490 * be lost.
491 *
492 * Even if we did support it, it's still not right:
493 *
494 * Input -> CRTC DGM -> sRGB DGM -> CRTC CTM ->
495 * sRGB RGM -> CRTC RGM -> Output
496 *
497 * The CSC will be done in the wrong space since
498 * we're applying an sRGB DGM on top of the CRTC
499 * DGM.
500 *
501 * TODO: Don't use the legacy gamma interface and just
502 * map these to the atomic one instead.
503 */
504 if (crtc->cm_is_degamma_srgb)
505 dc_plane_state->in_transfer_func->tf = tf;
506 else
507 dc_plane_state->in_transfer_func->tf =
508 TRANSFER_FUNCTION_LINEAR;
509
510 r = __set_input_tf(dc_plane_state->in_transfer_func,
511 degamma_lut, degamma_size);
512 if (r)
513 return r;
514 } else if (crtc->cm_is_degamma_srgb) {
515 /*
516 * For legacy gamma support we need the regamma input
517 * in linear space. Assume that the input is sRGB.
518 */
519 dc_plane_state->in_transfer_func->type = TF_TYPE_PREDEFINED;
520 dc_plane_state->in_transfer_func->tf = tf;
521
522 if (tf != TRANSFER_FUNCTION_SRGB &&
523 !mod_color_calculate_degamma_params(NULL,
524 dc_plane_state->in_transfer_func, NULL, false))
525 return -ENOMEM;
526 } else {
527 /* ...Otherwise we can just bypass the DGM block. */
528 dc_plane_state->in_transfer_func->type = TF_TYPE_BYPASS;
529 dc_plane_state->in_transfer_func->tf = TRANSFER_FUNCTION_LINEAR;
530 }
531
532 return 0;
533 }
534