root/drivers/gpu/drm/amd/display/amdgpu_dm/amdgpu_dm_color.c
// SPDX-License-Identifier: MIT
/*
 * Copyright 2018 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: AMD
 *
 */

#include <drm/drm_colorop.h>

#include "amdgpu.h"
#include "amdgpu_mode.h"
#include "amdgpu_dm.h"
#include "amdgpu_dm_colorop.h"
#include "dc.h"
#include "modules/color/color_gamma.h"

/**
 * DOC: overview
 *
 * We have three types of color management in the AMD display driver.
 * 1. the legacy &drm_crtc DEGAMMA, CTM, and GAMMA properties
 * 2. AMD driver private color management on &drm_plane and &drm_crtc
 * 3. AMD plane color pipeline
 *
 * The CRTC properties are the original color management. When they were
 * implemented per-plane color management was not a thing yet. Because
 * of that we could get away with plumbing the DEGAMMA and CTM
 * properties to pre-blending HW functions. This is incompatible with
 * per-plane color management, such as via the AMD private properties or
 * the new drm_plane color pipeline. The only compatible CRTC property
 * with per-plane color management is the GAMMA property as it is
 * applied post-blending.
 *
 * The AMD driver private color management properties are only exposed
 * when the kernel is built explicitly with -DAMD_PRIVATE_COLOR. They
 * are temporary building blocks on the path to full-fledged &drm_plane
 * and &drm_crtc color pipelines and lay the driver's groundwork for the
 * color pipelines.
 *
 * The AMD plane color pipeline describes AMD's &drm_colorops via the
 * &drm_plane's COLOR_PIPELINE property.
 *
 * drm_crtc Properties
 * -------------------
 *
 * The DC interface to HW gives us the following color management blocks
 * per pipe (surface):
 *
 * - Input gamma LUT (de-normalized)
 * - Input CSC (normalized)
 * - Surface degamma LUT (normalized)
 * - Surface CSC (normalized)
 * - Surface regamma LUT (normalized)
 * - Output CSC (normalized)
 *
 * But these aren't a direct mapping to DRM color properties. The
 * current DRM interface exposes CRTC degamma, CRTC CTM and CRTC regamma
 * while our hardware is essentially giving:
 *
 * Plane CTM -> Plane degamma -> Plane CTM -> Plane regamma -> Plane CTM
 *
 * The input gamma LUT block isn't really applicable here since it
 * operates on the actual input data itself rather than the HW fp
 * representation. The input and output CSC blocks are technically
 * available to use as part of the DC interface but are typically used
 * internally by DC for conversions between color spaces. These could be
 * blended together with user adjustments in the future but for now
 * these should remain untouched.
 *
 * The pipe blending also happens after these blocks so we don't
 * actually support any CRTC props with correct blending with multiple
 * planes - but we can still support CRTC color management properties in
 * DM in most single plane cases correctly with clever management of the
 * DC interface in DM.
 *
 * As per DRM documentation, blocks should be in hardware bypass when
 * their respective property is set to NULL. A linear DGM/RGM LUT should
 * also considered as putting the respective block into bypass mode.
 *
 * This means that the following configuration is assumed to be the
 * default:
 *
 * Plane DGM Bypass -> Plane CTM Bypass -> Plane RGM Bypass -> ... CRTC
 * DGM Bypass -> CRTC CTM Bypass -> CRTC RGM Bypass
 *
 * AMD Private Color Management on drm_plane
 * -----------------------------------------
 *
 * The AMD private color management properties on a &drm_plane are:
 *
 * - AMD_PLANE_DEGAMMA_LUT
 * - AMD_PLANE_DEGAMMA_LUT_SIZE
 * - AMD_PLANE_DEGAMMA_TF
 * - AMD_PLANE_HDR_MULT
 * - AMD_PLANE_CTM
 * - AMD_PLANE_SHAPER_LUT
 * - AMD_PLANE_SHAPER_LUT_SIZE
 * - AMD_PLANE_SHAPER_TF
 * - AMD_PLANE_LUT3D
 * - AMD_PLANE_LUT3D_SIZE
 * - AMD_PLANE_BLEND_LUT
 * - AMD_PLANE_BLEND_LUT_SIZE
 * - AMD_PLANE_BLEND_TF
 *
 * The AMD private color management property on a &drm_crtc is:
 *
 * - AMD_CRTC_REGAMMA_TF
 *
 * Use of these properties is discouraged.
 *
 * AMD plane color pipeline
 * ------------------------
 *
 * The AMD &drm_plane color pipeline is advertised for DCN generations
 * 3.0 and newer. It exposes these elements in this order:
 *
 * 1. 1D curve colorop
 * 2. Multiplier
 * 3. 3x4 CTM
 * 4. 1D curve colorop
 * 5. 1D LUT
 * 6. 3D LUT
 * 7. 1D curve colorop
 * 8. 1D LUT
 *
 * The multiplier (#2) is a simple multiplier that is applied to all
 * channels.
 *
 * The 3x4 CTM (#3) is a simple 3x4 matrix.
 *
 * #1, and #7 are non-linear to linear curves. #4 is a linear to
 * non-linear curve. They support sRGB, PQ, and BT.709/BT.2020 EOTFs or
 * their inverse.
 *
 * The 1D LUTs (#5 and #8) are plain 4096 entry LUTs.
 *
 * The 3DLUT (#6) is a tetrahedrally interpolated 17 cube LUT.
 *
 */

#define MAX_DRM_LUT_VALUE 0xFFFF
#define MAX_DRM_LUT32_VALUE 0xFFFFFFFF
#define SDR_WHITE_LEVEL_INIT_VALUE 80

/**
 * amdgpu_dm_init_color_mod - Initialize the color module.
 *
 * We're not using the full color module, only certain components.
 * Only call setup functions for components that we need.
 */
void amdgpu_dm_init_color_mod(void)
{
        setup_x_points_distribution();
}

static inline struct fixed31_32 amdgpu_dm_fixpt_from_s3132(__u64 x)
{
        struct fixed31_32 val;

        /* If negative, convert to 2's complement. */
        if (x & (1ULL << 63))
                x = -(x & ~(1ULL << 63));

        val.value = x;
        return val;
}

#ifdef AMD_PRIVATE_COLOR
/* Pre-defined Transfer Functions (TF)
 *
 * AMD driver supports pre-defined mathematical functions for transferring
 * between encoded values and optical/linear space. Depending on HW color caps,
 * ROMs and curves built by the AMD color module support these transforms.
 *
 * The driver-specific color implementation exposes properties for pre-blending
 * degamma TF, shaper TF (before 3D LUT), and blend(dpp.ogam) TF and
 * post-blending regamma (mpc.ogam) TF. However, only pre-blending degamma
 * supports ROM curves. AMD color module uses pre-defined coefficients to build
 * curves for the other blocks. What can be done by each color block is
 * described by struct dpp_color_capsand struct mpc_color_caps.
 *
 * AMD driver-specific color API exposes the following pre-defined transfer
 * functions:
 *
 * - Identity: linear/identity relationship between pixel value and
 *   luminance value;
 * - Gamma 2.2, Gamma 2.4, Gamma 2.6: pure power functions;
 * - sRGB: 2.4: The piece-wise transfer function from IEC 61966-2-1:1999;
 * - BT.709: has a linear segment in the bottom part and then a power function
 *   with a 0.45 (~1/2.22) gamma for the rest of the range; standardized by
 *   ITU-R BT.709-6;
 * - PQ (Perceptual Quantizer): used for HDR display, allows luminance range
 *   capability of 0 to 10,000 nits; standardized by SMPTE ST 2084.
 *
 * The AMD color model is designed with an assumption that SDR (sRGB, BT.709,
 * Gamma 2.2, etc.) peak white maps (normalized to 1.0 FP) to 80 nits in the PQ
 * system. This has the implication that PQ EOTF (non-linear to linear) maps to
 * [0.0..125.0] where 125.0 = 10,000 nits / 80 nits.
 *
 * Non-linear and linear forms are described in the table below:
 *
 * ┌───────────┬─────────────────────┬──────────────────────┐
 * │           │     Non-linear      │   Linear             │
 * ├───────────┼─────────────────────┼──────────────────────┤
 * │      sRGB │ UNORM or [0.0, 1.0] │ [0.0, 1.0]           │
 * ├───────────┼─────────────────────┼──────────────────────┤
 * │     BT709 │ UNORM or [0.0, 1.0] │ [0.0, 1.0]           │
 * ├───────────┼─────────────────────┼──────────────────────┤
 * │ Gamma 2.x │ UNORM or [0.0, 1.0] │ [0.0, 1.0]           │
 * ├───────────┼─────────────────────┼──────────────────────┤
 * │        PQ │ UNORM or FP16 CCCS* │ [0.0, 125.0]         │
 * ├───────────┼─────────────────────┼──────────────────────┤
 * │  Identity │ UNORM or FP16 CCCS* │ [0.0, 1.0] or CCCS** │
 * └───────────┴─────────────────────┴──────────────────────┘
 * * CCCS: Windows canonical composition color space
 * ** Respectively
 *
 * In the driver-specific API, color block names attached to TF properties
 * suggest the intention regarding non-linear encoding pixel's luminance
 * values. As some newer encodings don't use gamma curve, we make encoding and
 * decoding explicit by defining an enum list of transfer functions supported
 * in terms of EOTF and inverse EOTF, where:
 *
 * - EOTF (electro-optical transfer function): is the transfer function to go
 *   from the encoded value to an optical (linear) value. De-gamma functions
 *   traditionally do this.
 * - Inverse EOTF (simply the inverse of the EOTF): is usually intended to go
 *   from an optical/linear space (which might have been used for blending)
 *   back to the encoded values. Gamma functions traditionally do this.
 */
static const char * const
amdgpu_transfer_function_names[] = {
        [AMDGPU_TRANSFER_FUNCTION_DEFAULT]              = "Default",
        [AMDGPU_TRANSFER_FUNCTION_IDENTITY]             = "Identity",
        [AMDGPU_TRANSFER_FUNCTION_SRGB_EOTF]            = "sRGB EOTF",
        [AMDGPU_TRANSFER_FUNCTION_BT709_INV_OETF]       = "BT.709 inv_OETF",
        [AMDGPU_TRANSFER_FUNCTION_PQ_EOTF]              = "PQ EOTF",
        [AMDGPU_TRANSFER_FUNCTION_GAMMA22_EOTF]         = "Gamma 2.2 EOTF",
        [AMDGPU_TRANSFER_FUNCTION_GAMMA24_EOTF]         = "Gamma 2.4 EOTF",
        [AMDGPU_TRANSFER_FUNCTION_GAMMA26_EOTF]         = "Gamma 2.6 EOTF",
        [AMDGPU_TRANSFER_FUNCTION_SRGB_INV_EOTF]        = "sRGB inv_EOTF",
        [AMDGPU_TRANSFER_FUNCTION_BT709_OETF]           = "BT.709 OETF",
        [AMDGPU_TRANSFER_FUNCTION_PQ_INV_EOTF]          = "PQ inv_EOTF",
        [AMDGPU_TRANSFER_FUNCTION_GAMMA22_INV_EOTF]     = "Gamma 2.2 inv_EOTF",
        [AMDGPU_TRANSFER_FUNCTION_GAMMA24_INV_EOTF]     = "Gamma 2.4 inv_EOTF",
        [AMDGPU_TRANSFER_FUNCTION_GAMMA26_INV_EOTF]     = "Gamma 2.6 inv_EOTF",
};

static const u32 amdgpu_eotf =
        BIT(AMDGPU_TRANSFER_FUNCTION_SRGB_EOTF) |
        BIT(AMDGPU_TRANSFER_FUNCTION_BT709_INV_OETF) |
        BIT(AMDGPU_TRANSFER_FUNCTION_PQ_EOTF) |
        BIT(AMDGPU_TRANSFER_FUNCTION_GAMMA22_EOTF) |
        BIT(AMDGPU_TRANSFER_FUNCTION_GAMMA24_EOTF) |
        BIT(AMDGPU_TRANSFER_FUNCTION_GAMMA26_EOTF);

static const u32 amdgpu_inv_eotf =
        BIT(AMDGPU_TRANSFER_FUNCTION_SRGB_INV_EOTF) |
        BIT(AMDGPU_TRANSFER_FUNCTION_BT709_OETF) |
        BIT(AMDGPU_TRANSFER_FUNCTION_PQ_INV_EOTF) |
        BIT(AMDGPU_TRANSFER_FUNCTION_GAMMA22_INV_EOTF) |
        BIT(AMDGPU_TRANSFER_FUNCTION_GAMMA24_INV_EOTF) |
        BIT(AMDGPU_TRANSFER_FUNCTION_GAMMA26_INV_EOTF);

static struct drm_property *
amdgpu_create_tf_property(struct drm_device *dev,
                          const char *name,
                          u32 supported_tf)
{
        u32 transfer_functions = supported_tf |
                                 BIT(AMDGPU_TRANSFER_FUNCTION_DEFAULT) |
                                 BIT(AMDGPU_TRANSFER_FUNCTION_IDENTITY);
        struct drm_prop_enum_list enum_list[AMDGPU_TRANSFER_FUNCTION_COUNT];
        int i, len;

        len = 0;
        for (i = 0; i < AMDGPU_TRANSFER_FUNCTION_COUNT; i++) {
                if ((transfer_functions & BIT(i)) == 0)
                        continue;

                enum_list[len].type = i;
                enum_list[len].name = amdgpu_transfer_function_names[i];
                len++;
        }

        return drm_property_create_enum(dev, DRM_MODE_PROP_ENUM,
                                        name, enum_list, len);
}

int
amdgpu_dm_create_color_properties(struct amdgpu_device *adev)
{
        struct drm_property *prop;

        prop = drm_property_create(adev_to_drm(adev),
                                   DRM_MODE_PROP_BLOB,
                                   "AMD_PLANE_DEGAMMA_LUT", 0);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_degamma_lut_property = prop;

        prop = drm_property_create_range(adev_to_drm(adev),
                                         DRM_MODE_PROP_IMMUTABLE,
                                         "AMD_PLANE_DEGAMMA_LUT_SIZE",
                                         0, UINT_MAX);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_degamma_lut_size_property = prop;

        prop = amdgpu_create_tf_property(adev_to_drm(adev),
                                         "AMD_PLANE_DEGAMMA_TF",
                                         amdgpu_eotf);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_degamma_tf_property = prop;

        prop = drm_property_create_range(adev_to_drm(adev),
                                         0, "AMD_PLANE_HDR_MULT", 0, U64_MAX);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_hdr_mult_property = prop;

        prop = drm_property_create(adev_to_drm(adev),
                                   DRM_MODE_PROP_BLOB,
                                   "AMD_PLANE_CTM", 0);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_ctm_property = prop;

        prop = drm_property_create(adev_to_drm(adev),
                                   DRM_MODE_PROP_BLOB,
                                   "AMD_PLANE_SHAPER_LUT", 0);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_shaper_lut_property = prop;

        prop = drm_property_create_range(adev_to_drm(adev),
                                         DRM_MODE_PROP_IMMUTABLE,
                                         "AMD_PLANE_SHAPER_LUT_SIZE", 0, UINT_MAX);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_shaper_lut_size_property = prop;

        prop = amdgpu_create_tf_property(adev_to_drm(adev),
                                         "AMD_PLANE_SHAPER_TF",
                                         amdgpu_inv_eotf);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_shaper_tf_property = prop;

        prop = drm_property_create(adev_to_drm(adev),
                                   DRM_MODE_PROP_BLOB,
                                   "AMD_PLANE_LUT3D", 0);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_lut3d_property = prop;

        prop = drm_property_create_range(adev_to_drm(adev),
                                         DRM_MODE_PROP_IMMUTABLE,
                                         "AMD_PLANE_LUT3D_SIZE", 0, UINT_MAX);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_lut3d_size_property = prop;

        prop = drm_property_create(adev_to_drm(adev),
                                   DRM_MODE_PROP_BLOB,
                                   "AMD_PLANE_BLEND_LUT", 0);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_blend_lut_property = prop;

        prop = drm_property_create_range(adev_to_drm(adev),
                                         DRM_MODE_PROP_IMMUTABLE,
                                         "AMD_PLANE_BLEND_LUT_SIZE", 0, UINT_MAX);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_blend_lut_size_property = prop;

        prop = amdgpu_create_tf_property(adev_to_drm(adev),
                                         "AMD_PLANE_BLEND_TF",
                                         amdgpu_eotf);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.plane_blend_tf_property = prop;

        prop = amdgpu_create_tf_property(adev_to_drm(adev),
                                         "AMD_CRTC_REGAMMA_TF",
                                         amdgpu_inv_eotf);
        if (!prop)
                return -ENOMEM;
        adev->mode_info.regamma_tf_property = prop;

        return 0;
}
#endif

/**
 * __extract_blob_lut - Extracts the DRM lut and lut size from a blob.
 * @blob: DRM color mgmt property blob
 * @size: lut size
 *
 * Returns:
 * DRM LUT or NULL
 */
static const struct drm_color_lut *
__extract_blob_lut(const struct drm_property_blob *blob, uint32_t *size)
{
        *size = blob ? drm_color_lut_size(blob) : 0;
        return blob ? (struct drm_color_lut *)blob->data : NULL;
}

/**
 * __extract_blob_lut32 - Extracts the DRM lut and lut size from a blob.
 * @blob: DRM color mgmt property blob
 * @size: lut size
 *
 * Returns:
 * DRM LUT or NULL
 */
static const struct drm_color_lut32 *
__extract_blob_lut32(const struct drm_property_blob *blob, uint32_t *size)
{
        *size = blob ? drm_color_lut32_size(blob) : 0;
        return blob ? (struct drm_color_lut32 *)blob->data : NULL;
}

/**
 * __is_lut_linear - check if the given lut is a linear mapping of values
 * @lut: given lut to check values
 * @size: lut size
 *
 * It is considered linear if the lut represents:
 * f(a) = (0xFF00/MAX_COLOR_LUT_ENTRIES-1)a; for integer a in [0,
 * MAX_COLOR_LUT_ENTRIES)
 *
 * Returns:
 * True if the given lut is a linear mapping of values, i.e. it acts like a
 * bypass LUT. Otherwise, false.
 */
static bool __is_lut_linear(const struct drm_color_lut *lut, uint32_t size)
{
        int i;
        uint32_t expected;
        int delta;

        for (i = 0; i < size; i++) {
                /* All color values should equal */
                if ((lut[i].red != lut[i].green) || (lut[i].green != lut[i].blue))
                        return false;

                expected = i * MAX_DRM_LUT_VALUE / (size-1);

                /* Allow a +/-1 error. */
                delta = lut[i].red - expected;
                if (delta < -1 || 1 < delta)
                        return false;
        }
        return true;
}

/**
 * __drm_lut_to_dc_gamma - convert the drm_color_lut to dc_gamma.
 * @lut: DRM lookup table for color conversion
 * @gamma: DC gamma to set entries
 * @is_legacy: legacy or atomic gamma
 *
 * The conversion depends on the size of the lut - whether or not it's legacy.
 */
static void __drm_lut_to_dc_gamma(const struct drm_color_lut *lut,
                                  struct dc_gamma *gamma, bool is_legacy)
{
        uint32_t r, g, b;
        int i;

        if (is_legacy) {
                for (i = 0; i < MAX_COLOR_LEGACY_LUT_ENTRIES; i++) {
                        r = drm_color_lut_extract(lut[i].red, 16);
                        g = drm_color_lut_extract(lut[i].green, 16);
                        b = drm_color_lut_extract(lut[i].blue, 16);

                        gamma->entries.red[i] = dc_fixpt_from_int(r);
                        gamma->entries.green[i] = dc_fixpt_from_int(g);
                        gamma->entries.blue[i] = dc_fixpt_from_int(b);
                }
                return;
        }

        /* else */
        for (i = 0; i < MAX_COLOR_LUT_ENTRIES; i++) {
                r = drm_color_lut_extract(lut[i].red, 16);
                g = drm_color_lut_extract(lut[i].green, 16);
                b = drm_color_lut_extract(lut[i].blue, 16);

                gamma->entries.red[i] = dc_fixpt_from_fraction(r, MAX_DRM_LUT_VALUE);
                gamma->entries.green[i] = dc_fixpt_from_fraction(g, MAX_DRM_LUT_VALUE);
                gamma->entries.blue[i] = dc_fixpt_from_fraction(b, MAX_DRM_LUT_VALUE);
        }
}

/**
 * __drm_lut32_to_dc_gamma - convert the drm_color_lut to dc_gamma.
 * @lut: DRM lookup table for color conversion
 * @gamma: DC gamma to set entries
 *
 * The conversion depends on the size of the lut - whether or not it's legacy.
 */
static void __drm_lut32_to_dc_gamma(const struct drm_color_lut32 *lut, struct dc_gamma *gamma)
{
        int i;

        for (i = 0; i < MAX_COLOR_LUT_ENTRIES; i++) {
                gamma->entries.red[i] = dc_fixpt_from_fraction(lut[i].red, MAX_DRM_LUT32_VALUE);
                gamma->entries.green[i] = dc_fixpt_from_fraction(lut[i].green, MAX_DRM_LUT32_VALUE);
                gamma->entries.blue[i] = dc_fixpt_from_fraction(lut[i].blue, MAX_DRM_LUT32_VALUE);
        }
}

/**
 * __drm_ctm_to_dc_matrix - converts a DRM CTM to a DC CSC float matrix
 * @ctm: DRM color transformation matrix
 * @matrix: DC CSC float matrix
 *
 * The matrix needs to be a 3x4 (12 entry) matrix.
 */
static void __drm_ctm_to_dc_matrix(const struct drm_color_ctm *ctm,
                                   struct fixed31_32 *matrix)
{
        int i;

        /*
         * DRM gives a 3x3 matrix, but DC wants 3x4. Assuming we're operating
         * with homogeneous coordinates, augment the matrix with 0's.
         *
         * The format provided is S31.32, using signed-magnitude representation.
         * Our fixed31_32 is also S31.32, but is using 2's complement. We have
         * to convert from signed-magnitude to 2's complement.
         */
        for (i = 0; i < 12; i++) {
                /* Skip 4th element */
                if (i % 4 == 3) {
                        matrix[i] = dc_fixpt_zero;
                        continue;
                }

                /* gamut_remap_matrix[i] = ctm[i - floor(i/4)] */
                matrix[i] = amdgpu_dm_fixpt_from_s3132(ctm->matrix[i - (i / 4)]);
        }
}

/**
 * __drm_ctm_3x4_to_dc_matrix - converts a DRM CTM 3x4 to a DC CSC float matrix
 * @ctm: DRM color transformation matrix with 3x4 dimensions
 * @matrix: DC CSC float matrix
 *
 * The matrix needs to be a 3x4 (12 entry) matrix.
 */
static void __drm_ctm_3x4_to_dc_matrix(const struct drm_color_ctm_3x4 *ctm,
                                       struct fixed31_32 *matrix)
{
        int i;

        /* The format provided is S31.32, using signed-magnitude representation.
         * Our fixed31_32 is also S31.32, but is using 2's complement. We have
         * to convert from signed-magnitude to 2's complement.
         */
        for (i = 0; i < 12; i++) {
                /* gamut_remap_matrix[i] = ctm[i - floor(i/4)] */
                matrix[i] = amdgpu_dm_fixpt_from_s3132(ctm->matrix[i]);
        }
}

/**
 * __set_legacy_tf - Calculates the legacy transfer function
 * @func: transfer function
 * @lut: lookup table that defines the color space
 * @lut_size: size of respective lut
 * @has_rom: if ROM can be used for hardcoded curve
 *
 * Only for sRGB input space
 *
 * Returns:
 * 0 in case of success, -ENOMEM if fails
 */
static int __set_legacy_tf(struct dc_transfer_func *func,
                           const struct drm_color_lut *lut, uint32_t lut_size,
                           bool has_rom)
{
        struct dc_gamma *gamma = NULL;
        struct calculate_buffer cal_buffer = {0};
        bool res;

        ASSERT(lut && lut_size == MAX_COLOR_LEGACY_LUT_ENTRIES);

        cal_buffer.buffer_index = -1;

        gamma = dc_create_gamma();
        if (!gamma)
                return -ENOMEM;

        gamma->type = GAMMA_RGB_256;
        gamma->num_entries = lut_size;
        __drm_lut_to_dc_gamma(lut, gamma, true);

        res = mod_color_calculate_regamma_params(func, gamma, true, has_rom,
                                                 NULL, &cal_buffer);

        dc_gamma_release(&gamma);

        return res ? 0 : -ENOMEM;
}

/**
 * __set_output_tf - calculates the output transfer function based on expected input space.
 * @func: transfer function
 * @lut: lookup table that defines the color space
 * @lut_size: size of respective lut
 * @has_rom: if ROM can be used for hardcoded curve
 *
 * Returns:
 * 0 in case of success. -ENOMEM if fails.
 */
static int __set_output_tf(struct dc_transfer_func *func,
                           const struct drm_color_lut *lut, uint32_t lut_size,
                           bool has_rom)
{
        struct dc_gamma *gamma = NULL;
        struct calculate_buffer cal_buffer = {0};
        bool res;

        cal_buffer.buffer_index = -1;

        if (lut_size) {
                ASSERT(lut && lut_size == MAX_COLOR_LUT_ENTRIES);

                gamma = dc_create_gamma();
                if (!gamma)
                        return -ENOMEM;

                gamma->num_entries = lut_size;
                __drm_lut_to_dc_gamma(lut, gamma, false);
        }

        if (func->tf == TRANSFER_FUNCTION_LINEAR) {
                /*
                 * Color module doesn't like calculating regamma params
                 * on top of a linear input. But degamma params can be used
                 * instead to simulate this.
                 */
                if (gamma)
                        gamma->type = GAMMA_CUSTOM;
                res = mod_color_calculate_degamma_params(NULL, func,
                                                         gamma, gamma != NULL);
        } else {
                /*
                 * Assume sRGB. The actual mapping will depend on whether the
                 * input was legacy or not.
                 */
                if (gamma)
                        gamma->type = GAMMA_CS_TFM_1D;
                res = mod_color_calculate_regamma_params(func, gamma, gamma != NULL,
                                                         has_rom, NULL, &cal_buffer);
        }

        if (gamma)
                dc_gamma_release(&gamma);

        return res ? 0 : -ENOMEM;
}

/**
 * __set_output_tf_32 - calculates the output transfer function based on expected input space.
 * @func: transfer function
 * @lut: lookup table that defines the color space
 * @lut_size: size of respective lut
 * @has_rom: if ROM can be used for hardcoded curve
 *
 * Returns:
 * 0 in case of success. -ENOMEM if fails.
 */
static int __set_output_tf_32(struct dc_transfer_func *func,
                              const struct drm_color_lut32 *lut, uint32_t lut_size,
                              bool has_rom)
{
        struct dc_gamma *gamma = NULL;
        struct calculate_buffer cal_buffer = {0};
        bool res;

        cal_buffer.buffer_index = -1;

        if (lut_size) {
                gamma = dc_create_gamma();
                if (!gamma)
                        return -ENOMEM;

                gamma->num_entries = lut_size;
                __drm_lut32_to_dc_gamma(lut, gamma);
        }

        if (func->tf == TRANSFER_FUNCTION_LINEAR) {
                /*
                 * Color module doesn't like calculating regamma params
                 * on top of a linear input. But degamma params can be used
                 * instead to simulate this.
                 */
                if (gamma)
                        gamma->type = GAMMA_CUSTOM;
                res = mod_color_calculate_degamma_params(NULL, func,
                                                         gamma, gamma != NULL);
        } else {
                /*
                 * Assume sRGB. The actual mapping will depend on whether the
                 * input was legacy or not.
                 */
                if (gamma)
                        gamma->type = GAMMA_CS_TFM_1D;
                res = mod_color_calculate_regamma_params(func, gamma, gamma != NULL,
                                                         has_rom, NULL, &cal_buffer);
        }

        if (gamma)
                dc_gamma_release(&gamma);

        return res ? 0 : -ENOMEM;
}


static int amdgpu_dm_set_atomic_regamma(struct dc_transfer_func *out_tf,
                                        const struct drm_color_lut *regamma_lut,
                                        uint32_t regamma_size, bool has_rom,
                                        enum dc_transfer_func_predefined tf)
{
        int ret = 0;

        if (regamma_size || tf != TRANSFER_FUNCTION_LINEAR) {
                /*
                 * CRTC RGM goes into RGM LUT.
                 *
                 * Note: there is no implicit sRGB regamma here. We are using
                 * degamma calculation from color module to calculate the curve
                 * from a linear base if gamma TF is not set. However, if gamma
                 * TF (!= Linear) and LUT are set at the same time, we will use
                 * regamma calculation, and the color module will combine the
                 * pre-defined TF and the custom LUT values into the LUT that's
                 * actually programmed.
                 */
                out_tf->type = TF_TYPE_DISTRIBUTED_POINTS;
                out_tf->tf = tf;
                out_tf->sdr_ref_white_level = SDR_WHITE_LEVEL_INIT_VALUE;

                ret = __set_output_tf(out_tf, regamma_lut, regamma_size, has_rom);
        } else {
                /*
                 * No CRTC RGM means we can just put the block into bypass
                 * since we don't have any plane level adjustments using it.
                 */
                out_tf->type = TF_TYPE_BYPASS;
                out_tf->tf = TRANSFER_FUNCTION_LINEAR;
        }

        return ret;
}

/**
 * __set_input_tf - calculates the input transfer function based on expected
 * input space.
 * @caps: dc color capabilities
 * @func: transfer function
 * @lut: lookup table that defines the color space
 * @lut_size: size of respective lut.
 *
 * Returns:
 * 0 in case of success. -ENOMEM if fails.
 */
static int __set_input_tf(struct dc_color_caps *caps, struct dc_transfer_func *func,
                          const struct drm_color_lut *lut, uint32_t lut_size)
{
        struct dc_gamma *gamma = NULL;
        bool res;

        if (lut_size) {
                gamma = dc_create_gamma();
                if (!gamma)
                        return -ENOMEM;

                gamma->type = GAMMA_CUSTOM;
                gamma->num_entries = lut_size;

                __drm_lut_to_dc_gamma(lut, gamma, false);
        }

        res = mod_color_calculate_degamma_params(caps, func, gamma, gamma != NULL);

        if (gamma)
                dc_gamma_release(&gamma);

        return res ? 0 : -ENOMEM;
}

/**
 * __set_input_tf_32 - calculates the input transfer function based on expected
 * input space.
 * @caps: dc color capabilities
 * @func: transfer function
 * @lut: lookup table that defines the color space
 * @lut_size: size of respective lut.
 *
 * Returns:
 * 0 in case of success. -ENOMEM if fails.
 */
static int __set_input_tf_32(struct dc_color_caps *caps, struct dc_transfer_func *func,
                             const struct drm_color_lut32 *lut, uint32_t lut_size)
{
        struct dc_gamma *gamma = NULL;
        bool res;

        if (lut_size) {
                gamma = dc_create_gamma();
                if (!gamma)
                        return -ENOMEM;

                gamma->type = GAMMA_CUSTOM;
                gamma->num_entries = lut_size;

                __drm_lut32_to_dc_gamma(lut, gamma);
        }

        res = mod_color_calculate_degamma_params(caps, func, gamma, gamma != NULL);

        if (gamma)
                dc_gamma_release(&gamma);

        return res ? 0 : -ENOMEM;
}

static enum dc_transfer_func_predefined
amdgpu_tf_to_dc_tf(enum amdgpu_transfer_function tf)
{
        switch (tf) {
        default:
        case AMDGPU_TRANSFER_FUNCTION_DEFAULT:
        case AMDGPU_TRANSFER_FUNCTION_IDENTITY:
                return TRANSFER_FUNCTION_LINEAR;
        case AMDGPU_TRANSFER_FUNCTION_SRGB_EOTF:
        case AMDGPU_TRANSFER_FUNCTION_SRGB_INV_EOTF:
                return TRANSFER_FUNCTION_SRGB;
        case AMDGPU_TRANSFER_FUNCTION_BT709_OETF:
        case AMDGPU_TRANSFER_FUNCTION_BT709_INV_OETF:
                return TRANSFER_FUNCTION_BT709;
        case AMDGPU_TRANSFER_FUNCTION_PQ_EOTF:
        case AMDGPU_TRANSFER_FUNCTION_PQ_INV_EOTF:
                return TRANSFER_FUNCTION_PQ;
        case AMDGPU_TRANSFER_FUNCTION_GAMMA22_EOTF:
        case AMDGPU_TRANSFER_FUNCTION_GAMMA22_INV_EOTF:
                return TRANSFER_FUNCTION_GAMMA22;
        case AMDGPU_TRANSFER_FUNCTION_GAMMA24_EOTF:
        case AMDGPU_TRANSFER_FUNCTION_GAMMA24_INV_EOTF:
                return TRANSFER_FUNCTION_GAMMA24;
        case AMDGPU_TRANSFER_FUNCTION_GAMMA26_EOTF:
        case AMDGPU_TRANSFER_FUNCTION_GAMMA26_INV_EOTF:
                return TRANSFER_FUNCTION_GAMMA26;
        }
}

static enum dc_transfer_func_predefined
amdgpu_colorop_tf_to_dc_tf(enum drm_colorop_curve_1d_type tf)
{
        switch (tf) {
        case DRM_COLOROP_1D_CURVE_SRGB_EOTF:
        case DRM_COLOROP_1D_CURVE_SRGB_INV_EOTF:
                return TRANSFER_FUNCTION_SRGB;
        case DRM_COLOROP_1D_CURVE_PQ_125_EOTF:
        case DRM_COLOROP_1D_CURVE_PQ_125_INV_EOTF:
                return TRANSFER_FUNCTION_PQ;
        case DRM_COLOROP_1D_CURVE_BT2020_INV_OETF:
        case DRM_COLOROP_1D_CURVE_BT2020_OETF:
                return TRANSFER_FUNCTION_BT709;
        case DRM_COLOROP_1D_CURVE_GAMMA22:
        case DRM_COLOROP_1D_CURVE_GAMMA22_INV:
                return TRANSFER_FUNCTION_GAMMA22;
        default:
                return TRANSFER_FUNCTION_LINEAR;
        }
}

static void __to_dc_lut3d_color(struct dc_rgb *rgb,
                                const struct drm_color_lut lut,
                                int bit_precision)
{
        rgb->red = drm_color_lut_extract(lut.red, bit_precision);
        rgb->green = drm_color_lut_extract(lut.green, bit_precision);
        rgb->blue  = drm_color_lut_extract(lut.blue, bit_precision);
}

static void __drm_3dlut_to_dc_3dlut(const struct drm_color_lut *lut,
                                    uint32_t lut3d_size,
                                    struct tetrahedral_params *params,
                                    bool use_tetrahedral_9,
                                    int bit_depth)
{
        struct dc_rgb *lut0;
        struct dc_rgb *lut1;
        struct dc_rgb *lut2;
        struct dc_rgb *lut3;
        int lut_i, i;


        if (use_tetrahedral_9) {
                lut0 = params->tetrahedral_9.lut0;
                lut1 = params->tetrahedral_9.lut1;
                lut2 = params->tetrahedral_9.lut2;
                lut3 = params->tetrahedral_9.lut3;
        } else {
                lut0 = params->tetrahedral_17.lut0;
                lut1 = params->tetrahedral_17.lut1;
                lut2 = params->tetrahedral_17.lut2;
                lut3 = params->tetrahedral_17.lut3;
        }

        for (lut_i = 0, i = 0; i < lut3d_size - 4; lut_i++, i += 4) {
                /*
                 * We should consider the 3D LUT RGB values are distributed
                 * along four arrays lut0-3 where the first sizes 1229 and the
                 * other 1228. The bit depth supported for 3dlut channel is
                 * 12-bit, but DC also supports 10-bit.
                 *
                 * TODO: improve color pipeline API to enable the userspace set
                 * bit depth and 3D LUT size/stride, as specified by VA-API.
                 */
                __to_dc_lut3d_color(&lut0[lut_i], lut[i], bit_depth);
                __to_dc_lut3d_color(&lut1[lut_i], lut[i + 1], bit_depth);
                __to_dc_lut3d_color(&lut2[lut_i], lut[i + 2], bit_depth);
                __to_dc_lut3d_color(&lut3[lut_i], lut[i + 3], bit_depth);
        }
        /* lut0 has 1229 points (lut_size/4 + 1) */
        __to_dc_lut3d_color(&lut0[lut_i], lut[i], bit_depth);
}

static void __to_dc_lut3d_32_color(struct dc_rgb *rgb,
                                   const struct drm_color_lut32 lut,
                                   int bit_precision)
{
        rgb->red = drm_color_lut32_extract(lut.red, bit_precision);
        rgb->green = drm_color_lut32_extract(lut.green, bit_precision);
        rgb->blue  = drm_color_lut32_extract(lut.blue, bit_precision);
}

static void __drm_3dlut32_to_dc_3dlut(const struct drm_color_lut32 *lut,
                                       uint32_t lut3d_size,
                                       struct tetrahedral_params *params,
                                       bool use_tetrahedral_9,
                                       int bit_depth)
{
        struct dc_rgb *lut0;
        struct dc_rgb *lut1;
        struct dc_rgb *lut2;
        struct dc_rgb *lut3;
        int lut_i, i;


        if (use_tetrahedral_9) {
                lut0 = params->tetrahedral_9.lut0;
                lut1 = params->tetrahedral_9.lut1;
                lut2 = params->tetrahedral_9.lut2;
                lut3 = params->tetrahedral_9.lut3;
        } else {
                lut0 = params->tetrahedral_17.lut0;
                lut1 = params->tetrahedral_17.lut1;
                lut2 = params->tetrahedral_17.lut2;
                lut3 = params->tetrahedral_17.lut3;
        }

        for (lut_i = 0, i = 0; i < lut3d_size - 4; lut_i++, i += 4) {
                /*
                 * We should consider the 3D LUT RGB values are distributed
                 * along four arrays lut0-3 where the first sizes 1229 and the
                 * other 1228. The bit depth supported for 3dlut channel is
                 * 12-bit, but DC also supports 10-bit.
                 *
                 * TODO: improve color pipeline API to enable the userspace set
                 * bit depth and 3D LUT size/stride, as specified by VA-API.
                 */
                __to_dc_lut3d_32_color(&lut0[lut_i], lut[i], bit_depth);
                __to_dc_lut3d_32_color(&lut1[lut_i], lut[i + 1], bit_depth);
                __to_dc_lut3d_32_color(&lut2[lut_i], lut[i + 2], bit_depth);
                __to_dc_lut3d_32_color(&lut3[lut_i], lut[i + 3], bit_depth);
        }
        /* lut0 has 1229 points (lut_size/4 + 1) */
        __to_dc_lut3d_32_color(&lut0[lut_i], lut[i], bit_depth);
}

/* amdgpu_dm_atomic_lut3d - set DRM 3D LUT to DC stream
 * @drm_lut3d: user 3D LUT
 * @drm_lut3d_size: size of 3D LUT
 * @lut3d: DC 3D LUT
 *
 * Map user 3D LUT data to DC 3D LUT and all necessary bits to program it
 * on DCN accordingly.
 */
static void amdgpu_dm_atomic_lut3d(const struct drm_color_lut *drm_lut3d,
                                   uint32_t drm_lut3d_size,
                                   struct dc_3dlut *lut)
{
        if (!drm_lut3d_size) {
                lut->state.bits.initialized = 0;
        } else {
                /* Stride and bit depth are not programmable by API yet.
                 * Therefore, only supports 17x17x17 3D LUT (12-bit).
                 */
                lut->lut_3d.use_tetrahedral_9 = false;
                lut->lut_3d.use_12bits = true;
                lut->state.bits.initialized = 1;
                __drm_3dlut_to_dc_3dlut(drm_lut3d, drm_lut3d_size, &lut->lut_3d,
                                        lut->lut_3d.use_tetrahedral_9,
                                        MAX_COLOR_3DLUT_BITDEPTH);
        }
}

static int amdgpu_dm_atomic_shaper_lut(const struct drm_color_lut *shaper_lut,
                                       bool has_rom,
                                       enum dc_transfer_func_predefined tf,
                                       uint32_t shaper_size,
                                       struct dc_transfer_func *func_shaper)
{
        int ret = 0;

        if (shaper_size || tf != TRANSFER_FUNCTION_LINEAR) {
                /*
                 * If user shaper LUT is set, we assume a linear color space
                 * (linearized by degamma 1D LUT or not).
                 */
                func_shaper->type = TF_TYPE_DISTRIBUTED_POINTS;
                func_shaper->tf = tf;
                func_shaper->sdr_ref_white_level = SDR_WHITE_LEVEL_INIT_VALUE;

                ret = __set_output_tf(func_shaper, shaper_lut, shaper_size, has_rom);
        } else {
                func_shaper->type = TF_TYPE_BYPASS;
                func_shaper->tf = TRANSFER_FUNCTION_LINEAR;
        }

        return ret;
}

static int amdgpu_dm_atomic_blend_lut(const struct drm_color_lut *blend_lut,
                                       bool has_rom,
                                       enum dc_transfer_func_predefined tf,
                                       uint32_t blend_size,
                                       struct dc_transfer_func *func_blend)
{
        int ret = 0;

        if (blend_size || tf != TRANSFER_FUNCTION_LINEAR) {
                /*
                 * DRM plane gamma LUT or TF means we are linearizing color
                 * space before blending (similar to degamma programming). As
                 * we don't have hardcoded curve support, or we use AMD color
                 * module to fill the parameters that will be translated to HW
                 * points.
                 */
                func_blend->type = TF_TYPE_DISTRIBUTED_POINTS;
                func_blend->tf = tf;
                func_blend->sdr_ref_white_level = SDR_WHITE_LEVEL_INIT_VALUE;

                ret = __set_input_tf(NULL, func_blend, blend_lut, blend_size);
        } else {
                func_blend->type = TF_TYPE_BYPASS;
                func_blend->tf = TRANSFER_FUNCTION_LINEAR;
        }

        return ret;
}

/**
 * amdgpu_dm_verify_lut3d_size - verifies if 3D LUT is supported and if user
 * shaper and 3D LUTs match the hw supported size
 * @adev: amdgpu device
 * @plane_state: the DRM plane state
 *
 * Verifies if pre-blending (DPP) 3D LUT is supported by the HW (DCN 2.0 or
 * newer) and if the user shaper and 3D LUTs match the supported size.
 *
 * Returns:
 * 0 on success. -EINVAL if lut size are invalid.
 */
int amdgpu_dm_verify_lut3d_size(struct amdgpu_device *adev,
                                struct drm_plane_state *plane_state)
{
        struct dm_plane_state *dm_plane_state = to_dm_plane_state(plane_state);
        const struct drm_color_lut *shaper = NULL, *lut3d = NULL;
        uint32_t exp_size, size, dim_size = MAX_COLOR_3DLUT_SIZE;
        bool has_3dlut = adev->dm.dc->caps.color.dpp.hw_3d_lut || adev->dm.dc->caps.color.mpc.preblend;

        /* shaper LUT is only available if 3D LUT color caps */
        exp_size = has_3dlut ? MAX_COLOR_LUT_ENTRIES : 0;
        shaper = __extract_blob_lut(dm_plane_state->shaper_lut, &size);

        if (shaper && size != exp_size) {
                drm_dbg(&adev->ddev,
                        "Invalid Shaper LUT size. Should be %u but got %u.\n",
                        exp_size, size);
                return -EINVAL;
        }

        /* The number of 3D LUT entries is the dimension size cubed */
        exp_size = has_3dlut ? dim_size * dim_size * dim_size : 0;
        lut3d = __extract_blob_lut(dm_plane_state->lut3d, &size);

        if (lut3d && size != exp_size) {
                drm_dbg(&adev->ddev,
                        "Invalid 3D LUT size. Should be %u but got %u.\n",
                        exp_size, size);
                return -EINVAL;
        }

        return 0;
}

/**
 * amdgpu_dm_verify_lut_sizes - verifies if DRM luts match the hw supported sizes
 * @crtc_state: the DRM CRTC state
 *
 * Verifies that the Degamma and Gamma LUTs attached to the &crtc_state
 * are of the expected size.
 *
 * Returns:
 * 0 on success. -EINVAL if any lut sizes are invalid.
 */
int amdgpu_dm_verify_lut_sizes(const struct drm_crtc_state *crtc_state)
{
        const struct drm_color_lut *lut = NULL;
        uint32_t size = 0;

        lut = __extract_blob_lut(crtc_state->degamma_lut, &size);
        if (lut && size != MAX_COLOR_LUT_ENTRIES) {
                DRM_DEBUG_DRIVER(
                        "Invalid Degamma LUT size. Should be %u but got %u.\n",
                        MAX_COLOR_LUT_ENTRIES, size);
                return -EINVAL;
        }

        lut = __extract_blob_lut(crtc_state->gamma_lut, &size);
        if (lut && size != MAX_COLOR_LUT_ENTRIES &&
            size != MAX_COLOR_LEGACY_LUT_ENTRIES) {
                DRM_DEBUG_DRIVER(
                        "Invalid Gamma LUT size. Should be %u (or %u for legacy) but got %u.\n",
                        MAX_COLOR_LUT_ENTRIES, MAX_COLOR_LEGACY_LUT_ENTRIES,
                        size);
                return -EINVAL;
        }

        return 0;
}

/**
 * amdgpu_dm_check_crtc_color_mgmt: Check if DRM color props are programmable by DC.
 * @crtc: amdgpu_dm crtc state
 * @check_only: only check color state without update dc stream
 *
 * This function just verifies CRTC LUT sizes, if there is enough space for
 * output transfer function and if its parameters can be calculated by AMD
 * color module. It also adjusts some settings for programming CRTC degamma at
 * plane stage, using plane DGM block.
 *
 * The RGM block is typically more fully featured and accurate across
 * all ASICs - DCE can't support a custom non-linear CRTC DGM.
 *
 * For supporting both plane level color management and CRTC level color
 * management at once we have to either restrict the usage of some CRTC
 * properties or blend adjustments together.
 *
 * Returns:
 * 0 on success. Error code if validation fails.
 */

int amdgpu_dm_check_crtc_color_mgmt(struct dm_crtc_state *crtc,
                                    bool check_only)
{
        struct dc_stream_state *stream = crtc->stream;
        struct amdgpu_device *adev = drm_to_adev(crtc->base.state->dev);
        bool has_rom = adev->asic_type <= CHIP_RAVEN;
        struct dc_transfer_func *out_tf;
        const struct drm_color_lut *degamma_lut, *regamma_lut;
        uint32_t degamma_size, regamma_size;
        bool has_regamma, has_degamma;
        enum dc_transfer_func_predefined tf = TRANSFER_FUNCTION_LINEAR;
        bool is_legacy;
        int r;

        tf = amdgpu_tf_to_dc_tf(crtc->regamma_tf);

        r = amdgpu_dm_verify_lut_sizes(&crtc->base);
        if (r)
                return r;

        degamma_lut = __extract_blob_lut(crtc->base.degamma_lut, &degamma_size);
        regamma_lut = __extract_blob_lut(crtc->base.gamma_lut, &regamma_size);

        has_degamma =
                degamma_lut && !__is_lut_linear(degamma_lut, degamma_size);

        has_regamma =
                regamma_lut && !__is_lut_linear(regamma_lut, regamma_size);

        is_legacy = regamma_size == MAX_COLOR_LEGACY_LUT_ENTRIES;

        /* Reset all adjustments. */
        crtc->cm_has_degamma = false;
        crtc->cm_is_degamma_srgb = false;

        if (check_only) {
                out_tf = kvzalloc_obj(*out_tf);
                if (!out_tf)
                        return -ENOMEM;
        } else {
                out_tf = &stream->out_transfer_func;
        }

        /* Setup regamma and degamma. */
        if (is_legacy) {
                /*
                 * Legacy regamma forces us to use the sRGB RGM as a base.
                 * This also means we can't use linear DGM since DGM needs
                 * to use sRGB as a base as well, resulting in incorrect CRTC
                 * DGM and CRTC CTM.
                 *
                 * TODO: Just map this to the standard regamma interface
                 * instead since this isn't really right. One of the cases
                 * where this setup currently fails is trying to do an
                 * inverse color ramp in legacy userspace.
                 */
                crtc->cm_is_degamma_srgb = true;
                out_tf->type = TF_TYPE_DISTRIBUTED_POINTS;
                out_tf->tf = TRANSFER_FUNCTION_SRGB;
                /*
                 * Note: although we pass has_rom as parameter here, we never
                 * actually use ROM because the color module only takes the ROM
                 * path if transfer_func->type == PREDEFINED.
                 *
                 * See more in mod_color_calculate_regamma_params()
                 */
                r = __set_legacy_tf(out_tf, regamma_lut,
                                    regamma_size, has_rom);
        } else {
                regamma_size = has_regamma ? regamma_size : 0;
                r = amdgpu_dm_set_atomic_regamma(out_tf, regamma_lut,
                                                 regamma_size, has_rom, tf);
        }

        /*
         * CRTC DGM goes into DGM LUT. It would be nice to place it
         * into the RGM since it's a more featured block but we'd
         * have to place the CTM in the OCSC in that case.
         */
        crtc->cm_has_degamma = has_degamma;
        if (check_only)
                kvfree(out_tf);

        return r;
}

/**
 * amdgpu_dm_update_crtc_color_mgmt: Maps DRM color management to DC stream.
 * @crtc: amdgpu_dm crtc state
 *
 * With no plane level color management properties we're free to use any
 * of the HW blocks as long as the CRTC CTM always comes before the
 * CRTC RGM and after the CRTC DGM.
 *
 * - The CRTC RGM block will be placed in the RGM LUT block if it is non-linear.
 * - The CRTC DGM block will be placed in the DGM LUT block if it is non-linear.
 * - The CRTC CTM will be placed in the gamut remap block if it is non-linear.
 *
 * The RGM block is typically more fully featured and accurate across
 * all ASICs - DCE can't support a custom non-linear CRTC DGM.
 *
 * For supporting both plane level color management and CRTC level color
 * management at once we have to either restrict the usage of CRTC properties
 * or blend adjustments together.
 *
 * Returns:
 * 0 on success. Error code if setup fails.
 */
int amdgpu_dm_update_crtc_color_mgmt(struct dm_crtc_state *crtc)
{
        struct dc_stream_state *stream = crtc->stream;
        struct drm_color_ctm *ctm = NULL;
        int ret;

        ret = amdgpu_dm_check_crtc_color_mgmt(crtc, false);
        if (ret)
                return ret;

        /* Setup CRTC CTM. */
        if (crtc->base.ctm) {
                ctm = (struct drm_color_ctm *)crtc->base.ctm->data;

                /*
                 * Gamut remapping must be used for gamma correction
                 * since it comes before the regamma correction.
                 *
                 * OCSC could be used for gamma correction, but we'd need to
                 * blend the adjustments together with the required output
                 * conversion matrix - so just use the gamut remap block
                 * for now.
                 */
                __drm_ctm_to_dc_matrix(ctm, stream->gamut_remap_matrix.matrix);

                stream->gamut_remap_matrix.enable_remap = true;
                stream->csc_color_matrix.enable_adjustment = false;
        } else {
                /* Bypass CTM. */
                stream->gamut_remap_matrix.enable_remap = false;
                stream->csc_color_matrix.enable_adjustment = false;
        }

        return 0;
}

static int
map_crtc_degamma_to_dc_plane(struct dm_crtc_state *crtc,
                             struct dc_plane_state *dc_plane_state,
                             struct dc_color_caps *caps)
{
        const struct drm_color_lut *degamma_lut;
        enum dc_transfer_func_predefined tf = TRANSFER_FUNCTION_SRGB;
        uint32_t degamma_size;
        int r;

        /* Get the correct base transfer function for implicit degamma. */
        switch (dc_plane_state->format) {
        case SURFACE_PIXEL_FORMAT_VIDEO_420_YCbCr:
        case SURFACE_PIXEL_FORMAT_VIDEO_420_YCrCb:
                /* DC doesn't have a transfer function for BT601 specifically. */
                tf = TRANSFER_FUNCTION_BT709;
                break;
        default:
                break;
        }

        if (crtc->cm_has_degamma) {
                degamma_lut = __extract_blob_lut(crtc->base.degamma_lut,
                                                 &degamma_size);
                ASSERT(degamma_size == MAX_COLOR_LUT_ENTRIES);

                dc_plane_state->in_transfer_func.type = TF_TYPE_DISTRIBUTED_POINTS;

                /*
                 * This case isn't fully correct, but also fairly
                 * uncommon. This is userspace trying to use a
                 * legacy gamma LUT + atomic degamma LUT
                 * at the same time.
                 *
                 * Legacy gamma requires the input to be in linear
                 * space, so that means we need to apply an sRGB
                 * degamma. But color module also doesn't support
                 * a user ramp in this case so the degamma will
                 * be lost.
                 *
                 * Even if we did support it, it's still not right:
                 *
                 * Input -> CRTC DGM -> sRGB DGM -> CRTC CTM ->
                 * sRGB RGM -> CRTC RGM -> Output
                 *
                 * The CSC will be done in the wrong space since
                 * we're applying an sRGB DGM on top of the CRTC
                 * DGM.
                 *
                 * TODO: Don't use the legacy gamma interface and just
                 * map these to the atomic one instead.
                 */
                if (crtc->cm_is_degamma_srgb)
                        dc_plane_state->in_transfer_func.tf = tf;
                else
                        dc_plane_state->in_transfer_func.tf =
                                TRANSFER_FUNCTION_LINEAR;

                r = __set_input_tf(caps, &dc_plane_state->in_transfer_func,
                                   degamma_lut, degamma_size);
                if (r)
                        return r;
        } else {
                /*
                 * For legacy gamma support we need the regamma input
                 * in linear space. Assume that the input is sRGB.
                 */
                dc_plane_state->in_transfer_func.type = TF_TYPE_PREDEFINED;
                dc_plane_state->in_transfer_func.tf = tf;

                if (tf != TRANSFER_FUNCTION_SRGB &&
                    !mod_color_calculate_degamma_params(caps,
                                                        &dc_plane_state->in_transfer_func,
                                                        NULL, false))
                        return -ENOMEM;
        }

        return 0;
}

static int
__set_dm_plane_degamma(struct drm_plane_state *plane_state,
                       struct dc_plane_state *dc_plane_state,
                       struct dc_color_caps *color_caps)
{
        struct dm_plane_state *dm_plane_state = to_dm_plane_state(plane_state);
        const struct drm_color_lut *degamma_lut;
        enum amdgpu_transfer_function tf = AMDGPU_TRANSFER_FUNCTION_DEFAULT;
        uint32_t degamma_size;
        bool has_degamma_lut;
        int ret;

        degamma_lut = __extract_blob_lut(dm_plane_state->degamma_lut,
                                         &degamma_size);

        has_degamma_lut = degamma_lut &&
                          !__is_lut_linear(degamma_lut, degamma_size);

        tf = dm_plane_state->degamma_tf;

        /* If we don't have plane degamma LUT nor TF to set on DC, we have
         * nothing to do here, return.
         */
        if (!has_degamma_lut && tf == AMDGPU_TRANSFER_FUNCTION_DEFAULT)
                return -EINVAL;

        dc_plane_state->in_transfer_func.tf = amdgpu_tf_to_dc_tf(tf);

        if (has_degamma_lut) {
                ASSERT(degamma_size == MAX_COLOR_LUT_ENTRIES);

                dc_plane_state->in_transfer_func.type =
                        TF_TYPE_DISTRIBUTED_POINTS;

                ret = __set_input_tf(color_caps, &dc_plane_state->in_transfer_func,
                                     degamma_lut, degamma_size);
                if (ret)
                        return ret;
       } else {
                dc_plane_state->in_transfer_func.type =
                        TF_TYPE_PREDEFINED;

                if (!mod_color_calculate_degamma_params(color_caps,
                    &dc_plane_state->in_transfer_func, NULL, false))
                        return -ENOMEM;
        }
        return 0;
}

static int
__set_colorop_in_tf_1d_curve(struct dc_plane_state *dc_plane_state,
                             struct drm_colorop_state *colorop_state)
{
        struct dc_transfer_func *tf = &dc_plane_state->in_transfer_func;
        struct drm_colorop *colorop = colorop_state->colorop;
        struct drm_device *drm = colorop->dev;

        if (colorop->type != DRM_COLOROP_1D_CURVE)
                return -EINVAL;

        if (!(BIT(colorop_state->curve_1d_type) & amdgpu_dm_supported_degam_tfs))
                return -EINVAL;

        if (colorop_state->bypass) {
                tf->type = TF_TYPE_BYPASS;
                tf->tf = TRANSFER_FUNCTION_LINEAR;
                return 0;
        }

        drm_dbg(drm, "Degamma colorop with ID: %d\n", colorop->base.id);

        tf->type = TF_TYPE_PREDEFINED;
        tf->tf = amdgpu_colorop_tf_to_dc_tf(colorop_state->curve_1d_type);

        return 0;
}

static int
__set_dm_plane_colorop_degamma(struct drm_plane_state *plane_state,
                               struct dc_plane_state *dc_plane_state,
                               struct drm_colorop *colorop)
{
        struct drm_colorop *old_colorop;
        struct drm_colorop_state *colorop_state = NULL, *new_colorop_state;
        struct drm_atomic_state *state = plane_state->state;
        int i = 0;

        old_colorop = colorop;

        /* 1st op: 1d curve - degamma */
        for_each_new_colorop_in_state(state, colorop, new_colorop_state, i) {
                if (new_colorop_state->colorop == old_colorop &&
                    (BIT(new_colorop_state->curve_1d_type) & amdgpu_dm_supported_degam_tfs)) {
                        colorop_state = new_colorop_state;
                        break;
                }
        }

        if (!colorop_state)
                return -EINVAL;

        return __set_colorop_in_tf_1d_curve(dc_plane_state, colorop_state);
}

static int
__set_dm_plane_colorop_3x4_matrix(struct drm_plane_state *plane_state,
                                  struct dc_plane_state *dc_plane_state,
                                  struct drm_colorop *colorop)
{
        struct drm_colorop *old_colorop;
        struct drm_colorop_state *colorop_state = NULL, *new_colorop_state;
        struct drm_atomic_state *state = plane_state->state;
        const struct drm_device *dev = colorop->dev;
        const struct drm_property_blob *blob;
        struct drm_color_ctm_3x4 *ctm = NULL;
        int i = 0;

        /* 3x4 matrix */
        old_colorop = colorop;
        for_each_new_colorop_in_state(state, colorop, new_colorop_state, i) {
                if (new_colorop_state->colorop == old_colorop &&
                    new_colorop_state->colorop->type == DRM_COLOROP_CTM_3X4) {
                        colorop_state = new_colorop_state;
                        break;
                }
        }

        if (colorop_state && !colorop_state->bypass && colorop->type == DRM_COLOROP_CTM_3X4) {
                drm_dbg(dev, "3x4 matrix colorop with ID: %d\n", colorop->base.id);
                blob = colorop_state->data;
                if (blob->length == sizeof(struct drm_color_ctm_3x4)) {
                        ctm = (struct drm_color_ctm_3x4 *) blob->data;
                        __drm_ctm_3x4_to_dc_matrix(ctm, dc_plane_state->gamut_remap_matrix.matrix);
                        dc_plane_state->gamut_remap_matrix.enable_remap = true;
                        dc_plane_state->input_csc_color_matrix.enable_adjustment = false;
                } else {
                        drm_warn(dev, "blob->length (%zu) isn't equal to drm_color_ctm_3x4 (%zu)\n",
                                 blob->length, sizeof(struct drm_color_ctm_3x4));
                        return -EINVAL;
                }
        }

        return 0;
}

static int
__set_dm_plane_colorop_multiplier(struct drm_plane_state *plane_state,
                                  struct dc_plane_state *dc_plane_state,
                                  struct drm_colorop *colorop)
{
        struct drm_colorop *old_colorop;
        struct drm_colorop_state *colorop_state = NULL, *new_colorop_state;
        struct drm_atomic_state *state = plane_state->state;
        const struct drm_device *dev = colorop->dev;
        int i = 0;

        /* Multiplier */
        old_colorop = colorop;
        for_each_new_colorop_in_state(state, colorop, new_colorop_state, i) {
                if (new_colorop_state->colorop == old_colorop &&
                    new_colorop_state->colorop->type == DRM_COLOROP_MULTIPLIER) {
                        colorop_state = new_colorop_state;
                        break;
                }
        }

        if (colorop_state && !colorop_state->bypass && colorop->type == DRM_COLOROP_MULTIPLIER) {
                drm_dbg(dev, "Multiplier colorop with ID: %d\n", colorop->base.id);
                dc_plane_state->hdr_mult = amdgpu_dm_fixpt_from_s3132(colorop_state->multiplier);
        }

        return 0;
}

static int
__set_dm_plane_colorop_shaper(struct drm_plane_state *plane_state,
                              struct dc_plane_state *dc_plane_state,
                              struct drm_colorop *colorop)
{
        struct drm_colorop *old_colorop;
        struct drm_colorop_state *colorop_state = NULL, *new_colorop_state;
        struct drm_atomic_state *state = plane_state->state;
        enum dc_transfer_func_predefined default_tf = TRANSFER_FUNCTION_LINEAR;
        struct dc_transfer_func *tf = &dc_plane_state->in_shaper_func;
        const struct drm_color_lut32 *shaper_lut;
        struct drm_device *dev = colorop->dev;
        bool enabled = false;
        u32 shaper_size;
        int i = 0, ret = 0;

        /* 1D Curve - SHAPER TF */
        old_colorop = colorop;
        for_each_new_colorop_in_state(state, colorop, new_colorop_state, i) {
                if (new_colorop_state->colorop == old_colorop &&
                    (BIT(new_colorop_state->curve_1d_type) & amdgpu_dm_supported_shaper_tfs)) {
                        colorop_state = new_colorop_state;
                        break;
                }
        }

        if (colorop_state && !colorop_state->bypass && colorop->type == DRM_COLOROP_1D_CURVE) {
                drm_dbg(dev, "Shaper TF colorop with ID: %d\n", colorop->base.id);
                tf->type = TF_TYPE_DISTRIBUTED_POINTS;
                tf->tf = default_tf = amdgpu_colorop_tf_to_dc_tf(colorop_state->curve_1d_type);
                tf->sdr_ref_white_level = SDR_WHITE_LEVEL_INIT_VALUE;
                ret = __set_output_tf(tf, 0, 0, false);
                if (ret)
                        return ret;
                enabled = true;
        }

        /* 1D LUT - SHAPER LUT */
        colorop = old_colorop->next;
        if (!colorop) {
                drm_dbg(dev, "no Shaper LUT colorop found\n");
                return -EINVAL;
        }

        old_colorop = colorop;
        for_each_new_colorop_in_state(state, colorop, new_colorop_state, i) {
                if (new_colorop_state->colorop == old_colorop &&
                    new_colorop_state->colorop->type == DRM_COLOROP_1D_LUT) {
                        colorop_state = new_colorop_state;
                        break;
                }
        }

        if (colorop_state && !colorop_state->bypass && colorop->type == DRM_COLOROP_1D_LUT) {
                drm_dbg(dev, "Shaper LUT colorop with ID: %d\n", colorop->base.id);
                tf->type = TF_TYPE_DISTRIBUTED_POINTS;
                tf->tf = default_tf;
                tf->sdr_ref_white_level = SDR_WHITE_LEVEL_INIT_VALUE;
                shaper_lut = __extract_blob_lut32(colorop_state->data, &shaper_size);
                shaper_size = shaper_lut != NULL ? shaper_size : 0;

                /* Custom LUT size must be the same as supported size */
                if (shaper_size == colorop->size) {
                        ret = __set_output_tf_32(tf, shaper_lut, shaper_size, false);
                        if (ret)
                                return ret;
                        enabled = true;
                }
        }

        if (!enabled)
                tf->type = TF_TYPE_BYPASS;

        return 0;
}

/* __set_colorop_3dlut - set DRM 3D LUT to DC stream
 * @drm_lut3d: user 3D LUT
 * @drm_lut3d_size: size of 3D LUT
 * @lut3d: DC 3D LUT
 *
 * Map user 3D LUT data to DC 3D LUT and all necessary bits to program it
 * on DCN accordingly.
 *
 * Returns:
 * 0 on success. -EINVAL if drm_lut3d_size is zero.
 */
static int __set_colorop_3dlut(const struct drm_color_lut32 *drm_lut3d,
                                uint32_t drm_lut3d_size,
                                struct dc_3dlut *lut)
{
        if (!drm_lut3d_size) {
                lut->state.bits.initialized = 0;
                return -EINVAL;
        }

        /* Only supports 17x17x17 3D LUT (12-bit) now */
        lut->lut_3d.use_12bits = true;
        lut->lut_3d.use_tetrahedral_9 = false;

        lut->state.bits.initialized = 1;
        __drm_3dlut32_to_dc_3dlut(drm_lut3d, drm_lut3d_size, &lut->lut_3d,
                                   lut->lut_3d.use_tetrahedral_9, 12);

        return 0;
}

static int
__set_dm_plane_colorop_3dlut(struct drm_plane_state *plane_state,
                             struct dc_plane_state *dc_plane_state,
                             struct drm_colorop *colorop)
{
        struct drm_colorop *old_colorop;
        struct drm_colorop_state *colorop_state = NULL, *new_colorop_state;
        struct dc_transfer_func *tf = &dc_plane_state->in_shaper_func;
        struct drm_atomic_state *state = plane_state->state;
        const struct amdgpu_device *adev = drm_to_adev(colorop->dev);
        bool has_3dlut = adev->dm.dc->caps.color.dpp.hw_3d_lut || adev->dm.dc->caps.color.mpc.preblend;
        const struct drm_device *dev = colorop->dev;
        const struct drm_color_lut32 *lut3d;
        uint32_t lut3d_size;
        int i = 0, ret = 0;

        /* 3D LUT */
        old_colorop = colorop;
        for_each_new_colorop_in_state(state, colorop, new_colorop_state, i) {
                if (new_colorop_state->colorop == old_colorop &&
                    new_colorop_state->colorop->type == DRM_COLOROP_3D_LUT) {
                        colorop_state = new_colorop_state;
                        break;
                }
        }

        if (colorop_state && !colorop_state->bypass && colorop->type == DRM_COLOROP_3D_LUT) {
                if (!has_3dlut) {
                        drm_dbg(dev, "3D LUT is not supported by hardware\n");
                        return -EINVAL;
                }

                drm_dbg(dev, "3D LUT colorop with ID: %d\n", colorop->base.id);
                lut3d = __extract_blob_lut32(colorop_state->data, &lut3d_size);
                lut3d_size = lut3d != NULL ? lut3d_size : 0;
                ret = __set_colorop_3dlut(lut3d, lut3d_size, &dc_plane_state->lut3d_func);
                if (ret) {
                        drm_dbg(dev, "3D LUT colorop with ID: %d has LUT size = %d\n",
                                colorop->base.id, lut3d_size);
                        return ret;
                }

                /* 3D LUT requires shaper. If shaper colorop is bypassed, enable shaper curve
                 * with TRANSFER_FUNCTION_LINEAR
                 */
                if (tf->type == TF_TYPE_BYPASS) {
                        tf->type = TF_TYPE_DISTRIBUTED_POINTS;
                        tf->tf = TRANSFER_FUNCTION_LINEAR;
                        tf->sdr_ref_white_level = SDR_WHITE_LEVEL_INIT_VALUE;
                        ret = __set_output_tf_32(tf, NULL, 0, false);
                }
        }

        return ret;
}

static int
__set_dm_plane_colorop_blend(struct drm_plane_state *plane_state,
                             struct dc_plane_state *dc_plane_state,
                             struct drm_colorop *colorop)
{
        struct drm_colorop *old_colorop;
        struct drm_colorop_state *colorop_state = NULL, *new_colorop_state;
        struct drm_atomic_state *state = plane_state->state;
        enum dc_transfer_func_predefined default_tf = TRANSFER_FUNCTION_LINEAR;
        struct dc_transfer_func *tf = &dc_plane_state->blend_tf;
        const struct drm_color_lut32 *blend_lut = NULL;
        struct drm_device *dev = colorop->dev;
        uint32_t blend_size = 0;
        int i = 0;

        /* 1D Curve - BLND TF */
        old_colorop = colorop;
        for_each_new_colorop_in_state(state, colorop, new_colorop_state, i) {
                if (new_colorop_state->colorop == old_colorop &&
                    (BIT(new_colorop_state->curve_1d_type) & amdgpu_dm_supported_blnd_tfs)) {
                        colorop_state = new_colorop_state;
                        break;
                }
        }

        if (colorop_state && !colorop_state->bypass && colorop->type == DRM_COLOROP_1D_CURVE &&
            (BIT(colorop_state->curve_1d_type) & amdgpu_dm_supported_blnd_tfs)) {
                drm_dbg(dev, "Blend TF colorop with ID: %d\n", colorop->base.id);
                tf->type = TF_TYPE_DISTRIBUTED_POINTS;
                tf->tf = default_tf = amdgpu_colorop_tf_to_dc_tf(colorop_state->curve_1d_type);
                tf->sdr_ref_white_level = SDR_WHITE_LEVEL_INIT_VALUE;
                __set_input_tf_32(NULL, tf, blend_lut, blend_size);
        }

        /* 1D Curve - BLND LUT */
        colorop = old_colorop->next;
        if (!colorop) {
                drm_dbg(dev, "no Blend LUT colorop found\n");
                return -EINVAL;
        }

        old_colorop = colorop;
        for_each_new_colorop_in_state(state, colorop, new_colorop_state, i) {
                if (new_colorop_state->colorop == old_colorop &&
                    new_colorop_state->colorop->type == DRM_COLOROP_1D_LUT) {
                        colorop_state = new_colorop_state;
                        break;
                }
        }

        if (colorop_state && !colorop_state->bypass && colorop->type == DRM_COLOROP_1D_LUT &&
            (BIT(colorop_state->curve_1d_type) & amdgpu_dm_supported_blnd_tfs)) {
                drm_dbg(dev, "Blend LUT colorop with ID: %d\n", colorop->base.id);
                tf->type = TF_TYPE_DISTRIBUTED_POINTS;
                tf->tf = default_tf;
                tf->sdr_ref_white_level = SDR_WHITE_LEVEL_INIT_VALUE;
                blend_lut = __extract_blob_lut32(colorop_state->data, &blend_size);
                blend_size = blend_lut != NULL ? blend_size : 0;

                /* Custom LUT size must be the same as supported size */
                if (blend_size == colorop->size)
                        __set_input_tf_32(NULL, tf, blend_lut, blend_size);
        }

        return 0;
}

static int
amdgpu_dm_plane_set_color_properties(struct drm_plane_state *plane_state,
                                     struct dc_plane_state *dc_plane_state)
{
        struct dm_plane_state *dm_plane_state = to_dm_plane_state(plane_state);
        enum amdgpu_transfer_function shaper_tf = AMDGPU_TRANSFER_FUNCTION_DEFAULT;
        enum amdgpu_transfer_function blend_tf = AMDGPU_TRANSFER_FUNCTION_DEFAULT;
        const struct drm_color_lut *shaper_lut, *lut3d, *blend_lut;
        uint32_t shaper_size, lut3d_size, blend_size;
        int ret;

        dc_plane_state->hdr_mult = amdgpu_dm_fixpt_from_s3132(dm_plane_state->hdr_mult);

        shaper_lut = __extract_blob_lut(dm_plane_state->shaper_lut, &shaper_size);
        shaper_size = shaper_lut != NULL ? shaper_size : 0;
        shaper_tf = dm_plane_state->shaper_tf;
        lut3d = __extract_blob_lut(dm_plane_state->lut3d, &lut3d_size);
        lut3d_size = lut3d != NULL ? lut3d_size : 0;

        amdgpu_dm_atomic_lut3d(lut3d, lut3d_size, &dc_plane_state->lut3d_func);
        ret = amdgpu_dm_atomic_shaper_lut(shaper_lut, false,
                                          amdgpu_tf_to_dc_tf(shaper_tf),
                                          shaper_size,
                                          &dc_plane_state->in_shaper_func);
        if (ret) {
                drm_dbg_kms(plane_state->plane->dev,
                            "setting plane %d shaper LUT failed.\n",
                            plane_state->plane->index);

                return ret;
        }

        blend_tf = dm_plane_state->blend_tf;
        blend_lut = __extract_blob_lut(dm_plane_state->blend_lut, &blend_size);
        blend_size = blend_lut != NULL ? blend_size : 0;

        ret = amdgpu_dm_atomic_blend_lut(blend_lut, false,
                                         amdgpu_tf_to_dc_tf(blend_tf),
                                         blend_size, &dc_plane_state->blend_tf);
        if (ret) {
                drm_dbg_kms(plane_state->plane->dev,
                            "setting plane %d gamma lut failed.\n",
                            plane_state->plane->index);

                return ret;
        }

        return 0;
}

static int
amdgpu_dm_plane_set_colorop_properties(struct drm_plane_state *plane_state,
                                       struct dc_plane_state *dc_plane_state)
{
        struct drm_colorop *colorop = plane_state->color_pipeline;
        struct drm_device *dev = plane_state->plane->dev;
        struct amdgpu_device *adev = drm_to_adev(dev);
        bool has_3dlut = adev->dm.dc->caps.color.dpp.hw_3d_lut || adev->dm.dc->caps.color.mpc.preblend;
        int ret;

        /* 1D Curve - DEGAM TF */
        if (!colorop)
                return -EINVAL;

        ret = __set_dm_plane_colorop_degamma(plane_state, dc_plane_state, colorop);
        if (ret)
                return ret;

        /* Multiplier */
        colorop = colorop->next;
        if (!colorop) {
                drm_dbg(dev, "no multiplier colorop found\n");
                return -EINVAL;
        }

        ret = __set_dm_plane_colorop_multiplier(plane_state, dc_plane_state, colorop);
        if (ret)
                return ret;

        /* 3x4 matrix */
        colorop = colorop->next;
        if (!colorop) {
                drm_dbg(dev, "no 3x4 matrix colorop found\n");
                return -EINVAL;
        }

        ret = __set_dm_plane_colorop_3x4_matrix(plane_state, dc_plane_state, colorop);
        if (ret)
                return ret;

        if (has_3dlut) {
                /* 1D Curve & LUT - SHAPER TF & LUT */
                colorop = colorop->next;
                if (!colorop) {
                        drm_dbg(dev, "no Shaper TF colorop found\n");
                        return -EINVAL;
                }

                ret = __set_dm_plane_colorop_shaper(plane_state, dc_plane_state, colorop);
                if (ret)
                        return ret;

                /* Shaper LUT colorop is already handled, just skip here */
                colorop = colorop->next;
                if (!colorop)
                        return -EINVAL;

                /* 3D LUT */
                colorop = colorop->next;
                if (!colorop) {
                        drm_dbg(dev, "no 3D LUT colorop found\n");
                        return -EINVAL;
                }

                ret = __set_dm_plane_colorop_3dlut(plane_state, dc_plane_state, colorop);
                if (ret)
                        return ret;
        }

        /* 1D Curve & LUT - BLND TF & LUT */
        colorop = colorop->next;
        if (!colorop) {
                drm_dbg(dev, "no Blend TF colorop found\n");
                return -EINVAL;
        }

        ret = __set_dm_plane_colorop_blend(plane_state, dc_plane_state, colorop);
        if (ret)
                return ret;

        /* BLND LUT colorop is already handled, just skip here */
        colorop = colorop->next;
        if (!colorop)
                return -EINVAL;

        return 0;
}

/**
 * amdgpu_dm_update_plane_color_mgmt: Maps DRM color management to DC plane.
 * @crtc: amdgpu_dm crtc state
 * @plane_state: DRM plane state
 * @dc_plane_state: target DC surface
 *
 * Update the underlying dc_stream_state's input transfer function (ITF) in
 * preparation for hardware commit. The transfer function used depends on
 * the preparation done on the stream for color management.
 *
 * Returns:
 * 0 on success. -ENOMEM if mem allocation fails.
 */
int amdgpu_dm_update_plane_color_mgmt(struct dm_crtc_state *crtc,
                                      struct drm_plane_state *plane_state,
                                      struct dc_plane_state *dc_plane_state)
{
        struct amdgpu_device *adev = drm_to_adev(crtc->base.state->dev);
        struct dm_plane_state *dm_plane_state = to_dm_plane_state(plane_state);
        struct drm_color_ctm_3x4 *ctm = NULL;
        struct dc_color_caps *color_caps = NULL;
        bool has_crtc_cm_degamma;
        int ret;

        ret = amdgpu_dm_verify_lut3d_size(adev, plane_state);
        if (ret) {
                drm_dbg_driver(&adev->ddev, "amdgpu_dm_verify_lut3d_size() failed\n");
                return ret;
        }

        if (dc_plane_state->ctx && dc_plane_state->ctx->dc)
                color_caps = &dc_plane_state->ctx->dc->caps.color;

        /* Initially, we can just bypass the DGM block. */
        dc_plane_state->in_transfer_func.type = TF_TYPE_BYPASS;
        dc_plane_state->in_transfer_func.tf = TRANSFER_FUNCTION_LINEAR;

        /* After, we start to update values according to color props */
        has_crtc_cm_degamma = (crtc->cm_has_degamma || crtc->cm_is_degamma_srgb);

        ret = __set_dm_plane_degamma(plane_state, dc_plane_state, color_caps);
        if (ret == -ENOMEM)
                return ret;

        /* We only have one degamma block available (pre-blending) for the
         * whole color correction pipeline, so that we can't actually perform
         * plane and CRTC degamma at the same time. Explicitly reject atomic
         * updates when userspace sets both plane and CRTC degamma properties.
         */
        if (has_crtc_cm_degamma && ret != -EINVAL) {
                drm_dbg_kms(crtc->base.crtc->dev,
                            "doesn't support plane and CRTC degamma at the same time\n");
                return -EINVAL;
        }

        /* If we are here, it means we don't have plane degamma settings, check
         * if we have CRTC degamma waiting for mapping to pre-blending degamma
         * block
         */
        if (has_crtc_cm_degamma) {
                /*
                 * AMD HW doesn't have post-blending degamma caps. When DRM
                 * CRTC atomic degamma is set, we maps it to DPP degamma block
                 * (pre-blending) or, on legacy gamma, we use DPP degamma to
                 * linearize (implicit degamma) from sRGB/BT709 according to
                 * the input space.
                 */
                ret = map_crtc_degamma_to_dc_plane(crtc, dc_plane_state, color_caps);
                if (ret)
                        return ret;
        }

        /* Setup CRTC CTM. */
        if (dm_plane_state->ctm) {
                ctm = (struct drm_color_ctm_3x4 *)dm_plane_state->ctm->data;
                /*
                 * DCN2 and older don't support both pre-blending and
                 * post-blending gamut remap. For this HW family, if we have
                 * the plane and CRTC CTMs simultaneously, CRTC CTM takes
                 * priority, and we discard plane CTM, as implemented in
                 * dcn10_program_gamut_remap(). However, DCN3+ has DPP
                 * (pre-blending) and MPC (post-blending) `gamut remap` blocks;
                 * therefore, we can program plane and CRTC CTMs together by
                 * mapping CRTC CTM to MPC and keeping plane CTM setup at DPP,
                 * as it's done by dcn30_program_gamut_remap().
                 */
                __drm_ctm_3x4_to_dc_matrix(ctm, dc_plane_state->gamut_remap_matrix.matrix);

                dc_plane_state->gamut_remap_matrix.enable_remap = true;
                dc_plane_state->input_csc_color_matrix.enable_adjustment = false;
        } else {
                /* Bypass CTM. */
                dc_plane_state->gamut_remap_matrix.enable_remap = false;
                dc_plane_state->input_csc_color_matrix.enable_adjustment = false;
        }

        if (!amdgpu_dm_plane_set_colorop_properties(plane_state, dc_plane_state))
                return 0;

        return amdgpu_dm_plane_set_color_properties(plane_state, dc_plane_state);
}