root/drivers/gpu/drm/i915/gt/intel_sseu.h
/* SPDX-License-Identifier: MIT */
/*
 * Copyright © 2019 Intel Corporation
 */

#ifndef __INTEL_SSEU_H__
#define __INTEL_SSEU_H__

#include <linux/types.h>
#include <linux/kernel.h>

#include "i915_gem.h"

struct drm_i915_private;
struct intel_gt;
struct drm_printer;

/*
 * Maximum number of slices on older platforms.  Slices no longer exist
 * starting on Xe_HP ("gslices," "cslices," etc. are a different concept and
 * are not expressed through fusing).
 */
#define GEN_MAX_HSW_SLICES              3

/*
 * Maximum number of subslices that can exist within a HSW-style slice.  This
 * is only relevant to pre-Xe_HP platforms (Xe_HP and beyond use the
 * I915_MAX_SS_FUSE_BITS value below).
 */
#define GEN_MAX_SS_PER_HSW_SLICE        8

/*
 * Maximum number of 32-bit registers used by hardware to express the
 * enabled/disabled subslices.
 */
#define I915_MAX_SS_FUSE_REGS   2
#define I915_MAX_SS_FUSE_BITS   (I915_MAX_SS_FUSE_REGS * 32)

/* Maximum number of EUs that can exist within a subslice or DSS. */
#define GEN_MAX_EUS_PER_SS              16

#define SSEU_MAX(a, b)                  ((a) > (b) ? (a) : (b))

/* The maximum number of bits needed to express each subslice/DSS independently */
#define GEN_SS_MASK_SIZE                SSEU_MAX(I915_MAX_SS_FUSE_BITS, \
                                                 GEN_MAX_HSW_SLICES * GEN_MAX_SS_PER_HSW_SLICE)

#define GEN_SSEU_STRIDE(max_entries)    DIV_ROUND_UP(max_entries, BITS_PER_BYTE)
#define GEN_MAX_SUBSLICE_STRIDE         GEN_SSEU_STRIDE(GEN_SS_MASK_SIZE)
#define GEN_MAX_EU_STRIDE               GEN_SSEU_STRIDE(GEN_MAX_EUS_PER_SS)

#define GEN_DSS_PER_GSLICE      4
#define GEN_DSS_PER_CSLICE      8
#define GEN_DSS_PER_MSLICE      8

#define GEN_MAX_GSLICES         (I915_MAX_SS_FUSE_BITS / GEN_DSS_PER_GSLICE)
#define GEN_MAX_CSLICES         (I915_MAX_SS_FUSE_BITS / GEN_DSS_PER_CSLICE)

typedef union {
        u8 hsw[GEN_MAX_HSW_SLICES];

        /* Bitmap compatible with linux/bitmap.h; may exceed size of u64 */
        unsigned long xehp[BITS_TO_LONGS(I915_MAX_SS_FUSE_BITS)];
} intel_sseu_ss_mask_t;

#define XEHP_BITMAP_BITS(mask)  ((int)BITS_PER_TYPE(typeof(mask.xehp)))

struct sseu_dev_info {
        u8 slice_mask;
        intel_sseu_ss_mask_t subslice_mask;
        intel_sseu_ss_mask_t geometry_subslice_mask;
        intel_sseu_ss_mask_t compute_subslice_mask;
        union {
                u16 hsw[GEN_MAX_HSW_SLICES][GEN_MAX_SS_PER_HSW_SLICE];
                u16 xehp[I915_MAX_SS_FUSE_BITS];
        } eu_mask;

        u16 eu_total;
        u8 eu_per_subslice;
        u8 min_eu_in_pool;
        /* For each slice, which subslice(s) has(have) 7 EUs (bitfield)? */
        u8 subslice_7eu[3];
        u8 has_slice_pg:1;
        u8 has_subslice_pg:1;
        u8 has_eu_pg:1;
        /*
         * For Xe_HP and beyond, the hardware no longer has traditional slices
         * so we just report the entire DSS pool under a fake "slice 0."
         */
        u8 has_xehp_dss:1;

        /* Topology fields */
        u8 max_slices;
        u8 max_subslices;
        u8 max_eus_per_subslice;
};

/*
 * Powergating configuration for a particular (context,engine).
 */
struct intel_sseu {
        u8 slice_mask;
        u8 subslice_mask;
        u8 min_eus_per_subslice;
        u8 max_eus_per_subslice;
};

static inline struct intel_sseu
intel_sseu_from_device_info(const struct sseu_dev_info *sseu)
{
        struct intel_sseu value = {
                .slice_mask = sseu->slice_mask,
                .subslice_mask = sseu->subslice_mask.hsw[0],
                .min_eus_per_subslice = sseu->max_eus_per_subslice,
                .max_eus_per_subslice = sseu->max_eus_per_subslice,
        };

        return value;
}

static inline bool
intel_sseu_has_subslice(const struct sseu_dev_info *sseu, int slice,
                        int subslice)
{
        if (slice >= sseu->max_slices ||
            subslice >= sseu->max_subslices)
                return false;

        if (sseu->has_xehp_dss)
                return test_bit(subslice, sseu->subslice_mask.xehp);
        else
                return sseu->subslice_mask.hsw[slice] & BIT(subslice);
}

/*
 * Used to obtain the index of the first DSS.  Can start searching from the
 * beginning of a specific dss group (e.g., gslice, cslice, etc.) if
 * groupsize and groupnum are non-zero.
 */
static inline unsigned int
intel_sseu_find_first_xehp_dss(const struct sseu_dev_info *sseu, int groupsize,
                               int groupnum)
{
        return find_next_bit(sseu->subslice_mask.xehp,
                             XEHP_BITMAP_BITS(sseu->subslice_mask),
                             groupnum * groupsize);
}

void intel_sseu_set_info(struct sseu_dev_info *sseu, u8 max_slices,
                         u8 max_subslices, u8 max_eus_per_subslice);

unsigned int
intel_sseu_subslice_total(const struct sseu_dev_info *sseu);

unsigned int
intel_sseu_get_hsw_subslices(const struct sseu_dev_info *sseu, u8 slice);

intel_sseu_ss_mask_t
intel_sseu_get_compute_subslices(const struct sseu_dev_info *sseu);

void intel_sseu_info_init(struct intel_gt *gt);

u32 intel_sseu_make_rpcs(struct intel_gt *gt,
                         const struct intel_sseu *req_sseu);

void intel_sseu_dump(const struct sseu_dev_info *sseu, struct drm_printer *p);
void intel_sseu_print_topology(struct drm_i915_private *i915,
                               const struct sseu_dev_info *sseu,
                               struct drm_printer *p);

u16 intel_slicemask_from_xehp_dssmask(intel_sseu_ss_mask_t dss_mask, int dss_per_slice);

int intel_sseu_copy_eumask_to_user(void __user *to,
                                   const struct sseu_dev_info *sseu);
int intel_sseu_copy_ssmask_to_user(void __user *to,
                                   const struct sseu_dev_info *sseu);

void intel_sseu_print_ss_info(const char *type,
                              const struct sseu_dev_info *sseu,
                              struct seq_file *m);

#endif /* __INTEL_SSEU_H__ */