root/drivers/net/ethernet/mellanox/mlxsw/spectrum_buffers.c
// SPDX-License-Identifier: BSD-3-Clause OR GPL-2.0
/* Copyright (c) 2015-2018 Mellanox Technologies. All rights reserved */

#include <linux/kernel.h>
#include <linux/types.h>
#include <linux/dcbnl.h>
#include <linux/if_ether.h>
#include <linux/list.h>
#include <linux/netlink.h>

#include "spectrum.h"
#include "core.h"
#include "port.h"
#include "reg.h"

struct mlxsw_sp_sb_pr {
        enum mlxsw_reg_sbpr_mode mode;
        u32 size;
        u8 freeze_mode:1,
           freeze_size:1;
};

struct mlxsw_cp_sb_occ {
        u32 cur;
        u32 max;
};

struct mlxsw_sp_sb_cm {
        u32 min_buff;
        u32 max_buff;
        u16 pool_index;
        struct mlxsw_cp_sb_occ occ;
        u8 freeze_pool:1,
           freeze_thresh:1;
};

#define MLXSW_SP_SB_INFI -1U
#define MLXSW_SP_SB_REST -2U

struct mlxsw_sp_sb_pm {
        u32 min_buff;
        u32 max_buff;
        struct mlxsw_cp_sb_occ occ;
};

struct mlxsw_sp_sb_mm {
        u32 min_buff;
        u32 max_buff;
        u16 pool_index;
};

struct mlxsw_sp_sb_pool_des {
        enum mlxsw_reg_sbxx_dir dir;
        u8 pool;
};

#define MLXSW_SP_SB_POOL_ING            0
#define MLXSW_SP_SB_POOL_EGR            4
#define MLXSW_SP_SB_POOL_EGR_MC         8
#define MLXSW_SP_SB_POOL_ING_CPU        9
#define MLXSW_SP_SB_POOL_EGR_CPU        10

static const struct mlxsw_sp_sb_pool_des mlxsw_sp1_sb_pool_dess[] = {
        {MLXSW_REG_SBXX_DIR_INGRESS, 0},
        {MLXSW_REG_SBXX_DIR_INGRESS, 1},
        {MLXSW_REG_SBXX_DIR_INGRESS, 2},
        {MLXSW_REG_SBXX_DIR_INGRESS, 3},
        {MLXSW_REG_SBXX_DIR_EGRESS, 0},
        {MLXSW_REG_SBXX_DIR_EGRESS, 1},
        {MLXSW_REG_SBXX_DIR_EGRESS, 2},
        {MLXSW_REG_SBXX_DIR_EGRESS, 3},
        {MLXSW_REG_SBXX_DIR_EGRESS, 15},
        {MLXSW_REG_SBXX_DIR_INGRESS, 4},
        {MLXSW_REG_SBXX_DIR_EGRESS, 4},
};

static const struct mlxsw_sp_sb_pool_des mlxsw_sp2_sb_pool_dess[] = {
        {MLXSW_REG_SBXX_DIR_INGRESS, 0},
        {MLXSW_REG_SBXX_DIR_INGRESS, 1},
        {MLXSW_REG_SBXX_DIR_INGRESS, 2},
        {MLXSW_REG_SBXX_DIR_INGRESS, 3},
        {MLXSW_REG_SBXX_DIR_EGRESS, 0},
        {MLXSW_REG_SBXX_DIR_EGRESS, 1},
        {MLXSW_REG_SBXX_DIR_EGRESS, 2},
        {MLXSW_REG_SBXX_DIR_EGRESS, 3},
        {MLXSW_REG_SBXX_DIR_EGRESS, 15},
        {MLXSW_REG_SBXX_DIR_INGRESS, 4},
        {MLXSW_REG_SBXX_DIR_EGRESS, 4},
};

#define MLXSW_SP_SB_ING_TC_COUNT 8
#define MLXSW_SP_SB_EG_TC_COUNT 16

struct mlxsw_sp_sb_port {
        struct mlxsw_sp_sb_cm ing_cms[MLXSW_SP_SB_ING_TC_COUNT];
        struct mlxsw_sp_sb_cm eg_cms[MLXSW_SP_SB_EG_TC_COUNT];
        struct mlxsw_sp_sb_pm *pms;
};

struct mlxsw_sp_sb {
        struct mlxsw_sp_sb_pr *prs;
        struct mlxsw_sp_sb_port *ports;
        u32 cell_size;
        u32 max_headroom_cells;
        u64 sb_size;
};

struct mlxsw_sp_sb_vals {
        unsigned int pool_count;
        const struct mlxsw_sp_sb_pool_des *pool_dess;
        const struct mlxsw_sp_sb_pm *pms;
        const struct mlxsw_sp_sb_pm *pms_cpu;
        const struct mlxsw_sp_sb_pr *prs;
        const struct mlxsw_sp_sb_mm *mms;
        const struct mlxsw_sp_sb_cm *cms_ingress;
        const struct mlxsw_sp_sb_cm *cms_egress;
        const struct mlxsw_sp_sb_cm *cms_cpu;
        unsigned int mms_count;
        unsigned int cms_ingress_count;
        unsigned int cms_egress_count;
        unsigned int cms_cpu_count;
};

struct mlxsw_sp_sb_ops {
        u32 (*int_buf_size_get)(int mtu, u32 speed);
};

u32 mlxsw_sp_cells_bytes(const struct mlxsw_sp *mlxsw_sp, u32 cells)
{
        return mlxsw_sp->sb->cell_size * cells;
}

u32 mlxsw_sp_bytes_cells(const struct mlxsw_sp *mlxsw_sp, u32 bytes)
{
        return DIV_ROUND_UP(bytes, mlxsw_sp->sb->cell_size);
}

static u32 mlxsw_sp_port_headroom_8x_adjust(const struct mlxsw_sp_port *mlxsw_sp_port,
                                            u32 size_cells)
{
        /* Ports with eight lanes use two headroom buffers between which the
         * configured headroom size is split. Therefore, multiply the calculated
         * headroom size by two.
         */
        return mlxsw_sp_port->mapping.width == 8 ? 2 * size_cells : size_cells;
}

static struct mlxsw_sp_sb_pr *mlxsw_sp_sb_pr_get(struct mlxsw_sp *mlxsw_sp,
                                                 u16 pool_index)
{
        return &mlxsw_sp->sb->prs[pool_index];
}

static bool mlxsw_sp_sb_cm_exists(u8 pg_buff, enum mlxsw_reg_sbxx_dir dir)
{
        if (dir == MLXSW_REG_SBXX_DIR_INGRESS)
                return pg_buff < MLXSW_SP_SB_ING_TC_COUNT;
        else
                return pg_buff < MLXSW_SP_SB_EG_TC_COUNT;
}

static struct mlxsw_sp_sb_cm *mlxsw_sp_sb_cm_get(struct mlxsw_sp *mlxsw_sp,
                                                 u16 local_port, u8 pg_buff,
                                                 enum mlxsw_reg_sbxx_dir dir)
{
        struct mlxsw_sp_sb_port *sb_port = &mlxsw_sp->sb->ports[local_port];

        WARN_ON(!mlxsw_sp_sb_cm_exists(pg_buff, dir));
        if (dir == MLXSW_REG_SBXX_DIR_INGRESS)
                return &sb_port->ing_cms[pg_buff];
        else
                return &sb_port->eg_cms[pg_buff];
}

static struct mlxsw_sp_sb_pm *mlxsw_sp_sb_pm_get(struct mlxsw_sp *mlxsw_sp,
                                                 u16 local_port, u16 pool_index)
{
        return &mlxsw_sp->sb->ports[local_port].pms[pool_index];
}

static int mlxsw_sp_sb_pr_write(struct mlxsw_sp *mlxsw_sp, u16 pool_index,
                                enum mlxsw_reg_sbpr_mode mode,
                                u32 size, bool infi_size)
{
        const struct mlxsw_sp_sb_pool_des *des =
                &mlxsw_sp->sb_vals->pool_dess[pool_index];
        char sbpr_pl[MLXSW_REG_SBPR_LEN];
        struct mlxsw_sp_sb_pr *pr;
        int err;

        mlxsw_reg_sbpr_pack(sbpr_pl, des->pool, des->dir, mode,
                            size, infi_size);
        err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(sbpr), sbpr_pl);
        if (err)
                return err;

        if (infi_size)
                size = mlxsw_sp_bytes_cells(mlxsw_sp, mlxsw_sp->sb->sb_size);
        pr = mlxsw_sp_sb_pr_get(mlxsw_sp, pool_index);
        pr->mode = mode;
        pr->size = size;
        return 0;
}

static int mlxsw_sp_sb_pr_desc_write(struct mlxsw_sp *mlxsw_sp,
                                     enum mlxsw_reg_sbxx_dir dir,
                                     enum mlxsw_reg_sbpr_mode mode,
                                     u32 size, bool infi_size)
{
        char sbpr_pl[MLXSW_REG_SBPR_LEN];

        /* The FW default descriptor buffer configuration uses only pool 14 for
         * descriptors.
         */
        mlxsw_reg_sbpr_pack(sbpr_pl, 14, dir, mode, size, infi_size);
        mlxsw_reg_sbpr_desc_set(sbpr_pl, true);
        return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(sbpr), sbpr_pl);
}

static int mlxsw_sp_sb_cm_write(struct mlxsw_sp *mlxsw_sp, u16 local_port,
                                u8 pg_buff, u32 min_buff, u32 max_buff,
                                bool infi_max, u16 pool_index)
{
        const struct mlxsw_sp_sb_pool_des *des =
                &mlxsw_sp->sb_vals->pool_dess[pool_index];
        char sbcm_pl[MLXSW_REG_SBCM_LEN];
        struct mlxsw_sp_sb_cm *cm;
        int err;

        mlxsw_reg_sbcm_pack(sbcm_pl, local_port, pg_buff, des->dir,
                            min_buff, max_buff, infi_max, des->pool);
        err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(sbcm), sbcm_pl);
        if (err)
                return err;

        if (mlxsw_sp_sb_cm_exists(pg_buff, des->dir)) {
                if (infi_max)
                        max_buff = mlxsw_sp_bytes_cells(mlxsw_sp,
                                                        mlxsw_sp->sb->sb_size);

                cm = mlxsw_sp_sb_cm_get(mlxsw_sp, local_port, pg_buff,
                                        des->dir);
                cm->min_buff = min_buff;
                cm->max_buff = max_buff;
                cm->pool_index = pool_index;
        }
        return 0;
}

static int mlxsw_sp_sb_pm_write(struct mlxsw_sp *mlxsw_sp, u16 local_port,
                                u16 pool_index, u32 min_buff, u32 max_buff)
{
        const struct mlxsw_sp_sb_pool_des *des =
                &mlxsw_sp->sb_vals->pool_dess[pool_index];
        char sbpm_pl[MLXSW_REG_SBPM_LEN];
        struct mlxsw_sp_sb_pm *pm;
        int err;

        mlxsw_reg_sbpm_pack(sbpm_pl, local_port, des->pool, des->dir, false,
                            min_buff, max_buff);
        err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(sbpm), sbpm_pl);
        if (err)
                return err;

        pm = mlxsw_sp_sb_pm_get(mlxsw_sp, local_port, pool_index);
        pm->min_buff = min_buff;
        pm->max_buff = max_buff;
        return 0;
}

static int mlxsw_sp_sb_pm_occ_clear(struct mlxsw_sp *mlxsw_sp, u16 local_port,
                                    u16 pool_index, struct list_head *bulk_list)
{
        const struct mlxsw_sp_sb_pool_des *des =
                &mlxsw_sp->sb_vals->pool_dess[pool_index];
        char sbpm_pl[MLXSW_REG_SBPM_LEN];

        if (local_port == MLXSW_PORT_CPU_PORT &&
            des->dir == MLXSW_REG_SBXX_DIR_INGRESS)
                return 0;

        mlxsw_reg_sbpm_pack(sbpm_pl, local_port, des->pool, des->dir,
                            true, 0, 0);
        return mlxsw_reg_trans_query(mlxsw_sp->core, MLXSW_REG(sbpm), sbpm_pl,
                                     bulk_list, NULL, 0);
}

static void mlxsw_sp_sb_pm_occ_query_cb(struct mlxsw_core *mlxsw_core,
                                        char *sbpm_pl, size_t sbpm_pl_len,
                                        unsigned long cb_priv)
{
        struct mlxsw_sp_sb_pm *pm = (struct mlxsw_sp_sb_pm *) cb_priv;

        mlxsw_reg_sbpm_unpack(sbpm_pl, &pm->occ.cur, &pm->occ.max);
}

static int mlxsw_sp_sb_pm_occ_query(struct mlxsw_sp *mlxsw_sp, u16 local_port,
                                    u16 pool_index, struct list_head *bulk_list)
{
        const struct mlxsw_sp_sb_pool_des *des =
                &mlxsw_sp->sb_vals->pool_dess[pool_index];
        char sbpm_pl[MLXSW_REG_SBPM_LEN];
        struct mlxsw_sp_sb_pm *pm;

        if (local_port == MLXSW_PORT_CPU_PORT &&
            des->dir == MLXSW_REG_SBXX_DIR_INGRESS)
                return 0;

        pm = mlxsw_sp_sb_pm_get(mlxsw_sp, local_port, pool_index);
        mlxsw_reg_sbpm_pack(sbpm_pl, local_port, des->pool, des->dir,
                            false, 0, 0);
        return mlxsw_reg_trans_query(mlxsw_sp->core, MLXSW_REG(sbpm), sbpm_pl,
                                     bulk_list,
                                     mlxsw_sp_sb_pm_occ_query_cb,
                                     (unsigned long) pm);
}

void mlxsw_sp_hdroom_prios_reset_buf_idx(struct mlxsw_sp_hdroom *hdroom)
{
        int prio;

        for (prio = 0; prio < IEEE_8021QAZ_MAX_TCS; prio++) {
                switch (hdroom->mode) {
                case MLXSW_SP_HDROOM_MODE_DCB:
                        hdroom->prios.prio[prio].buf_idx = hdroom->prios.prio[prio].ets_buf_idx;
                        break;
                case MLXSW_SP_HDROOM_MODE_TC:
                        hdroom->prios.prio[prio].buf_idx = hdroom->prios.prio[prio].set_buf_idx;
                        break;
                }
        }
}

void mlxsw_sp_hdroom_bufs_reset_lossiness(struct mlxsw_sp_hdroom *hdroom)
{
        int prio;
        int i;

        for (i = 0; i < DCBX_MAX_BUFFERS; i++)
                hdroom->bufs.buf[i].lossy = true;

        for (prio = 0; prio < IEEE_8021Q_MAX_PRIORITIES; prio++) {
                if (!hdroom->prios.prio[prio].lossy)
                        hdroom->bufs.buf[hdroom->prios.prio[prio].buf_idx].lossy = false;
        }
}

static u16 mlxsw_sp_hdroom_buf_threshold_get(const struct mlxsw_sp *mlxsw_sp, int mtu)
{
        return 2 * mlxsw_sp_bytes_cells(mlxsw_sp, mtu);
}

static void mlxsw_sp_hdroom_buf_pack(char *pbmc_pl, int index, u16 size, u16 thres, bool lossy)
{
        if (lossy)
                mlxsw_reg_pbmc_lossy_buffer_pack(pbmc_pl, index, size);
        else
                mlxsw_reg_pbmc_lossless_buffer_pack(pbmc_pl, index, size,
                                                    thres);
}

static u16 mlxsw_sp_hdroom_buf_delay_get(const struct mlxsw_sp *mlxsw_sp,
                                         const struct mlxsw_sp_hdroom *hdroom)
{
        u16 delay_cells;

        delay_cells = mlxsw_sp_bytes_cells(mlxsw_sp, hdroom->delay_bytes);

        /* In the worst case scenario the delay will be made up of packets that
         * are all of size CELL_SIZE + 1, which means each packet will require
         * almost twice its true size when buffered in the switch. We therefore
         * multiply this value by the "cell factor", which is close to 2.
         *
         * Another MTU is added in case the transmitting host already started
         * transmitting a maximum length frame when the PFC packet was received.
         */
        return 2 * delay_cells + mlxsw_sp_bytes_cells(mlxsw_sp, hdroom->mtu);
}

static u32 mlxsw_sp_hdroom_int_buf_size_get(struct mlxsw_sp *mlxsw_sp, int mtu, u32 speed)
{
        u32 buffsize = mlxsw_sp->sb_ops->int_buf_size_get(mtu, speed);

        return mlxsw_sp_bytes_cells(mlxsw_sp, buffsize) + 1;
}

static bool mlxsw_sp_hdroom_buf_is_used(const struct mlxsw_sp_hdroom *hdroom, int buf)
{
        int prio;

        for (prio = 0; prio < IEEE_8021QAZ_MAX_TCS; prio++) {
                if (hdroom->prios.prio[prio].buf_idx == buf)
                        return true;
        }
        return false;
}

void mlxsw_sp_hdroom_bufs_reset_sizes(struct mlxsw_sp_port *mlxsw_sp_port,
                                      struct mlxsw_sp_hdroom *hdroom)
{
        struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
        unsigned int max_mtu = mlxsw_sp_port->dev->max_mtu;
        u16 reserve_cells;
        int i;

        max_mtu += MLXSW_PORT_ETH_FRAME_HDR;
        /* Internal buffer. */
        reserve_cells = mlxsw_sp_hdroom_int_buf_size_get(mlxsw_sp, max_mtu,
                                                         mlxsw_sp_port->max_speed);
        reserve_cells = mlxsw_sp_port_headroom_8x_adjust(mlxsw_sp_port, reserve_cells);
        hdroom->int_buf.reserve_cells = reserve_cells;

        if (hdroom->int_buf.enable)
                hdroom->int_buf.size_cells = reserve_cells;
        else
                hdroom->int_buf.size_cells = 0;

        /* PG buffers. */
        for (i = 0; i < DCBX_MAX_BUFFERS; i++) {
                struct mlxsw_sp_hdroom_buf *buf = &hdroom->bufs.buf[i];
                u16 thres_cells;
                u16 delay_cells;

                if (!mlxsw_sp_hdroom_buf_is_used(hdroom, i)) {
                        thres_cells = 0;
                        delay_cells = 0;
                } else if (buf->lossy) {
                        thres_cells = mlxsw_sp_hdroom_buf_threshold_get(mlxsw_sp, hdroom->mtu);
                        delay_cells = 0;
                } else {
                        thres_cells = mlxsw_sp_hdroom_buf_threshold_get(mlxsw_sp, hdroom->mtu);
                        delay_cells = mlxsw_sp_hdroom_buf_delay_get(mlxsw_sp, hdroom);
                }

                thres_cells = mlxsw_sp_port_headroom_8x_adjust(mlxsw_sp_port, thres_cells);
                delay_cells = mlxsw_sp_port_headroom_8x_adjust(mlxsw_sp_port, delay_cells);

                buf->thres_cells = thres_cells;
                if (hdroom->mode == MLXSW_SP_HDROOM_MODE_DCB) {
                        buf->size_cells = thres_cells + delay_cells;
                } else {
                        /* Do not allow going below the minimum size, even if
                         * the user requested it.
                         */
                        buf->size_cells = max(buf->set_size_cells, buf->thres_cells);
                }
        }
}

#define MLXSW_SP_PB_UNUSED 8

static int mlxsw_sp_hdroom_configure_buffers(struct mlxsw_sp_port *mlxsw_sp_port,
                                             const struct mlxsw_sp_hdroom *hdroom, bool force)
{
        struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
        char pbmc_pl[MLXSW_REG_PBMC_LEN];
        bool dirty;
        int err;
        int i;

        dirty = memcmp(&mlxsw_sp_port->hdroom->bufs, &hdroom->bufs, sizeof(hdroom->bufs));
        if (!dirty && !force)
                return 0;

        mlxsw_reg_pbmc_pack(pbmc_pl, mlxsw_sp_port->local_port, 0xffff, 0xffff / 2);
        for (i = 0; i < MLXSW_SP_PB_COUNT; i++) {
                const struct mlxsw_sp_hdroom_buf *buf = &hdroom->bufs.buf[i];

                if (i == MLXSW_SP_PB_UNUSED)
                        continue;

                mlxsw_sp_hdroom_buf_pack(pbmc_pl, i, buf->size_cells, buf->thres_cells, buf->lossy);
        }

        mlxsw_reg_pbmc_lossy_buffer_pack(pbmc_pl, MLXSW_REG_PBMC_PORT_SHARED_BUF_IDX, 0);
        err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(pbmc), pbmc_pl);
        if (err)
                return err;

        mlxsw_sp_port->hdroom->bufs = hdroom->bufs;
        return 0;
}

static int mlxsw_sp_hdroom_configure_priomap(struct mlxsw_sp_port *mlxsw_sp_port,
                                             const struct mlxsw_sp_hdroom *hdroom, bool force)
{
        char pptb_pl[MLXSW_REG_PPTB_LEN];
        bool dirty;
        int prio;
        int err;

        dirty = memcmp(&mlxsw_sp_port->hdroom->prios, &hdroom->prios, sizeof(hdroom->prios));
        if (!dirty && !force)
                return 0;

        mlxsw_reg_pptb_pack(pptb_pl, mlxsw_sp_port->local_port);
        for (prio = 0; prio < IEEE_8021QAZ_MAX_TCS; prio++)
                mlxsw_reg_pptb_prio_to_buff_pack(pptb_pl, prio, hdroom->prios.prio[prio].buf_idx);

        err = mlxsw_reg_write(mlxsw_sp_port->mlxsw_sp->core, MLXSW_REG(pptb), pptb_pl);
        if (err)
                return err;

        mlxsw_sp_port->hdroom->prios = hdroom->prios;
        return 0;
}

static int mlxsw_sp_hdroom_configure_int_buf(struct mlxsw_sp_port *mlxsw_sp_port,
                                             const struct mlxsw_sp_hdroom *hdroom, bool force)
{
        char sbib_pl[MLXSW_REG_SBIB_LEN];
        bool dirty;
        int err;

        dirty = memcmp(&mlxsw_sp_port->hdroom->int_buf, &hdroom->int_buf, sizeof(hdroom->int_buf));
        if (!dirty && !force)
                return 0;

        mlxsw_reg_sbib_pack(sbib_pl, mlxsw_sp_port->local_port, hdroom->int_buf.size_cells);
        err = mlxsw_reg_write(mlxsw_sp_port->mlxsw_sp->core, MLXSW_REG(sbib), sbib_pl);
        if (err)
                return err;

        mlxsw_sp_port->hdroom->int_buf = hdroom->int_buf;
        return 0;
}

static bool mlxsw_sp_hdroom_bufs_fit(struct mlxsw_sp *mlxsw_sp,
                                     const struct mlxsw_sp_hdroom *hdroom)
{
        u32 taken_headroom_cells = 0;
        int i;

        for (i = 0; i < MLXSW_SP_PB_COUNT; i++)
                taken_headroom_cells += hdroom->bufs.buf[i].size_cells;

        taken_headroom_cells += hdroom->int_buf.reserve_cells;
        return taken_headroom_cells <= mlxsw_sp->sb->max_headroom_cells;
}

static int __mlxsw_sp_hdroom_configure(struct mlxsw_sp_port *mlxsw_sp_port,
                                       const struct mlxsw_sp_hdroom *hdroom, bool force)
{
        struct mlxsw_sp_hdroom orig_hdroom;
        struct mlxsw_sp_hdroom tmp_hdroom;
        int err;
        int i;

        /* Port buffers need to be configured in three steps. First, all buffers
         * with non-zero size are configured. Then, prio-to-buffer map is
         * updated, allowing traffic to flow to the now non-zero buffers.
         * Finally, zero-sized buffers are configured, because now no traffic
         * should be directed to them anymore. This way, in a non-congested
         * system, no packet drops are introduced by the reconfiguration.
         */

        orig_hdroom = *mlxsw_sp_port->hdroom;
        tmp_hdroom = orig_hdroom;
        for (i = 0; i < MLXSW_SP_PB_COUNT; i++) {
                if (hdroom->bufs.buf[i].size_cells)
                        tmp_hdroom.bufs.buf[i] = hdroom->bufs.buf[i];
        }

        if (!mlxsw_sp_hdroom_bufs_fit(mlxsw_sp_port->mlxsw_sp, &tmp_hdroom) ||
            !mlxsw_sp_hdroom_bufs_fit(mlxsw_sp_port->mlxsw_sp, hdroom))
                return -ENOBUFS;

        err = mlxsw_sp_hdroom_configure_buffers(mlxsw_sp_port, &tmp_hdroom, force);
        if (err)
                return err;

        err = mlxsw_sp_hdroom_configure_priomap(mlxsw_sp_port, hdroom, force);
        if (err)
                goto err_configure_priomap;

        err = mlxsw_sp_hdroom_configure_buffers(mlxsw_sp_port, hdroom, false);
        if (err)
                goto err_configure_buffers;

        err = mlxsw_sp_hdroom_configure_int_buf(mlxsw_sp_port, hdroom, false);
        if (err)
                goto err_configure_int_buf;

        *mlxsw_sp_port->hdroom = *hdroom;
        return 0;

err_configure_int_buf:
        mlxsw_sp_hdroom_configure_buffers(mlxsw_sp_port, &tmp_hdroom, false);
err_configure_buffers:
        mlxsw_sp_hdroom_configure_priomap(mlxsw_sp_port, &tmp_hdroom, false);
err_configure_priomap:
        mlxsw_sp_hdroom_configure_buffers(mlxsw_sp_port, &orig_hdroom, false);
        return err;
}

int mlxsw_sp_hdroom_configure(struct mlxsw_sp_port *mlxsw_sp_port,
                              const struct mlxsw_sp_hdroom *hdroom)
{
        return __mlxsw_sp_hdroom_configure(mlxsw_sp_port, hdroom, false);
}

static int mlxsw_sp_port_headroom_init(struct mlxsw_sp_port *mlxsw_sp_port)
{
        struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
        struct mlxsw_sp_hdroom hdroom = {};
        u32 size9;
        int prio;

        hdroom.mtu = mlxsw_sp_port->dev->mtu;
        hdroom.mode = MLXSW_SP_HDROOM_MODE_DCB;
        for (prio = 0; prio < IEEE_8021QAZ_MAX_TCS; prio++)
                hdroom.prios.prio[prio].lossy = true;

        mlxsw_sp_hdroom_bufs_reset_lossiness(&hdroom);
        mlxsw_sp_hdroom_bufs_reset_sizes(mlxsw_sp_port, &hdroom);

        /* Buffer 9 is used for control traffic. */
        size9 = mlxsw_sp_port_headroom_8x_adjust(mlxsw_sp_port,
                                                 mlxsw_sp_port->dev->max_mtu +
                                                 MLXSW_PORT_ETH_FRAME_HDR);
        hdroom.bufs.buf[9].size_cells = mlxsw_sp_bytes_cells(mlxsw_sp, size9);

        return __mlxsw_sp_hdroom_configure(mlxsw_sp_port, &hdroom, true);
}

static int mlxsw_sp_sb_port_init(struct mlxsw_sp *mlxsw_sp,
                                 struct mlxsw_sp_sb_port *sb_port)
{
        struct mlxsw_sp_sb_pm *pms;

        pms = kzalloc_objs(*pms, mlxsw_sp->sb_vals->pool_count);
        if (!pms)
                return -ENOMEM;
        sb_port->pms = pms;
        return 0;
}

static void mlxsw_sp_sb_port_fini(struct mlxsw_sp_sb_port *sb_port)
{
        kfree(sb_port->pms);
}

static int mlxsw_sp_sb_ports_init(struct mlxsw_sp *mlxsw_sp)
{
        unsigned int max_ports = mlxsw_core_max_ports(mlxsw_sp->core);
        struct mlxsw_sp_sb_pr *prs;
        int i;
        int err;

        mlxsw_sp->sb->ports = kzalloc_objs(struct mlxsw_sp_sb_port, max_ports);
        if (!mlxsw_sp->sb->ports)
                return -ENOMEM;

        prs = kzalloc_objs(*prs, mlxsw_sp->sb_vals->pool_count);
        if (!prs) {
                err = -ENOMEM;
                goto err_alloc_prs;
        }
        mlxsw_sp->sb->prs = prs;

        for (i = 0; i < max_ports; i++) {
                err = mlxsw_sp_sb_port_init(mlxsw_sp, &mlxsw_sp->sb->ports[i]);
                if (err)
                        goto err_sb_port_init;
        }

        return 0;

err_sb_port_init:
        for (i--; i >= 0; i--)
                mlxsw_sp_sb_port_fini(&mlxsw_sp->sb->ports[i]);
        kfree(mlxsw_sp->sb->prs);
err_alloc_prs:
        kfree(mlxsw_sp->sb->ports);
        return err;
}

static void mlxsw_sp_sb_ports_fini(struct mlxsw_sp *mlxsw_sp)
{
        int max_ports = mlxsw_core_max_ports(mlxsw_sp->core);
        int i;

        for (i = max_ports - 1; i >= 0; i--)
                mlxsw_sp_sb_port_fini(&mlxsw_sp->sb->ports[i]);
        kfree(mlxsw_sp->sb->prs);
        kfree(mlxsw_sp->sb->ports);
}

#define MLXSW_SP_SB_PR(_mode, _size)    \
        {                               \
                .mode = _mode,          \
                .size = _size,          \
        }

#define MLXSW_SP_SB_PR_EXT(_mode, _size, _freeze_mode, _freeze_size)    \
        {                                                               \
                .mode = _mode,                                          \
                .size = _size,                                          \
                .freeze_mode = _freeze_mode,                            \
                .freeze_size = _freeze_size,                            \
        }

#define MLXSW_SP1_SB_PR_CPU_SIZE        (256 * 1000)

/* Order according to mlxsw_sp1_sb_pool_dess */
static const struct mlxsw_sp_sb_pr mlxsw_sp1_sb_prs[] = {
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_DYNAMIC, MLXSW_SP_SB_REST),
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_DYNAMIC, 0),
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_DYNAMIC, 0),
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_DYNAMIC, 0),
        MLXSW_SP_SB_PR_EXT(MLXSW_REG_SBPR_MODE_DYNAMIC, MLXSW_SP_SB_REST,
                           true, false),
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_DYNAMIC, 0),
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_DYNAMIC, 0),
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_DYNAMIC, 0),
        MLXSW_SP_SB_PR_EXT(MLXSW_REG_SBPR_MODE_STATIC, MLXSW_SP_SB_INFI,
                           true, true),
        MLXSW_SP_SB_PR_EXT(MLXSW_REG_SBPR_MODE_DYNAMIC,
                           MLXSW_SP1_SB_PR_CPU_SIZE, true, false),
        MLXSW_SP_SB_PR_EXT(MLXSW_REG_SBPR_MODE_DYNAMIC,
                           MLXSW_SP1_SB_PR_CPU_SIZE, true, false),
};

#define MLXSW_SP2_SB_PR_CPU_SIZE        (256 * 1000)

/* Order according to mlxsw_sp2_sb_pool_dess */
static const struct mlxsw_sp_sb_pr mlxsw_sp2_sb_prs[] = {
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_DYNAMIC, MLXSW_SP_SB_REST),
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_STATIC, 0),
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_STATIC, 0),
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_STATIC, 0),
        MLXSW_SP_SB_PR_EXT(MLXSW_REG_SBPR_MODE_DYNAMIC, MLXSW_SP_SB_REST,
                           true, false),
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_STATIC, 0),
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_STATIC, 0),
        MLXSW_SP_SB_PR(MLXSW_REG_SBPR_MODE_STATIC, 0),
        MLXSW_SP_SB_PR_EXT(MLXSW_REG_SBPR_MODE_STATIC, MLXSW_SP_SB_INFI,
                           true, true),
        MLXSW_SP_SB_PR_EXT(MLXSW_REG_SBPR_MODE_DYNAMIC,
                           MLXSW_SP2_SB_PR_CPU_SIZE, true, false),
        MLXSW_SP_SB_PR_EXT(MLXSW_REG_SBPR_MODE_DYNAMIC,
                           MLXSW_SP2_SB_PR_CPU_SIZE, true, false),
};

static int mlxsw_sp_sb_prs_init(struct mlxsw_sp *mlxsw_sp,
                                const struct mlxsw_sp_sb_pr *prs,
                                const struct mlxsw_sp_sb_pool_des *pool_dess,
                                size_t prs_len)
{
        /* Round down, unlike mlxsw_sp_bytes_cells(). */
        u32 sb_cells = div_u64(mlxsw_sp->sb->sb_size, mlxsw_sp->sb->cell_size);
        u32 rest_cells[2] = {sb_cells, sb_cells};
        int i;
        int err;

        /* Calculate how much space to give to the "REST" pools in either
         * direction.
         */
        for (i = 0; i < prs_len; i++) {
                enum mlxsw_reg_sbxx_dir dir = pool_dess[i].dir;
                u32 size = prs[i].size;
                u32 size_cells;

                if (size == MLXSW_SP_SB_INFI || size == MLXSW_SP_SB_REST)
                        continue;

                size_cells = mlxsw_sp_bytes_cells(mlxsw_sp, size);
                if (WARN_ON_ONCE(size_cells > rest_cells[dir]))
                        continue;

                rest_cells[dir] -= size_cells;
        }

        for (i = 0; i < prs_len; i++) {
                u32 size = prs[i].size;
                u32 size_cells;

                if (size == MLXSW_SP_SB_INFI) {
                        err = mlxsw_sp_sb_pr_write(mlxsw_sp, i, prs[i].mode,
                                                   0, true);
                } else if (size == MLXSW_SP_SB_REST) {
                        size_cells = rest_cells[pool_dess[i].dir];
                        err = mlxsw_sp_sb_pr_write(mlxsw_sp, i, prs[i].mode,
                                                   size_cells, false);
                } else {
                        size_cells = mlxsw_sp_bytes_cells(mlxsw_sp, size);
                        err = mlxsw_sp_sb_pr_write(mlxsw_sp, i, prs[i].mode,
                                                   size_cells, false);
                }
                if (err)
                        return err;
        }

        err = mlxsw_sp_sb_pr_desc_write(mlxsw_sp, MLXSW_REG_SBXX_DIR_INGRESS,
                                        MLXSW_REG_SBPR_MODE_DYNAMIC, 0, true);
        if (err)
                return err;

        err = mlxsw_sp_sb_pr_desc_write(mlxsw_sp, MLXSW_REG_SBXX_DIR_EGRESS,
                                        MLXSW_REG_SBPR_MODE_DYNAMIC, 0, true);
        if (err)
                return err;

        return 0;
}

#define MLXSW_SP_SB_CM(_min_buff, _max_buff, _pool)     \
        {                                               \
                .min_buff = _min_buff,                  \
                .max_buff = _max_buff,                  \
                .pool_index = _pool,                    \
        }

#define MLXSW_SP_SB_CM_ING(_min_buff, _max_buff)        \
        {                                               \
                .min_buff = _min_buff,                  \
                .max_buff = _max_buff,                  \
                .pool_index = MLXSW_SP_SB_POOL_ING,     \
        }

#define MLXSW_SP_SB_CM_EGR(_min_buff, _max_buff)        \
        {                                               \
                .min_buff = _min_buff,                  \
                .max_buff = _max_buff,                  \
                .pool_index = MLXSW_SP_SB_POOL_EGR,     \
        }

#define MLXSW_SP_SB_CM_EGR_MC(_min_buff, _max_buff)     \
        {                                               \
                .min_buff = _min_buff,                  \
                .max_buff = _max_buff,                  \
                .pool_index = MLXSW_SP_SB_POOL_EGR_MC,  \
                .freeze_pool = true,                    \
                .freeze_thresh = true,                  \
        }

static const struct mlxsw_sp_sb_cm mlxsw_sp1_sb_cms_ingress[] = {
        MLXSW_SP_SB_CM_ING(10000, 8),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, 0), /* dummy, this PG does not exist */
        MLXSW_SP_SB_CM(10000, 8, MLXSW_SP_SB_POOL_ING_CPU),
};

static const struct mlxsw_sp_sb_cm mlxsw_sp2_sb_cms_ingress[] = {
        MLXSW_SP_SB_CM_ING(0, 7),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_CM_ING(0, 0), /* dummy, this PG does not exist */
        MLXSW_SP_SB_CM(10000, 8, MLXSW_SP_SB_POOL_ING_CPU),
};

static const struct mlxsw_sp_sb_cm mlxsw_sp1_sb_cms_egress[] = {
        MLXSW_SP_SB_CM_EGR(1500, 9),
        MLXSW_SP_SB_CM_EGR(1500, 9),
        MLXSW_SP_SB_CM_EGR(1500, 9),
        MLXSW_SP_SB_CM_EGR(1500, 9),
        MLXSW_SP_SB_CM_EGR(1500, 9),
        MLXSW_SP_SB_CM_EGR(1500, 9),
        MLXSW_SP_SB_CM_EGR(1500, 9),
        MLXSW_SP_SB_CM_EGR(1500, 9),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR(1, 0xff),
};

static const struct mlxsw_sp_sb_cm mlxsw_sp2_sb_cms_egress[] = {
        MLXSW_SP_SB_CM_EGR(0, 7),
        MLXSW_SP_SB_CM_EGR(0, 7),
        MLXSW_SP_SB_CM_EGR(0, 7),
        MLXSW_SP_SB_CM_EGR(0, 7),
        MLXSW_SP_SB_CM_EGR(0, 7),
        MLXSW_SP_SB_CM_EGR(0, 7),
        MLXSW_SP_SB_CM_EGR(0, 7),
        MLXSW_SP_SB_CM_EGR(0, 7),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR_MC(0, MLXSW_SP_SB_INFI),
        MLXSW_SP_SB_CM_EGR(1, 0xff),
};

#define MLXSW_SP_CPU_PORT_SB_CM MLXSW_SP_SB_CM(0, 0, MLXSW_SP_SB_POOL_EGR_CPU)

static const struct mlxsw_sp_sb_cm mlxsw_sp_cpu_port_sb_cms[] = {
        MLXSW_SP_SB_CM(1000, 8, MLXSW_SP_SB_POOL_EGR_CPU),
        MLXSW_SP_SB_CM(1000, 8, MLXSW_SP_SB_POOL_EGR_CPU),
        MLXSW_SP_SB_CM(1000, 8, MLXSW_SP_SB_POOL_EGR_CPU),
        MLXSW_SP_SB_CM(1000, 8, MLXSW_SP_SB_POOL_EGR_CPU),
        MLXSW_SP_SB_CM(1000, 8, MLXSW_SP_SB_POOL_EGR_CPU),
        MLXSW_SP_SB_CM(1000, 8, MLXSW_SP_SB_POOL_EGR_CPU),
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_SB_CM(1000, 8, MLXSW_SP_SB_POOL_EGR_CPU),
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
        MLXSW_SP_CPU_PORT_SB_CM,
};

static bool
mlxsw_sp_sb_pool_is_static(struct mlxsw_sp *mlxsw_sp, u16 pool_index)
{
        struct mlxsw_sp_sb_pr *pr = mlxsw_sp_sb_pr_get(mlxsw_sp, pool_index);

        return pr->mode == MLXSW_REG_SBPR_MODE_STATIC;
}

static int __mlxsw_sp_sb_cms_init(struct mlxsw_sp *mlxsw_sp, u16 local_port,
                                  enum mlxsw_reg_sbxx_dir dir,
                                  const struct mlxsw_sp_sb_cm *cms,
                                  size_t cms_len)
{
        const struct mlxsw_sp_sb_vals *sb_vals = mlxsw_sp->sb_vals;
        int i;
        int err;

        for (i = 0; i < cms_len; i++) {
                const struct mlxsw_sp_sb_cm *cm;
                u32 min_buff;
                u32 max_buff;

                if (i == 8 && dir == MLXSW_REG_SBXX_DIR_INGRESS)
                        continue; /* PG number 8 does not exist, skip it */
                cm = &cms[i];
                if (WARN_ON(sb_vals->pool_dess[cm->pool_index].dir != dir))
                        continue;

                min_buff = mlxsw_sp_bytes_cells(mlxsw_sp, cm->min_buff);
                max_buff = cm->max_buff;
                if (max_buff == MLXSW_SP_SB_INFI) {
                        err = mlxsw_sp_sb_cm_write(mlxsw_sp, local_port, i,
                                                   min_buff, 0,
                                                   true, cm->pool_index);
                } else {
                        if (mlxsw_sp_sb_pool_is_static(mlxsw_sp,
                                                       cm->pool_index))
                                max_buff = mlxsw_sp_bytes_cells(mlxsw_sp,
                                                                max_buff);
                        err = mlxsw_sp_sb_cm_write(mlxsw_sp, local_port, i,
                                                   min_buff, max_buff,
                                                   false, cm->pool_index);
                }
                if (err)
                        return err;
        }
        return 0;
}

static int mlxsw_sp_port_sb_cms_init(struct mlxsw_sp_port *mlxsw_sp_port)
{
        struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
        int err;

        err = __mlxsw_sp_sb_cms_init(mlxsw_sp,
                                     mlxsw_sp_port->local_port,
                                     MLXSW_REG_SBXX_DIR_INGRESS,
                                     mlxsw_sp->sb_vals->cms_ingress,
                                     mlxsw_sp->sb_vals->cms_ingress_count);
        if (err)
                return err;
        return __mlxsw_sp_sb_cms_init(mlxsw_sp_port->mlxsw_sp,
                                      mlxsw_sp_port->local_port,
                                      MLXSW_REG_SBXX_DIR_EGRESS,
                                      mlxsw_sp->sb_vals->cms_egress,
                                      mlxsw_sp->sb_vals->cms_egress_count);
}

static int mlxsw_sp_cpu_port_sb_cms_init(struct mlxsw_sp *mlxsw_sp)
{
        return __mlxsw_sp_sb_cms_init(mlxsw_sp, 0, MLXSW_REG_SBXX_DIR_EGRESS,
                                      mlxsw_sp->sb_vals->cms_cpu,
                                      mlxsw_sp->sb_vals->cms_cpu_count);
}

#define MLXSW_SP_SB_PM(_min_buff, _max_buff)    \
        {                                       \
                .min_buff = _min_buff,          \
                .max_buff = _max_buff,          \
        }

/* Order according to mlxsw_sp1_sb_pool_dess */
static const struct mlxsw_sp_sb_pm mlxsw_sp1_sb_pms[] = {
        MLXSW_SP_SB_PM(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MAX),
        MLXSW_SP_SB_PM(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_PM(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_PM(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_PM(0, 7),
        MLXSW_SP_SB_PM(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_PM(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_PM(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
        MLXSW_SP_SB_PM(10000, 90000),
        MLXSW_SP_SB_PM(0, 8),   /* 50% occupancy */
        MLXSW_SP_SB_PM(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
};

/* Order according to mlxsw_sp2_sb_pool_dess */
static const struct mlxsw_sp_sb_pm mlxsw_sp2_sb_pms[] = {
        MLXSW_SP_SB_PM(0, 7),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 7),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(10000, 90000),
        MLXSW_SP_SB_PM(0, 8),   /* 50% occupancy */
        MLXSW_SP_SB_PM(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN),
};

/* Order according to mlxsw_sp*_sb_pool_dess */
static const struct mlxsw_sp_sb_pm mlxsw_sp_cpu_port_sb_pms[] = {
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, 90000),
        MLXSW_SP_SB_PM(0, 0),
        MLXSW_SP_SB_PM(0, MLXSW_REG_SBXX_DYN_MAX_BUFF_MAX),
};

static int mlxsw_sp_sb_pms_init(struct mlxsw_sp *mlxsw_sp, u16 local_port,
                                const struct mlxsw_sp_sb_pm *pms,
                                bool skip_ingress)
{
        int i, err;

        for (i = 0; i < mlxsw_sp->sb_vals->pool_count; i++) {
                const struct mlxsw_sp_sb_pm *pm = &pms[i];
                const struct mlxsw_sp_sb_pool_des *des;
                u32 max_buff;
                u32 min_buff;

                des = &mlxsw_sp->sb_vals->pool_dess[i];
                if (skip_ingress && des->dir == MLXSW_REG_SBXX_DIR_INGRESS)
                        continue;

                min_buff = mlxsw_sp_bytes_cells(mlxsw_sp, pm->min_buff);
                max_buff = pm->max_buff;
                if (mlxsw_sp_sb_pool_is_static(mlxsw_sp, i))
                        max_buff = mlxsw_sp_bytes_cells(mlxsw_sp, max_buff);
                err = mlxsw_sp_sb_pm_write(mlxsw_sp, local_port, i, min_buff,
                                           max_buff);
                if (err)
                        return err;
        }
        return 0;
}

static int mlxsw_sp_port_sb_pms_init(struct mlxsw_sp_port *mlxsw_sp_port)
{
        struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;

        return mlxsw_sp_sb_pms_init(mlxsw_sp, mlxsw_sp_port->local_port,
                                    mlxsw_sp->sb_vals->pms, false);
}

static int mlxsw_sp_cpu_port_sb_pms_init(struct mlxsw_sp *mlxsw_sp)
{
        return mlxsw_sp_sb_pms_init(mlxsw_sp, 0, mlxsw_sp->sb_vals->pms_cpu,
                                    true);
}

#define MLXSW_SP_SB_MM(_min_buff, _max_buff)            \
        {                                               \
                .min_buff = _min_buff,                  \
                .max_buff = _max_buff,                  \
                .pool_index = MLXSW_SP_SB_POOL_EGR,     \
        }

static const struct mlxsw_sp_sb_mm mlxsw_sp_sb_mms[] = {
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
        MLXSW_SP_SB_MM(0, 6),
};

static int mlxsw_sp_sb_mms_init(struct mlxsw_sp *mlxsw_sp)
{
        char sbmm_pl[MLXSW_REG_SBMM_LEN];
        int i;
        int err;

        for (i = 0; i < mlxsw_sp->sb_vals->mms_count; i++) {
                const struct mlxsw_sp_sb_pool_des *des;
                const struct mlxsw_sp_sb_mm *mc;
                u32 min_buff;

                mc = &mlxsw_sp->sb_vals->mms[i];
                des = &mlxsw_sp->sb_vals->pool_dess[mc->pool_index];
                /* All pools used by sb_mm's are initialized using dynamic
                 * thresholds, therefore 'max_buff' isn't specified in cells.
                 */
                min_buff = mlxsw_sp_bytes_cells(mlxsw_sp, mc->min_buff);
                mlxsw_reg_sbmm_pack(sbmm_pl, i, min_buff, mc->max_buff,
                                    des->pool);
                err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(sbmm), sbmm_pl);
                if (err)
                        return err;
        }
        return 0;
}

static void mlxsw_sp_pool_count(struct mlxsw_sp *mlxsw_sp,
                                u16 *p_ingress_len, u16 *p_egress_len)
{
        int i;

        for (i = 0; i < mlxsw_sp->sb_vals->pool_count; ++i) {
                if (mlxsw_sp->sb_vals->pool_dess[i].dir ==
                    MLXSW_REG_SBXX_DIR_INGRESS)
                        (*p_ingress_len)++;
                else
                        (*p_egress_len)++;
        }

        WARN(*p_egress_len == 0, "No egress pools\n");
}

const struct mlxsw_sp_sb_vals mlxsw_sp1_sb_vals = {
        .pool_count = ARRAY_SIZE(mlxsw_sp1_sb_pool_dess),
        .pool_dess = mlxsw_sp1_sb_pool_dess,
        .pms = mlxsw_sp1_sb_pms,
        .pms_cpu = mlxsw_sp_cpu_port_sb_pms,
        .prs = mlxsw_sp1_sb_prs,
        .mms = mlxsw_sp_sb_mms,
        .cms_ingress = mlxsw_sp1_sb_cms_ingress,
        .cms_egress = mlxsw_sp1_sb_cms_egress,
        .cms_cpu = mlxsw_sp_cpu_port_sb_cms,
        .mms_count = ARRAY_SIZE(mlxsw_sp_sb_mms),
        .cms_ingress_count = ARRAY_SIZE(mlxsw_sp1_sb_cms_ingress),
        .cms_egress_count = ARRAY_SIZE(mlxsw_sp1_sb_cms_egress),
        .cms_cpu_count = ARRAY_SIZE(mlxsw_sp_cpu_port_sb_cms),
};

const struct mlxsw_sp_sb_vals mlxsw_sp2_sb_vals = {
        .pool_count = ARRAY_SIZE(mlxsw_sp2_sb_pool_dess),
        .pool_dess = mlxsw_sp2_sb_pool_dess,
        .pms = mlxsw_sp2_sb_pms,
        .pms_cpu = mlxsw_sp_cpu_port_sb_pms,
        .prs = mlxsw_sp2_sb_prs,
        .mms = mlxsw_sp_sb_mms,
        .cms_ingress = mlxsw_sp2_sb_cms_ingress,
        .cms_egress = mlxsw_sp2_sb_cms_egress,
        .cms_cpu = mlxsw_sp_cpu_port_sb_cms,
        .mms_count = ARRAY_SIZE(mlxsw_sp_sb_mms),
        .cms_ingress_count = ARRAY_SIZE(mlxsw_sp2_sb_cms_ingress),
        .cms_egress_count = ARRAY_SIZE(mlxsw_sp2_sb_cms_egress),
        .cms_cpu_count = ARRAY_SIZE(mlxsw_sp_cpu_port_sb_cms),
};

static u32 mlxsw_sp1_pb_int_buf_size_get(int mtu, u32 speed)
{
        return mtu * 5 / 2;
}

static u32 __mlxsw_sp_pb_int_buf_size_get(int mtu, u32 speed, u32 buffer_factor)
{
        return 3 * mtu + buffer_factor * speed / 1000;
}

#define MLXSW_SP2_SPAN_EG_MIRROR_BUFFER_FACTOR 38

static u32 mlxsw_sp2_pb_int_buf_size_get(int mtu, u32 speed)
{
        int factor = MLXSW_SP2_SPAN_EG_MIRROR_BUFFER_FACTOR;

        return __mlxsw_sp_pb_int_buf_size_get(mtu, speed, factor);
}

#define MLXSW_SP3_SPAN_EG_MIRROR_BUFFER_FACTOR 50

static u32 mlxsw_sp3_pb_int_buf_size_get(int mtu, u32 speed)
{
        int factor = MLXSW_SP3_SPAN_EG_MIRROR_BUFFER_FACTOR;

        return __mlxsw_sp_pb_int_buf_size_get(mtu, speed, factor);
}

const struct mlxsw_sp_sb_ops mlxsw_sp1_sb_ops = {
        .int_buf_size_get = mlxsw_sp1_pb_int_buf_size_get,
};

const struct mlxsw_sp_sb_ops mlxsw_sp2_sb_ops = {
        .int_buf_size_get = mlxsw_sp2_pb_int_buf_size_get,
};

const struct mlxsw_sp_sb_ops mlxsw_sp3_sb_ops = {
        .int_buf_size_get = mlxsw_sp3_pb_int_buf_size_get,
};

int mlxsw_sp_buffers_init(struct mlxsw_sp *mlxsw_sp)
{
        u32 max_headroom_size;
        u16 ing_pool_count = 0;
        u16 eg_pool_count = 0;
        int err;

        if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, CELL_SIZE))
                return -EIO;

        if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, GUARANTEED_SHARED_BUFFER))
                return -EIO;

        if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_HEADROOM_SIZE))
                return -EIO;

        mlxsw_sp->sb = kzalloc_obj(*mlxsw_sp->sb);
        if (!mlxsw_sp->sb)
                return -ENOMEM;
        mlxsw_sp->sb->cell_size = MLXSW_CORE_RES_GET(mlxsw_sp->core, CELL_SIZE);
        mlxsw_sp->sb->sb_size = MLXSW_CORE_RES_GET(mlxsw_sp->core,
                                                   GUARANTEED_SHARED_BUFFER);
        max_headroom_size = MLXSW_CORE_RES_GET(mlxsw_sp->core,
                                               MAX_HEADROOM_SIZE);
        /* Round down, because this limit must not be overstepped. */
        mlxsw_sp->sb->max_headroom_cells = max_headroom_size /
                                                mlxsw_sp->sb->cell_size;

        err = mlxsw_sp_sb_ports_init(mlxsw_sp);
        if (err)
                goto err_sb_ports_init;
        err = mlxsw_sp_sb_prs_init(mlxsw_sp, mlxsw_sp->sb_vals->prs,
                                   mlxsw_sp->sb_vals->pool_dess,
                                   mlxsw_sp->sb_vals->pool_count);
        if (err)
                goto err_sb_prs_init;
        err = mlxsw_sp_cpu_port_sb_cms_init(mlxsw_sp);
        if (err)
                goto err_sb_cpu_port_sb_cms_init;
        err = mlxsw_sp_cpu_port_sb_pms_init(mlxsw_sp);
        if (err)
                goto err_sb_cpu_port_pms_init;
        err = mlxsw_sp_sb_mms_init(mlxsw_sp);
        if (err)
                goto err_sb_mms_init;
        mlxsw_sp_pool_count(mlxsw_sp, &ing_pool_count, &eg_pool_count);
        err = devl_sb_register(priv_to_devlink(mlxsw_sp->core), 0,
                               mlxsw_sp->sb->sb_size,
                               ing_pool_count,
                               eg_pool_count,
                               MLXSW_SP_SB_ING_TC_COUNT,
                               MLXSW_SP_SB_EG_TC_COUNT);
        if (err)
                goto err_devlink_sb_register;

        return 0;

err_devlink_sb_register:
err_sb_mms_init:
err_sb_cpu_port_pms_init:
err_sb_cpu_port_sb_cms_init:
err_sb_prs_init:
        mlxsw_sp_sb_ports_fini(mlxsw_sp);
err_sb_ports_init:
        kfree(mlxsw_sp->sb);
        return err;
}

void mlxsw_sp_buffers_fini(struct mlxsw_sp *mlxsw_sp)
{
        devl_sb_unregister(priv_to_devlink(mlxsw_sp->core), 0);
        mlxsw_sp_sb_ports_fini(mlxsw_sp);
        kfree(mlxsw_sp->sb);
}

int mlxsw_sp_port_buffers_init(struct mlxsw_sp_port *mlxsw_sp_port)
{
        int err;

        mlxsw_sp_port->hdroom = kzalloc_obj(*mlxsw_sp_port->hdroom);
        if (!mlxsw_sp_port->hdroom)
                return -ENOMEM;
        mlxsw_sp_port->hdroom->mtu = mlxsw_sp_port->dev->mtu;

        err = mlxsw_sp_port_headroom_init(mlxsw_sp_port);
        if (err)
                goto err_headroom_init;
        err = mlxsw_sp_port_sb_cms_init(mlxsw_sp_port);
        if (err)
                goto err_port_sb_cms_init;
        err = mlxsw_sp_port_sb_pms_init(mlxsw_sp_port);
        if (err)
                goto err_port_sb_pms_init;
        return 0;

err_port_sb_pms_init:
err_port_sb_cms_init:
err_headroom_init:
        kfree(mlxsw_sp_port->hdroom);
        return err;
}

void mlxsw_sp_port_buffers_fini(struct mlxsw_sp_port *mlxsw_sp_port)
{
        kfree(mlxsw_sp_port->hdroom);
}

int mlxsw_sp_sb_pool_get(struct mlxsw_core *mlxsw_core,
                         unsigned int sb_index, u16 pool_index,
                         struct devlink_sb_pool_info *pool_info)
{
        struct mlxsw_sp *mlxsw_sp = mlxsw_core_driver_priv(mlxsw_core);
        enum mlxsw_reg_sbxx_dir dir;
        struct mlxsw_sp_sb_pr *pr;

        dir = mlxsw_sp->sb_vals->pool_dess[pool_index].dir;
        pr = mlxsw_sp_sb_pr_get(mlxsw_sp, pool_index);
        pool_info->pool_type = (enum devlink_sb_pool_type) dir;
        pool_info->size = mlxsw_sp_cells_bytes(mlxsw_sp, pr->size);
        pool_info->threshold_type = (enum devlink_sb_threshold_type) pr->mode;
        pool_info->cell_size = mlxsw_sp->sb->cell_size;
        return 0;
}

int mlxsw_sp_sb_pool_set(struct mlxsw_core *mlxsw_core,
                         unsigned int sb_index, u16 pool_index, u32 size,
                         enum devlink_sb_threshold_type threshold_type,
                         struct netlink_ext_ack *extack)
{
        struct mlxsw_sp *mlxsw_sp = mlxsw_core_driver_priv(mlxsw_core);
        u32 pool_size = mlxsw_sp_bytes_cells(mlxsw_sp, size);
        const struct mlxsw_sp_sb_pr *pr;
        enum mlxsw_reg_sbpr_mode mode;

        mode = (enum mlxsw_reg_sbpr_mode) threshold_type;
        pr = &mlxsw_sp->sb_vals->prs[pool_index];

        if (size > MLXSW_CORE_RES_GET(mlxsw_sp->core,
                                      GUARANTEED_SHARED_BUFFER)) {
                NL_SET_ERR_MSG_MOD(extack, "Exceeded shared buffer size");
                return -EINVAL;
        }

        if (pr->freeze_mode && pr->mode != mode) {
                NL_SET_ERR_MSG_MOD(extack, "Changing this pool's threshold type is forbidden");
                return -EINVAL;
        }

        if (pr->freeze_size && pr->size != size) {
                NL_SET_ERR_MSG_MOD(extack, "Changing this pool's size is forbidden");
                return -EINVAL;
        }

        return mlxsw_sp_sb_pr_write(mlxsw_sp, pool_index, mode,
                                    pool_size, false);
}

#define MLXSW_SP_SB_THRESHOLD_TO_ALPHA_OFFSET (-2) /* 3->1, 16->14 */

static u32 mlxsw_sp_sb_threshold_out(struct mlxsw_sp *mlxsw_sp, u16 pool_index,
                                     u32 max_buff)
{
        struct mlxsw_sp_sb_pr *pr = mlxsw_sp_sb_pr_get(mlxsw_sp, pool_index);

        if (pr->mode == MLXSW_REG_SBPR_MODE_DYNAMIC)
                return max_buff - MLXSW_SP_SB_THRESHOLD_TO_ALPHA_OFFSET;
        return mlxsw_sp_cells_bytes(mlxsw_sp, max_buff);
}

static int mlxsw_sp_sb_threshold_in(struct mlxsw_sp *mlxsw_sp, u16 pool_index,
                                    u32 threshold, u32 *p_max_buff,
                                    struct netlink_ext_ack *extack)
{
        struct mlxsw_sp_sb_pr *pr = mlxsw_sp_sb_pr_get(mlxsw_sp, pool_index);

        if (pr->mode == MLXSW_REG_SBPR_MODE_DYNAMIC) {
                int val;

                val = threshold + MLXSW_SP_SB_THRESHOLD_TO_ALPHA_OFFSET;
                if (val < MLXSW_REG_SBXX_DYN_MAX_BUFF_MIN ||
                    val > MLXSW_REG_SBXX_DYN_MAX_BUFF_MAX) {
                        NL_SET_ERR_MSG_MOD(extack, "Invalid dynamic threshold value");
                        return -EINVAL;
                }
                *p_max_buff = val;
        } else {
                *p_max_buff = mlxsw_sp_bytes_cells(mlxsw_sp, threshold);
        }
        return 0;
}

int mlxsw_sp_sb_port_pool_get(struct mlxsw_core_port *mlxsw_core_port,
                              unsigned int sb_index, u16 pool_index,
                              u32 *p_threshold)
{
        struct mlxsw_sp_port *mlxsw_sp_port =
                        mlxsw_core_port_driver_priv(mlxsw_core_port);
        struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
        u16 local_port = mlxsw_sp_port->local_port;
        struct mlxsw_sp_sb_pm *pm = mlxsw_sp_sb_pm_get(mlxsw_sp, local_port,
                                                       pool_index);

        *p_threshold = mlxsw_sp_sb_threshold_out(mlxsw_sp, pool_index,
                                                 pm->max_buff);
        return 0;
}

int mlxsw_sp_sb_port_pool_set(struct mlxsw_core_port *mlxsw_core_port,
                              unsigned int sb_index, u16 pool_index,
                              u32 threshold, struct netlink_ext_ack *extack)
{
        struct mlxsw_sp_port *mlxsw_sp_port =
                        mlxsw_core_port_driver_priv(mlxsw_core_port);
        struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
        u16 local_port = mlxsw_sp_port->local_port;
        u32 max_buff;
        int err;

        if (local_port == MLXSW_PORT_CPU_PORT) {
                NL_SET_ERR_MSG_MOD(extack, "Changing CPU port's threshold is forbidden");
                return -EINVAL;
        }

        err = mlxsw_sp_sb_threshold_in(mlxsw_sp, pool_index,
                                       threshold, &max_buff, extack);
        if (err)
                return err;

        return mlxsw_sp_sb_pm_write(mlxsw_sp, local_port, pool_index,
                                    0, max_buff);
}

int mlxsw_sp_sb_tc_pool_bind_get(struct mlxsw_core_port *mlxsw_core_port,
                                 unsigned int sb_index, u16 tc_index,
                                 enum devlink_sb_pool_type pool_type,
                                 u16 *p_pool_index, u32 *p_threshold)
{
        struct mlxsw_sp_port *mlxsw_sp_port =
                        mlxsw_core_port_driver_priv(mlxsw_core_port);
        struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
        u16 local_port = mlxsw_sp_port->local_port;
        u8 pg_buff = tc_index;
        enum mlxsw_reg_sbxx_dir dir = (enum mlxsw_reg_sbxx_dir) pool_type;
        struct mlxsw_sp_sb_cm *cm = mlxsw_sp_sb_cm_get(mlxsw_sp, local_port,
                                                       pg_buff, dir);

        *p_threshold = mlxsw_sp_sb_threshold_out(mlxsw_sp, cm->pool_index,
                                                 cm->max_buff);
        *p_pool_index = cm->pool_index;
        return 0;
}

int mlxsw_sp_sb_tc_pool_bind_set(struct mlxsw_core_port *mlxsw_core_port,
                                 unsigned int sb_index, u16 tc_index,
                                 enum devlink_sb_pool_type pool_type,
                                 u16 pool_index, u32 threshold,
                                 struct netlink_ext_ack *extack)
{
        struct mlxsw_sp_port *mlxsw_sp_port =
                        mlxsw_core_port_driver_priv(mlxsw_core_port);
        struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
        u16 local_port = mlxsw_sp_port->local_port;
        const struct mlxsw_sp_sb_cm *cm;
        u8 pg_buff = tc_index;
        enum mlxsw_reg_sbxx_dir dir = (enum mlxsw_reg_sbxx_dir) pool_type;
        u32 max_buff;
        int err;

        if (local_port == MLXSW_PORT_CPU_PORT) {
                NL_SET_ERR_MSG_MOD(extack, "Changing CPU port's binding is forbidden");
                return -EINVAL;
        }

        if (dir != mlxsw_sp->sb_vals->pool_dess[pool_index].dir) {
                NL_SET_ERR_MSG_MOD(extack, "Binding egress TC to ingress pool and vice versa is forbidden");
                return -EINVAL;
        }

        if (dir == MLXSW_REG_SBXX_DIR_INGRESS)
                cm = &mlxsw_sp->sb_vals->cms_ingress[tc_index];
        else
                cm = &mlxsw_sp->sb_vals->cms_egress[tc_index];

        if (cm->freeze_pool && cm->pool_index != pool_index) {
                NL_SET_ERR_MSG_MOD(extack, "Binding this TC to a different pool is forbidden");
                return -EINVAL;
        }

        if (cm->freeze_thresh && cm->max_buff != threshold) {
                NL_SET_ERR_MSG_MOD(extack, "Changing this TC's threshold is forbidden");
                return -EINVAL;
        }

        err = mlxsw_sp_sb_threshold_in(mlxsw_sp, pool_index,
                                       threshold, &max_buff, extack);
        if (err)
                return err;

        return mlxsw_sp_sb_cm_write(mlxsw_sp, local_port, pg_buff,
                                    0, max_buff, false, pool_index);
}

#define MASKED_COUNT_MAX \
        (MLXSW_REG_SBSR_REC_MAX_COUNT / \
         (MLXSW_SP_SB_ING_TC_COUNT + MLXSW_SP_SB_EG_TC_COUNT))

struct mlxsw_sp_sb_sr_occ_query_cb_ctx {
        u8 masked_count;
        u16 local_port_1;
};

static void mlxsw_sp_sb_sr_occ_query_cb(struct mlxsw_core *mlxsw_core,
                                        char *sbsr_pl, size_t sbsr_pl_len,
                                        unsigned long cb_priv)
{
        struct mlxsw_sp *mlxsw_sp = mlxsw_core_driver_priv(mlxsw_core);
        struct mlxsw_sp_sb_sr_occ_query_cb_ctx cb_ctx;
        u8 masked_count;
        u16 local_port;
        int rec_index = 0;
        struct mlxsw_sp_sb_cm *cm;
        int i;

        memcpy(&cb_ctx, &cb_priv, sizeof(cb_ctx));

        masked_count = 0;
        for (local_port = cb_ctx.local_port_1;
             local_port < mlxsw_core_max_ports(mlxsw_core); local_port++) {
                if (!mlxsw_sp->ports[local_port])
                        continue;
                if (local_port == MLXSW_PORT_CPU_PORT) {
                        /* Ingress quotas are not supported for the CPU port */
                        masked_count++;
                        continue;
                }
                for (i = 0; i < MLXSW_SP_SB_ING_TC_COUNT; i++) {
                        cm = mlxsw_sp_sb_cm_get(mlxsw_sp, local_port, i,
                                                MLXSW_REG_SBXX_DIR_INGRESS);
                        mlxsw_reg_sbsr_rec_unpack(sbsr_pl, rec_index++,
                                                  &cm->occ.cur, &cm->occ.max);
                }
                if (++masked_count == cb_ctx.masked_count)
                        break;
        }
        masked_count = 0;
        for (local_port = cb_ctx.local_port_1;
             local_port < mlxsw_core_max_ports(mlxsw_core); local_port++) {
                if (!mlxsw_sp->ports[local_port])
                        continue;
                for (i = 0; i < MLXSW_SP_SB_EG_TC_COUNT; i++) {
                        cm = mlxsw_sp_sb_cm_get(mlxsw_sp, local_port, i,
                                                MLXSW_REG_SBXX_DIR_EGRESS);
                        mlxsw_reg_sbsr_rec_unpack(sbsr_pl, rec_index++,
                                                  &cm->occ.cur, &cm->occ.max);
                }
                if (++masked_count == cb_ctx.masked_count)
                        break;
        }
}

int mlxsw_sp_sb_occ_snapshot(struct mlxsw_core *mlxsw_core,
                             unsigned int sb_index)
{
        u16 local_port, local_port_1, first_local_port, last_local_port;
        struct mlxsw_sp *mlxsw_sp = mlxsw_core_driver_priv(mlxsw_core);
        struct mlxsw_sp_sb_sr_occ_query_cb_ctx cb_ctx;
        u8 masked_count, current_page = 0;
        unsigned long cb_priv = 0;
        LIST_HEAD(bulk_list);
        char *sbsr_pl;
        int i;
        int err;
        int err2;

        sbsr_pl = kmalloc(MLXSW_REG_SBSR_LEN, GFP_KERNEL);
        if (!sbsr_pl)
                return -ENOMEM;

        local_port = MLXSW_PORT_CPU_PORT;
next_batch:
        local_port_1 = local_port;
        masked_count = 0;
        mlxsw_reg_sbsr_pack(sbsr_pl, false);
        mlxsw_reg_sbsr_port_page_set(sbsr_pl, current_page);
        first_local_port = current_page * MLXSW_REG_SBSR_NUM_PORTS_IN_PAGE;
        last_local_port = current_page * MLXSW_REG_SBSR_NUM_PORTS_IN_PAGE +
                          MLXSW_REG_SBSR_NUM_PORTS_IN_PAGE - 1;

        for (i = 0; i < MLXSW_SP_SB_ING_TC_COUNT; i++)
                mlxsw_reg_sbsr_pg_buff_mask_set(sbsr_pl, i, 1);
        for (i = 0; i < MLXSW_SP_SB_EG_TC_COUNT; i++)
                mlxsw_reg_sbsr_tclass_mask_set(sbsr_pl, i, 1);
        for (; local_port < mlxsw_core_max_ports(mlxsw_core); local_port++) {
                if (!mlxsw_sp->ports[local_port])
                        continue;
                if (local_port > last_local_port) {
                        current_page++;
                        goto do_query;
                }
                if (local_port != MLXSW_PORT_CPU_PORT) {
                        /* Ingress quotas are not supported for the CPU port */
                        mlxsw_reg_sbsr_ingress_port_mask_set(sbsr_pl,
                                                             local_port - first_local_port,
                                                             1);
                }
                mlxsw_reg_sbsr_egress_port_mask_set(sbsr_pl,
                                                    local_port - first_local_port,
                                                    1);
                for (i = 0; i < mlxsw_sp->sb_vals->pool_count; i++) {
                        err = mlxsw_sp_sb_pm_occ_query(mlxsw_sp, local_port, i,
                                                       &bulk_list);
                        if (err)
                                goto out;
                }
                if (++masked_count == MASKED_COUNT_MAX)
                        goto do_query;
        }

do_query:
        cb_ctx.masked_count = masked_count;
        cb_ctx.local_port_1 = local_port_1;
        memcpy(&cb_priv, &cb_ctx, sizeof(cb_ctx));
        err = mlxsw_reg_trans_query(mlxsw_core, MLXSW_REG(sbsr), sbsr_pl,
                                    &bulk_list, mlxsw_sp_sb_sr_occ_query_cb,
                                    cb_priv);
        if (err)
                goto out;
        if (local_port < mlxsw_core_max_ports(mlxsw_core)) {
                local_port++;
                goto next_batch;
        }

out:
        err2 = mlxsw_reg_trans_bulk_wait(&bulk_list);
        if (!err)
                err = err2;
        kfree(sbsr_pl);
        return err;
}

int mlxsw_sp_sb_occ_max_clear(struct mlxsw_core *mlxsw_core,
                              unsigned int sb_index)
{
        struct mlxsw_sp *mlxsw_sp = mlxsw_core_driver_priv(mlxsw_core);
        u16 local_port, first_local_port, last_local_port;
        LIST_HEAD(bulk_list);
        unsigned int masked_count;
        u8 current_page = 0;
        char *sbsr_pl;
        int i;
        int err;
        int err2;

        sbsr_pl = kmalloc(MLXSW_REG_SBSR_LEN, GFP_KERNEL);
        if (!sbsr_pl)
                return -ENOMEM;

        local_port = MLXSW_PORT_CPU_PORT;
next_batch:
        masked_count = 0;
        mlxsw_reg_sbsr_pack(sbsr_pl, true);
        mlxsw_reg_sbsr_port_page_set(sbsr_pl, current_page);
        first_local_port = current_page * MLXSW_REG_SBSR_NUM_PORTS_IN_PAGE;
        last_local_port = current_page * MLXSW_REG_SBSR_NUM_PORTS_IN_PAGE +
                          MLXSW_REG_SBSR_NUM_PORTS_IN_PAGE - 1;

        for (i = 0; i < MLXSW_SP_SB_ING_TC_COUNT; i++)
                mlxsw_reg_sbsr_pg_buff_mask_set(sbsr_pl, i, 1);
        for (i = 0; i < MLXSW_SP_SB_EG_TC_COUNT; i++)
                mlxsw_reg_sbsr_tclass_mask_set(sbsr_pl, i, 1);
        for (; local_port < mlxsw_core_max_ports(mlxsw_core); local_port++) {
                if (!mlxsw_sp->ports[local_port])
                        continue;
                if (local_port > last_local_port) {
                        current_page++;
                        goto do_query;
                }
                if (local_port != MLXSW_PORT_CPU_PORT) {
                        /* Ingress quotas are not supported for the CPU port */
                        mlxsw_reg_sbsr_ingress_port_mask_set(sbsr_pl,
                                                             local_port - first_local_port,
                                                             1);
                }
                mlxsw_reg_sbsr_egress_port_mask_set(sbsr_pl,
                                                    local_port - first_local_port,
                                                    1);
                for (i = 0; i < mlxsw_sp->sb_vals->pool_count; i++) {
                        err = mlxsw_sp_sb_pm_occ_clear(mlxsw_sp, local_port, i,
                                                       &bulk_list);
                        if (err)
                                goto out;
                }
                if (++masked_count == MASKED_COUNT_MAX)
                        goto do_query;
        }

do_query:
        err = mlxsw_reg_trans_query(mlxsw_core, MLXSW_REG(sbsr), sbsr_pl,
                                    &bulk_list, NULL, 0);
        if (err)
                goto out;
        if (local_port < mlxsw_core_max_ports(mlxsw_core)) {
                local_port++;
                goto next_batch;
        }

out:
        err2 = mlxsw_reg_trans_bulk_wait(&bulk_list);
        if (!err)
                err = err2;
        kfree(sbsr_pl);
        return err;
}

int mlxsw_sp_sb_occ_port_pool_get(struct mlxsw_core_port *mlxsw_core_port,
                                  unsigned int sb_index, u16 pool_index,
                                  u32 *p_cur, u32 *p_max)
{
        struct mlxsw_sp_port *mlxsw_sp_port =
                        mlxsw_core_port_driver_priv(mlxsw_core_port);
        struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
        u16 local_port = mlxsw_sp_port->local_port;
        struct mlxsw_sp_sb_pm *pm = mlxsw_sp_sb_pm_get(mlxsw_sp, local_port,
                                                       pool_index);

        *p_cur = mlxsw_sp_cells_bytes(mlxsw_sp, pm->occ.cur);
        *p_max = mlxsw_sp_cells_bytes(mlxsw_sp, pm->occ.max);
        return 0;
}

int mlxsw_sp_sb_occ_tc_port_bind_get(struct mlxsw_core_port *mlxsw_core_port,
                                     unsigned int sb_index, u16 tc_index,
                                     enum devlink_sb_pool_type pool_type,
                                     u32 *p_cur, u32 *p_max)
{
        struct mlxsw_sp_port *mlxsw_sp_port =
                        mlxsw_core_port_driver_priv(mlxsw_core_port);
        struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp;
        u16 local_port = mlxsw_sp_port->local_port;
        u8 pg_buff = tc_index;
        enum mlxsw_reg_sbxx_dir dir = (enum mlxsw_reg_sbxx_dir) pool_type;
        struct mlxsw_sp_sb_cm *cm = mlxsw_sp_sb_cm_get(mlxsw_sp, local_port,
                                                       pg_buff, dir);

        *p_cur = mlxsw_sp_cells_bytes(mlxsw_sp, cm->occ.cur);
        *p_max = mlxsw_sp_cells_bytes(mlxsw_sp, cm->occ.max);
        return 0;
}