root/sys/dev/mlx5/mlx5_core/mlx5_cmd.c
/*-
 * Copyright (c) 2013-2019, Mellanox Technologies, Ltd.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS `AS IS' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#include "opt_rss.h"
#include "opt_ratelimit.h"

#include <linux/module.h>
#include <linux/errno.h>
#include <linux/pci.h>
#include <linux/dma-mapping.h>
#include <linux/slab.h>
#include <linux/delay.h>
#include <linux/random.h>
#include <linux/io-mapping.h>
#include <linux/hardirq.h>
#include <linux/ktime.h>
#include <dev/mlx5/driver.h>
#include <dev/mlx5/cmd.h>
#include <dev/mlx5/mlx5_core/mlx5_core.h>

static int mlx5_copy_from_msg(void *to, struct mlx5_cmd_msg *from, int size);
static void mlx5_free_cmd_msg(struct mlx5_core_dev *dev,
                              struct mlx5_cmd_msg *msg);
static void free_msg(struct mlx5_core_dev *dev, struct mlx5_cmd_msg *msg);

enum {
        CMD_IF_REV = 5,
};

enum {
        NUM_LONG_LISTS    = 2,
        NUM_MED_LISTS     = 64,
        LONG_LIST_SIZE    = (2ULL * 1024 * 1024 * 1024 / PAGE_SIZE) * 8 + 16 +
                                MLX5_CMD_DATA_BLOCK_SIZE,
        MED_LIST_SIZE     = 16 + MLX5_CMD_DATA_BLOCK_SIZE,
};

enum {
        MLX5_CMD_DELIVERY_STAT_OK                       = 0x0,
        MLX5_CMD_DELIVERY_STAT_SIGNAT_ERR               = 0x1,
        MLX5_CMD_DELIVERY_STAT_TOK_ERR                  = 0x2,
        MLX5_CMD_DELIVERY_STAT_BAD_BLK_NUM_ERR          = 0x3,
        MLX5_CMD_DELIVERY_STAT_OUT_PTR_ALIGN_ERR        = 0x4,
        MLX5_CMD_DELIVERY_STAT_IN_PTR_ALIGN_ERR         = 0x5,
        MLX5_CMD_DELIVERY_STAT_FW_ERR                   = 0x6,
        MLX5_CMD_DELIVERY_STAT_IN_LENGTH_ERR            = 0x7,
        MLX5_CMD_DELIVERY_STAT_OUT_LENGTH_ERR           = 0x8,
        MLX5_CMD_DELIVERY_STAT_RES_FLD_NOT_CLR_ERR      = 0x9,
        MLX5_CMD_DELIVERY_STAT_CMD_DESCR_ERR            = 0x10,
};

struct mlx5_ifc_mbox_out_bits {
        u8         status[0x8];
        u8         reserved_at_8[0x18];

        u8         syndrome[0x20];

        u8         reserved_at_40[0x40];
};

struct mlx5_ifc_mbox_in_bits {
        u8         opcode[0x10];
        u8         reserved_at_10[0x10];

        u8         reserved_at_20[0x10];
        u8         op_mod[0x10];

        u8         reserved_at_40[0x40];
};


static struct mlx5_cmd_work_ent *alloc_cmd(struct mlx5_cmd *cmd,
                                           struct mlx5_cmd_msg *in,
                                           int uin_size,
                                           struct mlx5_cmd_msg *out,
                                           void *uout, int uout_size,
                                           mlx5_cmd_cbk_t cbk,
                                           void *context, int page_queue)
{
        gfp_t alloc_flags = cbk ? GFP_ATOMIC : GFP_KERNEL;
        struct mlx5_cmd_work_ent *ent;

        ent = kzalloc(sizeof(*ent), alloc_flags);
        if (!ent)
                return ERR_PTR(-ENOMEM);

        ent->in         = in;
        ent->uin_size   = uin_size;
        ent->out        = out;
        ent->uout       = uout;
        ent->uout_size  = uout_size;
        ent->callback   = cbk;
        ent->context    = context;
        ent->cmd        = cmd;
        ent->page_queue = page_queue;

        return ent;
}

static u8 alloc_token(struct mlx5_cmd *cmd)
{
        u8 token;

        spin_lock(&cmd->token_lock);
        cmd->token++;
        if (cmd->token == 0)
                cmd->token++;
        token = cmd->token;
        spin_unlock(&cmd->token_lock);

        return token;
}

static int alloc_ent(struct mlx5_cmd_work_ent *ent)
{
        unsigned long flags;
        struct mlx5_cmd *cmd = ent->cmd;
        struct mlx5_core_dev *dev =
                container_of(cmd, struct mlx5_core_dev, cmd);
        int ret = cmd->max_reg_cmds;

        spin_lock_irqsave(&cmd->alloc_lock, flags);
        if (!ent->page_queue) {
                ret = find_first_bit(&cmd->bitmask, cmd->max_reg_cmds);
                if (ret >= cmd->max_reg_cmds)
                        ret = -1;
        }

        if (dev->state != MLX5_DEVICE_STATE_UP)
                ret = -1;

        if (ret != -1) {
                ent->busy = 1;
                ent->idx = ret;
                clear_bit(ent->idx, &cmd->bitmask);
                cmd->ent_mode[ent->idx] =
                    ent->polling ? MLX5_CMD_MODE_POLLING : MLX5_CMD_MODE_EVENTS;
                cmd->ent_arr[ent->idx] = ent;
        }
        spin_unlock_irqrestore(&cmd->alloc_lock, flags);

        return ret;
}

static void free_ent(struct mlx5_cmd *cmd, int idx)
{
        unsigned long flags;

        spin_lock_irqsave(&cmd->alloc_lock, flags);
        cmd->ent_arr[idx] = NULL;       /* safety clear */
        cmd->ent_mode[idx] = MLX5_CMD_MODE_POLLING;     /* reset mode */
        set_bit(idx, &cmd->bitmask);
        spin_unlock_irqrestore(&cmd->alloc_lock, flags);
}

static struct mlx5_cmd_layout *get_inst(struct mlx5_cmd *cmd, int idx)
{
        return cmd->cmd_buf + (idx << cmd->log_stride);
}

static u8 xor8_buf(void *buf, int len)
{
        u8 *ptr = buf;
        u8 sum = 0;
        int i;

        for (i = 0; i < len; i++)
                sum ^= ptr[i];

        return sum;
}

static int verify_block_sig(struct mlx5_cmd_prot_block *block)
{
        if (xor8_buf(block->rsvd0, sizeof(*block) - sizeof(block->data) - 1) != 0xff)
                return -EINVAL;

        if (xor8_buf(block, sizeof(*block)) != 0xff)
                return -EINVAL;

        return 0;
}

static void calc_block_sig(struct mlx5_cmd_prot_block *block, u8 token,
                           int csum)
{
        block->token = token;
        if (csum) {
                block->ctrl_sig = ~xor8_buf(block->rsvd0, sizeof(*block) -
                                            sizeof(block->data) - 2);
                block->sig = ~xor8_buf(block, sizeof(*block) - 1);
        }
}

static void
calc_chain_sig(struct mlx5_cmd_msg *msg, u8 token, int csum)
{
        size_t i;

        for (i = 0; i != (msg->numpages * MLX5_NUM_CMDS_IN_ADAPTER_PAGE); i++) {
                struct mlx5_cmd_prot_block *block;

                block = mlx5_fwp_get_virt(msg, i * MLX5_CMD_MBOX_SIZE);

                /* compute signature */
                calc_block_sig(block, token, csum);

                /* check for last block */
                if (block->next == 0)
                        break;
        }

        /* make sure data gets written to RAM */
        mlx5_fwp_flush(msg);
}

static void set_signature(struct mlx5_cmd_work_ent *ent, int csum)
{
        ent->lay->sig = ~xor8_buf(ent->lay, sizeof(*ent->lay));
        calc_chain_sig(ent->in, ent->token, csum);
        calc_chain_sig(ent->out, ent->token, csum);
}

static void poll_timeout(struct mlx5_cmd_work_ent *ent)
{
        struct mlx5_core_dev *dev = container_of(ent->cmd,
                                                 struct mlx5_core_dev, cmd);
        long poll_end = jiffies +
                                msecs_to_jiffies(MLX5_CMD_TIMEOUT_MSEC + 1000);
        u8 own;

        do {
                own = ent->lay->status_own;
                if (!(own & CMD_OWNER_HW) ||
                    dev->state != MLX5_DEVICE_STATE_UP) {
                        ent->ret = 0;
                        return;
                }
                usleep_range(5000, 10000);
        } while (time_before(jiffies, poll_end));

        ent->ret = -ETIMEDOUT;
}

static void free_cmd(struct mlx5_cmd_work_ent *ent)
{
        cancel_delayed_work_sync(&ent->cb_timeout_work);
        kfree(ent);
}

static int
verify_signature(struct mlx5_cmd_work_ent *ent)
{
        struct mlx5_cmd_msg *msg = ent->out;
        size_t i;
        int err;
        u8 sig;

        sig = xor8_buf(ent->lay, sizeof(*ent->lay));
        if (sig != 0xff)
                return -EINVAL;

        for (i = 0; i != (msg->numpages * MLX5_NUM_CMDS_IN_ADAPTER_PAGE); i++) {
                struct mlx5_cmd_prot_block *block;

                block = mlx5_fwp_get_virt(msg, i * MLX5_CMD_MBOX_SIZE);

                /* compute signature */
                err = verify_block_sig(block);
                if (err != 0)
                        return (err);

                /* check for last block */
                if (block->next == 0)
                        break;
        }
        return (0);
}

static void dump_buf(void *buf, int size, int data_only, int offset)
{
        __be32 *p = buf;
        int i;

        for (i = 0; i < size; i += 16) {
                pr_debug("%03x: %08x %08x %08x %08x\n", offset, be32_to_cpu(p[0]),
                         be32_to_cpu(p[1]), be32_to_cpu(p[2]),
                         be32_to_cpu(p[3]));
                p += 4;
                offset += 16;
        }
        if (!data_only)
                pr_debug("\n");
}

enum {
        MLX5_DRIVER_STATUS_ABORTED = 0xfe,
        MLX5_DRIVER_SYND = 0xbadd00de,
};

static int mlx5_internal_err_ret_value(struct mlx5_core_dev *dev, u16 op,
                                       u32 *synd, u8 *status)
{
        *synd = 0;
        *status = 0;

        switch (op) {
        case MLX5_CMD_OP_TEARDOWN_HCA:
        case MLX5_CMD_OP_DISABLE_HCA:
        case MLX5_CMD_OP_MANAGE_PAGES:
        case MLX5_CMD_OP_DESTROY_MKEY:
        case MLX5_CMD_OP_DESTROY_EQ:
        case MLX5_CMD_OP_DESTROY_CQ:
        case MLX5_CMD_OP_DESTROY_QP:
        case MLX5_CMD_OP_DESTROY_PSV:
        case MLX5_CMD_OP_DESTROY_SRQ:
        case MLX5_CMD_OP_DESTROY_XRC_SRQ:
        case MLX5_CMD_OP_DESTROY_DCT:
        case MLX5_CMD_OP_DEALLOC_Q_COUNTER:
        case MLX5_CMD_OP_DEALLOC_PD:
        case MLX5_CMD_OP_DEALLOC_UAR:
        case MLX5_CMD_OP_DETACH_FROM_MCG:
        case MLX5_CMD_OP_DEALLOC_XRCD:
        case MLX5_CMD_OP_DEALLOC_TRANSPORT_DOMAIN:
        case MLX5_CMD_OP_DELETE_VXLAN_UDP_DPORT:
        case MLX5_CMD_OP_DELETE_L2_TABLE_ENTRY:
        case MLX5_CMD_OP_DESTROY_TIR:
        case MLX5_CMD_OP_DESTROY_SQ:
        case MLX5_CMD_OP_DESTROY_RQ:
        case MLX5_CMD_OP_DESTROY_RMP:
        case MLX5_CMD_OP_DESTROY_TIS:
        case MLX5_CMD_OP_DESTROY_RQT:
        case MLX5_CMD_OP_DESTROY_FLOW_TABLE:
        case MLX5_CMD_OP_DESTROY_FLOW_GROUP:
        case MLX5_CMD_OP_DELETE_FLOW_TABLE_ENTRY:
        case MLX5_CMD_OP_2ERR_QP:
        case MLX5_CMD_OP_2RST_QP:
        case MLX5_CMD_OP_MODIFY_NIC_VPORT_CONTEXT:
        case MLX5_CMD_OP_MODIFY_FLOW_TABLE:
        case MLX5_CMD_OP_SET_FLOW_TABLE_ENTRY:
        case MLX5_CMD_OP_SET_FLOW_TABLE_ROOT:
        case MLX5_CMD_OP_DESTROY_GENERAL_OBJ:
                return MLX5_CMD_STAT_OK;

        case MLX5_CMD_OP_QUERY_HCA_CAP:
        case MLX5_CMD_OP_QUERY_ADAPTER:
        case MLX5_CMD_OP_INIT_HCA:
        case MLX5_CMD_OP_ENABLE_HCA:
        case MLX5_CMD_OP_QUERY_PAGES:
        case MLX5_CMD_OP_SET_HCA_CAP:
        case MLX5_CMD_OP_QUERY_ISSI:
        case MLX5_CMD_OP_SET_ISSI:
        case MLX5_CMD_OP_CREATE_MKEY:
        case MLX5_CMD_OP_QUERY_MKEY:
        case MLX5_CMD_OP_QUERY_SPECIAL_CONTEXTS:
        case MLX5_CMD_OP_PAGE_FAULT_RESUME:
        case MLX5_CMD_OP_CREATE_EQ:
        case MLX5_CMD_OP_QUERY_EQ:
        case MLX5_CMD_OP_GEN_EQE:
        case MLX5_CMD_OP_CREATE_CQ:
        case MLX5_CMD_OP_QUERY_CQ:
        case MLX5_CMD_OP_MODIFY_CQ:
        case MLX5_CMD_OP_CREATE_QP:
        case MLX5_CMD_OP_RST2INIT_QP:
        case MLX5_CMD_OP_INIT2RTR_QP:
        case MLX5_CMD_OP_RTR2RTS_QP:
        case MLX5_CMD_OP_RTS2RTS_QP:
        case MLX5_CMD_OP_SQERR2RTS_QP:
        case MLX5_CMD_OP_QUERY_QP:
        case MLX5_CMD_OP_SQD_RTS_QP:
        case MLX5_CMD_OP_INIT2INIT_QP:
        case MLX5_CMD_OP_CREATE_PSV:
        case MLX5_CMD_OP_CREATE_SRQ:
        case MLX5_CMD_OP_QUERY_SRQ:
        case MLX5_CMD_OP_ARM_RQ:
        case MLX5_CMD_OP_CREATE_XRC_SRQ:
        case MLX5_CMD_OP_QUERY_XRC_SRQ:
        case MLX5_CMD_OP_ARM_XRC_SRQ:
        case MLX5_CMD_OP_CREATE_DCT:
        case MLX5_CMD_OP_DRAIN_DCT:
        case MLX5_CMD_OP_QUERY_DCT:
        case MLX5_CMD_OP_ARM_DCT_FOR_KEY_VIOLATION:
        case MLX5_CMD_OP_QUERY_VPORT_STATE:
        case MLX5_CMD_OP_MODIFY_VPORT_STATE:
        case MLX5_CMD_OP_QUERY_ESW_VPORT_CONTEXT:
        case MLX5_CMD_OP_MODIFY_ESW_VPORT_CONTEXT:
        case MLX5_CMD_OP_QUERY_NIC_VPORT_CONTEXT:
        case MLX5_CMD_OP_QUERY_ROCE_ADDRESS:
        case MLX5_CMD_OP_SET_ROCE_ADDRESS:
        case MLX5_CMD_OP_QUERY_HCA_VPORT_CONTEXT:
        case MLX5_CMD_OP_MODIFY_HCA_VPORT_CONTEXT:
        case MLX5_CMD_OP_QUERY_HCA_VPORT_GID:
        case MLX5_CMD_OP_QUERY_HCA_VPORT_PKEY:
        case MLX5_CMD_OP_QUERY_VNIC_ENV:
        case MLX5_CMD_OP_QUERY_VPORT_COUNTER:
        case MLX5_CMD_OP_ALLOC_Q_COUNTER:
        case MLX5_CMD_OP_QUERY_Q_COUNTER:
        case MLX5_CMD_OP_QUERY_FLOW_COUNTER:
        case MLX5_CMD_OP_ALLOC_PD:
        case MLX5_CMD_OP_ALLOC_UAR:
        case MLX5_CMD_OP_CONFIG_INT_MODERATION:
        case MLX5_CMD_OP_ACCESS_REG:
        case MLX5_CMD_OP_ATTACH_TO_MCG:
        case MLX5_CMD_OP_GET_DROPPED_PACKET_LOG:
        case MLX5_CMD_OP_MAD_IFC:
        case MLX5_CMD_OP_QUERY_MAD_DEMUX:
        case MLX5_CMD_OP_SET_MAD_DEMUX:
        case MLX5_CMD_OP_NOP:
        case MLX5_CMD_OP_ALLOC_XRCD:
        case MLX5_CMD_OP_ALLOC_TRANSPORT_DOMAIN:
        case MLX5_CMD_OP_QUERY_CONG_STATUS:
        case MLX5_CMD_OP_MODIFY_CONG_STATUS:
        case MLX5_CMD_OP_QUERY_CONG_PARAMS:
        case MLX5_CMD_OP_MODIFY_CONG_PARAMS:
        case MLX5_CMD_OP_QUERY_CONG_STATISTICS:
        case MLX5_CMD_OP_ADD_VXLAN_UDP_DPORT:
        case MLX5_CMD_OP_SET_L2_TABLE_ENTRY:
        case MLX5_CMD_OP_QUERY_L2_TABLE_ENTRY:
        case MLX5_CMD_OP_CREATE_TIR:
        case MLX5_CMD_OP_MODIFY_TIR:
        case MLX5_CMD_OP_QUERY_TIR:
        case MLX5_CMD_OP_CREATE_SQ:
        case MLX5_CMD_OP_MODIFY_SQ:
        case MLX5_CMD_OP_QUERY_SQ:
        case MLX5_CMD_OP_CREATE_RQ:
        case MLX5_CMD_OP_MODIFY_RQ:
        case MLX5_CMD_OP_QUERY_RQ:
        case MLX5_CMD_OP_CREATE_RMP:
        case MLX5_CMD_OP_MODIFY_RMP:
        case MLX5_CMD_OP_QUERY_RMP:
        case MLX5_CMD_OP_CREATE_TIS:
        case MLX5_CMD_OP_MODIFY_TIS:
        case MLX5_CMD_OP_QUERY_TIS:
        case MLX5_CMD_OP_CREATE_RQT:
        case MLX5_CMD_OP_MODIFY_RQT:
        case MLX5_CMD_OP_QUERY_RQT:
        case MLX5_CMD_OP_CREATE_FLOW_TABLE:
        case MLX5_CMD_OP_QUERY_FLOW_TABLE:
        case MLX5_CMD_OP_CREATE_FLOW_GROUP:
        case MLX5_CMD_OP_QUERY_FLOW_GROUP:
        case MLX5_CMD_OP_QUERY_FLOW_TABLE_ENTRY:
        case MLX5_CMD_OP_CREATE_GENERAL_OBJ:
        case MLX5_CMD_OP_MODIFY_GENERAL_OBJ:
        case MLX5_CMD_OP_QUERY_GENERAL_OBJ:
                *status = MLX5_DRIVER_STATUS_ABORTED;
                *synd = MLX5_DRIVER_SYND;
                return -EIO;
        default:
                mlx5_core_err(dev, "Unknown FW command (%d)\n", op);
                return -EINVAL;
        }
}

const char *mlx5_command_str(int command)
{
        #define MLX5_COMMAND_STR_CASE(__cmd) case MLX5_CMD_OP_ ## __cmd: return #__cmd

        switch (command) {
        MLX5_COMMAND_STR_CASE(QUERY_HCA_CAP);
        MLX5_COMMAND_STR_CASE(SET_HCA_CAP);
        MLX5_COMMAND_STR_CASE(QUERY_ADAPTER);
        MLX5_COMMAND_STR_CASE(INIT_HCA);
        MLX5_COMMAND_STR_CASE(TEARDOWN_HCA);
        MLX5_COMMAND_STR_CASE(ENABLE_HCA);
        MLX5_COMMAND_STR_CASE(DISABLE_HCA);
        MLX5_COMMAND_STR_CASE(QUERY_PAGES);
        MLX5_COMMAND_STR_CASE(MANAGE_PAGES);
        MLX5_COMMAND_STR_CASE(QUERY_ISSI);
        MLX5_COMMAND_STR_CASE(SET_ISSI);
        MLX5_COMMAND_STR_CASE(CREATE_MKEY);
        MLX5_COMMAND_STR_CASE(QUERY_MKEY);
        MLX5_COMMAND_STR_CASE(DESTROY_MKEY);
        MLX5_COMMAND_STR_CASE(QUERY_SPECIAL_CONTEXTS);
        MLX5_COMMAND_STR_CASE(PAGE_FAULT_RESUME);
        MLX5_COMMAND_STR_CASE(CREATE_EQ);
        MLX5_COMMAND_STR_CASE(DESTROY_EQ);
        MLX5_COMMAND_STR_CASE(QUERY_EQ);
        MLX5_COMMAND_STR_CASE(GEN_EQE);
        MLX5_COMMAND_STR_CASE(CREATE_CQ);
        MLX5_COMMAND_STR_CASE(DESTROY_CQ);
        MLX5_COMMAND_STR_CASE(QUERY_CQ);
        MLX5_COMMAND_STR_CASE(MODIFY_CQ);
        MLX5_COMMAND_STR_CASE(CREATE_QP);
        MLX5_COMMAND_STR_CASE(DESTROY_QP);
        MLX5_COMMAND_STR_CASE(RST2INIT_QP);
        MLX5_COMMAND_STR_CASE(INIT2RTR_QP);
        MLX5_COMMAND_STR_CASE(RTR2RTS_QP);
        MLX5_COMMAND_STR_CASE(RTS2RTS_QP);
        MLX5_COMMAND_STR_CASE(SQERR2RTS_QP);
        MLX5_COMMAND_STR_CASE(2ERR_QP);
        MLX5_COMMAND_STR_CASE(2RST_QP);
        MLX5_COMMAND_STR_CASE(QUERY_QP);
        MLX5_COMMAND_STR_CASE(SQD_RTS_QP);
        MLX5_COMMAND_STR_CASE(MAD_IFC);
        MLX5_COMMAND_STR_CASE(INIT2INIT_QP);
        MLX5_COMMAND_STR_CASE(CREATE_PSV);
        MLX5_COMMAND_STR_CASE(DESTROY_PSV);
        MLX5_COMMAND_STR_CASE(CREATE_SRQ);
        MLX5_COMMAND_STR_CASE(DESTROY_SRQ);
        MLX5_COMMAND_STR_CASE(QUERY_SRQ);
        MLX5_COMMAND_STR_CASE(ARM_RQ);
        MLX5_COMMAND_STR_CASE(CREATE_XRC_SRQ);
        MLX5_COMMAND_STR_CASE(DESTROY_XRC_SRQ);
        MLX5_COMMAND_STR_CASE(QUERY_XRC_SRQ);
        MLX5_COMMAND_STR_CASE(ARM_XRC_SRQ);
        MLX5_COMMAND_STR_CASE(CREATE_DCT);
        MLX5_COMMAND_STR_CASE(SET_DC_CNAK_TRACE);
        MLX5_COMMAND_STR_CASE(DESTROY_DCT);
        MLX5_COMMAND_STR_CASE(DRAIN_DCT);
        MLX5_COMMAND_STR_CASE(QUERY_DCT);
        MLX5_COMMAND_STR_CASE(ARM_DCT_FOR_KEY_VIOLATION);
        MLX5_COMMAND_STR_CASE(QUERY_VPORT_STATE);
        MLX5_COMMAND_STR_CASE(MODIFY_VPORT_STATE);
        MLX5_COMMAND_STR_CASE(QUERY_ESW_VPORT_CONTEXT);
        MLX5_COMMAND_STR_CASE(MODIFY_ESW_VPORT_CONTEXT);
        MLX5_COMMAND_STR_CASE(QUERY_NIC_VPORT_CONTEXT);
        MLX5_COMMAND_STR_CASE(MODIFY_NIC_VPORT_CONTEXT);
        MLX5_COMMAND_STR_CASE(QUERY_ROCE_ADDRESS);
        MLX5_COMMAND_STR_CASE(SET_ROCE_ADDRESS);
        MLX5_COMMAND_STR_CASE(QUERY_HCA_VPORT_CONTEXT);
        MLX5_COMMAND_STR_CASE(MODIFY_HCA_VPORT_CONTEXT);
        MLX5_COMMAND_STR_CASE(QUERY_HCA_VPORT_GID);
        MLX5_COMMAND_STR_CASE(QUERY_HCA_VPORT_PKEY);
        MLX5_COMMAND_STR_CASE(QUERY_VNIC_ENV);
        MLX5_COMMAND_STR_CASE(QUERY_VPORT_COUNTER);
        MLX5_COMMAND_STR_CASE(SET_WOL_ROL);
        MLX5_COMMAND_STR_CASE(QUERY_WOL_ROL);
        MLX5_COMMAND_STR_CASE(ALLOC_Q_COUNTER);
        MLX5_COMMAND_STR_CASE(DEALLOC_Q_COUNTER);
        MLX5_COMMAND_STR_CASE(QUERY_Q_COUNTER);
        MLX5_COMMAND_STR_CASE(ALLOC_PD);
        MLX5_COMMAND_STR_CASE(DEALLOC_PD);
        MLX5_COMMAND_STR_CASE(ALLOC_UAR);
        MLX5_COMMAND_STR_CASE(DEALLOC_UAR);
        MLX5_COMMAND_STR_CASE(CONFIG_INT_MODERATION);
        MLX5_COMMAND_STR_CASE(ATTACH_TO_MCG);
        MLX5_COMMAND_STR_CASE(DETACH_FROM_MCG);
        MLX5_COMMAND_STR_CASE(GET_DROPPED_PACKET_LOG);
        MLX5_COMMAND_STR_CASE(QUERY_MAD_DEMUX);
        MLX5_COMMAND_STR_CASE(SET_MAD_DEMUX);
        MLX5_COMMAND_STR_CASE(NOP);
        MLX5_COMMAND_STR_CASE(ALLOC_XRCD);
        MLX5_COMMAND_STR_CASE(DEALLOC_XRCD);
        MLX5_COMMAND_STR_CASE(ALLOC_TRANSPORT_DOMAIN);
        MLX5_COMMAND_STR_CASE(DEALLOC_TRANSPORT_DOMAIN);
        MLX5_COMMAND_STR_CASE(QUERY_CONG_STATUS);
        MLX5_COMMAND_STR_CASE(MODIFY_CONG_STATUS);
        MLX5_COMMAND_STR_CASE(QUERY_CONG_PARAMS);
        MLX5_COMMAND_STR_CASE(MODIFY_CONG_PARAMS);
        MLX5_COMMAND_STR_CASE(QUERY_CONG_STATISTICS);
        MLX5_COMMAND_STR_CASE(ADD_VXLAN_UDP_DPORT);
        MLX5_COMMAND_STR_CASE(DELETE_VXLAN_UDP_DPORT);
        MLX5_COMMAND_STR_CASE(SET_L2_TABLE_ENTRY);
        MLX5_COMMAND_STR_CASE(QUERY_L2_TABLE_ENTRY);
        MLX5_COMMAND_STR_CASE(DELETE_L2_TABLE_ENTRY);
        MLX5_COMMAND_STR_CASE(CREATE_RMP);
        MLX5_COMMAND_STR_CASE(MODIFY_RMP);
        MLX5_COMMAND_STR_CASE(DESTROY_RMP);
        MLX5_COMMAND_STR_CASE(QUERY_RMP);
        MLX5_COMMAND_STR_CASE(CREATE_RQT);
        MLX5_COMMAND_STR_CASE(MODIFY_RQT);
        MLX5_COMMAND_STR_CASE(DESTROY_RQT);
        MLX5_COMMAND_STR_CASE(QUERY_RQT);
        MLX5_COMMAND_STR_CASE(ACCESS_REG);
        MLX5_COMMAND_STR_CASE(CREATE_SQ);
        MLX5_COMMAND_STR_CASE(MODIFY_SQ);
        MLX5_COMMAND_STR_CASE(DESTROY_SQ);
        MLX5_COMMAND_STR_CASE(QUERY_SQ);
        MLX5_COMMAND_STR_CASE(CREATE_RQ);
        MLX5_COMMAND_STR_CASE(MODIFY_RQ);
        MLX5_COMMAND_STR_CASE(DESTROY_RQ);
        MLX5_COMMAND_STR_CASE(QUERY_RQ);
        MLX5_COMMAND_STR_CASE(CREATE_TIR);
        MLX5_COMMAND_STR_CASE(MODIFY_TIR);
        MLX5_COMMAND_STR_CASE(DESTROY_TIR);
        MLX5_COMMAND_STR_CASE(QUERY_TIR);
        MLX5_COMMAND_STR_CASE(CREATE_TIS);
        MLX5_COMMAND_STR_CASE(MODIFY_TIS);
        MLX5_COMMAND_STR_CASE(DESTROY_TIS);
        MLX5_COMMAND_STR_CASE(QUERY_TIS);
        MLX5_COMMAND_STR_CASE(CREATE_FLOW_TABLE);
        MLX5_COMMAND_STR_CASE(DESTROY_FLOW_TABLE);
        MLX5_COMMAND_STR_CASE(QUERY_FLOW_TABLE);
        MLX5_COMMAND_STR_CASE(CREATE_FLOW_GROUP);
        MLX5_COMMAND_STR_CASE(DESTROY_FLOW_GROUP);
        MLX5_COMMAND_STR_CASE(QUERY_FLOW_GROUP);
        MLX5_COMMAND_STR_CASE(SET_FLOW_TABLE_ENTRY);
        MLX5_COMMAND_STR_CASE(QUERY_FLOW_TABLE_ENTRY);
        MLX5_COMMAND_STR_CASE(DELETE_FLOW_TABLE_ENTRY);
        MLX5_COMMAND_STR_CASE(SET_DIAGNOSTICS);
        MLX5_COMMAND_STR_CASE(QUERY_DIAGNOSTICS);
        MLX5_COMMAND_STR_CASE(CREATE_GENERAL_OBJ);
        MLX5_COMMAND_STR_CASE(MODIFY_GENERAL_OBJ);
        MLX5_COMMAND_STR_CASE(QUERY_GENERAL_OBJ);
        MLX5_COMMAND_STR_CASE(DESTROY_GENERAL_OBJ);
        MLX5_COMMAND_STR_CASE(ALLOC_FLOW_COUNTER);
        MLX5_COMMAND_STR_CASE(DEALLOC_FLOW_COUNTER);
        MLX5_COMMAND_STR_CASE(QUERY_FLOW_COUNTER);
        default: return "unknown command opcode";
        }
}

static const char *cmd_status_str(u8 status)
{
        switch (status) {
        case MLX5_CMD_STAT_OK:
                return "OK";
        case MLX5_CMD_STAT_INT_ERR:
                return "internal error";
        case MLX5_CMD_STAT_BAD_OP_ERR:
                return "bad operation";
        case MLX5_CMD_STAT_BAD_PARAM_ERR:
                return "bad parameter";
        case MLX5_CMD_STAT_BAD_SYS_STATE_ERR:
                return "bad system state";
        case MLX5_CMD_STAT_BAD_RES_ERR:
                return "bad resource";
        case MLX5_CMD_STAT_RES_BUSY:
                return "resource busy";
        case MLX5_CMD_STAT_LIM_ERR:
                return "limits exceeded";
        case MLX5_CMD_STAT_BAD_RES_STATE_ERR:
                return "bad resource state";
        case MLX5_CMD_STAT_IX_ERR:
                return "bad index";
        case MLX5_CMD_STAT_NO_RES_ERR:
                return "no resources";
        case MLX5_CMD_STAT_BAD_INP_LEN_ERR:
                return "bad input length";
        case MLX5_CMD_STAT_BAD_OUTP_LEN_ERR:
                return "bad output length";
        case MLX5_CMD_STAT_BAD_QP_STATE_ERR:
                return "bad QP state";
        case MLX5_CMD_STAT_BAD_PKT_ERR:
                return "bad packet (discarded)";
        case MLX5_CMD_STAT_BAD_SIZE_OUTS_CQES_ERR:
                return "bad size too many outstanding CQEs";
        default:
                return "unknown status";
        }
}

static int cmd_status_to_err_helper(u8 status)
{
        switch (status) {
        case MLX5_CMD_STAT_OK:                          return 0;
        case MLX5_CMD_STAT_INT_ERR:                     return -EIO;
        case MLX5_CMD_STAT_BAD_OP_ERR:                  return -EINVAL;
        case MLX5_CMD_STAT_BAD_PARAM_ERR:               return -EINVAL;
        case MLX5_CMD_STAT_BAD_SYS_STATE_ERR:           return -EIO;
        case MLX5_CMD_STAT_BAD_RES_ERR:                 return -EINVAL;
        case MLX5_CMD_STAT_RES_BUSY:                    return -EBUSY;
        case MLX5_CMD_STAT_LIM_ERR:                     return -ENOMEM;
        case MLX5_CMD_STAT_BAD_RES_STATE_ERR:           return -EINVAL;
        case MLX5_CMD_STAT_IX_ERR:                      return -EINVAL;
        case MLX5_CMD_STAT_NO_RES_ERR:                  return -EAGAIN;
        case MLX5_CMD_STAT_BAD_INP_LEN_ERR:             return -EIO;
        case MLX5_CMD_STAT_BAD_OUTP_LEN_ERR:            return -EIO;
        case MLX5_CMD_STAT_BAD_QP_STATE_ERR:            return -EINVAL;
        case MLX5_CMD_STAT_BAD_PKT_ERR:                 return -EINVAL;
        case MLX5_CMD_STAT_BAD_SIZE_OUTS_CQES_ERR:      return -EINVAL;
        default:                                        return -EIO;
        }
}

void mlx5_cmd_mbox_status(void *out, u8 *status, u32 *syndrome)
{
        *status = MLX5_GET(mbox_out, out, status);
        *syndrome = MLX5_GET(mbox_out, out, syndrome);
}

static int mlx5_cmd_check(struct mlx5_core_dev *dev, void *in, void *out)
{
        u32 syndrome;
        u8  status;
        u16 opcode;
        u16 op_mod;

        mlx5_cmd_mbox_status(out, &status, &syndrome);
        if (!status)
                return 0;

        opcode = MLX5_GET(mbox_in, in, opcode);
        op_mod = MLX5_GET(mbox_in, in, op_mod);

        mlx5_core_err(dev,
                      "%s(0x%x) op_mod(0x%x) failed, status %s(0x%x), syndrome (0x%x)\n",
                       mlx5_command_str(opcode),
                       opcode, op_mod,
                       cmd_status_str(status),
                       status,
                       syndrome);

        return cmd_status_to_err_helper(status);
}

static void dump_command(struct mlx5_core_dev *dev,
                         struct mlx5_cmd_work_ent *ent, int input)
{
        struct mlx5_cmd_msg *msg = input ? ent->in : ent->out;
        u16 op = MLX5_GET(mbox_in, ent->lay->in, opcode);
        size_t i;
        int data_only;
        int offset = 0;
        int msg_len = input ? ent->uin_size : ent->uout_size;
        int dump_len;

        data_only = !!(mlx5_core_debug_mask & (1 << MLX5_CMD_DATA));

        if (data_only)
                mlx5_core_dbg_mask(dev, 1 << MLX5_CMD_DATA,
                                   "dump command data %s(0x%x) %s\n",
                                   mlx5_command_str(op), op,
                                   input ? "INPUT" : "OUTPUT");
        else
                mlx5_core_dbg(dev, "dump command %s(0x%x) %s\n",
                              mlx5_command_str(op), op,
                              input ? "INPUT" : "OUTPUT");

        if (data_only) {
                if (input) {
                        dump_buf(ent->lay->in, sizeof(ent->lay->in), 1, offset);
                        offset += sizeof(ent->lay->in);
                } else {
                        dump_buf(ent->lay->out, sizeof(ent->lay->out), 1, offset);
                        offset += sizeof(ent->lay->out);
                }
        } else {
                dump_buf(ent->lay, sizeof(*ent->lay), 0, offset);
                offset += sizeof(*ent->lay);
        }

        for (i = 0; i != (msg->numpages * MLX5_NUM_CMDS_IN_ADAPTER_PAGE); i++) {
                struct mlx5_cmd_prot_block *block;

                block = mlx5_fwp_get_virt(msg, i * MLX5_CMD_MBOX_SIZE);

                if (data_only) {
                        if (offset >= msg_len)
                                break;
                        dump_len = min_t(int,
                            MLX5_CMD_DATA_BLOCK_SIZE, msg_len - offset);

                        dump_buf(block->data, dump_len, 1, offset);
                        offset += MLX5_CMD_DATA_BLOCK_SIZE;
                } else {
                        mlx5_core_dbg(dev, "command block:\n");
                        dump_buf(block, sizeof(*block), 0, offset);
                        offset += sizeof(*block);
                }

                /* check for last block */
                if (block->next == 0)
                        break;
        }

        if (data_only)
                pr_debug("\n");
}

static u16 msg_to_opcode(struct mlx5_cmd_msg *in)
{
        return MLX5_GET(mbox_in, in->first.data, opcode);
}

static void cb_timeout_handler(struct work_struct *work)
{
        struct delayed_work *dwork = container_of(work, struct delayed_work,
                                                  work);
        struct mlx5_cmd_work_ent *ent = container_of(dwork,
                                                     struct mlx5_cmd_work_ent,
                                                     cb_timeout_work);
        struct mlx5_core_dev *dev = container_of(ent->cmd, struct mlx5_core_dev,
                                                 cmd);

        ent->ret = -ETIMEDOUT;
        mlx5_core_warn(dev, "%s(0x%x) timeout. Will cause a leak of a command resource\n",
                       mlx5_command_str(msg_to_opcode(ent->in)),
                       msg_to_opcode(ent->in));
        mlx5_cmd_comp_handler(dev, 1UL << ent->idx, MLX5_CMD_MODE_EVENTS);
}

static void
cmd_free_work(struct work_struct *work)
{
        struct mlx5_cmd_work_ent *ent = container_of(work,
            struct mlx5_cmd_work_ent, freew);

        free_cmd(ent);
}

static void complete_command(struct mlx5_cmd_work_ent *ent)
{
        struct mlx5_cmd *cmd = ent->cmd;
        struct mlx5_core_dev *dev = container_of(cmd, struct mlx5_core_dev,
                                                 cmd);
        mlx5_cmd_cbk_t callback;
        void *context;

        s64 ds;
        struct mlx5_cmd_stats *stats;
        unsigned long flags;
        int err;
        struct semaphore *sem;

        if (ent->page_queue)
                sem = &cmd->pages_sem;
        else
                sem = &cmd->sem;

        if (dev->state != MLX5_DEVICE_STATE_UP) {
                u8 status = 0;
                u32 drv_synd;

                ent->ret = mlx5_internal_err_ret_value(dev, msg_to_opcode(ent->in), &drv_synd, &status);
                MLX5_SET(mbox_out, ent->out, status, status);
                MLX5_SET(mbox_out, ent->out, syndrome, drv_synd);
        }

        if (ent->callback) {
                ds = ent->ts2 - ent->ts1;
                if (ent->op < ARRAY_SIZE(cmd->stats)) {
                        stats = &cmd->stats[ent->op];
                        spin_lock_irqsave(&stats->lock, flags);
                        stats->sum += ds;
                        ++stats->n;
                        spin_unlock_irqrestore(&stats->lock, flags);
                }

                callback = ent->callback;
                context = ent->context;
                err = ent->ret;
                if (!err) {
                        err = mlx5_copy_from_msg(ent->uout,
                                                 ent->out,
                                                 ent->uout_size);
                        err = err ? err : mlx5_cmd_check(dev,
                                                         ent->in->first.data,
                                                         ent->uout);
                }

                mlx5_free_cmd_msg(dev, ent->out);
                free_msg(dev, ent->in);

                err = err ? err : ent->status;
                INIT_WORK(&ent->freew, cmd_free_work);
                schedule_work(&ent->freew);
                callback(err, context);
        } else {
                complete(&ent->done);
        }
        up(sem);
}

static void cmd_work_handler(struct work_struct *work)
{
        struct mlx5_cmd_work_ent *ent = container_of(work, struct mlx5_cmd_work_ent, work);
        struct mlx5_cmd *cmd = ent->cmd;
        struct mlx5_core_dev *dev = container_of(cmd, struct mlx5_core_dev, cmd);
        unsigned long cb_timeout = msecs_to_jiffies(MLX5_CMD_TIMEOUT_MSEC);
        struct mlx5_cmd_layout *lay;
        struct semaphore *sem;
        bool poll_cmd = ent->polling;

        sem = ent->page_queue ? &cmd->pages_sem : &cmd->sem;
        down(sem);

        if (alloc_ent(ent) < 0) {
                complete_command(ent);
                return;
        }

        ent->token = alloc_token(cmd);
        lay = get_inst(cmd, ent->idx);
        ent->lay = lay;
        memset(lay, 0, sizeof(*lay));
        memcpy(lay->in, ent->in->first.data, sizeof(lay->in));
        ent->op = be32_to_cpu(lay->in[0]) >> 16;
        if (ent->in->numpages != 0)
                lay->in_ptr = cpu_to_be64(mlx5_fwp_get_dma(ent->in, 0));
        if (ent->out->numpages != 0)
                lay->out_ptr = cpu_to_be64(mlx5_fwp_get_dma(ent->out, 0));
        lay->inlen = cpu_to_be32(ent->uin_size);
        lay->outlen = cpu_to_be32(ent->uout_size);
        lay->type = MLX5_PCI_CMD_XPORT;
        lay->token = ent->token;
        lay->status_own = CMD_OWNER_HW;
        set_signature(ent, !cmd->checksum_disabled);
        dump_command(dev, ent, 1);
        ent->ts1 = ktime_get_ns();
        ent->busy = 0;
        if (ent->callback)
                schedule_delayed_work(&ent->cb_timeout_work, cb_timeout);

        /* ring doorbell after the descriptor is valid */
        mlx5_core_dbg(dev, "writing 0x%x to command doorbell\n", 1 << ent->idx);
        /* make sure data is written to RAM */
        mlx5_fwp_flush(cmd->cmd_page);
        iowrite32be(1 << ent->idx, &dev->iseg->cmd_dbell);
        mmiowb();

        /* if not in polling don't use ent after this point */
        if (poll_cmd) {
                poll_timeout(ent);
                /* make sure we read the descriptor after ownership is SW */
                mlx5_cmd_comp_handler(dev, 1U << ent->idx, MLX5_CMD_MODE_POLLING);
        }
}

static const char *deliv_status_to_str(u8 status)
{
        switch (status) {
        case MLX5_CMD_DELIVERY_STAT_OK:
                return "no errors";
        case MLX5_CMD_DELIVERY_STAT_SIGNAT_ERR:
                return "signature error";
        case MLX5_CMD_DELIVERY_STAT_TOK_ERR:
                return "token error";
        case MLX5_CMD_DELIVERY_STAT_BAD_BLK_NUM_ERR:
                return "bad block number";
        case MLX5_CMD_DELIVERY_STAT_OUT_PTR_ALIGN_ERR:
                return "output pointer not aligned to block size";
        case MLX5_CMD_DELIVERY_STAT_IN_PTR_ALIGN_ERR:
                return "input pointer not aligned to block size";
        case MLX5_CMD_DELIVERY_STAT_FW_ERR:
                return "firmware internal error";
        case MLX5_CMD_DELIVERY_STAT_IN_LENGTH_ERR:
                return "command input length error";
        case MLX5_CMD_DELIVERY_STAT_OUT_LENGTH_ERR:
                return "command output length error";
        case MLX5_CMD_DELIVERY_STAT_RES_FLD_NOT_CLR_ERR:
                return "reserved fields not cleared";
        case MLX5_CMD_DELIVERY_STAT_CMD_DESCR_ERR:
                return "bad command descriptor type";
        default:
                return "unknown status code";
        }
}

static int wait_func(struct mlx5_core_dev *dev, struct mlx5_cmd_work_ent *ent)
{
        unsigned long timeout = msecs_to_jiffies(MLX5_CMD_TIMEOUT_MSEC);
        int err;

        if (ent->polling) {
                wait_for_completion(&ent->done);
        } else if (!wait_for_completion_timeout(&ent->done, timeout)) {
                ent->ret = -ETIMEDOUT;
                mlx5_cmd_comp_handler(dev, 1UL << ent->idx, MLX5_CMD_MODE_EVENTS);
        }

        err = ent->ret;

        if (err == -ETIMEDOUT) {
                mlx5_core_warn(dev, "%s(0x%x) timeout. Will cause a leak of a command resource\n",
                               mlx5_command_str(msg_to_opcode(ent->in)),
                               msg_to_opcode(ent->in));
        }
        mlx5_core_dbg(dev, "err %d, delivery status %s(%d)\n",
                      err, deliv_status_to_str(ent->status), ent->status);

        return err;
}

/*  Notes:
 *    1. Callback functions may not sleep
 *    2. page queue commands do not support asynchrous completion
 */
static int mlx5_cmd_invoke(struct mlx5_core_dev *dev, struct mlx5_cmd_msg *in,
                           int uin_size,
                           struct mlx5_cmd_msg *out, void *uout, int uout_size,
                           mlx5_cmd_cbk_t callback,
                           void *context, int page_queue, u8 *status,
                           bool force_polling)
{
        struct mlx5_cmd *cmd = &dev->cmd;
        struct mlx5_cmd_work_ent *ent;
        struct mlx5_cmd_stats *stats;
        int err = 0;
        s64 ds;
        u16 op;

        if (callback && page_queue)
                return -EINVAL;

        ent = alloc_cmd(cmd, in, uin_size, out, uout, uout_size, callback,
                        context, page_queue);
        if (IS_ERR(ent))
                return PTR_ERR(ent);

        ent->polling = force_polling || (cmd->mode == MLX5_CMD_MODE_POLLING);

        if (!callback)
                init_completion(&ent->done);

        INIT_DELAYED_WORK(&ent->cb_timeout_work, cb_timeout_handler);
        INIT_WORK(&ent->work, cmd_work_handler);
        if (page_queue) {
                cmd_work_handler(&ent->work);
        } else if (!queue_work(dev->priv.health.wq_cmd, &ent->work)) {
                mlx5_core_warn(dev, "failed to queue work\n");
                err = -ENOMEM;
                goto out_free;
        }

        if (callback)
                goto out;

        err = wait_func(dev, ent);
        if (err == -ETIMEDOUT)
                goto out;

        ds = ent->ts2 - ent->ts1;
        op = MLX5_GET(mbox_in, in->first.data, opcode);
        if (op < ARRAY_SIZE(cmd->stats)) {
                stats = &cmd->stats[op];
                spin_lock_irq(&stats->lock);
                stats->sum += ds;
                ++stats->n;
                spin_unlock_irq(&stats->lock);
        }
        mlx5_core_dbg_mask(dev, 1 << MLX5_CMD_TIME,
                           "fw exec time for %s is %lld nsec\n",
                           mlx5_command_str(op), (long long)ds);
        *status = ent->status;
        free_cmd(ent);

        return err;

out_free:
        free_cmd(ent);
out:
        return err;
}

static int mlx5_copy_to_msg(struct mlx5_cmd_msg *to, void *from, size_t size)
{
        size_t delta;
        size_t i;

        if (to == NULL || from == NULL)
                return (-ENOMEM);

        delta = min_t(size_t, size, sizeof(to->first.data));
        memcpy(to->first.data, from, delta);
        from = (char *)from + delta;
        size -= delta;

        for (i = 0; size != 0; i++) {
                struct mlx5_cmd_prot_block *block;

                block = mlx5_fwp_get_virt(to, i * MLX5_CMD_MBOX_SIZE);

                delta = min_t(size_t, size, MLX5_CMD_DATA_BLOCK_SIZE);
                memcpy(block->data, from, delta);
                from = (char *)from + delta;
                size -= delta;
        }
        return (0);
}

static int mlx5_copy_from_msg(void *to, struct mlx5_cmd_msg *from, int size)
{
        size_t delta;
        size_t i;

        if (to == NULL || from == NULL)
                return (-ENOMEM);

        delta = min_t(size_t, size, sizeof(from->first.data));
        memcpy(to, from->first.data, delta);
        to = (char *)to + delta;
        size -= delta;

        for (i = 0; size != 0; i++) {
                struct mlx5_cmd_prot_block *block;

                block = mlx5_fwp_get_virt(from, i * MLX5_CMD_MBOX_SIZE);

                delta = min_t(size_t, size, MLX5_CMD_DATA_BLOCK_SIZE);
                memcpy(to, block->data, delta);
                to = (char *)to + delta;
                size -= delta;
        }
        return (0);
}

static struct mlx5_cmd_msg *
mlx5_alloc_cmd_msg(struct mlx5_core_dev *dev, gfp_t flags, size_t size)
{
        struct mlx5_cmd_msg *msg;
        size_t blen;
        size_t n;
        size_t i;

        blen = size - min_t(size_t, sizeof(msg->first.data), size);
        n = howmany(blen, MLX5_CMD_DATA_BLOCK_SIZE);

        msg = mlx5_fwp_alloc(dev, flags, howmany(n, MLX5_NUM_CMDS_IN_ADAPTER_PAGE));
        if (msg == NULL)
                return (ERR_PTR(-ENOMEM));

        for (i = 0; i != n; i++) {
                struct mlx5_cmd_prot_block *block;

                block = mlx5_fwp_get_virt(msg, i * MLX5_CMD_MBOX_SIZE);

                if (i != (n - 1)) {
                        memset(block, 0, MLX5_CMD_MBOX_SIZE);

                        u64 dma = mlx5_fwp_get_dma(msg, (i + 1) * MLX5_CMD_MBOX_SIZE);
                        block->next = cpu_to_be64(dma);
                } else {
                        /* Zero the rest of the page to satisfy KMSAN. */
                        memset(block, 0, MLX5_ADAPTER_PAGE_SIZE -
                            (i % MLX5_NUM_CMDS_IN_ADAPTER_PAGE) *
                            MLX5_CMD_MBOX_SIZE);
                }
                block->block_num = cpu_to_be32(i);
        }

        /* make sure initial data is written to RAM */
        mlx5_fwp_flush(msg);

        return (msg);
}

static void
mlx5_free_cmd_msg(struct mlx5_core_dev *dev, struct mlx5_cmd_msg *msg)
{

        mlx5_fwp_free(msg);
}

static void clean_debug_files(struct mlx5_core_dev *dev)
{
}


static void mlx5_cmd_change_mod(struct mlx5_core_dev *dev, int mode)
{
        struct mlx5_cmd *cmd = &dev->cmd;
        int i;

        if (cmd->mode == mode)
                return;

        for (i = 0; i < cmd->max_reg_cmds; i++)
                down(&cmd->sem);

        down(&cmd->pages_sem);
        cmd->mode = mode;

        up(&cmd->pages_sem);
        for (i = 0; i < cmd->max_reg_cmds; i++)
                up(&cmd->sem);
}

void mlx5_cmd_use_events(struct mlx5_core_dev *dev)
{
        mlx5_cmd_change_mod(dev, MLX5_CMD_MODE_EVENTS);
}

void mlx5_cmd_use_polling(struct mlx5_core_dev *dev)
{
        mlx5_cmd_change_mod(dev, MLX5_CMD_MODE_POLLING);
}

static void free_msg(struct mlx5_core_dev *dev, struct mlx5_cmd_msg *msg)
{
        unsigned long flags;

        if (msg->cache) {
                spin_lock_irqsave(&msg->cache->lock, flags);
                list_add_tail(&msg->list, &msg->cache->head);
                spin_unlock_irqrestore(&msg->cache->lock, flags);
        } else {
                mlx5_free_cmd_msg(dev, msg);
        }
}

void mlx5_cmd_comp_handler(struct mlx5_core_dev *dev, u64 vector_flags,
    enum mlx5_cmd_mode cmd_mode)
{
        struct mlx5_cmd *cmd = &dev->cmd;
        struct mlx5_cmd_work_ent *ent;
        bool triggered = (vector_flags & MLX5_TRIGGERED_CMD_COMP) ? 1 : 0;
        u32 vector = vector_flags; /* discard flags in the upper dword */
        int i;

        /* make sure data gets read from RAM */
        mlx5_fwp_invalidate(cmd->cmd_page);

        while (vector != 0) {
                i = ffs(vector) - 1;
                vector &= ~(1U << i);
                /* check command mode */
                if (cmd->ent_mode[i] != cmd_mode)
                        continue;
                ent = cmd->ent_arr[i];
                /* check if command was already handled */
                if (ent == NULL)
                        continue;
                if (ent->callback)
                        cancel_delayed_work(&ent->cb_timeout_work);
                ent->ts2 = ktime_get_ns();
                memcpy(ent->out->first.data, ent->lay->out,
                       sizeof(ent->lay->out));
                /* make sure data gets read from RAM */
                mlx5_fwp_invalidate(ent->out);
                dump_command(dev, ent, 0);
                if (!ent->ret) {
                        if (!cmd->checksum_disabled)
                                ent->ret = verify_signature(ent);
                        else
                                ent->ret = 0;

                        if (triggered)
                                ent->status = MLX5_DRIVER_STATUS_ABORTED;
                        else
                                ent->status = ent->lay->status_own >> 1;

                        mlx5_core_dbg(dev,
                                      "FW command ret 0x%x, status %s(0x%x)\n",
                                      ent->ret,
                                      deliv_status_to_str(ent->status),
                                      ent->status);
                }
                free_ent(cmd, ent->idx);
                complete_command(ent);
        }
}
EXPORT_SYMBOL(mlx5_cmd_comp_handler);

static int status_to_err(u8 status)
{
        return status ? -EIO : 0; /* TBD more meaningful codes */
}

static struct mlx5_cmd_msg *alloc_msg(struct mlx5_core_dev *dev, int in_size,
                                      gfp_t gfp)
{
        struct mlx5_cmd_msg *msg = ERR_PTR(-ENOMEM);
        struct mlx5_cmd *cmd = &dev->cmd;
        struct cache_ent *ent = NULL;

        if (in_size > MED_LIST_SIZE && in_size <= LONG_LIST_SIZE)
                ent = &cmd->cache.large;
        else if (in_size > 16 && in_size <= MED_LIST_SIZE)
                ent = &cmd->cache.med;

        if (ent) {
                spin_lock_irq(&ent->lock);
                if (!list_empty(&ent->head)) {
                        msg = list_entry(ent->head.next, struct mlx5_cmd_msg,
                                         list);
                        list_del(&msg->list);
                }
                spin_unlock_irq(&ent->lock);
        }

        if (IS_ERR(msg))
                msg = mlx5_alloc_cmd_msg(dev, gfp, in_size);

        return msg;
}

static int is_manage_pages(void *in)
{
        return MLX5_GET(mbox_in, in, opcode) == MLX5_CMD_OP_MANAGE_PAGES;
}

static int cmd_exec_helper(struct mlx5_core_dev *dev,
                           void *in, int in_size,
                           void *out, int out_size,
                           mlx5_cmd_cbk_t callback, void *context,
                           bool force_polling)
{
        struct mlx5_cmd_msg *inb;
        struct mlx5_cmd_msg *outb;
        int pages_queue;
        const gfp_t gfp = GFP_KERNEL;
        int err;
        u8 status = 0;
        u32 drv_synd;

        if (dev->state == MLX5_DEVICE_STATE_INTERNAL_ERROR) {
                u16 opcode = MLX5_GET(mbox_in, in, opcode);
                err = mlx5_internal_err_ret_value(dev, opcode, &drv_synd, &status);
                MLX5_SET(mbox_out, out, status, status);
                MLX5_SET(mbox_out, out, syndrome, drv_synd);
                return err;
        }

        pages_queue = is_manage_pages(in);

        inb = alloc_msg(dev, in_size, gfp);
        if (IS_ERR(inb)) {
                err = PTR_ERR(inb);
                return err;
        }

        err = mlx5_copy_to_msg(inb, in, in_size);
        if (err) {
                mlx5_core_warn(dev, "err %d\n", err);
                goto out_in;
        }

        outb = mlx5_alloc_cmd_msg(dev, gfp, out_size);
        if (IS_ERR(outb)) {
                err = PTR_ERR(outb);
                goto out_in;
        }

        err = mlx5_cmd_invoke(dev, inb, in_size, outb, out, out_size, callback,
                              context, pages_queue, &status, force_polling);
        if (err) {
                if (err == -ETIMEDOUT)
                        return err;
                goto out_out;
        }

        mlx5_core_dbg(dev, "err %d, status %d\n", err, status);
        if (status) {
                err = status_to_err(status);
                goto out_out;
        }

        if (callback)
                return err;

        err = mlx5_copy_from_msg(out, outb, out_size);

out_out:
        mlx5_free_cmd_msg(dev, outb);

out_in:
        free_msg(dev, inb);
        return err;
}

int mlx5_cmd_exec(struct mlx5_core_dev *dev, void *in, int in_size, void *out,
                  int out_size)
{
        int err;

        err = cmd_exec_helper(dev, in, in_size, out, out_size, NULL, NULL, false);
        return err ? : mlx5_cmd_check(dev, in, out);
}
EXPORT_SYMBOL(mlx5_cmd_exec);

void mlx5_cmd_init_async_ctx(struct mlx5_core_dev *dev,
                             struct mlx5_async_ctx *ctx)
{
        ctx->dev = dev;
        /* Starts at 1 to avoid doing wake_up if we are not cleaning up */
        atomic_set(&ctx->num_inflight, 1);
        init_waitqueue_head(&ctx->wait);
}
EXPORT_SYMBOL(mlx5_cmd_init_async_ctx);

/**
 * mlx5_cmd_cleanup_async_ctx - Clean up an async_ctx
 * @ctx: The ctx to clean
 *
 * Upon return all callbacks given to mlx5_cmd_exec_cb() have been called. The
 * caller must ensure that mlx5_cmd_exec_cb() is not called during or after
 * the call mlx5_cleanup_async_ctx().
 */
void mlx5_cmd_cleanup_async_ctx(struct mlx5_async_ctx *ctx)
{
        atomic_dec(&ctx->num_inflight);
        wait_event(ctx->wait, atomic_read(&ctx->num_inflight) == 0);
}
EXPORT_SYMBOL(mlx5_cmd_cleanup_async_ctx);

static void mlx5_cmd_exec_cb_handler(int status, void *_work)
{
        struct mlx5_async_work *work = _work;
        struct mlx5_async_ctx *ctx = work->ctx;

        work->user_callback(status, work);
        if (atomic_dec_and_test(&ctx->num_inflight))
                wake_up(&ctx->wait);
}

int mlx5_cmd_exec_cb(struct mlx5_async_ctx *ctx, void *in, int in_size,
                     void *out, int out_size, mlx5_async_cbk_t callback,
                     struct mlx5_async_work *work)
{
        int ret;

        work->ctx = ctx;
        work->user_callback = callback;
        if (WARN_ON(!atomic_inc_not_zero(&ctx->num_inflight)))
                return -EIO;
        ret = cmd_exec_helper(ctx->dev, in, in_size, out, out_size,
                              mlx5_cmd_exec_cb_handler, work, false);
        if (ret && atomic_dec_and_test(&ctx->num_inflight))
                wake_up(&ctx->wait);

        return ret;
}
EXPORT_SYMBOL(mlx5_cmd_exec_cb);

int mlx5_cmd_exec_polling(struct mlx5_core_dev *dev, void *in, int in_size,
                          void *out, int out_size)
{
        int err;

        err = cmd_exec_helper(dev, in, in_size, out, out_size, NULL, NULL, true);
        return err ? : mlx5_cmd_check(dev, in, out);
}
EXPORT_SYMBOL(mlx5_cmd_exec_polling);

static void destroy_msg_cache(struct mlx5_core_dev *dev)
{
        struct mlx5_cmd *cmd = &dev->cmd;
        struct mlx5_cmd_msg *msg;
        struct mlx5_cmd_msg *n;

        list_for_each_entry_safe(msg, n, &cmd->cache.large.head, list) {
                list_del(&msg->list);
                mlx5_free_cmd_msg(dev, msg);
        }

        list_for_each_entry_safe(msg, n, &cmd->cache.med.head, list) {
                list_del(&msg->list);
                mlx5_free_cmd_msg(dev, msg);
        }
}

static int create_msg_cache(struct mlx5_core_dev *dev)
{
        struct mlx5_cmd *cmd = &dev->cmd;
        struct mlx5_cmd_msg *msg;
        int err;
        int i;

        spin_lock_init(&cmd->cache.large.lock);
        INIT_LIST_HEAD(&cmd->cache.large.head);
        spin_lock_init(&cmd->cache.med.lock);
        INIT_LIST_HEAD(&cmd->cache.med.head);

        for (i = 0; i < NUM_LONG_LISTS; i++) {
                msg = mlx5_alloc_cmd_msg(dev, GFP_KERNEL, LONG_LIST_SIZE);
                if (IS_ERR(msg)) {
                        err = PTR_ERR(msg);
                        goto ex_err;
                }
                msg->cache = &cmd->cache.large;
                list_add_tail(&msg->list, &cmd->cache.large.head);
        }

        for (i = 0; i < NUM_MED_LISTS; i++) {
                msg = mlx5_alloc_cmd_msg(dev, GFP_KERNEL, MED_LIST_SIZE);
                if (IS_ERR(msg)) {
                        err = PTR_ERR(msg);
                        goto ex_err;
                }
                msg->cache = &cmd->cache.med;
                list_add_tail(&msg->list, &cmd->cache.med.head);
        }

        return 0;

ex_err:
        destroy_msg_cache(dev);
        return err;
}

static int
alloc_cmd_page(struct mlx5_core_dev *dev, struct mlx5_cmd *cmd)
{
        int err;

        sx_init(&cmd->dma_sx, "MLX5-DMA-SX");
        mtx_init(&cmd->dma_mtx, "MLX5-DMA-MTX", NULL, MTX_DEF);
        cv_init(&cmd->dma_cv, "MLX5-DMA-CV");

        /*
         * Create global DMA descriptor tag for allocating
         * 4K firmware pages:
         */
        err = -bus_dma_tag_create(
            bus_get_dma_tag(dev->pdev->dev.bsddev),
            MLX5_ADAPTER_PAGE_SIZE,     /* alignment */
            0,                          /* no boundary */
            BUS_SPACE_MAXADDR,          /* lowaddr */
            BUS_SPACE_MAXADDR,          /* highaddr */
            NULL, NULL,                 /* filter, filterarg */
            MLX5_ADAPTER_PAGE_SIZE,     /* maxsize */
            1,                          /* nsegments */
            MLX5_ADAPTER_PAGE_SIZE,     /* maxsegsize */
            0,                          /* flags */
            NULL, NULL,                 /* lockfunc, lockfuncarg */
            &cmd->dma_tag);
        if (err != 0)
                goto failure_destroy_sx;

        cmd->cmd_page = mlx5_fwp_alloc(dev, GFP_KERNEL, 1);
        if (cmd->cmd_page == NULL) {
                err = -ENOMEM;
                goto failure_alloc_page;
        }
        cmd->dma = mlx5_fwp_get_dma(cmd->cmd_page, 0);
        cmd->cmd_buf = mlx5_fwp_get_virt(cmd->cmd_page, 0);
        memset(cmd->cmd_buf, 0, MLX5_ADAPTER_PAGE_SIZE);
        return (0);

failure_alloc_page:
        bus_dma_tag_destroy(cmd->dma_tag);

failure_destroy_sx:
        cv_destroy(&cmd->dma_cv);
        mtx_destroy(&cmd->dma_mtx);
        sx_destroy(&cmd->dma_sx);
        return (err);
}

static void
free_cmd_page(struct mlx5_core_dev *dev, struct mlx5_cmd *cmd)
{

        mlx5_fwp_free(cmd->cmd_page);
        bus_dma_tag_destroy(cmd->dma_tag);
        cv_destroy(&cmd->dma_cv);
        mtx_destroy(&cmd->dma_mtx);
        sx_destroy(&cmd->dma_sx);
}

int mlx5_cmd_init(struct mlx5_core_dev *dev)
{
        struct mlx5_cmd *cmd = &dev->cmd;
        u32 cmd_h, cmd_l;
        u16 cmd_if_rev;
        int err;
        int i;

        memset(cmd, 0, sizeof(*cmd));
        cmd_if_rev = cmdif_rev_get(dev);
        if (cmd_if_rev != CMD_IF_REV) {
                mlx5_core_err(dev,
                    "Driver cmdif rev(%d) differs from firmware's(%d)\n",
                    CMD_IF_REV, cmd_if_rev);
                return -EINVAL;
        }

        err = alloc_cmd_page(dev, cmd);
        if (err)
                goto err_free_pool;

        cmd_l = ioread32be(&dev->iseg->cmdq_addr_l_sz) & 0xff;
        cmd->log_sz = cmd_l >> 4 & 0xf;
        cmd->log_stride = cmd_l & 0xf;
        if (1 << cmd->log_sz > MLX5_MAX_COMMANDS) {
                mlx5_core_err(dev,
                    "firmware reports too many outstanding commands %d\n",
                    1 << cmd->log_sz);
                err = -EINVAL;
                goto err_free_page;
        }

        if (cmd->log_sz + cmd->log_stride > MLX5_ADAPTER_PAGE_SHIFT) {
                mlx5_core_err(dev,
                    "command queue size overflow\n");
                err = -EINVAL;
                goto err_free_page;
        }

        cmd->checksum_disabled = 1;
        cmd->max_reg_cmds = (1 << cmd->log_sz) - 1;
        cmd->bitmask = (1 << cmd->max_reg_cmds) - 1;

        cmd->cmdif_rev = ioread32be(&dev->iseg->cmdif_rev_fw_sub) >> 16;
        if (cmd->cmdif_rev > CMD_IF_REV) {
                mlx5_core_err(dev,
                    "driver does not support command interface version. driver %d, firmware %d\n",
                    CMD_IF_REV, cmd->cmdif_rev);
                err = -ENOTSUPP;
                goto err_free_page;
        }

        spin_lock_init(&cmd->alloc_lock);
        spin_lock_init(&cmd->token_lock);
        for (i = 0; i < ARRAY_SIZE(cmd->stats); i++)
                spin_lock_init(&cmd->stats[i].lock);

        sema_init(&cmd->sem, cmd->max_reg_cmds);
        sema_init(&cmd->pages_sem, 1);

        cmd_h = (u32)((u64)(cmd->dma) >> 32);
        cmd_l = (u32)(cmd->dma);
        if (cmd_l & 0xfff) {
                mlx5_core_err(dev, "invalid command queue address\n");
                err = -ENOMEM;
                goto err_free_page;
        }

        iowrite32be(cmd_h, &dev->iseg->cmdq_addr_h);
        iowrite32be(cmd_l, &dev->iseg->cmdq_addr_l_sz);

        /* Make sure firmware sees the complete address before we proceed */
        wmb();

        mlx5_core_dbg(dev, "descriptor at dma 0x%llx\n", (unsigned long long)(cmd->dma));

        cmd->mode = MLX5_CMD_MODE_POLLING;

        err = create_msg_cache(dev);
        if (err) {
                mlx5_core_err(dev, "failed to create command cache\n");
                goto err_free_page;
        }
        return 0;

err_free_page:
        free_cmd_page(dev, cmd);

err_free_pool:
        return err;
}
EXPORT_SYMBOL(mlx5_cmd_init);

void mlx5_cmd_cleanup(struct mlx5_core_dev *dev)
{
        struct mlx5_cmd *cmd = &dev->cmd;

        clean_debug_files(dev);
        flush_workqueue(dev->priv.health.wq_cmd);
        destroy_msg_cache(dev);
        free_cmd_page(dev, cmd);
}
EXPORT_SYMBOL(mlx5_cmd_cleanup);

int mlx5_cmd_query_cong_counter(struct mlx5_core_dev *dev,
                                bool reset, void *out, int out_size)
{
        u32 in[MLX5_ST_SZ_DW(query_cong_statistics_in)] = { };

        MLX5_SET(query_cong_statistics_in, in, opcode,
                 MLX5_CMD_OP_QUERY_CONG_STATISTICS);
        MLX5_SET(query_cong_statistics_in, in, clear, reset);
        return mlx5_cmd_exec(dev, in, sizeof(in), out, out_size);
}
EXPORT_SYMBOL(mlx5_cmd_query_cong_counter);

int mlx5_cmd_query_cong_params(struct mlx5_core_dev *dev, int cong_point,
                               void *out, int out_size)
{
        u32 in[MLX5_ST_SZ_DW(query_cong_params_in)] = { };

        MLX5_SET(query_cong_params_in, in, opcode,
                 MLX5_CMD_OP_QUERY_CONG_PARAMS);
        MLX5_SET(query_cong_params_in, in, cong_protocol, cong_point);

        return mlx5_cmd_exec(dev, in, sizeof(in), out, out_size);
}
EXPORT_SYMBOL(mlx5_cmd_query_cong_params);

int mlx5_cmd_modify_cong_params(struct mlx5_core_dev *dev,
                                void *in, int in_size)
{
        u32 out[MLX5_ST_SZ_DW(modify_cong_params_out)] = { };

        return mlx5_cmd_exec(dev, in, in_size, out, sizeof(out));
}
EXPORT_SYMBOL(mlx5_cmd_modify_cong_params);

int mlx5_cmd_query_cong_status(struct mlx5_core_dev *dev, int cong_point,
                               int prio, void *out, int out_size)
{
        u32 in[MLX5_ST_SZ_DW(query_cong_status_in)] = { };

        MLX5_SET(query_cong_status_in, in, opcode,
                 MLX5_CMD_OP_QUERY_CONG_STATUS);
        MLX5_SET(query_cong_status_in, in, priority, prio);
        MLX5_SET(query_cong_status_in, in, cong_protocol, cong_point);

        return mlx5_cmd_exec(dev, in, sizeof(in), out, out_size);
}
EXPORT_SYMBOL(mlx5_cmd_query_cong_status);

int mlx5_cmd_modify_cong_status(struct mlx5_core_dev *dev,
                                void *in, int in_size)
{
        u32 out[MLX5_ST_SZ_DW(modify_cong_status_out)] = { };

        return mlx5_cmd_exec(dev, in, in_size, out, sizeof(out));
}
EXPORT_SYMBOL(mlx5_cmd_modify_cong_status);