root/drivers/infiniband/sw/rdmavt/vt.c
// SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause
/*
 * Copyright(c) 2016 - 2018 Intel Corporation.
 */

#include <linux/module.h>
#include <linux/kernel.h>
#include <linux/dma-mapping.h>
#include "vt.h"
#include "cq.h"
#include "trace.h"

#define RVT_UVERBS_ABI_VERSION 2

MODULE_LICENSE("Dual BSD/GPL");
MODULE_DESCRIPTION("RDMA Verbs Transport Library");

static int __init rvt_init(void)
{
        int ret = rvt_driver_cq_init();

        if (ret)
                pr_err("Error in driver CQ init.\n");

        return ret;
}
module_init(rvt_init);

static void __exit rvt_cleanup(void)
{
        rvt_cq_exit();
}
module_exit(rvt_cleanup);

/**
 * rvt_alloc_device - allocate rdi
 * @size: how big of a structure to allocate
 * @nports: number of ports to allocate array slots for
 *
 * Use IB core device alloc to allocate space for the rdi which is assumed to be
 * inside of the ib_device. Any extra space that drivers require should be
 * included in size.
 *
 * We also allocate a port array based on the number of ports.
 *
 * Return: pointer to allocated rdi
 */
struct rvt_dev_info *rvt_alloc_device(size_t size, int nports)
{
        struct rvt_dev_info *rdi;

        rdi = container_of(_ib_alloc_device(size, &init_net), struct rvt_dev_info, ibdev);
        if (!rdi)
                return rdi;

        rdi->ports = kzalloc_objs(*rdi->ports, nports);
        if (!rdi->ports)
                ib_dealloc_device(&rdi->ibdev);

        return rdi;
}
EXPORT_SYMBOL(rvt_alloc_device);

/**
 * rvt_dealloc_device - deallocate rdi
 * @rdi: structure to free
 *
 * Free a structure allocated with rvt_alloc_device()
 */
void rvt_dealloc_device(struct rvt_dev_info *rdi)
{
        kfree(rdi->ports);
        ib_dealloc_device(&rdi->ibdev);
}
EXPORT_SYMBOL(rvt_dealloc_device);

static int rvt_query_device(struct ib_device *ibdev,
                            struct ib_device_attr *props,
                            struct ib_udata *uhw)
{
        struct rvt_dev_info *rdi = ib_to_rvt(ibdev);

        if (uhw->inlen || uhw->outlen)
                return -EINVAL;
        /*
         * Return rvt_dev_info.dparms.props contents
         */
        *props = rdi->dparms.props;
        return 0;
}

static int rvt_get_numa_node(struct ib_device *ibdev)
{
        struct rvt_dev_info *rdi = ib_to_rvt(ibdev);

        return rdi->dparms.node;
}

static int rvt_modify_device(struct ib_device *device,
                             int device_modify_mask,
                             struct ib_device_modify *device_modify)
{
        /*
         * There is currently no need to supply this based on qib and hfi1.
         * Future drivers may need to implement this though.
         */

        return -EOPNOTSUPP;
}

/**
 * rvt_query_port - Passes the query port call to the driver
 * @ibdev: Verbs IB dev
 * @port_num: port number, 1 based from ib core
 * @props: structure to hold returned properties
 *
 * Return: 0 on success
 */
static int rvt_query_port(struct ib_device *ibdev, u32 port_num,
                          struct ib_port_attr *props)
{
        struct rvt_dev_info *rdi = ib_to_rvt(ibdev);
        struct rvt_ibport *rvp;
        u32 port_index = ibport_num_to_idx(ibdev, port_num);

        rvp = rdi->ports[port_index];
        /* props being zeroed by the caller, avoid zeroing it here */
        props->sm_lid = rvp->sm_lid;
        props->sm_sl = rvp->sm_sl;
        props->port_cap_flags = rvp->port_cap_flags;
        props->max_msg_sz = 0x80000000;
        props->pkey_tbl_len = rvt_get_npkeys(rdi);
        props->bad_pkey_cntr = rvp->pkey_violations;
        props->qkey_viol_cntr = rvp->qkey_violations;
        props->subnet_timeout = rvp->subnet_timeout;
        props->init_type_reply = 0;

        /* Populate the remaining ib_port_attr elements */
        return rdi->driver_f.query_port_state(rdi, port_num, props);
}

/**
 * rvt_modify_port - modify port
 * @ibdev: Verbs IB dev
 * @port_num: Port number, 1 based from ib core
 * @port_modify_mask: How to change the port
 * @props: Structure to fill in
 *
 * Return: 0 on success
 */
static int rvt_modify_port(struct ib_device *ibdev, u32 port_num,
                           int port_modify_mask, struct ib_port_modify *props)
{
        struct rvt_dev_info *rdi = ib_to_rvt(ibdev);
        struct rvt_ibport *rvp;
        int ret = 0;
        u32 port_index = ibport_num_to_idx(ibdev, port_num);

        rvp = rdi->ports[port_index];
        if (port_modify_mask & IB_PORT_OPA_MASK_CHG) {
                rvp->port_cap3_flags |= props->set_port_cap_mask;
                rvp->port_cap3_flags &= ~props->clr_port_cap_mask;
        } else {
                rvp->port_cap_flags |= props->set_port_cap_mask;
                rvp->port_cap_flags &= ~props->clr_port_cap_mask;
        }

        if (props->set_port_cap_mask || props->clr_port_cap_mask)
                rdi->driver_f.cap_mask_chg(rdi, port_num);
        if (port_modify_mask & IB_PORT_SHUTDOWN)
                ret = rdi->driver_f.shut_down_port(rdi, port_num);
        if (port_modify_mask & IB_PORT_RESET_QKEY_CNTR)
                rvp->qkey_violations = 0;

        return ret;
}

/**
 * rvt_query_pkey - Return a pkey from the table at a given index
 * @ibdev: Verbs IB dev
 * @port_num: Port number, 1 based from ib core
 * @index: Index into pkey table
 * @pkey: returned pkey from the port pkey table
 *
 * Return: 0 on failure pkey otherwise
 */
static int rvt_query_pkey(struct ib_device *ibdev, u32 port_num, u16 index,
                          u16 *pkey)
{
        /*
         * Driver will be responsible for keeping rvt_dev_info.pkey_table up to
         * date. This function will just return that value. There is no need to
         * lock, if a stale value is read and sent to the user so be it there is
         * no way to protect against that anyway.
         */
        struct rvt_dev_info *rdi = ib_to_rvt(ibdev);
        u32 port_index;

        port_index = ibport_num_to_idx(ibdev, port_num);

        if (index >= rvt_get_npkeys(rdi))
                return -EINVAL;

        *pkey = rvt_get_pkey(rdi, port_index, index);
        return 0;
}

/**
 * rvt_query_gid - Return a gid from the table
 * @ibdev: Verbs IB dev
 * @port_num: Port number, 1 based from ib core
 * @guid_index: Index in table
 * @gid: Gid to return
 *
 * Return: 0 on success
 */
static int rvt_query_gid(struct ib_device *ibdev, u32 port_num,
                         int guid_index, union ib_gid *gid)
{
        struct rvt_dev_info *rdi;
        struct rvt_ibport *rvp;
        u32 port_index;

        /*
         * Driver is responsible for updating the guid table. Which will be used
         * to craft the return value. This will work similar to how query_pkey()
         * is being done.
         */
        port_index = ibport_num_to_idx(ibdev, port_num);

        rdi = ib_to_rvt(ibdev);
        rvp = rdi->ports[port_index];

        gid->global.subnet_prefix = rvp->gid_prefix;

        return rdi->driver_f.get_guid_be(rdi, rvp, guid_index,
                                         &gid->global.interface_id);
}

/**
 * rvt_alloc_ucontext - Allocate a user context
 * @uctx: Verbs context
 * @udata: User data allocated
 */
static int rvt_alloc_ucontext(struct ib_ucontext *uctx, struct ib_udata *udata)
{
        return 0;
}

/**
 * rvt_dealloc_ucontext - Free a user context
 * @context: Unused
 */
static void rvt_dealloc_ucontext(struct ib_ucontext *context)
{
        return;
}

static int rvt_get_port_immutable(struct ib_device *ibdev, u32 port_num,
                                  struct ib_port_immutable *immutable)
{
        struct rvt_dev_info *rdi = ib_to_rvt(ibdev);
        struct ib_port_attr attr;
        int err;

        immutable->core_cap_flags = rdi->dparms.core_cap_flags;

        err = ib_query_port(ibdev, port_num, &attr);
        if (err)
                return err;

        immutable->pkey_tbl_len = attr.pkey_tbl_len;
        immutable->gid_tbl_len = attr.gid_tbl_len;
        immutable->max_mad_size = rdi->dparms.max_mad_size;

        return 0;
}

enum {
        MISC,
        QUERY_DEVICE,
        MODIFY_DEVICE,
        QUERY_PORT,
        MODIFY_PORT,
        QUERY_PKEY,
        QUERY_GID,
        ALLOC_UCONTEXT,
        DEALLOC_UCONTEXT,
        GET_PORT_IMMUTABLE,
        CREATE_QP,
        MODIFY_QP,
        DESTROY_QP,
        QUERY_QP,
        POST_SEND,
        POST_RECV,
        POST_SRQ_RECV,
        CREATE_AH,
        DESTROY_AH,
        MODIFY_AH,
        QUERY_AH,
        CREATE_SRQ,
        MODIFY_SRQ,
        DESTROY_SRQ,
        QUERY_SRQ,
        ATTACH_MCAST,
        DETACH_MCAST,
        GET_DMA_MR,
        REG_USER_MR,
        DEREG_MR,
        ALLOC_MR,
        MAP_MR_SG,
        ALLOC_FMR,
        MAP_PHYS_FMR,
        UNMAP_FMR,
        DEALLOC_FMR,
        MMAP,
        CREATE_CQ,
        DESTROY_CQ,
        POLL_CQ,
        REQ_NOTFIY_CQ,
        RESIZE_CQ,
        ALLOC_PD,
        DEALLOC_PD,
        _VERB_IDX_MAX /* Must always be last! */
};

static const struct ib_device_ops rvt_dev_ops = {
        .uverbs_abi_ver = RVT_UVERBS_ABI_VERSION,

        .alloc_mr = rvt_alloc_mr,
        .alloc_pd = rvt_alloc_pd,
        .alloc_ucontext = rvt_alloc_ucontext,
        .attach_mcast = rvt_attach_mcast,
        .create_ah = rvt_create_ah,
        .create_cq = rvt_create_cq,
        .create_qp = rvt_create_qp,
        .create_srq = rvt_create_srq,
        .create_user_ah = rvt_create_ah,
        .dealloc_pd = rvt_dealloc_pd,
        .dealloc_ucontext = rvt_dealloc_ucontext,
        .dereg_mr = rvt_dereg_mr,
        .destroy_ah = rvt_destroy_ah,
        .destroy_cq = rvt_destroy_cq,
        .destroy_qp = rvt_destroy_qp,
        .destroy_srq = rvt_destroy_srq,
        .detach_mcast = rvt_detach_mcast,
        .get_dma_mr = rvt_get_dma_mr,
        .get_numa_node = rvt_get_numa_node,
        .get_port_immutable = rvt_get_port_immutable,
        .map_mr_sg = rvt_map_mr_sg,
        .mmap = rvt_mmap,
        .modify_ah = rvt_modify_ah,
        .modify_device = rvt_modify_device,
        .modify_port = rvt_modify_port,
        .modify_qp = rvt_modify_qp,
        .modify_srq = rvt_modify_srq,
        .poll_cq = rvt_poll_cq,
        .post_recv = rvt_post_recv,
        .post_send = rvt_post_send,
        .post_srq_recv = rvt_post_srq_recv,
        .query_ah = rvt_query_ah,
        .query_device = rvt_query_device,
        .query_gid = rvt_query_gid,
        .query_pkey = rvt_query_pkey,
        .query_port = rvt_query_port,
        .query_qp = rvt_query_qp,
        .query_srq = rvt_query_srq,
        .reg_user_mr = rvt_reg_user_mr,
        .req_notify_cq = rvt_req_notify_cq,
        .resize_cq = rvt_resize_cq,

        INIT_RDMA_OBJ_SIZE(ib_ah, rvt_ah, ibah),
        INIT_RDMA_OBJ_SIZE(ib_cq, rvt_cq, ibcq),
        INIT_RDMA_OBJ_SIZE(ib_pd, rvt_pd, ibpd),
        INIT_RDMA_OBJ_SIZE(ib_qp, rvt_qp, ibqp),
        INIT_RDMA_OBJ_SIZE(ib_srq, rvt_srq, ibsrq),
        INIT_RDMA_OBJ_SIZE(ib_ucontext, rvt_ucontext, ibucontext),
};

static noinline int check_support(struct rvt_dev_info *rdi, int verb)
{
        switch (verb) {
        case MISC:
                /*
                 * These functions are not part of verbs specifically but are
                 * required for rdmavt to function.
                 */
                if ((!rdi->ibdev.ops.port_groups) ||
                    (!rdi->driver_f.get_pci_dev))
                        return -EINVAL;
                break;

        case MODIFY_DEVICE:
                /*
                 * rdmavt does not support modify device currently drivers must
                 * provide.
                 */
                if (!rdi->ibdev.ops.modify_device)
                        return -EOPNOTSUPP;
                break;

        case QUERY_PORT:
                if (!rdi->ibdev.ops.query_port)
                        if (!rdi->driver_f.query_port_state)
                                return -EINVAL;
                break;

        case MODIFY_PORT:
                if (!rdi->ibdev.ops.modify_port)
                        if (!rdi->driver_f.cap_mask_chg ||
                            !rdi->driver_f.shut_down_port)
                                return -EINVAL;
                break;

        case QUERY_GID:
                if (!rdi->ibdev.ops.query_gid)
                        if (!rdi->driver_f.get_guid_be)
                                return -EINVAL;
                break;

        case CREATE_QP:
                if (!rdi->ibdev.ops.create_qp)
                        if (!rdi->driver_f.qp_priv_alloc ||
                            !rdi->driver_f.qp_priv_free ||
                            !rdi->driver_f.notify_qp_reset ||
                            !rdi->driver_f.flush_qp_waiters ||
                            !rdi->driver_f.stop_send_queue ||
                            !rdi->driver_f.quiesce_qp)
                                return -EINVAL;
                break;

        case MODIFY_QP:
                if (!rdi->ibdev.ops.modify_qp)
                        if (!rdi->driver_f.notify_qp_reset ||
                            !rdi->driver_f.schedule_send ||
                            !rdi->driver_f.get_pmtu_from_attr ||
                            !rdi->driver_f.flush_qp_waiters ||
                            !rdi->driver_f.stop_send_queue ||
                            !rdi->driver_f.quiesce_qp ||
                            !rdi->driver_f.notify_error_qp ||
                            !rdi->driver_f.mtu_from_qp ||
                            !rdi->driver_f.mtu_to_path_mtu)
                                return -EINVAL;
                break;

        case DESTROY_QP:
                if (!rdi->ibdev.ops.destroy_qp)
                        if (!rdi->driver_f.qp_priv_free ||
                            !rdi->driver_f.notify_qp_reset ||
                            !rdi->driver_f.flush_qp_waiters ||
                            !rdi->driver_f.stop_send_queue ||
                            !rdi->driver_f.quiesce_qp)
                                return -EINVAL;
                break;

        case POST_SEND:
                if (!rdi->ibdev.ops.post_send)
                        if (!rdi->driver_f.schedule_send ||
                            !rdi->driver_f.do_send ||
                            !rdi->post_parms)
                                return -EINVAL;
                break;

        }

        return 0;
}

/**
 * rvt_register_device - register a driver
 * @rdi: main dev structure for all of rdmavt operations
 *
 * It is up to drivers to allocate the rdi and fill in the appropriate
 * information.
 *
 * Return: 0 on success otherwise an errno.
 */
int rvt_register_device(struct rvt_dev_info *rdi)
{
        int ret = 0, i;

        if (!rdi)
                return -EINVAL;

        /*
         * Check to ensure drivers have setup the required helpers for the verbs
         * they want rdmavt to handle
         */
        for (i = 0; i < _VERB_IDX_MAX; i++)
                if (check_support(rdi, i)) {
                        pr_err("Driver support req not met at %d\n", i);
                        return -EINVAL;
                }

        ib_set_device_ops(&rdi->ibdev, &rvt_dev_ops);

        /* Once we get past here we can use rvt_pr macros and tracepoints */
        trace_rvt_dbg(rdi, "Driver attempting registration");
        rvt_mmap_init(rdi);

        /* Queue Pairs */
        ret = rvt_driver_qp_init(rdi);
        if (ret) {
                pr_err("Error in driver QP init.\n");
                return -EINVAL;
        }

        /* Address Handle */
        spin_lock_init(&rdi->n_ahs_lock);
        rdi->n_ahs_allocated = 0;

        /* Shared Receive Queue */
        rvt_driver_srq_init(rdi);

        /* Multicast */
        rvt_driver_mcast_init(rdi);

        /* Mem Region */
        ret = rvt_driver_mr_init(rdi);
        if (ret) {
                pr_err("Error in driver MR init.\n");
                goto bail_no_mr;
        }

        /* Memory Working Set Size */
        ret = rvt_wss_init(rdi);
        if (ret) {
                rvt_pr_err(rdi, "Error in WSS init.\n");
                goto bail_mr;
        }

        /* Completion queues */
        spin_lock_init(&rdi->n_cqs_lock);

        /* Protection Domain */
        spin_lock_init(&rdi->n_pds_lock);
        rdi->n_pds_allocated = 0;

        /*
         * There are some things which could be set by underlying drivers but
         * really should be up to rdmavt to set. For instance drivers can't know
         * exactly which functions rdmavt supports, nor do they know the ABI
         * version, so we do all of this sort of stuff here.
         */
        rdi->ibdev.uverbs_cmd_mask |=
                (1ull << IB_USER_VERBS_CMD_POLL_CQ)             |
                (1ull << IB_USER_VERBS_CMD_REQ_NOTIFY_CQ)       |
                (1ull << IB_USER_VERBS_CMD_POST_SEND)           |
                (1ull << IB_USER_VERBS_CMD_POST_RECV)           |
                (1ull << IB_USER_VERBS_CMD_POST_SRQ_RECV);
        rdi->ibdev.node_type = RDMA_NODE_IB_CA;
        if (!rdi->ibdev.num_comp_vectors)
                rdi->ibdev.num_comp_vectors = 1;

        /* We are now good to announce we exist */
        ret = ib_register_device(&rdi->ibdev, dev_name(&rdi->ibdev.dev), NULL);
        if (ret) {
                rvt_pr_err(rdi, "Failed to register driver with ib core.\n");
                goto bail_wss;
        }

        rvt_create_mad_agents(rdi);

        rvt_pr_info(rdi, "Registration with rdmavt done.\n");
        return ret;

bail_wss:
        rvt_wss_exit(rdi);
bail_mr:
        rvt_mr_exit(rdi);

bail_no_mr:
        rvt_qp_exit(rdi);

        return ret;
}
EXPORT_SYMBOL(rvt_register_device);

/**
 * rvt_unregister_device - remove a driver
 * @rdi: rvt dev struct
 */
void rvt_unregister_device(struct rvt_dev_info *rdi)
{
        trace_rvt_dbg(rdi, "Driver is unregistering.");
        if (!rdi)
                return;

        rvt_free_mad_agents(rdi);

        ib_unregister_device(&rdi->ibdev);
        rvt_wss_exit(rdi);
        rvt_mr_exit(rdi);
        rvt_qp_exit(rdi);
}
EXPORT_SYMBOL(rvt_unregister_device);

/**
 * rvt_init_port - init internal data for driver port
 * @rdi: rvt_dev_info struct
 * @port: rvt port
 * @port_index: 0 based index of ports, different from IB core port num
 * @pkey_table: pkey_table for @port
 *
 * Keep track of a list of ports. No need to have a detach port.
 * They persist until the driver goes away.
 *
 * Return: always 0
 */
int rvt_init_port(struct rvt_dev_info *rdi, struct rvt_ibport *port,
                  int port_index, u16 *pkey_table)
{

        rdi->ports[port_index] = port;
        rdi->ports[port_index]->pkey_table = pkey_table;

        return 0;
}
EXPORT_SYMBOL(rvt_init_port);