root/sys/dev/cxgbe/iw_cxgbe/provider.c
/*-
 * SPDX-License-Identifier: BSD-2-Clause
 *
 * Copyright (c) 2009-2013, 2016 Chelsio, Inc. All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses.  You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer in the documentation and/or other materials
 *        provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
#include <sys/cdefs.h>
#define LINUXKPI_PARAM_PREFIX iw_cxgbe_

#include "opt_inet.h"

#ifdef TCP_OFFLOAD
#include <asm/pgtable.h>
#include <linux/page.h>
#include <rdma/ib_verbs.h>
#include <rdma/ib_user_verbs.h>

#include "iw_cxgbe.h"
#include "user.h"

static int fastreg_support = 1;
module_param(fastreg_support, int, 0644);
MODULE_PARM_DESC(fastreg_support, "Advertise fastreg support (default = 1)");

static int c4iw_modify_port(struct ib_device *ibdev,
                            u8 port, int port_modify_mask,
                            struct ib_port_modify *props)
{
        return -ENOSYS;
}

static int c4iw_ah_create(struct ib_ah *ah,
                          struct ib_ah_attr *ah_attr, u32 flags,
                          struct ib_udata *udata)
{
        return -ENOSYS;
}

static void c4iw_ah_destroy(struct ib_ah *ah, u32 flags)
{
}

static int c4iw_multicast_attach(struct ib_qp *ibqp, union ib_gid *gid, u16 lid)
{
        return -ENOSYS;
}

static int c4iw_multicast_detach(struct ib_qp *ibqp, union ib_gid *gid, u16 lid)
{
        return -ENOSYS;
}

static int c4iw_process_mad(struct ib_device *ibdev, int mad_flags,
                u8 port_num, const struct ib_wc *in_wc,
                const struct ib_grh *in_grh,
                const struct ib_mad_hdr *in_mad,
                size_t in_mad_size,
                struct ib_mad_hdr *out_mad,
                size_t *out_mad_size,
                u16 *out_mad_pkey_index)

{
        return -ENOSYS;
}

static void c4iw_dealloc_ucontext(struct ib_ucontext *context)
{
        struct c4iw_ucontext *ucontext = to_c4iw_ucontext(context);
        struct c4iw_dev *rhp;
        struct c4iw_mm_entry *mm, *tmp;

        pr_debug("context %p\n", context);
        rhp = to_c4iw_dev(ucontext->ibucontext.device);

        CTR2(KTR_IW_CXGBE, "%s ucontext %p", __func__, ucontext);

        list_for_each_entry_safe(mm, tmp, &ucontext->mmaps, entry)
                kfree(mm);
        c4iw_release_dev_ucontext(&rhp->rdev, &ucontext->uctx);
}

static int c4iw_alloc_ucontext(struct ib_ucontext *ucontext,
                               struct ib_udata *udata)
{
        struct ib_device *ibdev = ucontext->device;
        struct c4iw_ucontext *context = to_c4iw_ucontext(ucontext);
        struct c4iw_dev *rhp = to_c4iw_dev(ibdev);
        static int warned;
        struct c4iw_alloc_ucontext_resp uresp;
        int ret = 0;
        struct c4iw_mm_entry *mm = NULL;

        PDBG("%s ibdev %p\n", __func__, ibdev);
        c4iw_init_dev_ucontext(&rhp->rdev, &context->uctx);
        INIT_LIST_HEAD(&context->mmaps);
        spin_lock_init(&context->mmap_lock);

        if (udata->outlen < sizeof(uresp) - sizeof(uresp.reserved)) {
                if (!warned++)
                        log(LOG_ERR, "%s Warning - downlevel libcxgb4 "
                               "(non-fatal), device status page disabled.\n",
                               __func__);
                rhp->rdev.flags |= T4_STATUS_PAGE_DISABLED;
        } else {

                mm = kmalloc(sizeof *mm, GFP_KERNEL);
                if (!mm)
                        goto err;

                uresp.status_page_size = PAGE_SIZE;

                spin_lock(&context->mmap_lock);
                uresp.status_page_key = context->key;
                context->key += PAGE_SIZE;
                spin_unlock(&context->mmap_lock);

                ret = ib_copy_to_udata(udata, &uresp,
                                       sizeof(uresp) - sizeof(uresp.reserved));
                if (ret)
                        goto err_mm;

                mm->key = uresp.status_page_key;
                mm->addr = vtophys(rhp->rdev.status_page);
                mm->len = PAGE_SIZE;
                insert_mmap(context, mm);
        }
        return 0;
err_mm:
        kfree(mm);
err:
        return ret;
}

static int c4iw_mmap(struct ib_ucontext *context, struct vm_area_struct *vma)
{
        int len = vma->vm_end - vma->vm_start;
        u32 key = vma->vm_pgoff << PAGE_SHIFT;
        struct c4iw_rdev *rdev;
        int ret = 0;
        struct c4iw_mm_entry *mm;
        struct c4iw_ucontext *ucontext;
        u64 addr = 0;

        CTR4(KTR_IW_CXGBE, "%s:1 ctx %p vma %p, vm_start %u", __func__,
                        context, vma, vma->vm_start);

        CTR4(KTR_IW_CXGBE, "%s:1a pgoff 0x%lx key 0x%x len %d", __func__,
            vma->vm_pgoff, key, len);

        if (vma->vm_start & (PAGE_SIZE-1)) {
                CTR3(KTR_IW_CXGBE, "%s:2 unaligned vm_start %u vma %p",
                    __func__, vma->vm_start, vma);
                return -EINVAL;
        }

        rdev = &(to_c4iw_dev(context->device)->rdev);
        ucontext = to_c4iw_ucontext(context);

        mm = remove_mmap(ucontext, key, len);
        if (!mm) {
                CTR4(KTR_IW_CXGBE, "%s:3 ucontext %p key %u len %u", __func__,
                    ucontext, key, len);
                return -EINVAL;
        }
        addr = mm->addr;
        kfree(mm);

        /* user DB-GTS registers if addr in udbs_res range,
         * else WQ or CQ memory.
         * */
        if (rdev->adap->iwt.wc_en && addr >= rdev->bar2_pa &&
                        addr < rdev->bar2_pa + rdev->bar2_len)
                vma->vm_page_prot = t4_pgprot_wc(vma->vm_page_prot);

        ret = rdma_user_mmap_io(context, vma, addr >> PAGE_SHIFT, len,
            vma->vm_page_prot, NULL);
        CTR4(KTR_IW_CXGBE, "%s:4 ctx %p vma %p ret %u", __func__, context, vma,
            ret);
        return ret;
}

static void
c4iw_deallocate_pd(struct ib_pd *pd, struct ib_udata *udata)
{
        struct c4iw_pd *php = to_c4iw_pd(pd);
        struct c4iw_dev *rhp = php->rhp;

        CTR3(KTR_IW_CXGBE, "%s: pd %p, pdid 0x%x", __func__, pd, php->pdid);

        c4iw_put_resource(&rhp->rdev.resource.pdid_table, php->pdid);
        mutex_lock(&rhp->rdev.stats.lock);
        rhp->rdev.stats.pd.cur--;
        mutex_unlock(&rhp->rdev.stats.lock);
}

static int
c4iw_allocate_pd(struct ib_pd *pd, struct ib_udata *udata)
{
        struct c4iw_pd *php = to_c4iw_pd(pd);
        struct ib_device *ibdev = pd->device;
        u32 pdid;
        struct c4iw_dev *rhp;

        CTR4(KTR_IW_CXGBE, "%s: ibdev %p, pd %p, data %p", __func__, ibdev,
            pd, udata);
        rhp = (struct c4iw_dev *) ibdev;
        if (__predict_false(c4iw_stopped(&rhp->rdev)))
                return -EIO;
        pdid =  c4iw_get_resource(&rhp->rdev.resource.pdid_table);
        if (!pdid)
                return -EINVAL;

        php->pdid = pdid;
        php->rhp = rhp;
        if (udata) {
                if (ib_copy_to_udata(udata, &php->pdid, sizeof(u32))) {
                        c4iw_deallocate_pd(&php->ibpd, udata);
                        return -EFAULT;
                }
        }
        mutex_lock(&rhp->rdev.stats.lock);
        rhp->rdev.stats.pd.cur++;
        if (rhp->rdev.stats.pd.cur > rhp->rdev.stats.pd.max)
                rhp->rdev.stats.pd.max = rhp->rdev.stats.pd.cur;
        mutex_unlock(&rhp->rdev.stats.lock);

        CTR5(KTR_IW_CXGBE,
            "%s: ibdev %p, context %p, data %p, pddid 0x%x, pd %p", __func__,
            ibdev, udata, pdid, php);
        return (0);
}

static int
c4iw_query_pkey(struct ib_device *ibdev, u8 port, u16 index, u16 *pkey)
{

        CTR5(KTR_IW_CXGBE, "%s ibdev %p, port %d, index %d, pkey %p", __func__,
            ibdev, port, index, pkey);

        *pkey = 0;
        return (0);
}

static int
c4iw_query_gid(struct ib_device *ibdev, u8 port, int index, union ib_gid *gid)
{
        struct c4iw_dev *dev;
        struct port_info *pi;
        struct adapter *sc;

        CTR5(KTR_IW_CXGBE, "%s ibdev %p, port %d, index %d, gid %p", __func__,
            ibdev, port, index, gid);

        memset(&gid->raw[0], 0, sizeof(gid->raw));
        dev = to_c4iw_dev(ibdev);
        sc = dev->rdev.adap;
        if (port == 0 || port > sc->params.nports)
                return (-EINVAL);
        pi = sc->port[port - 1];
        memcpy(&gid->raw[0], pi->vi[0].hw_addr, ETHER_ADDR_LEN);
        return (0);
}

static int
c4iw_query_device(struct ib_device *ibdev, struct ib_device_attr *props,
                struct ib_udata *uhw)
{
        struct c4iw_dev *dev = to_c4iw_dev(ibdev);
        struct adapter *sc = dev->rdev.adap;

        CTR3(KTR_IW_CXGBE, "%s ibdev %p, props %p", __func__, ibdev, props);

        if (uhw->inlen || uhw->outlen)
                return -EINVAL;

        memset(props, 0, sizeof *props);
        memcpy(&props->sys_image_guid, sc->port[0]->vi[0].hw_addr,
            ETHER_ADDR_LEN);
        props->hw_ver = sc->params.chipid;
        props->fw_ver = sc->params.fw_vers;
        props->device_cap_flags = dev->device_cap_flags;
        props->page_size_cap = T4_PAGESIZE_MASK;
        props->vendor_id = pci_get_vendor(sc->dev);
        props->vendor_part_id = pci_get_device(sc->dev);
        props->max_mr_size = T4_MAX_MR_SIZE;
        props->max_qp = sc->vres.qp.size / 2;
        props->max_qp_wr = dev->rdev.hw_queue.t4_max_qp_depth;
        props->max_sge = T4_MAX_RECV_SGE;
        props->max_sge_rd = 1;
        props->max_res_rd_atom = sc->params.max_ird_adapter;
        props->max_qp_rd_atom = min(sc->params.max_ordird_qp,
            c4iw_max_read_depth);
        props->max_qp_init_rd_atom = props->max_qp_rd_atom;
        props->max_cq = sc->vres.qp.size;
        props->max_cqe = dev->rdev.hw_queue.t4_max_cq_depth;
        props->max_mr = c4iw_num_stags(&dev->rdev);
        props->max_pd = T4_MAX_NUM_PD;
        props->local_ca_ack_delay = 0;
        props->max_fast_reg_page_list_len = t4_max_fr_depth(&dev->rdev, use_dsgl);

        return (0);
}

/*
 * Returns -errno on failure.
 */
static int
c4iw_query_port(struct ib_device *ibdev, u8 port, struct ib_port_attr *props)
{
        struct c4iw_dev *dev;
        struct adapter *sc;
        struct port_info *pi;
        if_t ifp;

        CTR4(KTR_IW_CXGBE, "%s ibdev %p, port %d, props %p", __func__, ibdev,
            port, props);

        dev = to_c4iw_dev(ibdev);
        sc = dev->rdev.adap;
        if (port > sc->params.nports)
                return (-EINVAL);
        pi = sc->port[port - 1];
        ifp = pi->vi[0].ifp;

        memset(props, 0, sizeof(struct ib_port_attr));
        props->max_mtu = IB_MTU_4096;
        if (if_getmtu(ifp) >= 4096)
                props->active_mtu = IB_MTU_4096;
        else if (if_getmtu(ifp) >= 2048)
                props->active_mtu = IB_MTU_2048;
        else if (if_getmtu(ifp) >= 1024)
                props->active_mtu = IB_MTU_1024;
        else if (if_getmtu(ifp) >= 512)
                props->active_mtu = IB_MTU_512;
        else
                props->active_mtu = IB_MTU_256;
        props->state = pi->link_cfg.link_ok ? IB_PORT_ACTIVE : IB_PORT_DOWN;
        props->port_cap_flags =
            IB_PORT_CM_SUP |
            IB_PORT_SNMP_TUNNEL_SUP |
            IB_PORT_REINIT_SUP |
            IB_PORT_DEVICE_MGMT_SUP |
            IB_PORT_VENDOR_CLASS_SUP | IB_PORT_BOOT_MGMT_SUP;
        props->gid_tbl_len = 1;
        props->pkey_tbl_len = 1;
        props->active_width = 2;
        props->active_speed = 2;
        props->max_msg_sz = -1;

        return 0;
}

static int c4iw_port_immutable(struct ib_device *ibdev, u8 port_num,
                               struct ib_port_immutable *immutable)
{
        struct ib_port_attr attr;
        int err;

        immutable->core_cap_flags = RDMA_CORE_PORT_IWARP;

        err = ib_query_port(ibdev, port_num, &attr);
        if (err)
                return err;

        immutable->pkey_tbl_len = attr.pkey_tbl_len;
        immutable->gid_tbl_len = attr.gid_tbl_len;

        return 0;
}

/*
 * Returns -errno on error.
 */
int
c4iw_register_device(struct c4iw_dev *dev)
{
        struct adapter *sc = dev->rdev.adap;
        struct ib_device *ibdev = &dev->ibdev;
        struct iw_cm_verbs *iwcm;
        int ret;

        CTR3(KTR_IW_CXGBE, "%s c4iw_dev %p, adapter %p", __func__, dev, sc);
        BUG_ON(!sc->port[0]);
        ret = linux_pci_attach_device(sc->dev, NULL, NULL, &dev->pdev);
        if (ret)
                return (ret);

#define c4iw_ib_cq c4iw_cq
#define c4iw_ib_pd c4iw_pd
#define c4iw_ib_qp c4iw_qp
#define c4iw_ib_ucontext c4iw_ucontext
        INIT_IB_DEVICE_OPS(&ibdev->ops, c4iw, CXGB4);

        strlcpy(ibdev->name, device_get_nameunit(sc->dev), sizeof(ibdev->name));
        memset(&ibdev->node_guid, 0, sizeof(ibdev->node_guid));
        memcpy(&ibdev->node_guid, sc->port[0]->vi[0].hw_addr, ETHER_ADDR_LEN);
        ibdev->owner = THIS_MODULE;
        dev->device_cap_flags = IB_DEVICE_LOCAL_DMA_LKEY | IB_DEVICE_MEM_WINDOW;
        if (fastreg_support)
                dev->device_cap_flags |= IB_DEVICE_MEM_MGT_EXTENSIONS;
        ibdev->local_dma_lkey = 0;
        ibdev->uverbs_cmd_mask =
            (1ull << IB_USER_VERBS_CMD_GET_CONTEXT) |
            (1ull << IB_USER_VERBS_CMD_QUERY_DEVICE) |
            (1ull << IB_USER_VERBS_CMD_QUERY_PORT) |
            (1ull << IB_USER_VERBS_CMD_ALLOC_PD) |
            (1ull << IB_USER_VERBS_CMD_DEALLOC_PD) |
            (1ull << IB_USER_VERBS_CMD_REG_MR) |
            (1ull << IB_USER_VERBS_CMD_DEREG_MR) |
            (1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL) |
            (1ull << IB_USER_VERBS_CMD_CREATE_CQ) |
            (1ull << IB_USER_VERBS_CMD_DESTROY_CQ) |
            (1ull << IB_USER_VERBS_CMD_REQ_NOTIFY_CQ) |
            (1ull << IB_USER_VERBS_CMD_CREATE_QP) |
            (1ull << IB_USER_VERBS_CMD_MODIFY_QP) |
            (1ull << IB_USER_VERBS_CMD_QUERY_QP) |
            (1ull << IB_USER_VERBS_CMD_POLL_CQ) |
            (1ull << IB_USER_VERBS_CMD_DESTROY_QP) |
            (1ull << IB_USER_VERBS_CMD_POST_SEND) |
            (1ull << IB_USER_VERBS_CMD_POST_RECV);
        ibdev->node_type = RDMA_NODE_RNIC;
        strlcpy(ibdev->node_desc, C4IW_NODE_DESC, sizeof(ibdev->node_desc));
        ibdev->phys_port_cnt = sc->params.nports;
        ibdev->num_comp_vectors = 1;
        ibdev->dma_device = &dev->pdev.dev;
        ibdev->query_device = c4iw_query_device;
        ibdev->query_port = c4iw_query_port;
        ibdev->modify_port = c4iw_modify_port;
        ibdev->query_pkey = c4iw_query_pkey;
        ibdev->query_gid = c4iw_query_gid;
        ibdev->alloc_ucontext = c4iw_alloc_ucontext;
        ibdev->dealloc_ucontext = c4iw_dealloc_ucontext;
        ibdev->mmap = c4iw_mmap;
        ibdev->alloc_pd = c4iw_allocate_pd;
        ibdev->dealloc_pd = c4iw_deallocate_pd;
        ibdev->create_ah = c4iw_ah_create;
        ibdev->destroy_ah = c4iw_ah_destroy;
        ibdev->create_qp = c4iw_create_qp;
        ibdev->modify_qp = c4iw_ib_modify_qp;
        ibdev->query_qp = c4iw_ib_query_qp;
        ibdev->destroy_qp = c4iw_destroy_qp;
        ibdev->create_cq = c4iw_create_cq;
        ibdev->destroy_cq = c4iw_destroy_cq;
        ibdev->resize_cq = c4iw_resize_cq;
        ibdev->poll_cq = c4iw_poll_cq;
        ibdev->get_dma_mr = c4iw_get_dma_mr;
        ibdev->reg_user_mr = c4iw_reg_user_mr;
        ibdev->dereg_mr = c4iw_dereg_mr;
        ibdev->alloc_mw = c4iw_alloc_mw;
        ibdev->dealloc_mw = c4iw_dealloc_mw;
        ibdev->alloc_mr = c4iw_alloc_mr;
        ibdev->map_mr_sg = c4iw_map_mr_sg;
        ibdev->attach_mcast = c4iw_multicast_attach;
        ibdev->detach_mcast = c4iw_multicast_detach;
        ibdev->process_mad = c4iw_process_mad;
        ibdev->req_notify_cq = c4iw_arm_cq;
        ibdev->post_send = c4iw_post_send;
        ibdev->post_recv = c4iw_post_receive;
        ibdev->uverbs_abi_ver = C4IW_UVERBS_ABI_VERSION;
        ibdev->get_port_immutable = c4iw_port_immutable;

        iwcm = kmalloc(sizeof(*iwcm), GFP_KERNEL);
        if (iwcm == NULL)
                return (-ENOMEM);

        iwcm->connect = c4iw_connect;
        iwcm->accept = c4iw_accept_cr;
        iwcm->reject = c4iw_reject_cr;
        iwcm->create_listen = c4iw_create_listen;
        iwcm->destroy_listen = c4iw_destroy_listen;
        iwcm->add_ref = c4iw_qp_add_ref;
        iwcm->rem_ref = c4iw_qp_rem_ref;
        iwcm->get_qp = c4iw_get_qp;
        ibdev->iwcm = iwcm;

        ret = ib_register_device(&dev->ibdev, NULL);
        if (ret) {
                kfree(iwcm);
                linux_pci_detach_device(&dev->pdev);
        }

        return (ret);
}

void
c4iw_unregister_device(struct c4iw_dev *dev)
{

        CTR3(KTR_IW_CXGBE, "%s c4iw_dev %p, adapter %p", __func__, dev,
            dev->rdev.adap);
        ib_unregister_device(&dev->ibdev);
        kfree(dev->ibdev.iwcm);
        linux_pci_detach_device(&dev->pdev);
        return;
}
#endif