#include <sys/sysmacros.h>
#include <sys/types.h>
#include <sys/conf.h>
#include <sys/ddi.h>
#include <sys/sunddi.h>
#include <sys/modctl.h>
#include <sys/bitmap.h>
#include <sys/ib/adapters/hermon/hermon.h>
/*
 * Forward declaration of the file-local helper that converts a requested
 * scatter/gather entry count into a log2 WQE size and the resulting usable
 * SGL count.  It is called from hermon_srq_alloc() before its definition.
 */
static void hermon_srq_sgl_to_logwqesz(hermon_state_t *state, uint_t num_sgl,
hermon_qp_wq_type_t wq_type, uint_t *logwqesz, uint_t *max_sgl);
/*
 * hermon_srq_alloc()
 *    Allocate a shared receive queue (SRQ) and hand it to the hardware.
 *
 *    Inputs are taken from "srqinfo": the protection domain (srqi_pd), the
 *    requested sizes (srqi_sizes), the flags (srqi_flags) and the IBTF
 *    handle (srqi_ibt_srqhdl).  On success the new driver handle is stored
 *    through srqi_srqhdl and, when srqi_real_sizes is non-NULL, the sizes
 *    actually granted are stored there.
 *
 *    "sleepflag" is forwarded to the resource allocators and to the
 *    firmware command, and selects IBT_MR_SLEEP vs. IBT_MR_NOSLEEP for the
 *    work queue memory registration.
 *
 *    Returns the status of the SW2HW_SRQ command on success, otherwise one
 *    of IBT_INVALID_PARAM, IBT_INSUFF_RESOURCE, IBT_HCA_WR_EXCEEDED,
 *    IBT_HCA_SGL_EXCEEDED or ibc_get_ci_failure(0).  Everything acquired
 *    before a failure is released through the label ladder at the bottom
 *    of the function.
 */
int
hermon_srq_alloc(hermon_state_t *state, hermon_srq_info_t *srqinfo,
    uint_t sleepflag)
{
	ibt_srq_hdl_t		ibt_srqhdl;
	hermon_pdhdl_t		pd;
	ibt_srq_sizes_t		*sizes;
	ibt_srq_sizes_t		*real_sizes;
	hermon_srqhdl_t		*srqhdl;
	ibt_srq_flags_t		flags;
	hermon_rsrc_t		*srqc, *rsrc;
	hermon_hw_srqc_t	srqc_entry;
	uint32_t		*buf;
	hermon_srqhdl_t		srq;
	hermon_umap_db_entry_t	*umapdb = NULL;
	ibt_mr_attr_t		mr_attr;
	hermon_mr_options_t	mr_op;
	hermon_mrhdl_t		mr;
	uint64_t		value, srq_desc_off;
	uint32_t		log_srq_size;
	uint32_t		uarpg;
	uint_t			srq_is_umap;
	int			flag, status;
	uint_t			max_sgl;
	uint_t			wqesz;
	uint_t			srq_wr_sz;

	_NOTE(NOW_INVISIBLE_TO_OTHER_THREADS(*sizes))

	/* Unpack the caller's request */
	real_sizes	= srqinfo->srqi_real_sizes;
	sizes		= srqinfo->srqi_sizes;
	pd		= srqinfo->srqi_pd;
	ibt_srqhdl	= srqinfo->srqi_ibt_srqhdl;
	flags		= srqinfo->srqi_flags;
	srqhdl		= srqinfo->srqi_srqhdl;

	/*
	 * Pick the UAR page index.  A user-mappable SRQ uses the UAR page
	 * resource registered for the calling process in the umap database;
	 * a kernel SRQ uses the kernel UAR index.
	 */
	srq_is_umap = (flags & IBT_SRQ_USER_MAP) ? 1 : 0;
	if (srq_is_umap) {
		status = hermon_umap_db_find(state->hs_instance, ddi_get_pid(),
		    MLNX_UMAP_UARPG_RSRC, &value, 0, NULL);
		if (status != DDI_SUCCESS) {
			/*
			 * Nothing has been acquired yet: "rsrc" and "srqc"
			 * are still uninitialized and the PD refcount has
			 * not been taken, so leave without any unwinding.
			 */
			status = IBT_INVALID_PARAM;
			goto srqalloc_fail;
		}
		uarpg = ((hermon_rsrc_t *)(uintptr_t)value)->hr_indx;
	} else {
		uarpg = state->hs_kernel_uar_index;
	}

	/* Hold the protection domain for the lifetime of the SRQ */
	hermon_pd_refcnt_inc(pd);

	/* Allocate the SRQ context entry */
	status = hermon_rsrc_alloc(state, HERMON_SRQC, 1, sleepflag, &srqc);
	if (status != DDI_SUCCESS) {
		status = IBT_INSUFF_RESOURCE;
		goto srqalloc_fail1;
	}

	/* Allocate the software SRQ handle */
	status = hermon_rsrc_alloc(state, HERMON_SRQHDL, 1, sleepflag, &rsrc);
	if (status != DDI_SUCCESS) {
		status = IBT_INSUFF_RESOURCE;
		goto srqalloc_fail2;
	}
	srq = (hermon_srqhdl_t)rsrc->hr_addr;
	_NOTE(NOW_INVISIBLE_TO_OTHER_THREADS(*srq))

	bzero(srq, sizeof (struct hermon_sw_srq_s));

	/* The SRQ number is the index of the SRQ context entry */
	srq->srq_srqnum = srqc->hr_indx;

	/*
	 * For a user-mappable SRQ, pre-allocate the umap database entry
	 * keyed by SRQ number.  It is only inserted into the database once
	 * the rest of the setup has succeeded.
	 */
	if (srq_is_umap) {
		umapdb = hermon_umap_db_alloc(state->hs_instance,
		    srq->srq_srqnum, MLNX_UMAP_SRQMEM_RSRC,
		    (uint64_t)(uintptr_t)rsrc);
		if (umapdb == NULL) {
			status = IBT_INSUFF_RESOURCE;
			goto srqalloc_fail3;
		}
	}

	/* Allocate the doorbell record on the chosen UAR page */
	status = hermon_dbr_alloc(state, uarpg, &srq->srq_wq_dbr_acchdl,
	    &srq->srq_wq_vdbr, &srq->srq_wq_pdbr, &srq->srq_rdbr_mapoffset);
	if (status != DDI_SUCCESS) {
		status = IBT_INSUFF_RESOURCE;
		goto srqalloc_fail4;
	}

	/*
	 * Size the queue: one more than the requested number of work
	 * requests, at least HERMON_SRQ_MIN_SIZE, rounded up to a power of
	 * two and expressed as a log2.
	 */
	srq_wr_sz = max(sizes->srq_wr_sz + 1, HERMON_SRQ_MIN_SIZE);
	log_srq_size = highbit(srq_wr_sz);
	if (ISP2(srq_wr_sz)) {
		log_srq_size = log_srq_size - 1;
	}

	/* Reject a rounded-up size beyond the configured maximum */
	if (log_srq_size > state->hs_cfg_profile->cp_log_max_srq_sz) {
		status = IBT_HCA_WR_EXCEEDED;
		goto srqalloc_fail4a;
	}

	/* Reject an SGL count beyond what the HCA attributes advertise */
	max_sgl = state->hs_ibtfinfo.hca_attr->hca_max_srq_sgl;
	if (sizes->srq_sgl_sz > max_sgl) {
		status = IBT_HCA_SGL_EXCEEDED;
		goto srqalloc_fail4a;
	}

	/* Derive the log2 WQE size and the usable SGL count */
	hermon_srq_sgl_to_logwqesz(state, sizes->srq_sgl_sz,
	    HERMON_QP_WQ_TYPE_RECVQ, &srq->srq_wq_log_wqesz,
	    &srq->srq_wq_sgl);

	/*
	 * Allocate the work queue memory, page aligned, in userland-mappable
	 * or normal memory depending on the SRQ type.
	 */
	wqesz = (1 << srq->srq_wq_log_wqesz);
	srq->srq_wqinfo.qa_size = (1 << log_srq_size) * wqesz;
	srq->srq_wqinfo.qa_alloc_align = PAGESIZE;
	srq->srq_wqinfo.qa_bind_align = PAGESIZE;
	if (srq_is_umap) {
		srq->srq_wqinfo.qa_location = HERMON_QUEUE_LOCATION_USERLAND;
	} else {
		srq->srq_wqinfo.qa_location = HERMON_QUEUE_LOCATION_NORMAL;
	}
	status = hermon_queue_alloc(state, &srq->srq_wqinfo, sleepflag);
	if (status != DDI_SUCCESS) {
		status = IBT_INSUFF_RESOURCE;
		goto srqalloc_fail4a;
	}
	buf = (uint32_t *)srq->srq_wqinfo.qa_buf_aligned;
	_NOTE(NOW_INVISIBLE_TO_OTHER_THREADS(*buf))

	/* Register the work queue memory with local write enabled */
	flag = (sleepflag == HERMON_SLEEP) ? IBT_MR_SLEEP :
	    IBT_MR_NOSLEEP;
	mr_attr.mr_vaddr = (uint64_t)(uintptr_t)buf;
	mr_attr.mr_len = srq->srq_wqinfo.qa_size;
	mr_attr.mr_as = NULL;
	mr_attr.mr_flags = flag | IBT_MR_ENABLE_LOCAL_WRITE;
	mr_op.mro_bind_type = state->hs_cfg_profile->cp_iommu_bypass;
	mr_op.mro_bind_dmahdl = srq->srq_wqinfo.qa_dmahdl;
	mr_op.mro_bind_override_addr = 1;
	status = hermon_mr_register(state, pd, &mr_attr, &mr,
	    &mr_op, HERMON_SRQ_CMPT);
	if (status != DDI_SUCCESS) {
		status = IBT_INSUFF_RESOURCE;
		goto srqalloc_fail5;
	}
	_NOTE(NOW_INVISIBLE_TO_OTHER_THREADS(*mr))

	/*
	 * Offset between the kernel address of the queue buffer and the
	 * address recorded in the memory region's bind info.
	 */
	srq_desc_off = (uint64_t)(uintptr_t)srq->srq_wqinfo.qa_buf_aligned -
	    (uint64_t)mr->mr_bindinfo.bi_addr;

	/*
	 * Create the work queue header.  It is dereferenced below for
	 * kernel SRQs, so a NULL result must not be carried forward.
	 * NOTE(review): assumes hermon_wrid_wqhdr_create() reports failure
	 * by returning NULL - confirm against its definition.
	 */
	srq->srq_wq_wqhdr = hermon_wrid_wqhdr_create(1 << log_srq_size);
	if (srq->srq_wq_wqhdr == NULL) {
		status = IBT_INSUFF_RESOURCE;
		goto srqalloc_fail7;
	}

	/* Report the granted sizes back to the caller, if requested */
	if (real_sizes != NULL) {
		real_sizes->srq_wr_sz = (1 << log_srq_size) - 1;
		real_sizes->srq_sgl_sz = srq->srq_wq_sgl;
	}

	/* Build the SRQ context entry that will be given to the hardware */
	bzero(&srqc_entry, sizeof (hermon_hw_srqc_t));
	srqc_entry.state = HERMON_SRQ_STATE_HW_OWNER;
	srqc_entry.log_srq_size = log_srq_size;
	srqc_entry.srqn = srq->srq_srqnum;
	/* log2 of the WQE size less 4, i.e. presumably in 16-byte units */
	srqc_entry.log_rq_stride = srq->srq_wq_log_wqesz - 4;
	srqc_entry.page_offs = srq->srq_wqinfo.qa_pgoffs >> 6;
	srqc_entry.log2_pgsz = mr->mr_log2_pgsz;
	srqc_entry.mtt_base_addrh = (uint32_t)((mr->mr_mttaddr >> 32) & 0xFF);
	srqc_entry.mtt_base_addrl = mr->mr_mttaddr >> 3;
	srqc_entry.pd = pd->pd_pdnum;
	srqc_entry.dbr_addrh = (uint32_t)((uint64_t)srq->srq_wq_pdbr >> 32);
	srqc_entry.dbr_addrl = (uint32_t)((uint64_t)srq->srq_wq_pdbr >> 2);

	/* Pass ownership of the SRQ context to the hardware */
	status = hermon_cmn_ownership_cmd_post(state, SW2HW_SRQ, &srqc_entry,
	    sizeof (hermon_hw_srqc_t), srq->srq_srqnum,
	    sleepflag);
	if (status != HERMON_CMD_SUCCESS) {
		cmn_err(CE_CONT, "Hermon: SW2HW_SRQ command failed: %08x\n",
		    status);
		if (status == HERMON_CMD_INVALID_STATUS) {
			hermon_fm_ereport(state, HCA_SYS_ERR, HCA_ERR_SRV_LOST);
		}
		status = ibc_get_ci_failure(0);
		goto srqalloc_fail8;
	}

	/* Fill in the remainder of the software SRQ handle */
	srq->srq_srqcrsrcp = srqc;
	srq->srq_rsrcp = rsrc;
	srq->srq_mrhdl = mr;
	srq->srq_refcnt = 0;
	srq->srq_is_umap = srq_is_umap;
	srq->srq_uarpg = uarpg;
	srq->srq_umap_dhp = (devmap_cookie_t)NULL;
	srq->srq_pdhdl = pd;
	srq->srq_wq_bufsz = (1 << log_srq_size);
	srq->srq_wq_buf = buf;
	srq->srq_desc_off = srq_desc_off;
	srq->srq_hdlrarg = (void *)ibt_srqhdl;
	srq->srq_state = 0;
	srq->srq_real_sizes.srq_wr_sz = (1 << log_srq_size);
	srq->srq_real_sizes.srq_sgl_sz = srq->srq_wq_sgl;

	/* Make the handle reachable from its SRQ number */
	hermon_icm_set_num_to_hdl(state, HERMON_SRQC, srqc->hr_indx, srq);

	if (srq->srq_is_umap) {
		/* Publish the pre-allocated umap database entry */
		hermon_umap_db_add(umapdb);
	} else {
		int		i, len, last;
		uint16_t	*desc;

		/*
		 * Kernel SRQ: store, in network byte order, the index of the
		 * following WQE in the second 16-bit word of every WQE but
		 * the last, then start with head at 0 and tail at the last
		 * entry.
		 */
		desc = (uint16_t *)buf;
		len = wqesz / sizeof (*desc);
		last = srq->srq_wq_bufsz - 1;
		for (i = 0; i < last; i++) {
			desc[1] = htons(i + 1);
			desc += len;
		}
		srq->srq_wq_wqhdr->wq_tail = last;
		srq->srq_wq_wqhdr->wq_head = 0;
	}

	*srqhdl = srq;

	return (status);

/*
 * Failure unwinding: each label releases what was acquired just before the
 * corresponding jump, then falls through to the labels below it.
 */
srqalloc_fail8:
	hermon_wrid_wqhdr_destroy(srq->srq_wq_wqhdr);
srqalloc_fail7:
	if (hermon_mr_deregister(state, &mr, HERMON_MR_DEREG_ALL,
	    HERMON_SLEEPFLAG_FOR_CONTEXT()) != DDI_SUCCESS) {
		HERMON_WARNING(state, "failed to deregister SRQ memory");
	}
srqalloc_fail5:
	hermon_queue_free(&srq->srq_wqinfo);
srqalloc_fail4a:
	hermon_dbr_free(state, uarpg, srq->srq_wq_vdbr);
srqalloc_fail4:
	if (srq_is_umap) {
		hermon_umap_db_free(umapdb);
	}
srqalloc_fail3:
	hermon_rsrc_free(state, &rsrc);
srqalloc_fail2:
	hermon_rsrc_free(state, &srqc);
srqalloc_fail1:
	hermon_pd_refcnt_dec(pd);
srqalloc_fail:
	return (status);
}
/*
 * hermon_srq_free()
 *    Tear down a shared receive queue and release everything it holds.
 *
 *    Fails with IBT_SRQ_IN_USE while the SRQ reference count is non-zero.
 *    For a user-mappable SRQ the umap database entry is removed and any
 *    outstanding user mapping is invalidated first.  The SRQ context is
 *    then reclaimed from hardware with HW2SW_SRQ, the queue memory is
 *    deregistered, and the remaining resources are freed.  On success
 *    *srqhdl is set to NULL and DDI_SUCCESS is returned; other failures
 *    return ibc_get_ci_failure(0) or IBT_FAILURE.
 */
int
hermon_srq_free(hermon_state_t *state, hermon_srqhdl_t *srqhdl,
    uint_t sleepflag)
{
	hermon_rsrc_t		*srqc_rsrc, *hdl_rsrc;
	hermon_umap_db_entry_t	*umap_entry;
	uint64_t		umap_value;
	hermon_srqhdl_t		srq;
	hermon_mrhdl_t		srq_mr;
	hermon_pdhdl_t		srq_pd;
	hermon_hw_srqc_t	srqc_entry;
	uint32_t		srq_number;
	uint_t			maxprot;
	int			rc;

	srq = *srqhdl;

	mutex_enter(&srq->srq_lock);

	/* An SRQ that still has users cannot be freed */
	if (srq->srq_refcnt != 0) {
		mutex_exit(&srq->srq_lock);
		return (IBT_SRQ_IN_USE);
	}

	/* Cache what is needed once the lock has been dropped */
	srq_number	= srq->srq_srqnum;
	srq_mr		= srq->srq_mrhdl;
	srq_pd		= srq->srq_pdhdl;
	hdl_rsrc	= srq->srq_rsrcp;
	srqc_rsrc	= srq->srq_srqcrsrcp;

	if (srq->srq_is_umap) {
		/* Remove and free the entry keyed by this SRQ number */
		rc = hermon_umap_db_find(state->hs_instance,
		    srq->srq_srqnum, MLNX_UMAP_SRQMEM_RSRC, &umap_value,
		    HERMON_UMAP_DB_REMOVE, &umap_entry);
		if (rc != DDI_SUCCESS) {
			mutex_exit(&srq->srq_lock);
			HERMON_WARNING(state, "failed to find in database");
			return (ibc_get_ci_failure(0));
		}
		hermon_umap_db_free(umap_entry);

		/* Invalidate the user mapping if one is still recorded */
		if (srq->srq_umap_dhp != NULL) {
			maxprot = (PROT_READ | PROT_WRITE | PROT_USER);
			rc = devmap_devmem_remap(srq->srq_umap_dhp,
			    state->hs_dip, 0, 0, srq->srq_wqinfo.qa_size,
			    maxprot, DEVMAP_MAPPING_INVALID, NULL);
			if (rc != DDI_SUCCESS) {
				mutex_exit(&srq->srq_lock);
				HERMON_WARNING(state, "failed in SRQ memory "
				    "devmap_devmem_remap()");
				return (ibc_get_ci_failure(0));
			}
			srq->srq_umap_dhp = (devmap_cookie_t)NULL;
		}
	}

	/* Clear the SRQ-number-to-handle lookup entry */
	hermon_icm_set_num_to_hdl(state, HERMON_SRQC, srqc_rsrc->hr_indx,
	    NULL);

	mutex_exit(&srq->srq_lock);
	_NOTE(NOW_INVISIBLE_TO_OTHER_THREADS(*srq));

	/* Take the SRQ context back from the hardware */
	rc = hermon_cmn_ownership_cmd_post(state, HW2SW_SRQ, &srqc_entry,
	    sizeof (hermon_hw_srqc_t), srq_number, sleepflag);
	if (rc != HERMON_CMD_SUCCESS) {
		HERMON_WARNING(state, "failed to reclaim SRQC ownership");
		cmn_err(CE_CONT, "Hermon: HW2SW_SRQ command failed: %08x\n",
		    rc);
		if (rc == HERMON_CMD_INVALID_STATUS) {
			hermon_fm_ereport(state, HCA_SYS_ERR, HCA_ERR_SRV_LOST);
		}
		return (ibc_get_ci_failure(0));
	}

	/* Deregister the work queue memory */
	rc = hermon_mr_deregister(state, &srq_mr, HERMON_MR_DEREG_ALL,
	    sleepflag);
	if (rc != DDI_SUCCESS) {
		HERMON_WARNING(state, "failed to deregister SRQ memory");
		return (IBT_FAILURE);
	}

	/* Work queue header, queue memory and doorbell record */
	hermon_wrid_wqhdr_destroy(srq->srq_wq_wqhdr);
	hermon_queue_free(&srq->srq_wqinfo);
	hermon_dbr_free(state, srq->srq_uarpg, srq->srq_wq_vdbr);

	/* SRQ handle resource, then the SRQ context resource */
	hermon_rsrc_free(state, &hdl_rsrc);
	hermon_rsrc_free(state, &srqc_rsrc);

	/* Drop the reference held on the protection domain */
	hermon_pd_refcnt_dec(srq_pd);

	*srqhdl = NULL;

	return (DDI_SUCCESS);
}
/*
 * hermon_srq_modify()
 *    Resize a shared receive queue to hold at least "size" entries.
 *
 *    A new queue buffer and a new work-request-ID array are allocated and
 *    bound, the existing contents are copied across under srq_lock, and the
 *    hardware is switched to the new buffer with the RESIZE_SRQ command.
 *    The old buffer, its MTT binding and the old ID array are released
 *    afterwards.  When "real_size" is non-NULL it receives the number of
 *    entries actually allocated (a power of two).
 *
 *    Returns DDI_SUCCESS, or IBT_NOT_SUPPORTED when resizing is disabled by
 *    device limits or configuration, IBT_HCA_WR_EXCEEDED, IBT_INSUFF_RESOURCE,
 *    the status of hermon_mr_mtt_bind(), or ibc_get_ci_failure(0).
 */
int
hermon_srq_modify(hermon_state_t *state, hermon_srqhdl_t srq, uint_t size,
    uint_t *real_size, uint_t sleepflag)
{
	hermon_qalloc_info_t	new_srqinfo, old_srqinfo;
	hermon_rsrc_t		*mtt, *old_mtt;
	hermon_bind_info_t	bind;
	hermon_bind_info_t	old_bind;
	hermon_mrhdl_t		mr;
	hermon_hw_srqc_t	srqc_entry;
	uint64_t		*wre_new, *wre_old;
	uint64_t		mtt_addr;
	uint64_t		srq_pgoffs;
	uint64_t		srq_desc_off;
	uint32_t		*buf, srq_old_bufsz, copy_cnt;
	uint32_t		wqesz;
	uint_t			max_srq_size;
	uint_t			mtt_pgsize_bits;
	uint_t			log_srq_size, maxprot;
	int			status;

	/* Resizing must be supported by the device and enabled in config */
	if ((state->hs_devlim.mod_wr_srq == 0) ||
	    (state->hs_cfg_profile->cp_srq_resize_enabled == 0))
		return (IBT_NOT_SUPPORTED);

	/* Reject a request beyond the configured maximum SRQ size */
	max_srq_size = (1 << state->hs_cfg_profile->cp_log_max_srq_sz);
	if (size > max_srq_size) {
		return (IBT_HCA_WR_EXCEEDED);
	}

	/*
	 * Apply the minimum size, then round up to a power of two and
	 * express the result as a log2.
	 */
	size = max(size, HERMON_SRQ_MIN_SIZE);
	log_srq_size = highbit(size);
	if (ISP2(size)) {
		log_srq_size = log_srq_size - 1;
	}

	if (log_srq_size > state->hs_cfg_profile->cp_log_max_srq_sz) {
		status = IBT_HCA_WR_EXCEEDED;
		goto srqmodify_fail;
	}

	/*
	 * Allocate the new queue buffer, using the same WQE size and memory
	 * location as the existing SRQ.
	 */
	wqesz = (1 << srq->srq_wq_log_wqesz);
	new_srqinfo.qa_size = (1 << log_srq_size) * wqesz;
	new_srqinfo.qa_alloc_align = PAGESIZE;
	new_srqinfo.qa_bind_align = PAGESIZE;
	if (srq->srq_is_umap) {
		new_srqinfo.qa_location = HERMON_QUEUE_LOCATION_USERLAND;
	} else {
		new_srqinfo.qa_location = HERMON_QUEUE_LOCATION_NORMAL;
	}
	status = hermon_queue_alloc(state, &new_srqinfo, sleepflag);
	if (status != DDI_SUCCESS) {
		status = IBT_INSUFF_RESOURCE;
		goto srqmodify_fail;
	}
	buf = (uint32_t *)new_srqinfo.qa_buf_aligned;
	_NOTE(NOW_INVISIBLE_TO_OTHER_THREADS(*buf))

	/* Allocate the new work-request-ID array, one slot per entry */
	wre_new = kmem_zalloc((1 << log_srq_size) * sizeof (uint64_t),
	    sleepflag);
	if (wre_new == NULL) {
		/* The queue buffer allocated above must not be leaked */
		hermon_queue_free(&new_srqinfo);
		status = IBT_INSUFF_RESOURCE;
		goto srqmodify_fail;
	}

	/*
	 * Describe the new buffer for MTT binding.  The sleep selection is
	 * parenthesized so that IBT_MR_ENABLE_LOCAL_WRITE is set for both
	 * the sleeping and the non-sleeping case.
	 */
	_NOTE(NOW_INVISIBLE_TO_OTHER_THREADS(bind))
	bzero(&bind, sizeof (hermon_bind_info_t));
	bind.bi_type = HERMON_BINDHDL_VADDR;
	bind.bi_addr = (uint64_t)(uintptr_t)buf;
	bind.bi_len = new_srqinfo.qa_size;
	bind.bi_as = NULL;
	bind.bi_flags = ((sleepflag == HERMON_SLEEP) ? IBT_MR_SLEEP :
	    IBT_MR_NOSLEEP) | IBT_MR_ENABLE_LOCAL_WRITE;
	bind.bi_bypass = state->hs_cfg_profile->cp_iommu_bypass;
	status = hermon_mr_mtt_bind(state, &bind, new_srqinfo.qa_dmahdl, &mtt,
	    &mtt_pgsize_bits, 0);
	if (status != DDI_SUCCESS) {
		/* The bind status is returned to the caller unchanged */
		kmem_free(wre_new, (1 << log_srq_size) *
		    sizeof (uint64_t));
		hermon_queue_free(&new_srqinfo);
		goto srqmodify_fail;
	}

	/*
	 * Keep only the offset of the bind address within an MTT page, then
	 * compute the descriptor offset and page offset of the new buffer.
	 */
	bind.bi_addr = bind.bi_addr & ((1 << mtt_pgsize_bits) - 1);
	srq_desc_off = (uint64_t)(uintptr_t)new_srqinfo.qa_buf_aligned -
	    (uint64_t)bind.bi_addr;
	srq_pgoffs = (uint_t)
	    ((uintptr_t)new_srqinfo.qa_buf_aligned & HERMON_PAGEOFFSET);

	/* Address of the new MTT entries, derived from the resource index */
	mtt_addr = (mtt->hr_indx << HERMON_MTT_SIZE_SHIFT);

	/* The switch-over is done with the SRQ lock held */
	mutex_enter(&srq->srq_lock);

	/*
	 * Carry the existing entries over to the new buffer.  The copy is
	 * limited to the smaller of the old and new entry counts so that a
	 * shrinking resize cannot write past the end of the new buffer.
	 * NOTE(review): entries beyond the new size are dropped on a shrink
	 * and the work queue header indices are not adjusted here - confirm
	 * whether callers can actually request a smaller size.
	 */
	srq_old_bufsz = srq->srq_wq_bufsz;
	copy_cnt = min(srq_old_bufsz, (uint32_t)(1 << log_srq_size));
	bcopy(srq->srq_wq_buf, buf, copy_cnt * wqesz);

	mr = srq->srq_mrhdl;
	mutex_enter(&mr->mr_lock);

	/*
	 * Build the partial SRQ context passed to RESIZE_SRQ.  It is zeroed
	 * first so no uninitialized stack contents reach the command, and
	 * the MTT base address is split into its high and low fields the
	 * same way hermon_srq_alloc() does.
	 */
	bzero(&srqc_entry, sizeof (hermon_hw_srqc_t));
	srqc_entry.log_srq_size = log_srq_size;
	srqc_entry.page_offs = srq_pgoffs >> 6;
	srqc_entry.log2_pgsz = mr->mr_log2_pgsz;
	srqc_entry.mtt_base_addrh = (uint32_t)((mtt_addr >> 32) & 0xFF);
	srqc_entry.mtt_base_addrl = mtt_addr >> 3;

	status = hermon_resize_srq_cmd_post(state, &srqc_entry,
	    srq->srq_srqnum, sleepflag);
	if (status != HERMON_CMD_SUCCESS) {
		cmn_err(CE_CONT, "Hermon: RESIZE_SRQ command failed: %08x\n",
		    status);
		if (status == HERMON_CMD_INVALID_STATUS) {
			hermon_fm_ereport(state, HCA_SYS_ERR, HCA_ERR_SRV_LOST);
		}
		/* Undo everything set up for the new queue */
		(void) hermon_mr_mtt_unbind(state, &bind, mtt);
		kmem_free(wre_new, (1 << log_srq_size) *
		    sizeof (uint64_t));
		hermon_queue_free(&new_srqinfo);
		mutex_exit(&mr->mr_lock);
		mutex_exit(&srq->srq_lock);
		return (ibc_get_ci_failure(0));
	}

	/* Remember the old queue state so it can be released later */
	old_srqinfo = srq->srq_wqinfo;
	old_mtt = srq->srq_mrhdl->mr_mttrsrcp;
	bcopy(&srq->srq_mrhdl->mr_bindinfo, &old_bind,
	    sizeof (hermon_bind_info_t));

	/* Switch the SRQ handle and its memory region to the new queue */
	srq->srq_wqinfo = new_srqinfo;
	srq->srq_wq_buf = buf;
	srq->srq_wq_bufsz = (1 << log_srq_size);
	bcopy(&bind, &srq->srq_mrhdl->mr_bindinfo, sizeof (hermon_bind_info_t));
	srq->srq_mrhdl->mr_mttrsrcp = mtt;
	srq->srq_desc_off = srq_desc_off;
	srq->srq_real_sizes.srq_wr_sz = (1 << log_srq_size);
	mr->mr_logmttpgsz = mtt_pgsize_bits;
	mutex_exit(&mr->mr_lock);

	/* Move the recorded work request IDs into the new array */
	wre_old = srq->srq_wq_wqhdr->wq_wrid;
	bcopy(wre_old, wre_new, copy_cnt * sizeof (uint64_t));
	srq->srq_wq_wqhdr->wq_wrid = wre_new;

	/*
	 * If the SRQ is user-mappable and a user mapping is recorded,
	 * invalidate that mapping and forget it.
	 */
	if ((srq->srq_is_umap) && (srq->srq_umap_dhp != NULL)) {
		maxprot = (PROT_READ | PROT_WRITE | PROT_USER);
		status = devmap_devmem_remap(srq->srq_umap_dhp,
		    state->hs_dip, 0, 0, srq->srq_wqinfo.qa_size, maxprot,
		    DEVMAP_MAPPING_INVALID, NULL);
		if (status != DDI_SUCCESS) {
			mutex_exit(&srq->srq_lock);
			HERMON_WARNING(state, "failed in SRQ memory "
			    "devmap_devmem_remap()");
			/* Only the old ID array is released on this path */
			kmem_free(wre_old, srq_old_bufsz * sizeof (uint64_t));
			return (ibc_get_ci_failure(0));
		}
		srq->srq_umap_dhp = (devmap_cookie_t)NULL;
	}

	mutex_exit(&srq->srq_lock);

	/* Release the old queue's MTT binding */
	status = hermon_mr_mtt_unbind(state, &old_bind, old_mtt);
	if (status != DDI_SUCCESS) {
		HERMON_WARNING(state, "failed to unbind old SRQ memory");
		status = ibc_get_ci_failure(0);
		goto srqmodify_fail;
	}

	/* Release the old ID array and the old queue buffer */
	kmem_free(wre_old, srq_old_bufsz * sizeof (uint64_t));
	hermon_queue_free(&old_srqinfo);

	if (real_size != NULL) {
		*real_size = (1 << log_srq_size);
	}

	return (DDI_SUCCESS);

srqmodify_fail:
	return (status);
}
/*
 * hermon_srq_refcnt_inc()
 *    Add one reference to the SRQ.  The counter is updated with srq_lock
 *    held.
 */
void
hermon_srq_refcnt_inc(hermon_srqhdl_t srq)
{
	mutex_enter(&srq->srq_lock);
	srq->srq_refcnt += 1;
	mutex_exit(&srq->srq_lock);
}
/*
 * hermon_srq_refcnt_dec()
 *    Drop one reference from the SRQ.  The counter is updated with srq_lock
 *    held.
 */
void
hermon_srq_refcnt_dec(hermon_srqhdl_t srq)
{
	mutex_enter(&srq->srq_lock);
	srq->srq_refcnt -= 1;
	mutex_exit(&srq->srq_lock);
}
/*
 * hermon_srqhdl_from_srqnum()
 *    Look up the SRQ handle for an SRQ number.  Only the low
 *    cp_log_num_srq bits of "srqnum" are used as the lookup index.
 */
hermon_srqhdl_t
hermon_srqhdl_from_srqnum(hermon_state_t *state, uint_t srqnum)
{
	uint_t	indx_mask = (1 << state->hs_cfg_profile->cp_log_num_srq) - 1;

	return (hermon_icm_num_to_hdl(state, HERMON_SRQC,
	    srqnum & indx_mask));
}
/*
 * hermon_srq_sgl_to_logwqesz()
 *    Convert a requested scatter/gather entry count into a WQE size.
 *
 *    For HERMON_QP_WQ_TYPE_RECVQ the descriptor size is the SRQ header
 *    size plus 16 bytes per SGL entry, rounded up to a power of two and to
 *    at least the minimum WQE size.  *logwqesz receives the log2 of that
 *    size; *max_sgl receives the number of SGL entries that fit in it,
 *    capped at the configured cp_srq_max_sgl.
 *
 *    Any other work queue type is unexpected: a warning is logged and the
 *    outputs are set to the minimum WQE size and zero SGL entries, rather
 *    than to uninitialized values.
 */
static void
hermon_srq_sgl_to_logwqesz(hermon_state_t *state, uint_t num_sgl,
    hermon_qp_wq_type_t wq_type, uint_t *logwqesz, uint_t *max_sgl)
{
	uint_t	max_size, log2, actual_sgl;

	/* Defined fallback values for an unexpected work queue type */
	log2 = HERMON_QP_WQE_LOG_MINIMUM;
	actual_sgl = 0;

	switch (wq_type) {
	case HERMON_QP_WQ_TYPE_RECVQ:
		/* Header plus 16 bytes per SGL entry, as a rounded-up log2 */
		max_size = (HERMON_QP_WQE_MLX_SRQ_HDRS + (num_sgl << 4));
		log2 = highbit(max_size);
		if (ISP2(max_size)) {
			log2 = log2 - 1;
		}

		/* Never go below the minimum WQE size */
		log2 = max(log2, HERMON_QP_WQE_LOG_MINIMUM);

		/* SGL entries that fit once the header is subtracted */
		actual_sgl = ((1 << log2) - HERMON_QP_WQE_MLX_SRQ_HDRS) >> 4;
		break;

	default:
		HERMON_WARNING(state, "unexpected work queue type");
		break;
	}

	*logwqesz = log2;
	*max_sgl = min(state->hs_cfg_profile->cp_srq_max_sgl, actual_sgl);
}