#ifndef _RPC_RPC_RDMA_H
#define _RPC_RPC_RDMA_H
#include <rpc/rpc.h>
#include <rpc/rpc_sztypes.h>
#include <sys/sunddi.h>
#include <sys/sunldi.h>
#ifdef __cplusplus
extern "C" {
#endif
/*
 * Version numbers; all three are currently 1.
 * NOTE(review): presumably RPCRDMA_VERS is the RPC-over-RDMA protocol
 * version and RDMATF_VERS / RDMATF_VERS_1 the transport framework API
 * version (cf. rdma_mod_t.rdma_version) -- confirm at the users.
 */
#define	RPCRDMA_VERS		1
#define	RDMATF_VERS		1
#define	RDMATF_VERS_1		1

/*
 * Sizing constants.  RDMA_MINCHUNK and MINCHUNK carry the same value.
 * NOTE(review): units are presumably bytes; the consumers are not
 * visible in this header.
 */
#define	RPC_MSG_SZ		1024
#define	RDMA_MINCHUNK		1024
#define	RPC_CL_SZ		1024
#define	MINCHUNK		1024
#define	RPC_BUF_SIZE		2048

/*
 * NOTE(review): presumably the values passed as the int "wait" argument
 * of RDMA_READ() / RDMA_WRITE() -- confirm at the call sites.
 */
#define	NOWAIT			0
#define	WAIT			1

/*
 * XDR-over-RDMA flag bits.  Each value is a distinct single bit, so the
 * flags can be OR-ed together in one word.
 */
#define	XDR_RDMA_CHUNK		0x1
#define	XDR_RDMA_WLIST_REG	0x2
#define	XDR_RDMA_RLIST_REG	0x4

/* Buffer lengths: 64K, 32K and 32K.  NOTE(review): presumably bytes. */
#define	LONG_REPLY_LEN		65536
#define	WCL_BUF_LEN		32768
#define	RCL_BUF_LEN		32768

/*
 * Buffer counts.
 * NOTE(review): names suggest "requested by client" and "granted by
 * server" respectively -- confirm.
 */
#define	RDMA_BUFS_RQST		34
#define	RDMA_BUFS_GRANT		32
/*
 * Takes no arguments and returns a pointer to a struct xdr_ops.
 * NOTE(review): presumably the XDR operations vector for the RDMA XDR
 * stream -- confirm against the implementation.
 */
extern struct xdr_ops *xdrrdma_xops(void);
/*
 * Credit-control flavour, stored in struct conn as c_cc_type.
 * NOTE(review): presumably selects which member of the
 * rdma_conn_cred_ctrl_u union in struct conn is in use -- confirm.
 */
typedef enum rdma_cc_type {
	RDMA_CC_CLNT = 0,	/* client flavour */
	RDMA_CC_SRV = 1		/* server flavour */
} rdma_cc_type_t;
/*
 * Client-side credit-control state; embedded in struct conn as
 * rdma_conn_cred_ctrl_u.c_clnt_cc.
 * NOTE(review): member meanings are inferred from their names; the code
 * that maintains them is not in this header.
 */
typedef struct rdma_clnt_cred_ctrl {
	uint32_t	clnt_cc_granted_ops;	/* presumably ops granted */
	uint32_t	clnt_cc_in_flight_ops;	/* presumably ops in flight */
	kcondvar_t	clnt_cc_cv;		/* condition variable */
} rdma_clnt_cred_ctrl_t;
/*
 * Server-side credit-control state; embedded in struct conn as
 * rdma_conn_cred_ctrl_u.c_srv_cc.  Five 32-bit unsigned counters.
 * NOTE(review): member meanings are inferred from their names; the code
 * that maintains them is not in this header.
 */
typedef struct rdma_srv_cred_ctrl {
	uint32_t	srv_cc_buffers_granted;
	uint32_t	srv_cc_cur_buffers_used;
	uint32_t	srv_cc_posted;
	uint32_t	srv_cc_max_buf_size;	/* presumably bytes */
	uint32_t	srv_cc_cur_buf_size;	/* presumably bytes */
} rdma_srv_cred_ctrl_t;
/*
 * Write-handling mode for an RPC call.
 * NOTE(review): names suggest "write list", "write chunk" and
 * "no write" -- confirm against the code that switches on this type.
 */
typedef enum {
	RPCCALL_WLIST = 0,
	RPCCALL_WCHUNK = 1,
	RPCCALL_NOWRITE = 2
} rpccall_write_t;
/*
 * Registration type of a chunk-list entry (struct clist, c_regtype);
 * also the last argument of clist_register() and clist_syncmem().
 * Numbering starts at 1, so 0 is not a valid value of this type.
 */
typedef enum {
	CLIST_REG_SOURCE = 1,
	CLIST_REG_DST = 2
} clist_dstsrc;
/*
 * Status code returned by most entry points in struct rdmaops and by the
 * clist_*() and rdma_*() kernel routines declared in this header.
 * RDMA_SUCCESS is 0; every other code is non-zero.
 * NOTE(review): the precise condition behind each failure code is
 * defined by the code that returns it, which is not visible here.
 */
typedef enum {
	RDMA_SUCCESS		= 0,
	RDMA_INVAL		= 1,
	RDMA_TIMEDOUT		= 2,
	RDMA_INTR		= 3,
	RDMA_NORESOURCE		= 4,
	RDMA_REJECT		= 5,
	RDMA_NOLISTENER		= 6,
	RDMA_UNREACHABLE	= 7,
	RDMA_CONNLOST		= 8,
	RDMA_XPRTFAILED		= 9,
	RDMA_PROTECTERR		= 10,
	RDMA_OVERRUN		= 11,
	RDMA_RECVQEMPTY		= 12,
	RDMA_PROTFAILED		= 13,
	RDMA_NOTSUPP		= 14,
	RDMA_REMOTERR		= 15,
	RDMA_BADVERS		= 16,
	RDMA_REG_EXIST		= 17,
	RDMA_HCA_ATTACH		= 18,
	RDMA_HCA_DETACH		= 19,
	RDMA_FAILED		= 20
} rdma_stat;
/*
 * Memory-registration handle: one 32-bit value (mrc_rmr) plus a local
 * part held in lhdl.mr.  The union currently has a single member.
 * NOTE(review): "rmr"/"lmr" presumably mean remote/local memory-region
 * context -- confirm with the transport plug-in.
 */
struct mrc {
	uint32_t	mrc_rmr;
	union {
		struct mr {
			uint32_t	lmr;
			uint64_t	linfo;
		} mr;
	} lhdl;
};

/* Shorthand so the nested members read like direct members of struct mrc. */
#define	mrc_lmr		lhdl.mr.lmr
#define	mrc_linfo	lhdl.mr.linfo
/*
 * Kind tag for an rdma_buf_t (its "type" member).
 * NOTE(review): what distinguishes a *_BUFFER from a *_DESCRIPTOR is
 * decided by the transport plug-in and is not visible here.
 */
typedef enum {
	SEND_BUFFER = 0,
	SEND_DESCRIPTOR = 1,
	RECV_BUFFER = 2,
	RECV_DESCRIPTOR = 3,
	RDMA_LONG_BUFFER = 4
} rdma_btype;
/*
 * Descriptor for one RDMA buffer.  This is the object passed to
 * rdma_buf_alloc() / rdma_buf_free() and to the matching rdmaops entries.
 */
typedef struct rdma_buf {
	rdma_btype	type;		/* kind of buffer */
	uint_t		len;		/* length; presumably bytes */
	caddr_t		addr;		/* buffer address */
	struct mrc	handle;		/* memory-registration handle */
	caddr_t		rb_private;	/* opaque; owner not shown here */
} rdma_buf_t;
/*
 * One node of a singly linked chunk list (linked through c_next).
 * Each node carries a source half (c_smemhandle, c_ssynchandle, w) and
 * a destination half (c_dmemhandle, c_dsynchandle, u).  In both unions
 * the address is available either as a 64-bit integer or as a caddr_t.
 * NOTE(review): which union view is valid in which context is decided
 * by the users of this type, not by anything visible here.
 */
struct clist {
	uint32		c_xdroff;	/* presumably offset in XDR stream */
	uint32		c_len;		/* chunk length */
	clist_dstsrc	c_regtype;	/* registration type */
	struct mrc	c_smemhandle;	/* source memory handle */
	uint64		c_ssynchandle;	/* source sync handle */
	union {
		uint64	c_saddr;	/* source address, integer view */
		caddr_t	c_saddr3;	/* source address, pointer view */
	} w;
	struct mrc	c_dmemhandle;	/* destination memory handle */
	uint64		c_dsynchandle;	/* destination sync handle */
	union {
		uint64	c_daddr;	/* destination address, integer view */
		caddr_t	c_daddr3;	/* destination address, pointer view */
	} u;
	struct as	*c_adspc;	/* address space pointer */
	rdma_buf_t	rb_longbuf;	/* embedded RDMA buffer descriptor */
	struct clist	*c_next;	/* next node, or end of list */
};

/* Allow "clist" to be used without the struct keyword. */
typedef struct clist clist;
/* 4 MiB (4194304).  NOTE(review): presumably a server transfer cap in bytes. */
#define	MAX_SVC_XFER_SIZE	(4 * 1024 * 1024)
/*
 * RDMA message types.
 * NOTE(review): the names and values appear to match the rdma_proc
 * enumeration of the RPC-over-RDMA version 1 protocol (RFC 5666); if
 * so they are wire values and must not be renumbered -- confirm.
 */
enum rdma_proc {
	RDMA_MSG	= 0,
	RDMA_NOMSG	= 1,
	RDMA_MSGP	= 2,
	RDMA_DONE	= 3
};
/*
 * Argument block handed to the rdma_svc_listen() and rdma_svc_stop()
 * entries of struct rdmaops.
 * NOTE(review): member meanings are inferred from names and types.
 */
struct rdma_svc_data {
	queue_t		q;		/* embedded STREAMS queue */
	int		active;		/* presumably non-zero while active */
	rdma_stat	err_code;	/* status reported for the service */
	int32_t		svcid;		/* service identifier */
};
/*
 * Description of one RDMA transport module.  This is the object passed
 * to rdma_register_mod() / rdma_unregister_mod(); rdma_ops is the
 * operations vector that the RDMA_*() dispatch macros call through.
 */
typedef struct rdma_mod {
	char		*rdma_api;	/* API name string */
	uint_t		rdma_version;	/* presumably an RDMATF_VERS value */
	int		rdma_count;	/* NOTE(review): counted unit unknown */
	struct rdmaops	*rdma_ops;	/* transport operations vector */
} rdma_mod_t;
/*
 * Node of a singly linked list of registered transport modules, linked
 * through r_next (rdma_mod_head is declared with this type).
 */
typedef struct rdma_registry {
	rdma_mod_t		*r_mod;		/* the registered module */
	uint32_t		r_mod_state;	/* see RDMA_MOD_* below */
	struct rdma_registry	*r_next;	/* next registry node */
} rdma_registry_t;

/* NOTE(review): presumably the values stored in r_mod_state -- confirm. */
#define	RDMA_MOD_ACTIVE		1
#define	RDMA_MOD_INACTIVE	0
/*
 * Transport parameters filled in through the rdma_getinfo() entry of
 * struct rdmaops.
 * NOTE(review): member meanings are inferred from their names.
 */
typedef struct rdma_info {
	uint_t	addrlen;	/* address length */
	uint_t	mts;		/* presumably maximum transfer size */
	uint_t	mtu;		/* presumably maximum transmission unit */
} rdma_info_t;
/*
 * Connection state, stored in struct conn as c_state.  Every value is a
 * distinct single bit, so several states can be tested with one mask.
 */
typedef enum {
	C_IDLE		= 0x01,
	C_CONN_PEND	= 0x02,
	C_CONNECTED	= 0x04,
	C_ERROR_CONN	= 0x08,
	C_DISCONN_PEND	= 0x10,
	C_REMOTE_DOWN	= 0x20
} conn_c_state;

/*
 * Close-handling flag bits.
 * NOTE(review): presumably kept in c_flags of struct conn -- confirm.
 */
#define	C_CLOSE_NOTNEEDED	0x01
#define	C_CLOSE_PENDING		0x02
/*
 * One RDMA connection.  Nodes link to each other through c_next and
 * c_prev.  Every RDMA_*() macro that takes a connection dispatches
 * through c_rdmamod->rdma_ops.
 * NOTE(review): locking rules (what c_lock covers, who waits on c_cv)
 * are not expressed in this header -- confirm with the implementation.
 */
typedef struct conn {
	rdma_mod_t	*c_rdmamod;	/* owning transport module */
	char		*c_netid;	/* network identifier string */
	struct netbuf	c_raddr;	/* presumably remote address */
	struct netbuf	c_laddr;	/* presumably local address */
	struct netbuf	c_addrmask;	/* address mask */
	int		c_ref;		/* reference count */
	struct conn	*c_next;	/* next connection */
	struct conn	*c_prev;	/* previous connection */
	caddr_t		c_private;	/* opaque; owner not shown here */
	conn_c_state	c_state;	/* connection state bits */
	int		c_flags;	/* presumably C_CLOSE_* flags */
	rdma_cc_type_t	c_cc_type;	/* credit-control flavour */
	union {
		rdma_clnt_cred_ctrl_t	c_clnt_cc;
		rdma_srv_cred_ctrl_t	c_srv_cc;
	} rdma_conn_cred_ctrl_u;	/* credit-control state */
	kmutex_t	c_lock;		/* mutex for this connection */
	kcondvar_t	c_cv;		/* condition variable */
	timeout_id_t	c_timeout;	/* pending timeout identifier */
	time_t		c_last_used;	/* presumably last-activity time */
} CONN;
/*
 * Bundle describing one received message: the connection it belongs
 * to, a status value and the buffer descriptor for the RPC message.
 * NOTE(review): the encoding of "status" is not visible here.
 */
typedef struct rdma_recv_data {
	CONN		*conn;		/* connection the data belongs to */
	int		status;		/* receive status */
	rdma_buf_t	rpcmsg;		/* buffer holding the RPC message */
} rdma_recv_data_t;
/*
 * Kind tag for rdma_chunkinfo_t (its rci_type member).  Numbering
 * starts at 1, so 0 is not a valid value.
 * NOTE(review): the UIO/ADDR kinds presumably select the rci_uiop and
 * rci_addr views of the rci_a union respectively -- confirm.
 */
typedef enum {
	RCI_WRITE_UIO_CHUNK	= 1,
	RCI_WRITE_ADDR_CHUNK	= 2,
	RCI_REPLY_CHUNK		= 3
} rci_type_t;
/*
 * Description of one chunk request: its kind, the data location (as a
 * uio pointer or as a plain address), a length, and a pointer to the
 * chunk-list head pointer.
 * NOTE(review): whether rci_clpp is an input or an output is not
 * visible here.
 */
typedef struct {
	rci_type_t	rci_type;	/* kind of chunk */
	union {
		struct uio	*rci_uiop;	/* uio view of the data */
		caddr_t		rci_addr;	/* address view of the data */
	} rci_a;
	uint32		rci_len;	/* length; presumably bytes */
	struct clist	**rci_clpp;	/* chunk-list head pointer */
} rdma_chunkinfo_t;
/*
 * Pair of unsigned lengths.
 * NOTE(review): the difference between the primary and the "alt"
 * length is defined by the users of this type -- confirm there.
 */
typedef struct {
	uint_t	rcil_len;
	uint_t	rcil_len_alt;
} rdma_chunkinfo_lengths_t;
/*
 * Pairs a chunk list with a connection.
 * NOTE(review): "wlist" presumably means write list -- confirm.
 */
typedef struct {
	struct clist	*rwci_wlist;	/* chunk list */
	CONN		*rwci_conn;	/* associated connection */
} rdma_wlist_conn_info_t;
/*
 * Operations vector supplied by an RDMA transport module
 * (rdma_mod_t.rdma_ops).  Each entry has a matching RDMA_*() dispatch
 * macro except rdma_svc_listen and rdma_svc_stop, which have none in
 * this header.  All entries return rdma_stat except rdma_svc_listen,
 * rdma_svc_stop and rdma_buf_free, which return nothing.
 * The group headings below only reflect the entry names.
 */
typedef struct rdmaops {
	/* Connection management */
	rdma_stat	(*rdma_reachable)(int addr_type, struct netbuf *,
			    void **handle);
	rdma_stat	(*rdma_get_conn)(struct netbuf *, struct netbuf *,
			    int addr_type, void *, CONN **);
	rdma_stat	(*rdma_rel_conn)(CONN *);

	/* Service listen / stop */
	void		(*rdma_svc_listen)(struct rdma_svc_data *);
	void		(*rdma_svc_stop)(struct rdma_svc_data *);

	/* Memory registration and synchronisation */
	rdma_stat	(*rdma_regmem)(CONN *, caddr_t, caddr_t,
			    uint_t, struct mrc *);
	rdma_stat	(*rdma_deregmem)(CONN *, caddr_t, struct mrc);
	rdma_stat	(*rdma_regmemsync)(CONN *, caddr_t, caddr_t, uint_t,
			    struct mrc *, void **, void *);
	rdma_stat	(*rdma_deregmemsync)(CONN *, caddr_t, struct mrc,
			    void *, void *);
	rdma_stat	(*rdma_syncmem)(CONN *, void *, caddr_t, int, int);

	/* Buffer management */
	rdma_stat	(*rdma_buf_alloc)(CONN *, rdma_buf_t *);
	void		(*rdma_buf_free)(CONN *, rdma_buf_t *);

	/* Send and receive; the uint32_t is named xid in the macros */
	rdma_stat	(*rdma_send)(CONN *, clist *, uint32_t);
	rdma_stat	(*rdma_send_resp)(CONN *, clist *, uint32_t);
	rdma_stat	(*rdma_clnt_recvbuf)(CONN *, clist *, uint32_t);
	rdma_stat	(*rdma_clnt_recvbuf_remove)(CONN *, uint32_t);
	rdma_stat	(*rdma_svc_recvbuf)(CONN *, clist *);
	rdma_stat	(*rdma_recv)(CONN *, clist **, uint32_t);

	/* RDMA read / write; the int is named wait in the macros */
	rdma_stat	(*rdma_read)(CONN *, clist *, int);
	rdma_stat	(*rdma_write)(CONN *, clist *, int);

	/* Transport parameters */
	rdma_stat	(*rdma_getinfo)(rdma_info_t *info);
} rdmaops_t;
/*
 * A mutex, a condition variable and a status value grouped together.
 * NOTE(review): presumably svc_lock protects svc_stat and svc_cv is
 * signalled when it changes (cf. rdma_kwait()) -- confirm.
 */
typedef struct rdma_svc_wait {
	kmutex_t	svc_lock;
	kcondvar_t	svc_cv;
	rdma_stat	svc_stat;
} rdma_svc_wait_t;

/* Single shared instance; defined outside this header. */
extern rdma_svc_wait_t	rdma_wait;
/*
 * Dispatch macros for connection management.
 *
 * RDMA_REACHABLE and RDMA_GET_CONN take the operations vector directly,
 * since no connection exists yet.  RDMA_REL_CONN finds the vector via
 * conn->c_rdmamod->rdma_ops; "conn" is expanded twice, so it must not
 * have side effects.  Each macro yields the rdma_stat returned by the
 * underlying entry point.
 */
#define	RDMA_REACHABLE(rdma_ops, addr_type, addr, handle)	\
	((rdma_ops)->rdma_reachable((addr_type), (addr), (handle)))

#define	RDMA_GET_CONN(rdma_ops, saddr, daddr, addr_type, handle, conn)	\
	((rdma_ops)->rdma_get_conn((saddr), (daddr), (addr_type),	\
	    (handle), (conn)))

#define	RDMA_REL_CONN(conn)	\
	((conn)->c_rdmamod->rdma_ops->rdma_rel_conn((conn)))
/*
 * Dispatch macros for memory registration, synchronisation and buffer
 * management.  Each one calls the like-named entry of
 * conn->c_rdmamod->rdma_ops, passing "conn" as the first argument and
 * the remaining macro arguments unchanged and in order.  "conn" is
 * expanded twice, so it must not have side effects.
 */
#define	RDMA_REGMEM(conn, adsp, buff, len, handle)	\
	((conn)->c_rdmamod->rdma_ops->rdma_regmem((conn), (adsp),	\
	    (buff), (len), (handle)))

#define	RDMA_DEREGMEM(conn, buff, handle)	\
	((conn)->c_rdmamod->rdma_ops->rdma_deregmem((conn), (buff),	\
	    (handle)))

#define	RDMA_REGMEMSYNC(conn, adsp, buff, len, handle, synchandle, lrc)	\
	((conn)->c_rdmamod->rdma_ops->rdma_regmemsync((conn), (adsp),	\
	    (buff), (len), (handle), (synchandle), (lrc)))

#define	RDMA_DEREGMEMSYNC(conn, buff, handle, synchandle, lrc)	\
	((conn)->c_rdmamod->rdma_ops->rdma_deregmemsync((conn), (buff),	\
	    (handle), (synchandle), (lrc)))

#define	RDMA_SYNCMEM(conn, handle, buff, len, direction)	\
	((conn)->c_rdmamod->rdma_ops->rdma_syncmem((conn), (handle),	\
	    (buff), (len), (direction)))

#define	RDMA_BUF_ALLOC(conn, rbuf)	\
	((conn)->c_rdmamod->rdma_ops->rdma_buf_alloc((conn), (rbuf)))

#define	RDMA_BUF_FREE(conn, rbuf)	\
	((conn)->c_rdmamod->rdma_ops->rdma_buf_free((conn), (rbuf)))
/*
 * Dispatch macros for send, receive, RDMA read/write and transport
 * information.  The conn-based macros call the like-named entry of
 * conn->c_rdmamod->rdma_ops with "conn" as first argument; "conn" is
 * expanded twice, so it must not have side effects.  RDMA_GETINFO takes
 * the module (rdma_mod_t *) instead of a connection and does not pass
 * it on to the entry point.
 */
#define	RDMA_SEND(conn, sendlist, xid)	\
	((conn)->c_rdmamod->rdma_ops->rdma_send((conn), (sendlist), (xid)))

#define	RDMA_SEND_RESP(conn, sendlist, xid)	\
	((conn)->c_rdmamod->rdma_ops->rdma_send_resp((conn), (sendlist), \
	    (xid)))

#define	RDMA_CLNT_RECVBUF(conn, cl, xid)	\
	((conn)->c_rdmamod->rdma_ops->rdma_clnt_recvbuf((conn), (cl), (xid)))

#define	RDMA_CLNT_RECVBUF_REMOVE(conn, xid)	\
	((conn)->c_rdmamod->rdma_ops->rdma_clnt_recvbuf_remove((conn), (xid)))

#define	RDMA_SVC_RECVBUF(conn, cl)	\
	((conn)->c_rdmamod->rdma_ops->rdma_svc_recvbuf((conn), (cl)))

#define	RDMA_RECV(conn, recvlist, xid)	\
	((conn)->c_rdmamod->rdma_ops->rdma_recv((conn), (recvlist), (xid)))

#define	RDMA_READ(conn, cl, wait)	\
	((conn)->c_rdmamod->rdma_ops->rdma_read((conn), (cl), (wait)))

#define	RDMA_WRITE(conn, cl, wait)	\
	((conn)->c_rdmamod->rdma_ops->rdma_write((conn), (cl), (wait)))

#define	RDMA_GETINFO(rdma_mod, info)	\
	((rdma_mod)->rdma_ops->rdma_getinfo((info)))
#ifdef _KERNEL
/*
 * Kernel-global RDMA state; all defined outside this header.
 * NOTE(review): the descriptions are inferred from names and types;
 * in particular the pairing of locks with the data they guard is not
 * visible here.
 */
extern rdma_registry_t	*rdma_mod_head;		/* registered-module list */
extern krwlock_t	rdma_lock;		/* reader/writer lock */
extern int		rdma_modloaded;		/* module-loaded indicator */
extern int		rdma_dev_available;	/* device-available indicator */
extern kmutex_t		rdma_modload_lock;	/* mutex */
extern uint_t		rdma_minchunk;		/* cf. RDMA_MINCHUNK */
extern ldi_ident_t	rpcmod_li;		/* LDI identifier */
/*
 * Chunk-list (struct clist) helpers.
 * NOTE(review): the argument types of clist_add() line up with the
 * c_xdroff, c_len, c_smemhandle, c_saddr, c_dmemhandle and c_daddr
 * members of struct clist, in that order, which suggests it adds one
 * entry built from those values -- confirm against the definition.
 */
extern struct clist	*clist_alloc(void);
extern void		clist_add(struct clist **, uint32_t, int,
			    struct mrc *, caddr_t,
			    struct mrc *, caddr_t);
extern void		clist_free(struct clist *);
extern uint32_t		clist_len(struct clist *);
extern void		clist_zero_len(struct clist *);

/* Registration and synchronisation of a chunk list on a connection. */
extern rdma_stat	clist_register(CONN *conn, struct clist *cl,
			    clist_dstsrc);
extern rdma_stat	clist_deregister(CONN *conn, struct clist *cl);
extern rdma_stat	clist_syncmem(CONN *conn, struct clist *cl,
			    clist_dstsrc);
/*
 * Kernel RDMA support routines.  Only the signatures are visible here;
 * the behaviour is defined with the implementations.
 */

/* Receive posting on a connection; xid identifies the client request. */
extern rdma_stat rdma_clnt_postrecv(CONN *conn, uint32_t xid);
extern rdma_stat rdma_clnt_postrecv_remove(CONN *conn, uint32_t xid);
extern rdma_stat rdma_svc_postrecv(CONN *conn);

/* Transport module registration. */
extern rdma_stat rdma_register_mod(rdma_mod_t *mod);
extern rdma_stat rdma_unregister_mod(rdma_mod_t *mod);

/* Buffer management; same signatures as the like-named rdmaops entries. */
extern rdma_stat rdma_buf_alloc(CONN *, rdma_buf_t *);
extern void rdma_buf_free(CONN *, rdma_buf_t *);

/*
 * Declared with (void) rather than an empty parameter list, so the
 * compiler rejects calls that pass arguments.  An empty list leaves
 * the parameters unspecified in C before C23.
 */
extern int rdma_modload(void);

extern bool_t rdma_get_wchunk(struct svc_req *, iovec_t *, struct clist *);
extern rdma_stat rdma_kwait(void);
extern int rdma_setup_read_chunks(struct clist *, uint32_t, int *);
/*
 * XDR-over-RDMA routines.  Only the signatures are visible here; the
 * group headings below reflect the function names, not verified
 * behaviour.  Every prototype carries an explicit "extern".
 */

/* Stream creation, teardown and positioning. */
extern void		xdrrdma_create(XDR *, caddr_t, uint_t, int,
			    struct clist *, enum xdr_op, CONN *);
extern void		xdrrdma_destroy(XDR *);
extern uint_t		xdrrdma_getpos(XDR *);
extern bool_t		xdrrdma_setpos(XDR *, uint_t);

/* Chunk-list XDR routines and sizing helpers. */
extern bool_t		xdr_clist(XDR *, clist *);
extern bool_t		xdr_do_clist(XDR *, clist **);
extern uint_t		xdr_getbufsize(XDR *);
extern unsigned int	xdrrdma_sizeof(xdrproc_t, void *, int, uint_t *,
			    uint_t *);
extern unsigned int	xdrrdma_authsize(AUTH *, struct cred *, int);

/* Write-list storage, decode and encode. */
extern void		xdrrdma_store_wlist(XDR *, struct clist *);
extern struct clist	*xdrrdma_wclist(XDR *);
extern bool_t		xdr_decode_reply_wchunk(XDR *, struct clist **);
extern bool_t		xdr_decode_wlist(XDR *xdrs, struct clist **,
			    bool_t *);
extern bool_t		xdr_decode_wlist_svc(XDR *xdrs, struct clist **,
			    bool_t *, uint32_t *, CONN *);
extern bool_t		xdr_encode_rlist_svc(XDR *, clist *);
extern bool_t		xdr_encode_wlist(XDR *, clist *);
extern bool_t		xdr_encode_reply_wchunk(XDR *, struct clist *,
			    uint32_t seg_array_len);

/* RDMA block transfer and chunk-list cleanup. */
extern bool_t		xdrrdma_getrdmablk(XDR *, struct clist **, uint_t *,
			    CONN **conn, const uint_t);
extern bool_t		xdrrdma_read_from_client(struct clist *, CONN **,
			    uint_t);
extern bool_t		xdrrdma_send_read_data(XDR *, uint_t, struct clist *);
extern bool_t		xdrrdma_free_clist(CONN *, struct clist *);
#endif
#ifdef __cplusplus
}
#endif
#endif