#include <sys/param.h>
#include <sys/types.h>
#include <sys/systm.h>
#include <sys/cred.h>
#include <sys/vfs.h>
#include <sys/vnode.h>
#include <sys/pathname.h>
#include <sys/sysmacros.h>
#include <sys/kmem.h>
#include <sys/kstat.h>
#include <sys/mkdev.h>
#include <sys/mount.h>
#include <sys/statvfs.h>
#include <sys/errno.h>
#include <sys/debug.h>
#include <sys/cmn_err.h>
#include <sys/utsname.h>
#include <sys/bootconf.h>
#include <sys/modctl.h>
#include <sys/acl.h>
#include <sys/flock.h>
#include <sys/kstr.h>
#include <sys/stropts.h>
#include <sys/strsubr.h>
#include <sys/atomic.h>
#include <sys/disp.h>
#include <sys/policy.h>
#include <sys/list.h>
#include <sys/zone.h>
#include <rpc/types.h>
#include <rpc/auth.h>
#include <rpc/rpcsec_gss.h>
#include <rpc/clnt.h>
#include <rpc/xdr.h>
#include <nfs/nfs.h>
#include <nfs/nfs_clnt.h>
#include <nfs/mount.h>
#include <nfs/nfs_acl.h>
#include <fs/fs_subr.h>
#include <nfs/nfs4.h>
#include <nfs/rnode4.h>
#include <nfs/nfs4_clnt.h>
#include <nfs/nfssys.h>
#ifdef DEBUG
/*
 * Debug-only wildcards.  cb_recall() treats a stateid equal to
 * nfs4_deleg_any as a match, and cb_getattr() treats a file handle equal to
 * nfs4_deleg_anyfh as a match, for the rnode currently being examined.
 */
stateid4 nfs4_deleg_any = { 0x7FFFFFF0 };
char nfs4_deleg_fh[] = "\0377\0376\0375\0374";
/* the length excludes the string literal's terminating NUL */
nfs_fh4 nfs4_deleg_anyfh = { sizeof (nfs4_deleg_fh)-1, nfs4_deleg_fh };
/*
 * Error injection hooks: when set to anything other than NFS4_OK,
 * cb_getattr() / cb_recall() return that status immediately.
 */
nfsstat4 cb4_getattr_fail = NFS4_OK;
nfsstat4 cb4_recall_fail = NFS4_OK;
/*
 * Debug switches passed to NFS4_DEBUG().  nfs4_callback_debug is used by the
 * CB_NOTE/CB_WARN macros and nfs4_drat_debug by delegreturn_all_thread();
 * nfs4_recall_debug is not referenced in the visible part of this file.
 */
int nfs4_callback_debug;
int nfs4_recall_debug;
int nfs4_drat_debug;
#endif
/*
 * Shorthand for callback debug messages.  Each expands to NFS4_DEBUG() keyed
 * on nfs4_callback_debug with the given cmn_err level.
 * NOTE(review): nfs4_callback_debug is only defined under DEBUG above, so
 * NFS4_DEBUG() presumably compiles to nothing otherwise -- confirm.
 */
#define CB_NOTE(x) NFS4_DEBUG(nfs4_callback_debug, (CE_NOTE, x))
#define CB_WARN(x) NFS4_DEBUG(nfs4_callback_debug, (CE_WARN, x))
#define CB_WARN1(x, y) NFS4_DEBUG(nfs4_callback_debug, (CE_WARN, x, y))
/* Delegation return policy; initialised to INACTIVE. */
enum nfs4_delegreturn_policy nfs4_delegreturn_policy = INACTIVE;
/* Zone key under which each zone's struct nfs4_callback_globals is stored. */
static zone_key_t nfs4_callback_zone_key;
/*
 * Bitmap sizing constants.
 *
 * NFS4_MAPWORDS is NFS4_MAPSIZE divided by sizeof (uint_t); NbPW is NBBY
 * multiplied by sizeof (uint_t).  Both expansions are fully parenthesized so
 * they behave as a single operand inside larger expressions (for example
 * "x % NFS4_MAPWORDS").
 */
#define NFS4_MAPSIZE 8192
#define NFS4_MAPWORDS (NFS4_MAPSIZE/sizeof (uint_t))
#define NbPW (NBBY*sizeof (uint_t))
/*
 * Number of callback RPC program numbers, starting at NFS4_CALLBACK.  It
 * sizes each zone's nfs4prog2server table and the callout table below.
 */
static int nfs4_num_prognums = 1024;
/* Callout table filled in by nfs4_callback_init() and passed to svc_tli_kcreate(). */
static SVC_CALLOUT_TABLE nfs4_cb_sct;
/*
 * Element type of the per-zone nfs4_dlist (see the list_create() call in
 * nfs4_callback_init_zone()): an rnode together with a flags word.
 */
struct nfs4_dnode {
list_node_t linkage;
rnode4_t *rnodep;
int flags;
};
/*
 * Template for the per-zone callback kstat counters.
 * nfs4_callback_init_zone() copies it into each zone's nfs4_callback_stats
 * before installing the "nfs4_callback_stats" kstat.  Every counter is a
 * 64-bit unsigned named kstat.
 */
static const struct nfs4_callback_stats nfs4_callback_stats_tmpl = {
{ "delegations", KSTAT_DATA_UINT64 },
{ "cb_getattr", KSTAT_DATA_UINT64 },
{ "cb_recall", KSTAT_DATA_UINT64 },
{ "cb_null", KSTAT_DATA_UINT64 },
{ "cb_dispatch", KSTAT_DATA_UINT64 },
{ "delegaccept_r", KSTAT_DATA_UINT64 },
{ "delegaccept_rw", KSTAT_DATA_UINT64 },
{ "delegreturn", KSTAT_DATA_UINT64 },
{ "callbacks", KSTAT_DATA_UINT64 },
{ "claim_cur", KSTAT_DATA_UINT64 },
{ "claim_cur_ok", KSTAT_DATA_UINT64 },
{ "recall_trunc", KSTAT_DATA_UINT64 },
{ "recall_failed", KSTAT_DATA_UINT64 },
{ "return_limit_write", KSTAT_DATA_UINT64 },
{ "return_limit_addmap", KSTAT_DATA_UINT64 },
{ "deleg_recover", KSTAT_DATA_UINT64 },
{ "cb_illegal", KSTAT_DATA_UINT64 }
};
/*
 * One callback transport endpoint on the per-zone nfs4_cb_ports list.
 * nfs4_setport() creates or updates entries keyed by netid; nfs4_cb_args()
 * looks entries up by protofmly/proto and hands out netid and uaddr.
 */
struct nfs4_cb_port {
list_node_t linkage;
char netid[KNC_STRSIZE];
char uaddr[KNC_STRSIZE];
char protofmly[KNC_STRSIZE];
char proto[KNC_STRSIZE];
};
/*
 * Size in bytes of the attribute buffer allocated by cb_getattr() and freed
 * by cb_getattr_free(); set once in nfs4_callback_init().
 */
static int cb_getattr_bytes;
/*
 * Argument bundle allocated by nfs4delegreturn_async() and passed to the
 * nfs4delegreturn_thread() it creates.
 */
struct cb_recall_pass {
rnode4_t *rp;
int flags;
bool_t truncate;
};
/* Forward declarations for file-local helpers used before their definitions. */
static nfs4_open_stream_t *get_next_deleg_stream(rnode4_t *, int);
static void nfs4delegreturn_thread(struct cb_recall_pass *);
static int deleg_reopen(vnode_t *, bool_t *, struct nfs4_callback_globals *,
int);
static void nfs4_dlistadd(rnode4_t *, struct nfs4_callback_globals *, int);
static void nfs4_dlistclean_impl(struct nfs4_callback_globals *, int);
static int nfs4delegreturn_impl(rnode4_t *, int,
struct nfs4_callback_globals *);
static void nfs4delegreturn_cleanup_impl(rnode4_t *, nfs4_server_t *,
struct nfs4_callback_globals *);
/*
 * cb_getattr: handle the CB_GETATTR callback operation.
 *
 * Finds the nfs4_server registered for the request's RPC program number,
 * looks for an rnode on its delegation list whose file handle matches
 * args->fh, and encodes the requested subset of { change, size } into a
 * freshly allocated buffer of cb_getattr_bytes bytes.  The buffer is hung
 * off resp->obj_attributes.attrlist4 and released later by
 * cb_getattr_free().
 *
 * The outcome is stored in both resp->status and *cs->statusp:
 * NFS4ERR_BADHANDLE if the server cannot be locked, its program number does
 * not match the request, or no delegated rnode has the file handle;
 * NFS4_OK otherwise.
 */
static void
cb_getattr(nfs_cb_argop4 *argop, nfs_cb_resop4 *resop, struct svc_req *req,
    struct compound_state *cs, struct nfs4_callback_globals *ncg)
{
	CB_GETATTR4args *args = &argop->nfs_cb_argop4_u.opcbgetattr;
	CB_GETATTR4res *resp = &resop->nfs_cb_resop4_u.opcbgetattr;
	rnode4_t *rp;
	vnode_t *vp;
	bool_t found = FALSE;
	struct nfs4_server *sp;
	struct fattr4 *fap;
	rpc_inline_t *fdata;
	long mapcnt;
	fattr4_change change;
	fattr4_size size;
	uint_t rflag;

	ncg->nfs4_callback_stats.cb_getattr.value.ui64++;

	/*
	 * rq_prog is used below as an index into nfs4prog2server; apply the
	 * same sanity checks that cb_recall() and cb_null() perform.
	 */
	ASSERT(req->rq_prog >= NFS4_CALLBACK);
	ASSERT(req->rq_prog < NFS4_CALLBACK+nfs4_num_prognums);

#ifdef DEBUG
	/* error injection hook: fail the op with the configured status */
	if (cb4_getattr_fail != NFS4_OK) {
		*cs->statusp = resp->status = cb4_getattr_fail;
		return;
	}
#endif

	resp->obj_attributes.attrmask = 0;

	mutex_enter(&ncg->nfs4_cb_lock);
	sp = ncg->nfs4prog2server[req->rq_prog - NFS4_CALLBACK];
	mutex_exit(&ncg->nfs4_cb_lock);

	if (nfs4_server_vlock(sp, 0) == FALSE) {
		CB_WARN("cb_getattr: cannot find server\n");
		*cs->statusp = resp->status = NFS4ERR_BADHANDLE;
		return;
	}

	/*
	 * From here on sp->s_lock is held; every exit path below drops it
	 * and calls nfs4_server_rele().
	 *
	 * The server found through the program table must itself be
	 * registered under the request's program number; otherwise fail.
	 */
	if (sp->s_program != req->rq_prog) {
#ifdef DEBUG
		zcmn_err(getzoneid(), CE_WARN,
		    "cb_getattr: wrong server program number srv=%d req=%d\n",
		    sp->s_program, req->rq_prog);
#else
		zcmn_err(getzoneid(), CE_WARN,
		    "cb_getattr: wrong server program number\n");
#endif
		mutex_exit(&sp->s_lock);
		nfs4_server_rele(sp);
		*cs->statusp = resp->status = NFS4ERR_BADHANDLE;
		return;
	}

	/* Find the delegated rnode whose file handle matches the request. */
	rp = list_head(&sp->s_deleg_list);
	for (; rp != NULL; rp = list_next(&sp->s_deleg_list, rp)) {
		nfs4_fhandle_t fhandle;

		sfh4_copyval(rp->r_fh, &fhandle);

		if ((fhandle.fh_len == args->fh.nfs_fh4_len &&
		    bcmp(fhandle.fh_buf, args->fh.nfs_fh4_val,
		    fhandle.fh_len) == 0)) {
			found = TRUE;
			break;
		}
#ifdef DEBUG
		/* debug wildcard: this file handle matches any delegation */
		if (nfs4_deleg_anyfh.nfs_fh4_len == args->fh.nfs_fh4_len &&
		    bcmp(nfs4_deleg_anyfh.nfs_fh4_val, args->fh.nfs_fh4_val,
		    args->fh.nfs_fh4_len) == 0) {
			found = TRUE;
			break;
		}
#endif
	}

	/* Hold the vnode while s_lock still protects the list entry. */
	if (found == TRUE) {
		vp = RTOV4(rp);
		VN_HOLD(vp);
	}

	mutex_exit(&sp->s_lock);
	nfs4_server_rele(sp);

	if (found == FALSE) {
		CB_WARN("cb_getattr: bad fhandle\n");
		*cs->statusp = resp->status = NFS4ERR_BADHANDLE;
		return;
	}

	/*
	 * Only FATTR4_CHANGE and FATTR4_SIZE are supplied; any other
	 * requested attribute bits are ignored.  The values are encoded
	 * directly into the buffer with the inline XDR macros.
	 */
	fdata = kmem_alloc(cb_getattr_bytes, KM_SLEEP);

	fap = &resp->obj_attributes;
	fap->attrmask = 0;
	/* attrlist4_len grows as each attribute is appended */
	fap->attrlist4 = (char *)fdata;
	fap->attrlist4_len = 0;

	if (args->attr_request != 0) {
		if (args->attr_request & FATTR4_CHANGE_MASK) {
			mutex_enter(&rp->r_statelock);
			mapcnt = rp->r_mapcnt;
			rflag = rp->r_flags;
			mutex_exit(&rp->r_statelock);

			mutex_enter(&rp->r_statev4_lock);
			/*
			 * With a non-zero r_mapcnt, always report a new
			 * change value.  Otherwise, if R4DIRTY is clear,
			 * reset the change value to the one recorded in
			 * r_deleg_change_grant; if it is set, report the
			 * current value unchanged.
			 */
			if (mapcnt)
				rp->r_deleg_change++;
			else if (! (rflag & R4DIRTY))
				rp->r_deleg_change = rp->r_deleg_change_grant;
			change = rp->r_deleg_change;
			mutex_exit(&rp->r_statev4_lock);

			IXDR_PUT_U_HYPER(fdata, change);
			fap->attrlist4_len += 2 * BYTES_PER_XDR_UNIT;
			fap->attrmask |= FATTR4_CHANGE_MASK;
		}

		if (args->attr_request & FATTR4_SIZE_MASK) {
			/* atomic add of 0: read r_size without taking a lock */
			size = atomic_add_64_nv((uint64_t *)&rp->r_size, 0);

			IXDR_PUT_U_HYPER(fdata, size);
			fap->attrlist4_len += 2 * BYTES_PER_XDR_UNIT;
			fap->attrmask |= FATTR4_SIZE_MASK;
		}
	}

	VN_RELE(vp);

	*cs->statusp = resp->status = NFS4_OK;
}
/*
 * cb_getattr_free: release the attribute buffer that cb_getattr() attached
 * to a CB_GETATTR result, if there is one.
 */
static void
cb_getattr_free(nfs_cb_resop4 *resop)
{
	char *attrs =
	    resop->nfs_cb_resop4_u.opcbgetattr.obj_attributes.attrlist4;

	/* nothing was allocated (e.g. the op failed before encoding) */
	if (!attrs)
		return;

	kmem_free(attrs, cb_getattr_bytes);
}
/*
 * cb_recall: handle the CB_RECALL callback operation.
 *
 * Finds the nfs4_server registered for the request's RPC program number and
 * searches its delegation list for an rnode whose delegation stateid AND
 * file handle both match the arguments.  On a match the vnode is held and
 * the rnode is handed to nfs4delegreturn_async() with
 * NFS4_DR_RECALL|NFS4_DR_REOPEN and the caller's truncate flag.
 *
 * The outcome is stored in both resp->status and *cs->statusp:
 * NFS4ERR_BADHANDLE if the server cannot be locked, NFS4ERR_BAD_STATEID if
 * no delegation matches, 0 otherwise.
 */
static void
cb_recall(nfs_cb_argop4 *argop, nfs_cb_resop4 *resop, struct svc_req *req,
struct compound_state *cs, struct nfs4_callback_globals *ncg)
{
CB_RECALL4args * args = &argop->nfs_cb_argop4_u.opcbrecall;
CB_RECALL4res *resp = &resop->nfs_cb_resop4_u.opcbrecall;
rnode4_t *rp;
vnode_t *vp;
struct nfs4_server *sp;
bool_t found = FALSE;
ncg->nfs4_callback_stats.cb_recall.value.ui64++;
/* rq_prog is used below as an index into nfs4prog2server */
ASSERT(req->rq_prog >= NFS4_CALLBACK);
ASSERT(req->rq_prog < NFS4_CALLBACK+nfs4_num_prognums);
#ifdef DEBUG
/* error injection hook: fail the op with the configured status */
if (cb4_recall_fail != NFS4_OK) {
*cs->statusp = resp->status = cb4_recall_fail;
return;
}
#endif
mutex_enter(&ncg->nfs4_cb_lock);
sp = ncg->nfs4prog2server[req->rq_prog - NFS4_CALLBACK];
mutex_exit(&ncg->nfs4_cb_lock);
if (nfs4_server_vlock(sp, 0) == FALSE) {
CB_WARN("cb_recall: cannot find server\n");
*cs->statusp = resp->status = NFS4ERR_BADHANDLE;
return;
}
/*
 * sp->s_lock is held from here until the mutex_exit() after the search.
 * Each candidate's r_statev4_lock is taken while it is compared; note that
 * both "break" statements leave that lock held for the matching rnode.
 */
rp = list_head(&sp->s_deleg_list);
for (; rp != NULL; rp = list_next(&sp->s_deleg_list, rp)) {
mutex_enter(&rp->r_statev4_lock);
/* the stateid must match first, then the file handle */
if ((bcmp(&rp->r_deleg_stateid, &args->stateid,
sizeof (stateid4)) == 0)) {
nfs4_fhandle_t fhandle;
sfh4_copyval(rp->r_fh, &fhandle);
if ((fhandle.fh_len == args->fh.nfs_fh4_len &&
bcmp(fhandle.fh_buf, args->fh.nfs_fh4_val,
fhandle.fh_len) == 0)) {
found = TRUE;
break;
} else {
#ifdef DEBUG
CB_WARN("cb_recall: stateid OK, bad fh");
#endif
}
}
#ifdef DEBUG
/* debug wildcard: this stateid matches any delegation */
if (bcmp(&args->stateid, &nfs4_deleg_any,
sizeof (stateid4)) == 0) {
found = TRUE;
break;
}
#endif
mutex_exit(&rp->r_statev4_lock);
}
/*
 * Release the r_statev4_lock left held by the break, then hold the vnode
 * while s_lock still protects the list entry.
 * NOTE(review): the hold is not released in this function; presumably the
 * delegreturn thread drops it -- confirm.
 */
if (found == TRUE) {
mutex_exit(&rp->r_statev4_lock);
vp = RTOV4(rp);
VN_HOLD(vp);
}
mutex_exit(&sp->s_lock);
nfs4_server_rele(sp);
if (found == FALSE) {
CB_WARN("cb_recall: bad stateid\n");
*cs->statusp = resp->status = NFS4ERR_BAD_STATEID;
return;
}
/* return the delegation from a separate thread */
nfs4delegreturn_async(rp, NFS4_DR_RECALL|NFS4_DR_REOPEN,
args->truncate);
*cs->statusp = resp->status = 0;
}
/*
 * cb_recall_free: free routine for a CB_RECALL result.  cb_recall()
 * allocates nothing in the result, so there is nothing to release; the
 * function exists so cb_compound_free() can treat every op uniformly.
 */
static void
cb_recall_free(nfs_cb_resop4 *resop)
{
}
/*
 * cb_null: handle the CB_NULL procedure.
 *
 * If the nfs4_server registered for the request's program number can be
 * locked, mark it N4S_CB_PINGED and wake every thread waiting on
 * wait_cb_null.  The args and resp parameters are not used.
 */
static void
cb_null(CB_COMPOUND4args *args, CB_COMPOUND4res *resp, struct svc_req *req,
    struct nfs4_callback_globals *ncg)
{
	struct nfs4_server *server;

	ncg->nfs4_callback_stats.cb_null.value.ui64++;

	/* rq_prog is used below as an index into nfs4prog2server */
	ASSERT(req->rq_prog >= NFS4_CALLBACK);
	ASSERT(req->rq_prog < NFS4_CALLBACK+nfs4_num_prognums);

	mutex_enter(&ncg->nfs4_cb_lock);
	server = ncg->nfs4prog2server[req->rq_prog - NFS4_CALLBACK];
	mutex_exit(&ncg->nfs4_cb_lock);

	/* no usable server for this program number: nothing to record */
	if (nfs4_server_vlock(server, 0) == FALSE)
		return;

	server->s_flags |= N4S_CB_PINGED;
	cv_broadcast(&server->wait_cb_null);

	mutex_exit(&server->s_lock);
	nfs4_server_rele(server);
}
/*
 * cb_illegal: produce the result for an illegal or unrecognised callback
 * operation.  The result opcode is forced to OP_CB_ILLEGAL and the status,
 * both in the result and in *cs->statusp, is NFS4ERR_OP_ILLEGAL.
 */
static void
cb_illegal(nfs_cb_argop4 *argop, nfs_cb_resop4 *resop, struct svc_req *req,
    struct compound_state *cs, struct nfs4_callback_globals *ncg)
{
	CB_ILLEGAL4res *result = &resop->nfs_cb_resop4_u.opcbillegal;

	ncg->nfs4_callback_stats.cb_illegal.value.ui64++;

	resop->resop = OP_CB_ILLEGAL;
	result->status = NFS4ERR_OP_ILLEGAL;
	*cs->statusp = result->status;
}
/*
 * cb_compound: execute a CB_COMPOUND request.
 *
 * Copies the request tag into the reply, rejects any minor version other
 * than CB4_MINORVERSION, then runs each operation in order until one
 * returns a status other than NFS4_OK.  resp->status always holds the
 * status of the last operation executed (the ops write it through
 * cs.statusp).  Memory allocated here for the tag and the result array is
 * released by cb_compound_free().
 */
static void
cb_compound(CB_COMPOUND4args *args, CB_COMPOUND4res *resp, struct svc_req *req,
struct nfs4_callback_globals *ncg)
{
uint_t i;
struct compound_state cs;
nfs_cb_argop4 *argop;
nfs_cb_resop4 *resop, *new_res;
uint_t op;
bzero(&cs, sizeof (cs));
/* ops report their status straight into the compound reply */
cs.statusp = &resp->status;
cs.cont = TRUE;
/* build the reply tag as a copy of the request tag */
resp->tag.utf8string_len = args->tag.utf8string_len;
if (args->tag.utf8string_len != 0) {
resp->tag.utf8string_val =
kmem_alloc(resp->tag.utf8string_len, KM_SLEEP);
bcopy(args->tag.utf8string_val, resp->tag.utf8string_val,
args->tag.utf8string_len);
} else {
resp->tag.utf8string_val = NULL;
}
/* only CB4_MINORVERSION is accepted; reply with an empty result array */
if (args->minorversion != CB4_MINORVERSION) {
resp->array_len = 0;
resp->array = NULL;
resp->status = NFS4ERR_MINOR_VERS_MISMATCH;
return;
}
#ifdef DEBUG
/* a mismatched callback_ident is only reported, not rejected */
if (args->callback_ident != req->rq_prog)
zcmn_err(getzoneid(), CE_WARN,
"cb_compound: cb_client using wrong "
"callback_ident(%d), should be %d",
args->callback_ident, req->rq_prog);
#endif
/* one zeroed result slot per requested op */
resp->array_len = args->array_len;
resp->array = kmem_zalloc(args->array_len * sizeof (nfs_cb_resop4),
KM_SLEEP);
for (i = 0; i < args->array_len && cs.cont; i++) {
argop = &args->array[i];
resop = &resp->array[i];
resop->resop = argop->argop;
op = (uint_t)resop->resop;
switch (op) {
case OP_CB_GETATTR:
cb_getattr(argop, resop, req, &cs, ncg);
break;
case OP_CB_RECALL:
cb_recall(argop, resop, req, &cs, ncg);
break;
case OP_CB_ILLEGAL:
/* fall through: explicit OP_CB_ILLEGAL and unknown ops share one handler */
default:
op = OP_CB_ILLEGAL;
cb_illegal(argop, resop, req, &cs, ncg);
}
/* stop after the first op that fails */
if (*cs.statusp != NFS4_OK)
cs.cont = FALSE;
/*
 * Stopping before the last op: shrink the result array to the i+1 results
 * actually produced so array_len matches what is encoded and later freed.
 */
if ((i + 1) < args->array_len && !cs.cont) {
new_res = kmem_alloc(
(i+1) * sizeof (nfs_cb_resop4), KM_SLEEP);
bcopy(resp->array,
new_res, (i+1) * sizeof (nfs_cb_resop4));
kmem_free(resp->array,
args->array_len * sizeof (nfs_cb_resop4));
resp->array_len = i + 1;
resp->array = new_res;
}
}
}
/*
 * cb_compound_free: release everything cb_compound() allocated in a reply:
 * the copied tag, any per-operation result data, and the result array.
 */
static void
cb_compound_free(CB_COMPOUND4res *resp)
{
	uint_t idx;

	if (resp->tag.utf8string_val != NULL) {
		UTF8STRING_FREE(resp->tag)
	}

	/* let each op type release whatever it hung off its result slot */
	for (idx = 0; idx < resp->array_len; idx++) {
		nfs_cb_resop4 *result = &resp->array[idx];
		uint_t opcode = (uint_t)result->resop;

		if (opcode == OP_CB_GETATTR)
			cb_getattr_free(result);
		else if (opcode == OP_CB_RECALL)
			cb_recall_free(result);
	}

	if (resp->array == NULL)
		return;

	kmem_free(resp->array, resp->array_len * sizeof (nfs_cb_resop4));
}
/*
 * cb_dispatch: RPC dispatch routine for the callback programs (installed in
 * every callout entry by nfs4_callback_init()).
 *
 * Selects the XDR routines and handler for the requested procedure
 * (CB_NULL or CB_COMPOUND), decodes the arguments, runs the handler, sends
 * the reply, and then frees the reply and the decoded arguments.  Unknown
 * procedures are answered with svcerr_noproc().
 */
static void
cb_dispatch(struct svc_req *req, SVCXPRT *xprt)
{
CB_COMPOUND4args args;
CB_COMPOUND4res res;
struct nfs4_callback_globals *ncg;
bool_t (*xdr_args)(), (*xdr_res)();
void (*proc)(CB_COMPOUND4args *, CB_COMPOUND4res *, struct svc_req *,
struct nfs4_callback_globals *);
void (*freeproc)(CB_COMPOUND4res *);
/* per-zone callback state for the zone this request is running in */
ncg = zone_getspecific(nfs4_callback_zone_key, nfs_zone());
ASSERT(ncg != NULL);
ncg->nfs4_callback_stats.cb_dispatch.value.ui64++;
switch (req->rq_proc) {
case CB_NULL:
xdr_args = xdr_void;
xdr_res = xdr_void;
proc = cb_null;
freeproc = NULL;
break;
case CB_COMPOUND:
xdr_args = xdr_CB_COMPOUND4args_clnt;
xdr_res = xdr_CB_COMPOUND4res;
proc = cb_compound;
freeproc = cb_compound_free;
break;
default:
CB_WARN("cb_dispatch: no proc\n");
svcerr_noproc(xprt);
return;
}
/* clear the pointer fields of args before decoding into it */
args.tag.utf8string_val = NULL;
args.array = NULL;
if (!SVC_GETARGS(xprt, xdr_args, (caddr_t)&args)) {
CB_WARN("cb_dispatch: cannot getargs\n");
svcerr_decode(xprt);
return;
}
(*proc)(&args, &res, req, ncg);
if (svc_sendreply(xprt, xdr_res, (caddr_t)&res) == FALSE) {
CB_WARN("cb_dispatch: bad sendreply\n");
svcerr_systemerr(xprt);
}
/* the reply is freed whether or not it could be sent */
if (freeproc)
(*freeproc)(&res);
if (!SVC_FREEARGS(xprt, xdr_args, (caddr_t)&args)) {
CB_WARN("cb_dispatch: bad freeargs\n");
}
}
/*
 * nfs4_getnextprogram: find a free callback program number.
 *
 * Scans the zone's nfs4prog2server table, starting at nfs4_program_hint and
 * wrapping around, for an unused slot.  On success the hint is advanced
 * past the slot and NFS4_CALLBACK plus the slot index is returned; 0 is
 * returned when every slot is in use.  The slot itself is not claimed here.
 */
static rpcprog_t
nfs4_getnextprogram(struct nfs4_callback_globals *ncg)
{
	int examined = 0;
	int slot = ncg->nfs4_program_hint;

	while (examined < nfs4_num_prognums) {
		/* wrap (also covers a hint left one past the end) */
		if (slot >= nfs4_num_prognums)
			slot = 0;

		if (ncg->nfs4prog2server[slot] == NULL) {
			ncg->nfs4_program_hint = slot+1;
			return (slot+NFS4_CALLBACK);
		}

		examined++;
		slot++;
	}

	return (0);
}
/*
 * nfs4callback_destroy: give back the callback program number held by np.
 *
 * Does nothing if np has no program number (s_program == 0).  Otherwise the
 * zone's table slot is cleared under nfs4_cb_lock and the allocation hint
 * is lowered to that slot if it was above it.  np->s_program itself is left
 * unchanged.
 */
void
nfs4callback_destroy(nfs4_server_t *np)
{
	struct nfs4_callback_globals *globals;
	int slot;

	if (np->s_program != 0) {
		globals = np->zone_globals;
		slot = np->s_program - NFS4_CALLBACK;

		mutex_enter(&globals->nfs4_cb_lock);

		ASSERT(globals->nfs4prog2server[slot] == np);
		globals->nfs4prog2server[slot] = NULL;

		/* make the freed slot the first one the next search tries */
		if (globals->nfs4_program_hint > slot)
			globals->nfs4_program_hint = slot;

		mutex_exit(&globals->nfs4_cb_lock);
	}
}
/*
 * nfs4_setport: record the callback address for a transport.
 *
 * If the zone's port list already has an entry for netid, only its uaddr is
 * replaced.  Otherwise a new entry holding all four strings is allocated
 * and put at the head of the list.  The caller must hold nfs4_cb_lock.
 */
static void
nfs4_setport(char *netid, char *uaddr, char *protofmly, char *proto,
    struct nfs4_callback_globals *ncg)
{
	struct nfs4_cb_port *port;

	ASSERT(MUTEX_HELD(&ncg->nfs4_cb_lock));

	/* existing entry for this netid: just refresh the address */
	for (port = list_head(&ncg->nfs4_cb_ports); port != NULL;
	    port = list_next(&ncg->nfs4_cb_ports, port)) {
		if (strcmp(port->netid, netid) != 0)
			continue;
		(void) strcpy(port->uaddr, uaddr);
		return;
	}

	/* first time this netid is seen */
	port = kmem_alloc(sizeof (*port), KM_SLEEP);
	(void) strcpy(port->uaddr, uaddr);
	(void) strcpy(port->netid, netid);
	(void) strcpy(port->protofmly, protofmly);
	(void) strcpy(port->proto, proto);
	list_insert_head(&ncg->nfs4_cb_ports, port);
}
/*
 * nfs4_cb_args: fill in the callback portion of SETCLIENTID arguments.
 *
 * Any program number np already holds in the callback range is released
 * first.  Then, under nfs4_cb_lock, a registered callback port matching the
 * knetconfig's protocol family and protocol is looked up and a fresh
 * program number is allocated and bound to np.
 *
 * On success cb_program and callback_ident are set to the program number
 * and the location points at the port entry's netid and uaddr strings (the
 * strings are not copied).  If no port matches or no program number is
 * free, the callback fields are zeroed/NULLed instead.
 */
void
nfs4_cb_args(nfs4_server_t *np, struct knetconfig *knc, SETCLIENTID4args *args)
{
	struct nfs4_cb_port *port;
	rpcprog_t prog;
	struct nfs4_callback_globals *ncg = np->zone_globals;

	/* drop a program number left over from an earlier call */
	if (np->s_program >= NFS4_CALLBACK &&
	    np->s_program < NFS4_CALLBACK + nfs4_num_prognums)
		nfs4callback_destroy(np);

	mutex_enter(&ncg->nfs4_cb_lock);

	for (port = list_head(&ncg->nfs4_cb_ports); port != NULL;
	    port = list_next(&ncg->nfs4_cb_ports, port)) {
		if (strcmp(port->protofmly, knc->knc_protofmly) == 0 &&
		    strcmp(port->proto, knc->knc_proto) == 0)
			break;
	}

	if (port == NULL) {
		NFS4_DEBUG(nfs4_callback_debug,
		    (CE_WARN, "nfs4_cb_args: could not find netid for %s/%s\n",
		    knc->knc_protofmly, knc->knc_proto));
		goto no_callback;
	}

	prog = nfs4_getnextprogram(ncg);
	if (prog == 0) {
		CB_WARN("nfs4_cb_args: out of program numbers\n");
		goto no_callback;
	}

	/* claim the slot and advertise it to the server */
	ncg->nfs4prog2server[prog-NFS4_CALLBACK] = np;
	args->callback.cb_program = prog;
	args->callback.cb_location.r_netid = port->netid;
	args->callback.cb_location.r_addr = port->uaddr;
	args->callback_ident = prog;
	np->s_program = prog;

	mutex_exit(&ncg->nfs4_cb_lock);
	return;

no_callback:
	/* no callback path can be offered */
	args->callback.cb_program = 0;
	args->callback.cb_location.r_netid = NULL;
	args->callback.cb_location.r_addr = NULL;
	args->callback_ident = 0;
	mutex_exit(&ncg->nfs4_cb_lock);
}
/*
 * nfs4_dquery: report the delegation type held on an open file.
 *
 * The file is named by the fd member of the argument structure.  The
 * rnode's r_deleg_type is stored as a 32-bit word at the user address given
 * in the netid member.  No rnode lock is taken for the read.
 *
 * Returns EBADF if the descriptor is invalid or does not refer to a regular
 * file using nfs4_vnodeops; otherwise the result of suword32().
 */
static int
nfs4_dquery(struct nfs4_svc_args *arg, model_t model)
{
	file_t *filep;
	vnode_t *vnodep;
	int rv;
	STRUCT_HANDLE(nfs4_svc_args, uap);

	STRUCT_SET_HANDLE(uap, model, arg);

	filep = getf(STRUCT_FGET(uap, fd));
	if (filep == NULL)
		return (EBADF);

	vnodep = filep->f_vnode;
	if (vnodep != NULL && vnodep->v_type == VREG &&
	    vn_matchops(vnodep, nfs4_vnodeops)) {
		rv = suword32(STRUCT_FGETP(uap, netid),
		    VTOR4(vnodep)->r_deleg_type);
	} else {
		rv = EBADF;
	}

	releasef(STRUCT_FGET(uap, fd));
	return (rv);
}
/*
 * nfs4_svc: entry point for the NFSv4 callback service control call.
 *
 * arg is a user-space nfs4_svc_args structure interpreted according to
 * model.  Depending on the cmd member:
 *   - NFS4_DQUERY (exactly): forwarded to nfs4_dquery(); no privilege check.
 *   - NFS4_SETPORT bit: the netid/addr/protofmly/proto strings are recorded
 *     with nfs4_setport().
 *   - NFS4_KRPC_START bit: a kernel RPC transport is created on the supplied
 *     file descriptor with svc_tli_kcreate(), using the callback callout
 *     table and the caller's address mask.
 *
 * Returns 0 on success, EPERM if secpolicy_nfs() rejects the caller, EBADF
 * for a bad descriptor, EINVAL if the address mask's len exceeds its
 * maxlen, or the error from copyin/copyinstr/svc_tli_kcreate.
 *
 * The address-mask buffer is freed here on every failure path.  It is not
 * freed after a successful svc_tli_kcreate().
 * NOTE(review): presumably the transport keeps the buffer on success --
 * confirm against svc_tli_kcreate().
 */
int
nfs4_svc(struct nfs4_svc_args *arg, model_t model)
{
	file_t *fp;
	int error;
	int readsize;
	char buf[KNC_STRSIZE], uaddr[KNC_STRSIZE];
	char protofmly[KNC_STRSIZE], proto[KNC_STRSIZE];
	size_t len;
	STRUCT_HANDLE(nfs4_svc_args, uap);
	struct netbuf addrmask;
	int cmd;
	SVCMASTERXPRT *cb_xprt;
	struct nfs4_callback_globals *ncg;

#ifdef lint
	model = model;
#endif
	STRUCT_SET_HANDLE(uap, model, arg);

	if (STRUCT_FGET(uap, cmd) == NFS4_DQUERY)
		return (nfs4_dquery(arg, model));

	if (secpolicy_nfs(CRED()) != 0)
		return (EPERM);

	if ((fp = getf(STRUCT_FGET(uap, fd))) == NULL)
		return (EBADF);

	/* read size: nfs3tsize() plus header room, at least RPC_MAXDATASIZE */
	readsize = nfs3tsize() + (RPC_MAXDATASIZE - NFS_MAXDATA);
	if (readsize < RPC_MAXDATASIZE)
		readsize = RPC_MAXDATASIZE;

	/* nothing allocated yet; lets the common failure path test buf */
	addrmask.buf = NULL;
	addrmask.len = 0;
	addrmask.maxlen = 0;

	error = copyinstr((const char *)STRUCT_FGETP(uap, netid), buf,
	    KNC_STRSIZE, &len);
	if (error)
		goto fail;

	cmd = STRUCT_FGET(uap, cmd);

	if (cmd & NFS4_KRPC_START) {
		addrmask.len = STRUCT_FGET(uap, addrmask.len);
		addrmask.maxlen = STRUCT_FGET(uap, addrmask.maxlen);

		/*
		 * Both lengths come from user space.  The buffer is sized by
		 * maxlen but filled with len bytes, so a len larger than
		 * maxlen would write past the end of the allocation.
		 */
		if (addrmask.len > addrmask.maxlen) {
			error = EINVAL;
			goto fail;
		}

		addrmask.buf = kmem_alloc(addrmask.maxlen, KM_SLEEP);
		error = copyin(STRUCT_FGETP(uap, addrmask.buf), addrmask.buf,
		    addrmask.len);
		if (error)
			goto fail;
	}

	error = copyinstr((const char *)STRUCT_FGETP(uap, addr), uaddr,
	    sizeof (uaddr), &len);
	if (error)
		goto fail;

	error = copyinstr((const char *)STRUCT_FGETP(uap, protofmly), protofmly,
	    sizeof (protofmly), &len);
	if (error)
		goto fail;

	error = copyinstr((const char *)STRUCT_FGETP(uap, proto), proto,
	    sizeof (proto), &len);
	if (error)
		goto fail;

	ncg = zone_getspecific(nfs4_callback_zone_key, nfs_zone());
	ASSERT(ncg != NULL);

	mutex_enter(&ncg->nfs4_cb_lock);

	if (cmd & NFS4_SETPORT)
		nfs4_setport(buf, uaddr, protofmly, proto, ncg);

	if (cmd & NFS4_KRPC_START) {
		error = svc_tli_kcreate(fp, readsize, buf, &addrmask, &cb_xprt,
		    &nfs4_cb_sct, NULL, NFS_CB_SVCPOOL_ID, FALSE);
		if (error) {
			CB_WARN1("nfs4_svc: svc_tli_kcreate failed %d\n",
			    error);
			kmem_free(addrmask.buf, addrmask.maxlen);
		}
	}

	mutex_exit(&ncg->nfs4_cb_lock);
	releasef(STRUCT_FGET(uap, fd));
	return (error);

fail:
	/* common exit for failures before the callback lock is taken */
	if (addrmask.buf != NULL)
		kmem_free(addrmask.buf, addrmask.maxlen);
	releasef(STRUCT_FGET(uap, fd));
	return (error);
}
/*
 * nfs4_get_callback_globals: return the callback globals registered under
 * nfs4_callback_zone_key for the zone returned by nfs_zone().
 */
struct nfs4_callback_globals *
nfs4_get_callback_globals(void)
{
	struct nfs4_callback_globals *globals;

	globals = zone_getspecific(nfs4_callback_zone_key, nfs_zone());
	return (globals);
}
/*
 * nfs4_callback_init_zone: zone-key create callback.
 *
 * Allocates and initialises the callback globals for a zone: the
 * program-number table, the delegation-return list and the callback port
 * list (each with its lock), and the kstat counters.  The counters are
 * exported as the "nfs4_callback_stats" kstat when it can be created.
 * Returns the new globals.
 */
static void *
nfs4_callback_init_zone(zoneid_t zoneid)
{
	struct nfs4_callback_globals *globals;
	kstat_t *ksp;

	globals = kmem_zalloc(sizeof (*globals), KM_SLEEP);

	/* one slot per callback program number, all initially free */
	globals->nfs4prog2server = kmem_zalloc(nfs4_num_prognums *
	    sizeof (struct nfs4_server *), KM_SLEEP);

	/* list of pending delegation returns */
	mutex_init(&globals->nfs4_dlist_lock, NULL, MUTEX_DEFAULT, NULL);
	list_create(&globals->nfs4_dlist, sizeof (struct nfs4_dnode),
	    offsetof(struct nfs4_dnode, linkage));

	/* list of registered callback ports */
	mutex_init(&globals->nfs4_cb_lock, NULL, MUTEX_DEFAULT, NULL);
	list_create(&globals->nfs4_cb_ports, sizeof (struct nfs4_cb_port),
	    offsetof(struct nfs4_cb_port, linkage));

	/* start the counters from the template and publish them */
	bcopy(&nfs4_callback_stats_tmpl, &globals->nfs4_callback_stats,
	    sizeof (nfs4_callback_stats_tmpl));

	ksp = kstat_create_zone("nfs", 0, "nfs4_callback_stats", "misc",
	    KSTAT_TYPE_NAMED,
	    sizeof (globals->nfs4_callback_stats) / sizeof (kstat_named_t),
	    KSTAT_FLAG_VIRTUAL | KSTAT_FLAG_WRITABLE,
	    zoneid);
	if (ksp != NULL) {
		ksp->ks_data = &globals->nfs4_callback_stats;
		kstat_install(ksp);
	}

	return (globals);
}
/*
 * nfs4_discard_delegations: throw away every delegation held from every
 * server that has a slot in this zone's program table.
 *
 * For each server that nfs4_server_vlock() can lock, the delegation list is
 * drained: entries that no longer carry a delegation are unlinked here,
 * and the rest are passed to nfs4delegreturn_cleanup_impl().
 */
static void
nfs4_discard_delegations(struct nfs4_callback_globals *ncg)
{
nfs4_server_t *sp;
int i, num_removed;
for (i = 0; i < nfs4_num_prognums; i++) {
rnode4_t *rp;
mutex_enter(&ncg->nfs4_cb_lock);
sp = ncg->nfs4prog2server[i];
mutex_exit(&ncg->nfs4_cb_lock);
/* skip empty slots and servers that cannot be locked */
if (nfs4_server_vlock(sp, 1) == FALSE)
continue;
/* sp->s_lock is held from here */
num_removed = 0;
while ((rp = list_head(&sp->s_deleg_list)) != NULL) {
mutex_enter(&rp->r_statev4_lock);
if (rp->r_deleg_type == OPEN_DELEGATE_NONE) {
/*
 * nfs4delegreturn_cleanup_impl() returns early without touching the list
 * when the type is already OPEN_DELEGATE_NONE, so unlink the entry here.
 */
list_remove(&sp->s_deleg_list, rp);
mutex_exit(&rp->r_statev4_lock);
nfs4_dec_state_ref_count_nolock(sp,
VTOMI4(RTOV4(rp)));
num_removed++;
continue;
}
mutex_exit(&rp->r_statev4_lock);
/* keep the vnode alive across the unlocked cleanup call */
VN_HOLD(RTOV4(rp));
/* nfs4delegreturn_cleanup_impl() takes s_lock itself when given a server */
mutex_exit(&sp->s_lock);
/* this call removes rp from the list */
nfs4delegreturn_cleanup_impl(rp, sp, ncg);
VN_RELE(RTOV4(rp));
mutex_enter(&sp->s_lock);
}
mutex_exit(&sp->s_lock);
/*
 * One release per entry unlinked above, mirroring the release that
 * nfs4delegreturn_cleanup_impl() performs after its own list_remove().
 */
while (num_removed-- > 0)
nfs4_server_rele(sp);
/* NOTE(review): presumably pairs with a reference taken by nfs4_server_vlock() */
nfs4_server_rele(sp);
}
}
/*
 * nfs4_callback_shutdown_zone: zone-key shutdown callback.
 *
 * Cleans the zone's pending delegation-return list in NFS4_DR_DISCARD mode
 * and then discards all delegations held by the zone's servers.
 * The zoneid argument is not used.
 */
static void
nfs4_callback_shutdown_zone(zoneid_t zoneid, void *data)
{
	struct nfs4_callback_globals *globals;

	globals = data;

	nfs4_dlistclean_impl(globals, NFS4_DR_DISCARD);
	nfs4_discard_delegations(globals);
}
/*
 * nfs4_callback_fini_zone: zone-key destroy callback.
 *
 * Removes the zone's callback kstat, discards any remaining delegations,
 * releases a reference on every nfs4_server belonging to the zone, and then
 * frees all per-zone callback state, including the globals themselves.
 */
static void
nfs4_callback_fini_zone(zoneid_t zoneid, void *data)
{
struct nfs4_callback_globals *ncg = data;
struct nfs4_cb_port *p;
nfs4_server_t *sp, *next;
/* used only as the head (forw/back) of a temporary list */
nfs4_server_t freelist;
int i;
kstat_delete_byname_zone("nfs", 0, "nfs4_callback_stats", zoneid);
/* same discard pass as nfs4_callback_shutdown_zone(), run again here */
nfs4_discard_delegations(ncg);
/*
 * Walk the global server list (not just the program table) and move every
 * server belonging to this zone onto a private list, so the releases below
 * can run without nfs4_server_lst_lock held.
 */
freelist.forw = &freelist;
freelist.back = &freelist;
mutex_enter(&nfs4_server_lst_lock);
sp = nfs4_server_lst.forw;
while (sp != &nfs4_server_lst) {
next = sp->forw;
if (sp->zoneid == zoneid) {
remque(sp);
insque(sp, &freelist);
}
sp = next;
}
mutex_exit(&nfs4_server_lst_lock);
sp = freelist.forw;
while (sp != &freelist) {
/* fetch the successor before releasing sp */
next = sp->forw;
nfs4_server_rele(sp);
sp = next;
}
#ifdef DEBUG
/* every program slot is expected to have been released by now */
for (i = 0; i < nfs4_num_prognums; i++) {
ASSERT(ncg->nfs4prog2server[i] == NULL);
}
#endif
kmem_free(ncg->nfs4prog2server, nfs4_num_prognums *
sizeof (struct nfs4_server *));
/* free the registered callback ports; the lock is destroyed while still held */
mutex_enter(&ncg->nfs4_cb_lock);
while ((p = list_head(&ncg->nfs4_cb_ports)) != NULL) {
list_remove(&ncg->nfs4_cb_ports, p);
kmem_free(p, sizeof (*p));
}
list_destroy(&ncg->nfs4_cb_ports);
mutex_destroy(&ncg->nfs4_cb_lock);
list_destroy(&ncg->nfs4_dlist);
mutex_destroy(&ncg->nfs4_dlist_lock);
kmem_free(ncg, sizeof (*ncg));
}
void
nfs4_callback_init(void)
{
int i;
SVC_CALLOUT *nfs4_cb_sc;
nfs4_cb_sc = kmem_alloc(nfs4_num_prognums *
sizeof (SVC_CALLOUT), KM_SLEEP);
for (i = 0; i < nfs4_num_prognums; i++) {
nfs4_cb_sc[i].sc_prog = NFS4_CALLBACK+i;
nfs4_cb_sc[i].sc_versmin = NFS_CB;
nfs4_cb_sc[i].sc_versmax = NFS_CB;
nfs4_cb_sc[i].sc_dispatch = cb_dispatch;
}
nfs4_cb_sct.sct_size = nfs4_num_prognums;
nfs4_cb_sct.sct_free = FALSE;
nfs4_cb_sct.sct_sc = nfs4_cb_sc;
cb_getattr_bytes = 2 * BYTES_PER_XDR_UNIT + 2 * BYTES_PER_XDR_UNIT;
zone_key_create(&nfs4_callback_zone_key, nfs4_callback_init_zone,
nfs4_callback_shutdown_zone, nfs4_callback_fini_zone);
}
/*
 * nfs4_callback_fini: counterpart of nfs4_callback_init().  Currently a
 * no-op: nothing set up by nfs4_callback_init() (the callout table, the
 * zone key) is torn down here.
 */
void
nfs4_callback_fini(void)
{
}
/*
 * nfs4delegreturn_cleanup_impl: clear the delegation state on an rnode and
 * unlink it from its server's delegation list.
 *
 * rp  - rnode whose delegation is being dropped.
 * np  - owning server, or NULL to have it looked up from rp's mount.  When
 *       non-NULL, s_lock is taken here, so the caller must not hold it.
 * ncg - callback globals whose "delegations" counter is decremented; may be
 *       NULL, in which case the counter is left alone.
 *
 * Lock order is np->s_lock first, then rp->r_statev4_lock.  Does nothing if
 * no server is found or the rnode has no delegation.
 * NOTE(review): callers in this file that are not already inside a
 * start_fop take mi_recovlock as reader around this call; presumably that
 * is required -- confirm.
 */
static void
nfs4delegreturn_cleanup_impl(rnode4_t *rp, nfs4_server_t *np,
struct nfs4_callback_globals *ncg)
{
mntinfo4_t *mi = VTOMI4(RTOV4(rp));
boolean_t need_rele = B_FALSE;
if (np == NULL) {
/*
 * NOTE(review): the paths below drop np->s_lock and release np when
 * need_rele is set, so find_nfs4_server_all() presumably returns with
 * s_lock held and a reference taken -- confirm.
 */
np = find_nfs4_server_all(mi, 1);
if (np == NULL)
return;
need_rele = B_TRUE;
} else {
mutex_enter(&np->s_lock);
}
mutex_enter(&rp->r_statev4_lock);
/* already cleaned up: undo the locking and bail */
if (rp->r_deleg_type == OPEN_DELEGATE_NONE) {
mutex_exit(&rp->r_statev4_lock);
mutex_exit(&np->s_lock);
if (need_rele)
nfs4_server_rele(np);
return;
}
/*
 * Drop the credential reference stored with the delegation.  A caller that
 * still needs the cred must hold its own reference.
 */
crfree(rp->r_deleg_cred);
rp->r_deleg_cred = NULL;
rp->r_deleg_type = OPEN_DELEGATE_NONE;
rp->r_deleg_needs_recovery = OPEN_DELEGATE_NONE;
rp->r_deleg_needs_recall = FALSE;
rp->r_deleg_return_pending = FALSE;
/* unlink from the server's delegation list and update the ref counts */
list_remove(&np->s_deleg_list, rp);
mutex_exit(&rp->r_statev4_lock);
nfs4_dec_state_ref_count_nolock(np, mi);
mutex_exit(&np->s_lock);
/* release accompanying the removal of the list entry */
nfs4_server_rele(np);
/* second release: only when the server was looked up above */
if (need_rele)
nfs4_server_rele(np);
if (ncg != NULL)
ncg->nfs4_callback_stats.delegations.value.ui64--;
}
/*
 * nfs4delegreturn_cleanup: public wrapper around
 * nfs4delegreturn_cleanup_impl() that works out which callback globals to
 * account the cleanup against.
 *
 * With a server supplied, the server's zone globals are used.  Without
 * one, the current zone's globals are used if the rnode's mount belongs to
 * the current zone; otherwise the caller is asserted to be in the global
 * zone and no globals are passed (no statistics update).
 */
void
nfs4delegreturn_cleanup(rnode4_t *rp, nfs4_server_t *np)
{
	struct nfs4_callback_globals *globals;

	if (np != NULL) {
		nfs4delegreturn_cleanup_impl(rp, np, np->zone_globals);
		return;
	}

	if (nfs_zone() != VTOMI4(RTOV4(rp))->mi_zone) {
		/* mount belongs to another zone */
		ASSERT(getzoneid() == GLOBAL_ZONEID);
		nfs4delegreturn_cleanup_impl(rp, NULL, NULL);
		return;
	}

	globals = zone_getspecific(nfs4_callback_zone_key, nfs_zone());
	ASSERT(globals != NULL);
	nfs4delegreturn_cleanup_impl(rp, NULL, globals);
}
/*
 * nfs4delegreturn_save_lost_rqst: decide whether a failed DELEGRETURN
 * should be recorded as a lost request and, if so, fill in *lost_rqstp.
 *
 * error      - errno-style result of the attempt.
 * lost_rqstp - record to fill in.
 * cr, vp     - credential and vnode stored in the record; no additional
 *              hold is taken on either here.
 *
 * Only ETIMEDOUT, EINTR and errors matched by NFS4_FRC_UNMT_ERR() qualify.
 * For any other error lr_op is set to 0 and nothing else is touched;
 * callers test lr_op == OP_DELEGRETURN to see whether the record is valid.
 */
static void
nfs4delegreturn_save_lost_rqst(int error, nfs4_lost_rqst_t *lost_rqstp,
    cred_t *cr, vnode_t *vp)
{
	if (error != ETIMEDOUT && error != EINTR &&
	    !NFS4_FRC_UNMT_ERR(error, vp->v_vfsp)) {
		lost_rqstp->lr_op = 0;
		return;
	}

	/* the message names this function (it used to say nfs4close_...) */
	NFS4_DEBUG(nfs4_lost_rqst_debug, (CE_NOTE,
	    "nfs4delegreturn_save_lost_rqst: error %d", error));

	lost_rqstp->lr_op = OP_DELEGRETURN;
	lost_rqstp->lr_vp = vp;
	lost_rqstp->lr_dvp = NULL;
	lost_rqstp->lr_oop = NULL;
	lost_rqstp->lr_osp = NULL;
	lost_rqstp->lr_lop = NULL;
	lost_rqstp->lr_cr = cr;
	lost_rqstp->lr_flk = NULL;
	lost_rqstp->lr_putfirst = FALSE;
}
/*
 * nfs4delegreturn_otw: send the DELEGRETURN compound for rp over the wire.
 *
 * The compound is PUTFH, GETATTR, DELEGRETURN, issued with credential cr;
 * the outcome of the call is reported through *ep.  If the call itself
 * fails (ep->error set) the function returns immediately.  If the compound
 * succeeds, the attributes returned by GETATTR are fed to the attribute
 * cache.
 */
static void
nfs4delegreturn_otw(rnode4_t *rp, cred_t *cr, nfs4_error_t *ep)
{
COMPOUND4args_clnt args;
COMPOUND4res_clnt res;
nfs_argop4 argops[3];
nfs4_ga_res_t *garp = NULL;
hrtime_t t;
int numops;
int doqueue = 1;
args.ctag = TAG_DELEGRETURN;
/* PUTFH, GETATTR, DELEGRETURN */
numops = 3;
args.array = argops;
args.array_len = numops;
argops[0].argop = OP_CPUTFH;
argops[0].nfs_argop4_u.opcputfh.sfh = rp->r_fh;
argops[1].argop = OP_GETATTR;
argops[1].nfs_argop4_u.opgetattr.attr_request = NFS4_VATTR_MASK;
argops[1].nfs_argop4_u.opgetattr.mi = VTOMI4(RTOV4(rp));
argops[2].argop = OP_DELEGRETURN;
argops[2].nfs_argop4_u.opdelegreturn.deleg_stateid =
rp->r_deleg_stateid;
/* timestamp taken before the call; passed to nfs4_attr_cache() below */
t = gethrtime();
rfs4call(VTOMI4(RTOV4(rp)), &args, &res, cr, &doqueue, 0, ep);
/* on a call failure res is not examined or freed here */
if (ep->error)
return;
if (res.status == NFS4_OK) {
/* index 1 is the GETATTR result */
garp = &res.array[1].nfs_resop4_u.opgetattr.ga_res;
nfs4_attr_cache(RTOV4(rp), garp, t, cr, TRUE, NULL);
}
xdr_free(xdr_COMPOUND4res_clnt, (caddr_t)&res);
}
/*
 * nfs4_do_delegreturn: return the delegation held on rp to the server,
 * retrying across recovery as needed.
 *
 * rp    - rnode holding the delegation.
 * flags - NFS4_DR_* flags; only NFS4_DR_FORCE is examined here.
 * cr    - credential used for the over-the-wire call and stored in any
 *         lost-request record.
 * ncg   - callback globals (statistics).
 *
 * Returns the errno-style value from the last step performed (e.error).
 */
int
nfs4_do_delegreturn(rnode4_t *rp, int flags, cred_t *cr,
struct nfs4_callback_globals *ncg)
{
vnode_t *vp = RTOV4(rp);
mntinfo4_t *mi = VTOMI4(vp);
nfs4_lost_rqst_t lost_rqst;
nfs4_recov_state_t recov_state;
bool_t needrecov = FALSE, recovonly, done = FALSE;
nfs4_error_t e = { 0, NFS4_OK, RPC_SUCCESS };
ncg->nfs4_callback_stats.delegreturn.value.ui64++;
while (!done) {
e.error = nfs4_start_fop(mi, vp, NULL, OH_DELEGRETURN,
&recov_state, &recovonly);
if (e.error) {
/*
 * Could not start the operation.  With NFS4_DR_FORCE the local delegation
 * state is discarded anyway, under mi_recovlock held as reader.
 */
if (flags & NFS4_DR_FORCE) {
(void) nfs_rw_enter_sig(&mi->mi_recovlock,
RW_READER, 0);
nfs4delegreturn_cleanup_impl(rp, NULL, ncg);
nfs_rw_exit(&mi->mi_recovlock);
}
break;
}
/* the delegation is already gone: nothing left to return */
if (rp->r_deleg_type == OPEN_DELEGATE_NONE) {
e.error = 0;
nfs4_end_op(mi, vp, NULL, &recov_state, needrecov);
break;
}
if (recovonly) {
/*
 * nfs4_start_fop() set recovonly: do not go over the wire.  Queue the
 * DELEGRETURN as a lost request (EINTR qualifies in
 * nfs4delegreturn_save_lost_rqst()), start recovery, and return EINTR.
 */
nfs4_error_init(&e, EINTR);
nfs4delegreturn_save_lost_rqst(e.error, &lost_rqst,
cr, vp);
(void) nfs4_start_recovery(&e, mi, vp,
NULL, &rp->r_deleg_stateid,
lost_rqst.lr_op == OP_DELEGRETURN ?
&lost_rqst : NULL, OP_DELEGRETURN, NULL,
NULL, NULL);
nfs4_end_op(mi, vp, NULL, &recov_state, needrecov);
break;
}
nfs4delegreturn_otw(rp, cr, &e);
/*
 * Some NFS statuses are not worth recovering from for DELEGRETURN: those
 * for which nfs4_recov_marks_dead() is true, plus BADHANDLE and STALE.
 * Treat them as final and fall through to the local cleanup.
 */
if (e.error == 0 && (nfs4_recov_marks_dead(e.stat) ||
e.stat == NFS4ERR_BADHANDLE ||
e.stat == NFS4ERR_STALE))
needrecov = FALSE;
else
needrecov = nfs4_needs_recovery(&e, TRUE, vp->v_vfsp);
if (needrecov) {
/* start recovery and go around the loop again */
nfs4delegreturn_save_lost_rqst(e.error, &lost_rqst,
cr, vp);
(void) nfs4_start_recovery(&e, mi, vp,
NULL, &rp->r_deleg_stateid,
lost_rqst.lr_op == OP_DELEGRETURN ?
&lost_rqst : NULL, OP_DELEGRETURN, NULL,
NULL, NULL);
} else {
/* finished, successfully or not: drop the local delegation state */
nfs4delegreturn_cleanup_impl(rp, NULL, ncg);
done = TRUE;
}
nfs4_end_op(mi, vp, NULL, &recov_state, needrecov);
}
return (e.error);
}
/*
 * nfs4_resend_delegreturn: re-drive a DELEGRETURN recorded as a lost
 * request.
 *
 * lorp - lost-request record; supplies the vnode and credential.
 * ep   - in/out error state.  A non-zero ep->error on entry suppresses the
 *        over-the-wire attempt.
 * np   - server passed through to nfs4delegreturn_cleanup().
 *
 * If the rnode is flagged R4RECOVERR, ep->error becomes EIO and nothing is
 * sent.  If the resulting error state calls for recovery, it is returned to
 * the caller unchanged.  Otherwise any remaining delegation is cleaned up
 * locally and *ep is reset with nfs4_error_zinit().
 */
void
nfs4_resend_delegreturn(nfs4_lost_rqst_t *lorp, nfs4_error_t *ep,
    nfs4_server_t *np)
{
	vnode_t *lost_vp = lorp->lr_vp;
	rnode4_t *rp = VTOR4(lost_vp);

	mutex_enter(&rp->r_statelock);
	if (rp->r_flags & R4RECOVERR)
		ep->error = EIO;
	mutex_exit(&rp->r_statelock);

	if (ep->error == 0)
		nfs4delegreturn_otw(rp, lorp->lr_cr, ep);

	if (!nfs4_needs_recovery(ep, TRUE, lorp->lr_vp->v_vfsp)) {
		/* no recovery needed: clean up locally and clear the error */
		if (rp->r_deleg_type != OPEN_DELEGATE_NONE)
			nfs4delegreturn_cleanup(rp, np);

		nfs4_error_zinit(ep);
	}
}
/*
 * nfs4delegreturn_impl: return (or discard) the delegation held on rp.
 *
 * flags is a combination of NFS4_DR_* bits:
 *   NFS4_DR_DISCARD alone - drop the local state immediately, with none of
 *                           the locking or over-the-wire work below.
 *   NFS4_DR_DID_OP        - hand the work to nfs4delegreturn_async() and
 *                           return at once.
 *   NFS4_DR_PUSH          - VOP_PUTPAGE the file first.
 *   NFS4_DR_REOPEN        - reopen the delegation's open streams first.
 *   NFS4_DR_DISCARD with other bits - drop the local state instead of
 *                           sending DELEGRETURN.
 *   NFS4_DR_FORCE / NFS4_DR_RECALL - keep going after reopen failures.
 *
 * Returns 0, or the error from deleg_reopen() / nfs4_do_delegreturn().
 */
static int
nfs4delegreturn_impl(rnode4_t *rp, int flags, struct nfs4_callback_globals *ncg)
{
int error = 0;
cred_t *cr = NULL;
vnode_t *vp;
bool_t needrecov = FALSE;
bool_t rw_entered = FALSE;
bool_t do_reopen;
vp = RTOV4(rp);
/* short-cut: NFS4_DR_DISCARD with no other flag set */
if (flags == NFS4_DR_DISCARD) {
nfs4delegreturn_cleanup_impl(rp, NULL, ncg);
return (0);
}
if (flags & NFS4_DR_DID_OP) {
/*
 * Return the delegation asynchronously.  The flag is stripped so the
 * thread does not come back through this branch.
 * NOTE(review): the VN_HOLD is not released in this function; presumably
 * the async thread drops it -- confirm.
 */
VN_HOLD(vp);
nfs4delegreturn_async(rp, (flags & ~NFS4_DR_DID_OP), FALSE);
return (0);
}
/* check that a delegation still exists and take our own cred reference */
mutex_enter(&rp->r_statev4_lock);
if (rp->r_deleg_type == OPEN_DELEGATE_NONE) {
mutex_exit(&rp->r_statev4_lock);
goto out;
}
cr = rp->r_deleg_cred;
ASSERT(cr != NULL);
crhold(cr);
mutex_exit(&rp->r_statev4_lock);
/* push the file's pages before giving the delegation back; result ignored */
if (flags & NFS4_DR_PUSH)
(void) VOP_PUTPAGE(vp, 0, 0, 0, cr, NULL);
/* hold r_deleg_recall_lock as writer for the rest of the return */
(void) nfs_rw_enter_sig(&rp->r_deleg_recall_lock, RW_WRITER, FALSE);
rw_entered = TRUE;
/* re-check: the delegation may have gone away before the lock was obtained */
if (rp->r_deleg_type == OPEN_DELEGATE_NONE)
goto out;
if (flags & NFS4_DR_REOPEN) {
/* skip the reopen step when R4RECOVERRP is already set on the rnode */
mutex_enter(&rp->r_statelock);
do_reopen = !(rp->r_flags & R4RECOVERRP);
mutex_exit(&rp->r_statelock);
if (do_reopen) {
error = deleg_reopen(vp, &needrecov, ncg, flags);
/*
 * A reopen error stops here unless FORCE or RECALL is set; a reopen that
 * started recovery stops here unless FORCE is set.
 */
if (error != 0) {
if ((flags & (NFS4_DR_FORCE | NFS4_DR_RECALL))
== 0)
goto out;
} else if (needrecov) {
if ((flags & NFS4_DR_FORCE) == 0)
goto out;
}
}
}
if (flags & NFS4_DR_DISCARD) {
mntinfo4_t *mi = VTOMI4(RTOV4(rp));
/*
 * Discard only while r_deleg_return_pending is still set.
 * NOTE(review): a cleared flag presumably means a new delegation has been
 * accepted in the meantime -- confirm against the code that clears it.
 */
mutex_enter(&rp->r_statelock);
if (!rp->r_deleg_return_pending) {
mutex_exit(&rp->r_statelock);
goto out;
}
mutex_exit(&rp->r_statelock);
(void) nfs_rw_enter_sig(&mi->mi_recovlock, RW_READER, FALSE);
nfs4delegreturn_cleanup_impl(rp, NULL, ncg);
nfs_rw_exit(&mi->mi_recovlock);
} else {
error = nfs4_do_delegreturn(rp, flags, cr, ncg);
}
out:
/* common exit: drop the cred reference and the recall lock if taken */
if (cr)
crfree(cr);
if (rw_entered)
nfs_rw_exit(&rp->r_deleg_recall_lock);
return (error);
}
/*
 * nfs4delegreturn: return the delegation on rp according to the NFS4_DR_*
 * flags, using the callback globals of the zone returned by nfs_zone().
 * Returns the result of nfs4delegreturn_impl().
 */
int
nfs4delegreturn(rnode4_t *rp, int flags)
{
	struct nfs4_callback_globals *globals =
	    zone_getspecific(nfs4_callback_zone_key, nfs_zone());

	ASSERT(globals != NULL);

	return (nfs4delegreturn_impl(rp, flags, globals));
}
/*
 * nfs4delegreturn_async: return the delegation on rp from a separate
 * thread.
 *
 * The arguments are packed into a freshly allocated cb_recall_pass and a
 * zone thread running nfs4delegreturn_thread() is created to consume it.
 * The allocation is not freed here; ownership passes to the new thread.
 */
void
nfs4delegreturn_async(rnode4_t *rp, int flags, bool_t trunc)
{
	struct cb_recall_pass *pass;

	pass = kmem_alloc(sizeof (*pass), KM_SLEEP);
	pass->truncate = trunc;
	pass->flags = flags;
	pass->rp = rp;

	(void) zthread_create(NULL, 0, nfs4delegreturn_thread, pass, 0,
	    minclsyspri);
}
/*
 * delegreturn_all_thread: thread body that returns every delegation held
 * from one server.
 *
 * pp points to a kmem-allocated rpcprog_t identifying the server by its
 * callback program number; it is freed here.  The server is looked up on
 * the global server list by zone and program number.  If it is not found
 * there is nothing to do.  Otherwise each rnode at the head of the server's
 * delegation list is returned with NFS4_DR_PUSH|NFS4_DR_REOPEN until the
 * list is empty.  The thread ends with zthread_exit().
 */
static void
delegreturn_all_thread(rpcprog_t *pp)
{
	nfs4_server_t *np;
	bool_t found = FALSE;
	rpcprog_t prog;
	rnode4_t *rp;
	vnode_t *vp;
	zoneid_t zoneid = getzoneid();
	struct nfs4_callback_globals *ncg;

	NFS4_DEBUG(nfs4_drat_debug,
	    (CE_NOTE, "delegreturn_all_thread: prog %d\n", *pp));

	/* take a copy of the argument and free the caller's allocation */
	prog = *pp;
	kmem_free(pp, sizeof (*pp));
	pp = NULL;

	mutex_enter(&nfs4_server_lst_lock);
	for (np = nfs4_server_lst.forw; np != &nfs4_server_lst; np = np->forw) {
		if (np->zoneid == zoneid && np->s_program == prog) {
			/* leave the loop with np->s_lock held */
			mutex_enter(&np->s_lock);
			found = TRUE;
			break;
		}
	}
	mutex_exit(&nfs4_server_lst_lock);

	/* no server is registered under this program number any more */
	if (!found)
		goto out;

	ncg = np->zone_globals;
	while ((rp = list_head(&np->s_deleg_list)) != NULL) {
		vp = RTOV4(rp);
		VN_HOLD(vp);
		/* s_lock is dropped around the return itself */
		mutex_exit(&np->s_lock);
		(void) nfs4delegreturn_impl(rp, NFS4_DR_PUSH|NFS4_DR_REOPEN,
		    ncg);
		VN_RELE(vp);

		/* retake s_lock for the next look at the list */
		mutex_enter(&np->s_lock);
	}
	mutex_exit(&np->s_lock);

out:
	NFS4_DEBUG(nfs4_drat_debug,
	    (CE_NOTE, "delegreturn_all_thread: complete\n"));
	zthread_exit();
}
/*
 * nfs4_delegreturn_all: start returning every delegation held from sp.
 *
 * Does nothing if the server's delegation list is empty.  Otherwise the
 * server's callback program number is copied into a small allocation and a
 * zone thread running delegreturn_all_thread() is created to do the work;
 * that thread frees the allocation.
 */
void
nfs4_delegreturn_all(nfs4_server_t *sp)
{
	rpcprog_t prog, *thread_arg;
	int have_delegations;

	/* sample the list state and program number under s_lock */
	mutex_enter(&sp->s_lock);
	have_delegations = (list_head(&sp->s_deleg_list) != NULL);
	prog = sp->s_program;
	mutex_exit(&sp->s_lock);

	if (!have_delegations)
		return;

	thread_arg = kmem_alloc(sizeof (rpcprog_t), KM_SLEEP);
	*thread_arg = prog;

	(void) zthread_create(NULL, 0, delegreturn_all_thread, thread_arg, 0,
	    minclsyspri);
}
/*
 * nfs4_deleg_discard: discard, without contacting the server, every
 * delegation on sp's list that belongs to mount mi.
 *
 * The caller must hold sp->s_lock.  Each matching rnode has its delegation
 * state cleared and is unlinked from the list; the server's reference
 * count, state reference count and the "delegations" statistic are all
 * decremented per discarded delegation.  Matching delegations are asserted
 * to be read delegations.
 */
void
nfs4_deleg_discard(mntinfo4_t *mi, nfs4_server_t *sp)
{
rnode4_t *rp, *next;
mntinfo4_t *r_mi;
struct nfs4_callback_globals *ncg;
ASSERT(mutex_owned(&sp->s_lock));
ncg = sp->zone_globals;
for (rp = list_head(&sp->s_deleg_list); rp != NULL; rp = next) {
r_mi = VTOMI4(RTOV4(rp));
/* fetch the successor first: rp may be unlinked below */
next = list_next(&sp->s_deleg_list, rp);
/* only delegations belonging to the given mount are discarded */
if (r_mi != mi) {
continue;
}
ASSERT(rp->r_deleg_type == OPEN_DELEGATE_READ);
#ifdef DEBUG
if (nfs4_client_recov_debug) {
zprintf(getzoneid(),
"nfs4_deleg_discard: matched rnode %p "
"-- discarding delegation\n", (void *)rp);
}
#endif
mutex_enter(&rp->r_statev4_lock);
/* drop the credential reference stored with the delegation, if any */
if (rp->r_deleg_cred)
crfree(rp->r_deleg_cred);
rp->r_deleg_cred = NULL;
rp->r_deleg_type = OPEN_DELEGATE_NONE;
rp->r_deleg_needs_recovery = OPEN_DELEGATE_NONE;
rp->r_deleg_needs_recall = FALSE;
/*
 * s_lock is already held, so the count is decremented directly instead of
 * through nfs4_server_rele(); at least one other reference must remain.
 */
ASSERT(sp->s_refcnt > 1);
sp->s_refcnt--;
list_remove(&sp->s_deleg_list, rp);
mutex_exit(&rp->r_statev4_lock);
nfs4_dec_state_ref_count_nolock(sp, mi);
ncg->nfs4_callback_stats.delegations.value.ui64--;
}
}
/*
 * Reopen the open streams of vp that get_next_deleg_stream() selects.
 *
 * vp      - vnode whose open streams are to be reopened
 * recovp  - set to TRUE only when this function starts recovery; it is
 *           not written on any other path
 * ncg     - per-zone callback globals, used for statistics counters
 * flags   - only NFS4_DR_DISCARD is examined here; when set, streams are
 *           reopened with CLAIM_NULL instead of CLAIM_DELEGATE_CUR
 *
 * Returns the error from nfs4_start_op() if that fails, otherwise the
 * e.error value left by the last nfs4_reopen() call (0 if no stream was
 * processed).
 */
static int
deleg_reopen(vnode_t *vp, bool_t *recovp, struct nfs4_callback_globals *ncg,
int flags)
{
nfs4_open_stream_t *osp;
nfs4_recov_state_t recov_state;
bool_t needrecov = FALSE;
mntinfo4_t *mi;
rnode4_t *rp;
nfs4_error_t e = { 0, NFS4_OK, RPC_SUCCESS };
int claimnull;
mi = VTOMI4(vp);
rp = VTOR4(vp);
recov_state.rs_flags = 0;
recov_state.rs_num_retry_despite_err = 0;
/* Re-entered from the EAGAIN case below, after nfs4_end_op(). */
retry:
if ((e.error = nfs4_start_op(mi, vp, NULL, &recov_state)) != 0) {
return (e.error);
}
/* Non-zero when the caller asked for the delegation to be discarded. */
claimnull = (flags & NFS4_DR_DISCARD);
/*
 * Each stream returned by get_next_deleg_stream() carries a reference
 * that must be dropped with open_stream_rele() on every path out of
 * the loop body.
 */
while ((osp = get_next_deleg_stream(rp, claimnull)) != NULL) {
if (claimnull) {
nfs4_reopen(vp, osp, &e, CLAIM_NULL, FALSE, FALSE);
} else {
/* Count the attempt, and separately count full success. */
ncg->nfs4_callback_stats.claim_cur.value.ui64++;
nfs4_reopen(vp, osp, &e, CLAIM_DELEGATE_CUR, FALSE,
FALSE);
if (e.error == 0 && e.stat == NFS4_OK)
ncg->nfs4_callback_stats.
claim_cur_ok.value.ui64++;
}
/* EAGAIN: end this op and start over from nfs4_start_op(). */
if (e.error == EAGAIN) {
open_stream_rele(osp, rp);
nfs4_end_op(mi, vp, NULL, &recov_state, TRUE);
goto retry;
}
/*
 * Interrupted, timed out, or forced-unmount error: stop processing
 * streams.  No recovery is started here on this path.
 * NOTE(review): presumably nfs4_reopen() has already dealt with
 * recovery for these errors -- confirm against nfs4_reopen().
 */
if (e.error == EINTR || e.error == ETIMEDOUT ||
NFS4_FRC_UNMT_ERR(e.error, vp->v_vfsp)) {
open_stream_rele(osp, rp);
break;
}
needrecov = nfs4_needs_recovery(&e, TRUE, vp->v_vfsp);
if (e.error != 0 && !needrecov) {
/*
 * Failure that recovery will not address: count it and carry on
 * with the remaining streams.
 */
ncg->nfs4_callback_stats.recall_failed.value.ui64++;
} else if (needrecov) {
/* Start recovery, tell the caller, and stop iterating. */
(void) nfs4_start_recovery(&e, mi, vp, NULL, NULL,
NULL, OP_OPEN, NULL, NULL, NULL);
open_stream_rele(osp, rp);
*recovp = TRUE;
break;
}
open_stream_rele(osp, rp);
}
/* needrecov holds the value from the last stream examined, if any. */
nfs4_end_op(mi, vp, NULL, &recov_state, needrecov);
return (e.error);
}
/*
 * Find the next open stream on rp that still needs to be reopened and
 * return it with os_ref_count incremented, or NULL if there is none.
 *
 * The caller must hold r_deleg_recall_lock as writer (asserted).
 *
 * A stream is a candidate only if it is marked os_delegation, has not
 * failed a reopen, and is valid.  A candidate is selected when claimnull
 * is zero, or a delegation return is pending on the rnode, or
 * stateid4_cmp() on the stream's open stateid and the rnode's delegation
 * stateid returns zero.
 */
static nfs4_open_stream_t *
get_next_deleg_stream(rnode4_t *rp, int claimnull)
{
	nfs4_open_stream_t *cand;
	nfs4_open_stream_t *picked = NULL;

	ASSERT(nfs_rw_lock_held(&rp->r_deleg_recall_lock, RW_WRITER));

	mutex_enter(&rp->r_os_lock);
	cand = list_head(&rp->r_open_streams);
	while (cand != NULL) {
		mutex_enter(&cand->os_sync_lock);
		if (cand->os_delegation && !cand->os_failed_reopen &&
		    cand->os_valid &&
		    (!claimnull || rp->r_deleg_return_pending ||
		    !stateid4_cmp(&cand->open_stateid,
		    &rp->r_deleg_stateid))) {
			/* The reference is taken under os_sync_lock. */
			cand->os_ref_count++;
			picked = cand;
		}
		mutex_exit(&cand->os_sync_lock);

		if (picked != NULL)
			break;

		cand = list_next(&rp->r_open_streams, cand);
	}
	mutex_exit(&rp->r_os_lock);

	return (picked);
}
/*
 * Thread entry point that carries out a delegation return for args->rp.
 *
 * args is consumed: it is freed before the thread exits.  One hold on
 * the rnode's vnode is released at exit (callers such as
 * nfs4delegabandon() take that hold before creating the thread).
 *
 * The fields read from args are rp, flags and truncate.
 */
static void
nfs4delegreturn_thread(struct cb_recall_pass *args)
{
rnode4_t *rp;
vnode_t *vp;
cred_t *cr;
int dtype, error, flags;
bool_t rdirty, rip;
kmutex_t cpr_lock;
callb_cpr_t cpr_info;
struct nfs4_callback_globals *ncg;
ncg = zone_getspecific(nfs4_callback_zone_key, nfs_zone());
ASSERT(ncg != NULL);
/* Set up CPR callback state for this thread, guarded by a local mutex. */
mutex_init(&cpr_lock, NULL, MUTEX_DEFAULT, NULL);
CALLB_CPR_INIT(&cpr_info, &cpr_lock, callb_generic_cpr,
"nfsv4delegRtn");
rp = args->rp;
vp = RTOV4(rp);
/* Early out before taking r_rwlock: no delegation means no work. */
mutex_enter(&rp->r_statev4_lock);
if (rp->r_deleg_type == OPEN_DELEGATE_NONE) {
mutex_exit(&rp->r_statev4_lock);
goto out;
}
mutex_exit(&rp->r_statev4_lock);
/* Hold r_rwlock as reader across the return; the result is ignored. */
(void) nfs_rw_enter_sig(&rp->r_rwlock, RW_READER, FALSE);
/*
 * r_statev4_lock was dropped above, so check the delegation type
 * again now that r_rwlock is held.
 */
mutex_enter(&rp->r_statev4_lock);
if (rp->r_deleg_type == OPEN_DELEGATE_NONE) {
mutex_exit(&rp->r_statev4_lock);
nfs_rw_exit(&rp->r_rwlock);
goto out;
}
/*
 * Snapshot the delegation type and take our own reference on the
 * delegation cred so both stay usable after the lock is dropped.
 */
dtype = rp->r_deleg_type;
cr = rp->r_deleg_cred;
ASSERT(cr != NULL);
crhold(cr);
mutex_exit(&rp->r_statev4_lock);
flags = args->flags;
if (args->truncate) {
/* Truncate case: count it and invalidate pages, whatever the type. */
ncg->nfs4_callback_stats.recall_trunc.value.ui64++;
nfs4_invalidate_pages(vp, 0, cr);
} else if (dtype == OPEN_DELEGATE_WRITE) {
/* Write delegation: push pages if the rnode is flagged dirty. */
mutex_enter(&rp->r_statelock);
rdirty = rp->r_flags & R4DIRTY;
mutex_exit(&rp->r_statelock);
if (rdirty) {
error = VOP_PUTPAGE(vp, 0, 0, 0, cr, NULL);
if (error)
CB_WARN1("nfs4delegreturn_thread:"
" VOP_PUTPAGE: %d\n", error);
}
/* NFS4_DR_PUSH is cleared here whether or not a push was needed. */
flags &= ~NFS4_DR_PUSH;
}
mutex_enter(&rp->r_statelock);
rip = rp->r_flags & R4RECOVERRP;
mutex_exit(&rp->r_statelock);
/* R4RECOVERRP set: call VOP_PUTPAGE with B_INVAL on the file's pages. */
if (rip) {
error = VOP_PUTPAGE(vp, 0, 0, B_INVAL, cr, NULL);
if (error)
CB_WARN1("nfs4delegreturn_thread: VOP_PUTPAGE: %d\n",
error);
}
/* NFS4_DR_DID_OP is never passed on to nfs4delegreturn_impl(). */
flags &= ~NFS4_DR_DID_OP;
(void) nfs4delegreturn_impl(rp, flags, ncg);
nfs_rw_exit(&rp->r_rwlock);
crfree(cr);
out:
/* Common exit: free the argument and drop the vnode hold. */
kmem_free(args, sizeof (struct cb_recall_pass));
VN_RELE(vp);
/*
 * CALLB_CPR_EXIT is invoked with cpr_lock held and no mutex_exit()
 * follows; presumably the macro releases the lock -- confirm against
 * its definition.
 */
mutex_enter(&cpr_lock);
CALLB_CPR_EXIT(&cpr_info);
mutex_destroy(&cpr_lock);
zthread_exit();
}
/*
 * Record in rp the delegation (if any) carried by an OPEN result, and
 * decide whether that delegation must be returned straight away.
 *
 * rp    - rnode the OPEN applied to
 * claim - claim type used for the OPEN; only CLAIM_PREVIOUS is treated
 *         specially (the server's recall flag is honored)
 * res   - OPEN result; res->delegation supplies the type and details
 * garp  - attributes from the OPEN, may be NULL; n4g_change seeds the
 *         delegation change values for write delegations
 * cr    - credential stored (with a new hold) as the delegation cred
 *         when the rnode did not already have a delegation
 *
 * Returns silently if find_nfs4_server() finds no server for the mount.
 */
void
nfs4_delegation_accept(rnode4_t *rp, open_claim_type4 claim, OPEN4res *res,
nfs4_ga_res_t *garp, cred_t *cr)
{
open_read_delegation4 *orp;
open_write_delegation4 *owp;
nfs4_server_t *np;
bool_t already = FALSE;
bool_t recall = FALSE;
bool_t valid_garp = TRUE;
bool_t delegation_granted = FALSE;
bool_t dr_needed = FALSE;
bool_t recov;
int dr_flags = 0;
long mapcnt;
uint_t rflag;
mntinfo4_t *mi;
struct nfs4_callback_globals *ncg;
open_delegation_type4 odt;
ncg = zone_getspecific(nfs4_callback_zone_key, nfs_zone());
ASSERT(ncg != NULL);
mi = VTOMI4(RTOV4(rp));
/*
 * np->s_lock is asserted held further down and released without a
 * matching mutex_enter() in this function, so find_nfs4_server()
 * evidently returns with s_lock held.
 */
if ((np = find_nfs4_server(mi)) == NULL)
return;
/* Lock order used here: s_lock, then r_statelock, then r_statev4_lock. */
mutex_enter(&rp->r_statelock);
mutex_enter(&rp->r_statev4_lock);
/* Remember whether the rnode held a delegation before this OPEN. */
if (rp->r_deleg_type == OPEN_DELEGATE_READ ||
rp->r_deleg_type == OPEN_DELEGATE_WRITE)
already = TRUE;
odt = res->delegation.delegation_type;
if (odt == OPEN_DELEGATE_READ) {
/* Read delegation: copy type, stateid and permissions. */
rp->r_deleg_type = res->delegation.delegation_type;
orp = &res->delegation.open_delegation4_u.read;
rp->r_deleg_stateid = orp->stateid;
rp->r_deleg_perms = orp->permissions;
/* The recall flag is only consulted for CLAIM_PREVIOUS opens. */
if (claim == CLAIM_PREVIOUS)
if ((recall = orp->recall) != 0)
dr_needed = TRUE;
delegation_granted = TRUE;
/*
 * NOTE(review): the delegations counter is incremented even when
 * 'already' is TRUE, while the list insertion below is skipped in
 * that case -- confirm this accounting is intended.
 */
ncg->nfs4_callback_stats.delegations.value.ui64++;
ncg->nfs4_callback_stats.delegaccept_r.value.ui64++;
} else if (odt == OPEN_DELEGATE_WRITE) {
/* Write delegation: as for read, plus the space limit. */
rp->r_deleg_type = res->delegation.delegation_type;
owp = &res->delegation.open_delegation4_u.write;
rp->r_deleg_stateid = owp->stateid;
rp->r_deleg_perms = owp->permissions;
rp->r_deleg_limit = owp->space_limit;
if (claim == CLAIM_PREVIOUS)
if ((recall = owp->recall) != 0)
dr_needed = TRUE;
delegation_granted = TRUE;
/*
 * Without a valid change attribute the change values start at 0,
 * and valid_garp == FALSE forces a delegation return below.
 */
if (garp == NULL || !garp->n4g_change_valid) {
valid_garp = FALSE;
rp->r_deleg_change = 0;
rp->r_deleg_change_grant = 0;
} else {
rp->r_deleg_change = garp->n4g_change;
rp->r_deleg_change_grant = garp->n4g_change;
}
mapcnt = rp->r_mapcnt;
rflag = rp->r_flags;
/* Bump the change value if the file is mapped or flagged dirty. */
if (mapcnt > 0 || rflag & R4DIRTY)
rp->r_deleg_change++;
NFS4_DEBUG(nfs4_callback_debug, (CE_NOTE,
"nfs4_delegation_accept: r_deleg_change: 0x%x\n",
(int)(rp->r_deleg_change >> 32)));
NFS4_DEBUG(nfs4_callback_debug, (CE_NOTE,
"nfs4_delegation_accept: r_delg_change_grant: 0x%x\n",
(int)(rp->r_deleg_change_grant >> 32)));
ncg->nfs4_callback_stats.delegations.value.ui64++;
ncg->nfs4_callback_stats.delegaccept_rw.value.ui64++;
} else if (already) {
/*
 * Nothing was granted by this OPEN but the rnode already holds a
 * delegation: schedule that delegation for return.
 */
dr_needed = TRUE;
}
if (delegation_granted) {
if (!already) {
/*
 * First delegation on this rnode: store a held cred, put the
 * rnode on the server's delegation list, and take a server
 * reference and a state reference for it.
 */
crhold(cr);
rp->r_deleg_cred = cr;
ASSERT(mutex_owned(&np->s_lock));
list_insert_head(&np->s_deleg_list, rp);
np->s_refcnt++;
nfs4_inc_state_ref_count_nolock(np, mi);
}
rp->r_deleg_needs_recovery = OPEN_DELEGATE_NONE;
}
/* Bookkeeping done: release all three locks and the server reference. */
mutex_exit(&rp->r_statev4_lock);
mutex_exit(&rp->r_statelock);
mutex_exit(&np->s_lock);
nfs4_server_rele(np);
/* Sample whether recovery is active on this mount. */
mutex_enter(&mi->mi_lock);
recov = mi->mi_recovflags & MI4_RECOV_ACTIV;
mutex_exit(&mi->mi_lock);
mutex_enter(&rp->r_statev4_lock);
/* An IMMEDIATE return policy or missing change info forces a return. */
if (nfs4_delegreturn_policy == IMMEDIATE || !valid_garp)
dr_needed = TRUE;
if (dr_needed && rp->r_deleg_return_pending == FALSE) {
if (recov) {
/*
 * Recovery active: do not return the delegation from here.
 * Queue the rnode with nfs4_dlistadd() instead.  When the server
 * did not ask for a recall, NFS4_DR_DISCARD is added to the flags.
 * dr_flags is then zeroed so the direct call below is skipped.
 */
if (recall)
dr_flags = NFS4_DR_PUSH;
else
dr_flags = NFS4_DR_PUSH|NFS4_DR_DISCARD;
nfs4_dlistadd(rp, ncg, dr_flags);
dr_flags = 0;
} else {
/* No recovery: return it below, after dropping r_statev4_lock. */
dr_flags = NFS4_DR_PUSH|NFS4_DR_DID_OP|NFS4_DR_REOPEN;
}
}
mutex_exit(&rp->r_statev4_lock);
if (dr_flags)
(void) nfs4delegreturn_impl(rp, dr_flags, ncg);
}
/*
 * Start an asynchronous delegation return for rp, if it currently holds
 * a delegation.
 *
 * The vnode is held on behalf of the new thread and a cb_recall_pass is
 * allocated for it; nfs4delegreturn_thread() releases both.  The request
 * is made with no flags and with truncate set to FALSE.
 */
void
nfs4delegabandon(rnode4_t *rp)
{
	struct cb_recall_pass *req;
	open_delegation_type4 held_type;
	vnode_t *vp;

	/* Sample the delegation type under r_statev4_lock. */
	mutex_enter(&rp->r_statev4_lock);
	held_type = rp->r_deleg_type;
	mutex_exit(&rp->r_statev4_lock);

	if (held_type != OPEN_DELEGATE_NONE) {
		vp = RTOV4(rp);
		VN_HOLD(vp);

		req = kmem_alloc(sizeof (struct cb_recall_pass), KM_SLEEP);
		req->rp = rp;
		req->flags = 0;
		req->truncate = FALSE;

		/* The delegreturn itself runs in a separate zone thread. */
		(void) zthread_create(NULL, 0, nfs4delegreturn_thread, req, 0,
		    minclsyspri);
	}
}
/*
 * Acquire r_deleg_recall_lock as reader for one vnode.
 *
 * Only regular files (VREG) are locked; a NULL vnode or any other vnode
 * type yields 0 with nothing done.  When the lock is obtained, flg is
 * OR-ed into rsp->rs_flags to record that it is held.  The op argument
 * is unused.
 *
 * Returns 0 on success, or the error from nfs_rw_enter_sig().
 */
static int
wait_for_recall1(vnode_t *vp, nfs4_op_hint_t op, nfs4_recov_state_t *rsp,
    int flg)
{
	int rc;

#ifdef lint
	op = op;
#endif

	if (vp == NULL || vp->v_type != VREG)
		return (0);

	rc = nfs_rw_enter_sig(&VTOR4(vp)->r_deleg_recall_lock,
	    RW_READER, INTR4(vp));
	if (rc == 0)
		rsp->rs_flags |= flg;

	return (rc);
}
/*
 * Release the r_deleg_recall_lock(s) recorded as held in rsp->rs_flags.
 *
 * vp2's lock is released first, then vp1's.  A lock is released only
 * when its vnode pointer is non-NULL and the matching
 * NFS4_RS_RECALL_HELDn bit is set.  The flag bits themselves are not
 * cleared here.
 */
void
nfs4_end_op_recall(vnode_t *vp1, vnode_t *vp2, nfs4_recov_state_t *rsp)
{
	NFS4_DEBUG(nfs4_recall_debug,
	    (CE_NOTE, "nfs4_end_op_recall: 0x%p, 0x%p\n",
	    (void *)vp1, (void *)vp2));

	if (vp2 != NULL && (rsp->rs_flags & NFS4_RS_RECALL_HELD2) != 0) {
		nfs_rw_exit(&VTOR4(vp2)->r_deleg_recall_lock);
	}

	if (vp1 != NULL && (rsp->rs_flags & NFS4_RS_RECALL_HELD1) != 0) {
		nfs_rw_exit(&VTOR4(vp1)->r_deleg_recall_lock);
	}
}
/*
 * Acquire the delegation recall locks for up to two vnodes, vp1 first.
 *
 * Both NFS4_RS_RECALL_HELD bits in rsp->rs_flags are cleared on entry
 * and then set by wait_for_recall1() for each lock actually obtained.
 * If the second acquisition fails, a lock obtained for vp1 is released
 * and its flag cleared, so no lock is left held on error.
 *
 * Returns 0 on success, or the error from the failing acquisition.
 */
int
wait_for_recall(vnode_t *vp1, vnode_t *vp2, nfs4_op_hint_t op,
    nfs4_recov_state_t *rsp)
{
	int rc;

	NFS4_DEBUG(nfs4_recall_debug,
	    (CE_NOTE, "wait_for_recall: 0x%p, 0x%p\n",
	    (void *)vp1, (void *) vp2));

	rsp->rs_flags &= ~(NFS4_RS_RECALL_HELD1|NFS4_RS_RECALL_HELD2);

	rc = wait_for_recall1(vp1, op, rsp, NFS4_RS_RECALL_HELD1);
	if (rc == 0) {
		rc = wait_for_recall1(vp2, op, rsp, NFS4_RS_RECALL_HELD2);
		if (rc != 0 &&
		    (rsp->rs_flags & NFS4_RS_RECALL_HELD1) != 0) {
			/* Back out the first lock. */
			nfs_rw_exit(&VTOR4(vp1)->r_deleg_recall_lock);
			rsp->rs_flags &= ~NFS4_RS_RECALL_HELD1;
		}
	}

	return (rc);
}
/*
 * Queue rp on the per-zone list of rnodes awaiting a deferred
 * delegation return, to be processed later with the given flags.
 *
 * The caller must hold rp->r_statev4_lock (asserted).  The rnode is
 * marked r_deleg_return_pending and its vnode is held; the hold is
 * dropped by nfs4_dlistclean_impl() once the entry has been processed.
 */
static void
nfs4_dlistadd(rnode4_t *rp, struct nfs4_callback_globals *ncg, int flags)
{
	struct nfs4_dnode *entry;

	ASSERT(mutex_owned(&rp->r_statev4_lock));

	rp->r_deleg_return_pending = TRUE;

	entry = kmem_alloc(sizeof (struct nfs4_dnode), KM_SLEEP);
	VN_HOLD(RTOV4(rp));
	entry->rnodep = rp;
	entry->flags = flags;

	mutex_enter(&ncg->nfs4_dlist_lock);
	list_insert_head(&ncg->nfs4_dlist, entry);
#ifdef DEBUG
	ncg->nfs4_dlistadd_c++;
#endif
	mutex_exit(&ncg->nfs4_dlist_lock);
}
/*
 * Drain the per-zone deferred-delegreturn list.
 *
 * Each entry is unlinked and freed, nfs4delegreturn_impl() is called for
 * its rnode, and the vnode hold taken by nfs4_dlistadd() is released.
 * nfs4_dlist_lock is dropped while an entry is being processed.
 *
 * override_flags must be 0 or NFS4_DR_DISCARD (asserted).  When
 * non-zero it is used in place of the flags stored in each entry.
 */
static void
nfs4_dlistclean_impl(struct nfs4_callback_globals *ncg, int override_flags)
{
	struct nfs4_dnode *entry;
	rnode4_t *rp;
	int flags;

	ASSERT(override_flags == 0 || override_flags == NFS4_DR_DISCARD);

	mutex_enter(&ncg->nfs4_dlist_lock);
	for (;;) {
		entry = list_head(&ncg->nfs4_dlist);
		if (entry == NULL)
			break;
#ifdef DEBUG
		ncg->nfs4_dlistclean_c++;
#endif
		list_remove(&ncg->nfs4_dlist, entry);
		mutex_exit(&ncg->nfs4_dlist_lock);

		/* Copy out what is needed, then free the list entry. */
		rp = entry->rnodep;
		if (override_flags != 0)
			flags = override_flags;
		else
			flags = entry->flags;
		kmem_free(entry, sizeof (*entry));

		(void) nfs4delegreturn_impl(rp, flags, ncg);
		VN_RELE(RTOV4(rp));

		/* The lock is needed again to look at the list head. */
		mutex_enter(&ncg->nfs4_dlist_lock);
	}
	mutex_exit(&ncg->nfs4_dlist_lock);
}
/*
 * Process the current zone's deferred-delegreturn list, using the flags
 * stored with each entry (no override).
 */
void
nfs4_dlistclean(void)
{
	struct nfs4_callback_globals *zone_ncg;

	zone_ncg = zone_getspecific(nfs4_callback_zone_key, nfs_zone());
	ASSERT(zone_ncg != NULL);

	nfs4_dlistclean_impl(zone_ncg, 0);
}