#include "rcm_impl.h"
#include "rcm_module.h"
/*
 * Mutex held by the request-list routines in this file while they read or
 * modify the request lists; it is also the mutex paired with polllist.cv.
 */
mutex_t rcm_req_lock;
/* Descriptor of the opened RCM_STATE_FILE; set by rcmd_lock_init(). */
static int state_fd;
/* Path of the file that backs the mmap'ed DR request list. */
#define RCM_STATE_FILE "/var/run/rcm_daemon_state"
/* Number of request slots added each time a request list is grown. */
#define N_REQ_CHUNK 10
/* Default idle timeout, in seconds, used by rcmd_start_timer(). */
#define RCM_DAEMON_TIMEOUT 300
/*
 * One request slot.  A slot is considered free when its state is
 * RCM_STATE_REMOVE or its device string is empty.
 */
typedef struct {
/* sequence number of the request; compared after >> SEQ_NUM_SHIFT */
int seq_num;
/* one of the RCM_STATE_* values */
int state;
/* pid of the DR initiator that owns the request */
pid_t pid;
/* request flags; the RCM_FILESYS bit takes part in entry matching */
uint_t flag;
/* value returned by rsrc_get_type() for the device (DR list only) */
int type;
/* interval supplied with the request; zeroed when none was given */
timespec_t interval;
/* resolved resource name, as returned by resolve_name() */
char device[MAXPATHLEN];
} req_t;
/*
 * Header of a request list followed by a variable number of req_t slots.
 * The structure is allocated (or mapped) with room for n_req_max slots.
 */
typedef struct {
/* number of slots currently in use */
int n_req;
/* number of slots allocated */
int n_req_max;
/* counter incremented by get_seq_number() for each new sequence number */
int n_seq_max;
/* idle timeout stored by rcmd_start_timer() when a non-zero one is given */
int idle_timeout;
/* first slot; the array really holds n_req_max entries */
req_t req[1];
} req_list_t;
/* DR request list; mmap'ed from RCM_STATE_FILE by rcmd_lock_init(). */
static req_list_t *dr_req_list;
/* Info request list; heap allocated by rcmd_lock_init(). */
static req_list_t *info_req_list;
/* Strings attached to the busy-resource info reported on a lock conflict. */
static const char *locked_info = "DR operation in progress";
static const char *locked_err = "Resource is busy";
/* Forward declarations of routines defined later in this file. */
static int rcmd_get_state();
static void add_to_polling_list(pid_t);
static void remove_from_polling_list(pid_t);
void start_polling_thread();
static void stop_polling_thread();
/*
 * Set up both request lists.
 *
 * The info request list is allocated on the heap with a single slot.  The
 * DR request list is backed by RCM_STATE_FILE: the file is opened (created
 * if necessary), sized to hold at least one req_list_t when it is empty,
 * and mapped shared so updates land in the file.
 *
 * When the mapped list reports n_req_max == 0 the list is new, so it is
 * initialized and the function returns.  Otherwise the list carries state
 * from an earlier run and clean_dr_list() is invoked to look for stale
 * entries.
 *
 * Any failure is logged and passed to rcmd_exit().  errno is captured
 * before logging so the value handed to rcmd_exit() is the one set by the
 * failing call and not one left behind by the logging path.
 */
void
rcmd_lock_init(void)
{
	int size;
	int err;
	struct stat fbuf;

	info_req_list = s_calloc(1, sizeof (req_list_t));
	info_req_list->n_req_max = 1;

	state_fd = open(RCM_STATE_FILE, O_CREAT|O_RDWR, 0600);
	if (state_fd == -1) {
		err = errno;
		rcm_log_message(RCM_ERROR, gettext("cannot open %s: %s\n"),
		    RCM_STATE_FILE, strerror(err));
		rcmd_exit(err);
	}

	if (fstat(state_fd, &fbuf) != 0) {
		err = errno;
		rcm_log_message(RCM_ERROR, gettext("cannot stat %s: %s\n"),
		    RCM_STATE_FILE, strerror(err));
		rcmd_exit(err);
	}

	size = fbuf.st_size;
	if (size == 0) {
		/* brand new file: make room for the header and one slot */
		size = sizeof (req_list_t);
		if (ftruncate(state_fd, size) != 0) {
			err = errno;
			rcm_log_message(RCM_ERROR,
			    gettext("cannot truncate %s: %s\n"),
			    RCM_STATE_FILE, strerror(err));
			rcmd_exit(err);
		}
	}

	dr_req_list = (req_list_t *)mmap(NULL, size, PROT_READ|PROT_WRITE,
	    MAP_SHARED, state_fd, 0);
	if (dr_req_list == MAP_FAILED) {
		err = errno;
		rcm_log_message(RCM_ERROR, gettext("cannot mmap %s: %s\n"),
		    RCM_STATE_FILE, strerror(err));
		rcmd_exit(err);
	}

	if (dr_req_list->n_req_max == 0) {
		/* freshly created list: nothing to recover */
		dr_req_list->n_req_max = 1;
		(void) fsync(state_fd);
		return;
	}

	rcm_log_message(RCM_DEBUG, "n_req = %d, n_req_max = %d\n",
	    dr_req_list->n_req, dr_req_list->n_req_max);

	/* the list holds state from an earlier run: look for stale entries */
	clean_dr_list();
}
/*
 * Hand out the next sequence number.
 *
 * Returns 0 when the DR request list has not been set up yet.  Otherwise
 * the list's n_seq_max counter is bumped, the state file descriptor is
 * fsync'ed, and the counter shifted left by SEQ_NUM_SHIFT is returned.
 */
static int
get_seq_number()
{
	int seq;

	if (dr_req_list == NULL) {
		return (0);
	}

	dr_req_list->n_seq_max += 1;
	seq = dr_req_list->n_seq_max << SEQ_NUM_SHIFT;

	(void) fsync(state_fd);

	return (seq);
}
/*
 * Locate an in-use entry in 'list'.
 *
 * An entry matches when it is not in RCM_STATE_REMOVE, its device string
 * equals 'device', its RCM_FILESYS flag bit equals that of 'flag', and,
 * unless 'seq_num' is -1, its sequence number equals 'seq_num' once both
 * are shifted right by SEQ_NUM_SHIFT.
 *
 * Returns the first matching entry, or NULL when there is none.
 */
static req_t *
find_req_entry(char *device, uint_t flag, int seq_num, req_list_t *list)
{
	int idx;

	for (idx = 0; idx < list->n_req_max; idx++) {
		req_t *cand = &list->req[idx];

		if (cand->state == RCM_STATE_REMOVE) {
			continue;
		}
		if (strcmp(device, cand->device) != 0) {
			continue;
		}
		if ((cand->flag & RCM_FILESYS) != (flag & RCM_FILESYS)) {
			continue;
		}
		if (seq_num != -1 && (seq_num >> SEQ_NUM_SHIFT) !=
		    (cand->seq_num >> SEQ_NUM_SHIFT)) {
			continue;
		}

		return (cand);
	}

	return (NULL);
}
/*
 * Reserve a free slot in the list referenced by 'listp' and return it.
 *
 * If every slot is in use, the list is grown by N_REQ_CHUNK slots first:
 * the info list is reallocated on the heap, any other list (the DR list)
 * is grown by extending the state file and mapping it again.  '*listp' is
 * updated to the new address, the added slots are marked free, and the
 * first added slot is returned.
 *
 * Otherwise the first slot that has an empty device string or is in
 * RCM_STATE_REMOVE is returned.
 *
 * In both cases n_req is incremented; the caller fills in the slot.
 * Failures to grow the state file are logged and passed to rcmd_exit();
 * errno is captured before logging so that rcmd_exit() receives the value
 * set by the failing call.
 */
static req_t *
get_req_entry(req_list_t **listp)
{
	int i;
	int n_req = (*listp)->n_req;
	int n_req_max = (*listp)->n_req_max;

	if (n_req == n_req_max) {
		int newsize;
		int err;

		n_req_max += N_REQ_CHUNK;
		newsize = sizeof (req_list_t) + (n_req_max - 1) *
		    sizeof (req_t);

		if (listp == &info_req_list) {
			*listp = s_realloc(*listp, newsize);
		} else if (ftruncate(state_fd, newsize) != 0) {
			err = errno;
			rcm_log_message(RCM_ERROR,
			    gettext("cannot truncate %s: %s\n"),
			    RCM_STATE_FILE, strerror(err));
			rcmd_exit(err);
		} else if ((*listp = (req_list_t *)mmap(NULL, newsize,
		    PROT_READ|PROT_WRITE, MAP_SHARED, state_fd, 0)) ==
		    MAP_FAILED) {
			err = errno;
			rcm_log_message(RCM_ERROR,
			    gettext("cannot mmap %s: %s\n"),
			    RCM_STATE_FILE, strerror(err));
			rcmd_exit(err);
		}

		/* mark the newly added slots as free */
		for (i = (*listp)->n_req_max; i < n_req_max; i++) {
			(*listp)->req[i].state = RCM_STATE_REMOVE;
			(void) strcpy((*listp)->req[i].device, "");
		}

		(*listp)->n_req_max = n_req_max;
		(*listp)->n_req++;

		/* n_req equals the old capacity, i.e. the first new slot */
		return (&(*listp)->req[n_req]);
	}

	/* the list has room: pick the first free slot */
	for (i = 0; i < n_req_max; i++) {
		if (((*listp)->req[i].device[0] == '\0') ||
		    ((*listp)->req[i].state == RCM_STATE_REMOVE)) {
			break;
		}
	}

	assert(i < n_req_max);

	(*listp)->n_req++;
	return (&(*listp)->req[i]);
}
/*
 * Record an info request for 'rsrcname' under sequence number 'seq_num'.
 *
 * Returns 0 when a new entry was added to the info request list.  Returns
 * -1 when an entry for the same resolved device, RCM_FILESYS flag bit and
 * sequence number already exists (logged as a "getinfo cycle"), or when
 * the resource name cannot be resolved.
 *
 * The resolved name is copied with a bounded copy so that it can never
 * overrun the fixed-size device field of the entry.
 */
int
info_req_add(char *rsrcname, uint_t flag, int seq_num)
{
	int error = 0;
	char *device;
	req_t *req;

	rcm_log_message(RCM_TRACE2, "info_req_add(%s, %d)\n",
	    rsrcname, seq_num);

	device = resolve_name(rsrcname);
	if (device == NULL) {
		/* nothing to track; find_req_entry() needs a valid string */
		return (-1);
	}

	(void) mutex_lock(&rcm_req_lock);

	if (find_req_entry(device, flag, seq_num, info_req_list) != NULL) {
		rcm_log_message(RCM_DEBUG, "getinfo cycle: %s %d \n",
		    device, seq_num);
		error = -1;
		goto out;
	}

	req = get_req_entry(&info_req_list);
	req->seq_num = seq_num;
	req->state = RCM_STATE_ONLINE;
	req->flag = flag;
	(void) strlcpy(req->device, device, sizeof (req->device));

out:
	(void) mutex_unlock(&rcm_req_lock);
	free(device);

	return (error);
}
void
info_req_remove(int seq_num)
{
int i;
rcm_log_message(RCM_TRACE3, "info_req_remove(%d)\n", seq_num);
seq_num >>= SEQ_NUM_SHIFT;
(void) mutex_lock(&rcm_req_lock);
for (i = 0; i < info_req_list->n_req_max; i++) {
if (info_req_list->req[i].state == RCM_STATE_REMOVE)
continue;
if ((info_req_list->req[i].seq_num >> SEQ_NUM_SHIFT) != seq_num)
continue;
info_req_list->req[i].state = RCM_STATE_REMOVE;
info_req_list->n_req--;
}
(void) mutex_unlock(&rcm_req_lock);
}
/*
 * Check 'device' against the entries of the DR request list.
 *
 * '*info' (when 'info' is non-NULL) is reset to NULL on entry.  If the DR
 * list has not been set up, RCM_SUCCESS is returned without any check.
 *
 * For each in-use entry:
 *  - if 'device' equals the entry's device or is a DESCENDENT of it, the
 *    entry conflicts and the scan stops.  The exception is when 'flag'
 *    has RCM_FILESYS set: then only an entry for exactly the same device
 *    that also has RCM_FILESYS set counts.
 *  - otherwise, if 'cflag' is LOCK_FOR_DR and the entry's device is a
 *    DESCENDENT of 'device', the entry conflicts and the scan continues
 *    so that all such entries are reported.
 *
 * Every conflicting entry is appended to '*info' through
 * add_busy_rsrc_to_list().  Returns RCM_CONFLICT if any conflict was
 * found, RCM_SUCCESS otherwise.
 *
 * The scan covers all n_req_max slots.  n_req is only the number of slots
 * in use, and in-use slots are not necessarily contiguous once an earlier
 * slot has been released, so bounding the scan by n_req would skip live
 * entries stored at higher indexes.
 */
static int
check_lock(char *device, uint_t flag, int cflag, rcm_info_t **info)
{
	int i, ret = RCM_SUCCESS;

	if (info)
		*info = NULL;

	if (dr_req_list == NULL)
		return (ret);

	for (i = 0; i < dr_req_list->n_req_max; i++) {
		req_t *req = &dr_req_list->req[i];
		char *dr_dev = req->device;

		/* skip free slots */
		if ((req->state == RCM_STATE_REMOVE) || (dr_dev[0] == '\0'))
			continue;

		if (EQUAL(device, dr_dev) || DESCENDENT(device, dr_dev)) {
			/*
			 * A filesystem request only conflicts with a
			 * filesystem entry for exactly the same device.
			 */
			if ((flag & RCM_FILESYS) && (!EQUAL(device, dr_dev) ||
			    ((req->flag & RCM_FILESYS) == 0)))
				continue;

			assert(info != 0);

			add_busy_rsrc_to_list(dr_dev, req->pid, req->state,
			    req->seq_num, NULL, locked_info, locked_err,
			    NULL, info);
			ret = RCM_CONFLICT;
			break;
		}

		if ((cflag == LOCK_FOR_DR) && DESCENDENT(dr_dev, device)) {
			assert(info != 0);

			add_busy_rsrc_to_list(dr_dev, req->pid, req->state,
			    req->seq_num, NULL, locked_info, locked_err,
			    NULL, info);
			ret = RCM_CONFLICT;
		}
	}

	return (ret);
}
/*
 * Resolve 'rsrcname' and run check_lock() on the resolved name, passing
 * 'flag', 'cflag' and 'info' through unchanged.  The resolved name is
 * freed before returning.  Returns whatever check_lock() returned.
 *
 * NOTE(review): rcm_req_lock is not taken here; confirm whether callers
 * are expected to hold it.
 */
int
rsrc_check_lock_conflicts(char *rsrcname, uint_t flag, int cflag,
    rcm_info_t **info)
{
	char *resolved = resolve_name(rsrcname);
	int status = check_lock(resolved, flag, cflag, info);

	free(resolved);
	return (status);
}
/*
 * Return 1 when 'state' is one of the in-progress states (offlining,
 * suspending, resuming, onlining, removing) and 0 for any other value.
 */
static int
transition_state(int state)
{
	if (state == RCM_STATE_OFFLINING ||
	    state == RCM_STATE_SUSPENDING ||
	    state == RCM_STATE_RESUMING ||
	    state == RCM_STATE_ONLINING ||
	    state == RCM_STATE_REMOVING) {
		return (1);
	}

	return (0);
}
/*
 * Move the existing DR request entry for 'device' to 'state'.
 *
 * The entry is looked up by device name and RCM_FILESYS flag bit only
 * (any sequence number).  Return values:
 *   RCM_FAILURE  - no entry exists for the device, or 'state' is not a
 *                  value this routine knows how to apply
 *   RCM_SUCCESS  - the entry was updated with 'state', 'seq_num' and
 *                  'interval' (zeroed when 'interval' is NULL)
 *   EAGAIN       - the update was refused and the entry is currently in
 *                  one of the in-progress states (see transition_state())
 *   RCM_CONFLICT - the update was refused for any other entry state
 *
 * On a refused update the existing entry is reported through 'infop' when
 * it is non-NULL.  While the daemon is in RCMD_INIT all validation is
 * skipped and the entry is updated unconditionally.
 */
static int
dr_req_update_entry(char *device, pid_t pid, uint_t flag, int state,
int seq_num, timespec_t *interval, rcm_info_t **infop)
{
req_t *req;
req = find_req_entry(device, flag, -1, dr_req_list);
if (req == NULL) {
/*
 * No entry to update.  This is only logged for states other than the
 * four listed below, which are the ones that may start a new request.
 */
switch (state) {
case RCM_STATE_OFFLINE_QUERYING:
case RCM_STATE_SUSPEND_QUERYING:
case RCM_STATE_OFFLINING:
case RCM_STATE_SUSPENDING:
break;
default:
rcm_log_message(RCM_DEBUG,
"update non-existing resource %s\n", device);
}
return (RCM_FAILURE);
}
/* during daemon initialization the entry is updated without checks */
if (rcmd_get_state() == RCMD_INIT)
goto update;
/* only the pid recorded in the entry may change its state */
if (pid != req->pid) {
rcm_log_message(RCM_INFO,
gettext("mismatched dr initiator pid: %ld %ld\n"),
req->pid, pid);
goto failure;
}
rcm_log_message(RCM_TRACE4,
"dr_req_update_entry: state=%d, device=%s\n",
req->state, req->device);
/* validate the requested transition against the entry's current state */
switch (state) {
case RCM_STATE_OFFLINE_QUERYING:
case RCM_STATE_OFFLINING:
if ((req->state != RCM_STATE_OFFLINE_FAIL) &&
(req->state != RCM_STATE_OFFLINE_QUERYING) &&
(req->state != RCM_STATE_OFFLINE_QUERY) &&
(req->state != RCM_STATE_OFFLINE_QUERY_FAIL) &&
(req->state != RCM_STATE_OFFLINE)) {
rcm_log_message(RCM_WARNING,
gettext("%s: invalid offlining from state %d\n"),
device, req->state);
goto failure;
}
break;
case RCM_STATE_SUSPEND_QUERYING:
case RCM_STATE_SUSPENDING:
if ((req->state != RCM_STATE_SUSPEND_FAIL) &&
(req->state != RCM_STATE_SUSPEND_QUERYING) &&
(req->state != RCM_STATE_SUSPEND_QUERY) &&
(req->state != RCM_STATE_SUSPEND_QUERY_FAIL) &&
(req->state != RCM_STATE_SUSPEND)) {
rcm_log_message(RCM_WARNING,
gettext("%s: invalid suspending from state %d\n"),
device, req->state);
goto failure;
}
break;
case RCM_STATE_RESUMING:
if ((req->state != RCM_STATE_SUSPEND) &&
(req->state != RCM_STATE_SUSPEND_QUERYING) &&
(req->state != RCM_STATE_SUSPEND_QUERY) &&
(req->state != RCM_STATE_SUSPEND_QUERY_FAIL) &&
(req->state != RCM_STATE_SUSPEND_FAIL)) {
rcm_log_message(RCM_DEBUG,
"%s: invalid resuming from state %d\n",
device, req->state);
goto failure;
}
break;
case RCM_STATE_ONLINING:
if ((req->state != RCM_STATE_OFFLINE) &&
(req->state != RCM_STATE_OFFLINE_QUERYING) &&
(req->state != RCM_STATE_OFFLINE_QUERY) &&
(req->state != RCM_STATE_OFFLINE_QUERY_FAIL) &&
(req->state != RCM_STATE_OFFLINE_FAIL)) {
rcm_log_message(RCM_INFO,
gettext("%s: invalid onlining from state %d\n"),
device, req->state);
goto failure;
}
break;
case RCM_STATE_REMOVING:
if ((req->state != RCM_STATE_OFFLINE) &&
(req->state != RCM_STATE_OFFLINE_FAIL)) {
rcm_log_message(RCM_INFO,
gettext("%s: invalid removing from state %d\n"),
device, req->state);
goto failure;
}
break;
/*
 * The remaining states are completion states; the entry is asserted to
 * be in the matching in-progress state.
 */
case RCM_STATE_SUSPEND_FAIL:
assert(req->state == RCM_STATE_SUSPENDING);
break;
case RCM_STATE_OFFLINE_FAIL:
assert(req->state == RCM_STATE_OFFLINING);
break;
case RCM_STATE_SUSPEND:
assert(req->state == RCM_STATE_SUSPENDING);
break;
case RCM_STATE_OFFLINE:
assert(req->state == RCM_STATE_OFFLINING);
break;
case RCM_STATE_ONLINE:
assert((req->state == RCM_STATE_RESUMING) ||
(req->state == RCM_STATE_ONLINING));
break;
default:
rcm_log_message(RCM_ERROR,
gettext("invalid update to dr state: %d\n"), state);
return (RCM_FAILURE);
}
update:
/* record the new state in the entry and fsync the state file descriptor */
req->state = state;
req->seq_num = seq_num;
if (interval)
req->interval = *interval;
else
bzero(&req->interval, sizeof (timespec_t));
(void) fsync(state_fd);
return (RCM_SUCCESS);
failure:
/* report the entry that blocked the update, if the caller wants it */
if (infop != NULL) {
add_busy_rsrc_to_list(req->device, req->pid, req->state,
req->seq_num, NULL, locked_info, locked_err, NULL, infop);
}
/* an entry in an in-progress state is reported as EAGAIN */
if (transition_state(req->state)) {
return (EAGAIN);
}
return (RCM_CONFLICT);
}
/*
 * Add a DR request for 'rsrcname', or update the existing one.
 *
 * The resolved name is first handed to dr_req_update_entry().  Any result
 * other than RCM_FAILURE (which means "no usable existing entry") is
 * returned as is.  On RCM_FAILURE the name is checked against the current
 * locks with check_lock(); if that reports anything but RCM_SUCCESS,
 * RCM_CONFLICT is returned.  Otherwise a new entry is filled in, the state
 * file descriptor is fsync'ed and the initiator pid is added to the
 * polling list.
 *
 * Returns EINVAL when the name cannot be resolved or when the resolved
 * name does not fit in the fixed-size device field of an entry; otherwise
 * RCM_SUCCESS, RCM_CONFLICT, or the value from dr_req_update_entry().
 *
 * Over-long names are rejected up front, and the copy into the entry is
 * bounded, so the device field of the shared state can never be overrun.
 */
int
dr_req_add(char *rsrcname, pid_t pid, uint_t flag, int state, int seq_num,
    timespec_t *interval, rcm_info_t **info)
{
	int error;
	char *device;
	req_t *req;

	rcm_log_message(RCM_TRACE3, "dr_req_add(%s, %ld, 0x%x, %d, %d, %p)\n",
	    rsrcname, pid, flag, state, seq_num, (void *)info);

	device = resolve_name(rsrcname);
	if (device == NULL)
		return (EINVAL);

	/* a name that cannot be stored in req_t.device cannot be locked */
	if (strlen(device) >= MAXPATHLEN) {
		free(device);
		return (EINVAL);
	}

	(void) mutex_lock(&rcm_req_lock);

	/* try to update an existing entry first */
	error = dr_req_update_entry(device, pid, flag, state, seq_num, interval,
	    info);
	if (error != RCM_FAILURE)
		goto out;

	/* no existing entry: make sure the new one would not conflict */
	error = check_lock(device, flag, LOCK_FOR_DR, info);
	if (error != RCM_SUCCESS) {
		error = RCM_CONFLICT;
		goto out;
	}

	req = get_req_entry(&dr_req_list);
	req->seq_num = seq_num;
	req->pid = pid;
	req->flag = flag;
	req->state = state;
	req->type = rsrc_get_type(device);
	(void) strlcpy(req->device, device, sizeof (req->device));

	if (interval)
		req->interval = *interval;
	else
		bzero(&req->interval, sizeof (timespec_t));

	(void) fsync(state_fd);

	/* watch the initiator so that its death can be noticed */
	add_to_polling_list(req->pid);

out:
	(void) mutex_unlock(&rcm_req_lock);
	free(device);

	return (error);
}
/*
 * Update the state of the existing DR request for 'rsrcname'.
 *
 * The name is resolved and passed to dr_req_update_entry() under
 * rcm_req_lock, with no interval.  Returns EINVAL when the name cannot be
 * resolved (the same convention dr_req_add() uses); otherwise returns the
 * value from dr_req_update_entry().
 */
int
dr_req_update(char *rsrcname, pid_t pid, uint_t flag, int state, int seq_num,
    rcm_info_t **info)
{
	int error;
	char *device = resolve_name(rsrcname);

	rcm_log_message(RCM_TRACE3, "dr_req_update(%s, %ld, 0x%x, %d, %d)\n",
	    rsrcname, pid, flag, state, seq_num);

	/* the entry lookup compares strings and needs a valid name */
	if (device == NULL)
		return (EINVAL);

	(void) mutex_lock(&rcm_req_lock);
	error = dr_req_update_entry(device, pid, flag, state, seq_num, NULL,
	    info);
	(void) mutex_unlock(&rcm_req_lock);

	free(device);

	return (error);
}
int
dr_req_lookup(int seq_num, char *rsrc)
{
int i;
int len;
int base = (seq_num >> SEQ_NUM_SHIFT);
int retval = RCM_FAILURE;
if (rsrc == NULL) {
return (RCM_FAILURE);
}
(void) mutex_lock(&rcm_req_lock);
for (i = 0; i < dr_req_list->n_req_max; i++) {
if ((dr_req_list->req[i].state == RCM_STATE_REMOVE) ||
((dr_req_list->req[i].seq_num >> SEQ_NUM_SHIFT) != base)) {
continue;
}
len = strlcpy(rsrc, dr_req_list->req[i].device, MAXPATHLEN);
if (len < MAXPATHLEN) {
retval = RCM_SUCCESS;
}
break;
}
(void) mutex_unlock(&rcm_req_lock);
return (retval);
}
/*
 * Release the DR request entry for 'rsrcname'.
 *
 * The entry is looked up by resolved device name and RCM_FILESYS flag bit.
 * When found it is put in RCM_STATE_REMOVE, n_req is decremented, the
 * state file descriptor is fsync'ed and the entry's pid is dropped from
 * the polling list.  When no entry is found, or the name cannot be
 * resolved, a warning is logged and nothing else happens.
 */
void
dr_req_remove(char *rsrcname, uint_t flag)
{
	req_t *req = NULL;
	char *device = resolve_name(rsrcname);

	rcm_log_message(RCM_TRACE3, "dr_req_remove(%s)\n", rsrcname);

	(void) mutex_lock(&rcm_req_lock);

	/* an unresolvable name cannot match any entry */
	if (device != NULL)
		req = find_req_entry(device, flag, -1, dr_req_list);
	free(device);

	if (req == NULL) {
		(void) mutex_unlock(&rcm_req_lock);
		rcm_log_message(RCM_WARNING,
		    gettext("dr_req entry %s not found\n"), rsrcname);
		return;
	}

	req->state = RCM_STATE_REMOVE;
	dr_req_list->n_req--;
	(void) fsync(state_fd);

	remove_from_polling_list(req->pid);

	(void) mutex_unlock(&rcm_req_lock);
}
rcm_info_t *
rsrc_dr_info()
{
int i;
rcm_info_t *info;
rcm_info_t *result = NULL;
char *rsrc;
int len;
rcm_log_message(RCM_TRACE2, "rsrc_dr_info()\n");
(void) mutex_lock(&rcm_req_lock);
for (i = 0; i < dr_req_list->n_req_max; i++) {
if (dr_req_list->req[i].state == RCM_STATE_REMOVE)
continue;
if (dr_req_list->req[i].device[0] == '\0')
continue;
if (dr_req_list->req[i].flag & RCM_FILESYS) {
len = strlen(dr_req_list->req[i].device) + 5;
rsrc = s_malloc(len);
(void) snprintf(rsrc, len, "%s(fs)",
dr_req_list->req[i].device);
} else {
rsrc = s_strdup(dr_req_list->req[i].device);
}
info = s_calloc(1, sizeof (*info));
if (errno = nvlist_alloc(&(info->info), NV_UNIQUE_NAME, 0)) {
rcm_log_message(RCM_ERROR,
gettext("failed (nvlist_alloc=%s).\n"),
strerror(errno));
rcmd_exit(errno);
}
if (errno = nvlist_add_string(info->info, RCM_RSRCNAME, rsrc)) {
rcm_log_message(RCM_ERROR,
gettext("failed (nvlist_add=%s).\n"),
strerror(errno));
rcmd_exit(errno);
}
(void) free(rsrc);
if (errno = nvlist_add_int64(info->info, RCM_CLIENT_ID,
dr_req_list->req[i].pid)) {
rcm_log_message(RCM_ERROR,
gettext("failed (nvlist_add=%s).\n"),
strerror(errno));
rcmd_exit(errno);
}
if (errno = nvlist_add_int32(info->info, RCM_SEQ_NUM,
dr_req_list->req[i].seq_num)) {
rcm_log_message(RCM_ERROR,
gettext("failed (nvlist_add=%s).\n"),
strerror(errno));
rcmd_exit(errno);
}
if (errno = nvlist_add_int32(info->info, RCM_RSRCSTATE,
dr_req_list->req[i].state)) {
rcm_log_message(RCM_ERROR,
gettext("failed (nvlist_add=%s).\n"),
strerror(errno));
rcmd_exit(errno);
}
if (errno = nvlist_add_string(info->info, RCM_CLIENT_INFO,
(char *)locked_info)) {
rcm_log_message(RCM_ERROR,
gettext("failed (nvlist_add=%s).\n"),
strerror(errno));
rcmd_exit(errno);
}
info->next = result;
result = info;
}
(void) mutex_unlock(&rcm_req_lock);
return (result);
}
/*
 * Look for stale DR requests and drive each one back to a stable state.
 *
 * Pass 1 (under rcm_req_lock) copies the interesting fields of every
 * stale entry into a private list.  Pass 2 (lock dropped) walks that list
 * and, depending on the recorded state and on whether the initiator
 * process still exists, re-issues or undoes the operation through the
 * process_resource_*() / notify_resource_*() routines.
 */
void
clean_dr_list()
{
int i;
/* private copy of a stale entry, so pass 2 can run without the lock */
struct clean_list {
struct clean_list *next;
char *rsrcname;
pid_t pid;
int seq_num;
int state;
timespec_t interval;
} *tmp, *list = NULL;
/* NULL-terminated single-element name array passed to the handlers */
char *rsrcnames[2];
rcm_log_message(RCM_TRACE3,
"clean_dr_list(): look for stale dr initiators\n");
rsrcnames[1] = NULL;
(void) mutex_lock(&rcm_req_lock);
for (i = 0; i < dr_req_list->n_req_max; i++) {
/* skip free slots */
if (dr_req_list->req[i].state == RCM_STATE_REMOVE)
continue;
if (dr_req_list->req[i].device[0] == '\0')
continue;
/*
 * Skip entries whose sequence number has any SEQ_NUM_MASK bit set.
 * NOTE(review): presumably these are sub-requests of another
 * operation - confirm against the SEQ_NUM_MASK definition.
 */
if (dr_req_list->req[i].seq_num & SEQ_NUM_MASK)
continue;
/* in cleanup state, entries whose initiator is alive are not stale */
if ((rcmd_get_state() == RCMD_CLEANUP) &&
proc_exist(dr_req_list->req[i].pid))
continue;
rcm_log_message(RCM_TRACE1,
"found stale entry: %s\n", dr_req_list->req[i].device);
tmp = s_malloc(sizeof (*tmp));
tmp->rsrcname = s_strdup(dr_req_list->req[i].device);
tmp->state = dr_req_list->req[i].state;
tmp->pid = dr_req_list->req[i].pid;
tmp->seq_num = dr_req_list->req[i].seq_num;
tmp->interval = dr_req_list->req[i].interval;
tmp->next = list;
list = tmp;
}
(void) mutex_unlock(&rcm_req_lock);
if (list == NULL)
return;
if (rcmd_get_state() == RCMD_INIT) {
rcm_log_message(RCM_NOTICE, gettext("rcm_daemon died "
"unexpectedly, recovering previous daemon state\n"));
} else {
rcm_log_message(RCM_INFO, gettext("one or more dr initiator "
"died, attempting automatic recovery\n"));
}
/* pass 2: recover each stale entry, then free its private copy */
while (list) {
tmp = list;
list = tmp->next;
switch (tmp->state) {
/*
 * Completed (or failed) operations: repeat the operation when the
 * initiator still exists, otherwise undo it (online / resume).
 */
case RCM_STATE_OFFLINE_QUERY:
case RCM_STATE_OFFLINE_QUERY_FAIL:
rsrcnames[0] = tmp->rsrcname;
if (proc_exist(tmp->pid)) {
(void) process_resource_offline(rsrcnames,
tmp->pid, RCM_QUERY, tmp->seq_num, NULL);
} else {
(void) notify_resource_online(rsrcnames,
tmp->pid, 0, tmp->seq_num, NULL);
}
break;
case RCM_STATE_OFFLINE:
case RCM_STATE_OFFLINE_FAIL:
rsrcnames[0] = tmp->rsrcname;
if (proc_exist(tmp->pid)) {
(void) process_resource_offline(rsrcnames,
tmp->pid, 0, tmp->seq_num, NULL);
} else {
(void) notify_resource_online(rsrcnames,
tmp->pid, 0, tmp->seq_num, NULL);
}
break;
case RCM_STATE_SUSPEND_QUERY:
case RCM_STATE_SUSPEND_QUERY_FAIL:
rsrcnames[0] = tmp->rsrcname;
if (proc_exist(tmp->pid)) {
(void) process_resource_suspend(rsrcnames,
tmp->pid, RCM_QUERY, tmp->seq_num,
&tmp->interval, NULL);
} else {
(void) notify_resource_resume(rsrcnames,
tmp->pid, 0, tmp->seq_num, NULL);
}
break;
case RCM_STATE_SUSPEND:
case RCM_STATE_SUSPEND_FAIL:
rsrcnames[0] = tmp->rsrcname;
if (proc_exist(tmp->pid)) {
(void) process_resource_suspend(rsrcnames,
tmp->pid, 0, tmp->seq_num, &tmp->interval,
NULL);
} else {
(void) notify_resource_resume(rsrcnames,
tmp->pid, 0, tmp->seq_num, NULL);
}
break;
/* interrupted in-progress operations are always rolled forward */
case RCM_STATE_OFFLINING:
case RCM_STATE_ONLINING:
rsrcnames[0] = tmp->rsrcname;
(void) notify_resource_online(rsrcnames, tmp->pid, 0,
tmp->seq_num, NULL);
break;
case RCM_STATE_SUSPENDING:
case RCM_STATE_RESUMING:
rsrcnames[0] = tmp->rsrcname;
(void) notify_resource_resume(rsrcnames, tmp->pid, 0,
tmp->seq_num, NULL);
break;
case RCM_STATE_REMOVING:
rsrcnames[0] = tmp->rsrcname;
(void) notify_resource_remove(rsrcnames, tmp->pid, 0,
tmp->seq_num, NULL);
break;
default:
rcm_log_message(RCM_WARNING,
gettext("%s in unknown state %d\n"),
tmp->rsrcname, tmp->state);
break;
}
free(tmp->rsrcname);
free(tmp);
}
}
/*
 * Daemon-wide barrier: holds the daemon state, the count of threads that
 * are running or waiting, and the lock/condition variable protecting them.
 */
barrier_t barrier;
/*
 * Return the current daemon state (one of the RCMD_* values).  The value
 * is read without taking barrier.lock.
 */
int
rcmd_get_state()
{
return (barrier.state);
}
/*
 * Change the daemon state.
 *
 * Entering RCMD_CLEANUP blocks until barrier.thr_count drops to zero and
 * then sets thr_count to -1.  Entering any other state resets a thr_count
 * of -1 back to 0 and wakes every waiter on the barrier when barrier.wanted
 * is non-zero.
 */
void
rcmd_set_state(int state)
{
	(void) mutex_lock(&barrier.lock);

	barrier.state = state;

	if (state == RCMD_CLEANUP) {
		/* wait for every running request thread to finish */
		barrier.wanted++;
		while (barrier.thr_count != 0) {
			(void) cond_wait(&barrier.cv, &barrier.lock);
		}
		barrier.wanted--;
		barrier.thr_count = -1;
	} else {
		/* RCMD_INIT, RCMD_NORMAL and anything else */
		if (barrier.thr_count == -1) {
			barrier.thr_count = 0;
		}
		if (barrier.wanted) {
			(void) cond_broadcast(&barrier.cv);
		}
	}

	(void) mutex_unlock(&barrier.lock);
}
/*
 * Register a request thread with the barrier.
 *
 * Blocks until the daemon state is RCMD_NORMAL, then counts the thread in
 * barrier.thr_count.  Returns -1 for CMD_EVENT, CMD_REGISTER and
 * CMD_UNREGISTER; for every other command a new sequence number from
 * get_seq_number() is returned.  For CMD_OFFLINE, CMD_SUSPEND and
 * CMD_GETINFO, rcmd_db_sync() is called after the barrier lock has been
 * released.
 */
int
rcmd_thr_incr(int cmd)
{
	int seq_num;
	int no_seq = (cmd == CMD_EVENT) || (cmd == CMD_REGISTER) ||
	    (cmd == CMD_UNREGISTER);
	int needs_sync = (cmd == CMD_OFFLINE) || (cmd == CMD_SUSPEND) ||
	    (cmd == CMD_GETINFO);

	(void) mutex_lock(&barrier.lock);

	/* advertise that a thread is waiting, then wait for normal state */
	barrier.wanted++;
	while (barrier.state != RCMD_NORMAL) {
		(void) cond_wait(&barrier.cv, &barrier.lock);
	}

	if (no_seq) {
		seq_num = -1;
	} else {
		seq_num = get_seq_number();
	}

	barrier.wanted--;
	barrier.thr_count++;

	(void) mutex_unlock(&barrier.lock);

	if (needs_sync) {
		rcmd_db_sync();
	}

	return (seq_num);
}
/*
 * Unregister a request thread from the barrier: record the current time
 * in barrier.last_update, decrement barrier.thr_count and, when the count
 * reaches zero, wake every waiter on the barrier.
 */
void
rcmd_thr_decr()
{
	(void) mutex_lock(&barrier.lock);

	barrier.last_update = time(NULL);

	barrier.thr_count -= 1;
	if (barrier.thr_count == 0) {
		(void) cond_broadcast(&barrier.cv);
	}

	(void) mutex_unlock(&barrier.lock);
}
/* Set to 1 by rcmd_thr_signal(); checked by rcmd_start_timer(). */
static int sighup_received = 0;
/*
 * Record that the signal was received and wake every waiter on the
 * barrier so that rcmd_start_timer() re-evaluates its exit condition.
 */
void
rcmd_thr_signal()
{
(void) mutex_lock(&barrier.lock);
sighup_received = 1;
(void) cond_broadcast(&barrier.cv);
(void) mutex_unlock(&barrier.lock);
}
void
rcmd_start_timer(int timeout)
{
timestruc_t abstime;
if (timeout == 0)
timeout = RCM_DAEMON_TIMEOUT;
else
dr_req_list->idle_timeout = timeout;
if (timeout > 0) {
abstime.tv_sec = time(NULL) + timeout;
}
(void) mutex_lock(&barrier.lock);
for (;;) {
int idletime;
int is_active;
if (timeout > 0)
(void) cond_timedwait(&barrier.cv, &barrier.lock,
&abstime);
else
(void) cond_wait(&barrier.cv, &barrier.lock);
if (sighup_received)
timeout = 0;
if (timeout < 0)
continue;
is_active = (barrier.thr_count || barrier.wanted ||
(dr_req_list->n_req != 0));
if (is_active) {
abstime.tv_sec = time(NULL) + timeout;
continue;
}
idletime = time(NULL) - barrier.last_update;
if (idletime < timeout) {
abstime.tv_sec = barrier.last_update + timeout;
continue;
}
break;
}
(void) script_main_fini();
rcm_log_message(RCM_INFO, gettext("rcm_daemon is shut down.\n"));
}
/*
 * Bookkeeping for the thread that polls the DR initiator processes.
 * pids[], refcnt[] and fds[] are parallel arrays indexed by the same slot.
 */
struct {
/* number of slots in use */
int n_pids;
/* number of slots allocated in each array */
int n_max_pids;
/* id of the polling thread, or (thread_t)-1 when none is running */
thread_t poll_tid;
/* non-zero once SIGUSR1 has been sent to the current polling thread */
int signaled;
/* watched process ids */
pid_t *pids;
/* number of references held on each watched pid */
int *refcnt;
/* descriptors handed to poll(), one per watched pid */
struct pollfd *fds;
/* signalled by cleanup_poll_thread(); waited on with rcm_req_lock */
cond_t cv;
} polllist;
/*
 * Return the slot of 'pid' in the polling list, or -1 when the pid is not
 * being watched.
 */
static int
find_pid_index(pid_t pid)
{
	int slot = 0;

	while (slot < polllist.n_pids) {
		if (polllist.pids[slot] == pid) {
			return (slot);
		}
		slot++;
	}

	return (-1);
}
/*
 * Reserve the next slot of the polling list and return its index.
 *
 * When all allocated slots are in use the three parallel arrays are grown
 * by ten slots (allocated zeroed the first time, reallocated afterwards).
 * n_pids is incremented; the caller fills in the slot.
 */
static int
get_pid_index()
{
	const int n_chunk = 10;
	int slot = polllist.n_pids;

	if (polllist.n_pids >= polllist.n_max_pids) {
		int capacity = polllist.n_max_pids + n_chunk;

		if (polllist.n_max_pids == 0) {
			/* first use: allocate the arrays */
			polllist.pids = s_calloc(capacity, sizeof (pid_t));
			polllist.refcnt = s_calloc(capacity, sizeof (int));
			polllist.fds = s_calloc(capacity,
			    sizeof (struct pollfd));
		} else {
			polllist.pids = s_realloc(polllist.pids,
			    capacity * sizeof (pid_t));
			polllist.refcnt = s_realloc(polllist.refcnt,
			    capacity * sizeof (int));
			polllist.fds = s_realloc(polllist.fds,
			    capacity * sizeof (struct pollfd));
		}
		polllist.n_max_pids = capacity;
	}

	polllist.n_pids++;
	return (slot);
}
/*
 * Start watching process 'pid', or take another reference on it when it
 * is already watched.  A pid of 0 is ignored.
 *
 * Adding a new pid changes the arrays handed to poll(), so the polling
 * thread is stopped first and restarted afterwards.  The lookup is
 * repeated after the stop because stop_polling_thread() waits on a
 * condition variable and the list may have changed in the meantime.
 *
 * The process is watched through a read-only descriptor on its
 * /proc/<pid>/as file; if that file cannot be opened the failure is
 * logged and the pid is not added.
 */
static void
add_to_polling_list(pid_t pid)
{
	int fd, index;
	char procfile[MAXPATHLEN];

	if (pid == (pid_t)0)
		return;

	rcm_log_message(RCM_TRACE1, "add_to_polling_list(%ld)\n", (long)pid);

	/* already watched: just take a reference */
	index = find_pid_index(pid);
	if (index != -1) {
		polllist.refcnt[index]++;
		return;
	}

	stop_polling_thread();

	/* the list may have changed while waiting for the thread to stop */
	index = find_pid_index(pid);
	if (index != -1) {
		polllist.refcnt[index]++;
		goto done;
	}

	(void) snprintf(procfile, sizeof (procfile), "/proc/%ld/as",
	    (long)pid);
	if ((fd = open(procfile, O_RDONLY)) == -1) {
		rcm_log_message(RCM_NOTICE, gettext("open(%s): %s\n"),
		    procfile, strerror(errno));
		goto done;
	}

	index = get_pid_index();
	polllist.pids[index] = pid;
	polllist.refcnt[index] = 1;
	polllist.fds[index].fd = fd;
	polllist.fds[index].events = 0;
	polllist.fds[index].revents = 0;

	/* index is an int, so it is printed with %d */
	rcm_log_message(RCM_DEBUG, "add pid %ld at index %d\n", (long)pid,
	    index);

done:
	start_polling_thread();
}
/*
 * Drop one reference on watched process 'pid'; stop watching it when the
 * last reference goes away.  A pid of 0 is ignored, and an unknown pid is
 * logged.
 *
 * Removing a slot changes the arrays handed to poll(), so the polling
 * thread is stopped first and restarted afterwards.  The lookup is
 * repeated after the stop because the list may have changed while waiting.
 */
static void
remove_from_polling_list(pid_t pid)
{
	int slot;
	int pos;

	if (pid == (pid_t)0)
		return;

	rcm_log_message(RCM_TRACE1, "remove_from_polling_list(%ld)\n", pid);

	slot = find_pid_index(pid);
	if (slot == -1) {
		rcm_log_message(RCM_NOTICE,
		    gettext("error removing pid %ld from polling list\n"), pid);
		return;
	}

	/* other references remain: nothing more to do */
	if (polllist.refcnt[slot] > 1) {
		polllist.refcnt[slot]--;
		return;
	}

	stop_polling_thread();

	slot = find_pid_index(pid);
	if (slot == -1) {
		rcm_log_message(RCM_NOTICE,
		    gettext("error removing pid %ld from polling list\n"), pid);
	} else if (--polllist.refcnt[slot] <= 0) {
		(void) close(polllist.fds[slot].fd);
		polllist.n_pids--;

		/* close the gap in all three parallel arrays */
		for (pos = slot; pos < polllist.n_pids; pos++) {
			polllist.pids[pos] = polllist.pids[pos + 1];
			polllist.refcnt[pos] = polllist.refcnt[pos + 1];
			polllist.fds[pos] = polllist.fds[pos + 1];
		}

		rcm_log_message(RCM_DEBUG, "remove pid %ld at index %d\n",
		    pid, slot);
	}

	start_polling_thread();
}
/*
 * Mark the polling thread as not running; (thread_t)-1 is the value the
 * rest of this file tests for to mean "no polling thread".
 */
void
init_poll_thread()
{
polllist.poll_tid = (thread_t)-1;
}
/*
 * Called by a thread on its way out.  If the caller is the current polling
 * thread, the polling thread id is reset to (thread_t)-1 and every waiter
 * on polllist.cv is woken.  For any other caller nothing happens.
 */
void
cleanup_poll_thread()
{
	(void) mutex_lock(&rcm_req_lock);

	if (thr_self() == polllist.poll_tid) {
		rcm_log_message(RCM_TRACE2,
		    "cleanup_poll_thread: n_pids = %d\n", polllist.n_pids);

		polllist.poll_tid = (thread_t)-1;
		(void) cond_broadcast(&polllist.cv);
	}

	(void) mutex_unlock(&rcm_req_lock);
}
/*
 * Body of the polling thread.
 *
 * SIGUSR1 is unblocked for the duration of a single poll() call on the
 * watched descriptors with no timeout, then blocked again.  When poll()
 * returns, the thread deregisters itself through cleanup_poll_thread(),
 * sets need_cleanup and wakes every waiter on the barrier.
 *
 * 'arg' is unused; the return value is always NULL.
 */
static void *
pollfunc(void *arg)
{
	sigset_t usr1;

	rcm_log_message(RCM_TRACE2, "poll thread started. n_pids = %d\n",
	    polllist.n_pids);

	/* the same one-signal set serves for unblocking and re-blocking */
	(void) sigemptyset(&usr1);
	(void) sigaddset(&usr1, SIGUSR1);

	(void) thr_sigsetmask(SIG_UNBLOCK, &usr1, NULL);
	(void) poll(polllist.fds, polllist.n_pids, (time_t)-1);
	(void) thr_sigsetmask(SIG_BLOCK, &usr1, NULL);

	rcm_log_message(RCM_TRACE2, "returned from poll()\n");

	cleanup_poll_thread();

	(void) mutex_lock(&barrier.lock);
	need_cleanup = 1;
	(void) cond_broadcast(&barrier.cv);
	(void) mutex_unlock(&barrier.lock);

	return (NULL);
}
/*
 * Start the polling thread if it is needed and not already running.
 *
 * Nothing is done unless the daemon is in RCMD_NORMAL state, no polling
 * thread is currently recorded, and at least one pid is being watched.
 * On success the 'signaled' flag is cleared; a failure to create the
 * thread is logged.
 */
void
start_polling_thread()
{
	int err;

	if (rcmd_get_state() != RCMD_NORMAL)
		return;

	if (polllist.poll_tid != (thread_t)-1 || polllist.n_pids == 0)
		return;

	err = thr_create(NULL, 0, pollfunc, NULL, THR_DETACHED,
	    &polllist.poll_tid);
	if (err != 0) {
		rcm_log_message(RCM_ERROR,
		    gettext("failed to create polling thread: %s\n"),
		    strerror(err));
		return;
	}

	polllist.signaled = 0;
}
/*
 * Stop the polling thread and wait until it has gone.
 *
 * While a polling thread is recorded, SIGUSR1 is sent to it (once; the
 * 'signaled' flag remembers a successful send) and the caller waits on
 * polllist.cv with rcm_req_lock until cleanup_poll_thread() resets the
 * thread id.
 */
static void
stop_polling_thread()
{
	while (polllist.poll_tid != (thread_t)-1) {
		if (polllist.signaled == 0) {
			int err = thr_kill(polllist.poll_tid, SIGUSR1);

			if (err != 0) {
				rcm_log_message(RCM_ERROR,
				    gettext(
				    "fail to kill polling thread %d: %s\n"),
				    polllist.poll_tid, strerror(err));
			} else {
				polllist.signaled = 1;
			}
		}

		(void) cond_wait(&polllist.cv, &rcm_req_lock);
	}
}