#include <assert.h>
#include <stddef.h>
#include <strings.h>
#include <libuutil.h>
#include <libzfs.h>
#include <fm/fmd_api.h>
#include <fm/libtopo.h>
#include <sys/types.h>
#include <sys/time.h>
#include <sys/fs/zfs.h>
#include <sys/fm/protocol.h>
#include <sys/fm/fs/zfs.h>
#define MAX_SERDLEN (16 * 2 + sizeof ("zfs___checksum"))
typedef struct zfs_case_data {
uint64_t zc_version;
uint64_t zc_ena;
uint64_t zc_pool_guid;
uint64_t zc_vdev_guid;
int zc_has_timer;
int zc_pool_state;
char zc_serd_checksum[MAX_SERDLEN];
char zc_serd_io[MAX_SERDLEN];
int zc_has_remove_timer;
char zc_serd_probe[MAX_SERDLEN];
} zfs_case_data_t;
typedef struct er_timeval {
uint64_t ertv_sec;
uint64_t ertv_nsec;
} er_timeval_t;
typedef struct zfs_case {
boolean_t zc_present;
uint32_t zc_version;
zfs_case_data_t zc_data;
fmd_case_t *zc_case;
uu_list_node_t zc_node;
id_t zc_remove_timer;
char *zc_fru;
er_timeval_t zc_when;
} zfs_case_t;
#define CASE_DATA "data"
#define CASE_FRU "fru"
#define CASE_DATA_VERSION_INITIAL 1
#define CASE_DATA_VERSION_SERD 2
#define MAX_ULL_STR 21
typedef struct zfs_de_stats {
fmd_stat_t old_drops;
fmd_stat_t dev_drops;
fmd_stat_t vdev_drops;
fmd_stat_t import_drops;
fmd_stat_t resource_drops;
fmd_stat_t pool_drops;
} zfs_de_stats_t;
zfs_de_stats_t zfs_stats = {
{ "old_drops", FMD_TYPE_UINT64, "ereports dropped (from before load)" },
{ "dev_drops", FMD_TYPE_UINT64, "ereports dropped (dev during open)"},
{ "vdev_drops", FMD_TYPE_UINT64, "ereports dropped (weird vdev types)"},
{ "import_drops", FMD_TYPE_UINT64, "ereports dropped (during import)" },
{ "resource_drops", FMD_TYPE_UINT64, "resource related ereports" },
{ "pool_drops", FMD_TYPE_UINT64, "ereports dropped (pool iter failed)"},
};
static hrtime_t zfs_remove_timeout;
uu_list_pool_t *zfs_case_pool;
uu_list_t *zfs_cases;
#define ZFS_MAKE_RSRC(type) \
FM_RSRC_CLASS "." ZFS_ERROR_CLASS "." type
#define ZFS_MAKE_EREPORT(type) \
FM_EREPORT_CLASS "." ZFS_ERROR_CLASS "." type
static void
zfs_case_serialize(fmd_hdl_t *hdl, zfs_case_t *zcp)
{
zcp->zc_data.zc_version = CASE_DATA_VERSION_SERD;
fmd_buf_write(hdl, zcp->zc_case, CASE_DATA, &zcp->zc_data,
sizeof (zcp->zc_data));
if (zcp->zc_fru != NULL)
fmd_buf_write(hdl, zcp->zc_case, CASE_FRU, zcp->zc_fru,
strlen(zcp->zc_fru));
}
static zfs_case_t *
zfs_case_unserialize(fmd_hdl_t *hdl, fmd_case_t *cp)
{
zfs_case_t *zcp;
size_t frulen;
zcp = fmd_hdl_zalloc(hdl, sizeof (zfs_case_t), FMD_SLEEP);
zcp->zc_case = cp;
fmd_buf_read(hdl, cp, CASE_DATA, &zcp->zc_data,
sizeof (zcp->zc_data));
if (zcp->zc_data.zc_version > CASE_DATA_VERSION_SERD) {
fmd_hdl_free(hdl, zcp, sizeof (zfs_case_t));
return (NULL);
}
if ((frulen = fmd_buf_size(hdl, zcp->zc_case, CASE_FRU)) > 0) {
zcp->zc_fru = fmd_hdl_alloc(hdl, frulen + 1, FMD_SLEEP);
fmd_buf_read(hdl, zcp->zc_case, CASE_FRU, zcp->zc_fru,
frulen);
zcp->zc_fru[frulen] = '\0';
}
if (zcp->zc_data.zc_has_remove_timer)
zcp->zc_remove_timer = fmd_timer_install(hdl, zcp,
NULL, zfs_remove_timeout);
(void) uu_list_insert_before(zfs_cases, NULL, zcp);
fmd_case_setspecific(hdl, cp, zcp);
return (zcp);
}
static void
zfs_mark_vdev(uint64_t pool_guid, nvlist_t *vd, er_timeval_t *loaded)
{
uint64_t vdev_guid;
uint_t c, children;
nvlist_t **child;
zfs_case_t *zcp;
int ret;
ret = nvlist_lookup_uint64(vd, ZPOOL_CONFIG_GUID, &vdev_guid);
assert(ret == 0);
for (zcp = uu_list_first(zfs_cases); zcp != NULL;
zcp = uu_list_next(zfs_cases, zcp)) {
if (zcp->zc_data.zc_pool_guid == pool_guid &&
zcp->zc_data.zc_vdev_guid == vdev_guid) {
zcp->zc_present = B_TRUE;
zcp->zc_when = *loaded;
}
}
if (nvlist_lookup_nvlist_array(vd, ZPOOL_CONFIG_CHILDREN, &child,
&children) == 0) {
for (c = 0; c < children; c++)
zfs_mark_vdev(pool_guid, child[c], loaded);
}
if (nvlist_lookup_nvlist_array(vd, ZPOOL_CONFIG_L2CACHE, &child,
&children) == 0) {
for (c = 0; c < children; c++)
zfs_mark_vdev(pool_guid, child[c], loaded);
}
if (nvlist_lookup_nvlist_array(vd, ZPOOL_CONFIG_SPARES, &child,
&children) == 0) {
for (c = 0; c < children; c++)
zfs_mark_vdev(pool_guid, child[c], loaded);
}
}
static int
zfs_mark_pool(zpool_handle_t *zhp, void *unused)
{
zfs_case_t *zcp;
uint64_t pool_guid;
uint64_t *tod;
er_timeval_t loaded = { 0 };
nvlist_t *config, *vd;
uint_t nelem = 0;
int ret;
pool_guid = zpool_get_prop_int(zhp, ZPOOL_PROP_GUID, NULL);
for (zcp = uu_list_first(zfs_cases); zcp != NULL;
zcp = uu_list_next(zfs_cases, zcp)) {
if (zcp->zc_data.zc_pool_guid == pool_guid &&
zcp->zc_data.zc_vdev_guid == 0)
zcp->zc_present = B_TRUE;
}
if ((config = zpool_get_config(zhp, NULL)) == NULL) {
zpool_close(zhp);
return (-1);
}
(void) nvlist_lookup_uint64_array(config, ZPOOL_CONFIG_LOADED_TIME,
&tod, &nelem);
if (nelem == 2) {
loaded.ertv_sec = tod[0];
loaded.ertv_nsec = tod[1];
for (zcp = uu_list_first(zfs_cases); zcp != NULL;
zcp = uu_list_next(zfs_cases, zcp)) {
if (zcp->zc_data.zc_pool_guid == pool_guid &&
zcp->zc_data.zc_vdev_guid == 0) {
zcp->zc_when = loaded;
}
}
}
ret = nvlist_lookup_nvlist(config, ZPOOL_CONFIG_VDEV_TREE, &vd);
assert(ret == 0);
zfs_mark_vdev(pool_guid, vd, &loaded);
zpool_close(zhp);
return (0);
}
typedef struct find_cbdata {
uint64_t cb_guid;
zpool_handle_t *cb_zhp;
} find_cbdata_t;
static int
find_pool(zpool_handle_t *zhp, void *data)
{
find_cbdata_t *cbp = data;
if (cbp->cb_guid ==
zpool_get_prop_int(zhp, ZPOOL_PROP_GUID, NULL)) {
cbp->cb_zhp = zhp;
return (0);
}
zpool_close(zhp);
return (0);
}
struct load_time_arg {
uint64_t lt_guid;
er_timeval_t *lt_time;
boolean_t lt_found;
};
static int
zpool_find_load_time(zpool_handle_t *zhp, void *arg)
{
struct load_time_arg *lta = arg;
uint64_t pool_guid;
uint64_t *tod;
nvlist_t *config;
uint_t nelem;
if (lta->lt_found) {
zpool_close(zhp);
return (0);
}
pool_guid = zpool_get_prop_int(zhp, ZPOOL_PROP_GUID, NULL);
if (pool_guid != lta->lt_guid) {
zpool_close(zhp);
return (0);
}
if ((config = zpool_get_config(zhp, NULL)) == NULL) {
zpool_close(zhp);
return (-1);
}
if (nvlist_lookup_uint64_array(config, ZPOOL_CONFIG_LOADED_TIME,
&tod, &nelem) == 0 && nelem == 2) {
lta->lt_found = B_TRUE;
lta->lt_time->ertv_sec = tod[0];
lta->lt_time->ertv_nsec = tod[1];
}
zpool_close(zhp);
return (0);
}
static void
zfs_purge_cases(fmd_hdl_t *hdl)
{
zfs_case_t *zcp;
uu_list_walk_t *walk;
libzfs_handle_t *zhdl = fmd_hdl_getspecific(hdl);
for (zcp = uu_list_first(zfs_cases); zcp != NULL;
zcp = uu_list_next(zfs_cases, zcp))
zcp->zc_present = B_FALSE;
if (zpool_iter(zhdl, zfs_mark_pool, NULL) != 0)
return;
walk = uu_list_walk_start(zfs_cases, UU_WALK_ROBUST);
while ((zcp = uu_list_walk_next(walk)) != NULL) {
if (!zcp->zc_present)
fmd_case_close(hdl, zcp->zc_case);
}
uu_list_walk_end(walk);
}
static void
zfs_serd_name(char *buf, uint64_t pool_guid, uint64_t vdev_guid,
const char *type)
{
(void) snprintf(buf, MAX_SERDLEN, "zfs_%llx_%llx_%s", pool_guid,
vdev_guid, type);
}
static void
zfs_case_solve(fmd_hdl_t *hdl, zfs_case_t *zcp, const char *faultname,
boolean_t checkunusable)
{
libzfs_handle_t *zhdl = fmd_hdl_getspecific(hdl);
nvlist_t *detector, *fault;
boolean_t serialize;
nvlist_t *fmri, *fru;
topo_hdl_t *thp;
int err;
detector = fmd_nvl_alloc(hdl, FMD_SLEEP);
(void) nvlist_add_uint8(detector, FM_VERSION, ZFS_SCHEME_VERSION0);
(void) nvlist_add_string(detector, FM_FMRI_SCHEME, FM_FMRI_SCHEME_ZFS);
(void) nvlist_add_uint64(detector, FM_FMRI_ZFS_POOL,
zcp->zc_data.zc_pool_guid);
if (zcp->zc_data.zc_vdev_guid != 0) {
(void) nvlist_add_uint64(detector, FM_FMRI_ZFS_VDEV,
zcp->zc_data.zc_vdev_guid);
}
if (!fmd_nvl_fmri_present(hdl, detector) ||
(checkunusable && !fmd_nvl_fmri_unusable(hdl, detector))) {
fmd_case_close(hdl, zcp->zc_case);
nvlist_free(detector);
return;
}
fru = NULL;
if (zcp->zc_fru != NULL &&
(thp = fmd_hdl_topo_hold(hdl, TOPO_VERSION)) != NULL) {
if (topo_fmri_str2nvl(thp, zcp->zc_fru, &fmri, &err) == 0) {
if (libzfs_fru_notself(zhdl, zcp->zc_fru)) {
fmd_case_close(hdl, zcp->zc_case);
nvlist_free(fmri);
fmd_hdl_topo_rele(hdl, thp);
nvlist_free(detector);
return;
}
if (topo_fmri_fru(thp, fmri, &fru, &err) != 0)
fru = fmd_nvl_dup(hdl, fmri, FMD_SLEEP);
nvlist_free(fmri);
}
fmd_hdl_topo_rele(hdl, thp);
}
fault = fmd_nvl_create_fault(hdl, faultname, 100, detector,
fru, detector);
fmd_case_add_suspect(hdl, zcp->zc_case, fault);
nvlist_free(fru);
fmd_case_solve(hdl, zcp->zc_case);
serialize = B_FALSE;
if (zcp->zc_data.zc_has_remove_timer) {
fmd_timer_remove(hdl, zcp->zc_remove_timer);
zcp->zc_data.zc_has_remove_timer = 0;
serialize = B_TRUE;
}
if (serialize)
zfs_case_serialize(hdl, zcp);
nvlist_free(detector);
}
#define FMD_EVN_TOD "__tod"
static boolean_t
timeval_earlier(er_timeval_t *a, er_timeval_t *b)
{
return (a->ertv_sec < b->ertv_sec ||
(a->ertv_sec == b->ertv_sec && a->ertv_nsec < b->ertv_nsec));
}
static void
zfs_ereport_when(fmd_hdl_t *hdl, nvlist_t *nvl, er_timeval_t *when)
{
uint64_t *tod;
uint_t nelem;
if (nvlist_lookup_uint64_array(nvl, FMD_EVN_TOD, &tod, &nelem) == 0 &&
nelem == 2) {
when->ertv_sec = tod[0];
when->ertv_nsec = tod[1];
} else {
when->ertv_sec = when->ertv_nsec = UINT64_MAX;
}
}
static void
zfs_fm_recv(fmd_hdl_t *hdl, fmd_event_t *ep, nvlist_t *nvl, const char *class)
{
zfs_case_t *zcp, *dcp;
libzfs_handle_t *zhdl;
zpool_handle_t *zhp;
int32_t pool_state;
uint64_t ena, pool_guid, vdev_guid;
er_timeval_t pool_load;
er_timeval_t er_when;
nvlist_t *detector;
boolean_t pool_found = B_FALSE;
boolean_t isresource;
boolean_t is_inactive_spare, islog, iscache;
nvlist_t *vd_nvl = NULL;
char *fru, *type, *vdg;
find_cbdata_t cb;
if (fmd_nvl_class_match(hdl, nvl, "resource.sysevent.EC_zfs.*")) {
zfs_purge_cases(hdl);
zfs_stats.resource_drops.fmds_value.ui64++;
return;
}
isresource = fmd_nvl_class_match(hdl, nvl, "resource.fs.zfs.*");
if (isresource) {
if (nvlist_lookup_uint64(nvl, FM_EREPORT_PAYLOAD_ZFS_VDEV_GUID,
&vdev_guid) != 0)
pool_state = SPA_LOAD_OPEN;
else
pool_state = SPA_LOAD_NONE;
detector = NULL;
} else {
(void) nvlist_lookup_nvlist(nvl,
FM_EREPORT_DETECTOR, &detector);
(void) nvlist_lookup_int32(nvl,
FM_EREPORT_PAYLOAD_ZFS_POOL_CONTEXT, &pool_state);
}
if (pool_state == SPA_LOAD_IMPORT) {
zfs_stats.import_drops.fmds_value.ui64++;
return;
}
if (pool_state == SPA_LOAD_OPEN &&
(fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_CHECKSUM)) ||
fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_IO)) ||
fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_PROBE_FAILURE)))) {
zfs_stats.dev_drops.fmds_value.ui64++;
return;
}
if (nvlist_lookup_string(nvl, FM_EREPORT_PAYLOAD_ZFS_VDEV_TYPE,
&type) == 0) {
if (strcmp(type, VDEV_TYPE_DISK) != 0 &&
strcmp(type, VDEV_TYPE_FILE) != 0) {
zfs_stats.vdev_drops.fmds_value.ui64++;
return;
}
}
(void) nvlist_lookup_uint64(nvl,
FM_EREPORT_PAYLOAD_ZFS_POOL_GUID, &pool_guid);
if (nvlist_lookup_uint64(nvl,
FM_EREPORT_PAYLOAD_ZFS_VDEV_GUID, &vdev_guid) != 0)
vdev_guid = 0;
if (nvlist_lookup_uint64(nvl, FM_EREPORT_ENA, &ena) != 0)
ena = 0;
zfs_ereport_when(hdl, nvl, &er_when);
for (zcp = uu_list_first(zfs_cases); zcp != NULL;
zcp = uu_list_next(zfs_cases, zcp)) {
if (zcp->zc_data.zc_pool_guid == pool_guid) {
pool_found = B_TRUE;
pool_load = zcp->zc_when;
}
if (zcp->zc_data.zc_vdev_guid == vdev_guid &&
zcp->zc_data.zc_pool_guid == pool_guid)
break;
}
if (pool_found) {
fmd_hdl_debug(hdl, "pool %llx, "
"ereport time %lld.%lld, pool load time = %lld.%lld\n",
pool_guid, er_when.ertv_sec, er_when.ertv_nsec,
pool_load.ertv_sec, pool_load.ertv_nsec);
}
if (pool_found && timeval_earlier(&er_when, &pool_load)) {
zfs_stats.old_drops.fmds_value.ui64++;
return;
}
if (!pool_found) {
libzfs_handle_t *zhdl = fmd_hdl_getspecific(hdl);
struct load_time_arg la;
la.lt_guid = pool_guid;
la.lt_time = &pool_load;
la.lt_found = B_FALSE;
if (zhdl != NULL &&
zpool_iter(zhdl, zpool_find_load_time, &la) == 0 &&
la.lt_found == B_TRUE) {
pool_found = B_TRUE;
fmd_hdl_debug(hdl, "pool %llx, "
"ereport time %lld.%lld, "
"pool load time = %lld.%lld\n",
pool_guid, er_when.ertv_sec, er_when.ertv_nsec,
pool_load.ertv_sec, pool_load.ertv_nsec);
if (timeval_earlier(&er_when, &pool_load)) {
zfs_stats.old_drops.fmds_value.ui64++;
return;
}
}
}
if (zcp == NULL) {
fmd_case_t *cs;
zfs_case_data_t data = { 0 };
if (isresource) {
zfs_stats.resource_drops.fmds_value.ui64++;
return;
}
cs = fmd_case_open(hdl, NULL);
fmd_buf_create(hdl, cs, CASE_DATA,
sizeof (zfs_case_data_t));
data.zc_version = CASE_DATA_VERSION_SERD;
data.zc_ena = ena;
data.zc_pool_guid = pool_guid;
data.zc_vdev_guid = vdev_guid;
data.zc_pool_state = (int)pool_state;
fmd_buf_write(hdl, cs, CASE_DATA, &data, sizeof (data));
zcp = zfs_case_unserialize(hdl, cs);
assert(zcp != NULL);
if (pool_found)
zcp->zc_when = pool_load;
}
if (nvlist_lookup_string(nvl, FM_EREPORT_PAYLOAD_ZFS_VDEV_FRU,
&fru) == 0) {
topo_hdl_t *thp = fmd_hdl_topo_hold(hdl, TOPO_VERSION);
if (zcp->zc_fru == NULL ||
!topo_fmri_strcmp(thp, zcp->zc_fru, fru)) {
if (zcp->zc_fru != NULL) {
fmd_hdl_strfree(hdl, zcp->zc_fru);
fmd_buf_destroy(hdl, zcp->zc_case, CASE_FRU);
}
zcp->zc_fru = fmd_hdl_strdup(hdl, fru, FMD_SLEEP);
zfs_case_serialize(hdl, zcp);
}
fmd_hdl_topo_rele(hdl, thp);
}
if (isresource) {
if (fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_RSRC(FM_RESOURCE_AUTOREPLACE))) {
fmd_case_close(hdl, zcp->zc_case);
} else if (fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_RSRC(FM_RESOURCE_REMOVED))) {
if (zcp->zc_data.zc_has_remove_timer) {
fmd_timer_remove(hdl, zcp->zc_remove_timer);
zcp->zc_data.zc_has_remove_timer = 0;
zfs_case_serialize(hdl, zcp);
}
if (zcp->zc_data.zc_serd_io[0] != '\0')
fmd_serd_reset(hdl,
zcp->zc_data.zc_serd_io);
if (zcp->zc_data.zc_serd_checksum[0] != '\0')
fmd_serd_reset(hdl,
zcp->zc_data.zc_serd_checksum);
if (zcp->zc_data.zc_serd_probe[0] != '\0')
fmd_serd_reset(hdl, zcp->zc_data.zc_serd_probe);
}
zfs_stats.resource_drops.fmds_value.ui64++;
return;
}
fmd_case_add_ereport(hdl, zcp->zc_case, ep);
if (fmd_case_solved(hdl, zcp->zc_case))
return;
zhdl = fmd_hdl_getspecific(hdl);
cb.cb_guid = pool_guid;
cb.cb_zhp = NULL;
if (zhdl != NULL && zpool_iter(zhdl, find_pool, &cb) != 0) {
zfs_stats.pool_drops.fmds_value.ui64++;
return;
}
zhp = cb.cb_zhp;
if (zhp != NULL) {
vdg = fmd_hdl_zalloc(hdl, MAX_ULL_STR, FMD_SLEEP);
(void) snprintf(vdg, MAX_ULL_STR, "%" PRIx64, vdev_guid);
if ((vd_nvl = zpool_find_vdev(zhp, vdg,
&is_inactive_spare, &islog, &iscache)) != NULL) {
nvlist_free(vd_nvl);
}
fmd_hdl_free(hdl, vdg, MAX_ULL_STR);
}
if (fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_POOL))) {
for (dcp = uu_list_first(zfs_cases); dcp != NULL;
dcp = uu_list_next(zfs_cases, dcp)) {
if (dcp->zc_data.zc_pool_guid ==
zcp->zc_data.zc_pool_guid &&
dcp->zc_data.zc_vdev_guid != 0)
fmd_case_close(hdl, dcp->zc_case);
}
zfs_case_solve(hdl, zcp, "fault.fs.zfs.pool", B_TRUE);
} else if (fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_LOG_REPLAY))) {
zfs_case_solve(hdl, zcp, "fault.fs.zfs.log_replay", B_TRUE);
} else if (fmd_nvl_class_match(hdl, nvl, "ereport.fs.zfs.vdev.*")) {
zfs_case_solve(hdl, zcp, "fault.fs.zfs.device", B_TRUE);
} else if (fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_IO)) ||
fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_CHECKSUM)) ||
fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_IO_FAILURE)) ||
fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_PROBE_FAILURE))) {
char *failmode = NULL;
boolean_t checkremove = B_FALSE;
if (fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_IO))) {
if (zcp->zc_data.zc_serd_io[0] == '\0') {
zfs_serd_name(zcp->zc_data.zc_serd_io,
pool_guid, vdev_guid, "io");
fmd_serd_create(hdl, zcp->zc_data.zc_serd_io,
fmd_prop_get_int32(hdl, "io_N"),
fmd_prop_get_int64(hdl, "io_T"));
zfs_case_serialize(hdl, zcp);
}
if (fmd_serd_record(hdl, zcp->zc_data.zc_serd_io, ep))
checkremove = B_TRUE;
} else if (fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_CHECKSUM))) {
if (zcp->zc_data.zc_serd_checksum[0] == '\0') {
zfs_serd_name(zcp->zc_data.zc_serd_checksum,
pool_guid, vdev_guid, "checksum");
fmd_serd_create(hdl,
zcp->zc_data.zc_serd_checksum,
fmd_prop_get_int32(hdl, "checksum_N"),
fmd_prop_get_int64(hdl, "checksum_T"));
zfs_case_serialize(hdl, zcp);
}
if (fmd_serd_record(hdl,
zcp->zc_data.zc_serd_checksum, ep)) {
zfs_case_solve(hdl, zcp,
"fault.fs.zfs.vdev.checksum", B_FALSE);
}
} else if (fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_IO_FAILURE)) &&
(nvlist_lookup_string(nvl,
FM_EREPORT_PAYLOAD_ZFS_POOL_FAILMODE, &failmode) == 0) &&
failmode != NULL) {
if (strncmp(failmode, FM_EREPORT_FAILMODE_CONTINUE,
strlen(FM_EREPORT_FAILMODE_CONTINUE)) == 0) {
zfs_case_solve(hdl, zcp,
"fault.fs.zfs.io_failure_continue",
B_FALSE);
} else if (strncmp(failmode, FM_EREPORT_FAILMODE_WAIT,
strlen(FM_EREPORT_FAILMODE_WAIT)) == 0) {
zfs_case_solve(hdl, zcp,
"fault.fs.zfs.io_failure_wait", B_FALSE);
}
} else if (fmd_nvl_class_match(hdl, nvl,
ZFS_MAKE_EREPORT(FM_EREPORT_ZFS_PROBE_FAILURE))) {
if (zcp->zc_data.zc_serd_probe[0] == '\0') {
zfs_serd_name(zcp->zc_data.zc_serd_probe,
pool_guid, vdev_guid, "probe");
fmd_serd_create(hdl, zcp->zc_data.zc_serd_probe,
fmd_prop_get_int32(hdl, "probe_N"),
fmd_prop_get_int64(hdl, "probe_T"));
zfs_case_serialize(hdl, zcp);
}
if (!is_inactive_spare || fmd_serd_record(hdl,
zcp->zc_data.zc_serd_probe, ep)) {
checkremove = B_TRUE;
}
}
if (checkremove) {
if (zcp->zc_data.zc_has_remove_timer)
fmd_timer_remove(hdl, zcp->zc_remove_timer);
zcp->zc_remove_timer = fmd_timer_install(hdl, zcp, NULL,
zfs_remove_timeout);
if (!zcp->zc_data.zc_has_remove_timer) {
zcp->zc_data.zc_has_remove_timer = 1;
zfs_case_serialize(hdl, zcp);
}
}
}
}
static void
zfs_fm_timeout(fmd_hdl_t *hdl, id_t id, void *data)
{
zfs_case_t *zcp = data;
if (id == zcp->zc_remove_timer)
zfs_case_solve(hdl, zcp, "fault.fs.zfs.vdev.io", B_FALSE);
}
static void
zfs_fm_close(fmd_hdl_t *hdl, fmd_case_t *cs)
{
zfs_case_t *zcp = fmd_case_getspecific(hdl, cs);
if (zcp->zc_data.zc_serd_checksum[0] != '\0')
fmd_serd_destroy(hdl, zcp->zc_data.zc_serd_checksum);
if (zcp->zc_data.zc_serd_io[0] != '\0')
fmd_serd_destroy(hdl, zcp->zc_data.zc_serd_io);
if (zcp->zc_data.zc_serd_probe[0] != '\0')
fmd_serd_destroy(hdl, zcp->zc_data.zc_serd_probe);
if (zcp->zc_data.zc_has_remove_timer)
fmd_timer_remove(hdl, zcp->zc_remove_timer);
uu_list_remove(zfs_cases, zcp);
fmd_hdl_free(hdl, zcp, sizeof (zfs_case_t));
}
static void
zfs_fm_gc(fmd_hdl_t *hdl)
{
zfs_purge_cases(hdl);
}
static const fmd_hdl_ops_t fmd_ops = {
zfs_fm_recv,
zfs_fm_timeout,
zfs_fm_close,
NULL,
zfs_fm_gc,
};
static const fmd_prop_t fmd_props[] = {
{ "checksum_N", FMD_TYPE_UINT32, "10" },
{ "checksum_T", FMD_TYPE_TIME, "10min" },
{ "io_N", FMD_TYPE_UINT32, "10" },
{ "io_T", FMD_TYPE_TIME, "10min" },
{ "probe_N", FMD_TYPE_UINT32, "5" },
{ "probe_T", FMD_TYPE_TIME, "24hour" },
{ "remove_timeout", FMD_TYPE_TIME, "15sec" },
{ NULL, 0, NULL }
};
static const fmd_hdl_info_t fmd_info = {
"ZFS Diagnosis Engine", "1.0", &fmd_ops, fmd_props
};
void
_fmd_init(fmd_hdl_t *hdl)
{
fmd_case_t *cp;
libzfs_handle_t *zhdl;
if ((zhdl = libzfs_init()) == NULL)
return;
if ((zfs_case_pool = uu_list_pool_create("zfs_case_pool",
sizeof (zfs_case_t), offsetof(zfs_case_t, zc_node),
NULL, 0)) == NULL) {
libzfs_fini(zhdl);
return;
}
if ((zfs_cases = uu_list_create(zfs_case_pool, NULL, 0)) == NULL) {
uu_list_pool_destroy(zfs_case_pool);
libzfs_fini(zhdl);
return;
}
if (fmd_hdl_register(hdl, FMD_API_VERSION, &fmd_info) != 0) {
uu_list_destroy(zfs_cases);
uu_list_pool_destroy(zfs_case_pool);
libzfs_fini(zhdl);
return;
}
fmd_hdl_setspecific(hdl, zhdl);
(void) fmd_stat_create(hdl, FMD_STAT_NOALLOC, sizeof (zfs_stats) /
sizeof (fmd_stat_t), (fmd_stat_t *)&zfs_stats);
for (cp = fmd_case_next(hdl, NULL);
cp != NULL; cp = fmd_case_next(hdl, cp))
(void) zfs_case_unserialize(hdl, cp);
zfs_purge_cases(hdl);
zfs_remove_timeout = fmd_prop_get_int64(hdl, "remove_timeout");
}
void
_fmd_fini(fmd_hdl_t *hdl)
{
zfs_case_t *zcp;
uu_list_walk_t *walk;
libzfs_handle_t *zhdl;
walk = uu_list_walk_start(zfs_cases, UU_WALK_ROBUST);
while ((zcp = uu_list_walk_next(walk)) != NULL) {
uu_list_remove(zfs_cases, zcp);
fmd_hdl_free(hdl, zcp, sizeof (zfs_case_t));
}
uu_list_walk_end(walk);
uu_list_destroy(zfs_cases);
uu_list_pool_destroy(zfs_case_pool);
zhdl = fmd_hdl_getspecific(hdl);
libzfs_fini(zhdl);
}