#include <cma.h>
#include <time.h>
#include <errno.h>
#include <unistd.h>
#include <strings.h>
#include <fm/fmd_api.h>
#include <fm/libtopo.h>
#include <fm/fmd_fmri.h>
#include <fm/fmd_agent.h>
#include <sys/fm/protocol.h>
static void
cma_page_free(fmd_hdl_t *hdl, cma_page_t *page)
{
nvlist_free(page->pg_asru);
nvlist_free(page->pg_rsrc);
fmd_hdl_free(hdl, page, sizeof (cma_page_t));
}
int
cma_page_retire(fmd_hdl_t *hdl, nvlist_t *nvl, nvlist_t *asru,
const char *uuid, boolean_t repair)
{
cma_page_t *page;
uint64_t pageaddr;
const char *action = repair ? "unretire" : "retire";
int rc;
nvlist_t *rsrc = NULL, *asrucp = NULL, *hcsp;
(void) nvlist_lookup_nvlist(nvl, FM_FAULT_RESOURCE, &rsrc);
if (nvlist_dup(asru, &asrucp, 0) != 0) {
fmd_hdl_debug(hdl, "page retire nvlist dup failed\n");
return (CMA_RA_FAILURE);
}
if (fmd_nvl_fmri_expand(hdl, asrucp) < 0) {
fmd_hdl_debug(hdl, "failed to expand page asru\n");
cma_stats.bad_flts.fmds_value.ui64++;
nvlist_free(asrucp);
return (CMA_RA_FAILURE);
}
if (!repair && !fmd_nvl_fmri_present(hdl, asrucp)) {
fmd_hdl_debug(hdl, "page retire overtaken by events\n");
cma_stats.page_nonent.fmds_value.ui64++;
nvlist_free(asrucp);
return (CMA_RA_SUCCESS);
}
if (rsrc == NULL ||
nvlist_lookup_nvlist(rsrc, FM_FMRI_HC_SPECIFIC, &hcsp) != 0 ||
(nvlist_lookup_uint64(hcsp, "asru-" FM_FMRI_HC_SPECIFIC_PHYSADDR,
&pageaddr) != 0 && nvlist_lookup_uint64(hcsp,
FM_FMRI_HC_SPECIFIC_PHYSADDR, &pageaddr) != 0)) {
if (nvlist_lookup_uint64(asrucp, FM_FMRI_MEM_PHYSADDR,
&pageaddr) != 0) {
fmd_hdl_debug(hdl, "mem fault missing 'physaddr'\n");
cma_stats.bad_flts.fmds_value.ui64++;
nvlist_free(asrucp);
return (CMA_RA_FAILURE);
}
}
if (repair) {
if (!cma.cma_page_dounretire) {
fmd_hdl_debug(hdl, "suppressed unretire of page %llx\n",
(u_longlong_t)pageaddr);
cma_stats.page_supp.fmds_value.ui64++;
nvlist_free(asrucp);
return (CMA_RA_SUCCESS);
}
if (rsrc == NULL || (rc = fmd_nvl_fmri_unretire(hdl, rsrc)) < 0)
rc = cma_fmri_page_unretire(hdl, asrucp);
} else {
if (!cma.cma_page_doretire) {
fmd_hdl_debug(hdl, "suppressed retire of page %llx\n",
(u_longlong_t)pageaddr);
cma_stats.page_supp.fmds_value.ui64++;
nvlist_free(asrucp);
return (CMA_RA_FAILURE);
}
if (rsrc == NULL || (rc = fmd_nvl_fmri_retire(hdl, rsrc)) < 0)
rc = cma_fmri_page_retire(hdl, asrucp);
}
if (rc == FMD_AGENT_RETIRE_DONE) {
fmd_hdl_debug(hdl, "%sd page 0x%llx\n",
action, (u_longlong_t)pageaddr);
if (repair)
cma_stats.page_repairs.fmds_value.ui64++;
else
cma_stats.page_flts.fmds_value.ui64++;
nvlist_free(asrucp);
return (CMA_RA_SUCCESS);
} else if (repair || rc != FMD_AGENT_RETIRE_ASYNC) {
fmd_hdl_debug(hdl, "%s of page 0x%llx failed, will not "
"retry: %s\n", action, (u_longlong_t)pageaddr,
strerror(errno));
cma_stats.page_fails.fmds_value.ui64++;
nvlist_free(asrucp);
return (CMA_RA_FAILURE);
}
fmd_hdl_debug(hdl, "page didn't retire - sleeping\n");
page = fmd_hdl_zalloc(hdl, sizeof (cma_page_t), FMD_SLEEP);
page->pg_addr = pageaddr;
if (rsrc != NULL)
(void) nvlist_dup(rsrc, &page->pg_rsrc, 0);
page->pg_asru = asrucp;
if (uuid != NULL)
page->pg_uuid = fmd_hdl_strdup(hdl, uuid, FMD_SLEEP);
page->pg_next = cma.cma_pages;
cma.cma_pages = page;
if (cma.cma_page_timerid != 0)
fmd_timer_remove(hdl, cma.cma_page_timerid);
cma.cma_page_curdelay = cma.cma_page_mindelay;
cma.cma_page_timerid =
fmd_timer_install(hdl, NULL, NULL, cma.cma_page_curdelay);
return (CMA_RA_FAILURE);
}
static int
page_retry(fmd_hdl_t *hdl, cma_page_t *page)
{
int rc;
if (page->pg_asru != NULL &&
!fmd_nvl_fmri_present(hdl, page->pg_asru)) {
fmd_hdl_debug(hdl, "page retire overtaken by events");
cma_stats.page_nonent.fmds_value.ui64++;
if (page->pg_uuid != NULL)
fmd_case_uuclose(hdl, page->pg_uuid);
return (1);
}
if (page->pg_rsrc == NULL ||
(rc = fmd_nvl_fmri_service_state(hdl, page->pg_rsrc)) < 0)
rc = cma_fmri_page_service_state(hdl, page->pg_asru);
if (rc == FMD_SERVICE_STATE_UNUSABLE) {
fmd_hdl_debug(hdl, "retired page 0x%llx on retry %u\n",
page->pg_addr, page->pg_nretries);
cma_stats.page_flts.fmds_value.ui64++;
if (page->pg_uuid != NULL)
fmd_case_uuclose(hdl, page->pg_uuid);
return (1);
}
if (rc == FMD_SERVICE_STATE_ISOLATE_PENDING) {
fmd_hdl_debug(hdl, "scheduling another retry for 0x%llx\n",
page->pg_addr);
return (0);
} else {
fmd_hdl_debug(hdl, "failed to retry page 0x%llx "
"retirement: %s\n", page->pg_addr,
strerror(errno));
cma_stats.page_fails.fmds_value.ui64++;
return (1);
}
}
void
cma_page_retry(fmd_hdl_t *hdl)
{
cma_page_t **pagep;
cma.cma_page_timerid = 0;
fmd_hdl_debug(hdl, "page_retry: timer fired\n");
pagep = &cma.cma_pages;
while (*pagep != NULL) {
cma_page_t *page = *pagep;
if (page_retry(hdl, page)) {
*pagep = page->pg_next;
if (page->pg_uuid != NULL)
fmd_hdl_strfree(hdl, page->pg_uuid);
cma_page_free(hdl, page);
} else {
page->pg_nretries++;
pagep = &page->pg_next;
}
}
if (cma.cma_pages == NULL)
return;
cma.cma_page_curdelay = MIN(cma.cma_page_curdelay * 2,
cma.cma_page_maxdelay);
fmd_hdl_debug(hdl, "scheduled page retirement retry for %llu secs\n",
(u_longlong_t)(cma.cma_page_curdelay / NANOSEC));
cma.cma_page_timerid =
fmd_timer_install(hdl, NULL, NULL, cma.cma_page_curdelay);
}
void
cma_page_fini(fmd_hdl_t *hdl)
{
cma_page_t *page;
while ((page = cma.cma_pages) != NULL) {
cma.cma_pages = page->pg_next;
if (page->pg_uuid != NULL)
fmd_hdl_strfree(hdl, page->pg_uuid);
cma_page_free(hdl, page);
}
}