/* * CDDL HEADER START * * The contents of this file are subject to the terms of the * Common Development and Distribution License, Version 1.0 only * (the "License"). You may not use this file except in compliance * with the License. * * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE * or http://www.opensolaris.org/os/licensing. * See the License for the specific language governing permissions * and limitations under the License. * * When distributing Covered Code, include this CDDL HEADER in each * file and include the License file at usr/src/OPENSOLARIS.LICENSE. * If applicable, add the following below this CDDL HEADER, with the * fields enclosed by brackets "[]" replaced with your own identifying * information: Portions Copyright [yyyy] [name of copyright owner] * * CDDL HEADER END */ /* * Copyright 2005 Sun Microsystems, Inc. All rights reserved. * Use is subject to license terms. */ #pragma ident "%Z%%M% %I% %E% SMI" #include #include #include #include #include #include #include #include /* * The scheme plugin for mem FMRIs. */ mem_t mem; /* * Retry values for handling the case where the kernel is not yet ready * to provide DIMM serial ids. Some platforms acquire DIMM serial id * information from their System Controller via a mailbox interface. * The values chosen are for 10 retries 3 seconds apart to approximate the * possible 30 second timeout length of a mailbox message request. */ #define MAX_MEM_SID_RETRIES 10 #define MEM_SID_RETRY_WAIT 3 static mem_dimm_map_t * dm_lookup(const char *name) { mem_dimm_map_t *dm; for (dm = mem.mem_dm; dm != NULL; dm = dm->dm_next) { if (strcmp(name, dm->dm_label) == 0) return (dm); } return (NULL); } /* * Returns 0 with serial numbers if found, -1 (with errno set) for errors. If * the unum (or a component of same) wasn't found, -1 is returned with errno * set to ENOENT. If the kernel doesn't have support for serial numbers, * -1 is returned with errno set to ENOTSUP. */ static int mem_get_serids_from_kernel(const char *unum, char ***seridsp, size_t *nseridsp) { char **dimms, **serids; size_t ndimms, nserids; int i, rc = 0; int fd; int retries = MAX_MEM_SID_RETRIES; mem_name_t mn; struct timespec rqt; if ((fd = open("/dev/mem", O_RDONLY)) < 0) return (-1); if (mem_unum_burst(unum, &dimms, &ndimms) < 0) { (void) close(fd); return (-1); /* errno is set for us */ } serids = fmd_fmri_zalloc(sizeof (char *) * ndimms); nserids = ndimms; bzero(&mn, sizeof (mn)); for (i = 0; i < ndimms; i++) { mn.m_namelen = strlen(dimms[i]) + 1; mn.m_sidlen = MEM_SERID_MAXLEN; mn.m_name = fmd_fmri_alloc(mn.m_namelen); mn.m_sid = fmd_fmri_alloc(mn.m_sidlen); (void) strcpy(mn.m_name, dimms[i]); do { rc = ioctl(fd, MEM_SID, &mn); if (rc >= 0 || errno != EAGAIN) break; if (retries == 0) { errno = ETIMEDOUT; break; } /* * EAGAIN indicates the kernel is * not ready to provide DIMM serial * ids. Sleep MEM_SID_RETRY_WAIT seconds * and try again. * nanosleep() is used instead of sleep() * to avoid interfering with fmd timers. */ rqt.tv_sec = MEM_SID_RETRY_WAIT; rqt.tv_nsec = 0; (void) nanosleep(&rqt, NULL); } while (retries--); if (rc < 0) { /* * ENXIO can happen if the kernel memory driver * doesn't have the MEM_SID ioctl (e.g. if the * kernel hasn't been patched to provide the * support). * * If the MEM_SID ioctl is available but the * particular platform doesn't support providing * serial ids, ENOTSUP will be returned by the ioctl. */ if (errno == ENXIO) errno = ENOTSUP; fmd_fmri_free(mn.m_name, mn.m_namelen); fmd_fmri_free(mn.m_sid, mn.m_sidlen); mem_strarray_free(serids, nserids); mem_strarray_free(dimms, ndimms); (void) close(fd); return (-1); } serids[i] = fmd_fmri_strdup(mn.m_sid); fmd_fmri_free(mn.m_name, mn.m_namelen); fmd_fmri_free(mn.m_sid, mn.m_sidlen); } mem_strarray_free(dimms, ndimms); (void) close(fd); *seridsp = serids; *nseridsp = nserids; return (0); } /* * Returns 0 with serial numbers if found, -1 (with errno set) for errors. If * the unum (or a component of same) wasn't found, -1 is returned with errno * set to ENOENT. */ static int mem_get_serids_from_cache(const char *unum, char ***seridsp, size_t *nseridsp) { uint64_t drgen = fmd_fmri_get_drgen(); char **dimms, **serids; size_t ndimms, nserids; mem_dimm_map_t *dm; int i, rc = 0; if (mem_unum_burst(unum, &dimms, &ndimms) < 0) return (-1); /* errno is set for us */ serids = fmd_fmri_zalloc(sizeof (char *) * ndimms); nserids = ndimms; for (i = 0; i < ndimms; i++) { if ((dm = dm_lookup(dimms[i])) == NULL) { rc = fmd_fmri_set_errno(EINVAL); break; } if (*dm->dm_serid == '\0' || dm->dm_drgen != drgen) { /* * We don't have a cached copy, or the copy we've got is * out of date. Look it up again. */ if (mem_get_serid(dm->dm_device, dm->dm_serid, sizeof (dm->dm_serid)) < 0) { rc = -1; /* errno is set for us */ break; } dm->dm_drgen = drgen; } serids[i] = fmd_fmri_strdup(dm->dm_serid); } mem_strarray_free(dimms, ndimms); if (rc == 0) { *seridsp = serids; *nseridsp = nserids; } else { mem_strarray_free(serids, nserids); } return (rc); } static int mem_get_serids_by_unum(const char *unum, char ***seridsp, size_t *nseridsp) { /* * Some platforms do not support the caching of serial ids by the * mem scheme plugin but instead support making serial ids available * via the kernel. */ if (mem.mem_dm == NULL) return (mem_get_serids_from_kernel(unum, seridsp, nseridsp)); else return (mem_get_serids_from_cache(unum, seridsp, nseridsp)); } static int mem_fmri_get_unum(nvlist_t *nvl, char **unump) { uint8_t version; char *unum; if (nvlist_lookup_uint8(nvl, FM_VERSION, &version) != 0 || version > FM_MEM_SCHEME_VERSION || nvlist_lookup_string(nvl, FM_FMRI_MEM_UNUM, &unum) != 0) return (fmd_fmri_set_errno(EINVAL)); *unump = unum; return (0); } ssize_t fmd_fmri_nvl2str(nvlist_t *nvl, char *buf, size_t buflen) { const char *fmt = "mem:///component=%1$s"; ssize_t size, presz; uint64_t pa; char *rawunum, *preunum, *escunum; int i; if (mem_fmri_get_unum(nvl, &rawunum) < 0) return (-1); /* errno is set for us */ if (nvlist_lookup_uint64(nvl, FM_FMRI_MEM_PHYSADDR, &pa) == 0) fmt = "mem:///pa=%2$llx/component=%1$s"; /* * If we leave the unum as-is, the spaces and colons will be escaped, * rendering the resulting FMRI pretty much unreadable. We're therefore * going to do some escaping of our own first. */ preunum = fmd_fmri_strdup(rawunum); presz = strlen(preunum) + 1; for (i = 0; i < presz - 1; i++) { if (preunum[i] == ':' && preunum[i + 1] == ' ') { bcopy(preunum + i + 2, preunum + i + 1, presz - (i + 2)); } else if (preunum[i] == ' ') { preunum[i] = ','; } } escunum = fmd_fmri_strescape(preunum); fmd_fmri_free(preunum, presz); size = snprintf(buf, buflen, fmt, escunum, (u_longlong_t)pa); fmd_fmri_strfree(escunum); return (size); } int fmd_fmri_expand(nvlist_t *nvl) { char *unum, **serids; uint_t nserids; int rc; if (mem_fmri_get_unum(nvl, &unum) < 0) return (fmd_fmri_set_errno(EINVAL)); if ((rc = nvlist_lookup_string_array(nvl, FM_FMRI_MEM_SERIAL_ID, &serids, &nserids)) == 0) return (0); /* fmri is already expanded */ else if (rc != ENOENT) return (fmd_fmri_set_errno(EINVAL)); if (mem_get_serids_by_unum(unum, &serids, &nserids) < 0) { /* errno is set for us */ if (errno == ENOTSUP) return (0); /* nothing to add - no s/n support */ else return (-1); } rc = nvlist_add_string_array(nvl, FM_FMRI_MEM_SERIAL_ID, serids, nserids); mem_strarray_free(serids, nserids); if (rc != 0) return (fmd_fmri_set_errno(EINVAL)); return (0); } static int serids_eq(char **serids1, uint_t nserids1, char **serids2, uint_t nserids2) { int i; if (nserids1 != nserids2) return (0); for (i = 0; i < nserids1; i++) { if (strcmp(serids1[i], serids2[i]) != 0) return (0); } return (1); } int fmd_fmri_present(nvlist_t *nvl) { char *unum, **nvlserids, **serids; uint_t nnvlserids, nserids; uint64_t memconfig; int rc; if (mem_fmri_get_unum(nvl, &unum) < 0) return (-1); /* errno is set for us */ if (nvlist_lookup_string_array(nvl, FM_FMRI_MEM_SERIAL_ID, &nvlserids, &nnvlserids) != 0) { /* * Some mem scheme FMRIs don't have serial ids because * either the platform does not support them, or because * the FMRI was created before support for serial ids was * introduced. If this is the case, assume it is there. */ if (mem.mem_dm == NULL) return (1); else return (fmd_fmri_set_errno(EINVAL)); } /* * Hypervisor will change the memconfig value when the mapping of * pages to DIMMs changes, e.g. for change in DIMM size or interleave. * If we detect such a change, we discard ereports associated with a * previous memconfig value as invalid. */ if ((nvlist_lookup_uint64(nvl, FM_FMRI_MEM_MEMCONFIG, &memconfig) == 0) && memconfig != mem.mem_memconfig) return (0); if (mem_get_serids_by_unum(unum, &serids, &nserids) < 0) { if (errno == ENOTSUP) return (1); /* assume it's there, no s/n support here */ if (errno != ENOENT) { /* * Errors are only signalled to the caller if they're * the caller's fault. This isn't - it's a failure on * our part to burst or read the serial numbers. We'll * whine about it, and tell the caller the named * module(s) isn't/aren't there. */ fmd_fmri_warn("failed to retrieve serial number for " "unum %s", unum); } return (0); } rc = serids_eq(serids, nserids, nvlserids, nnvlserids); mem_strarray_free(serids, nserids); return (rc); } int fmd_fmri_contains(nvlist_t *er, nvlist_t *ee) { char *erunum, *eeunum; uint64_t erpa = 0, eepa = 0; if (mem_fmri_get_unum(er, &erunum) < 0 || mem_fmri_get_unum(ee, &eeunum) < 0) return (-1); /* errno is set for us */ if (mem_unum_contains(erunum, eeunum) <= 0) return (0); /* can't parse/match, so assume no containment */ if (nvlist_lookup_uint64(er, FM_FMRI_MEM_PHYSADDR, &erpa) == 0) { /* container has a PA; only match if containee has same PA */ return (nvlist_lookup_uint64(ee, FM_FMRI_MEM_PHYSADDR, &eepa) == 0 && erpa == eepa); } return (1); } int fmd_fmri_unusable(nvlist_t *nvl) { uint64_t pageaddr; uint8_t version; int rc, err; /* * We can only make a usable/unusable determination for pages. FMRIs * without page addresses will be reported as usable. */ if (nvlist_lookup_uint8(nvl, FM_VERSION, &version) != 0 || version > FM_MEM_SCHEME_VERSION) return (fmd_fmri_set_errno(EINVAL)); if ((err = nvlist_lookup_uint64(nvl, FM_FMRI_MEM_PHYSADDR, &pageaddr)) == ENOENT) return (0); /* no page, so assume it's still usable */ else if (err != 0) return (fmd_fmri_set_errno(EINVAL)); if ((rc = mem_page_cmd(MEM_PAGE_FMRI_ISRETIRED, nvl)) < 0 && errno == EIO) { return (0); /* the page wonders, "why all the fuss?" */ } else if (rc == 0 || errno == EAGAIN || errno == EINVAL) { /* * The page has been retired, is in the process of being * retired, or doesn't exist. The latter is valid if the page * existed in the past but has been DR'd out. */ return (1); } else { /* * Errors are only signalled to the caller if they're the * caller's fault. This isn't - it's a failure of the * retirement-check code. We'll whine about it and tell * the caller the page is unusable. */ fmd_fmri_warn("failed to determine usability of page %llx", pageaddr); return (1); } } int fmd_fmri_init(void) { bzero(&mem, sizeof (mem_t)); return (mem_discover()); } void fmd_fmri_fini(void) { mem_destroy(); }