cmi.c revision e4b86885570d77af552e9cf94f142f4d744fb8c8
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * CDDL HEADER START
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * The contents of this file are subject to the terms of the
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * Common Development and Distribution License (the "License").
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * You may not use this file except in compliance with the License.
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * See the License for the specific language governing permissions
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * and limitations under the License.
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * When distributing Covered Code, include this CDDL HEADER in each
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * If applicable, add the following below this CDDL HEADER, with the
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * fields enclosed by brackets "[]" replaced with your own identifying
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * information: Portions Copyright [yyyy] [name of copyright owner]
3ad553a7dabf3c8bcb69dd1ceeb13938fa526aedgavinm * CDDL HEADER END
e3d60c9bd991a9826cbfa63b10595d44e123b9c4Adrian Frost * Copyright 2008 Sun Microsystems, Inc. All rights reserved.
7aec1d6e253b21f9e9b7ef68b4d81ab9859b51fecindi * Use is subject to license terms.
7aec1d6e253b21f9e9b7ef68b4d81ab9859b51fecindi * Public interface to routines implemented by CPU modules
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Set to force cmi_init to fail.
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Set to avoid MCA initialization.
8a40a695ee676a322b094e9afe5375567bfb51e3gavinm * If cleared for debugging we will not attempt to load a model-specific
8a40a695ee676a322b094e9afe5375567bfb51e3gavinm * cpu module but will load the generic cpu module instead.
7aec1d6e253b21f9e9b7ef68b4d81ab9859b51fecindi * If cleared for debugging, we will suppress panicking on fatal hardware
7aec1d6e253b21f9e9b7ef68b4d81ab9859b51fecindi * errors. This should *only* be used for debugging; its use can and will
7aec1d6e253b21f9e9b7ef68b4d81ab9859b51fecindi * cause data corruption if actual hardware errors are detected by the system.
e3d60c9bd991a9826cbfa63b10595d44e123b9c4Adrian Frost * Set to indicate whether we are able to enable the CMCI interrupt.
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Subdirectory (relative to the module search path) in which we will
20c794b39650d115e17a15983b6b82e46238cf45gavinm * look for cpu modules.
20c794b39650d115e17a15983b6b82e46238cf45gavinm * CPU modules have filenames such as "cpu.AuthenticAMD.15" and
20c794b39650d115e17a15983b6b82e46238cf45gavinm * "cpu.generic" - the "cpu" prefix is specified by the following.
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Structure used to keep track of cpu modules we have loaded and their ops
20c794b39650d115e17a15983b6b82e46238cf45gavinmtypedef struct cmi {
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Functions we need from cmi_hw.c that are not part of the cpu_module.h
20c794b39650d115e17a15983b6b82e46238cf45gavinm * interface.
e4b86885570d77af552e9cf94f142f4d744fb8c8Cheng Sean Yeextern cmi_hdl_t cmi_hdl_create(enum cmi_hdl_class, uint_t, uint_t, uint_t);
20c794b39650d115e17a15983b6b82e46238cf45gavinmextern void cmi_hdl_setcmi(cmi_hdl_t, void *, void *);
20c794b39650d115e17a15983b6b82e46238cf45gavinmextern void cmi_hdl_setmc(cmi_hdl_t, const struct cmi_mc_ops *, void *);
20c794b39650d115e17a15983b6b82e46238cf45gavinm#define CMI_OP_PRESENT(cmi, op) ((cmi) && CMI_OPS(cmi)->op != NULL)
20c794b39650d115e17a15983b6b82e46238cf45gavinm#define CMI_MATCH_STEPPING 3 /* Match down to stepping */
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Hold the module in memory. We call to CPU modules without using the
20c794b39650d115e17a15983b6b82e46238cf45gavinm * stubs mechanism, so these modules must be manually held in memory.
20c794b39650d115e17a15983b6b82e46238cf45gavinm * The mod_ref acts as if another loaded module has a dependency on us.
20c794b39650d115e17a15983b6b82e46238cf45gavinm if ((ops = (cmi_ops_t *)modlookup_by_modctl(modp, "_cmi_ops")) ==
20c794b39650d115e17a15983b6b82e46238cf45gavinm cmn_err(CE_WARN, "cpu module '%s' is invalid: no _cmi_ops "
20c794b39650d115e17a15983b6b82e46238cf45gavinm cmn_err(CE_WARN, "cpu module '%s' is invalid: no cmi_init "
7aec1d6e253b21f9e9b7ef68b4d81ab9859b51fecindi for (cmi = cmi_list; cmi != NULL; cmi = cmi->cmi_next) {
20c794b39650d115e17a15983b6b82e46238cf45gavinm if ((ver = modlookup_by_modctl(modp, "_cmi_api_version")) == NULL) {
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Apparently a cpu module before versioning was introduced -
20c794b39650d115e17a15983b6b82e46238cf45gavinm * we call this version 0.
20c794b39650d115e17a15983b6b82e46238cf45gavinm "_cmi_api_version 0x%x has bad magic",
20c794b39650d115e17a15983b6b82e46238cf45gavinm cmn_err(CE_WARN, "cpu module '%s' has API version %d, "
20c794b39650d115e17a15983b6b82e46238cf45gavinmcmi_cpu_match(cmi_hdl_t hdl1, cmi_hdl_t hdl2, int match)
20c794b39650d115e17a15983b6b82e46238cf45gavinm return (0);
20c794b39650d115e17a15983b6b82e46238cf45gavinm return (0);
20c794b39650d115e17a15983b6b82e46238cf45gavinm return (0);
20c794b39650d115e17a15983b6b82e46238cf45gavinm return (0);
20c794b39650d115e17a15983b6b82e46238cf45gavinm return (1);
20c794b39650d115e17a15983b6b82e46238cf45gavinmcmi_search_list_cb(cmi_hdl_t whdl, void *arg1, void *arg2, void *arg3)
20c794b39650d115e17a15983b6b82e46238cf45gavinm cmi_hdl_walk(cmi_search_list_cb, (void *)hdl, (void *)&match, &dhdl);
20c794b39650d115e17a15983b6b82e46238cf45gavinmcmi_load_module(cmi_hdl_t hdl, int match, int *chosenp)
20c794b39650d115e17a15983b6b82e46238cf45gavinm ASSERT(match == CMI_MATCH_STEPPING || match == CMI_MATCH_MODEL ||
20c794b39650d115e17a15983b6b82e46238cf45gavinm match == CMI_MATCH_FAMILY || match == CMI_MATCH_VENDOR);
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Have we already loaded a module for a cpu with the same
7aec1d6e253b21f9e9b7ef68b4d81ab9859b51fecindi modid = modload_qualified(CPUMOD_SUBDIR, CPUMOD_PREFIX,
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Try to load a cpu module with specific support for this chip type.
20c794b39650d115e17a15983b6b82e46238cf45gavinm for (i = CMI_MATCH_STEPPING; i >= CMI_MATCH_VENDOR; i--) {
20c794b39650d115e17a15983b6b82e46238cf45gavinm if ((cmi = cmi_load_module(hdl, i, &suffixlevel)) == NULL)
20c794b39650d115e17a15983b6b82e46238cf45gavinm * A module has loaded and has a _cmi_ops structure, and the
20c794b39650d115e17a15983b6b82e46238cf45gavinm * module has been held for this instance. Call its cmi_init
20c794b39650d115e17a15983b6b82e46238cf45gavinm * entry point - we expect success (0) or ENOTSUP.
20c794b39650d115e17a15983b6b82e46238cf45gavinm if ((err = cmi->cmi_ops->cmi_init(hdl, datap)) == 0) {
20c794b39650d115e17a15983b6b82e46238cf45gavinm "chip %d core %d strand %d\n",
20c794b39650d115e17a15983b6b82e46238cf45gavinm cmn_err(CE_WARN, "failed to init cpu module '%s' on "
20c794b39650d115e17a15983b6b82e46238cf45gavinm "chip %d core %d strand %d: err=%d\n",
20c794b39650d115e17a15983b6b82e46238cf45gavinm * The module failed or declined to init, so release
20c794b39650d115e17a15983b6b82e46238cf45gavinm * it and update i to be equal to the number
20c794b39650d115e17a15983b6b82e46238cf45gavinm * of suffixes actually used in the last module path.
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Load the generic IA32 MCA cpu module, which may still supplement
20c794b39650d115e17a15983b6b82e46238cf45gavinm * itself with model-specific support through cpu model-specific modules.
7aec1d6e253b21f9e9b7ef68b4d81ab9859b51fecindi if ((modid = modload(CPUMOD_SUBDIR, CPUMOD_PREFIX ".generic")) == -1)
20c794b39650d115e17a15983b6b82e46238cf45gavinm if ((err = cmi->cmi_ops->cmi_init(hdl, datap)) != 0) {
20c794b39650d115e17a15983b6b82e46238cf45gavinmcmi_init(enum cmi_hdl_class class, uint_t chipid, uint_t coreid,
e4b86885570d77af552e9cf94f142f4d744fb8c8Cheng Sean Ye if ((hdl = cmi_hdl_create(class, chipid, coreid, strandid)) == NULL) {
20c794b39650d115e17a15983b6b82e46238cf45gavinm cmn_err(CE_WARN, "There will be no MCA support on chip %d "
20c794b39650d115e17a15983b6b82e46238cf45gavinm "core %d strand %d (cmi_hdl_create returned NULL)\n",
20c794b39650d115e17a15983b6b82e46238cf45gavinm if (cmi == NULL && (cmi = cmi_load_generic(hdl, &data)) == NULL) {
20c794b39650d115e17a15983b6b82e46238cf45gavinm cmn_err(CE_WARN, "There will be no MCA support on chip %d "
20c794b39650d115e17a15983b6b82e46238cf45gavinm * cmi_fini is not called at the moment. It is intended to be called
20c794b39650d115e17a15983b6b82e46238cf45gavinm * on DR deconfigure of a cpu resource. It should not be called at
20c794b39650d115e17a15983b6b82e46238cf45gavinm * simple offline of a cpu.
20c794b39650d115e17a15983b6b82e46238cf45gavinm cmi_hdl_rele(hdl); /* release hold obtained in cmi_hdl_create */
e4b86885570d77af552e9cf94f142f4d744fb8c8Cheng Sean Ye * cmi_post_startup is called from post_startup for the boot cpu only (no
e4b86885570d77af552e9cf94f142f4d744fb8c8Cheng Sean Ye * other cpus are started yet).
8a40a695ee676a322b094e9afe5375567bfb51e3gavinm * Called just once from start_other_cpus when all processors are started.
8a40a695ee676a322b094e9afe5375567bfb51e3gavinm * This will not be called for each cpu, so the registered op must not
e4b86885570d77af552e9cf94f142f4d744fb8c8Cheng Sean Ye * assume it is called as such. We are not necessarily executing on
e4b86885570d77af552e9cf94f142f4d744fb8c8Cheng Sean Ye * the boot cpu.
20c794b39650d115e17a15983b6b82e46238cf45gavinm#define CMI_RESPONSE_PANIC 0x0 /* panic must have value 0 */
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Return 0 if we will panic in response to this machine check, otherwise
20c794b39650d115e17a15983b6b82e46238cf45gavinm * non-zero. If the caller is cmi_mca_trap in this file then the nonzero
20c794b39650d115e17a15983b6b82e46238cf45gavinm * return values are to be interpreted from CMI_RESPONSE_* above.
20c794b39650d115e17a15983b6b82e46238cf45gavinm * This function must just return what will be done without actually
20c794b39650d115e17a15983b6b82e46238cf45gavinm * doing anything; this includes not changing the regs.
20c794b39650d115e17a15983b6b82e46238cf45gavinm int panicrsp = cmi_panic_on_uncorrectable_error ? CMI_RESPONSE_PANIC :
20c794b39650d115e17a15983b6b82e46238cf45gavinm ASSERT(rp != NULL); /* don't call for polling, only on #MC */
20c794b39650d115e17a15983b6b82e46238cf45gavinm * If no bits are set in the disposition then there is nothing to
20c794b39650d115e17a15983b6b82e46238cf45gavinm * worry about and we do not need to trampoline to ontrap or
20c794b39650d115e17a15983b6b82e46238cf45gavinm * lofault handlers.
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Unconstrained errors cannot be forgiven, even by ontrap or
20c794b39650d115e17a15983b6b82e46238cf45gavinm * lofault protection. The data is not poisoned and may not
20c794b39650d115e17a15983b6b82e46238cf45gavinm * even belong to the trapped context - eg a writeback of
20c794b39650d115e17a15983b6b82e46238cf45gavinm * data that is found to be bad.
20c794b39650d115e17a15983b6b82e46238cf45gavinm * ontrap OT_DATA_EC and lofault protection forgive any disposition
20c794b39650d115e17a15983b6b82e46238cf45gavinm * other than unconstrained, even those normally forced fatal.
20c794b39650d115e17a15983b6b82e46238cf45gavinm if ((otp = curthread->t_ontrap) != NULL && otp->ot_prot & OT_DATA_EC)
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Forced-fatal errors are terminal even in user mode.
20c794b39650d115e17a15983b6b82e46238cf45gavinm * If the trapped context is corrupt or we have no instruction pointer
20c794b39650d115e17a15983b6b82e46238cf45gavinm * to resume at (and aren't trampolining to a fault handler)
20c794b39650d115e17a15983b6b82e46238cf45gavinm * then in the kernel case we must panic and in usermode we
20c794b39650d115e17a15983b6b82e46238cf45gavinm * kill the affected contract.
20c794b39650d115e17a15983b6b82e46238cf45gavinm if (disp & (CMI_ERRDISP_CURCTXBAD | CMI_ERRDISP_RIPV_INVALID))
20c794b39650d115e17a15983b6b82e46238cf45gavinm return (USERMODE(rp->r_cs) ? CMI_RESPONSE_CKILL : panicrsp);
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Anything else is harmless
20c794b39650d115e17a15983b6b82e46238cf45gavinm cmn_err(CE_WARN, "suppressing panic from fatal #mc");
20c794b39650d115e17a15983b6b82e46238cf45gavinm * Native #MC handler - we branch to here from mcetrap
20c794b39650d115e17a15983b6b82e46238cf45gavinm/*ARGSUSED*/
20c794b39650d115e17a15983b6b82e46238cf45gavinm * This function can call cmn_err, and the cpu module cmi_mca_trap
20c794b39650d115e17a15983b6b82e46238cf45gavinm * entry point may also elect to call cmn_err (e.g., if it can't
20c794b39650d115e17a15983b6b82e46238cf45gavinm * log the error onto an errorq, say very early in boot).
20c794b39650d115e17a15983b6b82e46238cf45gavinm * We need to let cprintf know that we must not block.
20c794b39650d115e17a15983b6b82e46238cf45gavinm if ((hdl = cmi_hdl_lookup(CMI_HDL_NATIVE, cmi_ntv_hwchipid(CPU),
20c794b39650d115e17a15983b6b82e46238cf45gavinm cmi_ntv_hwcoreid(CPU), cmi_ntv_hwstrandid(CPU))) == NULL ||
20c794b39650d115e17a15983b6b82e46238cf45gavinm "handle lookup failed");
20c794b39650d115e17a15983b6b82e46238cf45gavinm cmn_err(CE_WARN, "Invalid response from cmi_mce_response");
20c794b39650d115e17a15983b6b82e46238cf45gavinm /*FALLTHRU*/
20c794b39650d115e17a15983b6b82e46238cf45gavinm#endif /* __xpv */
e3d60c9bd991a9826cbfa63b10595d44e123b9c4Adrian Frost if ((hdl = cmi_hdl_lookup(CMI_HDL_NATIVE, cmi_ntv_hwchipid(CPU),
e3d60c9bd991a9826cbfa63b10595d44e123b9c4Adrian Frost cmi_ntv_hwcoreid(CPU), cmi_ntv_hwstrandid(CPU))) == NULL ||
e3d60c9bd991a9826cbfa63b10595d44e123b9c4Adrian Frost cmn_err(CE_WARN, "CMCI interrupt on cpuid %d: %s",
e3d60c9bd991a9826cbfa63b10595d44e123b9c4Adrian Frost hdl ? "handle lookup ok but no CMCI handler found" :
e3d60c9bd991a9826cbfa63b10595d44e123b9c4Adrian Frost "handle lookup failed");
e4b86885570d77af552e9cf94f142f4d744fb8c8Cheng Sean Ye#endif /* __xpv */
20c794b39650d115e17a15983b6b82e46238cf45gavinmcmi_mc_register(cmi_hdl_t hdl, const cmi_mc_ops_t *mcops, void *mcdata)
4156fc34b973159b0334e05ae5ec19344487bdc0gavinmcmi_mc_patounum(uint64_t pa, uint8_t valid_hi, uint8_t valid_lo, uint32_t synd,
20c794b39650d115e17a15983b6b82e46238cf45gavinm rv = mcops->cmi_mc_patounum(cmi_hdl_getmcdata(hdl), pa, valid_hi,
7aec1d6e253b21f9e9b7ef68b4d81ab9859b51fecindicmi_mc_unumtopa(mc_unum_t *up, nvlist_t *nvl, uint64_t *pap)
20c794b39650d115e17a15983b6b82e46238cf45gavinm return (CMIERR_API); /* convert from just one form */
e4b86885570d77af552e9cf94f142f4d744fb8c8Cheng Sean Ye "asru-" FM_FMRI_HC_SPECIFIC_PHYSADDR, pap) == 0 ||
e4b86885570d77af552e9cf94f142f4d744fb8c8Cheng Sean Ye nvlist_lookup_uint64(hcsp, FM_FMRI_HC_SPECIFIC_PHYSADDR,
20c794b39650d115e17a15983b6b82e46238cf45gavinm rv = mcops->cmi_mc_unumtopa(cmi_hdl_getmcdata(hdl), up, nvl, pap);
20c794b39650d115e17a15983b6b82e46238cf45gavinmcmi_mc_logout(cmi_hdl_t hdl, boolean_t ismc, boolean_t sync)
20c794b39650d115e17a15983b6b82e46238cf45gavinm if (cmi_no_mca_init || (mcops = cmi_hdl_getmcops(hdl)) == NULL)
20c794b39650d115e17a15983b6b82e46238cf45gavinmcmi_hdl_msrinject(cmi_hdl_t hdl, cmi_mca_regs_t *regs, uint_t nregs,
e4b86885570d77af552e9cf94f142f4d744fb8c8Cheng Sean Ye rc = CMI_OPS(cmi)->cmi_msrinject(hdl, regs, nregs, force);
20c794b39650d115e17a15983b6b82e46238cf45gavinm return (cmi_panic_on_uncorrectable_error ? B_TRUE : B_FALSE);