17c478bd9Sstevel@tonic-gate /*
27c478bd9Sstevel@tonic-gate  * CDDL HEADER START
37c478bd9Sstevel@tonic-gate  *
47c478bd9Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
55f25dc2aSgavinm  * Common Development and Distribution License (the "License").
65f25dc2aSgavinm  * You may not use this file except in compliance with the License.
77c478bd9Sstevel@tonic-gate  *
87c478bd9Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
97c478bd9Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
107c478bd9Sstevel@tonic-gate  * See the License for the specific language governing permissions
117c478bd9Sstevel@tonic-gate  * and limitations under the License.
127c478bd9Sstevel@tonic-gate  *
137c478bd9Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
147c478bd9Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
157c478bd9Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
167c478bd9Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
177c478bd9Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
187c478bd9Sstevel@tonic-gate  *
197c478bd9Sstevel@tonic-gate  * CDDL HEADER END
207c478bd9Sstevel@tonic-gate  */
21d9638e54Smws 
227c478bd9Sstevel@tonic-gate /*
23*d4ac42a1STrang Do  * Copyright (c) 2004, 2010, Oracle and/or its affiliates. All rights reserved.
247c478bd9Sstevel@tonic-gate  */
257c478bd9Sstevel@tonic-gate 
267c478bd9Sstevel@tonic-gate #include <cma.h>
277c478bd9Sstevel@tonic-gate 
28e4b86885SCheng Sean Ye #include <unistd.h>
29e4b86885SCheng Sean Ye #include <fcntl.h>
307c478bd9Sstevel@tonic-gate #include <strings.h>
317c478bd9Sstevel@tonic-gate #include <errno.h>
327c478bd9Sstevel@tonic-gate #include <time.h>
337c478bd9Sstevel@tonic-gate #include <fm/fmd_api.h>
347c478bd9Sstevel@tonic-gate #include <sys/fm/protocol.h>
35843e1988Sjohnlev #include <sys/systeminfo.h>
36843e1988Sjohnlev #include <sys/utsname.h>
377c478bd9Sstevel@tonic-gate 
385f149bcaScy #ifdef sun4v
395f149bcaScy #include <sys/fm/ldom.h>
405f149bcaScy 
415f149bcaScy static fmd_hdl_t *init_hdl;
425f149bcaScy ldom_hdl_t *cma_lhp;
435f149bcaScy #endif
445f149bcaScy 
45e4b86885SCheng Sean Ye #ifdef i386
46e4b86885SCheng Sean Ye boolean_t cma_is_native;
47e4b86885SCheng Sean Ye #endif
48e4b86885SCheng Sean Ye 
495f149bcaScy extern const char *fmd_fmri_get_platform();
505f149bcaScy 
517c478bd9Sstevel@tonic-gate cma_t cma;
527c478bd9Sstevel@tonic-gate 
537c478bd9Sstevel@tonic-gate cma_stats_t cma_stats = {
547c478bd9Sstevel@tonic-gate 	{ "cpu_flts", FMD_TYPE_UINT64, "cpu faults resolved" },
555f149bcaScy 	{ "cpu_repairs", FMD_TYPE_UINT64, "cpu faults repaired" },
567c478bd9Sstevel@tonic-gate 	{ "cpu_fails", FMD_TYPE_UINT64, "cpu faults unresolveable" },
577c478bd9Sstevel@tonic-gate 	{ "cpu_blfails", FMD_TYPE_UINT64, "failed cpu blacklists" },
587c478bd9Sstevel@tonic-gate 	{ "cpu_supp", FMD_TYPE_UINT64, "cpu offlines suppressed" },
597c478bd9Sstevel@tonic-gate 	{ "cpu_blsupp", FMD_TYPE_UINT64, "cpu blacklists suppressed" },
607c478bd9Sstevel@tonic-gate 	{ "page_flts", FMD_TYPE_UINT64, "page faults resolved" },
615f149bcaScy 	{ "page_repairs", FMD_TYPE_UINT64, "page faults repaired" },
627c478bd9Sstevel@tonic-gate 	{ "page_fails", FMD_TYPE_UINT64, "page faults unresolveable" },
637c478bd9Sstevel@tonic-gate 	{ "page_supp", FMD_TYPE_UINT64, "page retires suppressed" },
647c478bd9Sstevel@tonic-gate 	{ "page_nonent", FMD_TYPE_UINT64, "retires for non-existent fmris" },
657c478bd9Sstevel@tonic-gate 	{ "bad_flts", FMD_TYPE_UINT64, "invalid fault events received" },
667c478bd9Sstevel@tonic-gate 	{ "nop_flts", FMD_TYPE_UINT64, "inapplicable fault events received" },
677c478bd9Sstevel@tonic-gate 	{ "auto_flts", FMD_TYPE_UINT64, "auto-close faults received" }
687c478bd9Sstevel@tonic-gate };
697c478bd9Sstevel@tonic-gate 
707c478bd9Sstevel@tonic-gate typedef struct cma_subscriber {
717c478bd9Sstevel@tonic-gate 	const char *subr_class;
727c478bd9Sstevel@tonic-gate 	const char *subr_sname;
737c478bd9Sstevel@tonic-gate 	uint_t subr_svers;
745f149bcaScy 	int (*subr_func)(fmd_hdl_t *, nvlist_t *, nvlist_t *, const char *,
755f149bcaScy 	    boolean_t);
767c478bd9Sstevel@tonic-gate } cma_subscriber_t;
777c478bd9Sstevel@tonic-gate 
787c478bd9Sstevel@tonic-gate static const cma_subscriber_t cma_subrs[] = {
79e4b86885SCheng Sean Ye #if defined(i386)
80e4b86885SCheng Sean Ye 	/*
81e4b86885SCheng Sean Ye 	 * On x86, the ASRUs are expected to be in hc scheme.  When
82e4b86885SCheng Sean Ye 	 * cpumem-retire wants to retire a cpu or mem page, it calls the
83e4b86885SCheng Sean Ye 	 * methods registered in the topo node to do that.  The topo
84e4b86885SCheng Sean Ye 	 * enumerator, which necessarily knows all the config info that
85e4b86885SCheng Sean Ye 	 * we'd ever need in deciding what/how to retire etc.  This takes
86e4b86885SCheng Sean Ye 	 * away much of that complexity from the agent into the entity
87e4b86885SCheng Sean Ye 	 * that knows all config/topo information.
88e4b86885SCheng Sean Ye 	 */
89e4b86885SCheng Sean Ye 	{ "fault.memory.page", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
90e4b86885SCheng Sean Ye 	    cma_page_retire },
91e4b86885SCheng Sean Ye 	{ "fault.memory.page_sb", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
92e4b86885SCheng Sean Ye 	    cma_page_retire },
93e4b86885SCheng Sean Ye 	{ "fault.memory.page_ck", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
94e4b86885SCheng Sean Ye 	    cma_page_retire },
95e4b86885SCheng Sean Ye 	{ "fault.memory.page_ue", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
96e4b86885SCheng Sean Ye 	    cma_page_retire },
97e4b86885SCheng Sean Ye 	{ "fault.memory.generic-x86.page_ce", FM_FMRI_SCHEME_HC,
98e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, cma_page_retire },
99e4b86885SCheng Sean Ye 	{ "fault.memory.generic-x86.page_ue", FM_FMRI_SCHEME_HC,
100e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, cma_page_retire },
101e4b86885SCheng Sean Ye 	{ "fault.memory.intel.page_ce", FM_FMRI_SCHEME_HC,
102e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, cma_page_retire },
103e4b86885SCheng Sean Ye 	{ "fault.memory.intel.page_ue", FM_FMRI_SCHEME_HC,
104e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, cma_page_retire },
105e4b86885SCheng Sean Ye 	{ "fault.memory.dimm", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
106e4b86885SCheng Sean Ye 	    NULL },
107e4b86885SCheng Sean Ye 	{ "fault.memory.dimm_sb", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
108e4b86885SCheng Sean Ye 	    NULL },
109e4b86885SCheng Sean Ye 	{ "fault.memory.dimm_ck", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
110e4b86885SCheng Sean Ye 	    NULL },
111e4b86885SCheng Sean Ye 	{ "fault.memory.dimm_ue", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
112e4b86885SCheng Sean Ye 	    NULL },
113e4b86885SCheng Sean Ye 	{ "fault.memory.generic-x86.dimm_ce", FM_FMRI_SCHEME_HC,
114e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
115e4b86885SCheng Sean Ye 	{ "fault.memory.generic-x86.dimm_ue", FM_FMRI_SCHEME_HC,
116e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
117e4b86885SCheng Sean Ye 	{ "fault.memory.intel.dimm_ce", FM_FMRI_SCHEME_HC,
118e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
119e4b86885SCheng Sean Ye 	{ "fault.memory.intel.dimm_ue", FM_FMRI_SCHEME_HC,
120e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
121e4b86885SCheng Sean Ye 	{ "fault.memory.intel.fbd.*", FM_FMRI_SCHEME_HC,
122e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
123e4b86885SCheng Sean Ye 	{ "fault.memory.dimm_testfail", FM_FMRI_SCHEME_HC,
124e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
125e4b86885SCheng Sean Ye 	{ "fault.memory.bank", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
126e4b86885SCheng Sean Ye 	    NULL },
127e4b86885SCheng Sean Ye 	{ "fault.memory.datapath", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
128e4b86885SCheng Sean Ye 	    NULL },
129491f61a1SYanmin Sun 	{ "fault.cpu.intel.quickpath.mem_scrubbing", FM_FMRI_SCHEME_HC,
130491f61a1SYanmin Sun 	    FM_HC_SCHEME_VERSION, cma_page_retire },
131e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.quickpath.*", FM_FMRI_SCHEME_HC,
132e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
133e4b86885SCheng Sean Ye 	{ "fault.cpu.generic-x86.mc", FM_FMRI_SCHEME_HC,
134e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
135e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.dma", FM_FMRI_SCHEME_HC,
136e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
137e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.dma", FM_FMRI_SCHEME_CPU,
138e4b86885SCheng Sean Ye 	    FM_CPU_SCHEME_VERSION, NULL },
139e4b86885SCheng Sean Ye 
140e4b86885SCheng Sean Ye 	/*
141e4b86885SCheng Sean Ye 	 * The ASRU for cpu faults are in cpu scheme on native and in hc
142e4b86885SCheng Sean Ye 	 * scheme on xpv.  So each cpu fault class needs to be listed twice.
143e4b86885SCheng Sean Ye 	 */
144e4b86885SCheng Sean Ye 
145e4b86885SCheng Sean Ye 	/*
146e4b86885SCheng Sean Ye 	 * The following faults do NOT retire a cpu thread,
147e4b86885SCheng Sean Ye 	 * and therefore must be intercepted before
1483f1e69beSCheng Sean Ye 	 * the default "fault.cpu.*" dispatch to cma_cpu_hc_retire.
149e4b86885SCheng Sean Ye 	 */
150e4b86885SCheng Sean Ye 	{ "fault.cpu.amd.dramchannel", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
151e4b86885SCheng Sean Ye 	    NULL },
152e4b86885SCheng Sean Ye 	{ "fault.cpu.amd.dramchannel", FM_FMRI_SCHEME_CPU,
153e4b86885SCheng Sean Ye 	    FM_CPU_SCHEME_VERSION, NULL },
154e4b86885SCheng Sean Ye 	{ "fault.cpu.generic-x86.bus_interconnect_memory", FM_FMRI_SCHEME_HC,
155e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
156e4b86885SCheng Sean Ye 	{ "fault.cpu.generic-x86.bus_interconnect_memory", FM_FMRI_SCHEME_CPU,
157e4b86885SCheng Sean Ye 	    FM_CPU_SCHEME_VERSION, NULL },
158e4b86885SCheng Sean Ye 	{ "fault.cpu.generic-x86.bus_interconnect_io", FM_FMRI_SCHEME_HC,
159e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
160e4b86885SCheng Sean Ye 	{ "fault.cpu.generic-x86.bus_interconnect_io", FM_FMRI_SCHEME_CPU,
161e4b86885SCheng Sean Ye 	    FM_CPU_SCHEME_VERSION, NULL },
162e4b86885SCheng Sean Ye 	{ "fault.cpu.generic-x86.bus_interconnect", FM_FMRI_SCHEME_HC,
163e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
164e4b86885SCheng Sean Ye 	{ "fault.cpu.generic-x86.bus_interconnect", FM_FMRI_SCHEME_CPU,
165e4b86885SCheng Sean Ye 	    FM_CPU_SCHEME_VERSION, NULL },
166e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.bus_interconnect_memory", FM_FMRI_SCHEME_HC,
167e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
168e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.bus_interconnect_memory", FM_FMRI_SCHEME_CPU,
169e4b86885SCheng Sean Ye 	    FM_CPU_SCHEME_VERSION, NULL },
170e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.bus_interconnect_io", FM_FMRI_SCHEME_HC,
171e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
172e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.bus_interconnect_io", FM_FMRI_SCHEME_CPU,
173e4b86885SCheng Sean Ye 	    FM_CPU_SCHEME_VERSION, NULL },
174e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.bus_interconnect", FM_FMRI_SCHEME_HC,
175e4b86885SCheng Sean Ye 	    FM_HC_SCHEME_VERSION, NULL },
176e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.bus_interconnect", FM_FMRI_SCHEME_CPU,
177e4b86885SCheng Sean Ye 	    FM_CPU_SCHEME_VERSION, NULL },
178e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.nb.*", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
179e4b86885SCheng Sean Ye 	    NULL },
180e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.nb.*", FM_FMRI_SCHEME_CPU, FM_CPU_SCHEME_VERSION,
181e4b86885SCheng Sean Ye 	    NULL },
182e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.dma", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
183e4b86885SCheng Sean Ye 	    NULL },
184e4b86885SCheng Sean Ye 	{ "fault.cpu.intel.dma", FM_FMRI_SCHEME_CPU, FM_CPU_SCHEME_VERSION,
185e4b86885SCheng Sean Ye 	    NULL },
186e4b86885SCheng Sean Ye 	{ "fault.cpu.*", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
187e4b86885SCheng Sean Ye 	    cma_cpu_hc_retire },
188e4b86885SCheng Sean Ye 	{ "fault.cpu.*", FM_FMRI_SCHEME_CPU, FM_CPU_SCHEME_VERSION,
189e4b86885SCheng Sean Ye 	    cma_cpu_hc_retire },
190e4b86885SCheng Sean Ye #elif defined(sun4v)
1911529f529SScott Davenport 	/*
1921529f529SScott Davenport 	 * The following are PI sun4v faults
1931529f529SScott Davenport 	 */
1941529f529SScott Davenport 	{ "fault.memory.memlink", FM_FMRI_SCHEME_HC,
1951529f529SScott Davenport 	    FM_HC_SCHEME_VERSION, NULL },
1961529f529SScott Davenport 	{ "fault.memory.memlink-uc", FM_FMRI_SCHEME_HC,
1971529f529SScott Davenport 	    FM_HC_SCHEME_VERSION, NULL },
1981529f529SScott Davenport 	{ "fault.memory.memlink-failover", FM_FMRI_SCHEME_HC,
1991529f529SScott Davenport 	    FM_HC_SCHEME_VERSION, NULL },
2001529f529SScott Davenport 	{ "fault.memory.dimm-ue-imminent", FM_FMRI_SCHEME_HC,
2011529f529SScott Davenport 	    FM_HC_SCHEME_VERSION, NULL },
2021529f529SScott Davenport 	{ "fault.memory.dram-ue-imminent", FM_FMRI_SCHEME_HC,
2031529f529SScott Davenport 	    FM_HC_SCHEME_VERSION, NULL },
2041529f529SScott Davenport 	{ "fault.memory.dimm-page-retires-excessive", FM_FMRI_SCHEME_HC,
2051529f529SScott Davenport 	    FM_HC_SCHEME_VERSION, NULL },
2065f149bcaScy 	{ "fault.memory.page", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2075f149bcaScy 	    cma_page_retire },
2085f149bcaScy 	{ "fault.memory.dimm", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2095f149bcaScy 	    NULL },
2105f149bcaScy 	{ "fault.memory.dimm_sb", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2115f149bcaScy 	    NULL },
2125f149bcaScy 	{ "fault.memory.dimm_ck", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2135f149bcaScy 	    NULL },
2145f149bcaScy 	{ "fault.memory.dimm_ue", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2155f149bcaScy 	    NULL },
216f6452528STom Pothier 	{ "fault.memory.dimm-page-retires-excessive", FM_FMRI_SCHEME_MEM,
217f6452528STom Pothier 	    FM_MEM_SCHEME_VERSION, NULL },
218f6452528STom Pothier 	{ "fault.memory.dimm-ue-imminent", FM_FMRI_SCHEME_MEM,
219f6452528STom Pothier 	    FM_MEM_SCHEME_VERSION, NULL },
220f6452528STom Pothier 	{ "fault.memory.dram-ue-imminent", FM_FMRI_SCHEME_MEM,
221f6452528STom Pothier 	    FM_MEM_SCHEME_VERSION, NULL },
2225f149bcaScy 	{ "fault.memory.bank", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2235f149bcaScy 	    NULL },
2245f149bcaScy 	{ "fault.memory.datapath", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2255f149bcaScy 	    NULL },
226*d4ac42a1STrang Do 	{ "fault.memory.datapath", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
227*d4ac42a1STrang Do 	    NULL },
2285f149bcaScy 	{ "fault.memory.link-c", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2295f149bcaScy 	    NULL },
2305f149bcaScy 	{ "fault.memory.link-u", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2315f149bcaScy 	    NULL },
2325f149bcaScy 	{ "fault.memory.link-f", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2335f149bcaScy 	    NULL },
234d3169229SJakub Jermar 	{ "fault.memory.link-c", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
235d3169229SJakub Jermar 	    NULL },
236d3169229SJakub Jermar 	{ "fault.memory.link-u", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
237d3169229SJakub Jermar 	    NULL },
238d3169229SJakub Jermar 	{ "fault.memory.link-f", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
239d3169229SJakub Jermar 	    NULL },
2405f149bcaScy 
2415f149bcaScy 	/*
2425f149bcaScy 	 * The following ultraSPARC-T1/T2 faults do NOT retire a cpu thread,
2435f149bcaScy 	 * and therefore must be intercepted before
2443f1e69beSCheng Sean Ye 	 * the default "fault.cpu.*" dispatch to cma_cpu_hc_retire.
2455f149bcaScy 	 */
2465f149bcaScy 	{ "fault.cpu.*.l2cachedata", FM_FMRI_SCHEME_CPU,
2475f149bcaScy 	    FM_CPU_SCHEME_VERSION, NULL },
2485f149bcaScy 	{ "fault.cpu.*.l2cachetag", FM_FMRI_SCHEME_CPU,
2495f149bcaScy 	    FM_CPU_SCHEME_VERSION, NULL },
2505f149bcaScy 	{ "fault.cpu.*.l2cachectl", FM_FMRI_SCHEME_CPU,
2515f149bcaScy 	    FM_CPU_SCHEME_VERSION, NULL },
2525f149bcaScy 	{ "fault.cpu.*.l2data-c", FM_FMRI_SCHEME_CPU,
2535f149bcaScy 	    FM_CPU_SCHEME_VERSION, NULL },
2545f149bcaScy 	{ "fault.cpu.*.l2data-u", FM_FMRI_SCHEME_CPU,
2555f149bcaScy 	    FM_CPU_SCHEME_VERSION, NULL },
2565f149bcaScy 	{ "fault.cpu.*.mau", FM_FMRI_SCHEME_CPU,
2575f149bcaScy 	    FM_CPU_SCHEME_VERSION, NULL },
2585f149bcaScy 	{ "fault.cpu.*.lfu-u", FM_FMRI_SCHEME_CPU,
2595f149bcaScy 	    FM_CPU_SCHEME_VERSION, NULL },
2605f149bcaScy 	{ "fault.cpu.*.lfu-f", FM_FMRI_SCHEME_CPU,
2615f149bcaScy 	    FM_CPU_SCHEME_VERSION, NULL },
2625f149bcaScy 	{ "fault.cpu.*.lfu-p", FM_FMRI_SCHEME_CPU,
2635f149bcaScy 	    FM_CPU_SCHEME_VERSION, NULL },
264d3169229SJakub Jermar 	{ "fault.cpu.ultraSPARC-T1.freg", FM_FMRI_SCHEME_CPU,
265d3169229SJakub Jermar 	    FM_CPU_SCHEME_VERSION, NULL },
266d3169229SJakub Jermar 	{ "fault.cpu.ultraSPARC-T1.l2cachedata", FM_FMRI_SCHEME_CPU,
267d3169229SJakub Jermar 	    FM_CPU_SCHEME_VERSION, NULL },
268d3169229SJakub Jermar 	{ "fault.cpu.ultraSPARC-T1.l2cachetag", FM_FMRI_SCHEME_CPU,
269d3169229SJakub Jermar 	    FM_CPU_SCHEME_VERSION, NULL },
270d3169229SJakub Jermar 	{ "fault.cpu.ultraSPARC-T1.l2cachectl", FM_FMRI_SCHEME_CPU,
271d3169229SJakub Jermar 	    FM_CPU_SCHEME_VERSION, NULL },
272d3169229SJakub Jermar 	{ "fault.cpu.ultraSPARC-T1.mau", FM_FMRI_SCHEME_CPU,
273d3169229SJakub Jermar 	    FM_CPU_SCHEME_VERSION, NULL },
274d3169229SJakub Jermar 	{ "fault.cpu.ultraSPARC-T2plus.chip", FM_FMRI_SCHEME_HC,
275d3169229SJakub Jermar 	    FM_HC_SCHEME_VERSION, NULL },
2763f1e69beSCheng Sean Ye 	{ "fault.cpu.*", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
2773f1e69beSCheng Sean Ye 	    cma_cpu_hc_retire },
2785f149bcaScy 	{ "fault.cpu.*", FM_FMRI_SCHEME_CPU, FM_CPU_SCHEME_VERSION,
2793f1e69beSCheng Sean Ye 	    cma_cpu_hc_retire },
2805f149bcaScy #elif defined(opl)
2815f149bcaScy 	{ "fault.memory.page", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2825f149bcaScy 	    cma_page_retire },
2835f149bcaScy 	{ "fault.memory.dimm", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2845f149bcaScy 	    NULL },
285f6452528STom Pothier 	{ "fault.memory.dimm-page-retires-excessive", FM_FMRI_SCHEME_MEM,
286f6452528STom Pothier 	    FM_MEM_SCHEME_VERSION, NULL },
287f6452528STom Pothier 	{ "fault.memory.dimm-ue-imminent", FM_FMRI_SCHEME_MEM,
288f6452528STom Pothier 	    FM_MEM_SCHEME_VERSION, NULL },
289f6452528STom Pothier 	{ "fault.memory.dram-ue-imminent", FM_FMRI_SCHEME_MEM,
290f6452528STom Pothier 	    FM_MEM_SCHEME_VERSION, NULL },
2915f149bcaScy 	{ "fault.memory.bank", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
2925f149bcaScy 	    NULL },
2935f149bcaScy 	{ "fault.cpu.SPARC64-VI.*", FM_FMRI_SCHEME_CPU, FM_CPU_SCHEME_VERSION,
2943f1e69beSCheng Sean Ye 	    cma_cpu_cpu_retire },
2955f149bcaScy 	{ "fault.cpu.SPARC64-VII.*", FM_FMRI_SCHEME_CPU, FM_CPU_SCHEME_VERSION,
2963f1e69beSCheng Sean Ye 	    cma_cpu_cpu_retire },
2975f149bcaScy 	{ "fault.chassis.SPARC-Enterprise.cpu.SPARC64-VI.core.se",
2985f149bcaScy 		FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION, cma_cpu_hc_retire },
2995f149bcaScy 	{ "fault.chassis.SPARC-Enterprise.cpu.SPARC64-VI.core.se-offlinereq",
3005f149bcaScy 		FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION, cma_cpu_hc_retire },
3015f149bcaScy 	{ "fault.chassis.SPARC-Enterprise.cpu.SPARC64-VI.core.ce",
3025f149bcaScy 		FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION, cma_cpu_hc_retire },
3035f149bcaScy 	{ "fault.chassis.SPARC-Enterprise.cpu.SPARC64-VI.core.ce-offlinereq",
3045f149bcaScy 		FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION, cma_cpu_hc_retire },
3055f149bcaScy 	{ "fault.chassis.SPARC-Enterprise.cpu.SPARC64-VII.core.se",
3065f149bcaScy 		FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION, cma_cpu_hc_retire },
3075f149bcaScy 	{ "fault.chassis.SPARC-Enterprise.cpu.SPARC64-VII.core.se-offlinereq",
3085f149bcaScy 		FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION, cma_cpu_hc_retire },
3095f149bcaScy 	{ "fault.chassis.SPARC-Enterprise.cpu.SPARC64-VII.core.ce",
3105f149bcaScy 		FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION, cma_cpu_hc_retire },
3115f149bcaScy 	{ "fault.chassis.SPARC-Enterprise.cpu.SPARC64-VII.core.ce-offlinereq",
3125f149bcaScy 		FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION, cma_cpu_hc_retire },
313e4b86885SCheng Sean Ye #else
314e4b86885SCheng Sean Ye 	/*
315e4b86885SCheng Sean Ye 	 * For platforms excluding i386, sun4v and opl.
316e4b86885SCheng Sean Ye 	 */
3177c478bd9Sstevel@tonic-gate 	{ "fault.memory.page", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
3187c478bd9Sstevel@tonic-gate 	    cma_page_retire },
3198a40a695Sgavinm 	{ "fault.memory.page_sb", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
3208a40a695Sgavinm 	    cma_page_retire },
3218a40a695Sgavinm 	{ "fault.memory.page_ck", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
3228a40a695Sgavinm 	    cma_page_retire },
3238a40a695Sgavinm 	{ "fault.memory.page_ue", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
3248a40a695Sgavinm 	    cma_page_retire },
3257c478bd9Sstevel@tonic-gate 	{ "fault.memory.dimm", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
3267c478bd9Sstevel@tonic-gate 	    NULL },
3275f25dc2aSgavinm 	{ "fault.memory.dimm_sb", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
3287aec1d6eScindi 	    NULL },
3295f25dc2aSgavinm 	{ "fault.memory.dimm_ck", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
3307aec1d6eScindi 	    NULL },
3315f25dc2aSgavinm 	{ "fault.memory.dimm_ue", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
3327aec1d6eScindi 	    NULL },
333f6452528STom Pothier 	{ "fault.memory.dimm-page-retires-excessive", FM_FMRI_SCHEME_MEM,
334f6452528STom Pothier 	    FM_MEM_SCHEME_VERSION, NULL },
335f6452528STom Pothier 	{ "fault.memory.dimm-ue-imminent", FM_FMRI_SCHEME_MEM,
336f6452528STom Pothier 	    FM_MEM_SCHEME_VERSION, NULL },
337f6452528STom Pothier 	{ "fault.memory.dram-ue-imminent", FM_FMRI_SCHEME_MEM,
338f6452528STom Pothier 	    FM_MEM_SCHEME_VERSION, NULL },
3398a40a695Sgavinm 	{ "fault.memory.dimm_testfail", FM_FMRI_SCHEME_MEM,
3408a40a695Sgavinm 	    FM_MEM_SCHEME_VERSION, NULL },
3417c478bd9Sstevel@tonic-gate 	{ "fault.memory.bank", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
3427c478bd9Sstevel@tonic-gate 	    NULL },
3437c478bd9Sstevel@tonic-gate 	{ "fault.memory.datapath", FM_FMRI_SCHEME_MEM, FM_MEM_SCHEME_VERSION,
3447c478bd9Sstevel@tonic-gate 	    NULL },
345*d4ac42a1STrang Do 	{ "fault.memory.datapath", FM_FMRI_SCHEME_HC, FM_HC_SCHEME_VERSION,
346*d4ac42a1STrang Do 	    NULL },
347*d4ac42a1STrang Do 	{ "fault.memory.datapath", FM_FMRI_SCHEME_CPU, FM_CPU_SCHEME_VERSION,
348*d4ac42a1STrang Do 	    NULL },
3496dfee483Stsien 
3506dfee483Stsien 	/*
3518a40a695Sgavinm 	 * The following faults do NOT retire a cpu thread,
3526dfee483Stsien 	 * and therefore must be intercepted before
3533f1e69beSCheng Sean Ye 	 * the default "fault.cpu.*" dispatch to cma_cpu_cpu_retire.
3546dfee483Stsien 	 */
3557bebe46cSjc 	{ "fault.cpu.ultraSPARC-IVplus.l2cachedata-line",
3567bebe46cSjc 	    FM_FMRI_SCHEME_CPU, FM_CPU_SCHEME_VERSION,
3577bebe46cSjc 	    cma_cache_way_retire },
3587bebe46cSjc 	{ "fault.cpu.ultraSPARC-IVplus.l3cachedata-line",
3597bebe46cSjc 	    FM_FMRI_SCHEME_CPU, FM_CPU_SCHEME_VERSION,
3607bebe46cSjc 	    cma_cache_way_retire },
3617bebe46cSjc 	{ "fault.cpu.ultraSPARC-IVplus.l2cachetag-line",
3627bebe46cSjc 	    FM_FMRI_SCHEME_CPU, FM_CPU_SCHEME_VERSION,
3637bebe46cSjc 	    cma_cache_way_retire },
3647bebe46cSjc 	{ "fault.cpu.ultraSPARC-IVplus.l3cachetag-line",
3657bebe46cSjc 	    FM_FMRI_SCHEME_CPU, FM_CPU_SCHEME_VERSION,
3667bebe46cSjc 	    cma_cache_way_retire },
367d3169229SJakub Jermar 
36820c794b3Sgavinm 	/*
369e4b86885SCheng Sean Ye 	 * Default "fault.cpu.*" for "cpu" scheme ASRU dispatch.
37020c794b3Sgavinm 	 */
3716dfee483Stsien 	{ "fault.cpu.*", FM_FMRI_SCHEME_CPU, FM_CPU_SCHEME_VERSION,
3723f1e69beSCheng Sean Ye 	    cma_cpu_cpu_retire },
3735f149bcaScy #endif
3747c478bd9Sstevel@tonic-gate 	{ NULL, NULL, 0, NULL }
3757c478bd9Sstevel@tonic-gate };
3767c478bd9Sstevel@tonic-gate 
3777c478bd9Sstevel@tonic-gate static const cma_subscriber_t *
nvl2subr(fmd_hdl_t * hdl,nvlist_t * nvl,nvlist_t ** asrup)3787c478bd9Sstevel@tonic-gate nvl2subr(fmd_hdl_t *hdl, nvlist_t *nvl, nvlist_t **asrup)
3797c478bd9Sstevel@tonic-gate {
3807c478bd9Sstevel@tonic-gate 	const cma_subscriber_t *sp;
3817c478bd9Sstevel@tonic-gate 	nvlist_t *asru;
3827c478bd9Sstevel@tonic-gate 	char *scheme;
3837c478bd9Sstevel@tonic-gate 	uint8_t version;
384b7d3956bSstephh 	boolean_t retire;
385b7d3956bSstephh 
386b7d3956bSstephh 	if (nvlist_lookup_boolean_value(nvl, FM_SUSPECT_RETIRE, &retire) == 0 &&
387b7d3956bSstephh 	    retire == 0) {
388b7d3956bSstephh 		fmd_hdl_debug(hdl, "cma_recv: retire suppressed");
389b7d3956bSstephh 		return (NULL);
390b7d3956bSstephh 	}
3917c478bd9Sstevel@tonic-gate 
3927c478bd9Sstevel@tonic-gate 	if (nvlist_lookup_nvlist(nvl, FM_FAULT_ASRU, &asru) != 0 ||
3937c478bd9Sstevel@tonic-gate 	    nvlist_lookup_string(asru, FM_FMRI_SCHEME, &scheme) != 0 ||
3947c478bd9Sstevel@tonic-gate 	    nvlist_lookup_uint8(asru, FM_VERSION, &version) != 0) {
3957c478bd9Sstevel@tonic-gate 		cma_stats.bad_flts.fmds_value.ui64++;
3967c478bd9Sstevel@tonic-gate 		return (NULL);
3977c478bd9Sstevel@tonic-gate 	}
3987c478bd9Sstevel@tonic-gate 
3997c478bd9Sstevel@tonic-gate 	for (sp = cma_subrs; sp->subr_class != NULL; sp++) {
4007c478bd9Sstevel@tonic-gate 		if (fmd_nvl_class_match(hdl, nvl, sp->subr_class) &&
4017c478bd9Sstevel@tonic-gate 		    strcmp(scheme, sp->subr_sname) == 0 &&
4027c478bd9Sstevel@tonic-gate 		    version <= sp->subr_svers) {
4037c478bd9Sstevel@tonic-gate 			*asrup = asru;
4047c478bd9Sstevel@tonic-gate 			return (sp);
4057c478bd9Sstevel@tonic-gate 		}
4067c478bd9Sstevel@tonic-gate 	}
4077c478bd9Sstevel@tonic-gate 
4087c478bd9Sstevel@tonic-gate 	cma_stats.nop_flts.fmds_value.ui64++;
4097c478bd9Sstevel@tonic-gate 	return (NULL);
4107c478bd9Sstevel@tonic-gate }
4117c478bd9Sstevel@tonic-gate 
4127c478bd9Sstevel@tonic-gate static void
cma_recv_list(fmd_hdl_t * hdl,nvlist_t * nvl,const char * class)41325c6ff4bSstephh cma_recv_list(fmd_hdl_t *hdl, nvlist_t *nvl, const char *class)
4147c478bd9Sstevel@tonic-gate {
4157c478bd9Sstevel@tonic-gate 	char *uuid = NULL;
4165750ef5cSStephen Hanson 	nvlist_t **nva, **save_nva;
4175750ef5cSStephen Hanson 	uint_t nvc = 0, save_nvc;
41825cf1a30Sjl 	uint_t keepopen;
4197c478bd9Sstevel@tonic-gate 	int err = 0;
42063bacb40SScott Davenport 	nvlist_t *asru = NULL;
421d69c2551Sjc 	uint32_t index;
4227c478bd9Sstevel@tonic-gate 
4237c478bd9Sstevel@tonic-gate 	err |= nvlist_lookup_string(nvl, FM_SUSPECT_UUID, &uuid);
4247c478bd9Sstevel@tonic-gate 	err |= nvlist_lookup_nvlist_array(nvl, FM_SUSPECT_FAULT_LIST,
4257c478bd9Sstevel@tonic-gate 	    &nva, &nvc);
4267c478bd9Sstevel@tonic-gate 	if (err != 0) {
4277c478bd9Sstevel@tonic-gate 		cma_stats.bad_flts.fmds_value.ui64++;
4287c478bd9Sstevel@tonic-gate 		return;
4297c478bd9Sstevel@tonic-gate 	}
4307c478bd9Sstevel@tonic-gate 
4315750ef5cSStephen Hanson 	save_nvc = keepopen = nvc;
4325750ef5cSStephen Hanson 	save_nva = nva;
43325c6ff4bSstephh 	while (nvc-- != 0 && (strcmp(class, FM_LIST_SUSPECT_CLASS) != 0 ||
43425c6ff4bSstephh 	    !fmd_case_uuclosed(hdl, uuid))) {
4357c478bd9Sstevel@tonic-gate 		nvlist_t *nvl = *nva++;
4367c478bd9Sstevel@tonic-gate 		const cma_subscriber_t *subr;
43725c6ff4bSstephh 		int has_fault;
4387c478bd9Sstevel@tonic-gate 
4397c478bd9Sstevel@tonic-gate 		if ((subr = nvl2subr(hdl, nvl, &asru)) == NULL)
4407c478bd9Sstevel@tonic-gate 			continue;
4417c478bd9Sstevel@tonic-gate 
44225cf1a30Sjl 		/*
44325cf1a30Sjl 		 * A handler returns CMA_RA_SUCCESS to indicate that
44425cf1a30Sjl 		 * from this suspects  point-of-view the case may be
44525cf1a30Sjl 		 * closed, CMA_RA_FAILURE otherwise.
44625cf1a30Sjl 		 * A handler must not close the case itself.
44725cf1a30Sjl 		 */
44825cf1a30Sjl 		if (subr->subr_func != NULL) {
44925c6ff4bSstephh 			has_fault = fmd_nvl_fmri_has_fault(hdl, asru,
45025c6ff4bSstephh 			    FMD_HAS_FAULT_ASRU, NULL);
45125c6ff4bSstephh 			if (strcmp(class, FM_LIST_SUSPECT_CLASS) == 0) {
45225c6ff4bSstephh 				if (has_fault == 1)
45325c6ff4bSstephh 					err = subr->subr_func(hdl, nvl, asru,
45425c6ff4bSstephh 					    uuid, 0);
45525c6ff4bSstephh 			} else {
45625c6ff4bSstephh 				if (has_fault == 0)
45725c6ff4bSstephh 					err = subr->subr_func(hdl, nvl, asru,
45825c6ff4bSstephh 					    uuid, 1);
45925c6ff4bSstephh 			}
46025cf1a30Sjl 			if (err == CMA_RA_SUCCESS)
46125cf1a30Sjl 				keepopen--;
46225cf1a30Sjl 		}
4637c478bd9Sstevel@tonic-gate 	}
464e4b86885SCheng Sean Ye 
4655750ef5cSStephen Hanson 	/*
4665750ef5cSStephen Hanson 	 * Run though again to catch any new faults in list.updated.
4675750ef5cSStephen Hanson 	 */
4685750ef5cSStephen Hanson 	while (save_nvc-- != 0 && (strcmp(class, FM_LIST_UPDATED_CLASS) == 0)) {
4695750ef5cSStephen Hanson 		nvlist_t *nvl = *save_nva++;
4705750ef5cSStephen Hanson 		const cma_subscriber_t *subr;
4715750ef5cSStephen Hanson 		int has_fault;
4725750ef5cSStephen Hanson 
4735750ef5cSStephen Hanson 		if ((subr = nvl2subr(hdl, nvl, &asru)) == NULL)
4745750ef5cSStephen Hanson 			continue;
4755750ef5cSStephen Hanson 		if (subr->subr_func != NULL) {
4765750ef5cSStephen Hanson 			has_fault = fmd_nvl_fmri_has_fault(hdl, asru,
4775750ef5cSStephen Hanson 			    FMD_HAS_FAULT_ASRU, NULL);
4785750ef5cSStephen Hanson 			if (has_fault == 1)
4795750ef5cSStephen Hanson 				err = subr->subr_func(hdl, nvl, asru, uuid, 0);
4805750ef5cSStephen Hanson 		}
4815750ef5cSStephen Hanson 	}
4825750ef5cSStephen Hanson 
483d69c2551Sjc 	/*
484d69c2551Sjc 	 * Do not close the case if we are handling cache faults.
485d69c2551Sjc 	 */
48663bacb40SScott Davenport 	if (asru != NULL) {
48763bacb40SScott Davenport 		if (nvlist_lookup_uint32(asru, FM_FMRI_CPU_CACHE_INDEX,
48863bacb40SScott Davenport 		    &index) != 0) {
48963bacb40SScott Davenport 			if (!keepopen && strcmp(class,
49063bacb40SScott Davenport 			    FM_LIST_SUSPECT_CLASS) == 0) {
49163bacb40SScott Davenport 				fmd_case_uuclose(hdl, uuid);
49263bacb40SScott Davenport 			}
493d69c2551Sjc 		}
494d69c2551Sjc 	}
495e4b86885SCheng Sean Ye 
49625c6ff4bSstephh 	if (!keepopen && strcmp(class, FM_LIST_REPAIRED_CLASS) == 0)
49725c6ff4bSstephh 		fmd_case_uuresolved(hdl, uuid);
4987c478bd9Sstevel@tonic-gate }
4997c478bd9Sstevel@tonic-gate 
5007c478bd9Sstevel@tonic-gate static void
cma_recv_one(fmd_hdl_t * hdl,nvlist_t * nvl)5017c478bd9Sstevel@tonic-gate cma_recv_one(fmd_hdl_t *hdl, nvlist_t *nvl)
5027c478bd9Sstevel@tonic-gate {
5037c478bd9Sstevel@tonic-gate 	const cma_subscriber_t *subr;
5047c478bd9Sstevel@tonic-gate 	nvlist_t *asru;
5057c478bd9Sstevel@tonic-gate 
5067c478bd9Sstevel@tonic-gate 	if ((subr = nvl2subr(hdl, nvl, &asru)) == NULL)
5077c478bd9Sstevel@tonic-gate 		return;
5087c478bd9Sstevel@tonic-gate 
50925c6ff4bSstephh 	if (subr->subr_func != NULL) {
51025c6ff4bSstephh 		if (fmd_nvl_fmri_has_fault(hdl, asru,
51125c6ff4bSstephh 		    FMD_HAS_FAULT_ASRU, NULL) == 1)
51225c6ff4bSstephh 			(void) subr->subr_func(hdl, nvl, asru, NULL, 0);
51325c6ff4bSstephh 	}
5147c478bd9Sstevel@tonic-gate }
5157c478bd9Sstevel@tonic-gate 
5167c478bd9Sstevel@tonic-gate /*ARGSUSED*/
5177c478bd9Sstevel@tonic-gate static void
cma_recv(fmd_hdl_t * hdl,fmd_event_t * ep,nvlist_t * nvl,const char * class)5187c478bd9Sstevel@tonic-gate cma_recv(fmd_hdl_t *hdl, fmd_event_t *ep, nvlist_t *nvl, const char *class)
5197c478bd9Sstevel@tonic-gate {
5207c478bd9Sstevel@tonic-gate 	fmd_hdl_debug(hdl, "received %s\n", class);
5217c478bd9Sstevel@tonic-gate 
522cbf75e67SStephen Hanson 	if (strcmp(class, FM_LIST_RESOLVED_CLASS) == 0)
523cbf75e67SStephen Hanson 		return;
524cbf75e67SStephen Hanson 
5255f149bcaScy 	if (strcmp(class, FM_LIST_SUSPECT_CLASS) == 0 ||
52625c6ff4bSstephh 	    strcmp(class, FM_LIST_REPAIRED_CLASS) == 0 ||
52725c6ff4bSstephh 	    strcmp(class, FM_LIST_UPDATED_CLASS) == 0)
52825c6ff4bSstephh 		cma_recv_list(hdl, nvl, class);
5297c478bd9Sstevel@tonic-gate 	else
5307c478bd9Sstevel@tonic-gate 		cma_recv_one(hdl, nvl);
5317c478bd9Sstevel@tonic-gate }
5327c478bd9Sstevel@tonic-gate 
5337c478bd9Sstevel@tonic-gate /*ARGSUSED*/
5347c478bd9Sstevel@tonic-gate static void
cma_timeout(fmd_hdl_t * hdl,id_t id,void * arg)5357c478bd9Sstevel@tonic-gate cma_timeout(fmd_hdl_t *hdl, id_t id, void *arg)
5367c478bd9Sstevel@tonic-gate {
5377c478bd9Sstevel@tonic-gate 	if (id == cma.cma_page_timerid)
5387c478bd9Sstevel@tonic-gate 		cma_page_retry(hdl);
5395f149bcaScy #ifdef sun4v
5405f149bcaScy 	/*
5415f149bcaScy 	 * cpu offline/online needs to be retried on sun4v because
5425f149bcaScy 	 * ldom request can be asynchronous.
5435f149bcaScy 	 */
5445f149bcaScy 	else if (id == cma.cma_cpu_timerid)
5455f149bcaScy 		cma_cpu_retry(hdl);
5465f149bcaScy #endif
5475f149bcaScy }
5485f149bcaScy 
#ifdef sun4v
/*
 * Allocation callback handed to ldom_init(): allocate `size' bytes
 * through fmd on behalf of the handle saved in init_hdl, using
 * FMD_SLEEP.
 */
static void *
cma_init_alloc(size_t size)
{
	void *mem = fmd_hdl_alloc(init_hdl, size, FMD_SLEEP);

	return (mem);
}

/*
 * Free callback handed to ldom_init(): return `size' bytes at `addr'
 * to fmd on behalf of the handle saved in init_hdl.
 */
static void
cma_init_free(void *addr, size_t size)
{
	fmd_hdl_free(init_hdl, addr, size);
}
#endif	/* sun4v */
5627c478bd9Sstevel@tonic-gate 
5637c478bd9Sstevel@tonic-gate static const fmd_hdl_ops_t fmd_ops = {
5647c478bd9Sstevel@tonic-gate 	cma_recv,	/* fmdo_recv */
5657c478bd9Sstevel@tonic-gate 	cma_timeout,	/* fmdo_timeout */
5667c478bd9Sstevel@tonic-gate 	NULL,		/* fmdo_close */
5677c478bd9Sstevel@tonic-gate 	NULL,		/* fmdo_stats */
5687c478bd9Sstevel@tonic-gate 	NULL,		/* fmdo_gc */
5697c478bd9Sstevel@tonic-gate };
5707c478bd9Sstevel@tonic-gate 
5717c478bd9Sstevel@tonic-gate static const fmd_prop_t fmd_props[] = {
5727c478bd9Sstevel@tonic-gate 	{ "cpu_tries", FMD_TYPE_UINT32, "10" },
5737c478bd9Sstevel@tonic-gate 	{ "cpu_delay", FMD_TYPE_TIME, "1sec" },
5745f149bcaScy #ifdef sun4v
5755f149bcaScy 	{ "cpu_ret_mindelay", FMD_TYPE_TIME, "5sec" },
5765f149bcaScy 	{ "cpu_ret_maxdelay", FMD_TYPE_TIME, "5min" },
5775f149bcaScy #endif /* sun4v */
5787c478bd9Sstevel@tonic-gate 	{ "cpu_offline_enable", FMD_TYPE_BOOL, "true" },
5795f149bcaScy 	{ "cpu_online_enable", FMD_TYPE_BOOL, "true" },
5807c478bd9Sstevel@tonic-gate 	{ "cpu_forced_offline", FMD_TYPE_BOOL, "true" },
5815f149bcaScy #ifdef opl
5825f149bcaScy 	{ "cpu_blacklist_enable", FMD_TYPE_BOOL, "false" },
5835f149bcaScy 	{ "cpu_unblacklist_enable", FMD_TYPE_BOOL, "false" },
5845f149bcaScy #else
5857c478bd9Sstevel@tonic-gate 	{ "cpu_blacklist_enable", FMD_TYPE_BOOL, "true" },
5865f149bcaScy 	{ "cpu_unblacklist_enable", FMD_TYPE_BOOL, "true" },
5875f149bcaScy #endif /* opl */
5887c478bd9Sstevel@tonic-gate 	{ "page_ret_mindelay", FMD_TYPE_TIME, "1sec" },
5897c478bd9Sstevel@tonic-gate 	{ "page_ret_maxdelay", FMD_TYPE_TIME, "5min" },
5907c478bd9Sstevel@tonic-gate 	{ "page_retire_enable", FMD_TYPE_BOOL, "true" },
5915f149bcaScy 	{ "page_unretire_enable", FMD_TYPE_BOOL, "true" },
5927c478bd9Sstevel@tonic-gate 	{ NULL, 0, NULL }
5937c478bd9Sstevel@tonic-gate };
5947c478bd9Sstevel@tonic-gate 
5957c478bd9Sstevel@tonic-gate static const fmd_hdl_info_t fmd_info = {
5967c478bd9Sstevel@tonic-gate 	"CPU/Memory Retire Agent", CMA_VERSION, &fmd_ops, fmd_props
5977c478bd9Sstevel@tonic-gate };
5987c478bd9Sstevel@tonic-gate 
5997c478bd9Sstevel@tonic-gate void
_fmd_init(fmd_hdl_t * hdl)6007c478bd9Sstevel@tonic-gate _fmd_init(fmd_hdl_t *hdl)
6017c478bd9Sstevel@tonic-gate {
6027c478bd9Sstevel@tonic-gate 	hrtime_t nsec;
6035f149bcaScy #ifdef i386
604e4b86885SCheng Sean Ye 	char buf[BUFSIZ];
605e4b86885SCheng Sean Ye 	const char *dom0 = "control_d";
606e4b86885SCheng Sean Ye 
607843e1988Sjohnlev 	/*
608e4b86885SCheng Sean Ye 	 * Abort the cpumem-retire module if Solaris is running under DomU.
609843e1988Sjohnlev 	 */
610e4b86885SCheng Sean Ye 	if (sysinfo(SI_PLATFORM, buf, sizeof (buf)) == -1)
611843e1988Sjohnlev 		return;
612e4b86885SCheng Sean Ye 
613e4b86885SCheng Sean Ye 	if (strncmp(buf, "i86pc", sizeof (buf)) == 0) {
614e4b86885SCheng Sean Ye 		cma_is_native = B_TRUE;
615e4b86885SCheng Sean Ye 	} else if (strncmp(buf, "i86xpv", sizeof (buf)) != 0) {
616e4b86885SCheng Sean Ye 		return;
617e4b86885SCheng Sean Ye 	} else {
618e4b86885SCheng Sean Ye 		int fd = open("/dev/xen/domcaps", O_RDONLY);
619e4b86885SCheng Sean Ye 
620e4b86885SCheng Sean Ye 		if (fd != -1) {
621e4b86885SCheng Sean Ye 			if (read(fd, buf, sizeof (buf)) <= 0 ||
622e4b86885SCheng Sean Ye 			    strncmp(buf, dom0, strlen(dom0)) != 0) {
623e4b86885SCheng Sean Ye 				(void) close(fd);
624e4b86885SCheng Sean Ye 				return;
625e4b86885SCheng Sean Ye 			}
626e4b86885SCheng Sean Ye 			(void) close(fd);
627e4b86885SCheng Sean Ye 		}
628e4b86885SCheng Sean Ye 		cma_is_native = B_FALSE;
629e4b86885SCheng Sean Ye 	}
630e4b86885SCheng Sean Ye #endif /* i386 */
6317c478bd9Sstevel@tonic-gate 
6327c478bd9Sstevel@tonic-gate 	if (fmd_hdl_register(hdl, FMD_API_VERSION, &fmd_info) != 0)
6337c478bd9Sstevel@tonic-gate 		return; /* invalid data in configuration file */
6347c478bd9Sstevel@tonic-gate 
6357c478bd9Sstevel@tonic-gate 	fmd_hdl_subscribe(hdl, "fault.cpu.*");
6367c478bd9Sstevel@tonic-gate 	fmd_hdl_subscribe(hdl, "fault.memory.*");
6375f149bcaScy #ifdef opl
6385f149bcaScy 	fmd_hdl_subscribe(hdl, "fault.chassis.SPARC-Enterprise.cpu.*");
6395f149bcaScy #endif
6407c478bd9Sstevel@tonic-gate 
6417c478bd9Sstevel@tonic-gate 	(void) fmd_stat_create(hdl, FMD_STAT_NOALLOC, sizeof (cma_stats) /
6427c478bd9Sstevel@tonic-gate 	    sizeof (fmd_stat_t), (fmd_stat_t *)&cma_stats);
6437c478bd9Sstevel@tonic-gate 
6447c478bd9Sstevel@tonic-gate 	cma.cma_cpu_tries = fmd_prop_get_int32(hdl, "cpu_tries");
6457c478bd9Sstevel@tonic-gate 
6467c478bd9Sstevel@tonic-gate 	nsec = fmd_prop_get_int64(hdl, "cpu_delay");
6477c478bd9Sstevel@tonic-gate 	cma.cma_cpu_delay.tv_sec = nsec / NANOSEC;
6487c478bd9Sstevel@tonic-gate 	cma.cma_cpu_delay.tv_nsec = nsec % NANOSEC;
6497c478bd9Sstevel@tonic-gate 
6507c478bd9Sstevel@tonic-gate 	cma.cma_page_mindelay = fmd_prop_get_int64(hdl, "page_ret_mindelay");
6517c478bd9Sstevel@tonic-gate 	cma.cma_page_maxdelay = fmd_prop_get_int64(hdl, "page_ret_maxdelay");
6527c478bd9Sstevel@tonic-gate 
6535f149bcaScy #ifdef sun4v
6545f149bcaScy 	cma.cma_cpu_mindelay = fmd_prop_get_int64(hdl, "cpu_ret_mindelay");
6555f149bcaScy 	cma.cma_cpu_maxdelay = fmd_prop_get_int64(hdl, "cpu_ret_maxdelay");
6565f149bcaScy #endif
6575f149bcaScy 
6587c478bd9Sstevel@tonic-gate 	cma.cma_cpu_dooffline = fmd_prop_get_int32(hdl, "cpu_offline_enable");
6597c478bd9Sstevel@tonic-gate 	cma.cma_cpu_forcedoffline = fmd_prop_get_int32(hdl,
6607c478bd9Sstevel@tonic-gate 	    "cpu_forced_offline");
6615f149bcaScy 	cma.cma_cpu_doonline = fmd_prop_get_int32(hdl, "cpu_online_enable");
6627c478bd9Sstevel@tonic-gate 	cma.cma_cpu_doblacklist = fmd_prop_get_int32(hdl,
6637c478bd9Sstevel@tonic-gate 	    "cpu_blacklist_enable");
6645f149bcaScy 	cma.cma_cpu_dounblacklist = fmd_prop_get_int32(hdl,
6655f149bcaScy 	    "cpu_unblacklist_enable");
6667c478bd9Sstevel@tonic-gate 	cma.cma_page_doretire = fmd_prop_get_int32(hdl, "page_retire_enable");
6675f149bcaScy 	cma.cma_page_dounretire = fmd_prop_get_int32(hdl,
6685f149bcaScy 	    "page_unretire_enable");
6697c478bd9Sstevel@tonic-gate 
6707c478bd9Sstevel@tonic-gate 	if (cma.cma_page_maxdelay < cma.cma_page_mindelay)
6717c478bd9Sstevel@tonic-gate 		fmd_hdl_abort(hdl, "page retirement delays conflict\n");
6725f149bcaScy 
6735f149bcaScy #ifdef sun4v
6745f149bcaScy 	init_hdl = hdl;
6755f149bcaScy 	cma_lhp = ldom_init(cma_init_alloc, cma_init_free);
6765f149bcaScy #endif
6777c478bd9Sstevel@tonic-gate }
6787c478bd9Sstevel@tonic-gate 
6797c478bd9Sstevel@tonic-gate void
_fmd_fini(fmd_hdl_t * hdl)6807c478bd9Sstevel@tonic-gate _fmd_fini(fmd_hdl_t *hdl)
6817c478bd9Sstevel@tonic-gate {
6825f149bcaScy #ifdef sun4v
6835f149bcaScy 	ldom_fini(cma_lhp);
6845f149bcaScy 	cma_cpu_fini(hdl);
6855f149bcaScy #endif
6867c478bd9Sstevel@tonic-gate 	cma_page_fini(hdl);
6877c478bd9Sstevel@tonic-gate }
688