1/*
2 * CDDL HEADER START
3 *
4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License, Version 1.0 only
6 * (the "License").  You may not use this file except in compliance
7 * with the License.
8 *
9 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
10 * or http://www.opensolaris.org/os/licensing.
11 * See the License for the specific language governing permissions
12 * and limitations under the License.
13 *
14 * When distributing Covered Code, include this CDDL HEADER in each
15 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
16 * If applicable, add the following below this CDDL HEADER, with the
17 * fields enclosed by brackets "[]" replaced with your own identifying
18 * information: Portions Copyright [yyyy] [name of copyright owner]
19 *
20 * CDDL HEADER END
21 */
22/*
23 * Copyright 2007 Sun Microsystems, Inc.  All rights reserved.
24 * Use is subject to license terms.
25 *
26 * Assembly code support for the jalapeno module
27 */
28
29#include "assym.h"
30
31#include <sys/asm_linkage.h>
32#include <sys/mmu.h>
33#include <vm/hat_sfmmu.h>
34#include <sys/machparam.h>
35#include <sys/machcpuvar.h>
36#include <sys/machthread.h>
37#include <sys/machtrap.h>
38#include <sys/privregs.h>
39#include <sys/asm_linkage.h>
40#include <sys/trap.h>
41#include <sys/cheetahregs.h>
42#include <sys/us3_module.h>
43#include <sys/xc_impl.h>
44#include <sys/intreg.h>
45#include <sys/async.h>
46#include <sys/clock.h>
47#include <sys/cheetahasm.h>
48
49#ifdef TRAPTRACE
50#include <sys/traptrace.h>
51#endif /* TRAPTRACE */
52
53/* BEGIN CSTYLED */
54
55#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
56
57#define	CHK_JP_ERRATA85_ENABLED(scr, label)				\
58	ASM_LD(scr, jp_errata_85_active);				\
59	cmp	scr, 1;							\
60	bne	%icc, label;						\
61	nop
62
63#define	SET_64BIT_PA(dest, scr, hi32, lo32)				\
64	set	hi32, scr;						\
65	sllx	scr, 32, scr;						\
66	sethi	%hi(lo32), dest;					\
67	or	dest, %lo(lo32), dest;					\
68	or	scr, dest, dest
69
70/*
71 * Macro to trigger Jalapeno/Tomatillo speed change
72 *   j_chng_pa - scratch register
73 *   scr - scratch register
74 */
75#define	JP_ESTAR_TRIGGER(j_chng_pa, scr)				\
76	SET_64BIT_PA(j_chng_pa, scr, TOM_HIGH_PA, M_T_J_CHNG_INIT_PA);	\
77	ldxa	[j_chng_pa]ASI_IO, scr;					\
785:									\
79	and	scr, TOM_TRIGGER_MASK, scr;				\
80	cmp	scr, TOM_TRIGGER;					\
81	be,pt %icc, 5b;			/* wait while 10 */		\
82	ldxa	[j_chng_pa]ASI_IO, scr;					\
83	andn	scr, TOM_TRIGGER_MASK, scr;				\
84	stxa	scr, [j_chng_pa]ASI_IO;	/* clear j_chng[1:0] */		\
85	or	scr, TOM_TRIGGER, scr;					\
86	stxa	scr, [j_chng_pa]ASI_IO;	/* trigger j_chng */		\
87	ldxa	[j_chng_pa]ASI_IO, scr;					\
886:									\
89	and	scr, TOM_TRIGGER_MASK, scr;				\
90	cmp	scr, TOM_TRIGGER;					\
91	be,pt %icc, 6b;			/* wait while 10 */		\
92	ldxa	[j_chng_pa]ASI_IO, scr;					\
93	andn	scr, TOM_TRIGGER_MASK, scr;				\
94	stxa	scr, [j_chng_pa]ASI_IO;	/* deassert j_chng */
95
96/*
97 * Macro to set Jalapeno CPU speed
98 *   speed - new speed constant
99 *   scr1  - scratch register
100 *   scr2  - scratch register
101 */
102#define	SET_JP_SPEED(speed, scr1, scr2)					\
103	ldxa	[%g0]ASI_JBUS_CONFIG, scr1;				\
104	set	JBUS_CONFIG_ECLK_MASK, scr2;				\
105	andn	scr1, scr2, scr1;					\
106	set	speed, scr2;						\
107	or	scr1, scr2, scr1;					\
108	stxa	scr1, [%g0]ASI_JBUS_CONFIG;
109
110/*
111 * macro to set Master Tomatillo speed
112 *   speed - tomatillo speed constant
113 *   tpa   - tomatillo estar control register PA
114 *   scr  - scratch register
115 */
116#define	SET_TOM_SPEED(speed, tpa, scr)					\
117	ldxa	[tpa]ASI_IO, scr;					\
118	andn	scr, TOM_ESTAR_ELCK_MASK, scr;				\
119	or	scr, speed, scr;					\
120	stxa	scr, [tpa]ASI_IO;
121
122/*
123 * macro to check and set Slave Tomatillo speed
124 *   speed - tomatillo speed constant
125 *   scr1   - scratch register
126 *   scr2   - scratch register
127 */
128
129#define	SET_SLAVE_T_SPEED(speed, scr1, scr2)				\
130	ldxa	[%g0]ASI_JBUS_CONFIG, scr2;				\
131	srlx	scr2, JBUS_SLAVE_T_PORT_BIT, scr2;			\
132	btst	1, scr2;						\
133	bz,pt	%icc, 4f;						\
134	nop;								\
135	SET_64BIT_PA(scr1, scr2, TOM_HIGH_PA, S_T_ESTAR_CTRL_PA);	\
136	SET_TOM_SPEED(speed, scr1, scr2);				\
1374:
138
139
140/*
141 * macro to adjust ASI_MCU_CTL_REG1[26:25] fsm bits according to
142 * new cpu speed: fsm[1:0]=11b for full speed, fsm[1:0]=0 for estar speed
143 *    value - fsm bit value constant
144 *    scr1  - scratch register
145 *    scr2  - scratch register
146 */
147#define	JP_ADJUST_FSM(value, scr1, scr2)				\
148	ldxa	[%g0]ASI_MCU_CTRL, scr1;				\
149	set	JP_MCU_FSM_MASK, scr2;					\
150	andn	scr1, scr2, scr1;					\
151	set	value, scr2;						\
152	or	scr1, scr2, scr1;					\
153	stxa	scr1, [%g0]ASI_MCU_CTRL;				\
154	membar	#Sync;
155
156/*
157 * JP_FORCE_FULL_SPEED and its fellow macros are for Jalapeno
158 * workstation to work around Errata 85. The front portion of
159 * it packs JP speed(14..13) and Tomatillo speed(5..0) into one
160 * register.
161 *
162 * Current code assumes that these two fields are non-overlapping.
163 * If that assumption changes, then this code won't work. If so, we
164 * force a compile time error by not defining the JP_FORCE_FULL_SPEED
165 * and JP_RESTORE_SPEED macros below.
166 */
167
168#if !(JBUS_CONFIG_ECLK_MASK & TOM_SPEED_MASK)
169
170/*
171 * Macro to force Jalapeno/Tomatillo to full speed
172 *   old_lvl - register used to save original cpu, tomatillo speed
173 *   scr2 - scratch register
174 *   scr3 - scratch register
175 *   scr4 - scratch register
176 */
177#define	JP_FORCE_FULL_SPEED(old_lvl, scr2, scr3, scr4)			\
178	ldxa	[%g0]ASI_JBUS_CONFIG, old_lvl;				\
179	set	JBUS_CONFIG_ECLK_MASK, scr4;				\
180	and	old_lvl, scr4, old_lvl;					\
181	SET_64BIT_PA(scr2, scr3, TOM_HIGH_PA, M_T_ESTAR_CTRL_PA);	\
182	ldxa	[scr2]ASI_IO, scr3;					\
183	set	TOM_ESTAR_ELCK_MASK, scr4;				\
184	and	scr3, scr4, scr3;					\
185	or	old_lvl, scr3, old_lvl;					\
186	/* original jp and tomatillo speed saved in old_lvl */		\
187									\
188	/* either intended or currently at full speed */		\
189	set	JBUS_CONFIG_ECLK_MASK, scr4;				\
190	andcc	old_lvl, scr4, %g0;					\
191	bz,pt	%icc, 8f;						\
192	nop;								\
193	/* go through 1/2 speed. */					\
194	SET_JP_SPEED(JBUS_CONFIG_ECLK_2, scr3, scr4);			\
195	SET_TOM_SPEED(TOM_HALF_SPEED, scr2, scr3);			\
196	SET_SLAVE_T_SPEED(TOM_HALF_SPEED, scr3, scr4);			\
197	JP_ADJUST_FSM(0, scr3, scr4);					\
198	set	jp_estar_tl0_data, scr3;				\
199	ldx	[scr3], %g0;						\
200	membar	#Sync;		/* or busy wait 1us */			\
201	JP_ESTAR_TRIGGER(scr3, scr4);					\
2028:									\
203	/* bring to 1:1 speed */					\
204	SET_JP_SPEED(JBUS_CONFIG_ECLK_1, scr3, scr4);			\
205	SET_TOM_SPEED(TOM_FULL_SPEED, scr2, scr3);			\
206	SET_SLAVE_T_SPEED(TOM_FULL_SPEED, scr3, scr4);			\
207	JP_ADJUST_FSM(JP_MCU_FSM_MASK, scr3, scr4);			\
208	JP_ESTAR_TRIGGER(scr3, scr4)
209
210
211/*
212 * Macro to restore Jalapeno/Tomatillo to original speed
213 *     old_lvl - register contains saved original cpu, tomatillo speed
214 *     scr2 - scratch register
215 *     scr3 - scratch register
216 *     scr4 - scratch register
217 *
218 * If trap had occured in the middle of ppm cpu speed transtion, then
219 * old_lvl[31:10] contains the intended new speed written into jbus_config.
220 * if old_lvl[9:0] is inconsistent with old_lvl[31:10], then the trap surely
221 * interrupted the ppm cpu speed transition, otherwise nothing for sure.
222 * We'll restore the intended/then-current speed, that should cause no
223 * trouble to subsequent ppm cpu speed change code.
224 */
225#define	JP_RESTORE_SPEED(old_lvl, scr2, scr3, scr4)			\
226	srlx	old_lvl, JBUS_CONFIG_ECLK_SHIFT, scr2;			\
227	and	scr2, 3, scr2;						\
228	add	scr2, 1, scr2;						\
229	cmp	scr2, 3;						\
230	bne,pt	%icc, 7f;						\
231	  nop;								\
232	set	TOM_SLOW_SPEED, scr2;					\
233	/* scr2 contains tom speed according to intended jp speed */	\
2347:									\
235	andn	old_lvl, TOM_ESTAR_ELCK_MASK, old_lvl;			\
236	or	scr2, old_lvl, old_lvl;					\
237	/* updated old_lvl to contain intended jp and tom speed */	\
238	andcc	old_lvl, TOM_FULL_SPEED, %g0;				\
239	bnz,pt	%icc, 9f;	/* intended full, already at full */	\
240	nop;								\
241									\
242	/* go to half speed */						\
243	SET_JP_SPEED(JBUS_CONFIG_ECLK_2, scr3, scr4);			\
244	SET_64BIT_PA(scr2, scr3, TOM_HIGH_PA, M_T_ESTAR_CTRL_PA);	\
245	SET_TOM_SPEED(TOM_HALF_SPEED, scr2, scr3);			\
246	SET_SLAVE_T_SPEED(TOM_HALF_SPEED, scr3, scr4);			\
247	JP_ADJUST_FSM(0, scr3, scr4);					\
248	set	jp_estar_tl0_data, scr3;				\
249	ldx	[scr3], %g0;						\
250	membar	#Sync;							\
251	JP_ESTAR_TRIGGER(scr3, scr4);					\
252	andcc	old_lvl, TOM_SLOW_SPEED, %g0;				\
253	bz,pt	%icc, 9f;	/* intended 1:2, already at 1:2 */	\
254	  nop;								\
255									\
256	/* go to 1:32 speed */						\
257	SET_JP_SPEED(JBUS_CONFIG_ECLK_32, scr3, scr4);			\
258	SET_TOM_SPEED(TOM_SLOW_SPEED, scr2, scr3);			\
259	SET_SLAVE_T_SPEED(TOM_SLOW_SPEED, scr3, scr4);			\
260	JP_ESTAR_TRIGGER(scr3, scr4);					\
2619:
262
263#endif /* !(JBUS_CONFIG_ECLK_MASK & TOM_SPEED_MASK) */
264#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
265
266/*
267 * Jalapeno version to reflush an Ecache line by index.
268 * Will flush all 4 ways (with only one scratch register).
269 * Note that the code will be faster if we use 2 scratch registers.
270 */
271#define	ECACHE_REFLUSH_LINE(ec_set_size, index, scr1)			\
272	JP_EC_DIAG_ACCESS_MEMBAR;					\
273	ldxa	[index]ASI_EC_DIAG, %g0;				\
274	JP_EC_DIAG_ACCESS_MEMBAR;					\
275	mov	1, scr1;						\
276	sllx	scr1, JP_ECFLUSH_EC_WAY_SHIFT, scr1;			\
277	add	scr1, index, scr1;					\
278	JP_EC_DIAG_ACCESS_MEMBAR;					\
279	ldxa	[scr1]ASI_EC_DIAG, %g0;					\
280	JP_EC_DIAG_ACCESS_MEMBAR;					\
281	mov	2, scr1;						\
282	sllx	scr1, JP_ECFLUSH_EC_WAY_SHIFT, scr1;			\
283	add	scr1, index, scr1;					\
284	JP_EC_DIAG_ACCESS_MEMBAR;					\
285	ldxa	[scr1]ASI_EC_DIAG, %g0;					\
286	JP_EC_DIAG_ACCESS_MEMBAR;					\
287	mov	3, scr1;						\
288	sllx	scr1, JP_ECFLUSH_EC_WAY_SHIFT, scr1;			\
289	add	scr1, index, scr1;					\
290	JP_EC_DIAG_ACCESS_MEMBAR;					\
291	ldxa	[scr1]ASI_EC_DIAG, %g0;					\
292	JP_EC_DIAG_ACCESS_MEMBAR
293
294/*
295 * Jalapeno version of ecache_flush_line.  Uses Jalapeno Ecache Displacement
296 * Flush feature to flush all 4 sets/ways.
297 */
298#define	ECACHE_FLUSH_LINE(physaddr, ec_set_size, scr1, scr2)		\
299	CPU_INDEX(scr1, scr2);						\
300	sllx	scr1, JP_ECFLUSH_PORTID_SHIFT, scr1;			\
301	set	JP_ECACHE_IDX_DISP_FLUSH, scr2;				\
302	or	scr2, scr1, scr2;					\
303	sub	ec_set_size, 1, scr1;					\
304	and	physaddr, scr1, scr1;					\
305	or	scr2, scr1, scr1;					\
306	ECACHE_REFLUSH_LINE(ec_set_size, scr1, scr2)
307
308/*
309 * Macro for getting ecache size from cpunodes structure
310 *  scr1:    Scratch, ecache size returned in this
311 *  scr2:    Scratch
312 */
313#define	GET_ECACHE_SIZE(scr1, scr2)					\
314	CPU_INDEX(scr1, scr2);						\
315	mulx	scr1, CPU_NODE_SIZE, scr1;				\
316	set	cpunodes + ECACHE_SIZE, scr2;				\
317	ld	[scr1 + scr2], scr1
318
319/* END CSTYLED */
320
321/*
322 * Ship mondo to aid using implicit busy/nack pair (bn ignored)
323 */
324	ENTRY_NP(shipit)
325	sll	%o0, IDCR_PID_SHIFT, %g1	! IDCR<18:14> = agent id
326	or	%g1, IDCR_OFFSET, %g1		! IDCR<13:0> = 0x70
327	stxa	%g0, [%g1]ASI_INTR_DISPATCH	! interrupt vector dispatch
328	membar	#Sync
329	retl
330	nop
331	SET_SIZE(shipit)
332
333
334/*
335 * flush_ecache:
336 *	%o0 - 64 bit physical address
337 *	%o1 - ecache size
338 *	%o2 - ecache linesize
339 */
340
341	ENTRY(flush_ecache)
342#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
343	CHK_JP_ERRATA85_ENABLED(%g1, flush_ecache_1);
344	JP_FORCE_FULL_SPEED(%o3, %g1, %g2, %g3);	/* %o3: saved speed */
345flush_ecache_1:
346#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
347
348	/*
349	 * Flush the entire Ecache using displacement flush.
350	 */
351	ECACHE_FLUSHALL(%o1, %o2, %o0, %o4)
352
353#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
354	CHK_JP_ERRATA85_ENABLED(%g1, flush_ecache_2);
355	JP_RESTORE_SPEED(%o3, %g1, %g2, %g3);		/* %o3: saved speed */
356flush_ecache_2:
357#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
358
359	retl
360	nop
361	SET_SIZE(flush_ecache)
362
363
364	.section ".text"
365	.align	64
366	ENTRY_NP(fast_ecc_err)
367
368	/*
369	 * Turn off CEEN and NCEEN.
370	 */
371	ldxa	[%g0]ASI_ESTATE_ERR, %g3
372	andn	%g3, EN_REG_NCEEN + EN_REG_CEEN, %g4
373	stxa	%g4, [%g0]ASI_ESTATE_ERR
374	membar	#Sync			! membar sync required
375
376	/*
377	 * Do the CPU log out capture.
378	 *   %g3 = "failed?" return value.
379	 *   %g2 = Input = AFAR. Output the clo_flags info which is passed
380	 *         into this macro via %g4. Output only valid if cpu_private
381	 *         struct has not been initialized.
382	 *   CHPR_FECCTL0_LOGOUT = cpu logout structure offset input
383	 *   %g4 = Trap information stored in the cpu logout flags field
384	 *   %g5 = scr1
385	 *   %g6 = scr2
386	 *   %g3 = scr3
387	 *   %g4 = scr4
388	 */
389	and	%g3, EN_REG_CEEN, %g4		! store the CEEN value, TL=0
390	set	CHPR_FECCTL0_LOGOUT, %g6
391	DO_CPU_LOGOUT(%g3, %g2, %g6, %g4, %g5, %g6, %g3, %g4)
392
393	/*
394	 * Flush the Ecache to get the error out of the Ecache.  If the UCC
395	 * or UCU is on a dirty line, then the following flush will turn
396	 * that into a WDC or WDU, respectively.
397	 */
398	CPU_INDEX(%g4, %g5)
399	mulx	%g4, CPU_NODE_SIZE, %g4
400	set	cpunodes, %g5
401	add	%g4, %g5, %g4
402	ld	[%g4 + ECACHE_LINESIZE], %g5
403	ld	[%g4 + ECACHE_SIZE], %g4
404#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
405	CHK_JP_ERRATA85_ENABLED(%g6, fast_ecc_err_1);
406        set     jp_estar_tl0_data, %g6
407        stx     %g2, [%g6 + 0]
408        stx     %g3, [%g6 + 8]
409	JP_FORCE_FULL_SPEED(%g2, %g3, %g6, %g7)		/* %g2: saved speed */
410fast_ecc_err_1:
411#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
412	ECACHE_FLUSHALL(%g4, %g5, %g6, %g7)
413#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
414	CHK_JP_ERRATA85_ENABLED(%g6, fast_ecc_err_2);
415	JP_RESTORE_SPEED(%g2, %g3, %g6, %g7)		/* %g2: saved speed */
416        set     jp_estar_tl0_data, %g6
417        ldx     [%g6 + 0], %g2
418        ldx     [%g6 + 8], %g3
419fast_ecc_err_2:
420#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
421
422	/*
423	 * Flush the Dcache.  Since bad data could have been installed in
424	 * the Dcache we must flush it before re-enabling it.
425	 */
426	ASM_LD(%g5, dcache_size)
427	ASM_LD(%g6, dcache_linesize)
428	CH_DCACHE_FLUSHALL(%g5, %g6, %g7)
429
430	/*
431	 * Flush the Icache.  Since we turned off the Icache to capture the
432	 * Icache line it is now stale or corrupted and we must flush it
433	 * before re-enabling it.
434	 */
435	GET_CPU_PRIVATE_PTR(%g0, %g5, %g7, fast_ecc_err_4);
436	ld	[%g5 + CHPR_ICACHE_LINESIZE], %g6
437	ba,pt	%icc, 5f
438	  ld	[%g5 + CHPR_ICACHE_SIZE], %g5
439fast_ecc_err_4:
440	ASM_LD(%g5, icache_size)
441	ASM_LD(%g6, icache_linesize)
4425:
443	CH_ICACHE_FLUSHALL(%g5, %g6, %g7, %g4)
444
445	/*
446	 * Restore the Dcache and Icache to the previous state.
447	 */
448	stxa	%g1, [%g0]ASI_DCU
449	flush	%g0	/* flush required after changing the IC bit */
450
451	/*
452	 * Make sure our CPU logout operation was successful.
453	 */
454	cmp	%g3, %g0
455	be	8f
456	  nop
457
458	/*
459	 * If the logout structure had been busy, how many times have
460	 * we tried to use it and failed (nesting count)? If we have
461	 * already recursed a substantial number of times, then we can
462	 * assume things are not going to get better by themselves and
463	 * so it would be best to panic.
464	 */
465	cmp	%g3, CLO_NESTING_MAX
466	blt	7f
467	  nop
468
469        call ptl1_panic
470          mov   PTL1_BAD_ECC, %g1
471
4727:
473	/*
474	 * Otherwise, if the logout structure was busy but we have not
475	 * nested more times than our maximum value, then we simply
476	 * issue a retry. Our TL=0 trap handler code will check and
477	 * clear the AFSR after it is done logging what is currently
478	 * in the logout struct and handle this event at that time.
479	 */
480	retry
4818:
482	/*
483	 * Call cpu_fast_ecc_error via systrap at PIL 14 unless we're
484	 * already at PIL 15.
485	 */
486	set	cpu_fast_ecc_error, %g1
487	rdpr	%pil, %g4
488	cmp	%g4, PIL_14
489	ba	sys_trap
490	  movl	%icc, PIL_14, %g4
491
492	SET_SIZE(fast_ecc_err)
493
494
495/*
496 * Fast ECC error at TL>0 handler
497 * We get here via trap 70 at TL>0->Software trap 0 at TL>0.  We enter
498 * this routine with %g1 and %g2 already saved in %tpc, %tnpc and %tstate.
499 * For a complete description of the Fast ECC at TL>0 handling see the
500 * comment block "Cheetah/Cheetah+ Fast ECC at TL>0 trap strategy" in
501 * us3_common_asm.s
502 */
503
504	.section ".text"
505	.align	64
506	ENTRY_NP(fast_ecc_tl1_err)
507
508	/*
509	 * This macro turns off the D$/I$ if they are on and saves their
510	 * original state in ch_err_tl1_tmp, saves all the %g registers in the
511	 * ch_err_tl1_data structure, updates the ch_err_tl1_flags and saves
512	 * the %tpc in ch_err_tl1_tpc.  At the end of this macro, %g1 will
513	 * point to the ch_err_tl1_data structure and the original D$/I$ state
514	 * will be saved in ch_err_tl1_tmp.  All %g registers except for %g1
515	 * will be available.
516	 */
517	CH_ERR_TL1_FECC_ENTER;
518
519	/*
520	 * Get the diagnostic logout data.  %g4 must be initialized to
521	 * current CEEN state, %g5 must point to logout structure in
522	 * ch_err_tl1_data_t.  %g3 will contain the nesting count upon
523	 * return.
524	 */
525	ldxa	[%g0]ASI_ESTATE_ERR, %g4
526	and	%g4, EN_REG_CEEN, %g4
527	add	%g1, CH_ERR_TL1_LOGOUT, %g5
528	DO_TL1_CPU_LOGOUT(%g3, %g2, %g4, %g5, %g6, %g3, %g4)
529
530	/*
531	 * If the logout nesting count is exceeded, we're probably
532	 * not making any progress, try to panic instead.
533	 */
534	cmp	%g3, CLO_NESTING_MAX
535	bge	fecc_tl1_err
536	  nop
537
538	/*
539	 * Save the current CEEN and NCEEN state in %g7 and turn them off
540	 * before flushing the Ecache.
541	 */
542	ldxa	[%g0]ASI_ESTATE_ERR, %g7
543	andn	%g7, EN_REG_CEEN | EN_REG_NCEEN, %g5
544	stxa	%g5, [%g0]ASI_ESTATE_ERR
545	membar	#Sync
546
547	/*
548	 * Flush the Ecache, using the largest possible cache size with the
549	 * smallest possible line size since we can't get the actual sizes
550	 * from the cpu_node due to DTLB misses.
551	 */
552	set	JP_ECACHE_MAX_SIZE, %g4
553#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
554	CHK_JP_ERRATA85_ENABLED(%g6, fast_ecc_tl1_err_1);
555        set     jp_estar_tl1_data, %g6
556        stx     %g2, [%g6 + 0]
557        stx     %g3, [%g6 + 8]
558	JP_FORCE_FULL_SPEED(%g2, %g3, %g5, %g6)
559fast_ecc_tl1_err_1:
560#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
561	ECACHE_FLUSHALL(%g4, JP_ECACHE_MAX_LSIZE, %g5, %g6)
562#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
563	CHK_JP_ERRATA85_ENABLED(%g6, fast_ecc_tl1_err_2);
564	JP_RESTORE_SPEED(%g2, %g3, %g5, %g6)
565        set     jp_estar_tl1_data, %g6
566        ldx     [%g6 + 0], %g2
567        ldx     [%g6 + 8], %g3
568fast_ecc_tl1_err_2:
569#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
570
571	/*
572	 * Restore CEEN and NCEEN to the previous state.
573	 */
574	stxa	%g7, [%g0]ASI_ESTATE_ERR
575	membar	#Sync
576
577	/*
578	 * If we turned off the D$, then flush it and turn it back on.
579	 */
580	ldxa	[%g1 + CH_ERR_TL1_TMP]%asi, %g3
581	andcc	%g3, CH_ERR_TSTATE_DC_ON, %g0
582	bz	%xcc, 3f
583	  nop
584
585	/*
586	 * Flush the D$.
587	 */
588	ASM_LD(%g4, dcache_size)
589	ASM_LD(%g5, dcache_linesize)
590	CH_DCACHE_FLUSHALL(%g4, %g5, %g6)
591
592	/*
593	 * Turn the D$ back on.
594	 */
595	ldxa	[%g0]ASI_DCU, %g3
596	or	%g3, DCU_DC, %g3
597	stxa	%g3, [%g0]ASI_DCU
598	membar	#Sync
5993:
600	/*
601	 * If we turned off the I$, then flush it and turn it back on.
602	 */
603	ldxa	[%g1 + CH_ERR_TL1_TMP]%asi, %g3
604	andcc	%g3, CH_ERR_TSTATE_IC_ON, %g0
605	bz	%xcc, 4f
606	  nop
607
608	/*
609	 * Flush the I$.
610	 */
611	ASM_LD(%g4, icache_size)
612	ASM_LD(%g5, icache_linesize)
613	CH_ICACHE_FLUSHALL(%g4, %g5, %g6, %g3)
614
615	/*
616	 * Turn the I$ back on.  Changing DCU_IC requires flush.
617	 */
618	ldxa	[%g0]ASI_DCU, %g3
619	or	%g3, DCU_IC, %g3
620	stxa	%g3, [%g0]ASI_DCU
621	flush	%g0
6224:
623
624#ifdef TRAPTRACE
625	/*
626	 * Get current trap trace entry physical pointer.
627	 */
628	CPU_INDEX(%g6, %g5)
629	sll	%g6, TRAPTR_SIZE_SHIFT, %g6
630	set	trap_trace_ctl, %g5
631	add	%g6, %g5, %g6
632	ld	[%g6 + TRAPTR_LIMIT], %g5
633	tst	%g5
634	be	%icc, skip_traptrace
635	  nop
636	ldx	[%g6 + TRAPTR_PBASE], %g5
637	ld	[%g6 + TRAPTR_OFFSET], %g4
638	add	%g5, %g4, %g5
639
640	/*
641	 * Create trap trace entry.
642	 */
643	rd	%asi, %g7
644	wr	%g0, TRAPTR_ASI, %asi
645	rd	STICK, %g4
646	stxa	%g4, [%g5 + TRAP_ENT_TICK]%asi
647	rdpr	%tl, %g4
648	stha	%g4, [%g5 + TRAP_ENT_TL]%asi
649	rdpr	%tt, %g4
650	stha	%g4, [%g5 + TRAP_ENT_TT]%asi
651	rdpr	%tpc, %g4
652	stna	%g4, [%g5 + TRAP_ENT_TPC]%asi
653	rdpr	%tstate, %g4
654	stxa	%g4, [%g5 + TRAP_ENT_TSTATE]%asi
655	stna	%sp, [%g5 + TRAP_ENT_SP]%asi
656	stna	%g0, [%g5 + TRAP_ENT_TR]%asi
657	wr	%g0, %g7, %asi
658	ldxa	[%g1 + CH_ERR_TL1_SDW_AFAR]%asi, %g3
659	ldxa	[%g1 + CH_ERR_TL1_SDW_AFSR]%asi, %g4
660	wr	%g0, TRAPTR_ASI, %asi
661	stna	%g3, [%g5 + TRAP_ENT_F1]%asi
662	stna	%g4, [%g5 + TRAP_ENT_F2]%asi
663	wr	%g0, %g7, %asi
664	ldxa	[%g1 + CH_ERR_TL1_AFAR]%asi, %g3
665	ldxa	[%g1 + CH_ERR_TL1_AFSR]%asi, %g4
666	wr	%g0, TRAPTR_ASI, %asi
667	stna	%g3, [%g5 + TRAP_ENT_F3]%asi
668	stna	%g4, [%g5 + TRAP_ENT_F4]%asi
669	wr	%g0, %g7, %asi
670
671	/*
672	 * Advance trap trace pointer.
673	 */
674	ld	[%g6 + TRAPTR_OFFSET], %g5
675	ld	[%g6 + TRAPTR_LIMIT], %g4
676	st	%g5, [%g6 + TRAPTR_LAST_OFFSET]
677	add	%g5, TRAP_ENT_SIZE, %g5
678	sub	%g4, TRAP_ENT_SIZE, %g4
679	cmp	%g5, %g4
680	movge	%icc, 0, %g5
681	st	%g5, [%g6 + TRAPTR_OFFSET]
682skip_traptrace:
683#endif	/* TRAPTRACE */
684
685	/*
686	 * If nesting count is not zero, skip all the AFSR/AFAR
687	 * handling and just do the necessary cache-flushing.
688	 */
689	ldxa	[%g1 + CH_ERR_TL1_NEST_CNT]%asi, %g2
690	brnz	%g2, 6f
691	  nop
692
693	/*
694	 * If a UCU followed by a WDU has occurred go ahead and panic
695	 * since a UE will occur (on the retry) before the UCU and WDU
696	 * messages are enqueued.
697	 */
698	ldxa	[%g1 + CH_ERR_TL1_AFSR]%asi, %g3
699	set	1, %g4
700	sllx	%g4, C_AFSR_UCU_SHIFT, %g4
701	btst	%g4, %g3		! UCU in original AFSR?
702	bz	%xcc, 6f
703	  nop
704	ldxa	[%g0]ASI_AFSR, %g4	! current AFSR
705	or	%g3, %g4, %g3		! %g3 = original + current AFSR
706	set	1, %g4
707	sllx	%g4, C_AFSR_WDU_SHIFT, %g4
708	btst	%g4, %g3		! WDU in original or current AFSR?
709	bnz	%xcc, fecc_tl1_err
710	  nop
711
7126:
713	/*
714	 * We fall into this macro if we've successfully logged the error in
715	 * the ch_err_tl1_data structure and want the PIL15 softint to pick
716	 * it up and log it.  %g1 must point to the ch_err_tl1_data structure.
717	 * Restores the %g registers and issues retry.
718	 */
719	CH_ERR_TL1_EXIT;
720	/*
721	 * Establish panic exit label.
722	 */
723	CH_ERR_TL1_PANIC_EXIT(fecc_tl1_err);
724
725	SET_SIZE(fast_ecc_tl1_err)
726
727
728	ENTRY(get_jbus_config)
729	ldxa	[%g0]ASI_JBUS_CONFIG, %o0
730	retl
731	nop
732	SET_SIZE(get_jbus_config)
733
734	ENTRY(set_jbus_config)
735	stxa	%o0, [%g0]ASI_JBUS_CONFIG
736	membar	#Sync
737	retl
738	nop
739	SET_SIZE(set_jbus_config)
740
741
742	ENTRY(get_mcu_ctl_reg1)
743	ldxa	[%g0]ASI_MCU_CTRL, %o0	! MCU control reg1 is at offset 0
744	retl
745	nop
746	SET_SIZE(get_mcu_ctl_reg1)
747
748
749	ENTRY(set_mcu_ctl_reg1)
750	stxa	%o0, [%g0]ASI_MCU_CTRL	! MCU control reg1 is at offset 0
751	membar	#Sync
752	retl
753	nop
754	SET_SIZE(set_mcu_ctl_reg1)
755
756
757/*
758 * scrubphys - Pass in the aligned physical memory address
759 * that you want to scrub, along with the ecache set size.
760 *
761 *	1) Displacement flush the E$ line corresponding to %addr.
762 *	   The first ldxa guarantees that the %addr is no longer in
763 *	   M, O, or E (goes to I or S (if instruction fetch also happens).
764 *	2) "Write" the data using a CAS %addr,%g0,%g0.
765 *	   The casxa guarantees a transition from I to M or S to M.
766 *	3) Displacement flush the E$ line corresponding to %addr.
767 *	   The second ldxa pushes the M line out of the ecache, into the
768 *	   writeback buffers, on the way to memory.
769 *	4) The "membar #Sync" pushes the cache line out of the writeback
770 *	   buffers onto the bus, on the way to dram finally.
771 *
772 * This is a modified version of the algorithm suggested by Gary Lauterbach.
773 * In theory the CAS %addr,%g0,%g0 is supposed to mark the addr's cache line
774 * as modified, but then we found out that for spitfire, if it misses in the
775 * E$ it will probably install as an M, but if it hits in the E$, then it
776 * will stay E, if the store doesn't happen. So the first displacement flush
777 * should ensure that the CAS will miss in the E$.  Arrgh.
778 */
779	ENTRY(scrubphys)
780	rdpr	%pstate, %o4
781	andn	%o4, PSTATE_IE | PSTATE_AM, %o5
782	wrpr	%o5, %g0, %pstate	! clear IE, AM bits
783
784#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
785	CHK_JP_ERRATA85_ENABLED(%g1, scrubphys_1);
786	JP_FORCE_FULL_SPEED(%o5, %g1, %g2, %g3)		/* %o5: saved speed */
787scrubphys_1:
788#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
789
790	ECACHE_FLUSH_LINE(%o0, %o1, %o2, %o3)
791	casxa	[%o0]ASI_MEM, %g0, %g0
792	ECACHE_REFLUSH_LINE(%o1, %o2, %o3)
793
794#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
795	CHK_JP_ERRATA85_ENABLED(%g1, scrubphys_2);
796	JP_RESTORE_SPEED(%o5, %g1, %g2, %g3)		/* %o5: saved speed */
797scrubphys_2:
798#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
799
800	wrpr	%g0, %o4, %pstate	! restore earlier pstate register value
801
802	retl
803	membar	#Sync			! move the data out of the load buffer
804	SET_SIZE(scrubphys)
805
806/*
807 * clearphys - Pass in the physical memory address of the checkblock
808 * that you want to push out, cleared with a recognizable pattern,
809 * from the ecache.
810 *
811 * To ensure that the ecc gets recalculated after the bad data is cleared,
812 * we must write out enough data to fill the w$ line (64 bytes). So we read
813 * in an entire ecache subblock's worth of data, and write it back out.
814 * Then we overwrite the 16 bytes of bad data with the pattern.
815 */
816	ENTRY(clearphys)
817	/* turn off IE, AM bits */
818	rdpr	%pstate, %o4
819	andn	%o4, PSTATE_IE | PSTATE_AM, %o5
820	wrpr	%o5, %g0, %pstate
821
822	/* turn off NCEEN */
823	ldxa	[%g0]ASI_ESTATE_ERR, %o5
824	andn	%o5, EN_REG_NCEEN, %o3
825	stxa	%o3, [%g0]ASI_ESTATE_ERR
826	membar	#Sync
827
828	/* align address passed with 64 bytes subblock size */
829	mov	CH_ECACHE_SUBBLK_SIZE, %o2
830	andn	%o0, (CH_ECACHE_SUBBLK_SIZE - 1), %g1
831
832	/* move the good data into the W$ */
8331:
834	subcc	%o2, 8, %o2
835	ldxa	[%g1 + %o2]ASI_MEM, %g2
836	bge	1b
837	  stxa	%g2, [%g1 + %o2]ASI_MEM
838
839	/* now overwrite the bad data */
840	setx	0xbadecc00badecc01, %g1, %g2
841	stxa	%g2, [%o0]ASI_MEM
842	mov	8, %g1
843	stxa	%g2, [%o0 + %g1]ASI_MEM
844
845#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
846	CHK_JP_ERRATA85_ENABLED(%g1, clearphys_1);
847	JP_FORCE_FULL_SPEED(%o5, %g1, %g2, %g3)		/* %o5: saved speed */
848clearphys_1:
849#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
850
851	ECACHE_FLUSH_LINE(%o0, %o1, %o2, %o3)
852	casxa	[%o0]ASI_MEM, %g0, %g0
853	ECACHE_REFLUSH_LINE(%o1, %o2, %o3)
854
855#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
856	CHK_JP_ERRATA85_ENABLED(%g1, clearphys_2);
857	JP_RESTORE_SPEED(%o5, %g1, %g2, %g3)		/* %o5: saved speed */
858clearphys_2:
859#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
860
861	/* clear the AFSR */
862	ldxa	[%g0]ASI_AFSR, %o1
863	stxa	%o1, [%g0]ASI_AFSR
864	membar	#Sync
865
866	/* turn NCEEN back on */
867	stxa	%o5, [%g0]ASI_ESTATE_ERR
868	membar	#Sync
869
870	/* return and re-enable IE and AM */
871	retl
872	  wrpr	%g0, %o4, %pstate
873	SET_SIZE(clearphys)
874
875
876/*
877 * Jalapeno Ecache displacement flush the specified line from the E$
878 *
879 * Register usage:
880 *	%o0 - 64 bit physical address for flushing
881 *	%o1 - Ecache set size
882 */
883	ENTRY(ecache_flush_line)
884
885#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
886	CHK_JP_ERRATA85_ENABLED(%g1, ecache_flush_line_1);
887	JP_FORCE_FULL_SPEED(%o5, %g1, %g2, %g3)		/* %o5: saved speed */
888ecache_flush_line_1:
889#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
890
891	ECACHE_FLUSH_LINE(%o0, %o1, %o2, %o3)
892
893#if defined(JALAPENO) && defined(JALAPENO_ERRATA_85)
894	CHK_JP_ERRATA85_ENABLED(%g1, ecache_flush_line_2);
895	JP_RESTORE_SPEED(%o5, %g1, %g2, %g3)		/* %o5: saved speed */
896ecache_flush_line_2:
897#endif	/* JALAPENO && JALAPENO_ERRATA_85 */
898
899	retl
900	  nop
901	SET_SIZE(ecache_flush_line)
902
903
904/*
905 * Perform necessary cpu workaround to ensure jbus ordering.
906 * Called only from Fire systems.
907 * CPU's internal "invalidate FIFOs" are flushed.
908 */
909
910#define	VIS_BLOCKSIZE	64
911
912	.seg    ".data"
913	.align  VIS_BLOCKSIZE
914	.type   sync_buf, #object
915sync_buf:
916	.skip   VIS_BLOCKSIZE
917	.size   sync_buf, VIS_BLOCKSIZE
918
919	ENTRY(jbus_stst_order)
920	set	sync_buf, %o1
921
922	rd	%fprs, %o2			! %o2 = saved fprs
923	or	%o2, FPRS_FEF, %o3
924	wr	%g0, %o3, %fprs			! make sure fp is enabled
925	stda    %d0, [%o1]ASI_BLK_COMMIT_P
926	wr	%o2, 0, %fprs			! restore fprs
927
928	retl
929	membar  #Sync
930	SET_SIZE(jbus_stst_order)
931
932/*
933 * This routine will not be called in Jalapeno systems.
934 */
935	ENTRY(flush_ipb)
936	retl
937	nop
938	SET_SIZE(flush_ipb)
939
940